From: Keir Fraser Date: Fri, 16 Jul 2010 12:54:44 +0000 (+0100) Subject: x86: use cpuid vector 0xb when available for detecting cpu topology X-Git-Tag: archive/raspbian/4.8.0-1+rpi1~1^2~11771 X-Git-Url: https://dgit.raspbian.org/?a=commitdiff_plain;h=6518d6c62b21a5c765a923a3e56312d942ddbbe3;p=xen.git x86: use cpuid vector 0xb when available for detecting cpu topology cpuid leaf 0xb provides extended topology enumeration. This interface provides the 32-bit x2APIC id of the logical processor and it also provides a new mechanism to detect SMT and core siblings (which provides increased addressability). Signed-off-by: Weidong Han --- diff --git a/xen/arch/x86/cpu/common.c b/xen/arch/x86/cpu/common.c index 3899a54260..ebe96a2f0d 100644 --- a/xen/arch/x86/cpu/common.c +++ b/xen/arch/x86/cpu/common.c @@ -469,7 +469,6 @@ void __cpuinit identify_cpu(struct cpuinfo_x86 *c) mtrr_bp_init(); } -#ifdef CONFIG_X86_HT /* cpuid returns the value latched in the HW at reset, not the APIC ID * register's value. For any box whose BIOS changes APIC IDs, like * clustered APIC systems, we must use hard_smp_processor_id. @@ -481,6 +480,81 @@ static inline u32 phys_pkg_id(u32 cpuid_apic, int index_msb) return hard_smp_processor_id() >> index_msb; } +/* leaf 0xb SMT level */ +#define SMT_LEVEL 0 + +/* leaf 0xb sub-leaf types */ +#define INVALID_TYPE 0 +#define SMT_TYPE 1 +#define CORE_TYPE 2 + +#define LEAFB_SUBTYPE(ecx) (((ecx) >> 8) & 0xff) +#define BITS_SHIFT_NEXT_LEVEL(eax) ((eax) & 0x1f) +#define LEVEL_MAX_SIBLINGS(ebx) ((ebx) & 0xffff) + +/* + * Check for extended topology enumeration cpuid leaf 0xb and if it + * exists, use it for cpu topology detection. + */ +void __cpuinit detect_extended_topology(struct cpuinfo_x86 *c) +{ + unsigned int eax, ebx, ecx, edx, sub_index; + unsigned int ht_mask_width, core_plus_mask_width; + unsigned int core_select_mask, core_level_siblings, smp_num_siblings; + unsigned int initial_apicid; + int cpu = smp_processor_id(); + + if ( c->cpuid_level < 0xb ) + return; + + cpuid_count(0xb, SMT_LEVEL, &eax, &ebx, &ecx, &edx); + + /* Check if the cpuid leaf 0xb is actually implemented */ + if ( ebx == 0 || (LEAFB_SUBTYPE(ecx) != SMT_TYPE) ) + return; + + set_bit(X86_FEATURE_XTOPOLOGY, c->x86_capability); + + initial_apicid = edx; + + /* Populate HT related information from sub-leaf level 0 */ + core_level_siblings = smp_num_siblings = LEVEL_MAX_SIBLINGS(ebx); + core_plus_mask_width = ht_mask_width = BITS_SHIFT_NEXT_LEVEL(eax); + + sub_index = 1; + do { + cpuid_count(0xb, sub_index, &eax, &ebx, &ecx, &edx); + + /* Check for the Core type in the implemented sub leaves */ + if ( LEAFB_SUBTYPE(ecx) == CORE_TYPE ) { + core_level_siblings = LEVEL_MAX_SIBLINGS(ebx); + core_plus_mask_width = BITS_SHIFT_NEXT_LEVEL(eax); + break; + } + + sub_index++; + } while ( LEAFB_SUBTYPE(ecx) != INVALID_TYPE ); + + core_select_mask = (~(-1 << core_plus_mask_width)) >> ht_mask_width; + + cpu_core_id[cpu] = phys_pkg_id(initial_apicid, ht_mask_width) + & core_select_mask; + phys_proc_id[cpu] = phys_pkg_id(initial_apicid, core_plus_mask_width); + + c->apicid = phys_pkg_id(initial_apicid, 0); + c->x86_max_cores = (core_level_siblings / smp_num_siblings); + + if ( opt_cpu_info ) + { + printk("CPU: Physical Processor ID: %d\n", + phys_proc_id[cpu]); + if ( c->x86_max_cores > 1 ) + printk("CPU: Processor Core ID: %d\n", + cpu_core_id[cpu]); + } +} + +#ifdef CONFIG_X86_HT void __cpuinit detect_ht(struct cpuinfo_x86 *c) { u32 eax, ebx, ecx, edx; @@ -491,7 +565,8 @@ void __cpuinit detect_ht(struct cpuinfo_x86 *c) c->apicid = phys_pkg_id((ebx >> 24) & 0xFF, 0); - if (!cpu_has(c, X86_FEATURE_HT) || cpu_has(c, X86_FEATURE_CMP_LEGACY)) + if (!cpu_has(c, X86_FEATURE_HT) || cpu_has(c, X86_FEATURE_CMP_LEGACY) + || cpu_has(c, X86_FEATURE_XTOPOLOGY)) return; c->x86_num_siblings = (ebx & 0xff0000) >> 16; diff --git a/xen/arch/x86/cpu/intel.c b/xen/arch/x86/cpu/intel.c index cccfa4bf14..67a40beb42 100644 --- a/xen/arch/x86/cpu/intel.c +++ b/xen/arch/x86/cpu/intel.c @@ -154,6 +154,9 @@ static void __devinit init_intel(struct cpuinfo_x86 *c) } #endif + /* Detect the extended topology information if available */ + detect_extended_topology(c); + select_idle_routine(c); l2 = init_intel_cacheinfo(c); if (c->cpuid_level > 9) { @@ -197,10 +200,12 @@ static void __devinit init_intel(struct cpuinfo_x86 *c) if ( p ) safe_strcpy(c->x86_model_id, p); - - c->x86_max_cores = num_cpu_cores(c); - detect_ht(c); + if ( !cpu_has(c, X86_FEATURE_XTOPOLOGY) ) + { + c->x86_max_cores = num_cpu_cores(c); + detect_ht(c); + } set_cpuidmask(c); diff --git a/xen/include/asm-x86/cpufeature.h b/xen/include/asm-x86/cpufeature.h index 72fe0db491..cd14b3b268 100644 --- a/xen/include/asm-x86/cpufeature.h +++ b/xen/include/asm-x86/cpufeature.h @@ -78,6 +78,7 @@ #define X86_FEATURE_ARAT (3*32+ 10) /* Always running APIC timer */ #define X86_FEATURE_ARCH_PERFMON (3*32+11) /* Intel Architectural PerfMon */ #define X86_FEATURE_TSC_RELIABLE (3*32+12) /* TSC is known to be reliable */ +#define X86_FEATURE_XTOPOLOGY (3*32+13) /* cpu topology enum extensions */ /* Intel-defined CPU features, CPUID level 0x00000001 (ecx), word 4 */ #define X86_FEATURE_XMM3 (4*32+ 0) /* Streaming SIMD Extensions-3 */ diff --git a/xen/include/asm-x86/processor.h b/xen/include/asm-x86/processor.h index 03791206aa..c9ae5cea03 100644 --- a/xen/include/asm-x86/processor.h +++ b/xen/include/asm-x86/processor.h @@ -202,6 +202,8 @@ extern void print_cpu_info(unsigned int cpu); extern unsigned int init_intel_cacheinfo(struct cpuinfo_x86 *c); extern void dodgy_tsc(void); +extern void detect_extended_topology(struct cpuinfo_x86 *c); + #ifdef CONFIG_X86_HT extern void detect_ht(struct cpuinfo_x86 *c); #else