| From 0422ee31d8accf9a0944f628bd7af1a8a8617dfb Mon Sep 17 00:00:00 2001 |
| From: Zhang Rui <rui.zhang@intel.com> |
| Date: Tue, 16 Aug 2022 13:16:31 +0800 |
| Subject: [PATCH] FROMLIST: x86/topology: Fix max_siblings calculation |
| |
| The max siblings value returned by CPUID.1F SMT level EBX differs among |
| CPUs on Intel Hybrid platforms like ADL-S/P. |
| It returns 2 for Pcore CPUs which have HT sibling and 1 for Ecore CPUs |
| which do not. |
| |
| Today, CPUID SMT level EBX sets the global variable smp_num_siblings. |
| Thus, smp_num_siblings is overridden to different values based on the CPU |
| Pcore/Ecore enumeration order. |
| |
| For example, |
| |
| [ 0.201005] detect_extended_topology: CPU APICID 0x0, smp_num_siblings 2, x86_max_cores 10 |
| [ 0.201117] start_kernel->check_bugs->cpu_smt_check_topology: smp_num_siblings 2 |
| ... |
| [ 0.010146] detect_extended_topology: CPU APICID 0x8, smp_num_siblings 2, x86_max_cores 10 |
| ... |
| [ 0.010146] detect_extended_topology: CPU APICID 0x39, smp_num_siblings 2, x86_max_cores 10 |
| [ 0.010146] detect_extended_topology: CPU APICID 0x48, smp_num_siblings 1, x86_max_cores 20 |
| ... |
| [ 0.010146] detect_extended_topology: CPU APICID 0x4e, smp_num_siblings 1, x86_max_cores 20 |
| [ 2.583800] sched_set_itmt_core_prio: smp_num_siblings 1 |
| |
| This inconsistency brings several potential issues: |
| 1. some kernel configuration like cpu_smt_control, as set in |
| start_kernel()->check_bugs()->cpu_smt_check_topology(), depends on |
| smp_num_siblings set by cpu0. |
| It is pure luck that all the current hybrid platforms use Pcore as cpu0 |
| and hide this problem. |
| 2. some per CPU data like cpuinfo_x86.x86_max_cores that depends on |
| smp_num_siblings becomes inconsistent and bogus. |
| 3. the final smp_num_siblings value after boot depends on the last CPU |
| enumerated, which could either be Pcore or Ecore CPU. |
| |
| The solution is to use CPUID EAX bits_shift to get the maximum number of |
| addressable logical processors, and use this to determin max siblings. |
| Because: |
| 1. the CPUID EAX bits_shift values are consistent among CPUs as far as |
| observed. |
| 2. some code already uses smp_num_siblings value to isolate the SMT ID |
| bits in APIC-ID, like apic_id_is_primary_thread(). |
| |
| Suggested-and-reviewed-by: Len Brown <len.brown@intel.com> |
| Signed-off-by: Zhang Rui <rui.zhang@intel.com> |
| (am from https://patchwork.kernel.org/patch/12944429/) |
| (also found at https://lore.kernel.org/r/20220816051633.17775-7-rui.zhang@intel.com) |
| |
| BUG=b:239519025 |
| TEST=None |
| |
| Signed-off-by: Srihari Uttanur <srihari.uttanur@intel.corp-partner.google.com> |
| Change-Id: I4bf9b7e1d7278ae1c182cafabf288f4c1713f47e |
| Reviewed-on: https://chromium-review.googlesource.com/c/chromiumos/third_party/kernel/+/3832287 |
| Reviewed-by: Sean Paul <sean@poorly.run> |
| Reviewed-by: Victor Ding <victording@chromium.org> |
| Reviewed-by: Sam McNally <sammc@chromium.org> |
| Commit-Queue: Victor Ding <victording@chromium.org> |
| Tested-by: Altaf Basha <altaf.basha@intel.com> |
| Commit-Queue: Sam McNally <sammc@chromium.org> |
| --- |
| arch/x86/kernel/cpu/topology.c | 19 ++++++++++++------- |
| 1 file changed, 12 insertions(+), 7 deletions(-) |
| |
| diff --git a/arch/x86/kernel/cpu/topology.c b/arch/x86/kernel/cpu/topology.c |
| index dc136703566f3fb97cc77fde581a373a8688c909..ad5d5aee8a6886c6690beb30c37643de7b74e537 100644 |
| --- a/arch/x86/kernel/cpu/topology.c |
| +++ b/arch/x86/kernel/cpu/topology.c |
| @@ -23,7 +23,12 @@ |
| |
| #define LEAFB_SUBTYPE(ecx) (((ecx) >> 8) & 0xff) |
| #define BITS_SHIFT_NEXT_LEVEL(eax) ((eax) & 0x1f) |
| -#define LEVEL_MAX_SIBLINGS(ebx) ((ebx) & 0xffff) |
| + |
| +/* |
| + * Use EAX bit_shift to calculate the maximum number of addressable logical |
| + * processors sharing the current level. |
| + */ |
| +#define LEVEL_MAX_SIBLINGS(eax) (1 << BITS_SHIFT_NEXT_LEVEL(eax)) |
| |
| unsigned int __max_die_per_package __read_mostly = 1; |
| EXPORT_SYMBOL(__max_die_per_package); |
| @@ -79,7 +84,7 @@ int detect_extended_topology_early(struct cpuinfo_x86 *c) |
| * initial apic id, which also represents 32-bit extended x2apic id. |
| */ |
| c->topo.initial_apicid = edx; |
| - smp_num_siblings = max_t(int, smp_num_siblings, LEVEL_MAX_SIBLINGS(ebx)); |
| + smp_num_siblings = max_t(int, smp_num_siblings, LEVEL_MAX_SIBLINGS(eax)); |
| #endif |
| return 0; |
| } |
| @@ -109,10 +114,10 @@ int detect_extended_topology(struct cpuinfo_x86 *c) |
| */ |
| cpuid_count(leaf, SMT_LEVEL, &eax, &ebx, &ecx, &edx); |
| c->topo.initial_apicid = edx; |
| - core_level_siblings = LEVEL_MAX_SIBLINGS(ebx); |
| - smp_num_siblings = max_t(int, smp_num_siblings, LEVEL_MAX_SIBLINGS(ebx)); |
| + core_level_siblings = LEVEL_MAX_SIBLINGS(eax); |
| + smp_num_siblings = max_t(int, smp_num_siblings, LEVEL_MAX_SIBLINGS(eax)); |
| core_plus_mask_width = ht_mask_width = BITS_SHIFT_NEXT_LEVEL(eax); |
| - die_level_siblings = LEVEL_MAX_SIBLINGS(ebx); |
| + die_level_siblings = LEVEL_MAX_SIBLINGS(eax); |
| pkg_mask_width = die_plus_mask_width = BITS_SHIFT_NEXT_LEVEL(eax); |
| |
| sub_index = 1; |
| @@ -123,14 +128,14 @@ int detect_extended_topology(struct cpuinfo_x86 *c) |
| * Check for the Core type in the implemented sub leaves. |
| */ |
| if (LEAFB_SUBTYPE(ecx) == CORE_TYPE) { |
| - core_level_siblings = LEVEL_MAX_SIBLINGS(ebx); |
| + core_level_siblings = LEVEL_MAX_SIBLINGS(eax); |
| core_plus_mask_width = BITS_SHIFT_NEXT_LEVEL(eax); |
| die_level_siblings = core_level_siblings; |
| die_plus_mask_width = BITS_SHIFT_NEXT_LEVEL(eax); |
| } |
| if (LEAFB_SUBTYPE(ecx) == DIE_TYPE) { |
| die_level_present = true; |
| - die_level_siblings = LEVEL_MAX_SIBLINGS(ebx); |
| + die_level_siblings = LEVEL_MAX_SIBLINGS(eax); |
| die_plus_mask_width = BITS_SHIFT_NEXT_LEVEL(eax); |
| } |
| |
| -- |
| 2.43.0.rc2.451.g8631bc7472-goog |
| |