Re: [patch v2 38/38] x86/apic/uv: Remove the private leaf 0xb parser

From: Steve Wahl
Date: Tue Aug 08 2023 - 16:45:04 EST


Looked closely at this one, was wondering about using TOPO_ROOT_DOMAIN
when the original looked at the leaf of TYPE_CORE. But I think you
probably have it right, and I checked both a newer and an older
system, and the UV info line that prints "apic_pns" gets the same
value as before.

Reviewed-by: Steve Wahl <steve.wahl@xxxxxxx>

On Fri, Jul 28, 2023 at 02:13:30PM +0200, Thomas Gleixner wrote:
> The package shift has been already evaluated by the early CPU init.
>
> Put the mindless copy right next to the original leaf 0xb parser.
>
> Signed-off-by: Thomas Gleixner <tglx@xxxxxxxxxxxxx>
> Cc: Steve Wahl <steve.wahl@xxxxxxx>
> Cc: Mike Travis <mike.travis@xxxxxxx>
> Cc: Dimitri Sivanich <dimitri.sivanich@xxxxxxx>
> Cc: Russ Anderson <russ.anderson@xxxxxxx>
> ---
> arch/x86/include/asm/topology.h | 5 +++
> arch/x86/kernel/apic/x2apic_uv_x.c | 52 ++++++-------------------------------
> 2 files changed, 14 insertions(+), 43 deletions(-)
>
> --- a/arch/x86/include/asm/topology.h
> +++ b/arch/x86/include/asm/topology.h
> @@ -126,6 +126,11 @@ static inline unsigned int topology_get_
> return x86_topo_system.dom_size[dom];
> }
>
> +static inline unsigned int topology_get_domain_shift(enum x86_topology_domains dom)
> +{
> + return dom == TOPO_SMT_DOMAIN ? 0 : x86_topo_system.dom_shifts[dom - 1];
> +}
> +
> extern const struct cpumask *cpu_coregroup_mask(int cpu);
> extern const struct cpumask *cpu_clustergroup_mask(int cpu);
>
> --- a/arch/x86/kernel/apic/x2apic_uv_x.c
> +++ b/arch/x86/kernel/apic/x2apic_uv_x.c
> @@ -241,54 +241,20 @@ static void __init uv_tsc_check_sync(voi
> is_uv(UV3) ? sname.s3.field : \
> undef)
>
> -/* [Copied from arch/x86/kernel/cpu/topology.c:detect_extended_topology()] */
> -
> -#define SMT_LEVEL 0 /* Leaf 0xb SMT level */
> -#define INVALID_TYPE 0 /* Leaf 0xb sub-leaf types */
> -#define SMT_TYPE 1
> -#define CORE_TYPE 2
> -#define LEAFB_SUBTYPE(ecx) (((ecx) >> 8) & 0xff)
> -#define BITS_SHIFT_NEXT_LEVEL(eax) ((eax) & 0x1f)
> -
> -static void set_x2apic_bits(void)
> -{
> - unsigned int eax, ebx, ecx, edx, sub_index;
> - unsigned int sid_shift;
> -
> - cpuid(0, &eax, &ebx, &ecx, &edx);
> - if (eax < 0xb) {
> - pr_info("UV: CPU does not have CPUID.11\n");
> - return;
> - }
> -
> - cpuid_count(0xb, SMT_LEVEL, &eax, &ebx, &ecx, &edx);
> - if (ebx == 0 || (LEAFB_SUBTYPE(ecx) != SMT_TYPE)) {
> - pr_info("UV: CPUID.11 not implemented\n");
> - return;
> - }
> -
> - sid_shift = BITS_SHIFT_NEXT_LEVEL(eax);
> - sub_index = 1;
> - do {
> - cpuid_count(0xb, sub_index, &eax, &ebx, &ecx, &edx);
> - if (LEAFB_SUBTYPE(ecx) == CORE_TYPE) {
> - sid_shift = BITS_SHIFT_NEXT_LEVEL(eax);
> - break;
> - }
> - sub_index++;
> - } while (LEAFB_SUBTYPE(ecx) != INVALID_TYPE);
> -
> - uv_cpuid.apicid_shift = 0;
> - uv_cpuid.apicid_mask = (~(-1 << sid_shift));
> - uv_cpuid.socketid_shift = sid_shift;
> -}
> -
> static void __init early_get_apic_socketid_shift(void)
> {
> + unsigned int sid_shift = topology_get_domain_shift(TOPO_ROOT_DOMAIN);
> +
> if (is_uv2_hub() || is_uv3_hub())
> uvh_apicid.v = uv_early_read_mmr(UVH_APICID);
>
> - set_x2apic_bits();
> + if (sid_shift) {
> + uv_cpuid.apicid_shift = 0;
> + uv_cpuid.apicid_mask = (~(-1 << sid_shift));
> + uv_cpuid.socketid_shift = sid_shift;
> + } else {
> + pr_info("UV: CPU does not have valid CPUID.11\n");
> + }
>
> pr_info("UV: apicid_shift:%d apicid_mask:0x%x\n", uv_cpuid.apicid_shift, uv_cpuid.apicid_mask);
> pr_info("UV: socketid_shift:%d pnode_mask:0x%x\n", uv_cpuid.socketid_shift, uv_cpuid.pnode_mask);
>

--
Steve Wahl, Hewlett Packard Enterprise