x86/cpu: Move cpu_l[l2]c_id into topology info

author Thomas Gleixner <tglx@linutronix.de>
Mon, 14 Aug 2023 08:18:38 +0000 (10:18 +0200)
committer Thomas Gleixner <tglx@linutronix.de>
Tue, 10 Oct 2023 12:38:18 +0000 (14:38 +0200)

diff --git a/Documentation/arch/x86/topology.rst b/Documentation/arch/x86/topology.rst

index 88f29bab3ba1cc4631a67c706a6396622df88e28..08ebf9edbfc1ed4982e550c283a03bc00e6af345 100644 (file)
--- a/Documentation/arch/x86/topology.rst
+++ b/Documentation/arch/x86/topology.rst
@@ -79,9 +79,7 @@ Package-related topology information in the kernel:
      The maximum possible number of packages in the system. Helpful for per
      package facilities to preallocate per package information.
  
-  - cpu_llc_id:
-
-    A per-CPU variable containing:
+  - cpuinfo_x86.topo.llc_id:
  
        - On Intel, the first APIC ID of the list of CPUs sharing the Last Level
          Cache
diff --git a/arch/x86/events/amd/uncore.c b/arch/x86/events/amd/uncore.c

index 83f15fe411b3f4834b20ea588146dfe913a850d0..3213a39534cdc1c8acf3c1d84f4c8647b3133d49 100644 (file)
--- a/arch/x86/events/amd/uncore.c
+++ b/arch/x86/events/amd/uncore.c
@@ -537,7 +537,7 @@ static int amd_uncore_cpu_starting(unsigned int cpu)
  
         if (amd_uncore_llc) {
                 uncore = *per_cpu_ptr(amd_uncore_llc, cpu);
-               uncore->id = get_llc_id(cpu);
+               uncore->id = per_cpu_llc_id(cpu);
  
                 uncore = amd_uncore_find_online_sibling(uncore, amd_uncore_llc);
                 *per_cpu_ptr(amd_uncore_llc, cpu) = uncore;
diff --git a/arch/x86/include/asm/cacheinfo.h b/arch/x86/include/asm/cacheinfo.h

index ce9685fc78d8ffc125eaed0aa75f9e65135bfe79..5aa061199866591a35507b55b70c2fd625e8416f 100644 (file)
--- a/arch/x86/include/asm/cacheinfo.h
+++ b/arch/x86/include/asm/cacheinfo.h
@@ -7,9 +7,6 @@ extern unsigned int memory_caching_control;
  #define CACHE_MTRR 0x01
  #define CACHE_PAT  0x02
  
-void cacheinfo_amd_init_llc_id(struct cpuinfo_x86 *c, int cpu);
-void cacheinfo_hygon_init_llc_id(struct cpuinfo_x86 *c, int cpu);
-
  void cache_disable(void);
  void cache_enable(void);
  void set_cache_aps_delayed_init(bool val);
diff --git a/arch/x86/include/asm/processor.h b/arch/x86/include/asm/processor.h

index b2cf309eed99eb96fc38a7b9f21aefa30752d98c..d529d8a9ab5ed7e5f471974326ab182b48d9edc8 100644 (file)
--- a/arch/x86/include/asm/processor.h
+++ b/arch/x86/include/asm/processor.h
@@ -99,6 +99,10 @@ struct cpuinfo_topology {
         // Logical ID mappings
         u32                     logical_pkg_id;
         u32                     logical_die_id;
+
+       // Cache level topology IDs
+       u32                     llc_id;
+       u32                     l2c_id;
  };
  
  struct cpuinfo_x86 {
@@ -689,7 +693,15 @@ extern int set_tsc_mode(unsigned int val);
  
  DECLARE_PER_CPU(u64, msr_misc_features_shadow);
  
-extern u16 get_llc_id(unsigned int cpu);
+static inline u16 per_cpu_llc_id(unsigned int cpu)
+{
+       return per_cpu(cpu_info.topo.llc_id, cpu);
+}
+
+static inline u16 per_cpu_l2c_id(unsigned int cpu)
+{
+       return per_cpu(cpu_info.topo.l2c_id, cpu);
+}
  
  #ifdef CONFIG_CPU_SUP_AMD
  extern u32 amd_get_nodes_per_socket(void);
diff --git a/arch/x86/include/asm/smp.h b/arch/x86/include/asm/smp.h

index ad98dd1d9cfb9f95ac30a67405b52dcd9eddf192..b291db463b1dbdf7cdf130426dedc75f99945857 100644 (file)
--- a/arch/x86/include/asm/smp.h
+++ b/arch/x86/include/asm/smp.h
@@ -17,8 +17,6 @@ DECLARE_PER_CPU_READ_MOSTLY(cpumask_var_t, cpu_die_map);
  /* cpus sharing the last level cache: */
  DECLARE_PER_CPU_READ_MOSTLY(cpumask_var_t, cpu_llc_shared_map);
  DECLARE_PER_CPU_READ_MOSTLY(cpumask_var_t, cpu_l2c_shared_map);
-DECLARE_PER_CPU_READ_MOSTLY(u16, cpu_llc_id);
-DECLARE_PER_CPU_READ_MOSTLY(u16, cpu_l2c_id);
  
  DECLARE_EARLY_PER_CPU_READ_MOSTLY(u16, x86_cpu_to_apicid);
  DECLARE_EARLY_PER_CPU_READ_MOSTLY(u32, x86_cpu_to_acpiid);
diff --git a/arch/x86/include/asm/topology.h b/arch/x86/include/asm/topology.h

index ac0c274bd10691414d2f716c1d6a4bc7e97926ef..5f87f6b9b09e74c1a6d01a38777bdc9856ac2f81 100644 (file)
--- a/arch/x86/include/asm/topology.h
+++ b/arch/x86/include/asm/topology.h
@@ -115,7 +115,7 @@ extern const struct cpumask *cpu_clustergroup_mask(int cpu);
  extern unsigned int __max_die_per_package;
  
  #ifdef CONFIG_SMP
-#define topology_cluster_id(cpu)               (per_cpu(cpu_l2c_id, cpu))
+#define topology_cluster_id(cpu)               (cpu_data(cpu).topo.l2c_id)
  #define topology_die_cpumask(cpu)              (per_cpu(cpu_die_map, cpu))
  #define topology_cluster_cpumask(cpu)          (cpu_clustergroup_mask(cpu))
  #define topology_core_cpumask(cpu)             (per_cpu(cpu_core_map, cpu))
diff --git a/arch/x86/kernel/apic/apic_numachip.c b/arch/x86/kernel/apic/apic_numachip.c

index 578ded9abcabc66a52ebc9288052a1b891c70377..32a5e03238944bb222baa07a09bab65882ff7c53 100644 (file)
--- a/arch/x86/kernel/apic/apic_numachip.c
+++ b/arch/x86/kernel/apic/apic_numachip.c
@@ -161,7 +161,7 @@ static void fixup_cpu_id(struct cpuinfo_x86 *c, int node)
         u64 val;
         u32 nodes = 1;
  
-       this_cpu_write(cpu_llc_id, node);
+       c->topo.llc_id = node;
  
         /* Account for nodes per socket in multi-core-module processors */
         if (boot_cpu_has(X86_FEATURE_NODEID_MSR)) {
diff --git a/arch/x86/kernel/cpu/amd.c b/arch/x86/kernel/cpu/amd.c

index a744d8d51b394999b73dc6bb13ff73fca82169e2..2cf4cb165dd9c777b2cdf8dece2f60734351357a 100644 (file)
--- a/arch/x86/kernel/cpu/amd.c
+++ b/arch/x86/kernel/cpu/amd.c
@@ -401,8 +401,6 @@ static void legacy_fixup_core_id(struct cpuinfo_x86 *c)
   */
  static void amd_get_topology(struct cpuinfo_x86 *c)
  {
-       int cpu = smp_processor_id();
-
         /* get information required for multi-node processors */
         if (boot_cpu_has(X86_FEATURE_TOPOEXT)) {
                 int err;
@@ -430,15 +428,14 @@ static void amd_get_topology(struct cpuinfo_x86 *c)
                 if (!err)
                         c->x86_coreid_bits = get_count_order(c->x86_max_cores);
  
-               cacheinfo_amd_init_llc_id(c, cpu);
+               cacheinfo_amd_init_llc_id(c);
  
         } else if (cpu_has(c, X86_FEATURE_NODEID_MSR)) {
                 u64 value;
  
                 rdmsrl(MSR_FAM10H_NODE_ID, value);
                 c->topo.die_id = value & 7;
-
-               per_cpu(cpu_llc_id, cpu) = c->topo.die_id;
+               c->topo.llc_id = c->topo.die_id;
         } else
                 return;
  
@@ -455,7 +452,6 @@ static void amd_get_topology(struct cpuinfo_x86 *c)
  static void amd_detect_cmp(struct cpuinfo_x86 *c)
  {
         unsigned bits;
-       int cpu = smp_processor_id();
  
         bits = c->x86_coreid_bits;
         /* Low order bits define the core id (index of core in socket) */
@@ -463,7 +459,7 @@ static void amd_detect_cmp(struct cpuinfo_x86 *c)
         /* Convert the initial APIC ID into the socket ID */
         c->topo.pkg_id = c->topo.initial_apicid >> bits;
         /* use socket ID also for last level cache */
-       per_cpu(cpu_llc_id, cpu) = c->topo.die_id = c->topo.pkg_id;
+       c->topo.llc_id = c->topo.die_id = c->topo.pkg_id;
  }
  
  u32 amd_get_nodes_per_socket(void)
@@ -481,7 +477,7 @@ static void srat_detect_node(struct cpuinfo_x86 *c)
  
         node = numa_cpu_node(cpu);
         if (node == NUMA_NO_NODE)
-               node = get_llc_id(cpu);
+               node = per_cpu_llc_id(cpu);
  
         /*
          * On multi-fabric platform (e.g. Numascale NumaChip) a
diff --git a/arch/x86/kernel/cpu/cacheinfo.c b/arch/x86/kernel/cpu/cacheinfo.c

index e25368787c2691f3933ffc50378e15a2405f1c3f..c131c412db89c58e820cdfa6758c4db6b59d3429 100644 (file)
--- a/arch/x86/kernel/cpu/cacheinfo.c
+++ b/arch/x86/kernel/cpu/cacheinfo.c
@@ -661,7 +661,7 @@ static int find_num_cache_leaves(struct cpuinfo_x86 *c)
         return i;
  }
  
-void cacheinfo_amd_init_llc_id(struct cpuinfo_x86 *c, int cpu)
+void cacheinfo_amd_init_llc_id(struct cpuinfo_x86 *c)
  {
         /*
          * We may have multiple LLCs if L3 caches exist, so check if we
@@ -672,13 +672,13 @@ void cacheinfo_amd_init_llc_id(struct cpuinfo_x86 *c, int cpu)
  
         if (c->x86 < 0x17) {
                 /* LLC is at the node level. */
-               per_cpu(cpu_llc_id, cpu) = c->topo.die_id;
+               c->topo.llc_id = c->topo.die_id;
         } else if (c->x86 == 0x17 && c->x86_model <= 0x1F) {
                 /*
                  * LLC is at the core complex level.
                  * Core complex ID is ApicId[3] for these processors.
                  */
-               per_cpu(cpu_llc_id, cpu) = c->topo.apicid >> 3;
+               c->topo.llc_id = c->topo.apicid >> 3;
         } else {
                 /*
                  * LLC ID is calculated from the number of threads sharing the
@@ -694,12 +694,12 @@ void cacheinfo_amd_init_llc_id(struct cpuinfo_x86 *c, int cpu)
                 if (num_sharing_cache) {
                         int bits = get_count_order(num_sharing_cache);
  
-                       per_cpu(cpu_llc_id, cpu) = c->topo.apicid >> bits;
+                       c->topo.llc_id = c->topo.apicid >> bits;
                 }
         }
  }
  
-void cacheinfo_hygon_init_llc_id(struct cpuinfo_x86 *c, int cpu)
+void cacheinfo_hygon_init_llc_id(struct cpuinfo_x86 *c)
  {
         /*
          * We may have multiple LLCs if L3 caches exist, so check if we
@@ -712,7 +712,7 @@ void cacheinfo_hygon_init_llc_id(struct cpuinfo_x86 *c, int cpu)
          * LLC is at the core complex level.
          * Core complex ID is ApicId[3] for these processors.
          */
-       per_cpu(cpu_llc_id, cpu) = c->topo.apicid >> 3;
+       c->topo.llc_id = c->topo.apicid >> 3;
  }
  
  void init_amd_cacheinfo(struct cpuinfo_x86 *c)
@@ -740,9 +740,6 @@ void init_intel_cacheinfo(struct cpuinfo_x86 *c)
         unsigned int new_l1d = 0, new_l1i = 0; /* Cache sizes from cpuid(4) */
         unsigned int new_l2 = 0, new_l3 = 0, i; /* Cache sizes from cpuid(4) */
         unsigned int l2_id = 0, l3_id = 0, num_threads_sharing, index_msb;
-#ifdef CONFIG_SMP
-       unsigned int cpu = c->cpu_index;
-#endif
  
         if (c->cpuid_level > 3) {
                 static int is_initialized;
@@ -856,30 +853,24 @@ void init_intel_cacheinfo(struct cpuinfo_x86 *c)
  
         if (new_l2) {
                 l2 = new_l2;
-#ifdef CONFIG_SMP
-               per_cpu(cpu_llc_id, cpu) = l2_id;
-               per_cpu(cpu_l2c_id, cpu) = l2_id;
-#endif
+               c->topo.llc_id = l2_id;
+               c->topo.l2c_id = l2_id;
         }
  
         if (new_l3) {
                 l3 = new_l3;
-#ifdef CONFIG_SMP
-               per_cpu(cpu_llc_id, cpu) = l3_id;
-#endif
+               c->topo.llc_id = l3_id;
         }
  
-#ifdef CONFIG_SMP
         /*
-        * If cpu_llc_id is not yet set, this means cpuid_level < 4 which in
+        * If llc_id is not yet set, this means cpuid_level < 4 which in
          * turns means that the only possibility is SMT (as indicated in
          * cpuid1). Since cpuid2 doesn't specify shared caches, and we know
          * that SMT shares all caches, we can unconditionally set cpu_llc_id to
          * c->topo.pkg_id.
          */
-       if (per_cpu(cpu_llc_id, cpu) == BAD_APICID)
-               per_cpu(cpu_llc_id, cpu) = c->topo.pkg_id;
-#endif
+       if (c->topo.llc_id == BAD_APICID)
+               c->topo.llc_id = c->topo.pkg_id;
  
         c->x86_cache_size = l3 ? l3 : (l2 ? l2 : (l1i+l1d));
  
diff --git a/arch/x86/kernel/cpu/common.c b/arch/x86/kernel/cpu/common.c

index 052bd792c6d15ce173ebfe64ffa5757a28848eaf..f73a664bdcd4cf64d1a9bd3ad13f9c571e60b414 100644 (file)
--- a/arch/x86/kernel/cpu/common.c
+++ b/arch/x86/kernel/cpu/common.c
@@ -74,18 +74,6 @@ u32 elf_hwcap2 __read_mostly;
  int smp_num_siblings = 1;
  EXPORT_SYMBOL(smp_num_siblings);
  
-/* Last level cache ID of each logical CPU */
-DEFINE_PER_CPU_READ_MOSTLY(u16, cpu_llc_id) = BAD_APICID;
-
-u16 get_llc_id(unsigned int cpu)
-{
-       return per_cpu(cpu_llc_id, cpu);
-}
-EXPORT_SYMBOL_GPL(get_llc_id);
-
-/* L2 cache ID of each logical CPU */
-DEFINE_PER_CPU_READ_MOSTLY(u16, cpu_l2c_id) = BAD_APICID;
-
  static struct ppin_info {
         int     feature;
         int     msr_ppin_ctl;
@@ -1830,6 +1818,8 @@ static void identify_cpu(struct cpuinfo_x86 *c)
         c->x86_max_cores = 1;
         c->x86_coreid_bits = 0;
         c->topo.cu_id = 0xff;
+       c->topo.llc_id = BAD_APICID;
+       c->topo.l2c_id = BAD_APICID;
  #ifdef CONFIG_X86_64
         c->x86_clflush_size = 64;
         c->x86_phys_bits = 36;
diff --git a/arch/x86/kernel/cpu/cpu.h b/arch/x86/kernel/cpu/cpu.h

index 1dcd7d4e38ef17189f42e81b6842f2dd07448405..885281ae79a54c91172445f995519ab156113861 100644 (file)
--- a/arch/x86/kernel/cpu/cpu.h
+++ b/arch/x86/kernel/cpu/cpu.h
@@ -78,6 +78,9 @@ extern int detect_ht_early(struct cpuinfo_x86 *c);
  extern void detect_ht(struct cpuinfo_x86 *c);
  extern void check_null_seg_clears_base(struct cpuinfo_x86 *c);
  
+void cacheinfo_amd_init_llc_id(struct cpuinfo_x86 *c);
+void cacheinfo_hygon_init_llc_id(struct cpuinfo_x86 *c);
+
  unsigned int aperfmperf_get_khz(int cpu);
  void cpu_select_mitigations(void);
  
diff --git a/arch/x86/kernel/cpu/hygon.c b/arch/x86/kernel/cpu/hygon.c

index f3898b5af9f30b1fc859faa6108c02e3d25a1531..332c298afd96e62d5f303c520bdf85519046ed0c 100644 (file)
--- a/arch/x86/kernel/cpu/hygon.c
+++ b/arch/x86/kernel/cpu/hygon.c
@@ -63,8 +63,6 @@ static void hygon_get_topology_early(struct cpuinfo_x86 *c)
   */
  static void hygon_get_topology(struct cpuinfo_x86 *c)
  {
-       int cpu = smp_processor_id();
-
         /* get information required for multi-node processors */
         if (boot_cpu_has(X86_FEATURE_TOPOEXT)) {
                 int err;
@@ -94,14 +92,13 @@ static void hygon_get_topology(struct cpuinfo_x86 *c)
                 if (!boot_cpu_has(X86_FEATURE_HYPERVISOR) && c->x86_model <= 0x3)
                         c->topo.pkg_id = c->topo.apicid >> APICID_SOCKET_ID_BIT;
  
-               cacheinfo_hygon_init_llc_id(c, cpu);
+               cacheinfo_hygon_init_llc_id(c);
         } else if (cpu_has(c, X86_FEATURE_NODEID_MSR)) {
                 u64 value;
  
                 rdmsrl(MSR_FAM10H_NODE_ID, value);
                 c->topo.die_id = value & 7;
-
-               per_cpu(cpu_llc_id, cpu) = c->topo.die_id;
+               c->topo.llc_id = c->topo.die_id;
         } else
                 return;
  
@@ -116,15 +113,14 @@ static void hygon_get_topology(struct cpuinfo_x86 *c)
  static void hygon_detect_cmp(struct cpuinfo_x86 *c)
  {
         unsigned int bits;
-       int cpu = smp_processor_id();
  
         bits = c->x86_coreid_bits;
         /* Low order bits define the core id (index of core in socket) */
         c->topo.core_id = c->topo.initial_apicid & ((1 << bits)-1);
         /* Convert the initial APIC ID into the socket ID */
         c->topo.pkg_id = c->topo.initial_apicid >> bits;
-       /* use socket ID also for last level cache */
-       per_cpu(cpu_llc_id, cpu) = c->topo.die_id = c->topo.pkg_id;
+       /* Use package ID also for last level cache */
+       c->topo.llc_id = c->topo.die_id = c->topo.pkg_id;
  }
  
  static void srat_detect_node(struct cpuinfo_x86 *c)
@@ -136,7 +132,7 @@ static void srat_detect_node(struct cpuinfo_x86 *c)
  
         node = numa_cpu_node(cpu);
         if (node == NUMA_NO_NODE)
-               node = per_cpu(cpu_llc_id, cpu);
+               node = c->topo.llc_id;
  
         /*
          * On multi-fabric platform (e.g. Numascale NumaChip) a
diff --git a/arch/x86/kernel/smpboot.c b/arch/x86/kernel/smpboot.c

index 82a30d0f58d9029703574dbdbfd410141ca8e20f..fa05a63b1ed855f902afd8543505c21d3347eb29 100644 (file)
--- a/arch/x86/kernel/smpboot.c
+++ b/arch/x86/kernel/smpboot.c
@@ -478,7 +478,7 @@ static bool match_smt(struct cpuinfo_x86 *c, struct cpuinfo_x86 *o)
  
                 if (c->topo.pkg_id == o->topo.pkg_id &&
                     c->topo.die_id == o->topo.die_id &&
-                   per_cpu(cpu_llc_id, cpu1) == per_cpu(cpu_llc_id, cpu2)) {
+                   per_cpu_llc_id(cpu1) == per_cpu_llc_id(cpu2)) {
                         if (c->topo.core_id == o->topo.core_id)
                                 return topology_sane(c, o, "smt");
  
@@ -510,11 +510,11 @@ static bool match_l2c(struct cpuinfo_x86 *c, struct cpuinfo_x86 *o)
         int cpu1 = c->cpu_index, cpu2 = o->cpu_index;
  
         /* If the arch didn't set up l2c_id, fall back to SMT */
-       if (per_cpu(cpu_l2c_id, cpu1) == BAD_APICID)
+       if (per_cpu_l2c_id(cpu1) == BAD_APICID)
                 return match_smt(c, o);
  
         /* Do not match if L2 cache id does not match: */
-       if (per_cpu(cpu_l2c_id, cpu1) != per_cpu(cpu_l2c_id, cpu2))
+       if (per_cpu_l2c_id(cpu1) != per_cpu_l2c_id(cpu2))
                 return false;
  
         return topology_sane(c, o, "l2c");
@@ -560,11 +560,11 @@ static bool match_llc(struct cpuinfo_x86 *c, struct cpuinfo_x86 *o)
         bool intel_snc = id && id->driver_data;
  
         /* Do not match if we do not have a valid APICID for cpu: */
-       if (per_cpu(cpu_llc_id, cpu1) == BAD_APICID)
+       if (per_cpu_llc_id(cpu1) == BAD_APICID)
                 return false;
  
         /* Do not match if LLC id does not match: */
-       if (per_cpu(cpu_llc_id, cpu1) != per_cpu(cpu_llc_id, cpu2))
+       if (per_cpu_llc_id(cpu1) != per_cpu_llc_id(cpu2))
                 return false;
  
         /*
author	Thomas Gleixner <tglx@linutronix.de>
	Mon, 14 Aug 2023 08:18:38 +0000 (10:18 +0200)
committer	Thomas Gleixner <tglx@linutronix.de>
	Tue, 10 Oct 2023 12:38:18 +0000 (14:38 +0200)
Documentation/arch/x86/topology.rst		patch \| blob \| blame \| history
arch/x86/events/amd/uncore.c		patch \| blob \| blame \| history
arch/x86/include/asm/cacheinfo.h		patch \| blob \| blame \| history
arch/x86/include/asm/processor.h		patch \| blob \| blame \| history
arch/x86/include/asm/smp.h		patch \| blob \| blame \| history
arch/x86/include/asm/topology.h		patch \| blob \| blame \| history
arch/x86/kernel/apic/apic_numachip.c		patch \| blob \| blame \| history
arch/x86/kernel/cpu/amd.c		patch \| blob \| blame \| history
arch/x86/kernel/cpu/cacheinfo.c		patch \| blob \| blame \| history
arch/x86/kernel/cpu/common.c		patch \| blob \| blame \| history
arch/x86/kernel/cpu/cpu.h		patch \| blob \| blame \| history
arch/x86/kernel/cpu/hygon.c		patch \| blob \| blame \| history
arch/x86/kernel/smpboot.c		patch \| blob \| blame \| history