x86/apic: Optimize cpu traversal in __assign_irq_vector() using domain membership
authorSuresh Siddha <suresh.b.siddha@intel.com>
Mon, 25 Jun 2012 20:38:27 +0000 (13:38 -0700)
committerIngo Molnar <mingo@kernel.org>
Fri, 6 Jul 2012 09:00:21 +0000 (11:00 +0200)
Currently __assign_irq_vector() goes through each cpu in the
specified mask until it finds a free vector in all the cpu's
that are part of the same interrupt domain. We visit all the
interrupt domain sibling cpus to reserve the free vector. So,
when we fail to find a free vector in an interrupt domain, it is
safe to continue our search with a cpu belonging to a new
interrupt domain. No need to go through each cpu, if the domain
containing that cpu is already visited.

Use the irq_cfg's old_domain to track the visited domains and
optimize the cpu traversal while finding a free vector in the
given cpumask.

NOTE: We can also optimize the search by using for_each_cpu() and
skip the current cpu, if it is not the first cpu in the mask
returned by the vector_allocation_domain(). But re-using the
cfg->old_domain to track the visited domains will be slightly
faster.

Signed-off-by: Suresh Siddha <suresh.b.siddha@intel.com>
Acked-by: Yinghai Lu <yinghai@kernel.org>
Acked-by: Alexander Gordeev <agordeev@redhat.com>
Acked-by: Cyrill Gorcunov <gorcunov@openvz.org>
Link: http://lkml.kernel.org/r/1340656709-11423-2-git-send-email-suresh.b.siddha@intel.com
Signed-off-by: Ingo Molnar <mingo@kernel.org>
arch/x86/include/asm/apic.h
arch/x86/kernel/apic/apic_noop.c
arch/x86/kernel/apic/io_apic.c
arch/x86/kernel/apic/x2apic_cluster.c
arch/x86/kernel/vsmp_64.c

index eec240e120912bded87b854b2cbeffec16b9eb44..8bebeb8952fb2fc7a24b08f49ce5ab97a210f4fc 100644 (file)
@@ -306,7 +306,7 @@ struct apic {
        unsigned long (*check_apicid_used)(physid_mask_t *map, int apicid);
        unsigned long (*check_apicid_present)(int apicid);
 
-       bool (*vector_allocation_domain)(int cpu, struct cpumask *retmask);
+       void (*vector_allocation_domain)(int cpu, struct cpumask *retmask);
        void (*init_apic_ldr)(void);
 
        void (*ioapic_phys_id_map)(physid_mask_t *phys_map, physid_mask_t *retmap);
@@ -614,7 +614,7 @@ default_cpu_mask_to_apicid_and(const struct cpumask *cpumask,
                               const struct cpumask *andmask,
                               unsigned int *apicid);
 
-static inline bool
+static inline void
 flat_vector_allocation_domain(int cpu, struct cpumask *retmask)
 {
        /* Careful. Some cpus do not strictly honor the set of cpus
@@ -627,14 +627,12 @@ flat_vector_allocation_domain(int cpu, struct cpumask *retmask)
         */
        cpumask_clear(retmask);
        cpumask_bits(retmask)[0] = APIC_ALL_CPUS;
-       return false;
 }
 
-static inline bool
+static inline void
 default_vector_allocation_domain(int cpu, struct cpumask *retmask)
 {
        cpumask_copy(retmask, cpumask_of(cpu));
-       return true;
 }
 
 static inline unsigned long default_check_apicid_used(physid_mask_t *map, int apicid)
index 65c07fc630a14d01568248675876f9d7df92d8ce..08c337bc49ffa9c39d6fa07c1891a7030e18a813 100644 (file)
@@ -100,12 +100,11 @@ static unsigned long noop_check_apicid_present(int bit)
        return physid_isset(bit, phys_cpu_present_map);
 }
 
-static bool noop_vector_allocation_domain(int cpu, struct cpumask *retmask)
+static void noop_vector_allocation_domain(int cpu, struct cpumask *retmask)
 {
        if (cpu != 0)
                pr_warning("APIC: Vector allocated for non-BSP cpu\n");
        cpumask_copy(retmask, cpumask_of(cpu));
-       return true;
 }
 
 static u32 noop_apic_read(u32 reg)
index a951ef7decb10984340401e260c3d61b747215bd..8a08f09aa50513ffa5f7768a8ba1972290d86629 100644 (file)
@@ -1134,12 +1134,13 @@ __assign_irq_vector(int irq, struct irq_cfg *cfg, const struct cpumask *mask)
 
        /* Only try and allocate irqs on cpus that are present */
        err = -ENOSPC;
-       for_each_cpu_and(cpu, mask, cpu_online_mask) {
+       cpumask_clear(cfg->old_domain);
+       cpu = cpumask_first_and(mask, cpu_online_mask);
+       while (cpu < nr_cpu_ids) {
                int new_cpu;
                int vector, offset;
-               bool more_domains;
 
-               more_domains = apic->vector_allocation_domain(cpu, tmp_mask);
+               apic->vector_allocation_domain(cpu, tmp_mask);
 
                if (cpumask_subset(tmp_mask, cfg->domain)) {
                        free_cpumask_var(tmp_mask);
@@ -1156,10 +1157,10 @@ next:
                }
 
                if (unlikely(current_vector == vector)) {
-                       if (more_domains)
-                               continue;
-                       else
-                               break;
+                       cpumask_or(cfg->old_domain, cfg->old_domain, tmp_mask);
+                       cpumask_andnot(tmp_mask, mask, cfg->old_domain);
+                       cpu = cpumask_first_and(tmp_mask, cpu_online_mask);
+                       continue;
                }
 
                if (test_bit(vector, used_vectors))
index 943d03fc6fc499b1f1687009791203191732fcde..b5d889b5659ac4d9c9e91980bccb3dcb93fd6dd1 100644 (file)
@@ -212,11 +212,10 @@ static int x2apic_cluster_probe(void)
 /*
  * Each x2apic cluster is an allocation domain.
  */
-static bool cluster_vector_allocation_domain(int cpu, struct cpumask *retmask)
+static void cluster_vector_allocation_domain(int cpu, struct cpumask *retmask)
 {
        cpumask_clear(retmask);
        cpumask_copy(retmask, per_cpu(cpus_in_cluster, cpu));
-       return true;
 }
 
 static struct apic apic_x2apic_cluster = {
index fa5adb7c228c76805494038b5cf3015db7cc070e..3f0285ac00fa6536a19e9a6817fdcbc92c52c4ae 100644 (file)
@@ -208,10 +208,9 @@ static int apicid_phys_pkg_id(int initial_apic_id, int index_msb)
  * In vSMP, all cpus should be capable of handling interrupts, regardless of
  * the APIC used.
  */
-static bool fill_vector_allocation_domain(int cpu, struct cpumask *retmask)
+static void fill_vector_allocation_domain(int cpu, struct cpumask *retmask)
 {
        cpumask_setall(retmask);
-       return false;
 }
 
 static void vsmp_apic_post_init(void)