Commit 41541461 authored by Andrew Morton's avatar Andrew Morton Committed by Linus Torvalds

[PATCH] fix for clusterd io_apics

From: Keith Mannthey <kmannth@us.ibm.com>

The following is a patch to fix inconsistent use of the function
set_ioapic_affinity.  In the current kernel it is unclear as to weather the
value being passed to the function is a cpu mask or valid apic id.  In
irq_affinity_write_proc the kernel passes on a cpu mask but the kirqd thread
passes on logical apic ids.  In flat apic mode this is not an issue because a
cpu mask represents the apic value.  However in clustered apic mode the cpu
mask is very different from the logical apic id.

This is an attempt to do the right thing for clustered apics.  I clarify that
the value being passed to set_ioapic_affinity is a cpu mask not a apicid.
Set_ioapic_affinity will do the conversion to logical apic ids.  Since many
cpu masks don't map to valid apicids in clustered apic mode TARGET_CPUS is
used as a default value when such a situation occurs.  I think this is a good
step in making irq_affinity clustered apic safe.
parent cab0e744
...@@ -240,22 +240,22 @@ static void clear_IO_APIC (void) ...@@ -240,22 +240,22 @@ static void clear_IO_APIC (void)
clear_IO_APIC_pin(apic, pin); clear_IO_APIC_pin(apic, pin);
} }
static void set_ioapic_affinity (unsigned int irq, unsigned long mask) static void set_ioapic_affinity (unsigned int irq, unsigned long cpu_mask)
{ {
unsigned long flags; unsigned long flags;
int pin; int pin;
struct irq_pin_list *entry = irq_2_pin + irq; struct irq_pin_list *entry = irq_2_pin + irq;
unsigned int apicid_value;
/*
* Only the first 8 bits are valid. apicid_value = cpu_mask_to_apicid(cpu_mask);
*/ /* Prepare to do the io_apic_write */
mask = mask << 24; apicid_value = apicid_value << 24;
spin_lock_irqsave(&ioapic_lock, flags); spin_lock_irqsave(&ioapic_lock, flags);
for (;;) { for (;;) {
pin = entry->pin; pin = entry->pin;
if (pin == -1) if (pin == -1)
break; break;
io_apic_write(entry->apic, 0x10 + 1 + pin*2, mask); io_apic_write(entry->apic, 0x10 + 1 + pin*2, apicid_value);
if (!entry->next) if (!entry->next)
break; break;
entry = irq_2_pin + entry->next; entry = irq_2_pin + entry->next;
...@@ -279,7 +279,7 @@ static void set_ioapic_affinity (unsigned int irq, unsigned long mask) ...@@ -279,7 +279,7 @@ static void set_ioapic_affinity (unsigned int irq, unsigned long mask)
extern unsigned long irq_affinity[NR_IRQS]; extern unsigned long irq_affinity[NR_IRQS];
static int __cacheline_aligned pending_irq_balance_apicid[NR_IRQS]; static int __cacheline_aligned pending_irq_balance_cpumask[NR_IRQS];
#define IRQBALANCE_CHECK_ARCH -999 #define IRQBALANCE_CHECK_ARCH -999
static int irqbalance_disabled = IRQBALANCE_CHECK_ARCH; static int irqbalance_disabled = IRQBALANCE_CHECK_ARCH;
...@@ -356,7 +356,7 @@ static inline void balance_irq(int cpu, int irq) ...@@ -356,7 +356,7 @@ static inline void balance_irq(int cpu, int irq)
unsigned long flags; unsigned long flags;
spin_lock_irqsave(&desc->lock, flags); spin_lock_irqsave(&desc->lock, flags);
pending_irq_balance_apicid[irq]=cpu_to_logical_apicid(new_cpu); pending_irq_balance_cpumask[irq] = 1 << new_cpu;
spin_unlock_irqrestore(&desc->lock, flags); spin_unlock_irqrestore(&desc->lock, flags);
} }
} }
...@@ -553,8 +553,7 @@ static void do_irq_balance(void) ...@@ -553,8 +553,7 @@ static void do_irq_balance(void)
selected_irq, min_loaded); selected_irq, min_loaded);
/* mark for change destination */ /* mark for change destination */
spin_lock_irqsave(&desc->lock, flags); spin_lock_irqsave(&desc->lock, flags);
pending_irq_balance_apicid[selected_irq] = pending_irq_balance_cpumask[selected_irq] = 1 << min_loaded;
cpu_to_logical_apicid(min_loaded);
spin_unlock_irqrestore(&desc->lock, flags); spin_unlock_irqrestore(&desc->lock, flags);
/* Since we made a change, come back sooner to /* Since we made a change, come back sooner to
* check for more variation. * check for more variation.
...@@ -586,7 +585,7 @@ int balanced_irq(void *unused) ...@@ -586,7 +585,7 @@ int balanced_irq(void *unused)
/* push everything to CPU 0 to give us a starting point. */ /* push everything to CPU 0 to give us a starting point. */
for (i = 0 ; i < NR_IRQS ; i++) for (i = 0 ; i < NR_IRQS ; i++)
pending_irq_balance_apicid[i] = cpu_to_logical_apicid(0); pending_irq_balance_cpumask[i] = 1;
repeat: repeat:
set_current_state(TASK_INTERRUPTIBLE); set_current_state(TASK_INTERRUPTIBLE);
...@@ -663,9 +662,9 @@ static void set_ioapic_affinity (unsigned int irq, unsigned long mask); ...@@ -663,9 +662,9 @@ static void set_ioapic_affinity (unsigned int irq, unsigned long mask);
static inline void move_irq(int irq) static inline void move_irq(int irq)
{ {
/* note - we hold the desc->lock */ /* note - we hold the desc->lock */
if (unlikely(pending_irq_balance_apicid[irq])) { if (unlikely(pending_irq_balance_cpumask[irq])) {
set_ioapic_affinity(irq, pending_irq_balance_apicid[irq]); set_ioapic_affinity(irq, pending_irq_balance_cpumask[irq]);
pending_irq_balance_apicid[irq] = 0; pending_irq_balance_cpumask[irq] = 0;
} }
} }
......
...@@ -34,10 +34,12 @@ static inline unsigned long check_apicid_used(unsigned long bitmap, int apicid) ...@@ -34,10 +34,12 @@ static inline unsigned long check_apicid_used(unsigned long bitmap, int apicid)
return 0; return 0;
} }
static inline unsigned long check_apicid_present(int bit) static inline unsigned long check_apicid_present(int bit)
{ {
return (phys_cpu_present_map & (1 << bit)); return (phys_cpu_present_map & (1 << bit));
} }
#define apicid_cluster(apicid) (apicid & 0xF0)
static inline unsigned long calculate_ldr(unsigned long old) static inline unsigned long calculate_ldr(unsigned long old)
{ {
unsigned long id; unsigned long id;
...@@ -134,4 +136,37 @@ static inline unsigned get_apic_id(unsigned long x) ...@@ -134,4 +136,37 @@ static inline unsigned get_apic_id(unsigned long x)
#define GET_APIC_ID(x) get_apic_id(x) #define GET_APIC_ID(x) get_apic_id(x)
static inline unsigned int cpu_mask_to_apicid (unsigned long cpumask)
{
int num_bits_set;
int cpus_found = 0;
int cpu;
int apicid;
num_bits_set = hweight32(cpumask);
/* Return id to all */
if (num_bits_set == 32)
return (int) 0xFF;
/*
* The cpus in the mask must all be on the apic cluster. If are not
* on the same apicid cluster return default value of TARGET_CPUS.
*/
cpu = ffs(cpumask)-1;
apicid = cpu_to_logical_apicid(cpu);
while (cpus_found < num_bits_set) {
if (cpumask & (1 << cpu)) {
int new_apicid = cpu_to_logical_apicid(cpu);
if (apicid_cluster(apicid) !=
apicid_cluster(new_apicid)){
printk ("%s: Not a valid mask!\n",__FUNCTION__);
return TARGET_CPUS;
}
apicid = apicid | new_apicid;
cpus_found++;
}
cpu++;
}
return apicid;
}
#endif /* __ASM_MACH_APIC_H */ #endif /* __ASM_MACH_APIC_H */
...@@ -120,4 +120,9 @@ static inline int apic_id_registered(void) ...@@ -120,4 +120,9 @@ static inline int apic_id_registered(void)
&phys_cpu_present_map)); &phys_cpu_present_map));
} }
static inline unsigned int cpu_mask_to_apicid (unsigned long cpumask)
{
return cpumask;
}
#endif /* __ASM_MACH_APIC_H */ #endif /* __ASM_MACH_APIC_H */
...@@ -17,6 +17,7 @@ ...@@ -17,6 +17,7 @@
#define APIC_BROADCAST_ID 0x0F #define APIC_BROADCAST_ID 0x0F
#define check_apicid_used(bitmap, apicid) ((bitmap) & (1 << (apicid))) #define check_apicid_used(bitmap, apicid) ((bitmap) & (1 << (apicid)))
#define check_apicid_present(bit) (phys_cpu_present_map & (1 << bit)) #define check_apicid_present(bit) (phys_cpu_present_map & (1 << bit))
#define apicid_cluster(apicid) (apicid & 0xF0)
static inline int apic_id_registered(void) static inline int apic_id_registered(void)
{ {
...@@ -115,4 +116,37 @@ static inline unsigned get_apic_id(unsigned long x) ...@@ -115,4 +116,37 @@ static inline unsigned get_apic_id(unsigned long x)
#define GET_APIC_ID(x) get_apic_id(x) #define GET_APIC_ID(x) get_apic_id(x)
static inline unsigned int cpu_mask_to_apicid (unsigned long cpumask)
{
int num_bits_set;
int cpus_found = 0;
int cpu;
int apicid;
num_bits_set = hweight32(cpumask);
/* Return id to all */
if (num_bits_set == 32)
return (int) 0xFF;
/*
* The cpus in the mask must all be on the apic cluster. If are not
* on the same apicid cluster return default value of TARGET_CPUS.
*/
cpu = ffs(cpumask)-1;
apicid = cpu_to_logical_apicid(cpu);
while (cpus_found < num_bits_set) {
if (cpumask & (1 << cpu)) {
int new_apicid = cpu_to_logical_apicid(cpu);
if (apicid_cluster(apicid) !=
apicid_cluster(new_apicid)){
printk ("%s: Not a valid mask!\n",__FUNCTION__);
return TARGET_CPUS;
}
apicid = apicid | new_apicid;
cpus_found++;
}
cpu++;
}
return apicid;
}
#endif /* __ASM_MACH_APIC_H */ #endif /* __ASM_MACH_APIC_H */
...@@ -34,7 +34,7 @@ static inline unsigned long target_cpus(void) ...@@ -34,7 +34,7 @@ static inline unsigned long target_cpus(void)
#define APIC_BROADCAST_ID (0x0F) #define APIC_BROADCAST_ID (0x0F)
static inline unsigned long check_apicid_used(unsigned long bitmap, int apicid) static inline unsigned long check_apicid_used(unsigned long bitmap, int apicid)
{ {
return (x86_summit ? 0 : (bitmap & (1 << apicid))); return (x86_summit ? 0 : (bitmap & (1 << apicid)));
} }
...@@ -44,6 +44,8 @@ static inline unsigned long check_apicid_present(int bit) ...@@ -44,6 +44,8 @@ static inline unsigned long check_apicid_present(int bit)
return (x86_summit ? 1 : (phys_cpu_present_map & (1 << bit))); return (x86_summit ? 1 : (phys_cpu_present_map & (1 << bit)));
} }
#define apicid_cluster(apicid) (apicid & 0xF0)
extern u8 bios_cpu_apicid[]; extern u8 bios_cpu_apicid[];
static inline void init_apic_ldr(void) static inline void init_apic_ldr(void)
...@@ -142,4 +144,37 @@ static inline unsigned get_apic_id(unsigned long x) ...@@ -142,4 +144,37 @@ static inline unsigned get_apic_id(unsigned long x)
#define GET_APIC_ID(x) get_apic_id(x) #define GET_APIC_ID(x) get_apic_id(x)
static inline unsigned int cpu_mask_to_apicid (unsigned long cpumask)
{
int num_bits_set;
int cpus_found = 0;
int cpu;
int apicid;
num_bits_set = hweight32(cpumask);
/* Return id to all */
if (num_bits_set == 32)
return (int) 0xFF;
/*
* The cpus in the mask must all be on the apic cluster. If are not
* on the same apicid cluster return default value of TARGET_CPUS.
*/
cpu = ffs(cpumask)-1;
apicid = cpu_to_logical_apicid(cpu);
while (cpus_found < num_bits_set) {
if (cpumask & (1 << cpu)) {
int new_apicid = cpu_to_logical_apicid(cpu);
if (apicid_cluster(apicid) !=
apicid_cluster(new_apicid)){
printk ("%s: Not a valid mask!\n",__FUNCTION__);
return TARGET_CPUS;
}
apicid = apicid | new_apicid;
cpus_found++;
}
cpu++;
}
return apicid;
}
#endif /* __ASM_MACH_APIC_H */ #endif /* __ASM_MACH_APIC_H */
...@@ -77,4 +77,8 @@ static inline int check_phys_apicid_present(int boot_cpu_physical_apicid) ...@@ -77,4 +77,8 @@ static inline int check_phys_apicid_present(int boot_cpu_physical_apicid)
return test_bit(boot_cpu_physical_apicid, &phys_cpu_present_map); return test_bit(boot_cpu_physical_apicid, &phys_cpu_present_map);
} }
static inline unsigned int cpu_mask_to_apicid (unsigned long cpumask)
{
return cpumask;
}
#endif /* __ASM_MACH_APIC_H */ #endif /* __ASM_MACH_APIC_H */
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment