Commit 5f7f4b36, authored by Zwane Mwaikambo, committed by Linus Torvalds

[PATCH] out-of-line locks / ppc64

Signed-off-by: Zwane Mwaikambo <zwane@fsmlabs.com>
Signed-off-by: Linus Torvalds <torvalds@osdl.org>
parent c3892c11
...@@ -158,6 +158,20 @@ static __inline__ void timer_sync_xtime( unsigned long cur_tb ) ...@@ -158,6 +158,20 @@ static __inline__ void timer_sync_xtime( unsigned long cur_tb )
} }
} }
#ifdef CONFIG_SMP
/*
 * profile_pc - pick the address a profiling sample is reported at.
 * @regs: register state of the sampled context.
 *
 * Returns the sampled instruction pointer, except when it lies inside the
 * lock text [__lock_text_start, __lock_text_end); in that case the saved
 * link register (regs->link) is returned instead.
 *
 * __lock_text_end is the linker-provided end marker of the lock section,
 * i.e. the first address past it, so the upper bound must be exclusive:
 * with "<=" a sample on the first instruction following the lock text
 * would be reported at regs->link as well.
 *
 * NOTE(review): regs->link presumably still holds the lock function's
 * return address at sample time -- confirm for lock routines that make
 * calls of their own.
 */
unsigned long profile_pc(struct pt_regs *regs)
{
	unsigned long pc = instruction_pointer(regs);
	unsigned long lock_start = (unsigned long)&__lock_text_start;
	unsigned long lock_end = (unsigned long)&__lock_text_end;

	if (pc >= lock_start && pc < lock_end)
		return regs->link;

	return pc;
}
EXPORT_SYMBOL(profile_pc);
#endif
#ifdef CONFIG_PPC_ISERIES #ifdef CONFIG_PPC_ISERIES
/* /*
......
...@@ -14,6 +14,7 @@ SECTIONS ...@@ -14,6 +14,7 @@ SECTIONS
.text : { .text : {
*(.text .text.*) *(.text .text.*)
SCHED_TEXT SCHED_TEXT
LOCK_TEXT
*(.fixup) *(.fixup)
. = ALIGN(4096); . = ALIGN(4096);
_etext = .; _etext = .;
......
...@@ -22,26 +22,9 @@ ...@@ -22,26 +22,9 @@
#ifndef CONFIG_SPINLINE #ifndef CONFIG_SPINLINE
/*
* On a system with shared processors (that is, where a physical
* processor is multiplexed between several virtual processors),
* there is no point spinning on a lock if the holder of the lock
* isn't currently scheduled on a physical processor. Instead
* we detect this situation and ask the hypervisor to give the
* rest of our timeslice to the lock holder.
*
* So that we can tell which virtual processor is holding a lock,
* we put 0x80000000 | smp_processor_id() in the lock when it is
* held. Conveniently, we have a word in the paca that holds this
* value.
*/
/* waiting for a spinlock... */ /* waiting for a spinlock... */
#if defined(CONFIG_PPC_SPLPAR) || defined(CONFIG_PPC_ISERIES) #if defined(CONFIG_PPC_SPLPAR) || defined(CONFIG_PPC_ISERIES)
/* We only yield to the hypervisor if we are in shared processor mode */
#define SHARED_PROCESSOR (get_paca()->lppaca.xSharedProc)
void __spin_yield(spinlock_t *lock) void __spin_yield(spinlock_t *lock)
{ {
unsigned int lock_value, holder_cpu, yield_count; unsigned int lock_value, holder_cpu, yield_count;
...@@ -68,96 +51,11 @@ void __spin_yield(spinlock_t *lock) ...@@ -68,96 +51,11 @@ void __spin_yield(spinlock_t *lock)
#endif #endif
} }
#else /* SPLPAR || ISERIES */
#define __spin_yield(x) barrier()
#define SHARED_PROCESSOR 0
#endif
/*
 * Make one attempt to take the spinlock.
 *
 * This returns the old value in the lock, so we succeeded
 * in getting the lock if the return value is 0.  A non-zero
 * return means the lock word was already set and nothing was
 * stored to it.
 */
static __inline__ unsigned long __spin_trylock(spinlock_t *lock)
{
/* tmp receives the old lock word, tmp2 the token that gets stored. */
unsigned long tmp, tmp2;
/*
 * The token is loaded once, before the loop, from the lock_token
 * field at its offset from r13 (presumably the paca pointer --
 * confirm).  At 1: the lock word is loaded with a reservation; if it
 * is non-zero we branch straight to 2: without storing.  Otherwise
 * stwcx. tries to store the token and the sequence restarts at 1:
 * when the store fails.  The isync is executed on the success path
 * only.
 */
__asm__ __volatile__(
" lwz %1,%3(13) # __spin_trylock\n\
1: lwarx %0,0,%2\n\
cmpwi 0,%0,0\n\
bne- 2f\n\
stwcx. %1,0,%2\n\
bne- 1b\n\
isync\n\
2:" : "=&r" (tmp), "=&r" (tmp2)
: "r" (&lock->lock), "i" (offsetof(struct paca_struct, lock_token))
: "cr0", "memory");
return tmp;
}
/*
 * Try once to take the spinlock without waiting.
 * Returns 1 when the lock was obtained and 0 when it was not.
 */
int _raw_spin_trylock(spinlock_t *lock)
{
	unsigned long previous = __spin_trylock(lock);

	/* __spin_trylock() hands back the old lock word; 0 means success. */
	return previous == 0;
}
EXPORT_SYMBOL(_raw_spin_trylock);
/*
 * Take the spinlock, waiting for as long as it takes.
 *
 * Each round starts with one trylock.  When that fails we wait, with
 * HMT_low() in effect, until the lock word reads 0, calling
 * __spin_yield() on every pass if SHARED_PROCESSOR is set; then
 * HMT_medium() is issued and the trylock is repeated.
 */
void _raw_spin_lock(spinlock_t *lock)
{
	for (;;) {
		if (likely(__spin_trylock(lock) == 0))
			return;

		/* Lock is held: wait for the lock word to clear. */
		do {
			HMT_low();
			if (SHARED_PROCESSOR) {
				__spin_yield(lock);
			}
		} while (likely(lock->lock != 0));

		HMT_medium();
	}
}
EXPORT_SYMBOL(_raw_spin_lock);
/*
 * Take the spinlock like _raw_spin_lock(), but while waiting for a held
 * lock run with the interrupt state given in @flags.
 *
 * The current interrupt state is saved before @flags is restored and is
 * put back after the wait, before the next trylock.
 */
void _raw_spin_lock_flags(spinlock_t *lock, unsigned long flags)
{
	unsigned long saved_flags;

	for (;;) {
		if (likely(__spin_trylock(lock) == 0))
			return;

		/* Remember the current state, then wait under the caller's flags. */
		local_save_flags(saved_flags);
		local_irq_restore(flags);

		do {
			HMT_low();
			if (SHARED_PROCESSOR) {
				__spin_yield(lock);
			}
		} while (likely(lock->lock != 0));

		HMT_medium();
		/* Back to the state we had on entry to the wait. */
		local_irq_restore(saved_flags);
	}
}
EXPORT_SYMBOL(_raw_spin_lock_flags);
/*
 * Wait until the lock word reads 0, without taking the lock.
 *
 * While waiting, HMT_low() is issued on every pass and __spin_yield()
 * is called if SHARED_PROCESSOR is set.  HMT_medium() is always issued
 * before returning.
 */
void spin_unlock_wait(spinlock_t *lock)
{
	for (;;) {
		if (!lock->lock)
			break;

		HMT_low();
		if (SHARED_PROCESSOR) {
			__spin_yield(lock);
		}
	}

	HMT_medium();
}
EXPORT_SYMBOL(spin_unlock_wait);
/* /*
* Waiting for a read lock or a write lock on a rwlock... * Waiting for a read lock or a write lock on a rwlock...
* This turns out to be the same for read and write locks, since * This turns out to be the same for read and write locks, since
* we only know the holder if it is write-locked. * we only know the holder if it is write-locked.
*/ */
#if defined(CONFIG_PPC_SPLPAR) || defined(CONFIG_PPC_ISERIES)
void __rw_yield(rwlock_t *rw) void __rw_yield(rwlock_t *rw)
{ {
int lock_value; int lock_value;
...@@ -184,118 +82,18 @@ void __rw_yield(rwlock_t *rw) ...@@ -184,118 +82,18 @@ void __rw_yield(rwlock_t *rw)
yield_count); yield_count);
#endif #endif
} }
#else /* SPLPAR || ISERIES */
#define __rw_yield(x) barrier()
#endif #endif
/* void spin_unlock_wait(spinlock_t *lock)
* This returns the old value in the lock + 1,
* so we got a read lock if the return value is > 0.
*/
static __inline__ long __read_trylock(rwlock_t *rw)
{
/* Receives the sign-extended lock word plus one; this is the return value. */
long tmp;
/*
 * Make one attempt to take a read lock on rw.
 *
 * The lock word is loaded with a reservation, sign-extended and
 * incremented.  If the incremented value is <= 0 we branch to 2:
 * without storing; otherwise stwcx. tries to store it and the
 * sequence restarts at 1: when the store fails.  The isync is
 * executed on the success path only.  "xer" is listed as clobbered
 * because addic. writes the carry bit.
 */
__asm__ __volatile__(
"1: lwarx %0,0,%1 # read_trylock\n\
extsw %0,%0\n\
addic. %0,%0,1\n\
ble- 2f\n\
stwcx. %0,0,%1\n\
bne- 1b\n\
isync\n\
2:" : "=&r" (tmp)
: "r" (&rw->lock)
: "cr0", "xer", "memory");
return tmp;
}
/*
 * Try once to take a read lock without waiting.
 * Returns 1 when the read lock was obtained and 0 when it was not.
 */
int _raw_read_trylock(rwlock_t *rw)
{
	long incremented = __read_trylock(rw);

	/* __read_trylock() hands back old value + 1; positive means success. */
	return incremented > 0;
}
EXPORT_SYMBOL(_raw_read_trylock);
/*
 * Take a read lock, waiting for as long as it takes.
 *
 * Each round starts with one read-trylock.  When that fails we wait,
 * with HMT_low() in effect, for as long as the lock word is negative,
 * calling __rw_yield() on every pass if SHARED_PROCESSOR is set; then
 * HMT_medium() is issued and the trylock is repeated.
 */
void _raw_read_lock(rwlock_t *rw)
{
	for (;;) {
		if (likely(__read_trylock(rw) > 0))
			return;

		/* Could not get in: wait until the lock word is no longer negative. */
		do {
			HMT_low();
			if (SHARED_PROCESSOR) {
				__rw_yield(rw);
			}
		} while (likely(rw->lock < 0));

		HMT_medium();
	}
}
EXPORT_SYMBOL(_raw_read_lock);
/*
 * Drop a read lock: atomically decrement the lock word of @rw.
 *
 * After the leading eieio, the word is loaded with a reservation,
 * decremented, and stored back with stwcx.; the sequence restarts at 1:
 * whenever the conditional store fails.
 *
 * addic writes the carry bit in XER, so "xer" has to be in the clobber
 * list (as it already is for the addic. in __read_trylock()); without it
 * the compiler may assume the carry survives this asm.
 *
 * NOTE(review): eieio does not order earlier loads against the store
 * that releases the lock; the inline variant of this function used
 * lwsync here -- confirm which barrier is intended.
 */
void _raw_read_unlock(rwlock_t *rw)
{
	long tmp;	/* scratch register for the decremented lock word */

	__asm__ __volatile__(
"eieio # read_unlock\n\
1: lwarx %0,0,%1\n\
addic %0,%0,-1\n\
stwcx. %0,0,%1\n\
bne- 1b"
	: "=&r"(tmp)
	: "r"(&rw->lock)
	: "cr0", "xer", "memory");
}
EXPORT_SYMBOL(_raw_read_unlock);
/*
 * Make one attempt to take the write lock.
 *
 * This returns the old value in the lock,
 * so we got the write lock if the return value is 0.
 * A non-zero return means the lock word was already set and
 * nothing was stored to it.
 */
static __inline__ long __write_trylock(rwlock_t *rw)
{
/* tmp receives the old lock word, tmp2 the token that gets stored. */
long tmp, tmp2;
/*
 * The token is loaded once, before the loop, from the lock_token
 * field at its offset from r13 (presumably the paca pointer --
 * confirm).  At 1: the lock word is loaded with a reservation; if it
 * is non-zero we branch straight to 2: without storing.  Otherwise
 * stwcx. tries to store the token and the sequence restarts at 1:
 * when the store fails.  The isync is executed on the success path
 * only.
 */
__asm__ __volatile__(
" lwz %1,%3(13) # write_trylock\n\
1: lwarx %0,0,%2\n\
cmpwi 0,%0,0\n\
bne- 2f\n\
stwcx. %1,0,%2\n\
bne- 1b\n\
isync\n\
2:" : "=&r" (tmp), "=&r" (tmp2)
: "r" (&rw->lock), "i" (offsetof(struct paca_struct, lock_token))
: "cr0", "memory");
return tmp;
}
/*
 * Try once to take the write lock without waiting.
 * Returns 1 when the write lock was obtained and 0 when it was not.
 */
int _raw_write_trylock(rwlock_t *rw)
{
	long previous = __write_trylock(rw);

	/* __write_trylock() hands back the old lock word; 0 means success. */
	return previous == 0;
}
EXPORT_SYMBOL(_raw_write_trylock);
void _raw_write_lock(rwlock_t *rw)
{ {
while (1) { while (lock->lock) {
if (likely(__write_trylock(rw) == 0)) HMT_low();
break; if (SHARED_PROCESSOR)
do { __spin_yield(lock);
HMT_low();
if (SHARED_PROCESSOR)
__rw_yield(rw);
} while (likely(rw->lock != 0));
HMT_medium();
} }
HMT_medium();
} }
EXPORT_SYMBOL(_raw_write_lock); EXPORT_SYMBOL(spin_unlock_wait);
#endif /* CONFIG_SPINLINE */ #endif /* CONFIG_SPINLINE */
...@@ -69,7 +69,12 @@ struct pt_regs32 { ...@@ -69,7 +69,12 @@ struct pt_regs32 {
#define __SIGNAL_FRAMESIZE32 64 #define __SIGNAL_FRAMESIZE32 64
#define instruction_pointer(regs) ((regs)->nip) #define instruction_pointer(regs) ((regs)->nip)
#ifdef CONFIG_SMP
extern unsigned long profile_pc(struct pt_regs *regs);
#else
#define profile_pc(regs) instruction_pointer(regs) #define profile_pc(regs) instruction_pointer(regs)
#endif
#define user_mode(regs) ((((regs)->msr) >> MSR_PR_LG) & 0x1) #define user_mode(regs) ((((regs)->msr) >> MSR_PR_LG) & 0x1)
#define force_successful_syscall_return() \ #define force_successful_syscall_return() \
......
...@@ -6,6 +6,8 @@ ...@@ -6,6 +6,8 @@
* *
* Copyright (C) 2001-2004 Paul Mackerras <paulus@au.ibm.com>, IBM * Copyright (C) 2001-2004 Paul Mackerras <paulus@au.ibm.com>, IBM
* Copyright (C) 2001 Anton Blanchard <anton@au.ibm.com>, IBM * Copyright (C) 2001 Anton Blanchard <anton@au.ibm.com>, IBM
* Copyright (C) 2002 Dave Engebretsen <engebret@us.ibm.com>, IBM
* Rework to support virtual processors
* *
* Type of int is used as a full 64b word is not necessary. * Type of int is used as a full 64b word is not necessary.
* *
...@@ -16,6 +18,8 @@ ...@@ -16,6 +18,8 @@
*/ */
#include <linux/config.h> #include <linux/config.h>
#include <asm/paca.h> #include <asm/paca.h>
#include <asm/hvcall.h>
#include <asm/iSeries/HvCall.h>
typedef struct { typedef struct {
volatile unsigned int lock; volatile unsigned int lock;
...@@ -34,101 +38,91 @@ static __inline__ void _raw_spin_unlock(spinlock_t *lock) ...@@ -34,101 +38,91 @@ static __inline__ void _raw_spin_unlock(spinlock_t *lock)
} }
/* /*
* Normally we use the spinlock functions in arch/ppc64/lib/locks.c. * On a system with shared processors (that is, where a physical
* For special applications such as profiling, we can have the * processor is multiplexed between several virtual processors),
* spinlock functions inline by defining CONFIG_SPINLINE. * there is no point spinning on a lock if the holder of the lock
* This is not recommended on partitioned systems with shared * isn't currently scheduled on a physical processor. Instead
* processors, since the inline spinlock functions don't include * we detect this situation and ask the hypervisor to give the
* the code for yielding the CPU to the lock holder. * rest of our timeslice to the lock holder.
*
* So that we can tell which virtual processor is holding a lock,
* we put 0x80000000 | smp_processor_id() in the lock when it is
* held. Conveniently, we have a word in the paca that holds this
* value.
*/ */
#ifndef CONFIG_SPINLINE #if defined(CONFIG_PPC_SPLPAR) || defined(CONFIG_PPC_ISERIES)
extern int _raw_spin_trylock(spinlock_t *lock); /* We only yield to the hypervisor if we are in shared processor mode */
extern void _raw_spin_lock(spinlock_t *lock); #define SHARED_PROCESSOR (get_paca()->lppaca.xSharedProc)
extern void _raw_spin_lock_flags(spinlock_t *lock, unsigned long flags); extern void __spin_yield(spinlock_t *lock);
extern void __rw_yield(spinlock_t *lock);
#else /* SPLPAR || ISERIES */
#define __spin_yield(x) barrier()
#define __rw_yield(x) barrier()
#define SHARED_PROCESSOR 0
#endif
extern void spin_unlock_wait(spinlock_t *lock); extern void spin_unlock_wait(spinlock_t *lock);
#else /*
* This returns the old value in the lock, so we succeeded
static __inline__ int _raw_spin_trylock(spinlock_t *lock) * in getting the lock if the return value is 0.
*/
static __inline__ unsigned long __spin_trylock(spinlock_t *lock)
{ {
unsigned int tmp, tmp2; unsigned long tmp, tmp2;
__asm__ __volatile__( __asm__ __volatile__(
"1: lwarx %0,0,%2 # spin_trylock\n\ " lwz %1,%3(13) # __spin_trylock\n\
1: lwarx %0,0,%2\n\
cmpwi 0,%0,0\n\ cmpwi 0,%0,0\n\
bne- 2f\n\ bne- 2f\n\
lwz %1,%3(13)\n\
stwcx. %1,0,%2\n\ stwcx. %1,0,%2\n\
bne- 1b\n\ bne- 1b\n\
isync\n\ isync\n\
2:" : "=&r"(tmp), "=&r"(tmp2) 2:" : "=&r" (tmp), "=&r" (tmp2)
: "r"(&lock->lock), "i"(offsetof(struct paca_struct, lock_token)) : "r" (&lock->lock), "i" (offsetof(struct paca_struct, lock_token))
: "cr0", "memory"); : "cr0", "memory");
return tmp == 0; return tmp;
} }
static __inline__ void _raw_spin_lock(spinlock_t *lock) static int __inline__ _raw_spin_trylock(spinlock_t *lock)
{ {
unsigned int tmp; return __spin_trylock(lock) == 0;
__asm__ __volatile__(
"b 2f # spin_lock\n\
1:"
HMT_LOW
" lwzx %0,0,%1\n\
cmpwi 0,%0,0\n\
bne+ 1b\n"
HMT_MEDIUM
"2: lwarx %0,0,%1\n\
cmpwi 0,%0,0\n\
bne- 1b\n\
lwz %0,%2(13)\n\
stwcx. %0,0,%1\n\
bne- 2b\n\
isync"
: "=&r"(tmp)
: "r"(&lock->lock), "i"(offsetof(struct paca_struct, lock_token))
: "cr0", "memory");
} }
/* static void __inline__ _raw_spin_lock(spinlock_t *lock)
* Note: if we ever want to inline the spinlocks on iSeries,
* we will have to change the irq enable/disable stuff in here.
*/
static __inline__ void _raw_spin_lock_flags(spinlock_t *lock,
unsigned long flags)
{ {
unsigned int tmp; while (1) {
unsigned long tmp2; if (likely(__spin_trylock(lock) == 0))
break;
__asm__ __volatile__( do {
"b 3f # spin_lock\n\ HMT_low();
1: mfmsr %1\n\ if (SHARED_PROCESSOR)
mtmsrd %3,1\n\ __spin_yield(lock);
2:" HMT_LOW } while (likely(lock->lock != 0));
" lwzx %0,0,%2\n\ HMT_medium();
cmpwi 0,%0,0\n\ }
bne+ 2b\n"
HMT_MEDIUM
" mtmsrd %1,1\n\
3: lwarx %0,0,%2\n\
cmpwi 0,%0,0\n\
bne- 1b\n\
lwz %1,%4(13)\n\
stwcx. %1,0,%2\n\
bne- 3b\n\
isync"
: "=&r"(tmp), "=&r"(tmp2)
: "r"(&lock->lock), "r"(flags),
"i" (offsetof(struct paca_struct, lock_token))
: "cr0", "memory");
} }
#define spin_unlock_wait(x) do { cpu_relax(); } while (spin_is_locked(x)) static void __inline__ _raw_spin_lock_flags(spinlock_t *lock, unsigned long flags)
{
#endif /* CONFIG_SPINLINE */ unsigned long flags_dis;
while (1) {
if (likely(__spin_trylock(lock) == 0))
break;
local_save_flags(flags_dis);
local_irq_restore(flags);
do {
HMT_low();
if (SHARED_PROCESSOR)
__spin_yield(lock);
} while (likely(lock->lock != 0));
HMT_medium();
local_irq_restore(flags_dis);
}
}
/* /*
* Read-write spinlocks, allowing multiple readers * Read-write spinlocks, allowing multiple readers
...@@ -165,67 +159,54 @@ static __inline__ void _raw_write_unlock(rwlock_t *rw) ...@@ -165,67 +159,54 @@ static __inline__ void _raw_write_unlock(rwlock_t *rw)
rw->lock = 0; rw->lock = 0;
} }
#ifndef CONFIG_SPINLINE /*
extern int _raw_read_trylock(rwlock_t *rw); * This returns the old value in the lock + 1,
extern void _raw_read_lock(rwlock_t *rw); * so we got a read lock if the return value is > 0.
extern void _raw_read_unlock(rwlock_t *rw); */
extern int _raw_write_trylock(rwlock_t *rw); static long __inline__ __read_trylock(rwlock_t *rw)
extern void _raw_write_lock(rwlock_t *rw);
extern void _raw_write_unlock(rwlock_t *rw);
#else
static __inline__ int _raw_read_trylock(rwlock_t *rw)
{ {
unsigned int tmp; long tmp;
unsigned int ret;
__asm__ __volatile__( __asm__ __volatile__(
"1: lwarx %0,0,%2 # read_trylock\n\ "1: lwarx %0,0,%1 # read_trylock\n\
li %1,0\n\
extsw %0,%0\n\ extsw %0,%0\n\
addic. %0,%0,1\n\ addic. %0,%0,1\n\
ble- 2f\n\ ble- 2f\n\
stwcx. %0,0,%2\n\ stwcx. %0,0,%1\n\
bne- 1b\n\ bne- 1b\n\
li %1,1\n\
isync\n\ isync\n\
2:" : "=&r"(tmp), "=&r"(ret) 2:" : "=&r" (tmp)
: "r"(&rw->lock) : "r" (&rw->lock)
: "cr0", "memory"); : "cr0", "xer", "memory");
return ret; return tmp;
} }
static __inline__ void _raw_read_lock(rwlock_t *rw) static int __inline__ _raw_read_trylock(rwlock_t *rw)
{ {
unsigned int tmp; return __read_trylock(rw) > 0;
}
__asm__ __volatile__( static void __inline__ _raw_read_lock(rwlock_t *rw)
"b 2f # read_lock\n\ {
1:" while (1) {
HMT_LOW if (likely(__read_trylock(rw) > 0))
" lwax %0,0,%1\n\ break;
cmpwi 0,%0,0\n\ do {
blt+ 1b\n" HMT_low();
HMT_MEDIUM if (SHARED_PROCESSOR)
"2: lwarx %0,0,%1\n\ __rw_yield(rw);
extsw %0,%0\n\ } while (likely(rw->lock < 0));
addic. %0,%0,1\n\ HMT_medium();
ble- 1b\n\ }
stwcx. %0,0,%1\n\
bne- 2b\n\
isync"
: "=&r"(tmp)
: "r"(&rw->lock)
: "cr0", "memory");
} }
static __inline__ void _raw_read_unlock(rwlock_t *rw) static void __inline__ _raw_read_unlock(rwlock_t *rw)
{ {
unsigned int tmp; long tmp;
__asm__ __volatile__( __asm__ __volatile__(
"lwsync # read_unlock\n\ "eieio # read_unlock\n\
1: lwarx %0,0,%1\n\ 1: lwarx %0,0,%1\n\
addic %0,%0,-1\n\ addic %0,%0,-1\n\
stwcx. %0,0,%1\n\ stwcx. %0,0,%1\n\
...@@ -235,50 +216,47 @@ static __inline__ void _raw_read_unlock(rwlock_t *rw) ...@@ -235,50 +216,47 @@ static __inline__ void _raw_read_unlock(rwlock_t *rw)
: "cr0", "memory"); : "cr0", "memory");
} }
static __inline__ int _raw_write_trylock(rwlock_t *rw) /*
* This returns the old value in the lock,
* so we got the write lock if the return value is 0.
*/
static __inline__ long __write_trylock(rwlock_t *rw)
{ {
unsigned int tmp; long tmp, tmp2;
unsigned int ret;
__asm__ __volatile__( __asm__ __volatile__(
"1: lwarx %0,0,%2 # write_trylock\n\ " lwz %1,%3(13) # write_trylock\n\
1: lwarx %0,0,%2\n\
cmpwi 0,%0,0\n\ cmpwi 0,%0,0\n\
li %1,0\n\
bne- 2f\n\ bne- 2f\n\
stwcx. %3,0,%2\n\ stwcx. %1,0,%2\n\
bne- 1b\n\ bne- 1b\n\
li %1,1\n\
isync\n\ isync\n\
2:" : "=&r"(tmp), "=&r"(ret) 2:" : "=&r" (tmp), "=&r" (tmp2)
: "r"(&rw->lock), "r"(-1) : "r" (&rw->lock), "i" (offsetof(struct paca_struct, lock_token))
: "cr0", "memory"); : "cr0", "memory");
return ret; return tmp;
} }
static __inline__ void _raw_write_lock(rwlock_t *rw) static int __inline__ _raw_write_trylock(rwlock_t *rw)
{ {
unsigned int tmp; return __write_trylock(rw) == 0;
}
__asm__ __volatile__( static void __inline__ _raw_write_lock(rwlock_t *rw)
"b 2f # write_lock\n\ {
1:" while (1) {
HMT_LOW if (likely(__write_trylock(rw) == 0))
"lwax %0,0,%1\n\ break;
cmpwi 0,%0,0\n\ do {
bne+ 1b\n" HMT_low();
HMT_MEDIUM if (SHARED_PROCESSOR)
"2: lwarx %0,0,%1\n\ __rw_yield(rw);
cmpwi 0,%0,0\n\ } while (likely(rw->lock != 0));
bne- 1b\n\ HMT_medium();
stwcx. %2,0,%1\n\ }
bne- 2b\n\
isync"
: "=&r"(tmp)
: "r"(&rw->lock), "r"(-1)
: "cr0", "memory");
} }
#endif /* CONFIG_SPINLINE */
#endif /* __KERNEL__ */ #endif /* __KERNEL__ */
#endif /* __ASM_SPINLOCK_H */ #endif /* __ASM_SPINLOCK_H */
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment