Commit b341afb3, authored by Waiman Long, committed by Ingo Molnar

locking/mutex: Enable optimistic spinning of woken waiter

This patch makes the waiter that sets the HANDOFF flag start spinning
instead of sleeping until the handoff is complete or the owner
sleeps. Otherwise, the handoff will cause the optimistic spinners to
abort spinning as the handed-off owner may not be running.
Tested-by: Jason Low <jason.low2@hpe.com>
Signed-off-by: Waiman Long <Waiman.Long@hpe.com>
Signed-off-by: Peter Zijlstra (Intel) <peterz@infradead.org>
Cc: Andrew Morton <akpm@linux-foundation.org>
Cc: Davidlohr Bueso <dave@stgolabs.net>
Cc: Ding Tianhong <dingtianhong@huawei.com>
Cc: Imre Deak <imre.deak@intel.com>
Cc: Linus Torvalds <torvalds@linux-foundation.org>
Cc: Paul E. McKenney <paulmck@linux.vnet.ibm.com>
Cc: Paul E. McKenney <paulmck@us.ibm.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Thomas Gleixner <tglx@linutronix.de>
Cc: Tim Chen <tim.c.chen@linux.intel.com>
Cc: Will Deacon <Will.Deacon@arm.com>
Link: http://lkml.kernel.org/r/1472254509-27508-2-git-send-email-Waiman.Long@hpe.com
Signed-off-by: Ingo Molnar <mingo@kernel.org>
parent a40ca565
...@@ -416,14 +416,28 @@ static inline int mutex_can_spin_on_owner(struct mutex *lock) ...@@ -416,14 +416,28 @@ static inline int mutex_can_spin_on_owner(struct mutex *lock)
* *
* Returns true when the lock was taken, otherwise false, indicating * Returns true when the lock was taken, otherwise false, indicating
* that we need to jump to the slowpath and sleep. * that we need to jump to the slowpath and sleep.
*
* The waiter flag is set to true if the spinner is a waiter in the wait
* queue. The waiter-spinner will spin on the lock directly and concurrently
* with the spinner at the head of the OSQ, if present, until the owner is
* changed to itself.
*/ */
static bool mutex_optimistic_spin(struct mutex *lock, static bool mutex_optimistic_spin(struct mutex *lock,
struct ww_acquire_ctx *ww_ctx, const bool use_ww_ctx) struct ww_acquire_ctx *ww_ctx,
const bool use_ww_ctx, const bool waiter)
{ {
struct task_struct *task = current; struct task_struct *task = current;
if (!waiter) {
/*
* The purpose of the mutex_can_spin_on_owner() function is
* to eliminate the overhead of osq_lock() and osq_unlock()
* in case spinning isn't possible. As a waiter-spinner
* is not going to take OSQ lock anyway, there is no need
* to call mutex_can_spin_on_owner().
*/
if (!mutex_can_spin_on_owner(lock)) if (!mutex_can_spin_on_owner(lock))
goto done; goto fail;
/* /*
* In order to avoid a stampede of mutex spinners trying to * In order to avoid a stampede of mutex spinners trying to
...@@ -431,9 +445,10 @@ static bool mutex_optimistic_spin(struct mutex *lock, ...@@ -431,9 +445,10 @@ static bool mutex_optimistic_spin(struct mutex *lock,
* MCS (queued) lock first before spinning on the owner field. * MCS (queued) lock first before spinning on the owner field.
*/ */
if (!osq_lock(&lock->osq)) if (!osq_lock(&lock->osq))
goto done; goto fail;
}
while (true) { for (;;) {
struct task_struct *owner; struct task_struct *owner;
if (use_ww_ctx && ww_ctx->acquired > 0) { if (use_ww_ctx && ww_ctx->acquired > 0) {
...@@ -449,7 +464,7 @@ static bool mutex_optimistic_spin(struct mutex *lock, ...@@ -449,7 +464,7 @@ static bool mutex_optimistic_spin(struct mutex *lock,
* performed the optimistic spinning cannot be done. * performed the optimistic spinning cannot be done.
*/ */
if (READ_ONCE(ww->ctx)) if (READ_ONCE(ww->ctx))
break; goto fail_unlock;
} }
/* /*
...@@ -457,15 +472,20 @@ static bool mutex_optimistic_spin(struct mutex *lock, ...@@ -457,15 +472,20 @@ static bool mutex_optimistic_spin(struct mutex *lock,
* release the lock or go to sleep. * release the lock or go to sleep.
*/ */
owner = __mutex_owner(lock); owner = __mutex_owner(lock);
if (owner && !mutex_spin_on_owner(lock, owner)) if (owner) {
if (waiter && owner == task) {
smp_mb(); /* ACQUIRE */
break; break;
}
/* Try to acquire the mutex if it is unlocked. */ if (!mutex_spin_on_owner(lock, owner))
if (__mutex_trylock(lock, false)) { goto fail_unlock;
osq_unlock(&lock->osq);
return true;
} }
/* Try to acquire the mutex if it is unlocked. */
if (__mutex_trylock(lock, waiter))
break;
/* /*
* The cpu_relax() call is a compiler barrier which forces * The cpu_relax() call is a compiler barrier which forces
* everything in this loop to be re-loaded. We don't need * everything in this loop to be re-loaded. We don't need
...@@ -475,8 +495,17 @@ static bool mutex_optimistic_spin(struct mutex *lock, ...@@ -475,8 +495,17 @@ static bool mutex_optimistic_spin(struct mutex *lock,
cpu_relax_lowlatency(); cpu_relax_lowlatency();
} }
if (!waiter)
osq_unlock(&lock->osq); osq_unlock(&lock->osq);
done:
return true;
fail_unlock:
if (!waiter)
osq_unlock(&lock->osq);
fail:
/* /*
* If we fell out of the spin path because of need_resched(), * If we fell out of the spin path because of need_resched(),
* reschedule now, before we try-lock the mutex. This avoids getting * reschedule now, before we try-lock the mutex. This avoids getting
...@@ -495,7 +524,8 @@ static bool mutex_optimistic_spin(struct mutex *lock, ...@@ -495,7 +524,8 @@ static bool mutex_optimistic_spin(struct mutex *lock,
} }
#else #else
static bool mutex_optimistic_spin(struct mutex *lock, static bool mutex_optimistic_spin(struct mutex *lock,
struct ww_acquire_ctx *ww_ctx, const bool use_ww_ctx) struct ww_acquire_ctx *ww_ctx,
const bool use_ww_ctx, const bool waiter)
{ {
return false; return false;
} }
...@@ -600,7 +630,7 @@ __mutex_lock_common(struct mutex *lock, long state, unsigned int subclass, ...@@ -600,7 +630,7 @@ __mutex_lock_common(struct mutex *lock, long state, unsigned int subclass,
mutex_acquire_nest(&lock->dep_map, subclass, 0, nest_lock, ip); mutex_acquire_nest(&lock->dep_map, subclass, 0, nest_lock, ip);
if (__mutex_trylock(lock, false) || if (__mutex_trylock(lock, false) ||
mutex_optimistic_spin(lock, ww_ctx, use_ww_ctx)) { mutex_optimistic_spin(lock, ww_ctx, use_ww_ctx, false)) {
/* got the lock, yay! */ /* got the lock, yay! */
lock_acquired(&lock->dep_map, ip); lock_acquired(&lock->dep_map, ip);
if (use_ww_ctx) if (use_ww_ctx)
...@@ -669,7 +699,8 @@ __mutex_lock_common(struct mutex *lock, long state, unsigned int subclass, ...@@ -669,7 +699,8 @@ __mutex_lock_common(struct mutex *lock, long state, unsigned int subclass,
* state back to RUNNING and fall through the next schedule(), * state back to RUNNING and fall through the next schedule(),
* or we must see its unlock and acquire. * or we must see its unlock and acquire.
*/ */
if (__mutex_trylock(lock, first)) if ((first && mutex_optimistic_spin(lock, ww_ctx, use_ww_ctx, true)) ||
__mutex_trylock(lock, first))
break; break;
spin_lock_mutex(&lock->wait_lock, flags); spin_lock_mutex(&lock->wait_lock, flags);
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment