Specifically: Documentation/locking/lockdep-design.txt Documentation/locking/lockstat.txt Documentation/locking/mutex-design.txt Documentation/locking/rt-mutex-design.txt Documentation/locking/rt-mutex.txt Documentation/locking/spinlocks.txt Documentation/locking/ww-mutex-design.txt Signed-off-by: Davidlohr Bueso <davidlohr@hp.com> Acked-by: Randy Dunlap <rdunlap@infradead.org> Signed-off-by: Peter Zijlstra <peterz@infradead.org> Cc: jason.low2@hp.com Cc: aswin@hp.com Cc: Alexei Starovoitov <ast@plumgrid.com> Cc: Al Viro <viro@zeniv.linux.org.uk> Cc: Andrew Morton <akpm@linux-foundation.org> Cc: Chris Mason <clm@fb.com> Cc: Dan Streetman <ddstreet@ieee.org> Cc: David Airlie <airlied@linux.ie> Cc: Davidlohr Bueso <davidlohr@hp.com> Cc: David S. Miller <davem@davemloft.net> Cc: Greg Kroah-Hartman <gregkh@linuxfoundation.org> Cc: Heiko Carstens <heiko.carstens@de.ibm.com> Cc: Jason Low <jason.low2@hp.com> Cc: Josef Bacik <jbacik@fusionio.com> Cc: Kees Cook <keescook@chromium.org> Cc: Linus Torvalds <torvalds@linux-foundation.org> Cc: Lubomir Rintel <lkundrak@v3.sk> Cc: Masanari Iida <standby24x7@gmail.com> Cc: Paul E. McKenney <paulmck@linux.vnet.ibm.com> Cc: Randy Dunlap <rdunlap@infradead.org> Cc: Tim Chen <tim.c.chen@linux.intel.com> Cc: Vineet Gupta <vgupta@synopsys.com> Cc: fengguang.wu@intel.com Link: http://lkml.kernel.org/r/1406752916-3341-6-git-send-email-davidlohr@hp.com Signed-off-by: Ingo Molnar <mingo@kernel.org>
		
			
				
	
	
		
			971 lines
		
	
	
	
		
			25 KiB
			
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			971 lines
		
	
	
	
		
			25 KiB
			
		
	
	
	
		
			C
		
	
	
	
	
	
/*
 | 
						|
 * kernel/locking/mutex.c
 | 
						|
 *
 | 
						|
 * Mutexes: blocking mutual exclusion locks
 | 
						|
 *
 | 
						|
 * Started by Ingo Molnar:
 | 
						|
 *
 | 
						|
 *  Copyright (C) 2004, 2005, 2006 Red Hat, Inc., Ingo Molnar <mingo@redhat.com>
 | 
						|
 *
 | 
						|
 * Many thanks to Arjan van de Ven, Thomas Gleixner, Steven Rostedt and
 | 
						|
 * David Howells for suggestions and improvements.
 | 
						|
 *
 | 
						|
 *  - Adaptive spinning for mutexes by Peter Zijlstra. (Ported to mainline
 | 
						|
 *    from the -rt tree, where it was originally implemented for rtmutexes
 | 
						|
 *    by Steven Rostedt, based on work by Gregory Haskins, Peter Morreale
 | 
						|
 *    and Sven Dietrich.
 | 
						|
 *
 | 
						|
 * Also see Documentation/locking/mutex-design.txt.
 | 
						|
 */
 | 
						|
#include <linux/mutex.h>
 | 
						|
#include <linux/ww_mutex.h>
 | 
						|
#include <linux/sched.h>
 | 
						|
#include <linux/sched/rt.h>
 | 
						|
#include <linux/export.h>
 | 
						|
#include <linux/spinlock.h>
 | 
						|
#include <linux/interrupt.h>
 | 
						|
#include <linux/debug_locks.h>
 | 
						|
#include "mcs_spinlock.h"
 | 
						|
 | 
						|
/*
 | 
						|
 * In the DEBUG case we are using the "NULL fastpath" for mutexes,
 | 
						|
 * which forces all calls into the slowpath:
 | 
						|
 */
 | 
						|
#ifdef CONFIG_DEBUG_MUTEXES
 | 
						|
# include "mutex-debug.h"
 | 
						|
# include <asm-generic/mutex-null.h>
 | 
						|
/*
 | 
						|
 * Must be 0 for the debug case so we do not do the unlock outside of the
 | 
						|
 * wait_lock region. debug_mutex_unlock() will do the actual unlock in this
 | 
						|
 * case.
 | 
						|
 */
 | 
						|
# undef __mutex_slowpath_needs_to_unlock
 | 
						|
# define  __mutex_slowpath_needs_to_unlock()	0
 | 
						|
#else
 | 
						|
# include "mutex.h"
 | 
						|
# include <asm/mutex.h>
 | 
						|
#endif
 | 
						|
 | 
						|
void
 | 
						|
__mutex_init(struct mutex *lock, const char *name, struct lock_class_key *key)
 | 
						|
{
 | 
						|
	atomic_set(&lock->count, 1);
 | 
						|
	spin_lock_init(&lock->wait_lock);
 | 
						|
	INIT_LIST_HEAD(&lock->wait_list);
 | 
						|
	mutex_clear_owner(lock);
 | 
						|
#ifdef CONFIG_MUTEX_SPIN_ON_OWNER
 | 
						|
	osq_lock_init(&lock->osq);
 | 
						|
#endif
 | 
						|
 | 
						|
	debug_mutex_init(lock, name, key);
 | 
						|
}
 | 
						|
 | 
						|
EXPORT_SYMBOL(__mutex_init);
 | 
						|
 | 
						|
#ifndef CONFIG_DEBUG_LOCK_ALLOC
 | 
						|
/*
 | 
						|
 * We split the mutex lock/unlock logic into separate fastpath and
 | 
						|
 * slowpath functions, to reduce the register pressure on the fastpath.
 | 
						|
 * We also put the fastpath first in the kernel image, to make sure the
 | 
						|
 * branch is predicted by the CPU as default-untaken.
 | 
						|
 */
 | 
						|
__visible void __sched __mutex_lock_slowpath(atomic_t *lock_count);
 | 
						|
 | 
						|
/**
 | 
						|
 * mutex_lock - acquire the mutex
 | 
						|
 * @lock: the mutex to be acquired
 | 
						|
 *
 | 
						|
 * Lock the mutex exclusively for this task. If the mutex is not
 | 
						|
 * available right now, it will sleep until it can get it.
 | 
						|
 *
 | 
						|
 * The mutex must later on be released by the same task that
 | 
						|
 * acquired it. Recursive locking is not allowed. The task
 | 
						|
 * may not exit without first unlocking the mutex. Also, kernel
 | 
						|
 * memory where the mutex resides mutex must not be freed with
 | 
						|
 * the mutex still locked. The mutex must first be initialized
 | 
						|
 * (or statically defined) before it can be locked. memset()-ing
 | 
						|
 * the mutex to 0 is not allowed.
 | 
						|
 *
 | 
						|
 * ( The CONFIG_DEBUG_MUTEXES .config option turns on debugging
 | 
						|
 *   checks that will enforce the restrictions and will also do
 | 
						|
 *   deadlock debugging. )
 | 
						|
 *
 | 
						|
 * This function is similar to (but not equivalent to) down().
 | 
						|
 */
 | 
						|
void __sched mutex_lock(struct mutex *lock)
 | 
						|
{
 | 
						|
	might_sleep();
 | 
						|
	/*
 | 
						|
	 * The locking fastpath is the 1->0 transition from
 | 
						|
	 * 'unlocked' into 'locked' state.
 | 
						|
	 */
 | 
						|
	__mutex_fastpath_lock(&lock->count, __mutex_lock_slowpath);
 | 
						|
	mutex_set_owner(lock);
 | 
						|
}
 | 
						|
 | 
						|
EXPORT_SYMBOL(mutex_lock);
 | 
						|
#endif
 | 
						|
 | 
						|
static __always_inline void ww_mutex_lock_acquired(struct ww_mutex *ww,
 | 
						|
						   struct ww_acquire_ctx *ww_ctx)
 | 
						|
{
 | 
						|
#ifdef CONFIG_DEBUG_MUTEXES
 | 
						|
	/*
 | 
						|
	 * If this WARN_ON triggers, you used ww_mutex_lock to acquire,
 | 
						|
	 * but released with a normal mutex_unlock in this call.
 | 
						|
	 *
 | 
						|
	 * This should never happen, always use ww_mutex_unlock.
 | 
						|
	 */
 | 
						|
	DEBUG_LOCKS_WARN_ON(ww->ctx);
 | 
						|
 | 
						|
	/*
 | 
						|
	 * Not quite done after calling ww_acquire_done() ?
 | 
						|
	 */
 | 
						|
	DEBUG_LOCKS_WARN_ON(ww_ctx->done_acquire);
 | 
						|
 | 
						|
	if (ww_ctx->contending_lock) {
 | 
						|
		/*
 | 
						|
		 * After -EDEADLK you tried to
 | 
						|
		 * acquire a different ww_mutex? Bad!
 | 
						|
		 */
 | 
						|
		DEBUG_LOCKS_WARN_ON(ww_ctx->contending_lock != ww);
 | 
						|
 | 
						|
		/*
 | 
						|
		 * You called ww_mutex_lock after receiving -EDEADLK,
 | 
						|
		 * but 'forgot' to unlock everything else first?
 | 
						|
		 */
 | 
						|
		DEBUG_LOCKS_WARN_ON(ww_ctx->acquired > 0);
 | 
						|
		ww_ctx->contending_lock = NULL;
 | 
						|
	}
 | 
						|
 | 
						|
	/*
 | 
						|
	 * Naughty, using a different class will lead to undefined behavior!
 | 
						|
	 */
 | 
						|
	DEBUG_LOCKS_WARN_ON(ww_ctx->ww_class != ww->ww_class);
 | 
						|
#endif
 | 
						|
	ww_ctx->acquired++;
 | 
						|
}
 | 
						|
 | 
						|
/*
 | 
						|
 * after acquiring lock with fastpath or when we lost out in contested
 | 
						|
 * slowpath, set ctx and wake up any waiters so they can recheck.
 | 
						|
 *
 | 
						|
 * This function is never called when CONFIG_DEBUG_LOCK_ALLOC is set,
 | 
						|
 * as the fastpath and opportunistic spinning are disabled in that case.
 | 
						|
 */
 | 
						|
static __always_inline void
 | 
						|
ww_mutex_set_context_fastpath(struct ww_mutex *lock,
 | 
						|
			       struct ww_acquire_ctx *ctx)
 | 
						|
{
 | 
						|
	unsigned long flags;
 | 
						|
	struct mutex_waiter *cur;
 | 
						|
 | 
						|
	ww_mutex_lock_acquired(lock, ctx);
 | 
						|
 | 
						|
	lock->ctx = ctx;
 | 
						|
 | 
						|
	/*
 | 
						|
	 * The lock->ctx update should be visible on all cores before
 | 
						|
	 * the atomic read is done, otherwise contended waiters might be
 | 
						|
	 * missed. The contended waiters will either see ww_ctx == NULL
 | 
						|
	 * and keep spinning, or it will acquire wait_lock, add itself
 | 
						|
	 * to waiter list and sleep.
 | 
						|
	 */
 | 
						|
	smp_mb(); /* ^^^ */
 | 
						|
 | 
						|
	/*
 | 
						|
	 * Check if lock is contended, if not there is nobody to wake up
 | 
						|
	 */
 | 
						|
	if (likely(atomic_read(&lock->base.count) == 0))
 | 
						|
		return;
 | 
						|
 | 
						|
	/*
 | 
						|
	 * Uh oh, we raced in fastpath, wake up everyone in this case,
 | 
						|
	 * so they can see the new lock->ctx.
 | 
						|
	 */
 | 
						|
	spin_lock_mutex(&lock->base.wait_lock, flags);
 | 
						|
	list_for_each_entry(cur, &lock->base.wait_list, list) {
 | 
						|
		debug_mutex_wake_waiter(&lock->base, cur);
 | 
						|
		wake_up_process(cur->task);
 | 
						|
	}
 | 
						|
	spin_unlock_mutex(&lock->base.wait_lock, flags);
 | 
						|
}
 | 
						|
 | 
						|
 | 
						|
#ifdef CONFIG_MUTEX_SPIN_ON_OWNER
 | 
						|
/*
 | 
						|
 * In order to avoid a stampede of mutex spinners from acquiring the mutex
 | 
						|
 * more or less simultaneously, the spinners need to acquire a MCS lock
 | 
						|
 * first before spinning on the owner field.
 | 
						|
 *
 | 
						|
 */
 | 
						|
 | 
						|
/*
 | 
						|
 * Mutex spinning code migrated from kernel/sched/core.c
 | 
						|
 */
 | 
						|
 | 
						|
static inline bool owner_running(struct mutex *lock, struct task_struct *owner)
 | 
						|
{
 | 
						|
	if (lock->owner != owner)
 | 
						|
		return false;
 | 
						|
 | 
						|
	/*
 | 
						|
	 * Ensure we emit the owner->on_cpu, dereference _after_ checking
 | 
						|
	 * lock->owner still matches owner, if that fails, owner might
 | 
						|
	 * point to free()d memory, if it still matches, the rcu_read_lock()
 | 
						|
	 * ensures the memory stays valid.
 | 
						|
	 */
 | 
						|
	barrier();
 | 
						|
 | 
						|
	return owner->on_cpu;
 | 
						|
}
 | 
						|
 | 
						|
/*
 | 
						|
 * Look out! "owner" is an entirely speculative pointer
 | 
						|
 * access and not reliable.
 | 
						|
 */
 | 
						|
static noinline
 | 
						|
int mutex_spin_on_owner(struct mutex *lock, struct task_struct *owner)
 | 
						|
{
 | 
						|
	rcu_read_lock();
 | 
						|
	while (owner_running(lock, owner)) {
 | 
						|
		if (need_resched())
 | 
						|
			break;
 | 
						|
 | 
						|
		cpu_relax_lowlatency();
 | 
						|
	}
 | 
						|
	rcu_read_unlock();
 | 
						|
 | 
						|
	/*
 | 
						|
	 * We break out the loop above on need_resched() and when the
 | 
						|
	 * owner changed, which is a sign for heavy contention. Return
 | 
						|
	 * success only when lock->owner is NULL.
 | 
						|
	 */
 | 
						|
	return lock->owner == NULL;
 | 
						|
}
 | 
						|
 | 
						|
/*
 | 
						|
 * Initial check for entering the mutex spinning loop
 | 
						|
 */
 | 
						|
static inline int mutex_can_spin_on_owner(struct mutex *lock)
 | 
						|
{
 | 
						|
	struct task_struct *owner;
 | 
						|
	int retval = 1;
 | 
						|
 | 
						|
	if (need_resched())
 | 
						|
		return 0;
 | 
						|
 | 
						|
	rcu_read_lock();
 | 
						|
	owner = ACCESS_ONCE(lock->owner);
 | 
						|
	if (owner)
 | 
						|
		retval = owner->on_cpu;
 | 
						|
	rcu_read_unlock();
 | 
						|
	/*
 | 
						|
	 * if lock->owner is not set, the mutex owner may have just acquired
 | 
						|
	 * it and not set the owner yet or the mutex has been released.
 | 
						|
	 */
 | 
						|
	return retval;
 | 
						|
}
 | 
						|
 | 
						|
/*
 | 
						|
 * Atomically try to take the lock when it is available
 | 
						|
 */
 | 
						|
static inline bool mutex_try_to_acquire(struct mutex *lock)
 | 
						|
{
 | 
						|
	return !mutex_is_locked(lock) &&
 | 
						|
		(atomic_cmpxchg(&lock->count, 1, 0) == 1);
 | 
						|
}
 | 
						|
 | 
						|
/*
 | 
						|
 * Optimistic spinning.
 | 
						|
 *
 | 
						|
 * We try to spin for acquisition when we find that the lock owner
 | 
						|
 * is currently running on a (different) CPU and while we don't
 | 
						|
 * need to reschedule. The rationale is that if the lock owner is
 | 
						|
 * running, it is likely to release the lock soon.
 | 
						|
 *
 | 
						|
 * Since this needs the lock owner, and this mutex implementation
 | 
						|
 * doesn't track the owner atomically in the lock field, we need to
 | 
						|
 * track it non-atomically.
 | 
						|
 *
 | 
						|
 * We can't do this for DEBUG_MUTEXES because that relies on wait_lock
 | 
						|
 * to serialize everything.
 | 
						|
 *
 | 
						|
 * The mutex spinners are queued up using MCS lock so that only one
 | 
						|
 * spinner can compete for the mutex. However, if mutex spinning isn't
 | 
						|
 * going to happen, there is no point in going through the lock/unlock
 | 
						|
 * overhead.
 | 
						|
 *
 | 
						|
 * Returns true when the lock was taken, otherwise false, indicating
 | 
						|
 * that we need to jump to the slowpath and sleep.
 | 
						|
 */
 | 
						|
static bool mutex_optimistic_spin(struct mutex *lock,
 | 
						|
				  struct ww_acquire_ctx *ww_ctx, const bool use_ww_ctx)
 | 
						|
{
 | 
						|
	struct task_struct *task = current;
 | 
						|
 | 
						|
	if (!mutex_can_spin_on_owner(lock))
 | 
						|
		goto done;
 | 
						|
 | 
						|
	if (!osq_lock(&lock->osq))
 | 
						|
		goto done;
 | 
						|
 | 
						|
	while (true) {
 | 
						|
		struct task_struct *owner;
 | 
						|
 | 
						|
		if (use_ww_ctx && ww_ctx->acquired > 0) {
 | 
						|
			struct ww_mutex *ww;
 | 
						|
 | 
						|
			ww = container_of(lock, struct ww_mutex, base);
 | 
						|
			/*
 | 
						|
			 * If ww->ctx is set the contents are undefined, only
 | 
						|
			 * by acquiring wait_lock there is a guarantee that
 | 
						|
			 * they are not invalid when reading.
 | 
						|
			 *
 | 
						|
			 * As such, when deadlock detection needs to be
 | 
						|
			 * performed the optimistic spinning cannot be done.
 | 
						|
			 */
 | 
						|
			if (ACCESS_ONCE(ww->ctx))
 | 
						|
				break;
 | 
						|
		}
 | 
						|
 | 
						|
		/*
 | 
						|
		 * If there's an owner, wait for it to either
 | 
						|
		 * release the lock or go to sleep.
 | 
						|
		 */
 | 
						|
		owner = ACCESS_ONCE(lock->owner);
 | 
						|
		if (owner && !mutex_spin_on_owner(lock, owner))
 | 
						|
			break;
 | 
						|
 | 
						|
		/* Try to acquire the mutex if it is unlocked. */
 | 
						|
		if (mutex_try_to_acquire(lock)) {
 | 
						|
			lock_acquired(&lock->dep_map, ip);
 | 
						|
 | 
						|
			if (use_ww_ctx) {
 | 
						|
				struct ww_mutex *ww;
 | 
						|
				ww = container_of(lock, struct ww_mutex, base);
 | 
						|
 | 
						|
				ww_mutex_set_context_fastpath(ww, ww_ctx);
 | 
						|
			}
 | 
						|
 | 
						|
			mutex_set_owner(lock);
 | 
						|
			osq_unlock(&lock->osq);
 | 
						|
			return true;
 | 
						|
		}
 | 
						|
 | 
						|
		/*
 | 
						|
		 * When there's no owner, we might have preempted between the
 | 
						|
		 * owner acquiring the lock and setting the owner field. If
 | 
						|
		 * we're an RT task that will live-lock because we won't let
 | 
						|
		 * the owner complete.
 | 
						|
		 */
 | 
						|
		if (!owner && (need_resched() || rt_task(task)))
 | 
						|
			break;
 | 
						|
 | 
						|
		/*
 | 
						|
		 * The cpu_relax() call is a compiler barrier which forces
 | 
						|
		 * everything in this loop to be re-loaded. We don't need
 | 
						|
		 * memory barriers as we'll eventually observe the right
 | 
						|
		 * values at the cost of a few extra spins.
 | 
						|
		 */
 | 
						|
		cpu_relax_lowlatency();
 | 
						|
	}
 | 
						|
 | 
						|
	osq_unlock(&lock->osq);
 | 
						|
done:
 | 
						|
	/*
 | 
						|
	 * If we fell out of the spin path because of need_resched(),
 | 
						|
	 * reschedule now, before we try-lock the mutex. This avoids getting
 | 
						|
	 * scheduled out right after we obtained the mutex.
 | 
						|
	 */
 | 
						|
	if (need_resched())
 | 
						|
		schedule_preempt_disabled();
 | 
						|
 | 
						|
	return false;
 | 
						|
}
 | 
						|
#else
 | 
						|
static bool mutex_optimistic_spin(struct mutex *lock,
 | 
						|
				  struct ww_acquire_ctx *ww_ctx, const bool use_ww_ctx)
 | 
						|
{
 | 
						|
	return false;
 | 
						|
}
 | 
						|
#endif
 | 
						|
 | 
						|
__visible __used noinline
 | 
						|
void __sched __mutex_unlock_slowpath(atomic_t *lock_count);
 | 
						|
 | 
						|
/**
 | 
						|
 * mutex_unlock - release the mutex
 | 
						|
 * @lock: the mutex to be released
 | 
						|
 *
 | 
						|
 * Unlock a mutex that has been locked by this task previously.
 | 
						|
 *
 | 
						|
 * This function must not be used in interrupt context. Unlocking
 | 
						|
 * of a not locked mutex is not allowed.
 | 
						|
 *
 | 
						|
 * This function is similar to (but not equivalent to) up().
 | 
						|
 */
 | 
						|
void __sched mutex_unlock(struct mutex *lock)
 | 
						|
{
 | 
						|
	/*
 | 
						|
	 * The unlocking fastpath is the 0->1 transition from 'locked'
 | 
						|
	 * into 'unlocked' state:
 | 
						|
	 */
 | 
						|
#ifndef CONFIG_DEBUG_MUTEXES
 | 
						|
	/*
 | 
						|
	 * When debugging is enabled we must not clear the owner before time,
 | 
						|
	 * the slow path will always be taken, and that clears the owner field
 | 
						|
	 * after verifying that it was indeed current.
 | 
						|
	 */
 | 
						|
	mutex_clear_owner(lock);
 | 
						|
#endif
 | 
						|
	__mutex_fastpath_unlock(&lock->count, __mutex_unlock_slowpath);
 | 
						|
}
 | 
						|
 | 
						|
EXPORT_SYMBOL(mutex_unlock);
 | 
						|
 | 
						|
/**
 | 
						|
 * ww_mutex_unlock - release the w/w mutex
 | 
						|
 * @lock: the mutex to be released
 | 
						|
 *
 | 
						|
 * Unlock a mutex that has been locked by this task previously with any of the
 | 
						|
 * ww_mutex_lock* functions (with or without an acquire context). It is
 | 
						|
 * forbidden to release the locks after releasing the acquire context.
 | 
						|
 *
 | 
						|
 * This function must not be used in interrupt context. Unlocking
 | 
						|
 * of a unlocked mutex is not allowed.
 | 
						|
 */
 | 
						|
void __sched ww_mutex_unlock(struct ww_mutex *lock)
 | 
						|
{
 | 
						|
	/*
 | 
						|
	 * The unlocking fastpath is the 0->1 transition from 'locked'
 | 
						|
	 * into 'unlocked' state:
 | 
						|
	 */
 | 
						|
	if (lock->ctx) {
 | 
						|
#ifdef CONFIG_DEBUG_MUTEXES
 | 
						|
		DEBUG_LOCKS_WARN_ON(!lock->ctx->acquired);
 | 
						|
#endif
 | 
						|
		if (lock->ctx->acquired > 0)
 | 
						|
			lock->ctx->acquired--;
 | 
						|
		lock->ctx = NULL;
 | 
						|
	}
 | 
						|
 | 
						|
#ifndef CONFIG_DEBUG_MUTEXES
 | 
						|
	/*
 | 
						|
	 * When debugging is enabled we must not clear the owner before time,
 | 
						|
	 * the slow path will always be taken, and that clears the owner field
 | 
						|
	 * after verifying that it was indeed current.
 | 
						|
	 */
 | 
						|
	mutex_clear_owner(&lock->base);
 | 
						|
#endif
 | 
						|
	__mutex_fastpath_unlock(&lock->base.count, __mutex_unlock_slowpath);
 | 
						|
}
 | 
						|
EXPORT_SYMBOL(ww_mutex_unlock);
 | 
						|
 | 
						|
static inline int __sched
 | 
						|
__mutex_lock_check_stamp(struct mutex *lock, struct ww_acquire_ctx *ctx)
 | 
						|
{
 | 
						|
	struct ww_mutex *ww = container_of(lock, struct ww_mutex, base);
 | 
						|
	struct ww_acquire_ctx *hold_ctx = ACCESS_ONCE(ww->ctx);
 | 
						|
 | 
						|
	if (!hold_ctx)
 | 
						|
		return 0;
 | 
						|
 | 
						|
	if (unlikely(ctx == hold_ctx))
 | 
						|
		return -EALREADY;
 | 
						|
 | 
						|
	if (ctx->stamp - hold_ctx->stamp <= LONG_MAX &&
 | 
						|
	    (ctx->stamp != hold_ctx->stamp || ctx > hold_ctx)) {
 | 
						|
#ifdef CONFIG_DEBUG_MUTEXES
 | 
						|
		DEBUG_LOCKS_WARN_ON(ctx->contending_lock);
 | 
						|
		ctx->contending_lock = ww;
 | 
						|
#endif
 | 
						|
		return -EDEADLK;
 | 
						|
	}
 | 
						|
 | 
						|
	return 0;
 | 
						|
}
 | 
						|
 | 
						|
/*
 | 
						|
 * Lock a mutex (possibly interruptible), slowpath:
 | 
						|
 */
 | 
						|
static __always_inline int __sched
 | 
						|
__mutex_lock_common(struct mutex *lock, long state, unsigned int subclass,
 | 
						|
		    struct lockdep_map *nest_lock, unsigned long ip,
 | 
						|
		    struct ww_acquire_ctx *ww_ctx, const bool use_ww_ctx)
 | 
						|
{
 | 
						|
	struct task_struct *task = current;
 | 
						|
	struct mutex_waiter waiter;
 | 
						|
	unsigned long flags;
 | 
						|
	int ret;
 | 
						|
 | 
						|
	preempt_disable();
 | 
						|
	mutex_acquire_nest(&lock->dep_map, subclass, 0, nest_lock, ip);
 | 
						|
 | 
						|
	if (mutex_optimistic_spin(lock, ww_ctx, use_ww_ctx)) {
 | 
						|
		/* got the lock, yay! */
 | 
						|
		preempt_enable();
 | 
						|
		return 0;
 | 
						|
	}
 | 
						|
 | 
						|
	spin_lock_mutex(&lock->wait_lock, flags);
 | 
						|
 | 
						|
	/*
 | 
						|
	 * Once more, try to acquire the lock. Only try-lock the mutex if
 | 
						|
	 * it is unlocked to reduce unnecessary xchg() operations.
 | 
						|
	 */
 | 
						|
	if (!mutex_is_locked(lock) && (atomic_xchg(&lock->count, 0) == 1))
 | 
						|
		goto skip_wait;
 | 
						|
 | 
						|
	debug_mutex_lock_common(lock, &waiter);
 | 
						|
	debug_mutex_add_waiter(lock, &waiter, task_thread_info(task));
 | 
						|
 | 
						|
	/* add waiting tasks to the end of the waitqueue (FIFO): */
 | 
						|
	list_add_tail(&waiter.list, &lock->wait_list);
 | 
						|
	waiter.task = task;
 | 
						|
 | 
						|
	lock_contended(&lock->dep_map, ip);
 | 
						|
 | 
						|
	for (;;) {
 | 
						|
		/*
 | 
						|
		 * Lets try to take the lock again - this is needed even if
 | 
						|
		 * we get here for the first time (shortly after failing to
 | 
						|
		 * acquire the lock), to make sure that we get a wakeup once
 | 
						|
		 * it's unlocked. Later on, if we sleep, this is the
 | 
						|
		 * operation that gives us the lock. We xchg it to -1, so
 | 
						|
		 * that when we release the lock, we properly wake up the
 | 
						|
		 * other waiters. We only attempt the xchg if the count is
 | 
						|
		 * non-negative in order to avoid unnecessary xchg operations:
 | 
						|
		 */
 | 
						|
		if (atomic_read(&lock->count) >= 0 &&
 | 
						|
		    (atomic_xchg(&lock->count, -1) == 1))
 | 
						|
			break;
 | 
						|
 | 
						|
		/*
 | 
						|
		 * got a signal? (This code gets eliminated in the
 | 
						|
		 * TASK_UNINTERRUPTIBLE case.)
 | 
						|
		 */
 | 
						|
		if (unlikely(signal_pending_state(state, task))) {
 | 
						|
			ret = -EINTR;
 | 
						|
			goto err;
 | 
						|
		}
 | 
						|
 | 
						|
		if (use_ww_ctx && ww_ctx->acquired > 0) {
 | 
						|
			ret = __mutex_lock_check_stamp(lock, ww_ctx);
 | 
						|
			if (ret)
 | 
						|
				goto err;
 | 
						|
		}
 | 
						|
 | 
						|
		__set_task_state(task, state);
 | 
						|
 | 
						|
		/* didn't get the lock, go to sleep: */
 | 
						|
		spin_unlock_mutex(&lock->wait_lock, flags);
 | 
						|
		schedule_preempt_disabled();
 | 
						|
		spin_lock_mutex(&lock->wait_lock, flags);
 | 
						|
	}
 | 
						|
	mutex_remove_waiter(lock, &waiter, current_thread_info());
 | 
						|
	/* set it to 0 if there are no waiters left: */
 | 
						|
	if (likely(list_empty(&lock->wait_list)))
 | 
						|
		atomic_set(&lock->count, 0);
 | 
						|
	debug_mutex_free_waiter(&waiter);
 | 
						|
 | 
						|
skip_wait:
 | 
						|
	/* got the lock - cleanup and rejoice! */
 | 
						|
	lock_acquired(&lock->dep_map, ip);
 | 
						|
	mutex_set_owner(lock);
 | 
						|
 | 
						|
	if (use_ww_ctx) {
 | 
						|
		struct ww_mutex *ww = container_of(lock, struct ww_mutex, base);
 | 
						|
		struct mutex_waiter *cur;
 | 
						|
 | 
						|
		/*
 | 
						|
		 * This branch gets optimized out for the common case,
 | 
						|
		 * and is only important for ww_mutex_lock.
 | 
						|
		 */
 | 
						|
		ww_mutex_lock_acquired(ww, ww_ctx);
 | 
						|
		ww->ctx = ww_ctx;
 | 
						|
 | 
						|
		/*
 | 
						|
		 * Give any possible sleeping processes the chance to wake up,
 | 
						|
		 * so they can recheck if they have to back off.
 | 
						|
		 */
 | 
						|
		list_for_each_entry(cur, &lock->wait_list, list) {
 | 
						|
			debug_mutex_wake_waiter(lock, cur);
 | 
						|
			wake_up_process(cur->task);
 | 
						|
		}
 | 
						|
	}
 | 
						|
 | 
						|
	spin_unlock_mutex(&lock->wait_lock, flags);
 | 
						|
	preempt_enable();
 | 
						|
	return 0;
 | 
						|
 | 
						|
err:
 | 
						|
	mutex_remove_waiter(lock, &waiter, task_thread_info(task));
 | 
						|
	spin_unlock_mutex(&lock->wait_lock, flags);
 | 
						|
	debug_mutex_free_waiter(&waiter);
 | 
						|
	mutex_release(&lock->dep_map, 1, ip);
 | 
						|
	preempt_enable();
 | 
						|
	return ret;
 | 
						|
}
 | 
						|
 | 
						|
#ifdef CONFIG_DEBUG_LOCK_ALLOC
 | 
						|
void __sched
 | 
						|
mutex_lock_nested(struct mutex *lock, unsigned int subclass)
 | 
						|
{
 | 
						|
	might_sleep();
 | 
						|
	__mutex_lock_common(lock, TASK_UNINTERRUPTIBLE,
 | 
						|
			    subclass, NULL, _RET_IP_, NULL, 0);
 | 
						|
}
 | 
						|
 | 
						|
EXPORT_SYMBOL_GPL(mutex_lock_nested);
 | 
						|
 | 
						|
void __sched
 | 
						|
_mutex_lock_nest_lock(struct mutex *lock, struct lockdep_map *nest)
 | 
						|
{
 | 
						|
	might_sleep();
 | 
						|
	__mutex_lock_common(lock, TASK_UNINTERRUPTIBLE,
 | 
						|
			    0, nest, _RET_IP_, NULL, 0);
 | 
						|
}
 | 
						|
 | 
						|
EXPORT_SYMBOL_GPL(_mutex_lock_nest_lock);
 | 
						|
 | 
						|
int __sched
 | 
						|
mutex_lock_killable_nested(struct mutex *lock, unsigned int subclass)
 | 
						|
{
 | 
						|
	might_sleep();
 | 
						|
	return __mutex_lock_common(lock, TASK_KILLABLE,
 | 
						|
				   subclass, NULL, _RET_IP_, NULL, 0);
 | 
						|
}
 | 
						|
EXPORT_SYMBOL_GPL(mutex_lock_killable_nested);
 | 
						|
 | 
						|
int __sched
 | 
						|
mutex_lock_interruptible_nested(struct mutex *lock, unsigned int subclass)
 | 
						|
{
 | 
						|
	might_sleep();
 | 
						|
	return __mutex_lock_common(lock, TASK_INTERRUPTIBLE,
 | 
						|
				   subclass, NULL, _RET_IP_, NULL, 0);
 | 
						|
}
 | 
						|
 | 
						|
EXPORT_SYMBOL_GPL(mutex_lock_interruptible_nested);
 | 
						|
 | 
						|
static inline int
 | 
						|
ww_mutex_deadlock_injection(struct ww_mutex *lock, struct ww_acquire_ctx *ctx)
 | 
						|
{
 | 
						|
#ifdef CONFIG_DEBUG_WW_MUTEX_SLOWPATH
 | 
						|
	unsigned tmp;
 | 
						|
 | 
						|
	if (ctx->deadlock_inject_countdown-- == 0) {
 | 
						|
		tmp = ctx->deadlock_inject_interval;
 | 
						|
		if (tmp > UINT_MAX/4)
 | 
						|
			tmp = UINT_MAX;
 | 
						|
		else
 | 
						|
			tmp = tmp*2 + tmp + tmp/2;
 | 
						|
 | 
						|
		ctx->deadlock_inject_interval = tmp;
 | 
						|
		ctx->deadlock_inject_countdown = tmp;
 | 
						|
		ctx->contending_lock = lock;
 | 
						|
 | 
						|
		ww_mutex_unlock(lock);
 | 
						|
 | 
						|
		return -EDEADLK;
 | 
						|
	}
 | 
						|
#endif
 | 
						|
 | 
						|
	return 0;
 | 
						|
}
 | 
						|
 | 
						|
int __sched
 | 
						|
__ww_mutex_lock(struct ww_mutex *lock, struct ww_acquire_ctx *ctx)
 | 
						|
{
 | 
						|
	int ret;
 | 
						|
 | 
						|
	might_sleep();
 | 
						|
	ret =  __mutex_lock_common(&lock->base, TASK_UNINTERRUPTIBLE,
 | 
						|
				   0, &ctx->dep_map, _RET_IP_, ctx, 1);
 | 
						|
	if (!ret && ctx->acquired > 1)
 | 
						|
		return ww_mutex_deadlock_injection(lock, ctx);
 | 
						|
 | 
						|
	return ret;
 | 
						|
}
 | 
						|
EXPORT_SYMBOL_GPL(__ww_mutex_lock);
 | 
						|
 | 
						|
int __sched
 | 
						|
__ww_mutex_lock_interruptible(struct ww_mutex *lock, struct ww_acquire_ctx *ctx)
 | 
						|
{
 | 
						|
	int ret;
 | 
						|
 | 
						|
	might_sleep();
 | 
						|
	ret = __mutex_lock_common(&lock->base, TASK_INTERRUPTIBLE,
 | 
						|
				  0, &ctx->dep_map, _RET_IP_, ctx, 1);
 | 
						|
 | 
						|
	if (!ret && ctx->acquired > 1)
 | 
						|
		return ww_mutex_deadlock_injection(lock, ctx);
 | 
						|
 | 
						|
	return ret;
 | 
						|
}
 | 
						|
EXPORT_SYMBOL_GPL(__ww_mutex_lock_interruptible);
 | 
						|
 | 
						|
#endif
 | 
						|
 | 
						|
/*
 | 
						|
 * Release the lock, slowpath:
 | 
						|
 */
 | 
						|
static inline void
 | 
						|
__mutex_unlock_common_slowpath(struct mutex *lock, int nested)
 | 
						|
{
 | 
						|
	unsigned long flags;
 | 
						|
 | 
						|
	/*
 | 
						|
	 * As a performance measurement, release the lock before doing other
 | 
						|
	 * wakeup related duties to follow. This allows other tasks to acquire
 | 
						|
	 * the lock sooner, while still handling cleanups in past unlock calls.
 | 
						|
	 * This can be done as we do not enforce strict equivalence between the
 | 
						|
	 * mutex counter and wait_list.
 | 
						|
	 *
 | 
						|
	 *
 | 
						|
	 * Some architectures leave the lock unlocked in the fastpath failure
 | 
						|
	 * case, others need to leave it locked. In the later case we have to
 | 
						|
	 * unlock it here - as the lock counter is currently 0 or negative.
 | 
						|
	 */
 | 
						|
	if (__mutex_slowpath_needs_to_unlock())
 | 
						|
		atomic_set(&lock->count, 1);
 | 
						|
 | 
						|
	spin_lock_mutex(&lock->wait_lock, flags);
 | 
						|
	mutex_release(&lock->dep_map, nested, _RET_IP_);
 | 
						|
	debug_mutex_unlock(lock);
 | 
						|
 | 
						|
	if (!list_empty(&lock->wait_list)) {
 | 
						|
		/* get the first entry from the wait-list: */
 | 
						|
		struct mutex_waiter *waiter =
 | 
						|
				list_entry(lock->wait_list.next,
 | 
						|
					   struct mutex_waiter, list);
 | 
						|
 | 
						|
		debug_mutex_wake_waiter(lock, waiter);
 | 
						|
 | 
						|
		wake_up_process(waiter->task);
 | 
						|
	}
 | 
						|
 | 
						|
	spin_unlock_mutex(&lock->wait_lock, flags);
 | 
						|
}
 | 
						|
 | 
						|
/*
 | 
						|
 * Release the lock, slowpath:
 | 
						|
 */
 | 
						|
__visible void
 | 
						|
__mutex_unlock_slowpath(atomic_t *lock_count)
 | 
						|
{
 | 
						|
	struct mutex *lock = container_of(lock_count, struct mutex, count);
 | 
						|
 | 
						|
	__mutex_unlock_common_slowpath(lock, 1);
 | 
						|
}
 | 
						|
 | 
						|
#ifndef CONFIG_DEBUG_LOCK_ALLOC
 | 
						|
/*
 | 
						|
 * Here come the less common (and hence less performance-critical) APIs:
 | 
						|
 * mutex_lock_interruptible() and mutex_trylock().
 | 
						|
 */
 | 
						|
static noinline int __sched
 | 
						|
__mutex_lock_killable_slowpath(struct mutex *lock);
 | 
						|
 | 
						|
static noinline int __sched
 | 
						|
__mutex_lock_interruptible_slowpath(struct mutex *lock);
 | 
						|
 | 
						|
/**
 | 
						|
 * mutex_lock_interruptible - acquire the mutex, interruptible
 | 
						|
 * @lock: the mutex to be acquired
 | 
						|
 *
 | 
						|
 * Lock the mutex like mutex_lock(), and return 0 if the mutex has
 | 
						|
 * been acquired or sleep until the mutex becomes available. If a
 | 
						|
 * signal arrives while waiting for the lock then this function
 | 
						|
 * returns -EINTR.
 | 
						|
 *
 | 
						|
 * This function is similar to (but not equivalent to) down_interruptible().
 | 
						|
 */
 | 
						|
int __sched mutex_lock_interruptible(struct mutex *lock)
 | 
						|
{
 | 
						|
	int ret;
 | 
						|
 | 
						|
	might_sleep();
 | 
						|
	ret =  __mutex_fastpath_lock_retval(&lock->count);
 | 
						|
	if (likely(!ret)) {
 | 
						|
		mutex_set_owner(lock);
 | 
						|
		return 0;
 | 
						|
	} else
 | 
						|
		return __mutex_lock_interruptible_slowpath(lock);
 | 
						|
}
 | 
						|
 | 
						|
EXPORT_SYMBOL(mutex_lock_interruptible);
 | 
						|
 | 
						|
int __sched mutex_lock_killable(struct mutex *lock)
 | 
						|
{
 | 
						|
	int ret;
 | 
						|
 | 
						|
	might_sleep();
 | 
						|
	ret = __mutex_fastpath_lock_retval(&lock->count);
 | 
						|
	if (likely(!ret)) {
 | 
						|
		mutex_set_owner(lock);
 | 
						|
		return 0;
 | 
						|
	} else
 | 
						|
		return __mutex_lock_killable_slowpath(lock);
 | 
						|
}
 | 
						|
EXPORT_SYMBOL(mutex_lock_killable);
 | 
						|
 | 
						|
__visible void __sched
 | 
						|
__mutex_lock_slowpath(atomic_t *lock_count)
 | 
						|
{
 | 
						|
	struct mutex *lock = container_of(lock_count, struct mutex, count);
 | 
						|
 | 
						|
	__mutex_lock_common(lock, TASK_UNINTERRUPTIBLE, 0,
 | 
						|
			    NULL, _RET_IP_, NULL, 0);
 | 
						|
}
 | 
						|
 | 
						|
static noinline int __sched
 | 
						|
__mutex_lock_killable_slowpath(struct mutex *lock)
 | 
						|
{
 | 
						|
	return __mutex_lock_common(lock, TASK_KILLABLE, 0,
 | 
						|
				   NULL, _RET_IP_, NULL, 0);
 | 
						|
}
 | 
						|
 | 
						|
static noinline int __sched
 | 
						|
__mutex_lock_interruptible_slowpath(struct mutex *lock)
 | 
						|
{
 | 
						|
	return __mutex_lock_common(lock, TASK_INTERRUPTIBLE, 0,
 | 
						|
				   NULL, _RET_IP_, NULL, 0);
 | 
						|
}
 | 
						|
 | 
						|
static noinline int __sched
 | 
						|
__ww_mutex_lock_slowpath(struct ww_mutex *lock, struct ww_acquire_ctx *ctx)
 | 
						|
{
 | 
						|
	return __mutex_lock_common(&lock->base, TASK_UNINTERRUPTIBLE, 0,
 | 
						|
				   NULL, _RET_IP_, ctx, 1);
 | 
						|
}
 | 
						|
 | 
						|
static noinline int __sched
 | 
						|
__ww_mutex_lock_interruptible_slowpath(struct ww_mutex *lock,
 | 
						|
					    struct ww_acquire_ctx *ctx)
 | 
						|
{
 | 
						|
	return __mutex_lock_common(&lock->base, TASK_INTERRUPTIBLE, 0,
 | 
						|
				   NULL, _RET_IP_, ctx, 1);
 | 
						|
}
 | 
						|
 | 
						|
#endif
 | 
						|
 | 
						|
/*
 | 
						|
 * Spinlock based trylock, we take the spinlock and check whether we
 | 
						|
 * can get the lock:
 | 
						|
 */
 | 
						|
static inline int __mutex_trylock_slowpath(atomic_t *lock_count)
 | 
						|
{
 | 
						|
	struct mutex *lock = container_of(lock_count, struct mutex, count);
 | 
						|
	unsigned long flags;
 | 
						|
	int prev;
 | 
						|
 | 
						|
	/* No need to trylock if the mutex is locked. */
 | 
						|
	if (mutex_is_locked(lock))
 | 
						|
		return 0;
 | 
						|
 | 
						|
	spin_lock_mutex(&lock->wait_lock, flags);
 | 
						|
 | 
						|
	prev = atomic_xchg(&lock->count, -1);
 | 
						|
	if (likely(prev == 1)) {
 | 
						|
		mutex_set_owner(lock);
 | 
						|
		mutex_acquire(&lock->dep_map, 0, 1, _RET_IP_);
 | 
						|
	}
 | 
						|
 | 
						|
	/* Set it back to 0 if there are no waiters: */
 | 
						|
	if (likely(list_empty(&lock->wait_list)))
 | 
						|
		atomic_set(&lock->count, 0);
 | 
						|
 | 
						|
	spin_unlock_mutex(&lock->wait_lock, flags);
 | 
						|
 | 
						|
	return prev == 1;
 | 
						|
}
 | 
						|
 | 
						|
/**
 | 
						|
 * mutex_trylock - try to acquire the mutex, without waiting
 | 
						|
 * @lock: the mutex to be acquired
 | 
						|
 *
 | 
						|
 * Try to acquire the mutex atomically. Returns 1 if the mutex
 | 
						|
 * has been acquired successfully, and 0 on contention.
 | 
						|
 *
 | 
						|
 * NOTE: this function follows the spin_trylock() convention, so
 | 
						|
 * it is negated from the down_trylock() return values! Be careful
 | 
						|
 * about this when converting semaphore users to mutexes.
 | 
						|
 *
 | 
						|
 * This function must not be used in interrupt context. The
 | 
						|
 * mutex must be released by the same task that acquired it.
 | 
						|
 */
 | 
						|
int __sched mutex_trylock(struct mutex *lock)
 | 
						|
{
 | 
						|
	int ret;
 | 
						|
 | 
						|
	ret = __mutex_fastpath_trylock(&lock->count, __mutex_trylock_slowpath);
 | 
						|
	if (ret)
 | 
						|
		mutex_set_owner(lock);
 | 
						|
 | 
						|
	return ret;
 | 
						|
}
 | 
						|
EXPORT_SYMBOL(mutex_trylock);
 | 
						|
 | 
						|
#ifndef CONFIG_DEBUG_LOCK_ALLOC
 | 
						|
int __sched
 | 
						|
__ww_mutex_lock(struct ww_mutex *lock, struct ww_acquire_ctx *ctx)
 | 
						|
{
 | 
						|
	int ret;
 | 
						|
 | 
						|
	might_sleep();
 | 
						|
 | 
						|
	ret = __mutex_fastpath_lock_retval(&lock->base.count);
 | 
						|
 | 
						|
	if (likely(!ret)) {
 | 
						|
		ww_mutex_set_context_fastpath(lock, ctx);
 | 
						|
		mutex_set_owner(&lock->base);
 | 
						|
	} else
 | 
						|
		ret = __ww_mutex_lock_slowpath(lock, ctx);
 | 
						|
	return ret;
 | 
						|
}
 | 
						|
EXPORT_SYMBOL(__ww_mutex_lock);
 | 
						|
 | 
						|
int __sched
 | 
						|
__ww_mutex_lock_interruptible(struct ww_mutex *lock, struct ww_acquire_ctx *ctx)
 | 
						|
{
 | 
						|
	int ret;
 | 
						|
 | 
						|
	might_sleep();
 | 
						|
 | 
						|
	ret = __mutex_fastpath_lock_retval(&lock->base.count);
 | 
						|
 | 
						|
	if (likely(!ret)) {
 | 
						|
		ww_mutex_set_context_fastpath(lock, ctx);
 | 
						|
		mutex_set_owner(&lock->base);
 | 
						|
	} else
 | 
						|
		ret = __ww_mutex_lock_interruptible_slowpath(lock, ctx);
 | 
						|
	return ret;
 | 
						|
}
 | 
						|
EXPORT_SYMBOL(__ww_mutex_lock_interruptible);
 | 
						|
 | 
						|
#endif
 | 
						|
 | 
						|
/**
 | 
						|
 * atomic_dec_and_mutex_lock - return holding mutex if we dec to 0
 | 
						|
 * @cnt: the atomic which we are to dec
 | 
						|
 * @lock: the mutex to return holding if we dec to 0
 | 
						|
 *
 | 
						|
 * return true and hold lock if we dec to 0, return false otherwise
 | 
						|
 */
 | 
						|
int atomic_dec_and_mutex_lock(atomic_t *cnt, struct mutex *lock)
 | 
						|
{
 | 
						|
	/* dec if we can't possibly hit 0 */
 | 
						|
	if (atomic_add_unless(cnt, -1, 1))
 | 
						|
		return 0;
 | 
						|
	/* we might hit 0, so take the lock */
 | 
						|
	mutex_lock(lock);
 | 
						|
	if (!atomic_dec_and_test(cnt)) {
 | 
						|
		/* when we actually did the dec, we didn't hit 0 */
 | 
						|
		mutex_unlock(lock);
 | 
						|
		return 0;
 | 
						|
	}
 | 
						|
	/* we hit 0, and we hold the lock */
 | 
						|
	return 1;
 | 
						|
}
 | 
						|
EXPORT_SYMBOL(atomic_dec_and_mutex_lock);
 |