101768b42SPeter Zijlstra /* 267a6de49SPeter Zijlstra * kernel/locking/mutex.c 301768b42SPeter Zijlstra * 401768b42SPeter Zijlstra * Mutexes: blocking mutual exclusion locks 501768b42SPeter Zijlstra * 601768b42SPeter Zijlstra * Started by Ingo Molnar: 701768b42SPeter Zijlstra * 801768b42SPeter Zijlstra * Copyright (C) 2004, 2005, 2006 Red Hat, Inc., Ingo Molnar <mingo@redhat.com> 901768b42SPeter Zijlstra * 1001768b42SPeter Zijlstra * Many thanks to Arjan van de Ven, Thomas Gleixner, Steven Rostedt and 1101768b42SPeter Zijlstra * David Howells for suggestions and improvements. 1201768b42SPeter Zijlstra * 1301768b42SPeter Zijlstra * - Adaptive spinning for mutexes by Peter Zijlstra. (Ported to mainline 1401768b42SPeter Zijlstra * from the -rt tree, where it was originally implemented for rtmutexes 1501768b42SPeter Zijlstra * by Steven Rostedt, based on work by Gregory Haskins, Peter Morreale 1601768b42SPeter Zijlstra * and Sven Dietrich. 1701768b42SPeter Zijlstra * 18214e0aedSDavidlohr Bueso * Also see Documentation/locking/mutex-design.txt. 1901768b42SPeter Zijlstra */ 2001768b42SPeter Zijlstra #include <linux/mutex.h> 2101768b42SPeter Zijlstra #include <linux/ww_mutex.h> 2201768b42SPeter Zijlstra #include <linux/sched.h> 2301768b42SPeter Zijlstra #include <linux/sched/rt.h> 2401768b42SPeter Zijlstra #include <linux/export.h> 2501768b42SPeter Zijlstra #include <linux/spinlock.h> 2601768b42SPeter Zijlstra #include <linux/interrupt.h> 2701768b42SPeter Zijlstra #include <linux/debug_locks.h> 287a215f89SDavidlohr Bueso #include <linux/osq_lock.h> 2901768b42SPeter Zijlstra 3001768b42SPeter Zijlstra #ifdef CONFIG_DEBUG_MUTEXES 3101768b42SPeter Zijlstra # include "mutex-debug.h" 3201768b42SPeter Zijlstra #else 3301768b42SPeter Zijlstra # include "mutex.h" 3401768b42SPeter Zijlstra #endif 3501768b42SPeter Zijlstra 3601768b42SPeter Zijlstra void 3701768b42SPeter Zijlstra __mutex_init(struct mutex *lock, const char *name, struct lock_class_key *key) 3801768b42SPeter Zijlstra { 393ca0ff57SPeter Zijlstra atomic_long_set(&lock->owner, 0); 4001768b42SPeter Zijlstra spin_lock_init(&lock->wait_lock); 4101768b42SPeter Zijlstra INIT_LIST_HEAD(&lock->wait_list); 4201768b42SPeter Zijlstra #ifdef CONFIG_MUTEX_SPIN_ON_OWNER 434d9d951eSJason Low osq_lock_init(&lock->osq); 4401768b42SPeter Zijlstra #endif 4501768b42SPeter Zijlstra 4601768b42SPeter Zijlstra debug_mutex_init(lock, name, key); 4701768b42SPeter Zijlstra } 4801768b42SPeter Zijlstra EXPORT_SYMBOL(__mutex_init); 4901768b42SPeter Zijlstra 503ca0ff57SPeter Zijlstra /* 513ca0ff57SPeter Zijlstra * @owner: contains: 'struct task_struct *' to the current lock owner, 523ca0ff57SPeter Zijlstra * NULL means not owned. Since task_struct pointers are aligned at 533ca0ff57SPeter Zijlstra * ARCH_MIN_TASKALIGN (which is at least sizeof(void *)), we have low 543ca0ff57SPeter Zijlstra * bits to store extra state. 553ca0ff57SPeter Zijlstra * 563ca0ff57SPeter Zijlstra * Bit0 indicates a non-empty waiter list; unlock must issue a wakeup. 579d659ae1SPeter Zijlstra * Bit1 indicates unlock needs to hand the lock to the top-waiter 583ca0ff57SPeter Zijlstra */ 593ca0ff57SPeter Zijlstra #define MUTEX_FLAG_WAITERS 0x01 609d659ae1SPeter Zijlstra #define MUTEX_FLAG_HANDOFF 0x02 613ca0ff57SPeter Zijlstra 623ca0ff57SPeter Zijlstra #define MUTEX_FLAGS 0x03 633ca0ff57SPeter Zijlstra 643ca0ff57SPeter Zijlstra static inline struct task_struct *__owner_task(unsigned long owner) 653ca0ff57SPeter Zijlstra { 663ca0ff57SPeter Zijlstra return (struct task_struct *)(owner & ~MUTEX_FLAGS); 673ca0ff57SPeter Zijlstra } 683ca0ff57SPeter Zijlstra 693ca0ff57SPeter Zijlstra static inline unsigned long __owner_flags(unsigned long owner) 703ca0ff57SPeter Zijlstra { 713ca0ff57SPeter Zijlstra return owner & MUTEX_FLAGS; 723ca0ff57SPeter Zijlstra } 733ca0ff57SPeter Zijlstra 743ca0ff57SPeter Zijlstra /* 753ca0ff57SPeter Zijlstra * Actual trylock that will work on any unlocked state. 769d659ae1SPeter Zijlstra * 779d659ae1SPeter Zijlstra * When setting the owner field, we must preserve the low flag bits. 789d659ae1SPeter Zijlstra * 799d659ae1SPeter Zijlstra * Be careful with @handoff, only set that in a wait-loop (where you set 809d659ae1SPeter Zijlstra * HANDOFF) to avoid recursive lock attempts. 813ca0ff57SPeter Zijlstra */ 829d659ae1SPeter Zijlstra static inline bool __mutex_trylock(struct mutex *lock, const bool handoff) 833ca0ff57SPeter Zijlstra { 843ca0ff57SPeter Zijlstra unsigned long owner, curr = (unsigned long)current; 853ca0ff57SPeter Zijlstra 863ca0ff57SPeter Zijlstra owner = atomic_long_read(&lock->owner); 873ca0ff57SPeter Zijlstra for (;;) { /* must loop, can race against a flag */ 889d659ae1SPeter Zijlstra unsigned long old, flags = __owner_flags(owner); 893ca0ff57SPeter Zijlstra 909d659ae1SPeter Zijlstra if (__owner_task(owner)) { 919d659ae1SPeter Zijlstra if (handoff && unlikely(__owner_task(owner) == current)) { 929d659ae1SPeter Zijlstra /* 939d659ae1SPeter Zijlstra * Provide ACQUIRE semantics for the lock-handoff. 949d659ae1SPeter Zijlstra * 959d659ae1SPeter Zijlstra * We cannot easily use load-acquire here, since 969d659ae1SPeter Zijlstra * the actual load is a failed cmpxchg, which 979d659ae1SPeter Zijlstra * doesn't imply any barriers. 989d659ae1SPeter Zijlstra * 999d659ae1SPeter Zijlstra * Also, this is a fairly unlikely scenario, and 1009d659ae1SPeter Zijlstra * this contains the cost. 1019d659ae1SPeter Zijlstra */ 1029d659ae1SPeter Zijlstra smp_mb(); /* ACQUIRE */ 1039d659ae1SPeter Zijlstra return true; 1049d659ae1SPeter Zijlstra } 1059d659ae1SPeter Zijlstra 1063ca0ff57SPeter Zijlstra return false; 1079d659ae1SPeter Zijlstra } 1083ca0ff57SPeter Zijlstra 1099d659ae1SPeter Zijlstra /* 1109d659ae1SPeter Zijlstra * We set the HANDOFF bit, we must make sure it doesn't live 1119d659ae1SPeter Zijlstra * past the point where we acquire it. This would be possible 1129d659ae1SPeter Zijlstra * if we (accidentally) set the bit on an unlocked mutex. 1139d659ae1SPeter Zijlstra */ 1149d659ae1SPeter Zijlstra if (handoff) 1159d659ae1SPeter Zijlstra flags &= ~MUTEX_FLAG_HANDOFF; 1169d659ae1SPeter Zijlstra 1179d659ae1SPeter Zijlstra old = atomic_long_cmpxchg_acquire(&lock->owner, owner, curr | flags); 1183ca0ff57SPeter Zijlstra if (old == owner) 1193ca0ff57SPeter Zijlstra return true; 1203ca0ff57SPeter Zijlstra 1213ca0ff57SPeter Zijlstra owner = old; 1223ca0ff57SPeter Zijlstra } 1233ca0ff57SPeter Zijlstra } 1243ca0ff57SPeter Zijlstra 1253ca0ff57SPeter Zijlstra #ifndef CONFIG_DEBUG_LOCK_ALLOC 1263ca0ff57SPeter Zijlstra /* 1273ca0ff57SPeter Zijlstra * Lockdep annotations are contained to the slow paths for simplicity. 1283ca0ff57SPeter Zijlstra * There is nothing that would stop spreading the lockdep annotations outwards 1293ca0ff57SPeter Zijlstra * except more code. 1303ca0ff57SPeter Zijlstra */ 1313ca0ff57SPeter Zijlstra 1323ca0ff57SPeter Zijlstra /* 1333ca0ff57SPeter Zijlstra * Optimistic trylock that only works in the uncontended case. Make sure to 1343ca0ff57SPeter Zijlstra * follow with a __mutex_trylock() before failing. 1353ca0ff57SPeter Zijlstra */ 1363ca0ff57SPeter Zijlstra static __always_inline bool __mutex_trylock_fast(struct mutex *lock) 1373ca0ff57SPeter Zijlstra { 1383ca0ff57SPeter Zijlstra unsigned long curr = (unsigned long)current; 1393ca0ff57SPeter Zijlstra 1403ca0ff57SPeter Zijlstra if (!atomic_long_cmpxchg_acquire(&lock->owner, 0UL, curr)) 1413ca0ff57SPeter Zijlstra return true; 1423ca0ff57SPeter Zijlstra 1433ca0ff57SPeter Zijlstra return false; 1443ca0ff57SPeter Zijlstra } 1453ca0ff57SPeter Zijlstra 1463ca0ff57SPeter Zijlstra static __always_inline bool __mutex_unlock_fast(struct mutex *lock) 1473ca0ff57SPeter Zijlstra { 1483ca0ff57SPeter Zijlstra unsigned long curr = (unsigned long)current; 1493ca0ff57SPeter Zijlstra 1503ca0ff57SPeter Zijlstra if (atomic_long_cmpxchg_release(&lock->owner, curr, 0UL) == curr) 1513ca0ff57SPeter Zijlstra return true; 1523ca0ff57SPeter Zijlstra 1533ca0ff57SPeter Zijlstra return false; 1543ca0ff57SPeter Zijlstra } 1553ca0ff57SPeter Zijlstra #endif 1563ca0ff57SPeter Zijlstra 1573ca0ff57SPeter Zijlstra static inline void __mutex_set_flag(struct mutex *lock, unsigned long flag) 1583ca0ff57SPeter Zijlstra { 1593ca0ff57SPeter Zijlstra atomic_long_or(flag, &lock->owner); 1603ca0ff57SPeter Zijlstra } 1613ca0ff57SPeter Zijlstra 1623ca0ff57SPeter Zijlstra static inline void __mutex_clear_flag(struct mutex *lock, unsigned long flag) 1633ca0ff57SPeter Zijlstra { 1643ca0ff57SPeter Zijlstra atomic_long_andnot(flag, &lock->owner); 1653ca0ff57SPeter Zijlstra } 1663ca0ff57SPeter Zijlstra 1679d659ae1SPeter Zijlstra static inline bool __mutex_waiter_is_first(struct mutex *lock, struct mutex_waiter *waiter) 1689d659ae1SPeter Zijlstra { 1699d659ae1SPeter Zijlstra return list_first_entry(&lock->wait_list, struct mutex_waiter, list) == waiter; 1709d659ae1SPeter Zijlstra } 1719d659ae1SPeter Zijlstra 1729d659ae1SPeter Zijlstra /* 1739d659ae1SPeter Zijlstra * Give up ownership to a specific task, when @task = NULL, this is equivalent 1749d659ae1SPeter Zijlstra * to a regular unlock. Clears HANDOFF, preserves WAITERS. Provides RELEASE 1759d659ae1SPeter Zijlstra * semantics like a regular unlock, the __mutex_trylock() provides matching 1769d659ae1SPeter Zijlstra * ACQUIRE semantics for the handoff. 1779d659ae1SPeter Zijlstra */ 1789d659ae1SPeter Zijlstra static void __mutex_handoff(struct mutex *lock, struct task_struct *task) 1799d659ae1SPeter Zijlstra { 1809d659ae1SPeter Zijlstra unsigned long owner = atomic_long_read(&lock->owner); 1819d659ae1SPeter Zijlstra 1829d659ae1SPeter Zijlstra for (;;) { 1839d659ae1SPeter Zijlstra unsigned long old, new; 1849d659ae1SPeter Zijlstra 1859d659ae1SPeter Zijlstra #ifdef CONFIG_DEBUG_MUTEXES 1869d659ae1SPeter Zijlstra DEBUG_LOCKS_WARN_ON(__owner_task(owner) != current); 1879d659ae1SPeter Zijlstra #endif 1889d659ae1SPeter Zijlstra 1899d659ae1SPeter Zijlstra new = (owner & MUTEX_FLAG_WAITERS); 1909d659ae1SPeter Zijlstra new |= (unsigned long)task; 1919d659ae1SPeter Zijlstra 1929d659ae1SPeter Zijlstra old = atomic_long_cmpxchg_release(&lock->owner, owner, new); 1939d659ae1SPeter Zijlstra if (old == owner) 1949d659ae1SPeter Zijlstra break; 1959d659ae1SPeter Zijlstra 1969d659ae1SPeter Zijlstra owner = old; 1979d659ae1SPeter Zijlstra } 1989d659ae1SPeter Zijlstra } 1999d659ae1SPeter Zijlstra 20001768b42SPeter Zijlstra #ifndef CONFIG_DEBUG_LOCK_ALLOC 20101768b42SPeter Zijlstra /* 20201768b42SPeter Zijlstra * We split the mutex lock/unlock logic into separate fastpath and 20301768b42SPeter Zijlstra * slowpath functions, to reduce the register pressure on the fastpath. 20401768b42SPeter Zijlstra * We also put the fastpath first in the kernel image, to make sure the 20501768b42SPeter Zijlstra * branch is predicted by the CPU as default-untaken. 20601768b42SPeter Zijlstra */ 2073ca0ff57SPeter Zijlstra static void __sched __mutex_lock_slowpath(struct mutex *lock); 20801768b42SPeter Zijlstra 20901768b42SPeter Zijlstra /** 21001768b42SPeter Zijlstra * mutex_lock - acquire the mutex 21101768b42SPeter Zijlstra * @lock: the mutex to be acquired 21201768b42SPeter Zijlstra * 21301768b42SPeter Zijlstra * Lock the mutex exclusively for this task. If the mutex is not 21401768b42SPeter Zijlstra * available right now, it will sleep until it can get it. 21501768b42SPeter Zijlstra * 21601768b42SPeter Zijlstra * The mutex must later on be released by the same task that 21701768b42SPeter Zijlstra * acquired it. Recursive locking is not allowed. The task 21801768b42SPeter Zijlstra * may not exit without first unlocking the mutex. Also, kernel 219139b6fd2SSharon Dvir * memory where the mutex resides must not be freed with 22001768b42SPeter Zijlstra * the mutex still locked. The mutex must first be initialized 22101768b42SPeter Zijlstra * (or statically defined) before it can be locked. memset()-ing 22201768b42SPeter Zijlstra * the mutex to 0 is not allowed. 22301768b42SPeter Zijlstra * 22401768b42SPeter Zijlstra * ( The CONFIG_DEBUG_MUTEXES .config option turns on debugging 22501768b42SPeter Zijlstra * checks that will enforce the restrictions and will also do 22601768b42SPeter Zijlstra * deadlock debugging. ) 22701768b42SPeter Zijlstra * 22801768b42SPeter Zijlstra * This function is similar to (but not equivalent to) down(). 22901768b42SPeter Zijlstra */ 23001768b42SPeter Zijlstra void __sched mutex_lock(struct mutex *lock) 23101768b42SPeter Zijlstra { 23201768b42SPeter Zijlstra might_sleep(); 23301768b42SPeter Zijlstra 2343ca0ff57SPeter Zijlstra if (!__mutex_trylock_fast(lock)) 2353ca0ff57SPeter Zijlstra __mutex_lock_slowpath(lock); 2363ca0ff57SPeter Zijlstra } 23701768b42SPeter Zijlstra EXPORT_SYMBOL(mutex_lock); 23801768b42SPeter Zijlstra #endif 23901768b42SPeter Zijlstra 24076916515SDavidlohr Bueso static __always_inline void ww_mutex_lock_acquired(struct ww_mutex *ww, 24176916515SDavidlohr Bueso struct ww_acquire_ctx *ww_ctx) 24276916515SDavidlohr Bueso { 24376916515SDavidlohr Bueso #ifdef CONFIG_DEBUG_MUTEXES 24476916515SDavidlohr Bueso /* 24576916515SDavidlohr Bueso * If this WARN_ON triggers, you used ww_mutex_lock to acquire, 24676916515SDavidlohr Bueso * but released with a normal mutex_unlock in this call. 24776916515SDavidlohr Bueso * 24876916515SDavidlohr Bueso * This should never happen, always use ww_mutex_unlock. 24976916515SDavidlohr Bueso */ 25076916515SDavidlohr Bueso DEBUG_LOCKS_WARN_ON(ww->ctx); 25176916515SDavidlohr Bueso 25276916515SDavidlohr Bueso /* 25376916515SDavidlohr Bueso * Not quite done after calling ww_acquire_done() ? 25476916515SDavidlohr Bueso */ 25576916515SDavidlohr Bueso DEBUG_LOCKS_WARN_ON(ww_ctx->done_acquire); 25676916515SDavidlohr Bueso 25776916515SDavidlohr Bueso if (ww_ctx->contending_lock) { 25876916515SDavidlohr Bueso /* 25976916515SDavidlohr Bueso * After -EDEADLK you tried to 26076916515SDavidlohr Bueso * acquire a different ww_mutex? Bad! 26176916515SDavidlohr Bueso */ 26276916515SDavidlohr Bueso DEBUG_LOCKS_WARN_ON(ww_ctx->contending_lock != ww); 26376916515SDavidlohr Bueso 26476916515SDavidlohr Bueso /* 26576916515SDavidlohr Bueso * You called ww_mutex_lock after receiving -EDEADLK, 26676916515SDavidlohr Bueso * but 'forgot' to unlock everything else first? 26776916515SDavidlohr Bueso */ 26876916515SDavidlohr Bueso DEBUG_LOCKS_WARN_ON(ww_ctx->acquired > 0); 26976916515SDavidlohr Bueso ww_ctx->contending_lock = NULL; 27076916515SDavidlohr Bueso } 27176916515SDavidlohr Bueso 27276916515SDavidlohr Bueso /* 27376916515SDavidlohr Bueso * Naughty, using a different class will lead to undefined behavior! 27476916515SDavidlohr Bueso */ 27576916515SDavidlohr Bueso DEBUG_LOCKS_WARN_ON(ww_ctx->ww_class != ww->ww_class); 27676916515SDavidlohr Bueso #endif 27776916515SDavidlohr Bueso ww_ctx->acquired++; 27876916515SDavidlohr Bueso } 27976916515SDavidlohr Bueso 28076916515SDavidlohr Bueso /* 2814bd19084SDavidlohr Bueso * After acquiring lock with fastpath or when we lost out in contested 28276916515SDavidlohr Bueso * slowpath, set ctx and wake up any waiters so they can recheck. 28376916515SDavidlohr Bueso */ 28476916515SDavidlohr Bueso static __always_inline void 28576916515SDavidlohr Bueso ww_mutex_set_context_fastpath(struct ww_mutex *lock, 28676916515SDavidlohr Bueso struct ww_acquire_ctx *ctx) 28776916515SDavidlohr Bueso { 28876916515SDavidlohr Bueso unsigned long flags; 28976916515SDavidlohr Bueso struct mutex_waiter *cur; 29076916515SDavidlohr Bueso 29176916515SDavidlohr Bueso ww_mutex_lock_acquired(lock, ctx); 29276916515SDavidlohr Bueso 29376916515SDavidlohr Bueso lock->ctx = ctx; 29476916515SDavidlohr Bueso 29576916515SDavidlohr Bueso /* 29676916515SDavidlohr Bueso * The lock->ctx update should be visible on all cores before 29776916515SDavidlohr Bueso * the atomic read is done, otherwise contended waiters might be 29876916515SDavidlohr Bueso * missed. The contended waiters will either see ww_ctx == NULL 29976916515SDavidlohr Bueso * and keep spinning, or it will acquire wait_lock, add itself 30076916515SDavidlohr Bueso * to waiter list and sleep. 30176916515SDavidlohr Bueso */ 30276916515SDavidlohr Bueso smp_mb(); /* ^^^ */ 30376916515SDavidlohr Bueso 30476916515SDavidlohr Bueso /* 30576916515SDavidlohr Bueso * Check if lock is contended, if not there is nobody to wake up 30676916515SDavidlohr Bueso */ 3073ca0ff57SPeter Zijlstra if (likely(!(atomic_long_read(&lock->base.owner) & MUTEX_FLAG_WAITERS))) 30876916515SDavidlohr Bueso return; 30976916515SDavidlohr Bueso 31076916515SDavidlohr Bueso /* 31176916515SDavidlohr Bueso * Uh oh, we raced in fastpath, wake up everyone in this case, 31276916515SDavidlohr Bueso * so they can see the new lock->ctx. 31376916515SDavidlohr Bueso */ 31476916515SDavidlohr Bueso spin_lock_mutex(&lock->base.wait_lock, flags); 31576916515SDavidlohr Bueso list_for_each_entry(cur, &lock->base.wait_list, list) { 31676916515SDavidlohr Bueso debug_mutex_wake_waiter(&lock->base, cur); 31776916515SDavidlohr Bueso wake_up_process(cur->task); 31876916515SDavidlohr Bueso } 31976916515SDavidlohr Bueso spin_unlock_mutex(&lock->base.wait_lock, flags); 32076916515SDavidlohr Bueso } 32176916515SDavidlohr Bueso 3224bd19084SDavidlohr Bueso /* 3234bd19084SDavidlohr Bueso * After acquiring lock in the slowpath set ctx and wake up any 3244bd19084SDavidlohr Bueso * waiters so they can recheck. 3254bd19084SDavidlohr Bueso * 3264bd19084SDavidlohr Bueso * Callers must hold the mutex wait_lock. 3274bd19084SDavidlohr Bueso */ 3284bd19084SDavidlohr Bueso static __always_inline void 3294bd19084SDavidlohr Bueso ww_mutex_set_context_slowpath(struct ww_mutex *lock, 3304bd19084SDavidlohr Bueso struct ww_acquire_ctx *ctx) 3314bd19084SDavidlohr Bueso { 3324bd19084SDavidlohr Bueso struct mutex_waiter *cur; 3334bd19084SDavidlohr Bueso 3344bd19084SDavidlohr Bueso ww_mutex_lock_acquired(lock, ctx); 3354bd19084SDavidlohr Bueso lock->ctx = ctx; 3364bd19084SDavidlohr Bueso 3374bd19084SDavidlohr Bueso /* 3384bd19084SDavidlohr Bueso * Give any possible sleeping processes the chance to wake up, 3394bd19084SDavidlohr Bueso * so they can recheck if they have to back off. 3404bd19084SDavidlohr Bueso */ 3414bd19084SDavidlohr Bueso list_for_each_entry(cur, &lock->base.wait_list, list) { 3424bd19084SDavidlohr Bueso debug_mutex_wake_waiter(&lock->base, cur); 3434bd19084SDavidlohr Bueso wake_up_process(cur->task); 3444bd19084SDavidlohr Bueso } 3454bd19084SDavidlohr Bueso } 34676916515SDavidlohr Bueso 34701768b42SPeter Zijlstra #ifdef CONFIG_MUTEX_SPIN_ON_OWNER 34801768b42SPeter Zijlstra /* 34901768b42SPeter Zijlstra * Look out! "owner" is an entirely speculative pointer 35001768b42SPeter Zijlstra * access and not reliable. 35101768b42SPeter Zijlstra */ 35201768b42SPeter Zijlstra static noinline 353be1f7bf2SJason Low bool mutex_spin_on_owner(struct mutex *lock, struct task_struct *owner) 35401768b42SPeter Zijlstra { 35501ac33c1SJason Low bool ret = true; 356be1f7bf2SJason Low 35701768b42SPeter Zijlstra rcu_read_lock(); 3583ca0ff57SPeter Zijlstra while (__mutex_owner(lock) == owner) { 359be1f7bf2SJason Low /* 360be1f7bf2SJason Low * Ensure we emit the owner->on_cpu, dereference _after_ 36101ac33c1SJason Low * checking lock->owner still matches owner. If that fails, 36201ac33c1SJason Low * owner might point to freed memory. If it still matches, 363be1f7bf2SJason Low * the rcu_read_lock() ensures the memory stays valid. 364be1f7bf2SJason Low */ 365be1f7bf2SJason Low barrier(); 366be1f7bf2SJason Low 36705ffc951SPan Xinhui /* 36805ffc951SPan Xinhui * Use vcpu_is_preempted to detect lock holder preemption issue. 36905ffc951SPan Xinhui */ 37005ffc951SPan Xinhui if (!owner->on_cpu || need_resched() || 37105ffc951SPan Xinhui vcpu_is_preempted(task_cpu(owner))) { 372be1f7bf2SJason Low ret = false; 373be1f7bf2SJason Low break; 374be1f7bf2SJason Low } 37501768b42SPeter Zijlstra 376f2f09a4cSChristian Borntraeger cpu_relax(); 37701768b42SPeter Zijlstra } 37801768b42SPeter Zijlstra rcu_read_unlock(); 37901768b42SPeter Zijlstra 380be1f7bf2SJason Low return ret; 38101768b42SPeter Zijlstra } 38201768b42SPeter Zijlstra 38301768b42SPeter Zijlstra /* 38401768b42SPeter Zijlstra * Initial check for entering the mutex spinning loop 38501768b42SPeter Zijlstra */ 38601768b42SPeter Zijlstra static inline int mutex_can_spin_on_owner(struct mutex *lock) 38701768b42SPeter Zijlstra { 38801768b42SPeter Zijlstra struct task_struct *owner; 38901768b42SPeter Zijlstra int retval = 1; 39001768b42SPeter Zijlstra 39146af29e4SJason Low if (need_resched()) 39246af29e4SJason Low return 0; 39346af29e4SJason Low 39401768b42SPeter Zijlstra rcu_read_lock(); 3953ca0ff57SPeter Zijlstra owner = __mutex_owner(lock); 39605ffc951SPan Xinhui 39705ffc951SPan Xinhui /* 39805ffc951SPan Xinhui * As lock holder preemption issue, we both skip spinning if task is not 39905ffc951SPan Xinhui * on cpu or its cpu is preempted 40005ffc951SPan Xinhui */ 40101768b42SPeter Zijlstra if (owner) 40205ffc951SPan Xinhui retval = owner->on_cpu && !vcpu_is_preempted(task_cpu(owner)); 40301768b42SPeter Zijlstra rcu_read_unlock(); 40476916515SDavidlohr Bueso 40576916515SDavidlohr Bueso /* 4063ca0ff57SPeter Zijlstra * If lock->owner is not set, the mutex has been released. Return true 4073ca0ff57SPeter Zijlstra * such that we'll trylock in the spin path, which is a faster option 4083ca0ff57SPeter Zijlstra * than the blocking slow path. 40976916515SDavidlohr Bueso */ 4103ca0ff57SPeter Zijlstra return retval; 41176916515SDavidlohr Bueso } 41276916515SDavidlohr Bueso 41376916515SDavidlohr Bueso /* 41476916515SDavidlohr Bueso * Optimistic spinning. 41576916515SDavidlohr Bueso * 41676916515SDavidlohr Bueso * We try to spin for acquisition when we find that the lock owner 41776916515SDavidlohr Bueso * is currently running on a (different) CPU and while we don't 41876916515SDavidlohr Bueso * need to reschedule. The rationale is that if the lock owner is 41976916515SDavidlohr Bueso * running, it is likely to release the lock soon. 42076916515SDavidlohr Bueso * 42176916515SDavidlohr Bueso * The mutex spinners are queued up using MCS lock so that only one 42276916515SDavidlohr Bueso * spinner can compete for the mutex. However, if mutex spinning isn't 42376916515SDavidlohr Bueso * going to happen, there is no point in going through the lock/unlock 42476916515SDavidlohr Bueso * overhead. 42576916515SDavidlohr Bueso * 42676916515SDavidlohr Bueso * Returns true when the lock was taken, otherwise false, indicating 42776916515SDavidlohr Bueso * that we need to jump to the slowpath and sleep. 428b341afb3SWaiman Long * 429b341afb3SWaiman Long * The waiter flag is set to true if the spinner is a waiter in the wait 430b341afb3SWaiman Long * queue. The waiter-spinner will spin on the lock directly and concurrently 431b341afb3SWaiman Long * with the spinner at the head of the OSQ, if present, until the owner is 432b341afb3SWaiman Long * changed to itself. 43376916515SDavidlohr Bueso */ 43476916515SDavidlohr Bueso static bool mutex_optimistic_spin(struct mutex *lock, 435b341afb3SWaiman Long struct ww_acquire_ctx *ww_ctx, 436b341afb3SWaiman Long const bool use_ww_ctx, const bool waiter) 43776916515SDavidlohr Bueso { 43876916515SDavidlohr Bueso struct task_struct *task = current; 43976916515SDavidlohr Bueso 440b341afb3SWaiman Long if (!waiter) { 441b341afb3SWaiman Long /* 442b341afb3SWaiman Long * The purpose of the mutex_can_spin_on_owner() function is 443b341afb3SWaiman Long * to eliminate the overhead of osq_lock() and osq_unlock() 444b341afb3SWaiman Long * in case spinning isn't possible. As a waiter-spinner 445b341afb3SWaiman Long * is not going to take OSQ lock anyway, there is no need 446b341afb3SWaiman Long * to call mutex_can_spin_on_owner(). 447b341afb3SWaiman Long */ 44876916515SDavidlohr Bueso if (!mutex_can_spin_on_owner(lock)) 449b341afb3SWaiman Long goto fail; 45076916515SDavidlohr Bueso 451e42f678aSDavidlohr Bueso /* 452e42f678aSDavidlohr Bueso * In order to avoid a stampede of mutex spinners trying to 453e42f678aSDavidlohr Bueso * acquire the mutex all at once, the spinners need to take a 454e42f678aSDavidlohr Bueso * MCS (queued) lock first before spinning on the owner field. 455e42f678aSDavidlohr Bueso */ 45676916515SDavidlohr Bueso if (!osq_lock(&lock->osq)) 457b341afb3SWaiman Long goto fail; 458b341afb3SWaiman Long } 45976916515SDavidlohr Bueso 460b341afb3SWaiman Long for (;;) { 46176916515SDavidlohr Bueso struct task_struct *owner; 46276916515SDavidlohr Bueso 46376916515SDavidlohr Bueso if (use_ww_ctx && ww_ctx->acquired > 0) { 46476916515SDavidlohr Bueso struct ww_mutex *ww; 46576916515SDavidlohr Bueso 46676916515SDavidlohr Bueso ww = container_of(lock, struct ww_mutex, base); 46776916515SDavidlohr Bueso /* 46876916515SDavidlohr Bueso * If ww->ctx is set the contents are undefined, only 46976916515SDavidlohr Bueso * by acquiring wait_lock there is a guarantee that 47076916515SDavidlohr Bueso * they are not invalid when reading. 47176916515SDavidlohr Bueso * 47276916515SDavidlohr Bueso * As such, when deadlock detection needs to be 47376916515SDavidlohr Bueso * performed the optimistic spinning cannot be done. 47476916515SDavidlohr Bueso */ 4754d3199e4SDavidlohr Bueso if (READ_ONCE(ww->ctx)) 476b341afb3SWaiman Long goto fail_unlock; 47776916515SDavidlohr Bueso } 47876916515SDavidlohr Bueso 47976916515SDavidlohr Bueso /* 48076916515SDavidlohr Bueso * If there's an owner, wait for it to either 48176916515SDavidlohr Bueso * release the lock or go to sleep. 48276916515SDavidlohr Bueso */ 4833ca0ff57SPeter Zijlstra owner = __mutex_owner(lock); 484b341afb3SWaiman Long if (owner) { 485b341afb3SWaiman Long if (waiter && owner == task) { 486b341afb3SWaiman Long smp_mb(); /* ACQUIRE */ 48776916515SDavidlohr Bueso break; 488b341afb3SWaiman Long } 489b341afb3SWaiman Long 490b341afb3SWaiman Long if (!mutex_spin_on_owner(lock, owner)) 491b341afb3SWaiman Long goto fail_unlock; 492b341afb3SWaiman Long } 49376916515SDavidlohr Bueso 49476916515SDavidlohr Bueso /* Try to acquire the mutex if it is unlocked. */ 495b341afb3SWaiman Long if (__mutex_trylock(lock, waiter)) 496b341afb3SWaiman Long break; 49776916515SDavidlohr Bueso 49876916515SDavidlohr Bueso /* 49976916515SDavidlohr Bueso * The cpu_relax() call is a compiler barrier which forces 50076916515SDavidlohr Bueso * everything in this loop to be re-loaded. We don't need 50176916515SDavidlohr Bueso * memory barriers as we'll eventually observe the right 50276916515SDavidlohr Bueso * values at the cost of a few extra spins. 50376916515SDavidlohr Bueso */ 504f2f09a4cSChristian Borntraeger cpu_relax(); 50576916515SDavidlohr Bueso } 50676916515SDavidlohr Bueso 507b341afb3SWaiman Long if (!waiter) 50876916515SDavidlohr Bueso osq_unlock(&lock->osq); 509b341afb3SWaiman Long 510b341afb3SWaiman Long return true; 511b341afb3SWaiman Long 512b341afb3SWaiman Long 513b341afb3SWaiman Long fail_unlock: 514b341afb3SWaiman Long if (!waiter) 515b341afb3SWaiman Long osq_unlock(&lock->osq); 516b341afb3SWaiman Long 517b341afb3SWaiman Long fail: 51876916515SDavidlohr Bueso /* 51976916515SDavidlohr Bueso * If we fell out of the spin path because of need_resched(), 52076916515SDavidlohr Bueso * reschedule now, before we try-lock the mutex. This avoids getting 52176916515SDavidlohr Bueso * scheduled out right after we obtained the mutex. 52276916515SDavidlohr Bueso */ 5236f942a1fSPeter Zijlstra if (need_resched()) { 5246f942a1fSPeter Zijlstra /* 5256f942a1fSPeter Zijlstra * We _should_ have TASK_RUNNING here, but just in case 5266f942a1fSPeter Zijlstra * we do not, make it so, otherwise we might get stuck. 5276f942a1fSPeter Zijlstra */ 5286f942a1fSPeter Zijlstra __set_current_state(TASK_RUNNING); 52976916515SDavidlohr Bueso schedule_preempt_disabled(); 5306f942a1fSPeter Zijlstra } 53176916515SDavidlohr Bueso 53276916515SDavidlohr Bueso return false; 53376916515SDavidlohr Bueso } 53476916515SDavidlohr Bueso #else 53576916515SDavidlohr Bueso static bool mutex_optimistic_spin(struct mutex *lock, 536b341afb3SWaiman Long struct ww_acquire_ctx *ww_ctx, 537b341afb3SWaiman Long const bool use_ww_ctx, const bool waiter) 53876916515SDavidlohr Bueso { 53976916515SDavidlohr Bueso return false; 54076916515SDavidlohr Bueso } 54101768b42SPeter Zijlstra #endif 54201768b42SPeter Zijlstra 5433ca0ff57SPeter Zijlstra static noinline void __sched __mutex_unlock_slowpath(struct mutex *lock, unsigned long ip); 54401768b42SPeter Zijlstra 54501768b42SPeter Zijlstra /** 54601768b42SPeter Zijlstra * mutex_unlock - release the mutex 54701768b42SPeter Zijlstra * @lock: the mutex to be released 54801768b42SPeter Zijlstra * 54901768b42SPeter Zijlstra * Unlock a mutex that has been locked by this task previously. 55001768b42SPeter Zijlstra * 55101768b42SPeter Zijlstra * This function must not be used in interrupt context. Unlocking 55201768b42SPeter Zijlstra * of a not locked mutex is not allowed. 55301768b42SPeter Zijlstra * 55401768b42SPeter Zijlstra * This function is similar to (but not equivalent to) up(). 55501768b42SPeter Zijlstra */ 55601768b42SPeter Zijlstra void __sched mutex_unlock(struct mutex *lock) 55701768b42SPeter Zijlstra { 5583ca0ff57SPeter Zijlstra #ifndef CONFIG_DEBUG_LOCK_ALLOC 5593ca0ff57SPeter Zijlstra if (__mutex_unlock_fast(lock)) 5603ca0ff57SPeter Zijlstra return; 56101768b42SPeter Zijlstra #endif 5623ca0ff57SPeter Zijlstra __mutex_unlock_slowpath(lock, _RET_IP_); 56301768b42SPeter Zijlstra } 56401768b42SPeter Zijlstra EXPORT_SYMBOL(mutex_unlock); 56501768b42SPeter Zijlstra 56601768b42SPeter Zijlstra /** 56701768b42SPeter Zijlstra * ww_mutex_unlock - release the w/w mutex 56801768b42SPeter Zijlstra * @lock: the mutex to be released 56901768b42SPeter Zijlstra * 57001768b42SPeter Zijlstra * Unlock a mutex that has been locked by this task previously with any of the 57101768b42SPeter Zijlstra * ww_mutex_lock* functions (with or without an acquire context). It is 57201768b42SPeter Zijlstra * forbidden to release the locks after releasing the acquire context. 57301768b42SPeter Zijlstra * 57401768b42SPeter Zijlstra * This function must not be used in interrupt context. Unlocking 57501768b42SPeter Zijlstra * of a unlocked mutex is not allowed. 57601768b42SPeter Zijlstra */ 57701768b42SPeter Zijlstra void __sched ww_mutex_unlock(struct ww_mutex *lock) 57801768b42SPeter Zijlstra { 57901768b42SPeter Zijlstra /* 58001768b42SPeter Zijlstra * The unlocking fastpath is the 0->1 transition from 'locked' 58101768b42SPeter Zijlstra * into 'unlocked' state: 58201768b42SPeter Zijlstra */ 58301768b42SPeter Zijlstra if (lock->ctx) { 58401768b42SPeter Zijlstra #ifdef CONFIG_DEBUG_MUTEXES 58501768b42SPeter Zijlstra DEBUG_LOCKS_WARN_ON(!lock->ctx->acquired); 58601768b42SPeter Zijlstra #endif 58701768b42SPeter Zijlstra if (lock->ctx->acquired > 0) 58801768b42SPeter Zijlstra lock->ctx->acquired--; 58901768b42SPeter Zijlstra lock->ctx = NULL; 59001768b42SPeter Zijlstra } 59101768b42SPeter Zijlstra 5923ca0ff57SPeter Zijlstra mutex_unlock(&lock->base); 59301768b42SPeter Zijlstra } 59401768b42SPeter Zijlstra EXPORT_SYMBOL(ww_mutex_unlock); 59501768b42SPeter Zijlstra 59601768b42SPeter Zijlstra static inline int __sched 59763dc47e9SDavidlohr Bueso __ww_mutex_lock_check_stamp(struct mutex *lock, struct ww_acquire_ctx *ctx) 59801768b42SPeter Zijlstra { 59901768b42SPeter Zijlstra struct ww_mutex *ww = container_of(lock, struct ww_mutex, base); 6004d3199e4SDavidlohr Bueso struct ww_acquire_ctx *hold_ctx = READ_ONCE(ww->ctx); 60101768b42SPeter Zijlstra 60201768b42SPeter Zijlstra if (!hold_ctx) 60301768b42SPeter Zijlstra return 0; 60401768b42SPeter Zijlstra 60501768b42SPeter Zijlstra if (ctx->stamp - hold_ctx->stamp <= LONG_MAX && 60601768b42SPeter Zijlstra (ctx->stamp != hold_ctx->stamp || ctx > hold_ctx)) { 60701768b42SPeter Zijlstra #ifdef CONFIG_DEBUG_MUTEXES 60801768b42SPeter Zijlstra DEBUG_LOCKS_WARN_ON(ctx->contending_lock); 60901768b42SPeter Zijlstra ctx->contending_lock = ww; 61001768b42SPeter Zijlstra #endif 61101768b42SPeter Zijlstra return -EDEADLK; 61201768b42SPeter Zijlstra } 61301768b42SPeter Zijlstra 61401768b42SPeter Zijlstra return 0; 61501768b42SPeter Zijlstra } 61601768b42SPeter Zijlstra 61701768b42SPeter Zijlstra /* 61801768b42SPeter Zijlstra * Lock a mutex (possibly interruptible), slowpath: 61901768b42SPeter Zijlstra */ 62001768b42SPeter Zijlstra static __always_inline int __sched 62101768b42SPeter Zijlstra __mutex_lock_common(struct mutex *lock, long state, unsigned int subclass, 62201768b42SPeter Zijlstra struct lockdep_map *nest_lock, unsigned long ip, 62301768b42SPeter Zijlstra struct ww_acquire_ctx *ww_ctx, const bool use_ww_ctx) 62401768b42SPeter Zijlstra { 62501768b42SPeter Zijlstra struct task_struct *task = current; 62601768b42SPeter Zijlstra struct mutex_waiter waiter; 62701768b42SPeter Zijlstra unsigned long flags; 6289d659ae1SPeter Zijlstra bool first = false; 629a40ca565SWaiman Long struct ww_mutex *ww; 63001768b42SPeter Zijlstra int ret; 63101768b42SPeter Zijlstra 6320422e83dSChris Wilson if (use_ww_ctx) { 633a40ca565SWaiman Long ww = container_of(lock, struct ww_mutex, base); 6340422e83dSChris Wilson if (unlikely(ww_ctx == READ_ONCE(ww->ctx))) 6350422e83dSChris Wilson return -EALREADY; 6360422e83dSChris Wilson } 6370422e83dSChris Wilson 63801768b42SPeter Zijlstra preempt_disable(); 63901768b42SPeter Zijlstra mutex_acquire_nest(&lock->dep_map, subclass, 0, nest_lock, ip); 64001768b42SPeter Zijlstra 6419d659ae1SPeter Zijlstra if (__mutex_trylock(lock, false) || 642b341afb3SWaiman Long mutex_optimistic_spin(lock, ww_ctx, use_ww_ctx, false)) { 64376916515SDavidlohr Bueso /* got the lock, yay! */ 6443ca0ff57SPeter Zijlstra lock_acquired(&lock->dep_map, ip); 645a40ca565SWaiman Long if (use_ww_ctx) 6463ca0ff57SPeter Zijlstra ww_mutex_set_context_fastpath(ww, ww_ctx); 64701768b42SPeter Zijlstra preempt_enable(); 64801768b42SPeter Zijlstra return 0; 64901768b42SPeter Zijlstra } 65001768b42SPeter Zijlstra 65101768b42SPeter Zijlstra spin_lock_mutex(&lock->wait_lock, flags); 6521e820c96SJason Low /* 6533ca0ff57SPeter Zijlstra * After waiting to acquire the wait_lock, try again. 6541e820c96SJason Low */ 6559d659ae1SPeter Zijlstra if (__mutex_trylock(lock, false)) 65601768b42SPeter Zijlstra goto skip_wait; 65701768b42SPeter Zijlstra 65801768b42SPeter Zijlstra debug_mutex_lock_common(lock, &waiter); 6596720a305SLinus Torvalds debug_mutex_add_waiter(lock, &waiter, task); 66001768b42SPeter Zijlstra 66101768b42SPeter Zijlstra /* add waiting tasks to the end of the waitqueue (FIFO): */ 66201768b42SPeter Zijlstra list_add_tail(&waiter.list, &lock->wait_list); 66301768b42SPeter Zijlstra waiter.task = task; 66401768b42SPeter Zijlstra 6659d659ae1SPeter Zijlstra if (__mutex_waiter_is_first(lock, &waiter)) 6663ca0ff57SPeter Zijlstra __mutex_set_flag(lock, MUTEX_FLAG_WAITERS); 6673ca0ff57SPeter Zijlstra 66801768b42SPeter Zijlstra lock_contended(&lock->dep_map, ip); 66901768b42SPeter Zijlstra 6705bbd7e64SPeter Zijlstra set_task_state(task, state); 67101768b42SPeter Zijlstra for (;;) { 6725bbd7e64SPeter Zijlstra /* 6735bbd7e64SPeter Zijlstra * Once we hold wait_lock, we're serialized against 6745bbd7e64SPeter Zijlstra * mutex_unlock() handing the lock off to us, do a trylock 6755bbd7e64SPeter Zijlstra * before testing the error conditions to make sure we pick up 6765bbd7e64SPeter Zijlstra * the handoff. 6775bbd7e64SPeter Zijlstra */ 6789d659ae1SPeter Zijlstra if (__mutex_trylock(lock, first)) 6795bbd7e64SPeter Zijlstra goto acquired; 68001768b42SPeter Zijlstra 68101768b42SPeter Zijlstra /* 6825bbd7e64SPeter Zijlstra * Check for signals and wound conditions while holding 6835bbd7e64SPeter Zijlstra * wait_lock. This ensures the lock cancellation is ordered 6845bbd7e64SPeter Zijlstra * against mutex_unlock() and wake-ups do not go missing. 68501768b42SPeter Zijlstra */ 68601768b42SPeter Zijlstra if (unlikely(signal_pending_state(state, task))) { 68701768b42SPeter Zijlstra ret = -EINTR; 68801768b42SPeter Zijlstra goto err; 68901768b42SPeter Zijlstra } 69001768b42SPeter Zijlstra 69101768b42SPeter Zijlstra if (use_ww_ctx && ww_ctx->acquired > 0) { 69263dc47e9SDavidlohr Bueso ret = __ww_mutex_lock_check_stamp(lock, ww_ctx); 69301768b42SPeter Zijlstra if (ret) 69401768b42SPeter Zijlstra goto err; 69501768b42SPeter Zijlstra } 69601768b42SPeter Zijlstra 69701768b42SPeter Zijlstra spin_unlock_mutex(&lock->wait_lock, flags); 69801768b42SPeter Zijlstra schedule_preempt_disabled(); 6999d659ae1SPeter Zijlstra 7009d659ae1SPeter Zijlstra if (!first && __mutex_waiter_is_first(lock, &waiter)) { 7019d659ae1SPeter Zijlstra first = true; 7029d659ae1SPeter Zijlstra __mutex_set_flag(lock, MUTEX_FLAG_HANDOFF); 7039d659ae1SPeter Zijlstra } 7045bbd7e64SPeter Zijlstra 7055bbd7e64SPeter Zijlstra set_task_state(task, state); 7065bbd7e64SPeter Zijlstra /* 7075bbd7e64SPeter Zijlstra * Here we order against unlock; we must either see it change 7085bbd7e64SPeter Zijlstra * state back to RUNNING and fall through the next schedule(), 7095bbd7e64SPeter Zijlstra * or we must see its unlock and acquire. 7105bbd7e64SPeter Zijlstra */ 711b341afb3SWaiman Long if ((first && mutex_optimistic_spin(lock, ww_ctx, use_ww_ctx, true)) || 712b341afb3SWaiman Long __mutex_trylock(lock, first)) 7135bbd7e64SPeter Zijlstra break; 7145bbd7e64SPeter Zijlstra 7155bbd7e64SPeter Zijlstra spin_lock_mutex(&lock->wait_lock, flags); 71601768b42SPeter Zijlstra } 7175bbd7e64SPeter Zijlstra spin_lock_mutex(&lock->wait_lock, flags); 7185bbd7e64SPeter Zijlstra acquired: 71951587bcfSDavidlohr Bueso __set_task_state(task, TASK_RUNNING); 72051587bcfSDavidlohr Bueso 7216720a305SLinus Torvalds mutex_remove_waiter(lock, &waiter, task); 72201768b42SPeter Zijlstra if (likely(list_empty(&lock->wait_list))) 7239d659ae1SPeter Zijlstra __mutex_clear_flag(lock, MUTEX_FLAGS); 7243ca0ff57SPeter Zijlstra 72501768b42SPeter Zijlstra debug_mutex_free_waiter(&waiter); 72601768b42SPeter Zijlstra 72701768b42SPeter Zijlstra skip_wait: 72801768b42SPeter Zijlstra /* got the lock - cleanup and rejoice! */ 72901768b42SPeter Zijlstra lock_acquired(&lock->dep_map, ip); 73001768b42SPeter Zijlstra 731a40ca565SWaiman Long if (use_ww_ctx) 7324bd19084SDavidlohr Bueso ww_mutex_set_context_slowpath(ww, ww_ctx); 73301768b42SPeter Zijlstra 73401768b42SPeter Zijlstra spin_unlock_mutex(&lock->wait_lock, flags); 73501768b42SPeter Zijlstra preempt_enable(); 73601768b42SPeter Zijlstra return 0; 73701768b42SPeter Zijlstra 73801768b42SPeter Zijlstra err: 7395bbd7e64SPeter Zijlstra __set_task_state(task, TASK_RUNNING); 7406720a305SLinus Torvalds mutex_remove_waiter(lock, &waiter, task); 74101768b42SPeter Zijlstra spin_unlock_mutex(&lock->wait_lock, flags); 74201768b42SPeter Zijlstra debug_mutex_free_waiter(&waiter); 74301768b42SPeter Zijlstra mutex_release(&lock->dep_map, 1, ip); 74401768b42SPeter Zijlstra preempt_enable(); 74501768b42SPeter Zijlstra return ret; 74601768b42SPeter Zijlstra } 74701768b42SPeter Zijlstra 74801768b42SPeter Zijlstra #ifdef CONFIG_DEBUG_LOCK_ALLOC 74901768b42SPeter Zijlstra void __sched 75001768b42SPeter Zijlstra mutex_lock_nested(struct mutex *lock, unsigned int subclass) 75101768b42SPeter Zijlstra { 75201768b42SPeter Zijlstra might_sleep(); 75301768b42SPeter Zijlstra __mutex_lock_common(lock, TASK_UNINTERRUPTIBLE, 75401768b42SPeter Zijlstra subclass, NULL, _RET_IP_, NULL, 0); 75501768b42SPeter Zijlstra } 75601768b42SPeter Zijlstra 75701768b42SPeter Zijlstra EXPORT_SYMBOL_GPL(mutex_lock_nested); 75801768b42SPeter Zijlstra 75901768b42SPeter Zijlstra void __sched 76001768b42SPeter Zijlstra _mutex_lock_nest_lock(struct mutex *lock, struct lockdep_map *nest) 76101768b42SPeter Zijlstra { 76201768b42SPeter Zijlstra might_sleep(); 76301768b42SPeter Zijlstra __mutex_lock_common(lock, TASK_UNINTERRUPTIBLE, 76401768b42SPeter Zijlstra 0, nest, _RET_IP_, NULL, 0); 76501768b42SPeter Zijlstra } 76601768b42SPeter Zijlstra EXPORT_SYMBOL_GPL(_mutex_lock_nest_lock); 76701768b42SPeter Zijlstra 76801768b42SPeter Zijlstra int __sched 76901768b42SPeter Zijlstra mutex_lock_killable_nested(struct mutex *lock, unsigned int subclass) 77001768b42SPeter Zijlstra { 77101768b42SPeter Zijlstra might_sleep(); 77201768b42SPeter Zijlstra return __mutex_lock_common(lock, TASK_KILLABLE, 77301768b42SPeter Zijlstra subclass, NULL, _RET_IP_, NULL, 0); 77401768b42SPeter Zijlstra } 77501768b42SPeter Zijlstra EXPORT_SYMBOL_GPL(mutex_lock_killable_nested); 77601768b42SPeter Zijlstra 77701768b42SPeter Zijlstra int __sched 77801768b42SPeter Zijlstra mutex_lock_interruptible_nested(struct mutex *lock, unsigned int subclass) 77901768b42SPeter Zijlstra { 78001768b42SPeter Zijlstra might_sleep(); 78101768b42SPeter Zijlstra return __mutex_lock_common(lock, TASK_INTERRUPTIBLE, 78201768b42SPeter Zijlstra subclass, NULL, _RET_IP_, NULL, 0); 78301768b42SPeter Zijlstra } 78401768b42SPeter Zijlstra EXPORT_SYMBOL_GPL(mutex_lock_interruptible_nested); 78501768b42SPeter Zijlstra 786*1460cb65STejun Heo void __sched 787*1460cb65STejun Heo mutex_lock_io_nested(struct mutex *lock, unsigned int subclass) 788*1460cb65STejun Heo { 789*1460cb65STejun Heo int token; 790*1460cb65STejun Heo 791*1460cb65STejun Heo might_sleep(); 792*1460cb65STejun Heo 793*1460cb65STejun Heo token = io_schedule_prepare(); 794*1460cb65STejun Heo __mutex_lock_common(lock, TASK_UNINTERRUPTIBLE, 795*1460cb65STejun Heo subclass, NULL, _RET_IP_, NULL, 0); 796*1460cb65STejun Heo io_schedule_finish(token); 797*1460cb65STejun Heo } 798*1460cb65STejun Heo EXPORT_SYMBOL_GPL(mutex_lock_io_nested); 799*1460cb65STejun Heo 80001768b42SPeter Zijlstra static inline int 80101768b42SPeter Zijlstra ww_mutex_deadlock_injection(struct ww_mutex *lock, struct ww_acquire_ctx *ctx) 80201768b42SPeter Zijlstra { 80301768b42SPeter Zijlstra #ifdef CONFIG_DEBUG_WW_MUTEX_SLOWPATH 80401768b42SPeter Zijlstra unsigned tmp; 80501768b42SPeter Zijlstra 80601768b42SPeter Zijlstra if (ctx->deadlock_inject_countdown-- == 0) { 80701768b42SPeter Zijlstra tmp = ctx->deadlock_inject_interval; 80801768b42SPeter Zijlstra if (tmp > UINT_MAX/4) 80901768b42SPeter Zijlstra tmp = UINT_MAX; 81001768b42SPeter Zijlstra else 81101768b42SPeter Zijlstra tmp = tmp*2 + tmp + tmp/2; 81201768b42SPeter Zijlstra 81301768b42SPeter Zijlstra ctx->deadlock_inject_interval = tmp; 81401768b42SPeter Zijlstra ctx->deadlock_inject_countdown = tmp; 81501768b42SPeter Zijlstra ctx->contending_lock = lock; 81601768b42SPeter Zijlstra 81701768b42SPeter Zijlstra ww_mutex_unlock(lock); 81801768b42SPeter Zijlstra 81901768b42SPeter Zijlstra return -EDEADLK; 82001768b42SPeter Zijlstra } 82101768b42SPeter Zijlstra #endif 82201768b42SPeter Zijlstra 82301768b42SPeter Zijlstra return 0; 82401768b42SPeter Zijlstra } 82501768b42SPeter Zijlstra 82601768b42SPeter Zijlstra int __sched 82701768b42SPeter Zijlstra __ww_mutex_lock(struct ww_mutex *lock, struct ww_acquire_ctx *ctx) 82801768b42SPeter Zijlstra { 82901768b42SPeter Zijlstra int ret; 83001768b42SPeter Zijlstra 83101768b42SPeter Zijlstra might_sleep(); 83201768b42SPeter Zijlstra ret = __mutex_lock_common(&lock->base, TASK_UNINTERRUPTIBLE, 83301768b42SPeter Zijlstra 0, &ctx->dep_map, _RET_IP_, ctx, 1); 83401768b42SPeter Zijlstra if (!ret && ctx->acquired > 1) 83501768b42SPeter Zijlstra return ww_mutex_deadlock_injection(lock, ctx); 83601768b42SPeter Zijlstra 83701768b42SPeter Zijlstra return ret; 83801768b42SPeter Zijlstra } 83901768b42SPeter Zijlstra EXPORT_SYMBOL_GPL(__ww_mutex_lock); 84001768b42SPeter Zijlstra 84101768b42SPeter Zijlstra int __sched 84201768b42SPeter Zijlstra __ww_mutex_lock_interruptible(struct ww_mutex *lock, struct ww_acquire_ctx *ctx) 84301768b42SPeter Zijlstra { 84401768b42SPeter Zijlstra int ret; 84501768b42SPeter Zijlstra 84601768b42SPeter Zijlstra might_sleep(); 84701768b42SPeter Zijlstra ret = __mutex_lock_common(&lock->base, TASK_INTERRUPTIBLE, 84801768b42SPeter Zijlstra 0, &ctx->dep_map, _RET_IP_, ctx, 1); 84901768b42SPeter Zijlstra 85001768b42SPeter Zijlstra if (!ret && ctx->acquired > 1) 85101768b42SPeter Zijlstra return ww_mutex_deadlock_injection(lock, ctx); 85201768b42SPeter Zijlstra 85301768b42SPeter Zijlstra return ret; 85401768b42SPeter Zijlstra } 85501768b42SPeter Zijlstra EXPORT_SYMBOL_GPL(__ww_mutex_lock_interruptible); 85601768b42SPeter Zijlstra 85701768b42SPeter Zijlstra #endif 85801768b42SPeter Zijlstra 85901768b42SPeter Zijlstra /* 86001768b42SPeter Zijlstra * Release the lock, slowpath: 86101768b42SPeter Zijlstra */ 8623ca0ff57SPeter Zijlstra static noinline void __sched __mutex_unlock_slowpath(struct mutex *lock, unsigned long ip) 86301768b42SPeter Zijlstra { 8649d659ae1SPeter Zijlstra struct task_struct *next = NULL; 8653ca0ff57SPeter Zijlstra unsigned long owner, flags; 866194a6b5bSWaiman Long DEFINE_WAKE_Q(wake_q); 86701768b42SPeter Zijlstra 8683ca0ff57SPeter Zijlstra mutex_release(&lock->dep_map, 1, ip); 8693ca0ff57SPeter Zijlstra 87001768b42SPeter Zijlstra /* 8719d659ae1SPeter Zijlstra * Release the lock before (potentially) taking the spinlock such that 8729d659ae1SPeter Zijlstra * other contenders can get on with things ASAP. 8739d659ae1SPeter Zijlstra * 8749d659ae1SPeter Zijlstra * Except when HANDOFF, in that case we must not clear the owner field, 8759d659ae1SPeter Zijlstra * but instead set it to the top waiter. 87601768b42SPeter Zijlstra */ 8779d659ae1SPeter Zijlstra owner = atomic_long_read(&lock->owner); 8789d659ae1SPeter Zijlstra for (;;) { 8799d659ae1SPeter Zijlstra unsigned long old; 8809d659ae1SPeter Zijlstra 8819d659ae1SPeter Zijlstra #ifdef CONFIG_DEBUG_MUTEXES 8829d659ae1SPeter Zijlstra DEBUG_LOCKS_WARN_ON(__owner_task(owner) != current); 8839d659ae1SPeter Zijlstra #endif 8849d659ae1SPeter Zijlstra 8859d659ae1SPeter Zijlstra if (owner & MUTEX_FLAG_HANDOFF) 8869d659ae1SPeter Zijlstra break; 8879d659ae1SPeter Zijlstra 8889d659ae1SPeter Zijlstra old = atomic_long_cmpxchg_release(&lock->owner, owner, 8899d659ae1SPeter Zijlstra __owner_flags(owner)); 8909d659ae1SPeter Zijlstra if (old == owner) { 8919d659ae1SPeter Zijlstra if (owner & MUTEX_FLAG_WAITERS) 8929d659ae1SPeter Zijlstra break; 8939d659ae1SPeter Zijlstra 8943ca0ff57SPeter Zijlstra return; 8959d659ae1SPeter Zijlstra } 8969d659ae1SPeter Zijlstra 8979d659ae1SPeter Zijlstra owner = old; 8989d659ae1SPeter Zijlstra } 89901768b42SPeter Zijlstra 9001d8fe7dcSJason Low spin_lock_mutex(&lock->wait_lock, flags); 9011d8fe7dcSJason Low debug_mutex_unlock(lock); 90201768b42SPeter Zijlstra if (!list_empty(&lock->wait_list)) { 90301768b42SPeter Zijlstra /* get the first entry from the wait-list: */ 90401768b42SPeter Zijlstra struct mutex_waiter *waiter = 9059d659ae1SPeter Zijlstra list_first_entry(&lock->wait_list, 90601768b42SPeter Zijlstra struct mutex_waiter, list); 90701768b42SPeter Zijlstra 9089d659ae1SPeter Zijlstra next = waiter->task; 9099d659ae1SPeter Zijlstra 91001768b42SPeter Zijlstra debug_mutex_wake_waiter(lock, waiter); 9119d659ae1SPeter Zijlstra wake_q_add(&wake_q, next); 91201768b42SPeter Zijlstra } 91301768b42SPeter Zijlstra 9149d659ae1SPeter Zijlstra if (owner & MUTEX_FLAG_HANDOFF) 9159d659ae1SPeter Zijlstra __mutex_handoff(lock, next); 9169d659ae1SPeter Zijlstra 91701768b42SPeter Zijlstra spin_unlock_mutex(&lock->wait_lock, flags); 9189d659ae1SPeter Zijlstra 9191329ce6fSDavidlohr Bueso wake_up_q(&wake_q); 92001768b42SPeter Zijlstra } 92101768b42SPeter Zijlstra 92201768b42SPeter Zijlstra #ifndef CONFIG_DEBUG_LOCK_ALLOC 92301768b42SPeter Zijlstra /* 92401768b42SPeter Zijlstra * Here come the less common (and hence less performance-critical) APIs: 92501768b42SPeter Zijlstra * mutex_lock_interruptible() and mutex_trylock(). 92601768b42SPeter Zijlstra */ 92701768b42SPeter Zijlstra static noinline int __sched 92801768b42SPeter Zijlstra __mutex_lock_killable_slowpath(struct mutex *lock); 92901768b42SPeter Zijlstra 93001768b42SPeter Zijlstra static noinline int __sched 93101768b42SPeter Zijlstra __mutex_lock_interruptible_slowpath(struct mutex *lock); 93201768b42SPeter Zijlstra 93301768b42SPeter Zijlstra /** 93401768b42SPeter Zijlstra * mutex_lock_interruptible - acquire the mutex, interruptible 93501768b42SPeter Zijlstra * @lock: the mutex to be acquired 93601768b42SPeter Zijlstra * 93701768b42SPeter Zijlstra * Lock the mutex like mutex_lock(), and return 0 if the mutex has 93801768b42SPeter Zijlstra * been acquired or sleep until the mutex becomes available. If a 93901768b42SPeter Zijlstra * signal arrives while waiting for the lock then this function 94001768b42SPeter Zijlstra * returns -EINTR. 94101768b42SPeter Zijlstra * 94201768b42SPeter Zijlstra * This function is similar to (but not equivalent to) down_interruptible(). 94301768b42SPeter Zijlstra */ 94401768b42SPeter Zijlstra int __sched mutex_lock_interruptible(struct mutex *lock) 94501768b42SPeter Zijlstra { 94601768b42SPeter Zijlstra might_sleep(); 9473ca0ff57SPeter Zijlstra 9483ca0ff57SPeter Zijlstra if (__mutex_trylock_fast(lock)) 94901768b42SPeter Zijlstra return 0; 9503ca0ff57SPeter Zijlstra 95101768b42SPeter Zijlstra return __mutex_lock_interruptible_slowpath(lock); 95201768b42SPeter Zijlstra } 95301768b42SPeter Zijlstra 95401768b42SPeter Zijlstra EXPORT_SYMBOL(mutex_lock_interruptible); 95501768b42SPeter Zijlstra 95601768b42SPeter Zijlstra int __sched mutex_lock_killable(struct mutex *lock) 95701768b42SPeter Zijlstra { 95801768b42SPeter Zijlstra might_sleep(); 9593ca0ff57SPeter Zijlstra 9603ca0ff57SPeter Zijlstra if (__mutex_trylock_fast(lock)) 96101768b42SPeter Zijlstra return 0; 9623ca0ff57SPeter Zijlstra 96301768b42SPeter Zijlstra return __mutex_lock_killable_slowpath(lock); 96401768b42SPeter Zijlstra } 96501768b42SPeter Zijlstra EXPORT_SYMBOL(mutex_lock_killable); 96601768b42SPeter Zijlstra 967*1460cb65STejun Heo void __sched mutex_lock_io(struct mutex *lock) 968*1460cb65STejun Heo { 969*1460cb65STejun Heo int token; 970*1460cb65STejun Heo 971*1460cb65STejun Heo token = io_schedule_prepare(); 972*1460cb65STejun Heo mutex_lock(lock); 973*1460cb65STejun Heo io_schedule_finish(token); 974*1460cb65STejun Heo } 975*1460cb65STejun Heo EXPORT_SYMBOL_GPL(mutex_lock_io); 976*1460cb65STejun Heo 9773ca0ff57SPeter Zijlstra static noinline void __sched 9783ca0ff57SPeter Zijlstra __mutex_lock_slowpath(struct mutex *lock) 97901768b42SPeter Zijlstra { 98001768b42SPeter Zijlstra __mutex_lock_common(lock, TASK_UNINTERRUPTIBLE, 0, 98101768b42SPeter Zijlstra NULL, _RET_IP_, NULL, 0); 98201768b42SPeter Zijlstra } 98301768b42SPeter Zijlstra 98401768b42SPeter Zijlstra static noinline int __sched 98501768b42SPeter Zijlstra __mutex_lock_killable_slowpath(struct mutex *lock) 98601768b42SPeter Zijlstra { 98701768b42SPeter Zijlstra return __mutex_lock_common(lock, TASK_KILLABLE, 0, 98801768b42SPeter Zijlstra NULL, _RET_IP_, NULL, 0); 98901768b42SPeter Zijlstra } 99001768b42SPeter Zijlstra 99101768b42SPeter Zijlstra static noinline int __sched 99201768b42SPeter Zijlstra __mutex_lock_interruptible_slowpath(struct mutex *lock) 99301768b42SPeter Zijlstra { 99401768b42SPeter Zijlstra return __mutex_lock_common(lock, TASK_INTERRUPTIBLE, 0, 99501768b42SPeter Zijlstra NULL, _RET_IP_, NULL, 0); 99601768b42SPeter Zijlstra } 99701768b42SPeter Zijlstra 99801768b42SPeter Zijlstra static noinline int __sched 99901768b42SPeter Zijlstra __ww_mutex_lock_slowpath(struct ww_mutex *lock, struct ww_acquire_ctx *ctx) 100001768b42SPeter Zijlstra { 100101768b42SPeter Zijlstra return __mutex_lock_common(&lock->base, TASK_UNINTERRUPTIBLE, 0, 100201768b42SPeter Zijlstra NULL, _RET_IP_, ctx, 1); 100301768b42SPeter Zijlstra } 100401768b42SPeter Zijlstra 100501768b42SPeter Zijlstra static noinline int __sched 100601768b42SPeter Zijlstra __ww_mutex_lock_interruptible_slowpath(struct ww_mutex *lock, 100701768b42SPeter Zijlstra struct ww_acquire_ctx *ctx) 100801768b42SPeter Zijlstra { 100901768b42SPeter Zijlstra return __mutex_lock_common(&lock->base, TASK_INTERRUPTIBLE, 0, 101001768b42SPeter Zijlstra NULL, _RET_IP_, ctx, 1); 101101768b42SPeter Zijlstra } 101201768b42SPeter Zijlstra 101301768b42SPeter Zijlstra #endif 101401768b42SPeter Zijlstra 101501768b42SPeter Zijlstra /** 101601768b42SPeter Zijlstra * mutex_trylock - try to acquire the mutex, without waiting 101701768b42SPeter Zijlstra * @lock: the mutex to be acquired 101801768b42SPeter Zijlstra * 101901768b42SPeter Zijlstra * Try to acquire the mutex atomically. Returns 1 if the mutex 102001768b42SPeter Zijlstra * has been acquired successfully, and 0 on contention. 102101768b42SPeter Zijlstra * 102201768b42SPeter Zijlstra * NOTE: this function follows the spin_trylock() convention, so 102301768b42SPeter Zijlstra * it is negated from the down_trylock() return values! Be careful 102401768b42SPeter Zijlstra * about this when converting semaphore users to mutexes. 102501768b42SPeter Zijlstra * 102601768b42SPeter Zijlstra * This function must not be used in interrupt context. The 102701768b42SPeter Zijlstra * mutex must be released by the same task that acquired it. 102801768b42SPeter Zijlstra */ 102901768b42SPeter Zijlstra int __sched mutex_trylock(struct mutex *lock) 103001768b42SPeter Zijlstra { 10319d659ae1SPeter Zijlstra bool locked = __mutex_trylock(lock, false); 103201768b42SPeter Zijlstra 10333ca0ff57SPeter Zijlstra if (locked) 10343ca0ff57SPeter Zijlstra mutex_acquire(&lock->dep_map, 0, 1, _RET_IP_); 103501768b42SPeter Zijlstra 10363ca0ff57SPeter Zijlstra return locked; 103701768b42SPeter Zijlstra } 103801768b42SPeter Zijlstra EXPORT_SYMBOL(mutex_trylock); 103901768b42SPeter Zijlstra 104001768b42SPeter Zijlstra #ifndef CONFIG_DEBUG_LOCK_ALLOC 104101768b42SPeter Zijlstra int __sched 104201768b42SPeter Zijlstra __ww_mutex_lock(struct ww_mutex *lock, struct ww_acquire_ctx *ctx) 104301768b42SPeter Zijlstra { 104401768b42SPeter Zijlstra might_sleep(); 104501768b42SPeter Zijlstra 10463ca0ff57SPeter Zijlstra if (__mutex_trylock_fast(&lock->base)) { 104701768b42SPeter Zijlstra ww_mutex_set_context_fastpath(lock, ctx); 10483ca0ff57SPeter Zijlstra return 0; 10493ca0ff57SPeter Zijlstra } 10503ca0ff57SPeter Zijlstra 10513ca0ff57SPeter Zijlstra return __ww_mutex_lock_slowpath(lock, ctx); 105201768b42SPeter Zijlstra } 105301768b42SPeter Zijlstra EXPORT_SYMBOL(__ww_mutex_lock); 105401768b42SPeter Zijlstra 105501768b42SPeter Zijlstra int __sched 105601768b42SPeter Zijlstra __ww_mutex_lock_interruptible(struct ww_mutex *lock, struct ww_acquire_ctx *ctx) 105701768b42SPeter Zijlstra { 105801768b42SPeter Zijlstra might_sleep(); 105901768b42SPeter Zijlstra 10603ca0ff57SPeter Zijlstra if (__mutex_trylock_fast(&lock->base)) { 106101768b42SPeter Zijlstra ww_mutex_set_context_fastpath(lock, ctx); 10623ca0ff57SPeter Zijlstra return 0; 10633ca0ff57SPeter Zijlstra } 10643ca0ff57SPeter Zijlstra 10653ca0ff57SPeter Zijlstra return __ww_mutex_lock_interruptible_slowpath(lock, ctx); 106601768b42SPeter Zijlstra } 106701768b42SPeter Zijlstra EXPORT_SYMBOL(__ww_mutex_lock_interruptible); 106801768b42SPeter Zijlstra 106901768b42SPeter Zijlstra #endif 107001768b42SPeter Zijlstra 107101768b42SPeter Zijlstra /** 107201768b42SPeter Zijlstra * atomic_dec_and_mutex_lock - return holding mutex if we dec to 0 107301768b42SPeter Zijlstra * @cnt: the atomic which we are to dec 107401768b42SPeter Zijlstra * @lock: the mutex to return holding if we dec to 0 107501768b42SPeter Zijlstra * 107601768b42SPeter Zijlstra * return true and hold lock if we dec to 0, return false otherwise 107701768b42SPeter Zijlstra */ 107801768b42SPeter Zijlstra int atomic_dec_and_mutex_lock(atomic_t *cnt, struct mutex *lock) 107901768b42SPeter Zijlstra { 108001768b42SPeter Zijlstra /* dec if we can't possibly hit 0 */ 108101768b42SPeter Zijlstra if (atomic_add_unless(cnt, -1, 1)) 108201768b42SPeter Zijlstra return 0; 108301768b42SPeter Zijlstra /* we might hit 0, so take the lock */ 108401768b42SPeter Zijlstra mutex_lock(lock); 108501768b42SPeter Zijlstra if (!atomic_dec_and_test(cnt)) { 108601768b42SPeter Zijlstra /* when we actually did the dec, we didn't hit 0 */ 108701768b42SPeter Zijlstra mutex_unlock(lock); 108801768b42SPeter Zijlstra return 0; 108901768b42SPeter Zijlstra } 109001768b42SPeter Zijlstra /* we hit 0, and we hold the lock */ 109101768b42SPeter Zijlstra return 1; 109201768b42SPeter Zijlstra } 109301768b42SPeter Zijlstra EXPORT_SYMBOL(atomic_dec_and_mutex_lock); 1094