101768b42SPeter Zijlstra /* 267a6de49SPeter Zijlstra * kernel/locking/mutex.c 301768b42SPeter Zijlstra * 401768b42SPeter Zijlstra * Mutexes: blocking mutual exclusion locks 501768b42SPeter Zijlstra * 601768b42SPeter Zijlstra * Started by Ingo Molnar: 701768b42SPeter Zijlstra * 801768b42SPeter Zijlstra * Copyright (C) 2004, 2005, 2006 Red Hat, Inc., Ingo Molnar <mingo@redhat.com> 901768b42SPeter Zijlstra * 1001768b42SPeter Zijlstra * Many thanks to Arjan van de Ven, Thomas Gleixner, Steven Rostedt and 1101768b42SPeter Zijlstra * David Howells for suggestions and improvements. 1201768b42SPeter Zijlstra * 1301768b42SPeter Zijlstra * - Adaptive spinning for mutexes by Peter Zijlstra. (Ported to mainline 1401768b42SPeter Zijlstra * from the -rt tree, where it was originally implemented for rtmutexes 1501768b42SPeter Zijlstra * by Steven Rostedt, based on work by Gregory Haskins, Peter Morreale 1601768b42SPeter Zijlstra * and Sven Dietrich. 1701768b42SPeter Zijlstra * 18214e0aedSDavidlohr Bueso * Also see Documentation/locking/mutex-design.txt. 1901768b42SPeter Zijlstra */ 2001768b42SPeter Zijlstra #include <linux/mutex.h> 2101768b42SPeter Zijlstra #include <linux/ww_mutex.h> 2201768b42SPeter Zijlstra #include <linux/sched.h> 2301768b42SPeter Zijlstra #include <linux/sched/rt.h> 2401768b42SPeter Zijlstra #include <linux/export.h> 2501768b42SPeter Zijlstra #include <linux/spinlock.h> 2601768b42SPeter Zijlstra #include <linux/interrupt.h> 2701768b42SPeter Zijlstra #include <linux/debug_locks.h> 287a215f89SDavidlohr Bueso #include <linux/osq_lock.h> 2901768b42SPeter Zijlstra 3001768b42SPeter Zijlstra #ifdef CONFIG_DEBUG_MUTEXES 3101768b42SPeter Zijlstra # include "mutex-debug.h" 3201768b42SPeter Zijlstra #else 3301768b42SPeter Zijlstra # include "mutex.h" 3401768b42SPeter Zijlstra #endif 3501768b42SPeter Zijlstra 3601768b42SPeter Zijlstra void 3701768b42SPeter Zijlstra __mutex_init(struct mutex *lock, const char *name, struct lock_class_key *key) 3801768b42SPeter Zijlstra { 393ca0ff57SPeter Zijlstra atomic_long_set(&lock->owner, 0); 4001768b42SPeter Zijlstra spin_lock_init(&lock->wait_lock); 4101768b42SPeter Zijlstra INIT_LIST_HEAD(&lock->wait_list); 4201768b42SPeter Zijlstra #ifdef CONFIG_MUTEX_SPIN_ON_OWNER 434d9d951eSJason Low osq_lock_init(&lock->osq); 4401768b42SPeter Zijlstra #endif 4501768b42SPeter Zijlstra 4601768b42SPeter Zijlstra debug_mutex_init(lock, name, key); 4701768b42SPeter Zijlstra } 4801768b42SPeter Zijlstra EXPORT_SYMBOL(__mutex_init); 4901768b42SPeter Zijlstra 503ca0ff57SPeter Zijlstra /* 513ca0ff57SPeter Zijlstra * @owner: contains: 'struct task_struct *' to the current lock owner, 523ca0ff57SPeter Zijlstra * NULL means not owned. Since task_struct pointers are aligned at 53*e274795eSPeter Zijlstra * at least L1_CACHE_BYTES, we have low bits to store extra state. 543ca0ff57SPeter Zijlstra * 553ca0ff57SPeter Zijlstra * Bit0 indicates a non-empty waiter list; unlock must issue a wakeup. 569d659ae1SPeter Zijlstra * Bit1 indicates unlock needs to hand the lock to the top-waiter 57*e274795eSPeter Zijlstra * Bit2 indicates handoff has been done and we're waiting for pickup. 583ca0ff57SPeter Zijlstra */ 593ca0ff57SPeter Zijlstra #define MUTEX_FLAG_WAITERS 0x01 609d659ae1SPeter Zijlstra #define MUTEX_FLAG_HANDOFF 0x02 61*e274795eSPeter Zijlstra #define MUTEX_FLAG_PICKUP 0x04 623ca0ff57SPeter Zijlstra 63*e274795eSPeter Zijlstra #define MUTEX_FLAGS 0x07 643ca0ff57SPeter Zijlstra 653ca0ff57SPeter Zijlstra static inline struct task_struct *__owner_task(unsigned long owner) 663ca0ff57SPeter Zijlstra { 673ca0ff57SPeter Zijlstra return (struct task_struct *)(owner & ~MUTEX_FLAGS); 683ca0ff57SPeter Zijlstra } 693ca0ff57SPeter Zijlstra 703ca0ff57SPeter Zijlstra static inline unsigned long __owner_flags(unsigned long owner) 713ca0ff57SPeter Zijlstra { 723ca0ff57SPeter Zijlstra return owner & MUTEX_FLAGS; 733ca0ff57SPeter Zijlstra } 743ca0ff57SPeter Zijlstra 753ca0ff57SPeter Zijlstra /* 76*e274795eSPeter Zijlstra * Trylock variant that retuns the owning task on failure. 773ca0ff57SPeter Zijlstra */ 78*e274795eSPeter Zijlstra static inline struct task_struct *__mutex_trylock_or_owner(struct mutex *lock) 793ca0ff57SPeter Zijlstra { 803ca0ff57SPeter Zijlstra unsigned long owner, curr = (unsigned long)current; 813ca0ff57SPeter Zijlstra 823ca0ff57SPeter Zijlstra owner = atomic_long_read(&lock->owner); 833ca0ff57SPeter Zijlstra for (;;) { /* must loop, can race against a flag */ 849d659ae1SPeter Zijlstra unsigned long old, flags = __owner_flags(owner); 85*e274795eSPeter Zijlstra unsigned long task = owner & ~MUTEX_FLAGS; 863ca0ff57SPeter Zijlstra 87*e274795eSPeter Zijlstra if (task) { 88*e274795eSPeter Zijlstra if (likely(task != curr)) 89*e274795eSPeter Zijlstra break; 909d659ae1SPeter Zijlstra 91*e274795eSPeter Zijlstra if (likely(!(flags & MUTEX_FLAG_PICKUP))) 92*e274795eSPeter Zijlstra break; 93*e274795eSPeter Zijlstra 94*e274795eSPeter Zijlstra flags &= ~MUTEX_FLAG_PICKUP; 95*e274795eSPeter Zijlstra } else { 96*e274795eSPeter Zijlstra #ifdef CONFIG_DEBUG_MUTEXES 97*e274795eSPeter Zijlstra DEBUG_LOCKS_WARN_ON(flags & MUTEX_FLAG_PICKUP); 98*e274795eSPeter Zijlstra #endif 999d659ae1SPeter Zijlstra } 1003ca0ff57SPeter Zijlstra 1019d659ae1SPeter Zijlstra /* 1029d659ae1SPeter Zijlstra * We set the HANDOFF bit, we must make sure it doesn't live 1039d659ae1SPeter Zijlstra * past the point where we acquire it. This would be possible 1049d659ae1SPeter Zijlstra * if we (accidentally) set the bit on an unlocked mutex. 1059d659ae1SPeter Zijlstra */ 1069d659ae1SPeter Zijlstra flags &= ~MUTEX_FLAG_HANDOFF; 1079d659ae1SPeter Zijlstra 1089d659ae1SPeter Zijlstra old = atomic_long_cmpxchg_acquire(&lock->owner, owner, curr | flags); 1093ca0ff57SPeter Zijlstra if (old == owner) 110*e274795eSPeter Zijlstra return NULL; 1113ca0ff57SPeter Zijlstra 1123ca0ff57SPeter Zijlstra owner = old; 1133ca0ff57SPeter Zijlstra } 114*e274795eSPeter Zijlstra 115*e274795eSPeter Zijlstra return __owner_task(owner); 116*e274795eSPeter Zijlstra } 117*e274795eSPeter Zijlstra 118*e274795eSPeter Zijlstra /* 119*e274795eSPeter Zijlstra * Actual trylock that will work on any unlocked state. 120*e274795eSPeter Zijlstra */ 121*e274795eSPeter Zijlstra static inline bool __mutex_trylock(struct mutex *lock) 122*e274795eSPeter Zijlstra { 123*e274795eSPeter Zijlstra return !__mutex_trylock_or_owner(lock); 1243ca0ff57SPeter Zijlstra } 1253ca0ff57SPeter Zijlstra 1263ca0ff57SPeter Zijlstra #ifndef CONFIG_DEBUG_LOCK_ALLOC 1273ca0ff57SPeter Zijlstra /* 1283ca0ff57SPeter Zijlstra * Lockdep annotations are contained to the slow paths for simplicity. 1293ca0ff57SPeter Zijlstra * There is nothing that would stop spreading the lockdep annotations outwards 1303ca0ff57SPeter Zijlstra * except more code. 1313ca0ff57SPeter Zijlstra */ 1323ca0ff57SPeter Zijlstra 1333ca0ff57SPeter Zijlstra /* 1343ca0ff57SPeter Zijlstra * Optimistic trylock that only works in the uncontended case. Make sure to 1353ca0ff57SPeter Zijlstra * follow with a __mutex_trylock() before failing. 1363ca0ff57SPeter Zijlstra */ 1373ca0ff57SPeter Zijlstra static __always_inline bool __mutex_trylock_fast(struct mutex *lock) 1383ca0ff57SPeter Zijlstra { 1393ca0ff57SPeter Zijlstra unsigned long curr = (unsigned long)current; 1403ca0ff57SPeter Zijlstra 1413ca0ff57SPeter Zijlstra if (!atomic_long_cmpxchg_acquire(&lock->owner, 0UL, curr)) 1423ca0ff57SPeter Zijlstra return true; 1433ca0ff57SPeter Zijlstra 1443ca0ff57SPeter Zijlstra return false; 1453ca0ff57SPeter Zijlstra } 1463ca0ff57SPeter Zijlstra 1473ca0ff57SPeter Zijlstra static __always_inline bool __mutex_unlock_fast(struct mutex *lock) 1483ca0ff57SPeter Zijlstra { 1493ca0ff57SPeter Zijlstra unsigned long curr = (unsigned long)current; 1503ca0ff57SPeter Zijlstra 1513ca0ff57SPeter Zijlstra if (atomic_long_cmpxchg_release(&lock->owner, curr, 0UL) == curr) 1523ca0ff57SPeter Zijlstra return true; 1533ca0ff57SPeter Zijlstra 1543ca0ff57SPeter Zijlstra return false; 1553ca0ff57SPeter Zijlstra } 1563ca0ff57SPeter Zijlstra #endif 1573ca0ff57SPeter Zijlstra 1583ca0ff57SPeter Zijlstra static inline void __mutex_set_flag(struct mutex *lock, unsigned long flag) 1593ca0ff57SPeter Zijlstra { 1603ca0ff57SPeter Zijlstra atomic_long_or(flag, &lock->owner); 1613ca0ff57SPeter Zijlstra } 1623ca0ff57SPeter Zijlstra 1633ca0ff57SPeter Zijlstra static inline void __mutex_clear_flag(struct mutex *lock, unsigned long flag) 1643ca0ff57SPeter Zijlstra { 1653ca0ff57SPeter Zijlstra atomic_long_andnot(flag, &lock->owner); 1663ca0ff57SPeter Zijlstra } 1673ca0ff57SPeter Zijlstra 1689d659ae1SPeter Zijlstra static inline bool __mutex_waiter_is_first(struct mutex *lock, struct mutex_waiter *waiter) 1699d659ae1SPeter Zijlstra { 1709d659ae1SPeter Zijlstra return list_first_entry(&lock->wait_list, struct mutex_waiter, list) == waiter; 1719d659ae1SPeter Zijlstra } 1729d659ae1SPeter Zijlstra 1739d659ae1SPeter Zijlstra /* 1749d659ae1SPeter Zijlstra * Give up ownership to a specific task, when @task = NULL, this is equivalent 175*e274795eSPeter Zijlstra * to a regular unlock. Sets PICKUP on a handoff, clears HANDOF, preserves 176*e274795eSPeter Zijlstra * WAITERS. Provides RELEASE semantics like a regular unlock, the 177*e274795eSPeter Zijlstra * __mutex_trylock() provides a matching ACQUIRE semantics for the handoff. 1789d659ae1SPeter Zijlstra */ 1799d659ae1SPeter Zijlstra static void __mutex_handoff(struct mutex *lock, struct task_struct *task) 1809d659ae1SPeter Zijlstra { 1819d659ae1SPeter Zijlstra unsigned long owner = atomic_long_read(&lock->owner); 1829d659ae1SPeter Zijlstra 1839d659ae1SPeter Zijlstra for (;;) { 1849d659ae1SPeter Zijlstra unsigned long old, new; 1859d659ae1SPeter Zijlstra 1869d659ae1SPeter Zijlstra #ifdef CONFIG_DEBUG_MUTEXES 1879d659ae1SPeter Zijlstra DEBUG_LOCKS_WARN_ON(__owner_task(owner) != current); 188*e274795eSPeter Zijlstra DEBUG_LOCKS_WARN_ON(owner & MUTEX_FLAG_PICKUP); 1899d659ae1SPeter Zijlstra #endif 1909d659ae1SPeter Zijlstra 1919d659ae1SPeter Zijlstra new = (owner & MUTEX_FLAG_WAITERS); 1929d659ae1SPeter Zijlstra new |= (unsigned long)task; 193*e274795eSPeter Zijlstra if (task) 194*e274795eSPeter Zijlstra new |= MUTEX_FLAG_PICKUP; 1959d659ae1SPeter Zijlstra 1969d659ae1SPeter Zijlstra old = atomic_long_cmpxchg_release(&lock->owner, owner, new); 1979d659ae1SPeter Zijlstra if (old == owner) 1989d659ae1SPeter Zijlstra break; 1999d659ae1SPeter Zijlstra 2009d659ae1SPeter Zijlstra owner = old; 2019d659ae1SPeter Zijlstra } 2029d659ae1SPeter Zijlstra } 2039d659ae1SPeter Zijlstra 20401768b42SPeter Zijlstra #ifndef CONFIG_DEBUG_LOCK_ALLOC 20501768b42SPeter Zijlstra /* 20601768b42SPeter Zijlstra * We split the mutex lock/unlock logic into separate fastpath and 20701768b42SPeter Zijlstra * slowpath functions, to reduce the register pressure on the fastpath. 20801768b42SPeter Zijlstra * We also put the fastpath first in the kernel image, to make sure the 20901768b42SPeter Zijlstra * branch is predicted by the CPU as default-untaken. 21001768b42SPeter Zijlstra */ 2113ca0ff57SPeter Zijlstra static void __sched __mutex_lock_slowpath(struct mutex *lock); 21201768b42SPeter Zijlstra 21301768b42SPeter Zijlstra /** 21401768b42SPeter Zijlstra * mutex_lock - acquire the mutex 21501768b42SPeter Zijlstra * @lock: the mutex to be acquired 21601768b42SPeter Zijlstra * 21701768b42SPeter Zijlstra * Lock the mutex exclusively for this task. If the mutex is not 21801768b42SPeter Zijlstra * available right now, it will sleep until it can get it. 21901768b42SPeter Zijlstra * 22001768b42SPeter Zijlstra * The mutex must later on be released by the same task that 22101768b42SPeter Zijlstra * acquired it. Recursive locking is not allowed. The task 22201768b42SPeter Zijlstra * may not exit without first unlocking the mutex. Also, kernel 223139b6fd2SSharon Dvir * memory where the mutex resides must not be freed with 22401768b42SPeter Zijlstra * the mutex still locked. The mutex must first be initialized 22501768b42SPeter Zijlstra * (or statically defined) before it can be locked. memset()-ing 22601768b42SPeter Zijlstra * the mutex to 0 is not allowed. 22701768b42SPeter Zijlstra * 22801768b42SPeter Zijlstra * ( The CONFIG_DEBUG_MUTEXES .config option turns on debugging 22901768b42SPeter Zijlstra * checks that will enforce the restrictions and will also do 23001768b42SPeter Zijlstra * deadlock debugging. ) 23101768b42SPeter Zijlstra * 23201768b42SPeter Zijlstra * This function is similar to (but not equivalent to) down(). 23301768b42SPeter Zijlstra */ 23401768b42SPeter Zijlstra void __sched mutex_lock(struct mutex *lock) 23501768b42SPeter Zijlstra { 23601768b42SPeter Zijlstra might_sleep(); 23701768b42SPeter Zijlstra 2383ca0ff57SPeter Zijlstra if (!__mutex_trylock_fast(lock)) 2393ca0ff57SPeter Zijlstra __mutex_lock_slowpath(lock); 2403ca0ff57SPeter Zijlstra } 24101768b42SPeter Zijlstra EXPORT_SYMBOL(mutex_lock); 24201768b42SPeter Zijlstra #endif 24301768b42SPeter Zijlstra 24476916515SDavidlohr Bueso static __always_inline void ww_mutex_lock_acquired(struct ww_mutex *ww, 24576916515SDavidlohr Bueso struct ww_acquire_ctx *ww_ctx) 24676916515SDavidlohr Bueso { 24776916515SDavidlohr Bueso #ifdef CONFIG_DEBUG_MUTEXES 24876916515SDavidlohr Bueso /* 24976916515SDavidlohr Bueso * If this WARN_ON triggers, you used ww_mutex_lock to acquire, 25076916515SDavidlohr Bueso * but released with a normal mutex_unlock in this call. 25176916515SDavidlohr Bueso * 25276916515SDavidlohr Bueso * This should never happen, always use ww_mutex_unlock. 25376916515SDavidlohr Bueso */ 25476916515SDavidlohr Bueso DEBUG_LOCKS_WARN_ON(ww->ctx); 25576916515SDavidlohr Bueso 25676916515SDavidlohr Bueso /* 25776916515SDavidlohr Bueso * Not quite done after calling ww_acquire_done() ? 25876916515SDavidlohr Bueso */ 25976916515SDavidlohr Bueso DEBUG_LOCKS_WARN_ON(ww_ctx->done_acquire); 26076916515SDavidlohr Bueso 26176916515SDavidlohr Bueso if (ww_ctx->contending_lock) { 26276916515SDavidlohr Bueso /* 26376916515SDavidlohr Bueso * After -EDEADLK you tried to 26476916515SDavidlohr Bueso * acquire a different ww_mutex? Bad! 26576916515SDavidlohr Bueso */ 26676916515SDavidlohr Bueso DEBUG_LOCKS_WARN_ON(ww_ctx->contending_lock != ww); 26776916515SDavidlohr Bueso 26876916515SDavidlohr Bueso /* 26976916515SDavidlohr Bueso * You called ww_mutex_lock after receiving -EDEADLK, 27076916515SDavidlohr Bueso * but 'forgot' to unlock everything else first? 27176916515SDavidlohr Bueso */ 27276916515SDavidlohr Bueso DEBUG_LOCKS_WARN_ON(ww_ctx->acquired > 0); 27376916515SDavidlohr Bueso ww_ctx->contending_lock = NULL; 27476916515SDavidlohr Bueso } 27576916515SDavidlohr Bueso 27676916515SDavidlohr Bueso /* 27776916515SDavidlohr Bueso * Naughty, using a different class will lead to undefined behavior! 27876916515SDavidlohr Bueso */ 27976916515SDavidlohr Bueso DEBUG_LOCKS_WARN_ON(ww_ctx->ww_class != ww->ww_class); 28076916515SDavidlohr Bueso #endif 28176916515SDavidlohr Bueso ww_ctx->acquired++; 28276916515SDavidlohr Bueso } 28376916515SDavidlohr Bueso 28476916515SDavidlohr Bueso /* 2854bd19084SDavidlohr Bueso * After acquiring lock with fastpath or when we lost out in contested 28676916515SDavidlohr Bueso * slowpath, set ctx and wake up any waiters so they can recheck. 28776916515SDavidlohr Bueso */ 28876916515SDavidlohr Bueso static __always_inline void 28976916515SDavidlohr Bueso ww_mutex_set_context_fastpath(struct ww_mutex *lock, 29076916515SDavidlohr Bueso struct ww_acquire_ctx *ctx) 29176916515SDavidlohr Bueso { 29276916515SDavidlohr Bueso unsigned long flags; 29376916515SDavidlohr Bueso struct mutex_waiter *cur; 29476916515SDavidlohr Bueso 29576916515SDavidlohr Bueso ww_mutex_lock_acquired(lock, ctx); 29676916515SDavidlohr Bueso 29776916515SDavidlohr Bueso lock->ctx = ctx; 29876916515SDavidlohr Bueso 29976916515SDavidlohr Bueso /* 30076916515SDavidlohr Bueso * The lock->ctx update should be visible on all cores before 30176916515SDavidlohr Bueso * the atomic read is done, otherwise contended waiters might be 30276916515SDavidlohr Bueso * missed. The contended waiters will either see ww_ctx == NULL 30376916515SDavidlohr Bueso * and keep spinning, or it will acquire wait_lock, add itself 30476916515SDavidlohr Bueso * to waiter list and sleep. 30576916515SDavidlohr Bueso */ 30676916515SDavidlohr Bueso smp_mb(); /* ^^^ */ 30776916515SDavidlohr Bueso 30876916515SDavidlohr Bueso /* 30976916515SDavidlohr Bueso * Check if lock is contended, if not there is nobody to wake up 31076916515SDavidlohr Bueso */ 3113ca0ff57SPeter Zijlstra if (likely(!(atomic_long_read(&lock->base.owner) & MUTEX_FLAG_WAITERS))) 31276916515SDavidlohr Bueso return; 31376916515SDavidlohr Bueso 31476916515SDavidlohr Bueso /* 31576916515SDavidlohr Bueso * Uh oh, we raced in fastpath, wake up everyone in this case, 31676916515SDavidlohr Bueso * so they can see the new lock->ctx. 31776916515SDavidlohr Bueso */ 31876916515SDavidlohr Bueso spin_lock_mutex(&lock->base.wait_lock, flags); 31976916515SDavidlohr Bueso list_for_each_entry(cur, &lock->base.wait_list, list) { 32076916515SDavidlohr Bueso debug_mutex_wake_waiter(&lock->base, cur); 32176916515SDavidlohr Bueso wake_up_process(cur->task); 32276916515SDavidlohr Bueso } 32376916515SDavidlohr Bueso spin_unlock_mutex(&lock->base.wait_lock, flags); 32476916515SDavidlohr Bueso } 32576916515SDavidlohr Bueso 3264bd19084SDavidlohr Bueso /* 3274bd19084SDavidlohr Bueso * After acquiring lock in the slowpath set ctx and wake up any 3284bd19084SDavidlohr Bueso * waiters so they can recheck. 3294bd19084SDavidlohr Bueso * 3304bd19084SDavidlohr Bueso * Callers must hold the mutex wait_lock. 3314bd19084SDavidlohr Bueso */ 3324bd19084SDavidlohr Bueso static __always_inline void 3334bd19084SDavidlohr Bueso ww_mutex_set_context_slowpath(struct ww_mutex *lock, 3344bd19084SDavidlohr Bueso struct ww_acquire_ctx *ctx) 3354bd19084SDavidlohr Bueso { 3364bd19084SDavidlohr Bueso struct mutex_waiter *cur; 3374bd19084SDavidlohr Bueso 3384bd19084SDavidlohr Bueso ww_mutex_lock_acquired(lock, ctx); 3394bd19084SDavidlohr Bueso lock->ctx = ctx; 3404bd19084SDavidlohr Bueso 3414bd19084SDavidlohr Bueso /* 3424bd19084SDavidlohr Bueso * Give any possible sleeping processes the chance to wake up, 3434bd19084SDavidlohr Bueso * so they can recheck if they have to back off. 3444bd19084SDavidlohr Bueso */ 3454bd19084SDavidlohr Bueso list_for_each_entry(cur, &lock->base.wait_list, list) { 3464bd19084SDavidlohr Bueso debug_mutex_wake_waiter(&lock->base, cur); 3474bd19084SDavidlohr Bueso wake_up_process(cur->task); 3484bd19084SDavidlohr Bueso } 3494bd19084SDavidlohr Bueso } 35076916515SDavidlohr Bueso 35101768b42SPeter Zijlstra #ifdef CONFIG_MUTEX_SPIN_ON_OWNER 35201768b42SPeter Zijlstra /* 35301768b42SPeter Zijlstra * Look out! "owner" is an entirely speculative pointer 35401768b42SPeter Zijlstra * access and not reliable. 35501768b42SPeter Zijlstra */ 35601768b42SPeter Zijlstra static noinline 357be1f7bf2SJason Low bool mutex_spin_on_owner(struct mutex *lock, struct task_struct *owner) 35801768b42SPeter Zijlstra { 35901ac33c1SJason Low bool ret = true; 360be1f7bf2SJason Low 36101768b42SPeter Zijlstra rcu_read_lock(); 3623ca0ff57SPeter Zijlstra while (__mutex_owner(lock) == owner) { 363be1f7bf2SJason Low /* 364be1f7bf2SJason Low * Ensure we emit the owner->on_cpu, dereference _after_ 36501ac33c1SJason Low * checking lock->owner still matches owner. If that fails, 36601ac33c1SJason Low * owner might point to freed memory. If it still matches, 367be1f7bf2SJason Low * the rcu_read_lock() ensures the memory stays valid. 368be1f7bf2SJason Low */ 369be1f7bf2SJason Low barrier(); 370be1f7bf2SJason Low 37105ffc951SPan Xinhui /* 37205ffc951SPan Xinhui * Use vcpu_is_preempted to detect lock holder preemption issue. 37305ffc951SPan Xinhui */ 37405ffc951SPan Xinhui if (!owner->on_cpu || need_resched() || 37505ffc951SPan Xinhui vcpu_is_preempted(task_cpu(owner))) { 376be1f7bf2SJason Low ret = false; 377be1f7bf2SJason Low break; 378be1f7bf2SJason Low } 37901768b42SPeter Zijlstra 380f2f09a4cSChristian Borntraeger cpu_relax(); 38101768b42SPeter Zijlstra } 38201768b42SPeter Zijlstra rcu_read_unlock(); 38301768b42SPeter Zijlstra 384be1f7bf2SJason Low return ret; 38501768b42SPeter Zijlstra } 38601768b42SPeter Zijlstra 38701768b42SPeter Zijlstra /* 38801768b42SPeter Zijlstra * Initial check for entering the mutex spinning loop 38901768b42SPeter Zijlstra */ 39001768b42SPeter Zijlstra static inline int mutex_can_spin_on_owner(struct mutex *lock) 39101768b42SPeter Zijlstra { 39201768b42SPeter Zijlstra struct task_struct *owner; 39301768b42SPeter Zijlstra int retval = 1; 39401768b42SPeter Zijlstra 39546af29e4SJason Low if (need_resched()) 39646af29e4SJason Low return 0; 39746af29e4SJason Low 39801768b42SPeter Zijlstra rcu_read_lock(); 3993ca0ff57SPeter Zijlstra owner = __mutex_owner(lock); 40005ffc951SPan Xinhui 40105ffc951SPan Xinhui /* 40205ffc951SPan Xinhui * As lock holder preemption issue, we both skip spinning if task is not 40305ffc951SPan Xinhui * on cpu or its cpu is preempted 40405ffc951SPan Xinhui */ 40501768b42SPeter Zijlstra if (owner) 40605ffc951SPan Xinhui retval = owner->on_cpu && !vcpu_is_preempted(task_cpu(owner)); 40701768b42SPeter Zijlstra rcu_read_unlock(); 40876916515SDavidlohr Bueso 40976916515SDavidlohr Bueso /* 4103ca0ff57SPeter Zijlstra * If lock->owner is not set, the mutex has been released. Return true 4113ca0ff57SPeter Zijlstra * such that we'll trylock in the spin path, which is a faster option 4123ca0ff57SPeter Zijlstra * than the blocking slow path. 41376916515SDavidlohr Bueso */ 4143ca0ff57SPeter Zijlstra return retval; 41576916515SDavidlohr Bueso } 41676916515SDavidlohr Bueso 41776916515SDavidlohr Bueso /* 41876916515SDavidlohr Bueso * Optimistic spinning. 41976916515SDavidlohr Bueso * 42076916515SDavidlohr Bueso * We try to spin for acquisition when we find that the lock owner 42176916515SDavidlohr Bueso * is currently running on a (different) CPU and while we don't 42276916515SDavidlohr Bueso * need to reschedule. The rationale is that if the lock owner is 42376916515SDavidlohr Bueso * running, it is likely to release the lock soon. 42476916515SDavidlohr Bueso * 42576916515SDavidlohr Bueso * The mutex spinners are queued up using MCS lock so that only one 42676916515SDavidlohr Bueso * spinner can compete for the mutex. However, if mutex spinning isn't 42776916515SDavidlohr Bueso * going to happen, there is no point in going through the lock/unlock 42876916515SDavidlohr Bueso * overhead. 42976916515SDavidlohr Bueso * 43076916515SDavidlohr Bueso * Returns true when the lock was taken, otherwise false, indicating 43176916515SDavidlohr Bueso * that we need to jump to the slowpath and sleep. 432b341afb3SWaiman Long * 433b341afb3SWaiman Long * The waiter flag is set to true if the spinner is a waiter in the wait 434b341afb3SWaiman Long * queue. The waiter-spinner will spin on the lock directly and concurrently 435b341afb3SWaiman Long * with the spinner at the head of the OSQ, if present, until the owner is 436b341afb3SWaiman Long * changed to itself. 43776916515SDavidlohr Bueso */ 43876916515SDavidlohr Bueso static bool mutex_optimistic_spin(struct mutex *lock, 439b341afb3SWaiman Long struct ww_acquire_ctx *ww_ctx, 440b341afb3SWaiman Long const bool use_ww_ctx, const bool waiter) 44176916515SDavidlohr Bueso { 442b341afb3SWaiman Long if (!waiter) { 443b341afb3SWaiman Long /* 444b341afb3SWaiman Long * The purpose of the mutex_can_spin_on_owner() function is 445b341afb3SWaiman Long * to eliminate the overhead of osq_lock() and osq_unlock() 446b341afb3SWaiman Long * in case spinning isn't possible. As a waiter-spinner 447b341afb3SWaiman Long * is not going to take OSQ lock anyway, there is no need 448b341afb3SWaiman Long * to call mutex_can_spin_on_owner(). 449b341afb3SWaiman Long */ 45076916515SDavidlohr Bueso if (!mutex_can_spin_on_owner(lock)) 451b341afb3SWaiman Long goto fail; 45276916515SDavidlohr Bueso 453e42f678aSDavidlohr Bueso /* 454e42f678aSDavidlohr Bueso * In order to avoid a stampede of mutex spinners trying to 455e42f678aSDavidlohr Bueso * acquire the mutex all at once, the spinners need to take a 456e42f678aSDavidlohr Bueso * MCS (queued) lock first before spinning on the owner field. 457e42f678aSDavidlohr Bueso */ 45876916515SDavidlohr Bueso if (!osq_lock(&lock->osq)) 459b341afb3SWaiman Long goto fail; 460b341afb3SWaiman Long } 46176916515SDavidlohr Bueso 462b341afb3SWaiman Long for (;;) { 46376916515SDavidlohr Bueso struct task_struct *owner; 46476916515SDavidlohr Bueso 46576916515SDavidlohr Bueso if (use_ww_ctx && ww_ctx->acquired > 0) { 46676916515SDavidlohr Bueso struct ww_mutex *ww; 46776916515SDavidlohr Bueso 46876916515SDavidlohr Bueso ww = container_of(lock, struct ww_mutex, base); 46976916515SDavidlohr Bueso /* 47076916515SDavidlohr Bueso * If ww->ctx is set the contents are undefined, only 47176916515SDavidlohr Bueso * by acquiring wait_lock there is a guarantee that 47276916515SDavidlohr Bueso * they are not invalid when reading. 47376916515SDavidlohr Bueso * 47476916515SDavidlohr Bueso * As such, when deadlock detection needs to be 47576916515SDavidlohr Bueso * performed the optimistic spinning cannot be done. 47676916515SDavidlohr Bueso */ 4774d3199e4SDavidlohr Bueso if (READ_ONCE(ww->ctx)) 478b341afb3SWaiman Long goto fail_unlock; 47976916515SDavidlohr Bueso } 48076916515SDavidlohr Bueso 481*e274795eSPeter Zijlstra /* Try to acquire the mutex... */ 482*e274795eSPeter Zijlstra owner = __mutex_trylock_or_owner(lock); 483*e274795eSPeter Zijlstra if (!owner) 484*e274795eSPeter Zijlstra break; 485*e274795eSPeter Zijlstra 48676916515SDavidlohr Bueso /* 487*e274795eSPeter Zijlstra * There's an owner, wait for it to either 48876916515SDavidlohr Bueso * release the lock or go to sleep. 48976916515SDavidlohr Bueso */ 490b341afb3SWaiman Long if (!mutex_spin_on_owner(lock, owner)) 491b341afb3SWaiman Long goto fail_unlock; 49276916515SDavidlohr Bueso 49376916515SDavidlohr Bueso /* 49476916515SDavidlohr Bueso * The cpu_relax() call is a compiler barrier which forces 49576916515SDavidlohr Bueso * everything in this loop to be re-loaded. We don't need 49676916515SDavidlohr Bueso * memory barriers as we'll eventually observe the right 49776916515SDavidlohr Bueso * values at the cost of a few extra spins. 49876916515SDavidlohr Bueso */ 499f2f09a4cSChristian Borntraeger cpu_relax(); 50076916515SDavidlohr Bueso } 50176916515SDavidlohr Bueso 502b341afb3SWaiman Long if (!waiter) 50376916515SDavidlohr Bueso osq_unlock(&lock->osq); 504b341afb3SWaiman Long 505b341afb3SWaiman Long return true; 506b341afb3SWaiman Long 507b341afb3SWaiman Long 508b341afb3SWaiman Long fail_unlock: 509b341afb3SWaiman Long if (!waiter) 510b341afb3SWaiman Long osq_unlock(&lock->osq); 511b341afb3SWaiman Long 512b341afb3SWaiman Long fail: 51376916515SDavidlohr Bueso /* 51476916515SDavidlohr Bueso * If we fell out of the spin path because of need_resched(), 51576916515SDavidlohr Bueso * reschedule now, before we try-lock the mutex. This avoids getting 51676916515SDavidlohr Bueso * scheduled out right after we obtained the mutex. 51776916515SDavidlohr Bueso */ 5186f942a1fSPeter Zijlstra if (need_resched()) { 5196f942a1fSPeter Zijlstra /* 5206f942a1fSPeter Zijlstra * We _should_ have TASK_RUNNING here, but just in case 5216f942a1fSPeter Zijlstra * we do not, make it so, otherwise we might get stuck. 5226f942a1fSPeter Zijlstra */ 5236f942a1fSPeter Zijlstra __set_current_state(TASK_RUNNING); 52476916515SDavidlohr Bueso schedule_preempt_disabled(); 5256f942a1fSPeter Zijlstra } 52676916515SDavidlohr Bueso 52776916515SDavidlohr Bueso return false; 52876916515SDavidlohr Bueso } 52976916515SDavidlohr Bueso #else 53076916515SDavidlohr Bueso static bool mutex_optimistic_spin(struct mutex *lock, 531b341afb3SWaiman Long struct ww_acquire_ctx *ww_ctx, 532b341afb3SWaiman Long const bool use_ww_ctx, const bool waiter) 53376916515SDavidlohr Bueso { 53476916515SDavidlohr Bueso return false; 53576916515SDavidlohr Bueso } 53601768b42SPeter Zijlstra #endif 53701768b42SPeter Zijlstra 5383ca0ff57SPeter Zijlstra static noinline void __sched __mutex_unlock_slowpath(struct mutex *lock, unsigned long ip); 53901768b42SPeter Zijlstra 54001768b42SPeter Zijlstra /** 54101768b42SPeter Zijlstra * mutex_unlock - release the mutex 54201768b42SPeter Zijlstra * @lock: the mutex to be released 54301768b42SPeter Zijlstra * 54401768b42SPeter Zijlstra * Unlock a mutex that has been locked by this task previously. 54501768b42SPeter Zijlstra * 54601768b42SPeter Zijlstra * This function must not be used in interrupt context. Unlocking 54701768b42SPeter Zijlstra * of a not locked mutex is not allowed. 54801768b42SPeter Zijlstra * 54901768b42SPeter Zijlstra * This function is similar to (but not equivalent to) up(). 55001768b42SPeter Zijlstra */ 55101768b42SPeter Zijlstra void __sched mutex_unlock(struct mutex *lock) 55201768b42SPeter Zijlstra { 5533ca0ff57SPeter Zijlstra #ifndef CONFIG_DEBUG_LOCK_ALLOC 5543ca0ff57SPeter Zijlstra if (__mutex_unlock_fast(lock)) 5553ca0ff57SPeter Zijlstra return; 55601768b42SPeter Zijlstra #endif 5573ca0ff57SPeter Zijlstra __mutex_unlock_slowpath(lock, _RET_IP_); 55801768b42SPeter Zijlstra } 55901768b42SPeter Zijlstra EXPORT_SYMBOL(mutex_unlock); 56001768b42SPeter Zijlstra 56101768b42SPeter Zijlstra /** 56201768b42SPeter Zijlstra * ww_mutex_unlock - release the w/w mutex 56301768b42SPeter Zijlstra * @lock: the mutex to be released 56401768b42SPeter Zijlstra * 56501768b42SPeter Zijlstra * Unlock a mutex that has been locked by this task previously with any of the 56601768b42SPeter Zijlstra * ww_mutex_lock* functions (with or without an acquire context). It is 56701768b42SPeter Zijlstra * forbidden to release the locks after releasing the acquire context. 56801768b42SPeter Zijlstra * 56901768b42SPeter Zijlstra * This function must not be used in interrupt context. Unlocking 57001768b42SPeter Zijlstra * of a unlocked mutex is not allowed. 57101768b42SPeter Zijlstra */ 57201768b42SPeter Zijlstra void __sched ww_mutex_unlock(struct ww_mutex *lock) 57301768b42SPeter Zijlstra { 57401768b42SPeter Zijlstra /* 57501768b42SPeter Zijlstra * The unlocking fastpath is the 0->1 transition from 'locked' 57601768b42SPeter Zijlstra * into 'unlocked' state: 57701768b42SPeter Zijlstra */ 57801768b42SPeter Zijlstra if (lock->ctx) { 57901768b42SPeter Zijlstra #ifdef CONFIG_DEBUG_MUTEXES 58001768b42SPeter Zijlstra DEBUG_LOCKS_WARN_ON(!lock->ctx->acquired); 58101768b42SPeter Zijlstra #endif 58201768b42SPeter Zijlstra if (lock->ctx->acquired > 0) 58301768b42SPeter Zijlstra lock->ctx->acquired--; 58401768b42SPeter Zijlstra lock->ctx = NULL; 58501768b42SPeter Zijlstra } 58601768b42SPeter Zijlstra 5873ca0ff57SPeter Zijlstra mutex_unlock(&lock->base); 58801768b42SPeter Zijlstra } 58901768b42SPeter Zijlstra EXPORT_SYMBOL(ww_mutex_unlock); 59001768b42SPeter Zijlstra 59101768b42SPeter Zijlstra static inline int __sched 59263dc47e9SDavidlohr Bueso __ww_mutex_lock_check_stamp(struct mutex *lock, struct ww_acquire_ctx *ctx) 59301768b42SPeter Zijlstra { 59401768b42SPeter Zijlstra struct ww_mutex *ww = container_of(lock, struct ww_mutex, base); 5954d3199e4SDavidlohr Bueso struct ww_acquire_ctx *hold_ctx = READ_ONCE(ww->ctx); 59601768b42SPeter Zijlstra 59701768b42SPeter Zijlstra if (!hold_ctx) 59801768b42SPeter Zijlstra return 0; 59901768b42SPeter Zijlstra 60001768b42SPeter Zijlstra if (ctx->stamp - hold_ctx->stamp <= LONG_MAX && 60101768b42SPeter Zijlstra (ctx->stamp != hold_ctx->stamp || ctx > hold_ctx)) { 60201768b42SPeter Zijlstra #ifdef CONFIG_DEBUG_MUTEXES 60301768b42SPeter Zijlstra DEBUG_LOCKS_WARN_ON(ctx->contending_lock); 60401768b42SPeter Zijlstra ctx->contending_lock = ww; 60501768b42SPeter Zijlstra #endif 60601768b42SPeter Zijlstra return -EDEADLK; 60701768b42SPeter Zijlstra } 60801768b42SPeter Zijlstra 60901768b42SPeter Zijlstra return 0; 61001768b42SPeter Zijlstra } 61101768b42SPeter Zijlstra 61201768b42SPeter Zijlstra /* 61301768b42SPeter Zijlstra * Lock a mutex (possibly interruptible), slowpath: 61401768b42SPeter Zijlstra */ 61501768b42SPeter Zijlstra static __always_inline int __sched 61601768b42SPeter Zijlstra __mutex_lock_common(struct mutex *lock, long state, unsigned int subclass, 61701768b42SPeter Zijlstra struct lockdep_map *nest_lock, unsigned long ip, 61801768b42SPeter Zijlstra struct ww_acquire_ctx *ww_ctx, const bool use_ww_ctx) 61901768b42SPeter Zijlstra { 62001768b42SPeter Zijlstra struct mutex_waiter waiter; 62101768b42SPeter Zijlstra unsigned long flags; 6229d659ae1SPeter Zijlstra bool first = false; 623a40ca565SWaiman Long struct ww_mutex *ww; 62401768b42SPeter Zijlstra int ret; 62501768b42SPeter Zijlstra 6260422e83dSChris Wilson if (use_ww_ctx) { 627a40ca565SWaiman Long ww = container_of(lock, struct ww_mutex, base); 6280422e83dSChris Wilson if (unlikely(ww_ctx == READ_ONCE(ww->ctx))) 6290422e83dSChris Wilson return -EALREADY; 6300422e83dSChris Wilson } 6310422e83dSChris Wilson 63201768b42SPeter Zijlstra preempt_disable(); 63301768b42SPeter Zijlstra mutex_acquire_nest(&lock->dep_map, subclass, 0, nest_lock, ip); 63401768b42SPeter Zijlstra 635*e274795eSPeter Zijlstra if (__mutex_trylock(lock) || 636b341afb3SWaiman Long mutex_optimistic_spin(lock, ww_ctx, use_ww_ctx, false)) { 63776916515SDavidlohr Bueso /* got the lock, yay! */ 6383ca0ff57SPeter Zijlstra lock_acquired(&lock->dep_map, ip); 639a40ca565SWaiman Long if (use_ww_ctx) 6403ca0ff57SPeter Zijlstra ww_mutex_set_context_fastpath(ww, ww_ctx); 64101768b42SPeter Zijlstra preempt_enable(); 64201768b42SPeter Zijlstra return 0; 64301768b42SPeter Zijlstra } 64401768b42SPeter Zijlstra 64501768b42SPeter Zijlstra spin_lock_mutex(&lock->wait_lock, flags); 6461e820c96SJason Low /* 6473ca0ff57SPeter Zijlstra * After waiting to acquire the wait_lock, try again. 6481e820c96SJason Low */ 649*e274795eSPeter Zijlstra if (__mutex_trylock(lock)) 65001768b42SPeter Zijlstra goto skip_wait; 65101768b42SPeter Zijlstra 65201768b42SPeter Zijlstra debug_mutex_lock_common(lock, &waiter); 653d269a8b8SDavidlohr Bueso debug_mutex_add_waiter(lock, &waiter, current); 65401768b42SPeter Zijlstra 65501768b42SPeter Zijlstra /* add waiting tasks to the end of the waitqueue (FIFO): */ 65601768b42SPeter Zijlstra list_add_tail(&waiter.list, &lock->wait_list); 657d269a8b8SDavidlohr Bueso waiter.task = current; 65801768b42SPeter Zijlstra 6599d659ae1SPeter Zijlstra if (__mutex_waiter_is_first(lock, &waiter)) 6603ca0ff57SPeter Zijlstra __mutex_set_flag(lock, MUTEX_FLAG_WAITERS); 6613ca0ff57SPeter Zijlstra 66201768b42SPeter Zijlstra lock_contended(&lock->dep_map, ip); 66301768b42SPeter Zijlstra 664642fa448SDavidlohr Bueso set_current_state(state); 66501768b42SPeter Zijlstra for (;;) { 6665bbd7e64SPeter Zijlstra /* 6675bbd7e64SPeter Zijlstra * Once we hold wait_lock, we're serialized against 6685bbd7e64SPeter Zijlstra * mutex_unlock() handing the lock off to us, do a trylock 6695bbd7e64SPeter Zijlstra * before testing the error conditions to make sure we pick up 6705bbd7e64SPeter Zijlstra * the handoff. 6715bbd7e64SPeter Zijlstra */ 672*e274795eSPeter Zijlstra if (__mutex_trylock(lock)) 6735bbd7e64SPeter Zijlstra goto acquired; 67401768b42SPeter Zijlstra 67501768b42SPeter Zijlstra /* 6765bbd7e64SPeter Zijlstra * Check for signals and wound conditions while holding 6775bbd7e64SPeter Zijlstra * wait_lock. This ensures the lock cancellation is ordered 6785bbd7e64SPeter Zijlstra * against mutex_unlock() and wake-ups do not go missing. 67901768b42SPeter Zijlstra */ 680d269a8b8SDavidlohr Bueso if (unlikely(signal_pending_state(state, current))) { 68101768b42SPeter Zijlstra ret = -EINTR; 68201768b42SPeter Zijlstra goto err; 68301768b42SPeter Zijlstra } 68401768b42SPeter Zijlstra 68501768b42SPeter Zijlstra if (use_ww_ctx && ww_ctx->acquired > 0) { 68663dc47e9SDavidlohr Bueso ret = __ww_mutex_lock_check_stamp(lock, ww_ctx); 68701768b42SPeter Zijlstra if (ret) 68801768b42SPeter Zijlstra goto err; 68901768b42SPeter Zijlstra } 69001768b42SPeter Zijlstra 69101768b42SPeter Zijlstra spin_unlock_mutex(&lock->wait_lock, flags); 69201768b42SPeter Zijlstra schedule_preempt_disabled(); 6939d659ae1SPeter Zijlstra 6949d659ae1SPeter Zijlstra if (!first && __mutex_waiter_is_first(lock, &waiter)) { 6959d659ae1SPeter Zijlstra first = true; 6969d659ae1SPeter Zijlstra __mutex_set_flag(lock, MUTEX_FLAG_HANDOFF); 6979d659ae1SPeter Zijlstra } 6985bbd7e64SPeter Zijlstra 699642fa448SDavidlohr Bueso set_current_state(state); 7005bbd7e64SPeter Zijlstra /* 7015bbd7e64SPeter Zijlstra * Here we order against unlock; we must either see it change 7025bbd7e64SPeter Zijlstra * state back to RUNNING and fall through the next schedule(), 7035bbd7e64SPeter Zijlstra * or we must see its unlock and acquire. 7045bbd7e64SPeter Zijlstra */ 705*e274795eSPeter Zijlstra if (__mutex_trylock(lock) || 706*e274795eSPeter Zijlstra (first && mutex_optimistic_spin(lock, ww_ctx, use_ww_ctx, true))) 7075bbd7e64SPeter Zijlstra break; 7085bbd7e64SPeter Zijlstra 7095bbd7e64SPeter Zijlstra spin_lock_mutex(&lock->wait_lock, flags); 71001768b42SPeter Zijlstra } 7115bbd7e64SPeter Zijlstra spin_lock_mutex(&lock->wait_lock, flags); 7125bbd7e64SPeter Zijlstra acquired: 713642fa448SDavidlohr Bueso __set_current_state(TASK_RUNNING); 71451587bcfSDavidlohr Bueso 715d269a8b8SDavidlohr Bueso mutex_remove_waiter(lock, &waiter, current); 71601768b42SPeter Zijlstra if (likely(list_empty(&lock->wait_list))) 7179d659ae1SPeter Zijlstra __mutex_clear_flag(lock, MUTEX_FLAGS); 7183ca0ff57SPeter Zijlstra 71901768b42SPeter Zijlstra debug_mutex_free_waiter(&waiter); 72001768b42SPeter Zijlstra 72101768b42SPeter Zijlstra skip_wait: 72201768b42SPeter Zijlstra /* got the lock - cleanup and rejoice! */ 72301768b42SPeter Zijlstra lock_acquired(&lock->dep_map, ip); 72401768b42SPeter Zijlstra 725a40ca565SWaiman Long if (use_ww_ctx) 7264bd19084SDavidlohr Bueso ww_mutex_set_context_slowpath(ww, ww_ctx); 72701768b42SPeter Zijlstra 72801768b42SPeter Zijlstra spin_unlock_mutex(&lock->wait_lock, flags); 72901768b42SPeter Zijlstra preempt_enable(); 73001768b42SPeter Zijlstra return 0; 73101768b42SPeter Zijlstra 73201768b42SPeter Zijlstra err: 733642fa448SDavidlohr Bueso __set_current_state(TASK_RUNNING); 734d269a8b8SDavidlohr Bueso mutex_remove_waiter(lock, &waiter, current); 73501768b42SPeter Zijlstra spin_unlock_mutex(&lock->wait_lock, flags); 73601768b42SPeter Zijlstra debug_mutex_free_waiter(&waiter); 73701768b42SPeter Zijlstra mutex_release(&lock->dep_map, 1, ip); 73801768b42SPeter Zijlstra preempt_enable(); 73901768b42SPeter Zijlstra return ret; 74001768b42SPeter Zijlstra } 74101768b42SPeter Zijlstra 74201768b42SPeter Zijlstra #ifdef CONFIG_DEBUG_LOCK_ALLOC 74301768b42SPeter Zijlstra void __sched 74401768b42SPeter Zijlstra mutex_lock_nested(struct mutex *lock, unsigned int subclass) 74501768b42SPeter Zijlstra { 74601768b42SPeter Zijlstra might_sleep(); 74701768b42SPeter Zijlstra __mutex_lock_common(lock, TASK_UNINTERRUPTIBLE, 74801768b42SPeter Zijlstra subclass, NULL, _RET_IP_, NULL, 0); 74901768b42SPeter Zijlstra } 75001768b42SPeter Zijlstra 75101768b42SPeter Zijlstra EXPORT_SYMBOL_GPL(mutex_lock_nested); 75201768b42SPeter Zijlstra 75301768b42SPeter Zijlstra void __sched 75401768b42SPeter Zijlstra _mutex_lock_nest_lock(struct mutex *lock, struct lockdep_map *nest) 75501768b42SPeter Zijlstra { 75601768b42SPeter Zijlstra might_sleep(); 75701768b42SPeter Zijlstra __mutex_lock_common(lock, TASK_UNINTERRUPTIBLE, 75801768b42SPeter Zijlstra 0, nest, _RET_IP_, NULL, 0); 75901768b42SPeter Zijlstra } 76001768b42SPeter Zijlstra EXPORT_SYMBOL_GPL(_mutex_lock_nest_lock); 76101768b42SPeter Zijlstra 76201768b42SPeter Zijlstra int __sched 76301768b42SPeter Zijlstra mutex_lock_killable_nested(struct mutex *lock, unsigned int subclass) 76401768b42SPeter Zijlstra { 76501768b42SPeter Zijlstra might_sleep(); 76601768b42SPeter Zijlstra return __mutex_lock_common(lock, TASK_KILLABLE, 76701768b42SPeter Zijlstra subclass, NULL, _RET_IP_, NULL, 0); 76801768b42SPeter Zijlstra } 76901768b42SPeter Zijlstra EXPORT_SYMBOL_GPL(mutex_lock_killable_nested); 77001768b42SPeter Zijlstra 77101768b42SPeter Zijlstra int __sched 77201768b42SPeter Zijlstra mutex_lock_interruptible_nested(struct mutex *lock, unsigned int subclass) 77301768b42SPeter Zijlstra { 77401768b42SPeter Zijlstra might_sleep(); 77501768b42SPeter Zijlstra return __mutex_lock_common(lock, TASK_INTERRUPTIBLE, 77601768b42SPeter Zijlstra subclass, NULL, _RET_IP_, NULL, 0); 77701768b42SPeter Zijlstra } 77801768b42SPeter Zijlstra EXPORT_SYMBOL_GPL(mutex_lock_interruptible_nested); 77901768b42SPeter Zijlstra 78001768b42SPeter Zijlstra static inline int 78101768b42SPeter Zijlstra ww_mutex_deadlock_injection(struct ww_mutex *lock, struct ww_acquire_ctx *ctx) 78201768b42SPeter Zijlstra { 78301768b42SPeter Zijlstra #ifdef CONFIG_DEBUG_WW_MUTEX_SLOWPATH 78401768b42SPeter Zijlstra unsigned tmp; 78501768b42SPeter Zijlstra 78601768b42SPeter Zijlstra if (ctx->deadlock_inject_countdown-- == 0) { 78701768b42SPeter Zijlstra tmp = ctx->deadlock_inject_interval; 78801768b42SPeter Zijlstra if (tmp > UINT_MAX/4) 78901768b42SPeter Zijlstra tmp = UINT_MAX; 79001768b42SPeter Zijlstra else 79101768b42SPeter Zijlstra tmp = tmp*2 + tmp + tmp/2; 79201768b42SPeter Zijlstra 79301768b42SPeter Zijlstra ctx->deadlock_inject_interval = tmp; 79401768b42SPeter Zijlstra ctx->deadlock_inject_countdown = tmp; 79501768b42SPeter Zijlstra ctx->contending_lock = lock; 79601768b42SPeter Zijlstra 79701768b42SPeter Zijlstra ww_mutex_unlock(lock); 79801768b42SPeter Zijlstra 79901768b42SPeter Zijlstra return -EDEADLK; 80001768b42SPeter Zijlstra } 80101768b42SPeter Zijlstra #endif 80201768b42SPeter Zijlstra 80301768b42SPeter Zijlstra return 0; 80401768b42SPeter Zijlstra } 80501768b42SPeter Zijlstra 80601768b42SPeter Zijlstra int __sched 80701768b42SPeter Zijlstra __ww_mutex_lock(struct ww_mutex *lock, struct ww_acquire_ctx *ctx) 80801768b42SPeter Zijlstra { 80901768b42SPeter Zijlstra int ret; 81001768b42SPeter Zijlstra 81101768b42SPeter Zijlstra might_sleep(); 81201768b42SPeter Zijlstra ret = __mutex_lock_common(&lock->base, TASK_UNINTERRUPTIBLE, 81301768b42SPeter Zijlstra 0, &ctx->dep_map, _RET_IP_, ctx, 1); 81401768b42SPeter Zijlstra if (!ret && ctx->acquired > 1) 81501768b42SPeter Zijlstra return ww_mutex_deadlock_injection(lock, ctx); 81601768b42SPeter Zijlstra 81701768b42SPeter Zijlstra return ret; 81801768b42SPeter Zijlstra } 81901768b42SPeter Zijlstra EXPORT_SYMBOL_GPL(__ww_mutex_lock); 82001768b42SPeter Zijlstra 82101768b42SPeter Zijlstra int __sched 82201768b42SPeter Zijlstra __ww_mutex_lock_interruptible(struct ww_mutex *lock, struct ww_acquire_ctx *ctx) 82301768b42SPeter Zijlstra { 82401768b42SPeter Zijlstra int ret; 82501768b42SPeter Zijlstra 82601768b42SPeter Zijlstra might_sleep(); 82701768b42SPeter Zijlstra ret = __mutex_lock_common(&lock->base, TASK_INTERRUPTIBLE, 82801768b42SPeter Zijlstra 0, &ctx->dep_map, _RET_IP_, ctx, 1); 82901768b42SPeter Zijlstra 83001768b42SPeter Zijlstra if (!ret && ctx->acquired > 1) 83101768b42SPeter Zijlstra return ww_mutex_deadlock_injection(lock, ctx); 83201768b42SPeter Zijlstra 83301768b42SPeter Zijlstra return ret; 83401768b42SPeter Zijlstra } 83501768b42SPeter Zijlstra EXPORT_SYMBOL_GPL(__ww_mutex_lock_interruptible); 83601768b42SPeter Zijlstra 83701768b42SPeter Zijlstra #endif 83801768b42SPeter Zijlstra 83901768b42SPeter Zijlstra /* 84001768b42SPeter Zijlstra * Release the lock, slowpath: 84101768b42SPeter Zijlstra */ 8423ca0ff57SPeter Zijlstra static noinline void __sched __mutex_unlock_slowpath(struct mutex *lock, unsigned long ip) 84301768b42SPeter Zijlstra { 8449d659ae1SPeter Zijlstra struct task_struct *next = NULL; 8453ca0ff57SPeter Zijlstra unsigned long owner, flags; 846194a6b5bSWaiman Long DEFINE_WAKE_Q(wake_q); 84701768b42SPeter Zijlstra 8483ca0ff57SPeter Zijlstra mutex_release(&lock->dep_map, 1, ip); 8493ca0ff57SPeter Zijlstra 85001768b42SPeter Zijlstra /* 8519d659ae1SPeter Zijlstra * Release the lock before (potentially) taking the spinlock such that 8529d659ae1SPeter Zijlstra * other contenders can get on with things ASAP. 8539d659ae1SPeter Zijlstra * 8549d659ae1SPeter Zijlstra * Except when HANDOFF, in that case we must not clear the owner field, 8559d659ae1SPeter Zijlstra * but instead set it to the top waiter. 85601768b42SPeter Zijlstra */ 8579d659ae1SPeter Zijlstra owner = atomic_long_read(&lock->owner); 8589d659ae1SPeter Zijlstra for (;;) { 8599d659ae1SPeter Zijlstra unsigned long old; 8609d659ae1SPeter Zijlstra 8619d659ae1SPeter Zijlstra #ifdef CONFIG_DEBUG_MUTEXES 8629d659ae1SPeter Zijlstra DEBUG_LOCKS_WARN_ON(__owner_task(owner) != current); 863*e274795eSPeter Zijlstra DEBUG_LOCKS_WARN_ON(owner & MUTEX_FLAG_PICKUP); 8649d659ae1SPeter Zijlstra #endif 8659d659ae1SPeter Zijlstra 8669d659ae1SPeter Zijlstra if (owner & MUTEX_FLAG_HANDOFF) 8679d659ae1SPeter Zijlstra break; 8689d659ae1SPeter Zijlstra 8699d659ae1SPeter Zijlstra old = atomic_long_cmpxchg_release(&lock->owner, owner, 8709d659ae1SPeter Zijlstra __owner_flags(owner)); 8719d659ae1SPeter Zijlstra if (old == owner) { 8729d659ae1SPeter Zijlstra if (owner & MUTEX_FLAG_WAITERS) 8739d659ae1SPeter Zijlstra break; 8749d659ae1SPeter Zijlstra 8753ca0ff57SPeter Zijlstra return; 8769d659ae1SPeter Zijlstra } 8779d659ae1SPeter Zijlstra 8789d659ae1SPeter Zijlstra owner = old; 8799d659ae1SPeter Zijlstra } 88001768b42SPeter Zijlstra 8811d8fe7dcSJason Low spin_lock_mutex(&lock->wait_lock, flags); 8821d8fe7dcSJason Low debug_mutex_unlock(lock); 88301768b42SPeter Zijlstra if (!list_empty(&lock->wait_list)) { 88401768b42SPeter Zijlstra /* get the first entry from the wait-list: */ 88501768b42SPeter Zijlstra struct mutex_waiter *waiter = 8869d659ae1SPeter Zijlstra list_first_entry(&lock->wait_list, 88701768b42SPeter Zijlstra struct mutex_waiter, list); 88801768b42SPeter Zijlstra 8899d659ae1SPeter Zijlstra next = waiter->task; 8909d659ae1SPeter Zijlstra 89101768b42SPeter Zijlstra debug_mutex_wake_waiter(lock, waiter); 8929d659ae1SPeter Zijlstra wake_q_add(&wake_q, next); 89301768b42SPeter Zijlstra } 89401768b42SPeter Zijlstra 8959d659ae1SPeter Zijlstra if (owner & MUTEX_FLAG_HANDOFF) 8969d659ae1SPeter Zijlstra __mutex_handoff(lock, next); 8979d659ae1SPeter Zijlstra 89801768b42SPeter Zijlstra spin_unlock_mutex(&lock->wait_lock, flags); 8999d659ae1SPeter Zijlstra 9001329ce6fSDavidlohr Bueso wake_up_q(&wake_q); 90101768b42SPeter Zijlstra } 90201768b42SPeter Zijlstra 90301768b42SPeter Zijlstra #ifndef CONFIG_DEBUG_LOCK_ALLOC 90401768b42SPeter Zijlstra /* 90501768b42SPeter Zijlstra * Here come the less common (and hence less performance-critical) APIs: 90601768b42SPeter Zijlstra * mutex_lock_interruptible() and mutex_trylock(). 90701768b42SPeter Zijlstra */ 90801768b42SPeter Zijlstra static noinline int __sched 90901768b42SPeter Zijlstra __mutex_lock_killable_slowpath(struct mutex *lock); 91001768b42SPeter Zijlstra 91101768b42SPeter Zijlstra static noinline int __sched 91201768b42SPeter Zijlstra __mutex_lock_interruptible_slowpath(struct mutex *lock); 91301768b42SPeter Zijlstra 91401768b42SPeter Zijlstra /** 91501768b42SPeter Zijlstra * mutex_lock_interruptible - acquire the mutex, interruptible 91601768b42SPeter Zijlstra * @lock: the mutex to be acquired 91701768b42SPeter Zijlstra * 91801768b42SPeter Zijlstra * Lock the mutex like mutex_lock(), and return 0 if the mutex has 91901768b42SPeter Zijlstra * been acquired or sleep until the mutex becomes available. If a 92001768b42SPeter Zijlstra * signal arrives while waiting for the lock then this function 92101768b42SPeter Zijlstra * returns -EINTR. 92201768b42SPeter Zijlstra * 92301768b42SPeter Zijlstra * This function is similar to (but not equivalent to) down_interruptible(). 92401768b42SPeter Zijlstra */ 92501768b42SPeter Zijlstra int __sched mutex_lock_interruptible(struct mutex *lock) 92601768b42SPeter Zijlstra { 92701768b42SPeter Zijlstra might_sleep(); 9283ca0ff57SPeter Zijlstra 9293ca0ff57SPeter Zijlstra if (__mutex_trylock_fast(lock)) 93001768b42SPeter Zijlstra return 0; 9313ca0ff57SPeter Zijlstra 93201768b42SPeter Zijlstra return __mutex_lock_interruptible_slowpath(lock); 93301768b42SPeter Zijlstra } 93401768b42SPeter Zijlstra 93501768b42SPeter Zijlstra EXPORT_SYMBOL(mutex_lock_interruptible); 93601768b42SPeter Zijlstra 93701768b42SPeter Zijlstra int __sched mutex_lock_killable(struct mutex *lock) 93801768b42SPeter Zijlstra { 93901768b42SPeter Zijlstra might_sleep(); 9403ca0ff57SPeter Zijlstra 9413ca0ff57SPeter Zijlstra if (__mutex_trylock_fast(lock)) 94201768b42SPeter Zijlstra return 0; 9433ca0ff57SPeter Zijlstra 94401768b42SPeter Zijlstra return __mutex_lock_killable_slowpath(lock); 94501768b42SPeter Zijlstra } 94601768b42SPeter Zijlstra EXPORT_SYMBOL(mutex_lock_killable); 94701768b42SPeter Zijlstra 9483ca0ff57SPeter Zijlstra static noinline void __sched 9493ca0ff57SPeter Zijlstra __mutex_lock_slowpath(struct mutex *lock) 95001768b42SPeter Zijlstra { 95101768b42SPeter Zijlstra __mutex_lock_common(lock, TASK_UNINTERRUPTIBLE, 0, 95201768b42SPeter Zijlstra NULL, _RET_IP_, NULL, 0); 95301768b42SPeter Zijlstra } 95401768b42SPeter Zijlstra 95501768b42SPeter Zijlstra static noinline int __sched 95601768b42SPeter Zijlstra __mutex_lock_killable_slowpath(struct mutex *lock) 95701768b42SPeter Zijlstra { 95801768b42SPeter Zijlstra return __mutex_lock_common(lock, TASK_KILLABLE, 0, 95901768b42SPeter Zijlstra NULL, _RET_IP_, NULL, 0); 96001768b42SPeter Zijlstra } 96101768b42SPeter Zijlstra 96201768b42SPeter Zijlstra static noinline int __sched 96301768b42SPeter Zijlstra __mutex_lock_interruptible_slowpath(struct mutex *lock) 96401768b42SPeter Zijlstra { 96501768b42SPeter Zijlstra return __mutex_lock_common(lock, TASK_INTERRUPTIBLE, 0, 96601768b42SPeter Zijlstra NULL, _RET_IP_, NULL, 0); 96701768b42SPeter Zijlstra } 96801768b42SPeter Zijlstra 96901768b42SPeter Zijlstra static noinline int __sched 97001768b42SPeter Zijlstra __ww_mutex_lock_slowpath(struct ww_mutex *lock, struct ww_acquire_ctx *ctx) 97101768b42SPeter Zijlstra { 97201768b42SPeter Zijlstra return __mutex_lock_common(&lock->base, TASK_UNINTERRUPTIBLE, 0, 97301768b42SPeter Zijlstra NULL, _RET_IP_, ctx, 1); 97401768b42SPeter Zijlstra } 97501768b42SPeter Zijlstra 97601768b42SPeter Zijlstra static noinline int __sched 97701768b42SPeter Zijlstra __ww_mutex_lock_interruptible_slowpath(struct ww_mutex *lock, 97801768b42SPeter Zijlstra struct ww_acquire_ctx *ctx) 97901768b42SPeter Zijlstra { 98001768b42SPeter Zijlstra return __mutex_lock_common(&lock->base, TASK_INTERRUPTIBLE, 0, 98101768b42SPeter Zijlstra NULL, _RET_IP_, ctx, 1); 98201768b42SPeter Zijlstra } 98301768b42SPeter Zijlstra 98401768b42SPeter Zijlstra #endif 98501768b42SPeter Zijlstra 98601768b42SPeter Zijlstra /** 98701768b42SPeter Zijlstra * mutex_trylock - try to acquire the mutex, without waiting 98801768b42SPeter Zijlstra * @lock: the mutex to be acquired 98901768b42SPeter Zijlstra * 99001768b42SPeter Zijlstra * Try to acquire the mutex atomically. Returns 1 if the mutex 99101768b42SPeter Zijlstra * has been acquired successfully, and 0 on contention. 99201768b42SPeter Zijlstra * 99301768b42SPeter Zijlstra * NOTE: this function follows the spin_trylock() convention, so 99401768b42SPeter Zijlstra * it is negated from the down_trylock() return values! Be careful 99501768b42SPeter Zijlstra * about this when converting semaphore users to mutexes. 99601768b42SPeter Zijlstra * 99701768b42SPeter Zijlstra * This function must not be used in interrupt context. The 99801768b42SPeter Zijlstra * mutex must be released by the same task that acquired it. 99901768b42SPeter Zijlstra */ 100001768b42SPeter Zijlstra int __sched mutex_trylock(struct mutex *lock) 100101768b42SPeter Zijlstra { 1002*e274795eSPeter Zijlstra bool locked = __mutex_trylock(lock); 100301768b42SPeter Zijlstra 10043ca0ff57SPeter Zijlstra if (locked) 10053ca0ff57SPeter Zijlstra mutex_acquire(&lock->dep_map, 0, 1, _RET_IP_); 100601768b42SPeter Zijlstra 10073ca0ff57SPeter Zijlstra return locked; 100801768b42SPeter Zijlstra } 100901768b42SPeter Zijlstra EXPORT_SYMBOL(mutex_trylock); 101001768b42SPeter Zijlstra 101101768b42SPeter Zijlstra #ifndef CONFIG_DEBUG_LOCK_ALLOC 101201768b42SPeter Zijlstra int __sched 101301768b42SPeter Zijlstra __ww_mutex_lock(struct ww_mutex *lock, struct ww_acquire_ctx *ctx) 101401768b42SPeter Zijlstra { 101501768b42SPeter Zijlstra might_sleep(); 101601768b42SPeter Zijlstra 10173ca0ff57SPeter Zijlstra if (__mutex_trylock_fast(&lock->base)) { 101801768b42SPeter Zijlstra ww_mutex_set_context_fastpath(lock, ctx); 10193ca0ff57SPeter Zijlstra return 0; 10203ca0ff57SPeter Zijlstra } 10213ca0ff57SPeter Zijlstra 10223ca0ff57SPeter Zijlstra return __ww_mutex_lock_slowpath(lock, ctx); 102301768b42SPeter Zijlstra } 102401768b42SPeter Zijlstra EXPORT_SYMBOL(__ww_mutex_lock); 102501768b42SPeter Zijlstra 102601768b42SPeter Zijlstra int __sched 102701768b42SPeter Zijlstra __ww_mutex_lock_interruptible(struct ww_mutex *lock, struct ww_acquire_ctx *ctx) 102801768b42SPeter Zijlstra { 102901768b42SPeter Zijlstra might_sleep(); 103001768b42SPeter Zijlstra 10313ca0ff57SPeter Zijlstra if (__mutex_trylock_fast(&lock->base)) { 103201768b42SPeter Zijlstra ww_mutex_set_context_fastpath(lock, ctx); 10333ca0ff57SPeter Zijlstra return 0; 10343ca0ff57SPeter Zijlstra } 10353ca0ff57SPeter Zijlstra 10363ca0ff57SPeter Zijlstra return __ww_mutex_lock_interruptible_slowpath(lock, ctx); 103701768b42SPeter Zijlstra } 103801768b42SPeter Zijlstra EXPORT_SYMBOL(__ww_mutex_lock_interruptible); 103901768b42SPeter Zijlstra 104001768b42SPeter Zijlstra #endif 104101768b42SPeter Zijlstra 104201768b42SPeter Zijlstra /** 104301768b42SPeter Zijlstra * atomic_dec_and_mutex_lock - return holding mutex if we dec to 0 104401768b42SPeter Zijlstra * @cnt: the atomic which we are to dec 104501768b42SPeter Zijlstra * @lock: the mutex to return holding if we dec to 0 104601768b42SPeter Zijlstra * 104701768b42SPeter Zijlstra * return true and hold lock if we dec to 0, return false otherwise 104801768b42SPeter Zijlstra */ 104901768b42SPeter Zijlstra int atomic_dec_and_mutex_lock(atomic_t *cnt, struct mutex *lock) 105001768b42SPeter Zijlstra { 105101768b42SPeter Zijlstra /* dec if we can't possibly hit 0 */ 105201768b42SPeter Zijlstra if (atomic_add_unless(cnt, -1, 1)) 105301768b42SPeter Zijlstra return 0; 105401768b42SPeter Zijlstra /* we might hit 0, so take the lock */ 105501768b42SPeter Zijlstra mutex_lock(lock); 105601768b42SPeter Zijlstra if (!atomic_dec_and_test(cnt)) { 105701768b42SPeter Zijlstra /* when we actually did the dec, we didn't hit 0 */ 105801768b42SPeter Zijlstra mutex_unlock(lock); 105901768b42SPeter Zijlstra return 0; 106001768b42SPeter Zijlstra } 106101768b42SPeter Zijlstra /* we hit 0, and we hold the lock */ 106201768b42SPeter Zijlstra return 1; 106301768b42SPeter Zijlstra } 106401768b42SPeter Zijlstra EXPORT_SYMBOL(atomic_dec_and_mutex_lock); 1065