xref: /linux-6.15/kernel/locking/qspinlock.c (revision ac08f68f)
// SPDX-License-Identifier: GPL-2.0-or-later
/*
 * Queued spinlock
 *
 * (C) Copyright 2013-2015 Hewlett-Packard Development Company, L.P.
 * (C) Copyright 2013-2014,2018 Red Hat, Inc.
 * (C) Copyright 2015 Intel Corp.
 * (C) Copyright 2015 Hewlett-Packard Enterprise Development LP
 *
 * Authors: Waiman Long <[email protected]>
 *          Peter Zijlstra <[email protected]>
 */

#ifndef _GEN_PV_LOCK_SLOWPATH

#include <linux/smp.h>
#include <linux/bug.h>
#include <linux/cpumask.h>
#include <linux/percpu.h>
#include <linux/hardirq.h>
#include <linux/mutex.h>
#include <linux/prefetch.h>
#include <asm/byteorder.h>
#include <asm/qspinlock.h>
#include <trace/events/lock.h>

/*
 * Include queued spinlock definitions and statistics code
 */
#include "qspinlock.h"
#include "qspinlock_stat.h"

/*
 * The basic principle of a queue-based spinlock can best be understood
 * by studying a classic queue-based spinlock implementation called the
 * MCS lock. A copy of the original MCS lock paper ("Algorithms for Scalable
 * Synchronization on Shared-Memory Multiprocessors" by Mellor-Crummey and
 * Scott) is available at
 *
 * https://bugzilla.kernel.org/show_bug.cgi?id=206115
 *
 * This queued spinlock implementation is based on the MCS lock; however, to
 * make it fit the 4 bytes we assume spinlock_t to be, and to preserve its
 * existing API, we must modify it.
 *
 * In particular; where the traditional MCS lock consists of a tail pointer
 * (8 bytes) and needs the next pointer (another 8 bytes) of its own node to
 * unlock the next pending (next->locked), we compress both these: {tail,
 * next->locked} into a single u32 value.
 *
 * Since a spinlock disables recursion of its own context, there is a limit
 * to the contexts that can nest; namely: task, softirq, hardirq, and nmi.
 * As there are at most 4 nesting levels, the level can be encoded in a
 * 2-bit number, and the tail is formed by combining this 2-bit nesting
 * level with the cpu number. With one byte for the lock value and 3 bytes
 * for the tail, only a 32-bit word is now needed. Even though we only need
 * 1 bit for the lock, we extend it to a full byte to achieve better
 * performance for architectures that support atomic byte writes.
 *
 * We also change the first spinner to spin on the lock bit instead of its
 * node; thereby avoiding the need to carry a node from lock to unlock, and
 * preserving the existing lock API. This also makes the unlock code simpler
 * and faster.
 *
 * N.B. The current implementation only supports architectures that allow
 *      atomic operations on smaller 8-bit and 16-bit data types.
 */
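
/*
 * For illustration only: a minimal sketch of the tail encoding described
 * above. The real encode_tail()/decode_tail() helpers live in qspinlock.h;
 * the sketch_*() names below are hypothetical, and the exact bit positions
 * assume the common layout used when NR_CPUS < 16K:
 *
 *   0- 7: locked byte
 *   8-15: pending
 *  16-17: tail index (nesting level, 0-3)
 *  18-31: tail cpu (+1)
 *
 *	static inline u32 sketch_encode_tail(int cpu, int idx)
 *	{
 *		return ((u32)(cpu + 1) << 18) | ((u32)idx << 16);
 *	}
 *
 *	static inline void sketch_decode_tail(u32 tail, int *cpu, int *idx)
 *	{
 *		*cpu = (int)(tail >> 18) - 1;
 *		*idx = (tail >> 16) & 3;
 *	}
 *
 * The cpu number is stored off-by-one so that an all-zero tail can encode
 * the "queue empty" state.
 */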

#include "mcs_spinlock.h"

/*
 * Per-CPU queue node structures; we can never have more than 4 nested
 * contexts: task, softirq, hardirq, nmi.
 *
 * Exactly fits one 64-byte cacheline on a 64-bit architecture.
 *
 * PV doubles the storage and uses the second cacheline for PV state.
 */
static DEFINE_PER_CPU_ALIGNED(struct qnode, qnodes[_Q_MAX_NODES]);
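
/*
 * For illustration: given this CPU's base node and a nesting index, the
 * per-context node is reached by plain array arithmetic. A sketch of what
 * grab_mcs_node() in qspinlock.h effectively does (hypothetical name):
 *
 *	static inline struct mcs_spinlock *sketch_grab_node(
 *			struct mcs_spinlock *base, int idx)
 *	{
 *		return &((struct qnode *)base + idx)->mcs;
 *	}
 *
 * where @base is this_cpu_ptr(&qnodes[0].mcs) and @idx is the nesting
 * level obtained from node->count++ in the slowpath below.
 */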

/*
 * Generate the native code for queued_spin_lock_slowpath(); provide NOPs
 * for all the PV callbacks.
 */

static __always_inline void __pv_init_node(struct mcs_spinlock *node) { }
static __always_inline void __pv_wait_node(struct mcs_spinlock *node,
					   struct mcs_spinlock *prev) { }
static __always_inline void __pv_kick_node(struct qspinlock *lock,
					   struct mcs_spinlock *node) { }
static __always_inline u32  __pv_wait_head_or_lock(struct qspinlock *lock,
						   struct mcs_spinlock *node)
						   { return 0; }

#define pv_enabled()		false

#define pv_init_node		__pv_init_node
#define pv_wait_node		__pv_wait_node
#define pv_kick_node		__pv_kick_node
#define pv_wait_head_or_lock	__pv_wait_head_or_lock

#ifdef CONFIG_PARAVIRT_SPINLOCKS
#define queued_spin_lock_slowpath	native_queued_spin_lock_slowpath
#endif

#endif /* _GEN_PV_LOCK_SLOWPATH */

/**
 * queued_spin_lock_slowpath - acquire the queued spinlock
 * @lock: Pointer to queued spinlock structure
 * @val: Current value of the queued spinlock 32-bit word
 *
 * (queue tail, pending bit, lock value)
 *
 *              fast     :    slow                                  :    unlock
 *                       :                                          :
 * uncontended  (0,0,0) -:--> (0,0,1) ------------------------------:--> (*,*,0)
 *                       :       | ^--------.------.             /  :
 *                       :       v           \      \            |  :
 * pending               :    (0,1,1) +--> (0,1,0)   \           |  :
 *                       :       | ^--'              |           |  :
 *                       :       v                   |           |  :
 * uncontended           :    (n,x,y) +--> (n,0,0) --'           |  :
 *   queue               :       | ^--'                          |  :
 *                       :       v                               |  :
 * contended             :    (*,x,y) +--> (*,0,0) ---> (*,0,1) -'  :
 *   queue               :         ^--'                             :
 */
void __lockfunc queued_spin_lock_slowpath(struct qspinlock *lock, u32 val)
{
	struct mcs_spinlock *prev, *next, *node;
	u32 old, tail;
	int idx;

	BUILD_BUG_ON(CONFIG_NR_CPUS >= (1U << _Q_TAIL_CPU_BITS));

	if (pv_enabled())
		goto pv_queue;

	if (virt_spin_lock(lock))
		return;

	/*
	 * Wait for in-progress pending->locked hand-overs with a bounded
	 * number of spins so that we guarantee forward progress.
	 *
	 * 0,1,0 -> 0,0,1
	 */
	if (val == _Q_PENDING_VAL) {
		int cnt = _Q_PENDING_LOOPS;
		val = atomic_cond_read_relaxed(&lock->val,
					       (VAL != _Q_PENDING_VAL) || !cnt--);
	}
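
	/*
	 * Roughly, and ignoring architecture-specific wait primitives, the
	 * bounded wait above behaves like this hypothetical expansion:
	 *
	 *	int cnt = _Q_PENDING_LOOPS;
	 *	val = atomic_read(&lock->val);
	 *	while (val == _Q_PENDING_VAL && cnt--) {
	 *		cpu_relax();
	 *		val = atomic_read(&lock->val);
	 *	}
	 */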

	/*
	 * If we observe any contention; queue.
	 */
	if (val & ~_Q_LOCKED_MASK)
		goto queue;

	/*
	 * trylock || pending
	 *
	 * 0,0,* -> 0,1,* -> 0,0,1 pending, trylock
	 */
	val = queued_fetch_set_pending_acquire(lock);
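
	/*
	 * Generically, queued_fetch_set_pending_acquire() above amounts to:
	 *
	 *	val = atomic_fetch_or_acquire(_Q_PENDING_VAL, &lock->val);
	 *
	 * i.e. it atomically sets the pending bit and returns the old lock
	 * word; architectures may provide a cheaper implementation.
	 */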

	/*
	 * If we observe contention, there is a concurrent locker.
	 *
	 * Undo and queue; our setting of PENDING might have made the
	 * n,0,0 -> 0,0,0 transition fail and it will now be waiting
	 * on @next to become !NULL.
	 */
	if (unlikely(val & ~_Q_LOCKED_MASK)) {

		/* Undo PENDING if we set it. */
		if (!(val & _Q_PENDING_MASK))
			clear_pending(lock);

		goto queue;
	}

	/*
	 * We're pending, wait for the owner to go away.
	 *
	 * 0,1,1 -> *,1,0
	 *
	 * this wait loop must be a load-acquire such that we match the
	 * store-release that clears the locked bit and create lock
	 * sequentiality; this is because not all
	 * clear_pending_set_locked() implementations imply full
	 * barriers.
	 */
	if (val & _Q_LOCKED_MASK)
		smp_cond_load_acquire(&lock->locked, !VAL);

	/*
	 * take ownership and clear the pending bit.
	 *
	 * 0,1,0 -> 0,0,1
	 */
	clear_pending_set_locked(lock);
	lockevent_inc(lock_pending);
	return;
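
	/*
	 * For reference, when the pending bit occupies a full byte
	 * (_Q_PENDING_BITS == 8), clear_pending_set_locked() above is a
	 * single half-word store, roughly:
	 *
	 *	WRITE_ONCE(lock->locked_pending, _Q_LOCKED_VAL);
	 *
	 * while the generic fallback atomically adjusts both fields:
	 *
	 *	atomic_add(-_Q_PENDING_VAL + _Q_LOCKED_VAL, &lock->val);
	 */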

	/*
	 * End of pending bit optimistic spinning and beginning of MCS
	 * queuing.
	 */
queue:
	lockevent_inc(lock_slowpath);
pv_queue:
	node = this_cpu_ptr(&qnodes[0].mcs);
	idx = node->count++;
	tail = encode_tail(smp_processor_id(), idx);

	trace_contention_begin(lock, LCB_F_SPIN);

	/*
	 * 4 nodes are allocated based on the assumption that there will
	 * not be nested NMIs taking spinlocks. That may not be true on
	 * some architectures, even though the chance of needing more than
	 * 4 nodes will still be extremely unlikely. When that happens,
	 * we fall back to spinning on the lock directly without using
	 * any MCS node. This is not the most elegant solution, but is
	 * simple enough.
	 */
	if (unlikely(idx >= _Q_MAX_NODES)) {
		lockevent_inc(lock_no_node);
		while (!queued_spin_trylock(lock))
			cpu_relax();
		goto release;
	}

	node = grab_mcs_node(node, idx);

	/*
	 * Keep counts of non-zero index values:
	 */
	lockevent_cond_inc(lock_use_node2 + idx - 1, idx);

	/*
	 * Ensure that we increment the head node->count before initialising
	 * the actual node. If the compiler is kind enough to reorder these
	 * stores, then an IRQ could overwrite our assignments.
	 */
	barrier();

	node->locked = 0;
	node->next = NULL;
	pv_init_node(node);

	/*
	 * We touched a (possibly) cold cacheline in the per-cpu queue node;
	 * attempt the trylock once more in the hope someone let go while we
	 * weren't watching.
	 */
	if (queued_spin_trylock(lock))
		goto release;

	/*
	 * Ensure that the initialisation of @node is complete before we
	 * publish the updated tail via xchg_tail() and potentially link
	 * @node into the waitqueue via WRITE_ONCE(prev->next, node) below.
	 */
	smp_wmb();

	/*
	 * Publish the updated tail.
	 * We have already touched the queueing cacheline; don't bother with
	 * pending stuff.
	 *
	 * p,*,* -> n,*,*
	 */
	old = xchg_tail(lock, tail);
	next = NULL;
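
	/*
	 * With a 16-bit tail (_Q_PENDING_BITS == 8), xchg_tail() above is
	 * roughly a relaxed exchange on the tail half-word:
	 *
	 *	old = (u32)xchg_relaxed(&lock->tail, tail >> 16) << 16;
	 *
	 * the generic variant loops with atomic_cmpxchg_relaxed() on the
	 * whole 32-bit word instead.
	 */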

	/*
	 * if there was a previous node; link it and wait until reaching the
	 * head of the waitqueue.
	 */
	if (old & _Q_TAIL_MASK) {
		prev = decode_tail(old, qnodes);

		/* Link @node into the waitqueue. */
		WRITE_ONCE(prev->next, node);

		pv_wait_node(node, prev);
		arch_mcs_spin_lock_contended(&node->locked);

		/*
		 * While waiting for the MCS lock, the next pointer may have
		 * been set by another lock waiter. We optimistically load
		 * the next pointer & prefetch the cacheline for writing
		 * to reduce latency in the upcoming MCS unlock operation.
		 */
		next = READ_ONCE(node->next);
		if (next)
			prefetchw(next);
	}

	/*
	 * we're at the head of the waitqueue, wait for the owner & pending to
	 * go away.
	 *
	 * *,x,y -> *,0,0
	 *
	 * this wait loop must use a load-acquire such that we match the
	 * store-release that clears the locked bit and create lock
	 * sequentiality; this is because the set_locked() function below
	 * does not imply a full barrier.
	 *
	 * The PV pv_wait_head_or_lock function, if active, will acquire
	 * the lock and return a non-zero value. So we have to skip the
	 * atomic_cond_read_acquire() call. As the next PV queue head hasn't
	 * been designated yet, there is no way for the locked value to become
	 * _Q_SLOW_VAL. So both the set_locked() and the
	 * atomic_cmpxchg_relaxed() calls will be safe.
	 *
	 * If PV isn't active, 0 will be returned instead.
	 */
	if ((val = pv_wait_head_or_lock(lock, node)))
		goto locked;

	val = atomic_cond_read_acquire(&lock->val, !(VAL & _Q_LOCKED_PENDING_MASK));

locked:
	/*
	 * claim the lock:
	 *
	 * n,0,0 -> 0,0,1 : lock, uncontended
	 * *,*,0 -> *,*,1 : lock, contended
	 *
	 * If the queue head is the only one in the queue (lock value == tail)
	 * and nobody is pending, clear the tail code and grab the lock.
	 * Otherwise, we only need to grab the lock.
	 */

	/*
	 * In the PV case we might already have _Q_LOCKED_VAL set, because
	 * of lock stealing; therefore we must also allow:
	 *
	 * n,0,1 -> 0,0,1
	 *
	 * Note: at this point: (val & _Q_PENDING_MASK) == 0, because of the
	 *       above wait condition, therefore any concurrent setting of
	 *       PENDING will make the uncontended transition fail.
	 */
	if ((val & _Q_TAIL_MASK) == tail) {
		if (atomic_try_cmpxchg_relaxed(&lock->val, &val, _Q_LOCKED_VAL))
			goto release; /* No contention */
	}

	/*
	 * Either somebody is queued behind us or _Q_PENDING_VAL got set
	 * which will then detect the remaining tail and queue behind us
	 * ensuring we'll see a @next.
	 */
	set_locked(lock);
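
	/*
	 * set_locked() is just a byte store, approximately:
	 *
	 *	WRITE_ONCE(lock->locked, _Q_LOCKED_VAL);
	 *
	 * and, as noted above, does not imply a full barrier.
	 */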

	/*
	 * contended path; wait for next if not observed yet, release.
	 */
	if (!next)
		next = smp_cond_load_relaxed(&node->next, (VAL));

	arch_mcs_spin_unlock_contended(&next->locked);
	pv_kick_node(lock, next);

release:
	trace_contention_end(lock, 0);

	/*
	 * release the node
	 */
	__this_cpu_dec(qnodes[0].mcs.count);
}
EXPORT_SYMBOL(queued_spin_lock_slowpath);

/*
 * Generate the paravirt code for queued_spin_lock_slowpath().
 */
#if !defined(_GEN_PV_LOCK_SLOWPATH) && defined(CONFIG_PARAVIRT_SPINLOCKS)
#define _GEN_PV_LOCK_SLOWPATH

#undef  pv_enabled
#define pv_enabled()	true

#undef pv_init_node
#undef pv_wait_node
#undef pv_kick_node
#undef pv_wait_head_or_lock

#undef  queued_spin_lock_slowpath
#define queued_spin_lock_slowpath	__pv_queued_spin_lock_slowpath

#include "qspinlock_paravirt.h"
#include "qspinlock.c"

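/*
 * Boot-time knob: passing "nopvspin" on the kernel command line makes the
 * hypervisor-specific init code (e.g. KVM or Xen guest setup) skip the
 * paravirt spinlock slowpath and use the native qspinlock instead.
 */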
bool nopvspin;
static __init int parse_nopvspin(char *arg)
{
	nopvspin = true;
	return 0;
}
early_param("nopvspin", parse_nopvspin);
#endif