/* SPDX-License-Identifier: GPL-2.0-or-later */
/*
 * Queued spinlock defines
 *
 * This file contains macro definitions and functions shared between different
 * qspinlock slow path implementations.
 */
#ifndef __LINUX_QSPINLOCK_H
#define __LINUX_QSPINLOCK_H

#include <asm-generic/percpu.h>
#include <linux/percpu-defs.h>
#include <asm-generic/qspinlock.h>
#include <asm-generic/mcs_spinlock.h>

#define _Q_MAX_NODES	4

/*
 * The pending bit spinning loop count.
 * This heuristic is used to limit the number of lockword accesses
 * made by atomic_cond_read_relaxed when waiting for the lock to
 * transition out of the "== _Q_PENDING_VAL" state. We don't spin
 * indefinitely because there's no guarantee that we'll make forward
 * progress.
 */
#ifndef _Q_PENDING_LOOPS
#define _Q_PENDING_LOOPS	1
#endif
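
/*
 * For illustration only: a slow path typically bounds the wait on the
 * 0,1,0 -> 0,0,1 hand-over roughly like the sketch below (mirroring the
 * pattern used by queued_spin_lock_slowpath()), so that at most
 * _Q_PENDING_LOOPS extra lockword reads are issued:
 *
 *	if (val == _Q_PENDING_VAL) {
 *		int cnt = _Q_PENDING_LOOPS;
 *		val = atomic_cond_read_relaxed(&lock->val,
 *					       (VAL != _Q_PENDING_VAL) || !cnt--);
 *	}
 */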

/*
 * On 64-bit architectures, the mcs_spinlock structure will be 16 bytes in
 * size and four of them will fit nicely in one 64-byte cacheline. For
 * pvqspinlock, however, we need more space for extra data. To accommodate
 * that, we insert two more long words to pad it up to 32 bytes. IOW, only
 * two of them can fit in a cacheline in this case. That is OK as it is rare
 * to have more than 2 levels of slowpath nesting in actual use. We don't
 * want to penalize pvqspinlocks to optimize for a rare case in native
 * qspinlocks.
 */
struct qnode {
	struct mcs_spinlock mcs;
#ifdef CONFIG_PARAVIRT_SPINLOCKS
	long reserved[2];
#endif
};
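
/*
 * A slow path implementation typically provides its own per-CPU array of
 * these nodes, one per nesting level (task, softirq, hardirq, NMI). A sketch
 * of such a declaration, mirroring the native qspinlock code:
 *
 *	static DEFINE_PER_CPU_ALIGNED(struct qnode, qnodes[_Q_MAX_NODES]);
 */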

/*
 * We must be able to distinguish between no-tail and the tail at 0:0,
 * therefore increment the cpu number by one.
 */

static inline __pure u32 encode_tail(int cpu, int idx)
{
	u32 tail;

	tail  = (cpu + 1) << _Q_TAIL_CPU_OFFSET;
	tail |= idx << _Q_TAIL_IDX_OFFSET; /* assume < 4 */

	return tail;
}
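
/*
 * Worked example: encode_tail(0, 0) yields 1 << _Q_TAIL_CPU_OFFSET, which is
 * non-zero and therefore distinguishable from the "no tail" value of 0;
 * decode_tail() below undoes the +1 to recover cpu 0, idx 0.
 */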

static inline __pure struct mcs_spinlock *decode_tail(u32 tail,
						       struct qnode __percpu *qnodes)
{
	int cpu = (tail >> _Q_TAIL_CPU_OFFSET) - 1;
	int idx = (tail & _Q_TAIL_IDX_MASK) >> _Q_TAIL_IDX_OFFSET;

	return per_cpu_ptr(&qnodes[idx].mcs, cpu);
}

static inline __pure
struct mcs_spinlock *grab_mcs_node(struct mcs_spinlock *base, int idx)
{
	return &((struct qnode *)base + idx)->mcs;
}
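
/*
 * For illustration: a slow path typically picks its MCS node by bumping the
 * per-CPU nesting count and indexing into its qnode array, along the lines
 * of the native qspinlock code (qnodes, node, idx and tail below are the
 * caller's own data, not defined in this header):
 *
 *	node = this_cpu_ptr(&qnodes[0].mcs);
 *	idx  = node->count++;
 *	tail = encode_tail(smp_processor_id(), idx);
 *	node = grab_mcs_node(node, idx);
 */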

#define _Q_LOCKED_PENDING_MASK (_Q_LOCKED_MASK | _Q_PENDING_MASK)

#if _Q_PENDING_BITS == 8
/**
 * clear_pending - clear the pending bit.
 * @lock: Pointer to queued spinlock structure
 *
 * *,1,* -> *,0,*
 */
static __always_inline void clear_pending(struct qspinlock *lock)
{
	WRITE_ONCE(lock->pending, 0);
}

/**
 * clear_pending_set_locked - take ownership and clear the pending bit.
 * @lock: Pointer to queued spinlock structure
 *
 * *,1,0 -> *,0,1
 *
 * Lock stealing is not allowed if this function is used.
 */
static __always_inline void clear_pending_set_locked(struct qspinlock *lock)
{
	WRITE_ONCE(lock->locked_pending, _Q_LOCKED_VAL);
}

/**
 * xchg_tail - Put in the new queue tail code word & retrieve previous one
 * @lock : Pointer to queued spinlock structure
 * @tail : The new queue tail code word
 * Return: The previous queue tail code word
 *
 * xchg(lock, tail), which heads an address dependency
 *
 * p,*,* -> n,*,* ; prev = xchg(lock, node)
 */
static __always_inline u32 xchg_tail(struct qspinlock *lock, u32 tail)
{
	/*
	 * We can use relaxed semantics since the caller ensures that the
	 * MCS node is properly initialized before updating the tail.
	 */
	return (u32)xchg_relaxed(&lock->tail,
				 tail >> _Q_TAIL_OFFSET) << _Q_TAIL_OFFSET;
}

#else /* _Q_PENDING_BITS == 8 */

/**
 * clear_pending - clear the pending bit.
 * @lock: Pointer to queued spinlock structure
 *
 * *,1,* -> *,0,*
 */
static __always_inline void clear_pending(struct qspinlock *lock)
{
	atomic_andnot(_Q_PENDING_VAL, &lock->val);
}

/**
 * clear_pending_set_locked - take ownership and clear the pending bit.
 * @lock: Pointer to queued spinlock structure
 *
 * *,1,0 -> *,0,1
 */
static __always_inline void clear_pending_set_locked(struct qspinlock *lock)
{
	atomic_add(-_Q_PENDING_VAL + _Q_LOCKED_VAL, &lock->val);
}

/**
 * xchg_tail - Put in the new queue tail code word & retrieve previous one
 * @lock : Pointer to queued spinlock structure
 * @tail : The new queue tail code word
 * Return: The previous queue tail code word
 *
 * xchg(lock, tail)
 *
 * p,*,* -> n,*,* ; prev = xchg(lock, node)
 */
static __always_inline u32 xchg_tail(struct qspinlock *lock, u32 tail)
{
	u32 old, new;

	old = atomic_read(&lock->val);
	do {
		new = (old & _Q_LOCKED_PENDING_MASK) | tail;
		/*
		 * We can use relaxed semantics since the caller ensures that
		 * the MCS node is properly initialized before updating the
		 * tail.
		 */
	} while (!atomic_try_cmpxchg_relaxed(&lock->val, &old, new));

	return old;
}
#endif /* _Q_PENDING_BITS == 8 */
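
/*
 * For illustration: "heads an address dependency" in the _Q_PENDING_BITS == 8
 * variant above refers to the way a slow path consumes the return value,
 * roughly as in queued_spin_lock_slowpath() (prev, node and qnodes are the
 * caller's own data):
 *
 *	old = xchg_tail(lock, tail);
 *	if (old & _Q_TAIL_MASK) {
 *		prev = decode_tail(old, qnodes);
 *		WRITE_ONCE(prev->next, node);
 *	}
 *
 * The previous tail code word is decoded into a node pointer whose
 * subsequent accesses depend on the value returned by the xchg.
 */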

/**
 * queued_fetch_set_pending_acquire - fetch the whole lock value and set pending
 * @lock : Pointer to queued spinlock structure
 * Return: The previous lock value
 *
 * *,*,* -> *,1,*
 */
#ifndef queued_fetch_set_pending_acquire
static __always_inline u32 queued_fetch_set_pending_acquire(struct qspinlock *lock)
{
	return atomic_fetch_or_acquire(_Q_PENDING_VAL, &lock->val);
}
#endif
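
/*
 * For illustration: a slow path typically uses this for the 0,0,* -> 0,1,*
 * transition and, on observing contention, undoes its own pending bit and
 * queues instead, roughly as in queued_spin_lock_slowpath():
 *
 *	val = queued_fetch_set_pending_acquire(lock);
 *	if (unlikely(val & ~_Q_LOCKED_MASK)) {
 *		if (!(val & _Q_PENDING_MASK))
 *			clear_pending(lock);
 *		goto queue;
 *	}
 */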

/**
 * set_locked - Set the lock bit and own the lock
 * @lock: Pointer to queued spinlock structure
 *
 * *,*,0 -> *,0,1
 */
static __always_inline void set_locked(struct qspinlock *lock)
{
	WRITE_ONCE(lock->locked, _Q_LOCKED_VAL);
}
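
/*
 * For illustration: this is a plain store to the locked byte only. In
 * queued_spin_lock_slowpath() the queue head first waits for both the locked
 * and pending bits to clear, then either grabs the lock and clears the tail
 * in one go (uncontended) or merely sets the locked byte (contended),
 * roughly:
 *
 *	val = atomic_cond_read_acquire(&lock->val,
 *				       !(VAL & _Q_LOCKED_PENDING_MASK));
 *	if ((val & _Q_TAIL_MASK) == tail &&
 *	    atomic_try_cmpxchg_relaxed(&lock->val, &val, _Q_LOCKED_VAL))
 *		goto release;
 *	set_locked(lock);
 */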

#endif /* __LINUX_QSPINLOCK_H */