wfstack: implement mutex-free wfstack with transparent union
[urcu.git] / urcu / static / wfstack.h
CommitLineData
edac6b69
MD
1#ifndef _URCU_STATIC_WFSTACK_H
2#define _URCU_STATIC_WFSTACK_H
294d3396
MD
3
4/*
edac6b69 5 * urcu/static/wfstack.h
294d3396 6 *
edac6b69 7 * Userspace RCU library - Stack with with wait-free push, blocking traversal.
294d3396 8 *
07c2a4fd
MD
9 * TO BE INCLUDED ONLY IN LGPL-COMPATIBLE CODE. See urcu/wfstack.h for
10 * linking dynamically with the userspace rcu library.
294d3396 11 *
a03a0f42 12 * Copyright 2010-2012 - Mathieu Desnoyers <mathieu.desnoyers@efficios.com>
294d3396
MD
13 *
14 * This library is free software; you can redistribute it and/or
15 * modify it under the terms of the GNU Lesser General Public
16 * License as published by the Free Software Foundation; either
17 * version 2.1 of the License, or (at your option) any later version.
18 *
19 * This library is distributed in the hope that it will be useful,
20 * but WITHOUT ANY WARRANTY; without even the implied warranty of
21 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
22 * Lesser General Public License for more details.
23 *
24 * You should have received a copy of the GNU Lesser General Public
25 * License along with this library; if not, write to the Free Software
26 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
27 */
28
29#include <pthread.h>
30#include <assert.h>
b57aee66 31#include <poll.h>
edac6b69 32#include <stdbool.h>
294d3396 33#include <urcu/compiler.h>
a2e7bf9c 34#include <urcu/uatomic.h>
294d3396
MD
35
36#ifdef __cplusplus
37extern "C" {
38#endif
39
edac6b69 40#define CDS_WFS_END ((void *) 0x1UL)
16aa9ee8
DG
41#define CDS_WFS_ADAPT_ATTEMPTS 10 /* Retry if being set */
42#define CDS_WFS_WAIT 10 /* Wait 10 ms if being set */
294d3396 43
edac6b69
MD
44/*
45 * Stack with wait-free push, blocking traversal.
46 *
47 * Stack implementing push, pop, pop_all operations, as well as iterator
48 * on the stack head returned by pop_all.
49 *
c97c6ce5
MD
50 * Wait-free operations: cds_wfs_push, __cds_wfs_pop_all, cds_wfs_empty,
51 * cds_wfs_first.
52 * Blocking operations: cds_wfs_pop, cds_wfs_pop_all, cds_wfs_next,
53 * iteration on stack head returned by pop_all.
edac6b69
MD
54 *
55 * Synchronization table:
56 *
57 * External synchronization techniques described in the API below is
58 * required between pairs marked with "X". No external synchronization
59 * required between pairs marked with "-".
60 *
61 * cds_wfs_push __cds_wfs_pop __cds_wfs_pop_all
62 * cds_wfs_push - - -
63 * __cds_wfs_pop - X X
64 * __cds_wfs_pop_all - X -
65 *
66 * cds_wfs_pop and cds_wfs_pop_all use an internal mutex to provide
67 * synchronization.
68 */
69
70/*
71 * cds_wfs_node_init: initialize wait-free stack node.
72 */
756a0322 73static inline
16aa9ee8 74void _cds_wfs_node_init(struct cds_wfs_node *node)
294d3396
MD
75{
76 node->next = NULL;
77}
78
718eb63e
EW
79/*
80 * __cds_wfs_init: initialize wait-free stack.
81 */
82static inline void ___cds_wfs_init(struct __cds_wfs_stack *s)
83{
84 s->head = CDS_WFS_END;
85}
86
edac6b69
MD
87/*
88 * cds_wfs_init: initialize wait-free stack.
89 */
756a0322 90static inline
16aa9ee8 91void _cds_wfs_init(struct cds_wfs_stack *s)
294d3396
MD
92{
93 int ret;
94
edac6b69 95 s->head = CDS_WFS_END;
294d3396
MD
96 ret = pthread_mutex_init(&s->lock, NULL);
97 assert(!ret);
98}
99
edac6b69
MD
100static inline bool ___cds_wfs_end(void *node)
101{
102 return node == CDS_WFS_END;
103}
104
191098fc 105/*
edac6b69
MD
106 * cds_wfs_empty: return whether wait-free stack is empty.
107 *
108 * No memory barrier is issued. No mutual exclusion is required.
109 */
718eb63e 110static inline bool _cds_wfs_empty(cds_wfs_stack_ptr_t u_stack)
edac6b69 111{
718eb63e
EW
112 struct __cds_wfs_stack *s = u_stack._s;
113
edac6b69
MD
114 return ___cds_wfs_end(CMM_LOAD_SHARED(s->head));
115}
116
117/*
118 * cds_wfs_push: push a node into the stack.
119 *
120 * Issues a full memory barrier before push. No mutual exclusion is
121 * required.
122 *
123 * Returns 0 if the stack was empty prior to adding the node.
124 * Returns non-zero otherwise.
191098fc 125 */
756a0322 126static inline
718eb63e 127int _cds_wfs_push(cds_wfs_stack_ptr_t u_stack, struct cds_wfs_node *node)
294d3396 128{
718eb63e 129 struct __cds_wfs_stack *s = u_stack._s;
edac6b69 130 struct cds_wfs_head *old_head, *new_head;
294d3396
MD
131
132 assert(node->next == NULL);
edac6b69 133 new_head = caa_container_of(node, struct cds_wfs_head, node);
294d3396 134 /*
edac6b69
MD
135 * uatomic_xchg() implicit memory barrier orders earlier stores
136 * to node (setting it to NULL) before publication.
294d3396 137 */
edac6b69 138 old_head = uatomic_xchg(&s->head, new_head);
294d3396 139 /*
edac6b69
MD
140 * At this point, dequeuers see a NULL node->next, they should
141 * busy-wait until node->next is set to old_head.
294d3396 142 */
edac6b69
MD
143 CMM_STORE_SHARED(node->next, &old_head->node);
144 return !___cds_wfs_end(old_head);
294d3396
MD
145}
146
147/*
edac6b69 148 * Waiting for push to complete enqueue and return the next node.
294d3396 149 */
edac6b69 150static inline struct cds_wfs_node *
af67624d 151___cds_wfs_node_sync_next(struct cds_wfs_node *node, int blocking)
294d3396 152{
edac6b69 153 struct cds_wfs_node *next;
294d3396
MD
154 int attempt = 0;
155
294d3396
MD
156 /*
157 * Adaptative busy-looping waiting for push to complete.
158 */
edac6b69 159 while ((next = CMM_LOAD_SHARED(node->next)) == NULL) {
af67624d
MD
160 if (!blocking)
161 return CDS_WFS_WOULDBLOCK;
16aa9ee8
DG
162 if (++attempt >= CDS_WFS_ADAPT_ATTEMPTS) {
163 poll(NULL, 0, CDS_WFS_WAIT); /* Wait for 10ms */
294d3396 164 attempt = 0;
edac6b69 165 } else {
06f22bdb 166 caa_cpu_relax();
edac6b69 167 }
294d3396 168 }
edac6b69
MD
169
170 return next;
294d3396
MD
171}
172
af67624d
MD
173static inline
174struct cds_wfs_node *
c8975b94 175___cds_wfs_pop(struct cds_wfs_stack *s, int *state, int blocking)
af67624d
MD
176{
177 struct cds_wfs_head *head, *new_head;
178 struct cds_wfs_node *next;
179
c8975b94
MD
180 if (state)
181 *state = 0;
af67624d
MD
182 for (;;) {
183 head = CMM_LOAD_SHARED(s->head);
c8975b94 184 if (___cds_wfs_end(head)) {
af67624d 185 return NULL;
c8975b94 186 }
af67624d 187 next = ___cds_wfs_node_sync_next(&head->node, blocking);
c8975b94 188 if (!blocking && next == CDS_WFS_WOULDBLOCK) {
af67624d 189 return CDS_WFS_WOULDBLOCK;
c8975b94 190 }
af67624d 191 new_head = caa_container_of(next, struct cds_wfs_head, node);
c8975b94
MD
192 if (uatomic_cmpxchg(&s->head, head, new_head) == head) {
193 if (state && ___cds_wfs_end(new_head))
194 *state |= CDS_WFS_STATE_LAST;
af67624d 195 return &head->node;
c8975b94
MD
196 }
197 if (!blocking) {
af67624d 198 return CDS_WFS_WOULDBLOCK;
c8975b94 199 }
af67624d
MD
200 /* busy-loop if head changed under us */
201 }
202}
203
edac6b69 204/*
c8975b94 205 * __cds_wfs_pop_with_state_blocking: pop a node from the stack, with state.
edac6b69
MD
206 *
207 * Returns NULL if stack is empty.
208 *
209 * __cds_wfs_pop_blocking needs to be synchronized using one of the
210 * following techniques:
211 *
212 * 1) Calling __cds_wfs_pop_blocking under rcu read lock critical
213 * section. The caller must wait for a grace period to pass before
214 * freeing the returned node or modifying the cds_wfs_node structure.
215 * 2) Using mutual exclusion (e.g. mutexes) to protect
216 * __cds_wfs_pop_blocking and __cds_wfs_pop_all callers.
217 * 3) Ensuring that only ONE thread can call __cds_wfs_pop_blocking()
218 * and __cds_wfs_pop_all(). (multi-provider/single-consumer scheme).
c8975b94
MD
219 *
220 * "state" saves state flags atomically sampled with pop operation.
edac6b69 221 */
c8975b94
MD
222static inline
223struct cds_wfs_node *
224___cds_wfs_pop_with_state_blocking(struct cds_wfs_stack *s, int *state)
225{
226 return ___cds_wfs_pop(s, state, 1);
227}
228
756a0322 229static inline
16aa9ee8 230struct cds_wfs_node *
edac6b69
MD
231___cds_wfs_pop_blocking(struct cds_wfs_stack *s)
232{
c8975b94
MD
233 return ___cds_wfs_pop_with_state_blocking(s, NULL);
234}
235
236/*
237 * __cds_wfs_pop_with_state_nonblocking: pop a node from the stack.
238 *
239 * Same as __cds_wfs_pop_with_state_blocking, but returns
240 * CDS_WFS_WOULDBLOCK if it needs to block.
241 *
242 * "state" saves state flags atomically sampled with pop operation.
243 */
244static inline
245struct cds_wfs_node *
246___cds_wfs_pop_with_state_nonblocking(struct cds_wfs_stack *s, int *state)
247{
248 return ___cds_wfs_pop(s, state, 0);
af67624d 249}
edac6b69 250
af67624d
MD
251/*
252 * __cds_wfs_pop_nonblocking: pop a node from the stack.
253 *
254 * Same as __cds_wfs_pop_blocking, but returns CDS_WFS_WOULDBLOCK if
255 * it needs to block.
256 */
257static inline
258struct cds_wfs_node *
259___cds_wfs_pop_nonblocking(struct cds_wfs_stack *s)
260{
c8975b94 261 return ___cds_wfs_pop_with_state_nonblocking(s, NULL);
edac6b69
MD
262}
263
264/*
265 * __cds_wfs_pop_all: pop all nodes from a stack.
266 *
267 * __cds_wfs_pop_all does not require any synchronization with other
268 * push, nor with other __cds_wfs_pop_all, but requires synchronization
269 * matching the technique used to synchronize __cds_wfs_pop_blocking:
270 *
271 * 1) If __cds_wfs_pop_blocking is called under rcu read lock critical
272 * section, both __cds_wfs_pop_blocking and cds_wfs_pop_all callers
273 * must wait for a grace period to pass before freeing the returned
274 * node or modifying the cds_wfs_node structure. However, no RCU
275 * read-side critical section is needed around __cds_wfs_pop_all.
276 * 2) Using mutual exclusion (e.g. mutexes) to protect
277 * __cds_wfs_pop_blocking and __cds_wfs_pop_all callers.
278 * 3) Ensuring that only ONE thread can call __cds_wfs_pop_blocking()
279 * and __cds_wfs_pop_all(). (multi-provider/single-consumer scheme).
280 */
281static inline
282struct cds_wfs_head *
718eb63e 283___cds_wfs_pop_all(cds_wfs_stack_ptr_t u_stack)
edac6b69 284{
718eb63e 285 struct __cds_wfs_stack *s = u_stack._s;
edac6b69
MD
286 struct cds_wfs_head *head;
287
288 /*
289 * Implicit memory barrier after uatomic_xchg() matches implicit
290 * memory barrier before uatomic_xchg() in cds_wfs_push. It
291 * ensures that all nodes of the returned list are consistent.
292 * There is no need to issue memory barriers when iterating on
293 * the returned list, because the full memory barrier issued
294 * prior to each uatomic_cmpxchg, which each write to head, are
295 * taking care to order writes to each node prior to the full
296 * memory barrier after this uatomic_xchg().
297 */
298 head = uatomic_xchg(&s->head, CDS_WFS_END);
299 if (___cds_wfs_end(head))
300 return NULL;
301 return head;
302}
303
304/*
305 * cds_wfs_pop_lock: lock stack pop-protection mutex.
306 */
307static inline void _cds_wfs_pop_lock(struct cds_wfs_stack *s)
294d3396 308{
294d3396
MD
309 int ret;
310
311 ret = pthread_mutex_lock(&s->lock);
312 assert(!ret);
edac6b69
MD
313}
314
315/*
316 * cds_wfs_pop_unlock: unlock stack pop-protection mutex.
317 */
318static inline void _cds_wfs_pop_unlock(struct cds_wfs_stack *s)
319{
320 int ret;
321
294d3396
MD
322 ret = pthread_mutex_unlock(&s->lock);
323 assert(!ret);
edac6b69
MD
324}
325
326/*
c8975b94 327 * Call __cds_wfs_pop_with_state_blocking with an internal pop mutex held.
edac6b69
MD
328 */
329static inline
330struct cds_wfs_node *
c8975b94 331_cds_wfs_pop_with_state_blocking(struct cds_wfs_stack *s, int *state)
edac6b69
MD
332{
333 struct cds_wfs_node *retnode;
334
335 _cds_wfs_pop_lock(s);
c8975b94 336 retnode = ___cds_wfs_pop_with_state_blocking(s, state);
edac6b69 337 _cds_wfs_pop_unlock(s);
294d3396
MD
338 return retnode;
339}
340
c8975b94
MD
341/*
342 * Call _cds_wfs_pop_with_state_blocking without saving any state.
343 */
344static inline
345struct cds_wfs_node *
346_cds_wfs_pop_blocking(struct cds_wfs_stack *s)
347{
348 return _cds_wfs_pop_with_state_blocking(s, NULL);
349}
350
edac6b69
MD
351/*
352 * Call __cds_wfs_pop_all with an internal pop mutex held.
353 */
354static inline
355struct cds_wfs_head *
356_cds_wfs_pop_all_blocking(struct cds_wfs_stack *s)
357{
358 struct cds_wfs_head *rethead;
359
360 _cds_wfs_pop_lock(s);
361 rethead = ___cds_wfs_pop_all(s);
362 _cds_wfs_pop_unlock(s);
363 return rethead;
364}
365
366/*
c7ba06ba 367 * cds_wfs_first: get first node of a popped stack.
edac6b69
MD
368 *
369 * Content written into the node before enqueue is guaranteed to be
370 * consistent, but no other memory ordering is ensured.
371 *
372 * Used by for-like iteration macros in urcu/wfstack.h:
373 * cds_wfs_for_each_blocking()
374 * cds_wfs_for_each_blocking_safe()
8af2956c
MD
375 *
376 * Returns NULL if popped stack is empty, top stack node otherwise.
edac6b69
MD
377 */
378static inline struct cds_wfs_node *
c7ba06ba 379_cds_wfs_first(struct cds_wfs_head *head)
edac6b69
MD
380{
381 if (___cds_wfs_end(head))
382 return NULL;
383 return &head->node;
384}
385
af67624d
MD
386static inline struct cds_wfs_node *
387___cds_wfs_next(struct cds_wfs_node *node, int blocking)
388{
389 struct cds_wfs_node *next;
390
391 next = ___cds_wfs_node_sync_next(node, blocking);
392 /*
393 * CDS_WFS_WOULDBLOCK != CSD_WFS_END, so we can check for end
394 * even if ___cds_wfs_node_sync_next returns CDS_WFS_WOULDBLOCK,
395 * and still return CDS_WFS_WOULDBLOCK.
396 */
397 if (___cds_wfs_end(next))
398 return NULL;
399 return next;
400}
401
edac6b69
MD
402/*
403 * cds_wfs_next_blocking: get next node of a popped stack.
404 *
405 * Content written into the node before enqueue is guaranteed to be
406 * consistent, but no other memory ordering is ensured.
407 *
408 * Used by for-like iteration macros in urcu/wfstack.h:
409 * cds_wfs_for_each_blocking()
410 * cds_wfs_for_each_blocking_safe()
8af2956c
MD
411 *
412 * Returns NULL if reached end of popped stack, non-NULL next stack
413 * node otherwise.
edac6b69
MD
414 */
415static inline struct cds_wfs_node *
416_cds_wfs_next_blocking(struct cds_wfs_node *node)
417{
af67624d
MD
418 return ___cds_wfs_next(node, 1);
419}
edac6b69 420
af67624d
MD
421
422/*
423 * cds_wfs_next_nonblocking: get next node of a popped stack.
424 *
425 * Same as cds_wfs_next_blocking, but returns CDS_WFS_WOULDBLOCK if it
426 * needs to block.
427 */
428static inline struct cds_wfs_node *
429_cds_wfs_next_nonblocking(struct cds_wfs_node *node)
430{
431 return ___cds_wfs_next(node, 0);
edac6b69
MD
432}
433
294d3396
MD
434#ifdef __cplusplus
435}
436#endif
437
edac6b69 438#endif /* _URCU_STATIC_WFSTACK_H */
This page took 0.046065 seconds and 4 git commands to generate.