Version 0.9.5
[userspace-rcu.git] / urcu-bp.c
CommitLineData
fdee2e6d
MD
1/*
2 * urcu-bp.c
3 *
4 * Userspace RCU library, "bulletproof" version.
5 *
6982d6d7 6 * Copyright (c) 2009 Mathieu Desnoyers <mathieu.desnoyers@efficios.com>
fdee2e6d
MD
7 * Copyright (c) 2009 Paul E. McKenney, IBM Corporation.
8 *
9 * This library is free software; you can redistribute it and/or
10 * modify it under the terms of the GNU Lesser General Public
11 * License as published by the Free Software Foundation; either
12 * version 2.1 of the License, or (at your option) any later version.
13 *
14 * This library is distributed in the hope that it will be useful,
15 * but WITHOUT ANY WARRANTY; without even the implied warranty of
16 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
17 * Lesser General Public License for more details.
18 *
19 * You should have received a copy of the GNU Lesser General Public
20 * License along with this library; if not, write to the Free Software
21 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
22 *
23 * IBM's contributions to this file may be relicensed under LGPLv2 or later.
24 */
25
0617bf4c 26#define _GNU_SOURCE
71c811bf 27#define _LGPL_SOURCE
fdee2e6d
MD
28#include <stdio.h>
29#include <pthread.h>
30#include <signal.h>
31#include <assert.h>
32#include <stdlib.h>
33#include <string.h>
34#include <errno.h>
35#include <poll.h>
36#include <unistd.h>
37#include <sys/mman.h>
38
999991c6 39#include "urcu/arch.h"
d73fb81f 40#include "urcu/wfcqueue.h"
57760d44 41#include "urcu/map/urcu-bp.h"
af7c2dbe 42#include "urcu/static/urcu-bp.h"
618b2595 43#include "urcu-pointer.h"
bd252a04 44#include "urcu/tls-compat.h"
71c811bf 45
4a6d7378
MD
46#include "urcu-die.h"
47
fdee2e6d 48/* Do not #define _LGPL_SOURCE to ensure we can emit the wrapper symbols */
71c811bf 49#undef _LGPL_SOURCE
fdee2e6d 50#include "urcu-bp.h"
71c811bf 51#define _LGPL_SOURCE
fdee2e6d 52
4c1ae2ea
MD
53#ifndef MAP_ANONYMOUS
54#define MAP_ANONYMOUS MAP_ANON
55#endif
56
c7eaf61c
MD
#if defined(__linux__)
/*
 * Linux: forward the request unchanged to mremap(2).
 * Returns whatever mremap() returns (MAP_FAILED on error).
 */
static void *mremap_wrapper(void *old_address, size_t old_size,
		size_t new_size, int flags)
{
	return mremap(old_address, old_size, new_size, flags);
}
#else /* !__linux__ */

#define MREMAP_MAYMOVE	1
#define MREMAP_FIXED	2

/*
 * Non-Linux stand-in for mremap(): in-place growth is never attempted,
 * so the call always reports MAP_FAILED. Callers must not ask for
 * MREMAP_MAYMOVE (checked with assert()). This is not a generic
 * mremap() replacement.
 */
static void *mremap_wrapper(void *old_address, size_t old_size,
		size_t new_size, int flags)
{
	assert((flags & MREMAP_MAYMOVE) == 0);

	return MAP_FAILED;
}
#endif /* !__linux__ */
82
9340c38d
MD
/* Delay, in ms, passed to poll() by wait_for_readers() once it stops spinning. */
#define RCU_SLEEP_DELAY_MS	10
/* Number of reader slots the first arena chunk is sized for. */
#define INIT_NR_THREADS		8
/*
 * Size in bytes of the first arena chunk: one chunk header followed by
 * INIT_NR_THREADS reader slots. The expansion is parenthesized so the
 * macro behaves as a single operand in any expression.
 */
#define ARENA_INIT_ALLOC			\
	(sizeof(struct registry_chunk)		\
	+ INIT_NR_THREADS * sizeof(struct rcu_reader))

/*
 * Number of registry scans wait_for_readers() performs with
 * caa_cpu_relax() between them before it switches to sleeping in poll().
 */
#define RCU_QS_ACTIVE_ATTEMPTS	100
94
76d6a951
MD
/*
 * Reference count on the library state: incremented by rcu_bp_init()
 * and decremented by rcu_bp_exit(), both with init_lock held.
 */
static int rcu_bp_refcount;
97
999991c6
MD
/*
 * membarrier() front-end. When the headers expose __NR_membarrier the
 * call goes through syscall(); otherwise the macro evaluates to
 * (-ENOSYS) without evaluating its arguments, and callers fall back on
 * cmm_smp_mb(). The fallback value is parenthesized so it is a single
 * operand wherever the macro is used.
 */
#ifdef __NR_membarrier
# define membarrier(...)	syscall(__NR_membarrier, __VA_ARGS__)
#else
# define membarrier(...)	(-ENOSYS)
#endif

/* Command values passed as first argument to membarrier(). */
enum membarrier_cmd {
	MEMBARRIER_CMD_QUERY = 0,
	MEMBARRIER_CMD_SHARED = (1 << 0),
};
109
c1be8fb9
MD
/*
 * Library set-up and tear-down hooks, run as constructor and
 * destructor. Both are defined near the end of this file.
 */
static void rcu_bp_init(void) __attribute__((constructor));
static void rcu_bp_exit(void) __attribute__((destructor));

/*
 * When non-zero, smp_mb_master() issues membarrier() instead of
 * cmm_smp_mb(). Nothing in this file sets it, so it keeps its initial
 * value of zero.
 */
int urcu_bp_has_sys_membarrier;
116
731ccb96
MD
/*
 * rcu_gp_lock serializes the threads that call synchronize_rcu().
 */
static pthread_mutex_t rcu_gp_lock = PTHREAD_MUTEX_INITIALIZER;

/*
 * rcu_registry_lock serializes registration and unregistration of
 * reader threads, and excludes them from the registry scans performed
 * by synchronize_rcu(). It is not held continuously for the whole
 * grace period: wait_for_readers() drops it between scans and takes it
 * again.
 *
 * Lock order: rcu_registry_lock may nest inside rcu_gp_lock.
 */
static pthread_mutex_t rcu_registry_lock = PTHREAD_MUTEX_INITIALIZER;
fdee2e6d 132
c1be8fb9
MD
133static pthread_mutex_t init_lock = PTHREAD_MUTEX_INITIALIZER;
134static int initialized;
135
136static pthread_key_t urcu_bp_key;
137
c13c2e55 138struct rcu_gp rcu_gp = { .ctr = RCU_GP_COUNT };
fdee2e6d
MD
139
140/*
141 * Pointer to registry elements. Written to only by each individual reader. Read
142 * by both the reader and the writers.
143 */
bd252a04 144DEFINE_URCU_TLS(struct rcu_reader *, rcu_reader);
fdee2e6d 145
16aa9ee8 146static CDS_LIST_HEAD(registry);
fdee2e6d 147
95b94246
MD
148struct registry_chunk {
149 size_t data_len; /* data length */
c1be8fb9 150 size_t used; /* amount of data used */
95b94246
MD
151 struct cds_list_head node; /* chunk_list node */
152 char data[];
153};
154
fdee2e6d 155struct registry_arena {
95b94246 156 struct cds_list_head chunk_list;
fdee2e6d
MD
157};
158
95b94246
MD
159static struct registry_arena registry_arena = {
160 .chunk_list = CDS_LIST_HEAD_INIT(registry_arena.chunk_list),
161};
fdee2e6d 162
4cf1675f
MD
163/* Saved fork signal mask, protected by rcu_gp_lock */
164static sigset_t saved_fork_signal_mask;
165
/*
 * Acquire @mutex, reporting any error through urcu_die().
 *
 * By default this is a plain pthread_mutex_lock(). When
 * DISTRUST_SIGNALS_EXTREME is defined, the mutex is polled with
 * pthread_mutex_trylock() instead, sleeping 10 ms in poll() after each
 * EBUSY or EINTR result.
 */
static void mutex_lock(pthread_mutex_t *mutex)
{
#ifndef DISTRUST_SIGNALS_EXTREME
	int err = pthread_mutex_lock(mutex);

	if (err != 0)
		urcu_die(err);
#else /* #ifndef DISTRUST_SIGNALS_EXTREME */
	for (;;) {
		int err = pthread_mutex_trylock(mutex);

		if (err == 0)
			break;
		if (err != EBUSY && err != EINTR)
			urcu_die(err);
		poll(NULL, 0, 10);
	}
#endif /* #else #ifndef DISTRUST_SIGNALS_EXTREME */
}
182
/* Release @mutex, reporting any error through urcu_die(). */
static void mutex_unlock(pthread_mutex_t *mutex)
{
	int err = pthread_mutex_unlock(mutex);

	if (err != 0)
		urcu_die(err);
}
191
f541831e
MD
192static void smp_mb_master(void)
193{
194 if (caa_likely(urcu_bp_has_sys_membarrier))
195 (void) membarrier(MEMBARRIER_CMD_SHARED, 0);
196 else
197 cmm_smp_mb();
198}
199
731ccb96
MD
200/*
201 * Always called with rcu_registry lock held. Releases this lock between
202 * iterations and grabs it again. Holds the lock when it returns.
203 */
52c75091
MD
204static void wait_for_readers(struct cds_list_head *input_readers,
205 struct cds_list_head *cur_snap_readers,
206 struct cds_list_head *qsreaders)
fdee2e6d 207{
9340c38d 208 unsigned int wait_loops = 0;
02be5561 209 struct rcu_reader *index, *tmp;
fdee2e6d 210
fdee2e6d 211 /*
dd61d077
MD
212 * Wait for each thread URCU_TLS(rcu_reader).ctr to either
213 * indicate quiescence (not nested), or observe the current
c13c2e55 214 * rcu_gp.ctr value.
fdee2e6d
MD
215 */
216 for (;;) {
9340c38d
MD
217 if (wait_loops < RCU_QS_ACTIVE_ATTEMPTS)
218 wait_loops++;
219
52c75091
MD
220 cds_list_for_each_entry_safe(index, tmp, input_readers, node) {
221 switch (rcu_reader_state(&index->ctr)) {
222 case RCU_READER_ACTIVE_CURRENT:
223 if (cur_snap_readers) {
224 cds_list_move(&index->node,
225 cur_snap_readers);
226 break;
227 }
228 /* Fall-through */
229 case RCU_READER_INACTIVE:
230 cds_list_move(&index->node, qsreaders);
231 break;
232 case RCU_READER_ACTIVE_OLD:
233 /*
234 * Old snapshot. Leaving node in
235 * input_readers will make us busy-loop
236 * until the snapshot becomes current or
237 * the reader becomes inactive.
238 */
239 break;
240 }
fdee2e6d
MD
241 }
242
52c75091 243 if (cds_list_empty(input_readers)) {
fdee2e6d
MD
244 break;
245 } else {
731ccb96
MD
246 /* Temporarily unlock the registry lock. */
247 mutex_unlock(&rcu_registry_lock);
9340c38d
MD
248 if (wait_loops >= RCU_QS_ACTIVE_ATTEMPTS)
249 (void) poll(NULL, 0, RCU_SLEEP_DELAY_MS);
fdee2e6d 250 else
06f22bdb 251 caa_cpu_relax();
731ccb96
MD
252 /* Re-lock the registry lock before the next loop. */
253 mutex_lock(&rcu_registry_lock);
fdee2e6d
MD
254 }
255 }
fdee2e6d
MD
256}
257
258void synchronize_rcu(void)
259{
52c75091
MD
260 CDS_LIST_HEAD(cur_snap_readers);
261 CDS_LIST_HEAD(qsreaders);
fdee2e6d
MD
262 sigset_t newmask, oldmask;
263 int ret;
264
6ed4b2e6 265 ret = sigfillset(&newmask);
fdee2e6d 266 assert(!ret);
6ed4b2e6 267 ret = pthread_sigmask(SIG_BLOCK, &newmask, &oldmask);
fdee2e6d
MD
268 assert(!ret);
269
6abb4bd5 270 mutex_lock(&rcu_gp_lock);
fdee2e6d 271
731ccb96
MD
272 mutex_lock(&rcu_registry_lock);
273
16aa9ee8 274 if (cds_list_empty(&registry))
2dfb8b5e 275 goto out;
fdee2e6d
MD
276
277 /* All threads should read qparity before accessing data structure
2dfb8b5e 278 * where new ptr points to. */
fdee2e6d 279 /* Write new ptr before changing the qparity */
f541831e 280 smp_mb_master();
fdee2e6d 281
fdee2e6d 282 /*
dd61d077 283 * Wait for readers to observe original parity or be quiescent.
731ccb96
MD
284 * wait_for_readers() can release and grab again rcu_registry_lock
285 * interally.
dd61d077 286 */
52c75091 287 wait_for_readers(&registry, &cur_snap_readers, &qsreaders);
dd61d077
MD
288
289 /*
290 * Adding a cmm_smp_mb() which is _not_ formally required, but makes the
291 * model easier to understand. It does not have a big performance impact
292 * anyway, given this is the write-side.
293 */
294 cmm_smp_mb();
295
296 /* Switch parity: 0 -> 1, 1 -> 0 */
c13c2e55 297 CMM_STORE_SHARED(rcu_gp.ctr, rcu_gp.ctr ^ RCU_GP_CTR_PHASE);
dd61d077
MD
298
299 /*
300 * Must commit qparity update to memory before waiting for other parity
301 * quiescent state. Failure to do so could result in the writer waiting
302 * forever while new readers are always accessing data (no progress).
303 * Ensured by CMM_STORE_SHARED and CMM_LOAD_SHARED.
fdee2e6d 304 */
fdee2e6d
MD
305
306 /*
5481ddb3 307 * Adding a cmm_smp_mb() which is _not_ formally required, but makes the
fdee2e6d
MD
308 * model easier to understand. It does not have a big performance impact
309 * anyway, given this is the write-side.
310 */
5481ddb3 311 cmm_smp_mb();
fdee2e6d 312
fdee2e6d 313 /*
dd61d077 314 * Wait for readers to observe new parity or be quiescent.
731ccb96
MD
315 * wait_for_readers() can release and grab again rcu_registry_lock
316 * interally.
fdee2e6d 317 */
52c75091
MD
318 wait_for_readers(&cur_snap_readers, NULL, &qsreaders);
319
320 /*
321 * Put quiescent reader list back into registry.
322 */
323 cds_list_splice(&qsreaders, &registry);
fdee2e6d
MD
324
325 /*
2dfb8b5e
MD
326 * Finish waiting for reader threads before letting the old ptr being
327 * freed.
fdee2e6d 328 */
f541831e 329 smp_mb_master();
2dfb8b5e 330out:
731ccb96 331 mutex_unlock(&rcu_registry_lock);
6abb4bd5 332 mutex_unlock(&rcu_gp_lock);
fdee2e6d
MD
333 ret = pthread_sigmask(SIG_SETMASK, &oldmask, NULL);
334 assert(!ret);
335}
336
337/*
338 * library wrappers to be used by non-LGPL compatible source code.
339 */
340
/* Out-of-line entry point that forwards to _rcu_read_lock(). */
void rcu_read_lock(void)
{
	_rcu_read_lock();
}
345
/* Out-of-line entry point that forwards to _rcu_read_unlock(). */
void rcu_read_unlock(void)
{
	_rcu_read_unlock();
}
350
882f3357
MD
/*
 * Out-of-line entry point that forwards to _rcu_read_ongoing() and
 * returns its result unchanged.
 */
int rcu_read_ongoing(void)
{
	int ongoing = _rcu_read_ongoing();

	return ongoing;
}
355
fdee2e6d 356/*
95b94246
MD
357 * Only grow for now. If empty, allocate a ARENA_INIT_ALLOC sized chunk.
358 * Else, try expanding the last chunk. If this fails, allocate a new
359 * chunk twice as big as the last chunk.
360 * Memory used by chunks _never_ moves. A chunk could theoretically be
361 * freed when all "used" slots are released, but we don't do it at this
362 * point.
fdee2e6d 363 */
95b94246
MD
364static
365void expand_arena(struct registry_arena *arena)
fdee2e6d 366{
95b94246
MD
367 struct registry_chunk *new_chunk, *last_chunk;
368 size_t old_chunk_len, new_chunk_len;
369
370 /* No chunk. */
371 if (cds_list_empty(&arena->chunk_list)) {
372 assert(ARENA_INIT_ALLOC >=
373 sizeof(struct registry_chunk)
374 + sizeof(struct rcu_reader));
375 new_chunk_len = ARENA_INIT_ALLOC;
181ca7a6
MJ
376 new_chunk = (struct registry_chunk *) mmap(NULL,
377 new_chunk_len,
9d8612b7
MD
378 PROT_READ | PROT_WRITE,
379 MAP_ANONYMOUS | MAP_PRIVATE,
380 -1, 0);
95b94246
MD
381 if (new_chunk == MAP_FAILED)
382 abort();
d3ac5bb7 383 memset(new_chunk, 0, new_chunk_len);
95b94246
MD
384 new_chunk->data_len =
385 new_chunk_len - sizeof(struct registry_chunk);
386 cds_list_add_tail(&new_chunk->node, &arena->chunk_list);
387 return; /* We're done. */
388 }
9d8612b7 389
95b94246
MD
390 /* Try expanding last chunk. */
391 last_chunk = cds_list_entry(arena->chunk_list.prev,
392 struct registry_chunk, node);
393 old_chunk_len =
394 last_chunk->data_len + sizeof(struct registry_chunk);
395 new_chunk_len = old_chunk_len << 1;
396
397 /* Don't allow memory mapping to move, just expand. */
398 new_chunk = mremap_wrapper(last_chunk, old_chunk_len,
399 new_chunk_len, 0);
400 if (new_chunk != MAP_FAILED) {
401 /* Should not have moved. */
402 assert(new_chunk == last_chunk);
d3ac5bb7 403 memset((char *) last_chunk + old_chunk_len, 0,
95b94246
MD
404 new_chunk_len - old_chunk_len);
405 last_chunk->data_len =
406 new_chunk_len - sizeof(struct registry_chunk);
407 return; /* We're done. */
408 }
0617bf4c 409
95b94246 410 /* Remap did not succeed, we need to add a new chunk. */
181ca7a6
MJ
411 new_chunk = (struct registry_chunk *) mmap(NULL,
412 new_chunk_len,
95b94246
MD
413 PROT_READ | PROT_WRITE,
414 MAP_ANONYMOUS | MAP_PRIVATE,
415 -1, 0);
416 if (new_chunk == MAP_FAILED)
417 abort();
d3ac5bb7 418 memset(new_chunk, 0, new_chunk_len);
95b94246
MD
419 new_chunk->data_len =
420 new_chunk_len - sizeof(struct registry_chunk);
421 cds_list_add_tail(&new_chunk->node, &arena->chunk_list);
422}
fdee2e6d 423
95b94246
MD
424static
425struct rcu_reader *arena_alloc(struct registry_arena *arena)
426{
427 struct registry_chunk *chunk;
428 struct rcu_reader *rcu_reader_reg;
429 int expand_done = 0; /* Only allow to expand once per alloc */
430 size_t len = sizeof(struct rcu_reader);
431
432retry:
433 cds_list_for_each_entry(chunk, &arena->chunk_list, node) {
434 if (chunk->data_len - chunk->used < len)
435 continue;
436 /* Find spot */
437 for (rcu_reader_reg = (struct rcu_reader *) &chunk->data[0];
438 rcu_reader_reg < (struct rcu_reader *) &chunk->data[chunk->data_len];
439 rcu_reader_reg++) {
440 if (!rcu_reader_reg->alloc) {
441 rcu_reader_reg->alloc = 1;
442 chunk->used += len;
443 return rcu_reader_reg;
444 }
445 }
446 }
447
448 if (!expand_done) {
449 expand_arena(arena);
450 expand_done = 1;
451 goto retry;
452 }
453
454 return NULL;
fdee2e6d
MD
455}
456
457/* Called with signals off and mutex locked */
95b94246
MD
458static
459void add_thread(void)
fdee2e6d 460{
02be5561 461 struct rcu_reader *rcu_reader_reg;
c1be8fb9 462 int ret;
fdee2e6d 463
95b94246
MD
464 rcu_reader_reg = arena_alloc(&registry_arena);
465 if (!rcu_reader_reg)
466 abort();
c1be8fb9
MD
467 ret = pthread_setspecific(urcu_bp_key, rcu_reader_reg);
468 if (ret)
469 abort();
fdee2e6d
MD
470
471 /* Add to registry */
02be5561
MD
472 rcu_reader_reg->tid = pthread_self();
473 assert(rcu_reader_reg->ctr == 0);
16aa9ee8 474 cds_list_add(&rcu_reader_reg->node, &registry);
95b94246
MD
475 /*
476 * Reader threads are pointing to the reader registry. This is
477 * why its memory should never be relocated.
478 */
bd252a04 479 URCU_TLS(rcu_reader) = rcu_reader_reg;
fdee2e6d
MD
480}
481
c1be8fb9
MD
482/* Called with mutex locked */
483static
484void cleanup_thread(struct registry_chunk *chunk,
485 struct rcu_reader *rcu_reader_reg)
486{
487 rcu_reader_reg->ctr = 0;
488 cds_list_del(&rcu_reader_reg->node);
489 rcu_reader_reg->tid = 0;
490 rcu_reader_reg->alloc = 0;
491 chunk->used -= sizeof(struct rcu_reader);
492}
493
494static
495struct registry_chunk *find_chunk(struct rcu_reader *rcu_reader_reg)
fdee2e6d 496{
95b94246 497 struct registry_chunk *chunk;
fdee2e6d 498
95b94246 499 cds_list_for_each_entry(chunk, &registry_arena.chunk_list, node) {
c1be8fb9
MD
500 if (rcu_reader_reg < (struct rcu_reader *) &chunk->data[0])
501 continue;
502 if (rcu_reader_reg >= (struct rcu_reader *) &chunk->data[chunk->data_len])
503 continue;
504 return chunk;
505 }
506 return NULL;
507}
95b94246 508
c1be8fb9
MD
509/* Called with signals off and mutex locked */
510static
76d6a951 511void remove_thread(struct rcu_reader *rcu_reader_reg)
c1be8fb9 512{
c1be8fb9
MD
513 cleanup_thread(find_chunk(rcu_reader_reg), rcu_reader_reg);
514 URCU_TLS(rcu_reader) = NULL;
fdee2e6d
MD
515}
516
517/* Disable signals, take mutex, add to registry */
518void rcu_bp_register(void)
519{
520 sigset_t newmask, oldmask;
521 int ret;
522
6ed4b2e6 523 ret = sigfillset(&newmask);
c1be8fb9
MD
524 if (ret)
525 abort();
6ed4b2e6 526 ret = pthread_sigmask(SIG_BLOCK, &newmask, &oldmask);
c1be8fb9
MD
527 if (ret)
528 abort();
fdee2e6d
MD
529
530 /*
531 * Check if a signal concurrently registered our thread since
c1be8fb9
MD
532 * the check in rcu_read_lock().
533 */
bd252a04 534 if (URCU_TLS(rcu_reader))
fdee2e6d
MD
535 goto end;
536
c1be8fb9
MD
537 /*
538 * Take care of early registration before urcu_bp constructor.
539 */
540 rcu_bp_init();
541
731ccb96 542 mutex_lock(&rcu_registry_lock);
fdee2e6d 543 add_thread();
731ccb96 544 mutex_unlock(&rcu_registry_lock);
fdee2e6d
MD
545end:
546 ret = pthread_sigmask(SIG_SETMASK, &oldmask, NULL);
c1be8fb9
MD
547 if (ret)
548 abort();
549}
550
551/* Disable signals, take mutex, remove from registry */
552static
76d6a951 553void rcu_bp_unregister(struct rcu_reader *rcu_reader_reg)
c1be8fb9
MD
554{
555 sigset_t newmask, oldmask;
556 int ret;
557
558 ret = sigfillset(&newmask);
559 if (ret)
560 abort();
561 ret = pthread_sigmask(SIG_BLOCK, &newmask, &oldmask);
562 if (ret)
563 abort();
564
731ccb96 565 mutex_lock(&rcu_registry_lock);
76d6a951 566 remove_thread(rcu_reader_reg);
731ccb96 567 mutex_unlock(&rcu_registry_lock);
c1be8fb9
MD
568 ret = pthread_sigmask(SIG_SETMASK, &oldmask, NULL);
569 if (ret)
570 abort();
76d6a951 571 rcu_bp_exit();
c1be8fb9
MD
572}
573
/*
 * Destructor installed on urcu_bp_key by rcu_bp_init(). @rcu_key is
 * the value stored for the thread by add_thread(), i.e. its registry
 * slot; the thread is removed from the registry.
 */
static
void urcu_bp_thread_exit_notifier(void *rcu_key)
{
	struct rcu_reader *slot = rcu_key;

	rcu_bp_unregister(slot);
}
583
d4dae7fc
MD
/*
 * Receives whether the membarrier system call is usable (@available
 * non-zero) and deliberately ignores it.
 *
 * membarrier has blocking behavior, which changes the application
 * behavior too much compared to using barriers when synchronize_rcu
 * is used repeatedly (without using call_rcu). Don't use membarrier
 * for now.
 */
static
void rcu_sys_membarrier_status(int available)
{
	(void) available;
}
594
c1be8fb9
MD
595static
596void rcu_bp_init(void)
597{
598 mutex_lock(&init_lock);
76d6a951 599 if (!rcu_bp_refcount++) {
c1be8fb9
MD
600 int ret;
601
602 ret = pthread_key_create(&urcu_bp_key,
603 urcu_bp_thread_exit_notifier);
604 if (ret)
605 abort();
f541831e 606 ret = membarrier(MEMBARRIER_CMD_QUERY, 0);
d4dae7fc
MD
607 rcu_sys_membarrier_status(ret >= 0
608 && (ret & MEMBARRIER_CMD_SHARED));
c1be8fb9
MD
609 initialized = 1;
610 }
611 mutex_unlock(&init_lock);
fdee2e6d
MD
612}
613
c1be8fb9 614static
9380711a 615void rcu_bp_exit(void)
fdee2e6d 616{
76d6a951
MD
617 mutex_lock(&init_lock);
618 if (!--rcu_bp_refcount) {
619 struct registry_chunk *chunk, *tmp;
620 int ret;
95b94246 621
76d6a951
MD
622 cds_list_for_each_entry_safe(chunk, tmp,
623 &registry_arena.chunk_list, node) {
181ca7a6 624 munmap((void *) chunk, chunk->data_len
76d6a951
MD
625 + sizeof(struct registry_chunk));
626 }
e44dd88a 627 CDS_INIT_LIST_HEAD(&registry_arena.chunk_list);
76d6a951
MD
628 ret = pthread_key_delete(urcu_bp_key);
629 if (ret)
630 abort();
95b94246 631 }
76d6a951 632 mutex_unlock(&init_lock);
fdee2e6d 633}
4cf1675f
MD
634
635/*
731ccb96
MD
636 * Holding the rcu_gp_lock and rcu_registry_lock across fork will make
637 * sure we fork() don't race with a concurrent thread executing with
638 * any of those locks held. This ensures that the registry and data
639 * protected by rcu_gp_lock are in a coherent state in the child.
4cf1675f
MD
640 */
641void rcu_bp_before_fork(void)
642{
643 sigset_t newmask, oldmask;
644 int ret;
645
6ed4b2e6 646 ret = sigfillset(&newmask);
4cf1675f 647 assert(!ret);
6ed4b2e6 648 ret = pthread_sigmask(SIG_BLOCK, &newmask, &oldmask);
4cf1675f
MD
649 assert(!ret);
650 mutex_lock(&rcu_gp_lock);
731ccb96 651 mutex_lock(&rcu_registry_lock);
4cf1675f
MD
652 saved_fork_signal_mask = oldmask;
653}
654
655void rcu_bp_after_fork_parent(void)
656{
657 sigset_t oldmask;
658 int ret;
659
660 oldmask = saved_fork_signal_mask;
731ccb96 661 mutex_unlock(&rcu_registry_lock);
4cf1675f
MD
662 mutex_unlock(&rcu_gp_lock);
663 ret = pthread_sigmask(SIG_SETMASK, &oldmask, NULL);
664 assert(!ret);
665}
666
c1be8fb9
MD
667/*
668 * Prune all entries from registry except our own thread. Fits the Linux
731ccb96 669 * fork behavior. Called with rcu_gp_lock and rcu_registry_lock held.
c1be8fb9
MD
670 */
671static
672void urcu_bp_prune_registry(void)
673{
674 struct registry_chunk *chunk;
675 struct rcu_reader *rcu_reader_reg;
676
677 cds_list_for_each_entry(chunk, &registry_arena.chunk_list, node) {
678 for (rcu_reader_reg = (struct rcu_reader *) &chunk->data[0];
679 rcu_reader_reg < (struct rcu_reader *) &chunk->data[chunk->data_len];
680 rcu_reader_reg++) {
681 if (!rcu_reader_reg->alloc)
682 continue;
683 if (rcu_reader_reg->tid == pthread_self())
684 continue;
685 cleanup_thread(chunk, rcu_reader_reg);
686 }
687 }
688}
689
4cf1675f
MD
690void rcu_bp_after_fork_child(void)
691{
692 sigset_t oldmask;
693 int ret;
694
c1be8fb9 695 urcu_bp_prune_registry();
4cf1675f 696 oldmask = saved_fork_signal_mask;
731ccb96 697 mutex_unlock(&rcu_registry_lock);
4cf1675f
MD
698 mutex_unlock(&rcu_gp_lock);
699 ret = pthread_sigmask(SIG_SETMASK, &oldmask, NULL);
700 assert(!ret);
701}
5e77fc1f 702
9b7981bb
MD
/* Exported symbol that returns the result of _rcu_dereference(@p). */
void *rcu_dereference_sym_bp(void *p)
{
	void *value = _rcu_dereference(p);

	return value;
}
707
5efd3cd2
MD
/*
 * Exported symbol: issue cmm_wmb(), then store @v into *@p with
 * uatomic_set(). Returns @v.
 */
void *rcu_set_pointer_sym_bp(void **p, void *v)
{
	/* Order earlier writes before the pointer store. */
	cmm_wmb();
	uatomic_set(p, v);

	return v;
}
714
/*
 * Exported symbol: issue cmm_wmb(), then exchange *@p with @v through
 * uatomic_xchg() and return what uatomic_xchg() returns.
 */
void *rcu_xchg_pointer_sym_bp(void **p, void *v)
{
	void *previous;

	cmm_wmb();
	previous = uatomic_xchg(p, v);

	return previous;
}
720
/*
 * Exported symbol: issue cmm_wmb(), then run
 * uatomic_cmpxchg(@p, @old, @_new) and return its result.
 */
void *rcu_cmpxchg_pointer_sym_bp(void **p, void *old, void *_new)
{
	void *previous;

	cmm_wmb();
	previous = uatomic_cmpxchg(p, old, _new);

	return previous;
}
726
/*
 * Instantiate rcu_flavor through DEFINE_RCU_FLAVOR().
 * NOTE(review): the macro is defined outside this file; presumably it
 * builds the table of this flavor's entry points -- confirm.
 */
DEFINE_RCU_FLAVOR(rcu_flavor);
541d828d 728
5e77fc1f 729#include "urcu-call-rcu-impl.h"
0376e7b2 730#include "urcu-defer-impl.h"
This page took 0.06803 seconds and 4 git commands to generate.