urcu-qsbr: document compiler barrier
[urcu.git] / urcu-qsbr.c
1 /*
2 * urcu-qsbr.c
3 *
4 * Userspace RCU QSBR library
5 *
6 * Copyright (c) 2009 Mathieu Desnoyers <mathieu.desnoyers@polymtl.ca>
7 * Copyright (c) 2009 Paul E. McKenney, IBM Corporation.
8 *
9 * This library is free software; you can redistribute it and/or
10 * modify it under the terms of the GNU Lesser General Public
11 * License as published by the Free Software Foundation; either
12 * version 2.1 of the License, or (at your option) any later version.
13 *
14 * This library is distributed in the hope that it will be useful,
15 * but WITHOUT ANY WARRANTY; without even the implied warranty of
16 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
17 * Lesser General Public License for more details.
18 *
19 * You should have received a copy of the GNU Lesser General Public
20 * License along with this library; if not, write to the Free Software
21 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
22 *
23 * IBM's contributions to this file may be relicensed under LGPLv2 or later.
24 */
25
26 #include <stdio.h>
27 #include <pthread.h>
28 #include <signal.h>
29 #include <assert.h>
30 #include <stdlib.h>
31 #include <string.h>
32 #include <errno.h>
33 #include <poll.h>
34
35 #define BUILD_QSBR_LIB
36 #include "urcu-qsbr-static.h"
37 /* Do not #define _LGPL_SOURCE to ensure we can emit the wrapper symbols */
38 #include "urcu-qsbr.h"
39
/*
 * Library destructor (GCC destructor attribute); its definition at the end
 * of this file asserts that the reader registry is empty.
 */
void __attribute__((destructor)) rcu_exit(void);

/*
 * Taken by synchronize_rcu(), rcu_register_thread() and
 * rcu_unregister_thread() around every access to the reader registry.
 */
static pthread_mutex_t rcu_gp_lock = PTHREAD_MUTEX_INITIALIZER;

/*
 * Futex word for the waiting writer: update_counter_and_wait() decrements
 * it before sleeping, wait_gp() sleeps only while it reads -1, and the
 * writer sets it back to 0 once the registry has drained.
 */
int gp_futex;

/*
 * Global grace period counter.
 */
unsigned long rcu_gp_ctr = RCU_GP_ONLINE;

/*
 * Written to only by each individual reader. Read by both the reader and the
 * writers.
 */
struct rcu_reader __thread rcu_reader;

#ifdef DEBUG_YIELD
/* Debug-only yield state; its users are not visible in this file. */
unsigned int yield_active;
unsigned int __thread rand_yield;
#endif

/* List of registered reader threads, linked through rcu_reader.head. */
static LIST_HEAD(registry);
63
/*
 * Acquire @mutex, terminating the process with exit(-1) if that fails.
 *
 * Default build: a plain blocking pthread_mutex_lock().
 * DISTRUST_SIGNALS_EXTREME build: poll the lock with
 * pthread_mutex_trylock(), sleeping 10 ms (poll() with no descriptors)
 * between attempts; EBUSY and EINTR mean "try again".
 *
 * pthread functions return the error number instead of setting errno, so
 * the diagnostic is built from strerror(ret) and sent to stderr; perror()
 * would print whatever stale value errno happens to hold.
 */
static void mutex_lock(pthread_mutex_t *mutex)
{
	int ret;

#ifndef DISTRUST_SIGNALS_EXTREME
	ret = pthread_mutex_lock(mutex);
	if (ret) {
		fprintf(stderr, "Error in pthread mutex lock: %s (ret = %d)\n",
			strerror(ret), ret);
		exit(-1);
	}
#else /* #ifndef DISTRUST_SIGNALS_EXTREME */
	while ((ret = pthread_mutex_trylock(mutex)) != 0) {
		if (ret != EBUSY && ret != EINTR) {
			fprintf(stderr,
				"Error in pthread mutex lock: %s (ret = %d)\n",
				strerror(ret), ret);
			exit(-1);
		}
		/* Back off for 10 ms before retrying the trylock. */
		poll(NULL, 0, 10);
	}
#endif /* #else #ifndef DISTRUST_SIGNALS_EXTREME */
}
85
/*
 * Release @mutex, terminating the process with exit(-1) if that fails.
 *
 * pthread_mutex_unlock() returns the error number and does not set errno,
 * so the diagnostic uses strerror(ret) on stderr rather than perror().
 */
static void mutex_unlock(pthread_mutex_t *mutex)
{
	int ret;

	ret = pthread_mutex_unlock(mutex);
	if (ret) {
		fprintf(stderr, "Error in pthread mutex unlock: %s (ret = %d)\n",
			strerror(ret), ret);
		exit(-1);
	}
}
96
97 /*
98 * synchronize_rcu() waiting. Single thread.
99 */
100 static void wait_gp(void)
101 {
102 /* Read reader_gp before read futex */
103 smp_rmb();
104 if (uatomic_read(&gp_futex) == -1)
105 futex_noasync(&gp_futex, FUTEX_WAIT, -1,
106 NULL, NULL, 0);
107 }
108
109 static void update_counter_and_wait(void)
110 {
111 LIST_HEAD(qsreaders);
112 int wait_loops = 0;
113 struct rcu_reader *index, *tmp;
114
115 #if (BITS_PER_LONG < 64)
116 /* Switch parity: 0 -> 1, 1 -> 0 */
117 STORE_SHARED(rcu_gp_ctr, rcu_gp_ctr ^ RCU_GP_CTR);
118 #else /* !(BITS_PER_LONG < 64) */
119 /* Increment current G.P. */
120 STORE_SHARED(rcu_gp_ctr, rcu_gp_ctr + RCU_GP_CTR);
121 #endif /* !(BITS_PER_LONG < 64) */
122
123 /*
124 * Enforce compiler-order of store to rcu_gp_ctr before before
125 * load rcu_reader ctr.
126 * This ensures synchronize_rcu() cannot be starved by readers.
127 */
128 barrier();
129
130 /*
131 * Wait for each thread rcu_reader_qs_gp count to become 0.
132 */
133 for (;;) {
134 wait_loops++;
135 if (wait_loops == RCU_QS_ACTIVE_ATTEMPTS) {
136 uatomic_dec(&gp_futex);
137 /* Write futex before read reader_gp */
138 smp_mb();
139 }
140
141 list_for_each_entry_safe(index, tmp, &registry, head) {
142 if (!rcu_gp_ongoing(&index->ctr))
143 list_move(&index->head, &qsreaders);
144 }
145
146 if (list_empty(&registry)) {
147 if (wait_loops == RCU_QS_ACTIVE_ATTEMPTS) {
148 /* Read reader_gp before write futex */
149 smp_mb();
150 uatomic_set(&gp_futex, 0);
151 }
152 break;
153 } else {
154 if (wait_loops == RCU_QS_ACTIVE_ATTEMPTS) {
155 wait_gp();
156 } else {
157 #ifndef HAS_INCOHERENT_CACHES
158 cpu_relax();
159 #else /* #ifndef HAS_INCOHERENT_CACHES */
160 smp_mb();
161 #endif /* #else #ifndef HAS_INCOHERENT_CACHES */
162 }
163 }
164 }
165 /* put back the reader list in the registry */
166 list_splice(&qsreaders, &registry);
167 }
168
/*
 * Architectures whose long is narrower than 64 bits use a two-subphase
 * algorithm to ensure we do not encounter a counter overflow bug.
 */
173
174 #if (BITS_PER_LONG < 64)
175 void synchronize_rcu(void)
176 {
177 unsigned long was_online;
178
179 was_online = rcu_reader.ctr;
180
181 /* All threads should read qparity before accessing data structure
182 * where new ptr points to.
183 */
184 /* Write new ptr before changing the qparity */
185 smp_mb();
186
187 /*
188 * Mark the writer thread offline to make sure we don't wait for
189 * our own quiescent state. This allows using synchronize_rcu() in
190 * threads registered as readers.
191 */
192 if (was_online)
193 STORE_SHARED(rcu_reader.ctr, 0);
194
195 mutex_lock(&rcu_gp_lock);
196
197 if (list_empty(&registry))
198 goto out;
199
200 /*
201 * Wait for previous parity to be empty of readers.
202 */
203 update_counter_and_wait(); /* 0 -> 1, wait readers in parity 0 */
204
205 /*
206 * Must finish waiting for quiescent state for parity 0 before
207 * committing qparity update to memory. Failure to do so could result in
208 * the writer waiting forever while new readers are always accessing
209 * data (no progress).
210 * Ensured by STORE_SHARED and LOAD_SHARED.
211 */
212
213 /*
214 * Adding a smp_mb() which is _not_ formally required, but makes the
215 * model easier to understand. It does not have a big performance impact
216 * anyway, given this is the write-side.
217 */
218 smp_mb();
219
220 /*
221 * Wait for previous parity to be empty of readers.
222 */
223 update_counter_and_wait(); /* 1 -> 0, wait readers in parity 1 */
224 out:
225 mutex_unlock(&rcu_gp_lock);
226
227 /*
228 * Finish waiting for reader threads before letting the old ptr being
229 * freed.
230 */
231 if (was_online)
232 _STORE_SHARED(rcu_reader.ctr, LOAD_SHARED(rcu_gp_ctr));
233 smp_mb();
234 }
235 #else /* !(BITS_PER_LONG < 64) */
236 void synchronize_rcu(void)
237 {
238 unsigned long was_online;
239
240 was_online = rcu_reader.ctr;
241
242 /*
243 * Mark the writer thread offline to make sure we don't wait for
244 * our own quiescent state. This allows using synchronize_rcu() in
245 * threads registered as readers.
246 */
247 smp_mb();
248 if (was_online)
249 STORE_SHARED(rcu_reader.ctr, 0);
250
251 mutex_lock(&rcu_gp_lock);
252 if (list_empty(&registry))
253 goto out;
254 update_counter_and_wait();
255 out:
256 mutex_unlock(&rcu_gp_lock);
257
258 if (was_online)
259 _STORE_SHARED(rcu_reader.ctr, LOAD_SHARED(rcu_gp_ctr));
260 smp_mb();
261 }
262 #endif /* !(BITS_PER_LONG < 64) */
263
264 /*
265 * library wrappers to be used by non-LGPL compatible source code.
266 */
267
/* Out-of-line library symbol that forwards to _rcu_read_lock(). */
void rcu_read_lock(void)
{
	_rcu_read_lock();
}
272
/* Out-of-line library symbol that forwards to _rcu_read_unlock(). */
void rcu_read_unlock(void)
{
	_rcu_read_unlock();
}
277
/* Out-of-line library symbol that forwards to _rcu_quiescent_state(). */
void rcu_quiescent_state(void)
{
	_rcu_quiescent_state();
}
282
/* Out-of-line library symbol that forwards to _rcu_thread_offline(). */
void rcu_thread_offline(void)
{
	_rcu_thread_offline();
}
287
/* Out-of-line library symbol that forwards to _rcu_thread_online(). */
void rcu_thread_online(void)
{
	_rcu_thread_online();
}
292
293 void rcu_register_thread(void)
294 {
295 rcu_reader.tid = pthread_self();
296 assert(rcu_reader.ctr == 0);
297
298 mutex_lock(&rcu_gp_lock);
299 list_add(&rcu_reader.head, &registry);
300 mutex_unlock(&rcu_gp_lock);
301 _rcu_thread_online();
302 }
303
/*
 * Unregister the calling thread: take it offline, then unlink its
 * rcu_reader from the registry under rcu_gp_lock.
 */
void rcu_unregister_thread(void)
{
	/*
	 * We have to make the thread offline, otherwise we end up
	 * deadlocking with a waiting writer.
	 */
	_rcu_thread_offline();
	mutex_lock(&rcu_gp_lock);
	list_del(&rcu_reader.head);
	mutex_unlock(&rcu_gp_lock);
}
315
/*
 * Library destructor (declared with the destructor attribute near the top
 * of this file): asserts that no reader is left in the registry.
 */
void rcu_exit(void)
{
	assert(list_empty(&registry));
}
This page took 0.035753 seconds and 5 git commands to generate.