Add call_rcu() interface
[urcu.git] / urcu-call-rcu.c
/*
 * urcu-call-rcu.c
 *
 * Userspace RCU library - batch memory reclamation with kernel API
 *
 * Copyright (c) 2010 Paul E. McKenney <paulmck@linux.vnet.ibm.com>
 *
 * This library is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * This library is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with this library; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */

#include <stdio.h>
#include <pthread.h>
#include <signal.h>
#include <assert.h>
#include <stdlib.h>
#include <string.h>
#include <errno.h>
#include <poll.h>
#include <sys/time.h>
#include <syscall.h>
#include <unistd.h>

#include "config.h"
#include "urcu/wfqueue.h"
#include "urcu-call-rcu.h"
#include "urcu-pointer.h"

/* Data structure that identifies a call_rcu thread. */

struct call_rcu_data {
	struct cds_wfq_queue cbs;	/* Wait-free queue of pending callbacks. */
	unsigned long flags;		/* URCU_CALL_RCU_* state flags. */
	pthread_mutex_t mtx;		/* Protects the wakeup handshake. */
	pthread_cond_t cond;		/* Signaled when new callbacks arrive. */
	unsigned long qlen;		/* Number of callbacks currently queued. */
	pthread_t tid;			/* ID of this call_rcu thread. */
} __attribute__((aligned(CAA_CACHE_LINE_SIZE)));

/* Link a thread using call_rcu() to its call_rcu thread. */

static __thread struct call_rcu_data *thread_call_rcu_data;

/* Guard call_rcu thread creation. */

static pthread_mutex_t call_rcu_mutex = PTHREAD_MUTEX_INITIALIZER;

/* If a given thread does not have its own call_rcu thread, this is the default. */

static struct call_rcu_data *default_call_rcu_data;

extern void synchronize_rcu(void);

/*
 * If the sched_getcpu() and sysconf(_SC_NPROCESSORS_CONF) calls are
 * available, then we can have call_rcu threads assigned to individual
 * CPUs rather than only to specific threads.
 */

#if defined(HAVE_SCHED_GETCPU) && defined(HAVE_SYSCONF)

/*
 * Pointer to the array of per-CPU call_rcu_data pointers, and the
 * number of CPUs.
 */

static struct call_rcu_data **per_cpu_call_rcu_data;
static long maxcpus;

/* Allocate the array if it has not already been allocated. */

static void alloc_cpu_call_rcu_data(void)
{
	struct call_rcu_data **p;
	static int warned = 0;

	if (maxcpus != 0)
		return;
	maxcpus = sysconf(_SC_NPROCESSORS_CONF);
	if (maxcpus <= 0) {
		return;
	}
	p = malloc(maxcpus * sizeof(*per_cpu_call_rcu_data));
	if (p != NULL) {
		memset(p, '\0', maxcpus * sizeof(*per_cpu_call_rcu_data));
		per_cpu_call_rcu_data = p;
	} else {
		if (!warned) {
			fprintf(stderr, "[error] liburcu: unable to allocate per-CPU pointer array\n");
		}
		warned = 1;
	}
}

#else /* #if defined(HAVE_SCHED_GETCPU) && defined(HAVE_SYSCONF) */

static struct call_rcu_data **per_cpu_call_rcu_data = NULL;
static const long maxcpus = -1;

static void alloc_cpu_call_rcu_data(void)
{
}

static int sched_getcpu(void)
{
	return -1;
}

#endif /* #else #if defined(HAVE_SCHED_GETCPU) && defined(HAVE_SYSCONF) */

/* Acquire the specified pthread mutex. */

static void call_rcu_lock(pthread_mutex_t *pmp)
{
	if (pthread_mutex_lock(pmp) != 0) {
		perror("pthread_mutex_lock");
		exit(-1);
	}
}

/* Release the specified pthread mutex. */

static void call_rcu_unlock(pthread_mutex_t *pmp)
{
	if (pthread_mutex_unlock(pmp) != 0) {
		perror("pthread_mutex_unlock");
		exit(-1);
	}
}

/* This is the code run by each call_rcu thread. */

static void *call_rcu_thread(void *arg)
{
	unsigned long cbcount;
	struct cds_wfq_node *cbs;
	struct cds_wfq_node **cbs_tail;
	struct call_rcu_data *crdp = (struct call_rcu_data *)arg;
	struct rcu_head *rhp;

	thread_call_rcu_data = crdp;
	for (;;) {
		if (&crdp->cbs.head != _CMM_LOAD_SHARED(crdp->cbs.tail)) {
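			/*
			 * Atomically splice all queued callbacks onto a
			 * local list: take the head, then swap the queue
			 * tail back to the now-empty queue's head so that
			 * concurrent enqueues proceed unimpeded.
			 */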
			while ((cbs = _CMM_LOAD_SHARED(crdp->cbs.head)) == NULL)
				poll(NULL, 0, 1);
			_CMM_STORE_SHARED(crdp->cbs.head, NULL);
			cbs_tail = (struct cds_wfq_node **)
				uatomic_xchg(&crdp->cbs.tail, &crdp->cbs.head);
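			/*
			 * Wait for a grace period so that no RCU reader
			 * can still hold a reference to the structures
			 * whose callbacks are about to be invoked.
			 */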
			synchronize_rcu();
			cbcount = 0;
			do {
				while (cbs->next == NULL &&
				       &cbs->next != cbs_tail)
					poll(NULL, 0, 1);
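				/* Skip the queue's dummy node, which carries no callback. */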
				if (cbs == &crdp->cbs.dummy) {
					cbs = cbs->next;
					continue;
				}
				rhp = (struct rcu_head *)cbs;
				cbs = cbs->next;
				rhp->func(rhp);
				cbcount++;
			} while (cbs != NULL);
			uatomic_sub(&crdp->qlen, cbcount);
		}
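		/*
		 * Real-time threads poll with a short sleep; other threads
		 * clear the RUNNING flag and block on the condition
		 * variable until call_rcu() signals more work.
		 */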
		if (crdp->flags & URCU_CALL_RCU_RT)
			poll(NULL, 0, 10);
		else {
			call_rcu_lock(&crdp->mtx);
			_CMM_STORE_SHARED(crdp->flags,
					  crdp->flags & ~URCU_CALL_RCU_RUNNING);
			if (&crdp->cbs.head ==
			    _CMM_LOAD_SHARED(crdp->cbs.tail) &&
			    pthread_cond_wait(&crdp->cond, &crdp->mtx) != 0) {
				perror("pthread_cond_wait");
				exit(-1);
			}
			_CMM_STORE_SHARED(crdp->flags,
					  crdp->flags | URCU_CALL_RCU_RUNNING);
			poll(NULL, 0, 10);
			call_rcu_unlock(&crdp->mtx);
		}
	}
	return NULL; /* NOTREACHED */
}

/*
 * Create both a call_rcu thread and the corresponding call_rcu_data
 * structure, linking the structure in as specified.
 */

void call_rcu_data_init(struct call_rcu_data **crdpp, unsigned long flags)
{
	struct call_rcu_data *crdp;

	crdp = malloc(sizeof(*crdp));
	if (crdp == NULL) {
		fprintf(stderr, "Out of memory.\n");
		exit(-1);
	}
	memset(crdp, '\0', sizeof(*crdp));
	cds_wfq_init(&crdp->cbs);
	crdp->qlen = 0;
	if (pthread_mutex_init(&crdp->mtx, NULL) != 0) {
		perror("pthread_mutex_init");
		exit(-1);
	}
	if (pthread_cond_init(&crdp->cond, NULL) != 0) {
		perror("pthread_cond_init");
		exit(-1);
	}
	crdp->flags = flags | URCU_CALL_RCU_RUNNING;
	cmm_smp_mb();  /* Structure initialized before pointer is planted. */
	*crdpp = crdp;
	if (pthread_create(&crdp->tid, NULL, call_rcu_thread, crdp) != 0) {
		perror("pthread_create");
		exit(-1);
	}
}

/*
 * Return a pointer to the call_rcu_data structure for the specified
 * CPU, returning NULL if there is none.  We cannot automatically
 * create it because the platform we are running on might not define
 * sched_getcpu().
 */

struct call_rcu_data *get_cpu_call_rcu_data(int cpu)
{
	static int warned = 0;

	if (per_cpu_call_rcu_data == NULL)
		return NULL;
	if (!warned && maxcpus > 0 && (cpu < 0 || maxcpus <= cpu)) {
		fprintf(stderr, "[error] liburcu: get CPU # out of range\n");
		warned = 1;
	}
	if (cpu < 0 || maxcpus <= cpu)
		return NULL;
	return per_cpu_call_rcu_data[cpu];
}

/*
 * Return the tid corresponding to the call_rcu thread whose
 * call_rcu_data structure is specified.
 */

pthread_t get_call_rcu_thread(struct call_rcu_data *crdp)
{
	return crdp->tid;
}

/*
 * Create a call_rcu_data structure (with thread) and return a pointer.
 */

struct call_rcu_data *create_call_rcu_data(unsigned long flags)
{
	struct call_rcu_data *crdp;

	call_rcu_data_init(&crdp, flags);
	return crdp;
}

/*
 * Set the specified CPU to use the specified call_rcu_data structure.
 */

int set_cpu_call_rcu_data(int cpu, struct call_rcu_data *crdp)
{
	static int warned = 0;

	call_rcu_lock(&call_rcu_mutex);
	if (cpu < 0 || maxcpus <= cpu) {
		if (!warned) {
			fprintf(stderr, "[error] liburcu: set CPU # out of range\n");
			warned = 1;
		}
		call_rcu_unlock(&call_rcu_mutex);
		errno = EINVAL;
		return -EINVAL;
	}
	alloc_cpu_call_rcu_data();
	call_rcu_unlock(&call_rcu_mutex);
	if (per_cpu_call_rcu_data == NULL) {
		errno = ENOMEM;
		return -ENOMEM;
	}
	per_cpu_call_rcu_data[cpu] = crdp;
	return 0;
}

/*
 * Return a pointer to the default call_rcu_data structure, creating
 * one if need be.  Because we never free call_rcu_data structures,
 * we don't need to be in an RCU read-side critical section.
 */

struct call_rcu_data *get_default_call_rcu_data(void)
{
	if (default_call_rcu_data != NULL)
		return rcu_dereference(default_call_rcu_data);
	call_rcu_lock(&call_rcu_mutex);
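	/* Re-check under the lock: another thread may have created it. */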
	if (default_call_rcu_data != NULL) {
		call_rcu_unlock(&call_rcu_mutex);
		return default_call_rcu_data;
	}
	call_rcu_data_init(&default_call_rcu_data, 0);
	call_rcu_unlock(&call_rcu_mutex);
	return default_call_rcu_data;
}

/*
 * Return the call_rcu_data structure that applies to the currently
 * running thread.  Any call_rcu_data structure assigned specifically
 * to this thread has first priority, followed by any call_rcu_data
 * structure assigned to the CPU on which the thread is running,
 * followed by the default call_rcu_data structure.  If there is not
 * yet a default call_rcu_data structure, one will be created.
 */
struct call_rcu_data *get_call_rcu_data(void)
{
	int curcpu;
	static int warned = 0;

	if (thread_call_rcu_data != NULL)
		return thread_call_rcu_data;
	if (maxcpus <= 0)
		return get_default_call_rcu_data();
	curcpu = sched_getcpu();
	if (!warned && (curcpu < 0 || maxcpus <= curcpu)) {
		fprintf(stderr, "[error] liburcu: get_call_rcu_data() CPU # out of range\n");
		warned = 1;
	}
	if (curcpu >= 0 && maxcpus > curcpu &&
	    per_cpu_call_rcu_data != NULL &&
	    per_cpu_call_rcu_data[curcpu] != NULL)
		return per_cpu_call_rcu_data[curcpu];
	return get_default_call_rcu_data();
}

/*
 * Return a pointer to this thread's call_rcu_data if there is one.
 */

struct call_rcu_data *get_thread_call_rcu_data(void)
{
	return thread_call_rcu_data;
}

/*
 * Set this thread's call_rcu_data structure as specified, regardless
 * of whether or not this thread already had one.  (This allows switching
 * to and from real-time call_rcu threads, for example.)
 */

void set_thread_call_rcu_data(struct call_rcu_data *crdp)
{
	thread_call_rcu_data = crdp;
}
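
/*
 * For example, a latency-sensitive thread might switch to a dedicated
 * real-time call_rcu thread as follows (illustrative sketch only;
 * error handling and thread teardown omitted):
 *
 *	struct call_rcu_data *crdp;
 *
 *	crdp = create_call_rcu_data(URCU_CALL_RCU_RT);
 *	set_thread_call_rcu_data(crdp);
 *
 * This thread's call_rcu() invocations are then handled by crdp;
 * passing NULL to set_thread_call_rcu_data() reverts to the per-CPU
 * or default call_rcu thread.
 */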

/*
 * Create a separate call_rcu thread for each CPU.  This does not
 * replace a pre-existing call_rcu thread -- use the set_cpu_call_rcu_data()
 * function if you want that behavior.
 */

int create_all_cpu_call_rcu_data(unsigned long flags)
{
	int i;
	struct call_rcu_data *crdp;
	int ret;

	call_rcu_lock(&call_rcu_mutex);
	alloc_cpu_call_rcu_data();
	call_rcu_unlock(&call_rcu_mutex);
	if (maxcpus <= 0) {
		errno = EINVAL;
		return -EINVAL;
	}
	if (per_cpu_call_rcu_data == NULL) {
		errno = ENOMEM;
		return -ENOMEM;
	}
	for (i = 0; i < maxcpus; i++) {
		call_rcu_lock(&call_rcu_mutex);
		if (get_cpu_call_rcu_data(i)) {
			call_rcu_unlock(&call_rcu_mutex);
			continue;
		}
		crdp = create_call_rcu_data(flags);
		if (crdp == NULL) {
			call_rcu_unlock(&call_rcu_mutex);
			errno = ENOMEM;
			return -ENOMEM;
		}
		call_rcu_unlock(&call_rcu_mutex);
		if ((ret = set_cpu_call_rcu_data(i, crdp)) != 0) {
			/* FIXME: Leaks crdp for now. */
			return ret; /* Can happen on race. */
		}
	}
	return 0;
}
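
/*
 * Typical usage is a single call during application startup, before
 * the first call_rcu(), for example (illustrative sketch only):
 *
 *	if (create_all_cpu_call_rcu_data(0) != 0)
 *		fprintf(stderr, "no per-CPU call_rcu threads: %d\n", errno);
 *
 * Failure is not fatal: call_rcu() simply falls back to the default
 * call_rcu thread for any CPU lacking a dedicated one.
 */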

/*
 * Schedule a function to be invoked after a subsequent grace period.
 * This is the only function that must be called -- the others are
 * only present to allow applications to tune their use of RCU for
 * maximum performance.
 *
 * Note that unless a call_rcu thread has already been created, the
 * first invocation of call_rcu() will create one.  So, if you need
 * the first invocation of call_rcu() to be fast, make sure to create
 * a call_rcu thread first.  One way to accomplish this is to invoke
 * get_call_rcu_data(), and another is create_all_cpu_call_rcu_data().
 */

void call_rcu(struct rcu_head *head,
	      void (*func)(struct rcu_head *head))
{
	struct call_rcu_data *crdp;

	cds_wfq_node_init(&head->next);
	head->func = func;
	crdp = get_call_rcu_data();
	cds_wfq_enqueue(&crdp->cbs, &head->next);
	uatomic_inc(&crdp->qlen);
	if (!(_CMM_LOAD_SHARED(crdp->flags) & URCU_CALL_RCU_RT)) {
		call_rcu_lock(&crdp->mtx);
		if (!(_CMM_LOAD_SHARED(crdp->flags) & URCU_CALL_RCU_RUNNING)) {
			if (pthread_cond_signal(&crdp->cond) != 0) {
				perror("pthread_cond_signal");
				exit(-1);
			}
		}
		call_rcu_unlock(&crdp->mtx);
	}
}
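
/*
 * Example: deferred free of an application-defined structure
 * (illustrative sketch only; struct foo and foo_reclaim() are
 * hypothetical names, and caa_container_of() is assumed to be
 * available from urcu/compiler.h):
 *
 *	struct foo {
 *		struct rcu_head rcu;
 *		int value;
 *	};
 *
 *	static void foo_reclaim(struct rcu_head *rhp)
 *	{
 *		struct foo *fp = caa_container_of(rhp, struct foo, rcu);
 *
 *		free(fp);
 *	}
 *
 * After removing a struct foo from all reader-visible RCU-protected
 * structures, defer its freeing past a grace period:
 *
 *	call_rcu(&fp->rcu, foo_reclaim);
 */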