/*
 * urcu-call-rcu.c
 *
 * Userspace RCU library - batch memory reclamation with kernel API
 *
 * Copyright (c) 2010 Paul E. McKenney <paulmck@linux.vnet.ibm.com>
 *
 * This library is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * This library is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with this library; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */

#include <stdio.h>
#include <pthread.h>
#include <signal.h>
#include <assert.h>
#include <stdlib.h>
#include <string.h>
#include <errno.h>
#include <poll.h>
#include <sys/time.h>
#include <syscall.h>
#include <unistd.h>

#include "config.h"
#include "urcu/wfqueue.h"
#include "urcu-call-rcu.h"
#include "urcu-pointer.h"

/* Data structure that identifies a call_rcu thread. */

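/*
 * The structure is aligned to a cache-line boundary so that each
 * call_rcu thread's queue, lock, and counters occupy their own cache
 * line(s), avoiding false sharing between call_rcu threads.
 */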
struct call_rcu_data {
	struct cds_wfq_queue cbs;
	unsigned long flags;
	pthread_mutex_t mtx;
	pthread_cond_t cond;
	unsigned long qlen;
	pthread_t tid;
} __attribute__((aligned(CAA_CACHE_LINE_SIZE)));

/* Link a thread using call_rcu() to its call_rcu thread. */

static __thread struct call_rcu_data *thread_call_rcu_data;

/* Guard call_rcu thread creation. */

static pthread_mutex_t call_rcu_mutex = PTHREAD_MUTEX_INITIALIZER;

/* If a given thread does not have its own call_rcu thread, this is the default. */

static struct call_rcu_data *default_call_rcu_data;

extern void synchronize_rcu(void);

/*
 * If the sched_getcpu() and sysconf(_SC_NPROCESSORS_CONF) calls are
 * available, then we can have call_rcu threads assigned to individual
 * CPUs rather than only to specific threads.
 */

#if defined(HAVE_SCHED_GETCPU) && defined(HAVE_SYSCONF)

/*
 * Pointer to array of pointers to per-CPU call_rcu_data structures
 * and # CPUs.
 */

static struct call_rcu_data **per_cpu_call_rcu_data;
static long maxcpus;

/* Allocate the array if it has not already been allocated. */

static void alloc_cpu_call_rcu_data(void)
{
	struct call_rcu_data **p;
	static int warned = 0;

	if (maxcpus != 0)
		return;
	maxcpus = sysconf(_SC_NPROCESSORS_CONF);
	if (maxcpus <= 0) {
		return;
	}
	p = malloc(maxcpus * sizeof(*per_cpu_call_rcu_data));
	if (p != NULL) {
		memset(p, '\0', maxcpus * sizeof(*per_cpu_call_rcu_data));
		per_cpu_call_rcu_data = p;
	} else {
		if (!warned) {
			fprintf(stderr, "[error] liburcu: unable to allocate per-CPU pointer array\n");
		}
		warned = 1;
	}
}

#else /* #if defined(HAVE_SCHED_GETCPU) && defined(HAVE_SYSCONF) */

static const struct call_rcu_data **per_cpu_call_rcu_data = NULL;
static const long maxcpus = -1;

static void alloc_cpu_call_rcu_data(void)
{
}

static int sched_getcpu(void)
{
	return -1;
}

#endif /* #else #if defined(HAVE_SCHED_GETCPU) && defined(HAVE_SYSCONF) */

/* Acquire the specified pthread mutex. */

static void call_rcu_lock(pthread_mutex_t *pmp)
{
	if (pthread_mutex_lock(pmp) != 0) {
		perror("pthread_mutex_lock");
		exit(-1);
	}
}

/* Release the specified pthread mutex. */

static void call_rcu_unlock(pthread_mutex_t *pmp)
{
	if (pthread_mutex_unlock(pmp) != 0) {
		perror("pthread_mutex_unlock");
		exit(-1);
	}
}

/* This is the code run by each call_rcu thread. */

static void *call_rcu_thread(void *arg)
{
	unsigned long cbcount;
	struct cds_wfq_node *cbs;
	struct cds_wfq_node **cbs_tail;
	struct call_rcu_data *crdp = (struct call_rcu_data *)arg;
	struct rcu_head *rhp;

	thread_call_rcu_data = crdp;
	for (;;) {
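		/*
		 * Splice the entire pending-callback list onto a local
		 * list: NULL out the head, then atomically exchange the
		 * tail pointer back to the (now empty) queue head.  After
		 * the xchg, cbs..*cbs_tail is a private list that no
		 * enqueuer can touch, so a single synchronize_rcu()
		 * covers the whole batch.
		 */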
		if (&crdp->cbs.head != _CMM_LOAD_SHARED(crdp->cbs.tail)) {
			while ((cbs = _CMM_LOAD_SHARED(crdp->cbs.head)) == NULL)
				poll(NULL, 0, 1);
			_CMM_STORE_SHARED(crdp->cbs.head, NULL);
			cbs_tail = (struct cds_wfq_node **)
				uatomic_xchg(&crdp->cbs.tail, &crdp->cbs.head);
			synchronize_rcu();
			cbcount = 0;
			do {
				while (cbs->next == NULL &&
				       &cbs->next != cbs_tail)
					poll(NULL, 0, 1);
				if (cbs == &crdp->cbs.dummy) {
					cbs = cbs->next;
					continue;
				}
				rhp = (struct rcu_head *)cbs;
				cbs = cbs->next;
				rhp->func(rhp);
				cbcount++;
			} while (cbs != NULL);
			uatomic_sub(&crdp->qlen, cbcount);
		}
		if (crdp->flags & URCU_CALL_RCU_RT)
			poll(NULL, 0, 10);
		else {
			call_rcu_lock(&crdp->mtx);
			_CMM_STORE_SHARED(crdp->flags,
					  crdp->flags & ~URCU_CALL_RCU_RUNNING);
			if (&crdp->cbs.head ==
			    _CMM_LOAD_SHARED(crdp->cbs.tail) &&
			    pthread_cond_wait(&crdp->cond, &crdp->mtx) != 0) {
				perror("pthread_cond_wait");
				exit(-1);
			}
			_CMM_STORE_SHARED(crdp->flags,
					  crdp->flags | URCU_CALL_RCU_RUNNING);
			poll(NULL, 0, 10);
			call_rcu_unlock(&crdp->mtx);
		}
	}
	return NULL;  /* NOTREACHED */
}

/*
 * Create both a call_rcu thread and the corresponding call_rcu_data
 * structure, linking the structure in as specified.
 */

void call_rcu_data_init(struct call_rcu_data **crdpp, unsigned long flags)
{
	struct call_rcu_data *crdp;

	crdp = malloc(sizeof(*crdp));
	if (crdp == NULL) {
		fprintf(stderr, "Out of memory.\n");
		exit(-1);
	}
	memset(crdp, '\0', sizeof(*crdp));
	cds_wfq_init(&crdp->cbs);
	crdp->qlen = 0;
	if (pthread_mutex_init(&crdp->mtx, NULL) != 0) {
		perror("pthread_mutex_init");
		exit(-1);
	}
	if (pthread_cond_init(&crdp->cond, NULL) != 0) {
		perror("pthread_cond_init");
		exit(-1);
	}
	crdp->flags = flags | URCU_CALL_RCU_RUNNING;
	cmm_smp_mb();  /* Structure initialized before pointer is planted. */
	*crdpp = crdp;
	if (pthread_create(&crdp->tid, NULL, call_rcu_thread, crdp) != 0) {
		perror("pthread_create");
		exit(-1);
	}
}

/*
 * Return a pointer to the call_rcu_data structure for the specified
 * CPU, returning NULL if there is none.  We cannot automatically
 * create it because the platform we are running on might not define
 * sched_getcpu().
 */

struct call_rcu_data *get_cpu_call_rcu_data(int cpu)
{
	static int warned = 0;

	if (per_cpu_call_rcu_data == NULL)
		return NULL;
	if (!warned && maxcpus > 0 && (cpu < 0 || maxcpus <= cpu)) {
		fprintf(stderr, "[error] liburcu: get CPU # out of range\n");
		warned = 1;
	}
	if (cpu < 0 || maxcpus <= cpu)
		return NULL;
	return per_cpu_call_rcu_data[cpu];
}

/*
 * Return the tid corresponding to the call_rcu thread whose
 * call_rcu_data structure is specified.
 */

pthread_t get_call_rcu_thread(struct call_rcu_data *crdp)
{
	return crdp->tid;
}

/*
 * Create a call_rcu_data structure (with thread) and return a pointer.
 */

struct call_rcu_data *create_call_rcu_data(unsigned long flags)
{
	struct call_rcu_data *crdp;

	call_rcu_data_init(&crdp, flags);
	return crdp;
}
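
/*
 * For example, a latency-sensitive thread might give itself a
 * dedicated call_rcu thread (a minimal sketch):
 *
 *	struct call_rcu_data *crdp = create_call_rcu_data(0);
 *
 *	set_thread_call_rcu_data(crdp);
 *	... this thread's call_rcu() invocations now use crdp ...
 */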

/*
 * Set the specified CPU to use the specified call_rcu_data structure.
 */

int set_cpu_call_rcu_data(int cpu, struct call_rcu_data *crdp)
{
	static int warned = 0;	/* Static, so we warn only once. */

	call_rcu_lock(&call_rcu_mutex);
	if (cpu < 0 || maxcpus <= cpu) {
		if (!warned) {
			fprintf(stderr, "[error] liburcu: set CPU # out of range\n");
			warned = 1;
		}
		call_rcu_unlock(&call_rcu_mutex);
		errno = EINVAL;
		return -EINVAL;
	}
	alloc_cpu_call_rcu_data();
	call_rcu_unlock(&call_rcu_mutex);
	if (per_cpu_call_rcu_data == NULL) {
		errno = ENOMEM;
		return -ENOMEM;
	}
	per_cpu_call_rcu_data[cpu] = crdp;
	return 0;
}

/*
 * Return a pointer to the default call_rcu_data structure, creating
 * one if need be.  Because we never free call_rcu_data structures,
 * we don't need to be in an RCU read-side critical section.
 */

struct call_rcu_data *get_default_call_rcu_data(void)
{
	if (default_call_rcu_data != NULL)
		return rcu_dereference(default_call_rcu_data);
	call_rcu_lock(&call_rcu_mutex);
	if (default_call_rcu_data != NULL) {
		call_rcu_unlock(&call_rcu_mutex);
		return default_call_rcu_data;
	}
	call_rcu_data_init(&default_call_rcu_data, 0);
	call_rcu_unlock(&call_rcu_mutex);
	return default_call_rcu_data;
}

/*
 * Return the call_rcu_data structure that applies to the currently
 * running thread.  Any call_rcu_data structure assigned specifically
 * to this thread has first priority, followed by any call_rcu_data
 * structure assigned to the CPU on which the thread is running,
 * followed by the default call_rcu_data structure.  If there is not
 * yet a default call_rcu_data structure, one will be created.
 */
struct call_rcu_data *get_call_rcu_data(void)
{
	int curcpu;
	static int warned = 0;

	if (thread_call_rcu_data != NULL)
		return thread_call_rcu_data;
	if (maxcpus <= 0)
		return get_default_call_rcu_data();
	curcpu = sched_getcpu();
	if (!warned && (curcpu < 0 || maxcpus <= curcpu)) {
		fprintf(stderr, "[error] liburcu: get_call_rcu_data: CPU # out of range\n");
		warned = 1;
	}
	if (curcpu >= 0 && maxcpus > curcpu &&
	    per_cpu_call_rcu_data != NULL &&
	    per_cpu_call_rcu_data[curcpu] != NULL)
		return per_cpu_call_rcu_data[curcpu];
	return get_default_call_rcu_data();
}

/*
 * Return a pointer to this task's call_rcu_data if there is one.
 */

struct call_rcu_data *get_thread_call_rcu_data(void)
{
	return thread_call_rcu_data;
}

/*
 * Set this task's call_rcu_data structure as specified, regardless
 * of whether or not this task already had one.  (This allows switching
 * to and from real-time call_rcu threads, for example.)
 */

void set_thread_call_rcu_data(struct call_rcu_data *crdp)
{
	thread_call_rcu_data = crdp;
}
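
/*
 * For example, to switch the current thread to a real-time call_rcu
 * thread and later back to CPU/default handling (a minimal sketch):
 *
 *	struct call_rcu_data *rt_crdp = create_call_rcu_data(URCU_CALL_RCU_RT);
 *
 *	set_thread_call_rcu_data(rt_crdp);
 *	... real-time processing, with call_rcu() going through rt_crdp ...
 *	set_thread_call_rcu_data(NULL);
 */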

/*
 * Create a separate call_rcu thread for each CPU.  This does not
 * replace a pre-existing call_rcu thread -- use the set_cpu_call_rcu_data()
 * function if you want that behavior.
 */

int create_all_cpu_call_rcu_data(unsigned long flags)
{
	int i;
	struct call_rcu_data *crdp;
	int ret;

	call_rcu_lock(&call_rcu_mutex);
	alloc_cpu_call_rcu_data();
	call_rcu_unlock(&call_rcu_mutex);
	if (maxcpus <= 0) {
		errno = EINVAL;
		return -EINVAL;
	}
	if (per_cpu_call_rcu_data == NULL) {
		errno = ENOMEM;
		return -ENOMEM;
	}
	for (i = 0; i < maxcpus; i++) {
		call_rcu_lock(&call_rcu_mutex);
		if (get_cpu_call_rcu_data(i)) {
			call_rcu_unlock(&call_rcu_mutex);
			continue;
		}
		crdp = create_call_rcu_data(flags);
		if (crdp == NULL) {
			call_rcu_unlock(&call_rcu_mutex);
			errno = ENOMEM;
			return -ENOMEM;
		}
		call_rcu_unlock(&call_rcu_mutex);
		if ((ret = set_cpu_call_rcu_data(i, crdp)) != 0) {
			/* FIXME: Leaks crdp for now. */
			return ret; /* Can happen on race. */
		}
	}
	return 0;
}
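
/*
 * An application that wants per-CPU callback handling would typically
 * invoke this once at startup, before spawning worker threads
 * (a minimal sketch; on failure errno is set as described above):
 *
 *	if (create_all_cpu_call_rcu_data(0) != 0)
 *		perror("create_all_cpu_call_rcu_data");
 */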

/*
 * Schedule a function to be invoked after a following grace period.
 * This is the only function that must be called -- the others are
 * only present to allow applications to tune their use of RCU for
 * maximum performance.
 *
 * Note that unless a call_rcu thread has already been created, the
 * first invocation of call_rcu() will create one.  So, if you need
 * the first invocation of call_rcu() to be fast, make sure to create
 * a call_rcu thread first.  One way to accomplish this is
 * "get_call_rcu_data();", and another is create_all_cpu_call_rcu_data().
 */

void call_rcu(struct rcu_head *head,
	      void (*func)(struct rcu_head *head))
{
	struct call_rcu_data *crdp;

	cds_wfq_node_init(&head->next);
	head->func = func;
	crdp = get_call_rcu_data();
	cds_wfq_enqueue(&crdp->cbs, &head->next);
	uatomic_inc(&crdp->qlen);
	if (!(_CMM_LOAD_SHARED(crdp->flags) & URCU_CALL_RCU_RT)) {
		call_rcu_lock(&crdp->mtx);
		if (!(_CMM_LOAD_SHARED(crdp->flags) & URCU_CALL_RCU_RUNNING)) {
			if (pthread_cond_signal(&crdp->cond) != 0) {
				perror("pthread_cond_signal");
				exit(-1);
			}
		}
		call_rcu_unlock(&crdp->mtx);
	}
}
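
/*
 * Typical usage embeds the rcu_head in the protected structure and
 * frees it from the callback.  A minimal sketch (struct foo, free_foo(),
 * gp, old_fp, and new_fp are hypothetical caller-side code, not part of
 * this file):
 *
 *	struct foo {
 *		struct rcu_head rcu;
 *		int data;
 *	};
 *
 *	static void free_foo(struct rcu_head *head)
 *	{
 *		struct foo *fp = caa_container_of(head, struct foo, rcu);
 *
 *		free(fp);
 *	}
 *
 *	...
 *	rcu_assign_pointer(gp, new_fp);		// unpublish old_fp first
 *	call_rcu(&old_fp->rcu, free_foo);	// freed after a grace period
 */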