[urcu.git] / urcu.h

#ifndef _URCU_H
#define _URCU_H

/*
 * urcu.h
 *
 * Userspace RCU header
 *
 * Copyright February 2009 - Mathieu Desnoyers <mathieu.desnoyers@polymtl.ca>
 *
 * Credits for Paul e. McKenney <paulmck@linux.vnet.ibm.com>
 * for inspiration coming from the Linux kernel RCU and rcu-preempt.
 *
 * The barrier, mb, rmb, wmb, atomic_inc, smp_read_barrier_depends, ACCESS_ONCE
 * and rcu_dereference primitives come from the Linux kernel.
 *
 * Distributed under GPLv2
 */

#include <stdlib.h>
#include <pthread.h>

/* The "volatile" is due to gcc bugs */
#define barrier() __asm__ __volatile__("": : :"memory")

/*
 * Branch-prediction hints. The condition is normalized to 0 or 1 and handed
 * to __builtin_expect() together with the outcome the caller expects.
 */
#define likely(x)	__builtin_expect((x) != 0, 1)
#define unlikely(x)	__builtin_expect((x) != 0, 0)

/*
 * Nothing here tells us whether the machine is uniprocessor, so an SMP
 * machine is always assumed.
 */
#define CONFIG_SMP 1

/*
 * smp_*() flavours of the barrier primitives. Without CONFIG_SMP they all
 * collapse to a compiler barrier(); with it they map onto mb(), rmb(), wmb(),
 * mc(), rmc() and wmc(), none of which is defined in this header.
 */
#if !defined(CONFIG_SMP)
#define smp_mb()	barrier()
#define smp_rmb()	barrier()
#define smp_wmb()	barrier()
#define smp_mc()	barrier()
#define smp_rmc()	barrier()
#define smp_wmc()	barrier()
#else
#define smp_mb()	mb()
#define smp_rmb()	rmb()
#define smp_wmb()	wmb()
#define smp_mc()	mc()
#define smp_rmc()	rmc()
#define smp_wmc()	wmc()
#endif

#include "arch.h"

/*
 * Data-dependency read barrier. Defined empty here, so it expands to nothing.
 * Nop everywhere except on alpha.
 * NOTE(review): no Alpha-specific definition is visible in this header -
 * confirm whether one is expected to be provided elsewhere.
 */
#define smp_read_barrier_depends()

/*
 * Prevent the compiler from merging or refetching accesses.  The compiler
 * is also forbidden from reordering successive instances of ACCESS_ONCE(),
 * but only when the compiler is aware of some particular ordering.  One way
 * to make the compiler aware of ordering is to put the two invocations of
 * ACCESS_ONCE() in different C statements.
 *
 * This macro does absolutely -nothing- to prevent the CPU from reordering,
 * merging, or refetching absolutely anything at any time.  In the Linux
 * kernel, where it comes from, its main intended use is to mediate
 * communication between process-level code and irq/NMI handlers, all
 * running on the same CPU.
 *
 * The result is an lvalue: it can be read from or assigned to. x must be
 * something whose address can be taken.
 *
 * Spelled with __typeof__ rather than typeof so that the expansion is also
 * accepted when the including file is built in a strict ISO mode
 * (-std=c99, -std=c11, ...), where gcc does not treat "typeof" as a keyword.
 */
#define ACCESS_ONCE(x) (*(volatile __typeof__(x) *)&(x))

/*
 * Identify a shared load. A smp_rmc() or smp_mc() should come before the load.
 *
 * Expands to ACCESS_ONCE(p) and issues no barrier of its own.
 */
#define _LOAD_SHARED(p)	       ACCESS_ONCE(p)

/*
 * Load a value from shared memory, doing a cache flush if required.
 *
 * Statement expression: smp_rmc() runs first, then the whole expression
 * takes the value of _LOAD_SHARED(p).
 */
#define LOAD_SHARED(p) \
	({ \
		smp_rmc(); \
		_LOAD_SHARED(p); \
	})


/*
 * Identify a shared store. A smp_wmc() or smp_mc() should follow the store.
 *
 * The store goes through ACCESS_ONCE() so that, like the load done by
 * _LOAD_SHARED(), it is a volatile access: the compiler may not split it,
 * merge it with a neighbouring store or drop it. No barrier is issued here.
 *
 * Expands to a do { } while (0) statement and yields no value. x must be an
 * lvalue whose address can be taken.
 */
#define _STORE_SHARED(x, v) \
	do { \
		ACCESS_ONCE(x) = (v); \
	} while (0)

/*
 * Store v into x, where x is located in shared memory. Performs the required
 * cache flush after writing.
 *
 * Expands to a do { } while (0) statement, so it yields no value: the store
 * done by _STORE_SHARED() comes first and smp_wmc() follows it.
 */
#define STORE_SHARED(x, v) \
	do { \
		_STORE_SHARED(x, v); \
		smp_wmc(); \
	} while (0)

/**
 * rcu_dereference - fetch an RCU-protected pointer in an
 * RCU read-side critical section.  This pointer may later
 * be safely dereferenced.
 *
 * Inserts memory barriers on architectures that require them
 * (currently only the Alpha), and, more importantly, documents
 * exactly which pointers are protected by RCU.
 *
 * The pointer is read once through LOAD_SHARED() into a local of the same
 * type, smp_read_barrier_depends() is issued, and the local is the value of
 * the whole expression.
 *
 * The local is declared with __typeof__ rather than typeof so that the
 * expansion is also accepted in strict ISO modes (-std=c99, -std=c11, ...),
 * where gcc does not treat "typeof" as a keyword.
 */
#define rcu_dereference(p)     ({ \
				__typeof__(p) _________p1 = LOAD_SHARED(p); \
				smp_read_barrier_depends(); \
				(_________p1); \
				})

/*
 * Signal number used by urcu: an alias of SIGUSR1.
 * NOTE(review): presumably this is the signal whose handler is referred to
 * in rcu_read_lock(). This header does not include <signal.h> itself, so
 * SIGUSR1 has to be declared by whoever expands SIGURCU - confirm.
 */
#define SIGURCU SIGUSR1

/*
 * If a reader is really non-cooperative and refuses to commit its
 * urcu_active_readers count to memory (there is no barrier in the reader
 * per se), kick it after this many loops spent waiting for it.
 * The constant is not used anywhere in this header.
 */
#define KICK_READER_LOOPS 10000

#ifdef DEBUG_YIELD
#include <sched.h>
#include <time.h>
#include <pthread.h>
#include <unistd.h>

/* Bits of yield_active: enable random yields in readers and/or writers. */
#define YIELD_READ	0x1
#define YIELD_WRITE	0x2

/*
 * Bound, in us, on the random sleep taken by the debug yield helpers.
 * Updates without DEBUG_FULL_MB are much slower, so that configuration gets
 * the longer delay.
 */
#ifndef DEBUG_FULL_MB
#define MAX_SLEEP 30000
#else
#define MAX_SLEEP 50
#endif

/* Bitmask of YIELD_READ / YIELD_WRITE tested by the debug_yield_*() helpers. */
extern unsigned int yield_active;
/* Per-thread seed passed to rand_r(); set by debug_yield_init(). */
extern unsigned int __thread rand_yield;

/*
 * Debug aid for the read side: when YIELD_READ is set in yield_active, flip
 * a coin with rand_r() and, on odd, sleep for a random number of
 * microseconds below MAX_SLEEP.
 */
static inline void debug_yield_read(void)
{
	if (!(yield_active & YIELD_READ))
		return;
	if (!(rand_r(&rand_yield) & 0x1))
		return;
	usleep(rand_r(&rand_yield) % MAX_SLEEP);
}

/*
 * Debug aid for the write side: when YIELD_WRITE is set in yield_active,
 * flip a coin with rand_r() and, on odd, sleep for a random number of
 * microseconds below MAX_SLEEP.
 */
static inline void debug_yield_write(void)
{
	if ((yield_active & YIELD_WRITE) && (rand_r(&rand_yield) & 0x1)) {
		usleep(rand_r(&rand_yield) % MAX_SLEEP);
	}
}

/*
 * Seed the calling thread's rand_yield from the current time XORed with the
 * thread id, so that each thread gets its own sequence.
 * NOTE(review): the XOR requires pthread_t to be an integer type - confirm
 * for every target platform.
 */
static inline void debug_yield_init(void)
{
	time_t now = time(NULL);
	pthread_t self = pthread_self();

	rand_yield = now ^ self;
}
#else
/* Without DEBUG_YIELD the read-side yield hook does nothing. */
static inline void debug_yield_read(void) { }

/* Without DEBUG_YIELD the write-side yield hook does nothing. */
static inline void debug_yield_write(void) { }

/* Without DEBUG_YIELD there is no per-thread seed to set up. */
static inline void debug_yield_init(void) { }
#endif

/*
 * Barrier placed by rcu_read_lock() and rcu_read_unlock() around the
 * read-side critical section.
 *
 * With DEBUG_FULL_MB it is a full smp_mb(); otherwise only a compiler
 * barrier().
 *
 * Declared with an explicit (void) parameter list, like the other inline
 * helpers of this header, so that the definition also provides a prototype
 * and a call with arguments is diagnosed.
 */
static inline void reader_barrier(void)
{
#ifdef DEBUG_FULL_MB
	smp_mb();
#else
	barrier();
#endif
}

/*
 * Layout of the reader counters.
 *
 * RCU_GP_COUNT is the unit by which the nesting count changes.
 * RCU_GP_CTR_BIT sits at a bit position equal to half the width of a long
 * (sizeof(long) * 4); the trick is that this position is a multiple of 8, so
 * a full 8-bits, 16-bits or 32-bits bitmask can be used for the lower order
 * bits.
 * RCU_GP_CTR_NEST_MASK covers every bit below RCU_GP_CTR_BIT.
 */
#define RCU_GP_COUNT		1UL
#define RCU_GP_CTR_BIT		(1UL << (sizeof(long) * 4))
#define RCU_GP_CTR_NEST_MASK	(RCU_GP_CTR_BIT - 1UL)

/*
 * Global quiescent period counter. rcu_read_lock() copies it into the
 * reader's urcu_active_readers and rcu_old_gp_ongoing() compares its
 * RCU_GP_CTR_BIT with the one held by a reader.
 * Using a long rather than a char to eliminate false register dependencies
 * causing stalls on some architectures.
 */
extern long urcu_gp_ctr;

/*
 * Per-thread reader counter: the bits under RCU_GP_CTR_NEST_MASK are tested
 * by rcu_read_lock() to detect nesting, and the whole value is overwritten
 * with urcu_gp_ctr on the outermost lock.
 */
extern long __thread urcu_active_readers;

/*
 * Tell whether the reader counter pointed to by value still belongs to a
 * read-side critical section that started under the other grace-period
 * parity.
 *
 * Returns 0 when value is NULL or when the nesting bits of the counter are
 * all clear; otherwise returns 1 if the counter's RCU_GP_CTR_BIT differs
 * from the one in urcu_gp_ctr, and 0 if it matches.
 */
static inline int rcu_old_gp_ongoing(long *value)
{
	long snapshot;

	if (!value)
		return 0;
	/*
	 * Read the counter exactly once so that both tests below look at the
	 * same version of it.
	 */
	snapshot = LOAD_SHARED(*value);
	if (!(snapshot & RCU_GP_CTR_NEST_MASK))
		return 0;
	return ((snapshot ^ urcu_gp_ctr) & RCU_GP_CTR_BIT) != 0;
}

/*
 * Enter an RCU read-side critical section.
 *
 * Operates on the calling thread's urcu_active_readers. When its nesting
 * bits (RCU_GP_CTR_NEST_MASK) are all clear, i.e. on the outermost lock, the
 * counter is overwritten with a snapshot of the global urcu_gp_ctr;
 * otherwise the nesting count is raised by RCU_GP_COUNT. reader_barrier()
 * is issued last.
 */
static inline void rcu_read_lock(void)
{
	long tmp;

	tmp = urcu_active_readers;
	/* urcu_gp_ctr = RCU_GP_COUNT | (~RCU_GP_CTR_BIT or RCU_GP_CTR_BIT) */
	/*
	 * The data dependency "read urcu_gp_ctr, write urcu_active_readers",
	 * serializes those two memory operations. The memory barrier in the
	 * signal handler ensures we receive the proper memory commit barriers
	 * required by _STORE_SHARED and _LOAD_SHARED whenever communication
	 * with the writer is needed.
	 */
	if (likely(!(tmp & RCU_GP_CTR_NEST_MASK)))
		_STORE_SHARED(urcu_active_readers, _LOAD_SHARED(urcu_gp_ctr));
	else
		_STORE_SHARED(urcu_active_readers, tmp + RCU_GP_COUNT);
	/*
	 * Increment active readers count before accessing the pointer.
	 * See force_mb_all_threads().
	 */
	reader_barrier();
}

/*
 * Leave an RCU read-side critical section.
 *
 * Issues reader_barrier() and then lowers the calling thread's
 * urcu_active_readers by RCU_GP_COUNT. The subtraction is unconditional:
 * nothing here checks that a matching rcu_read_lock() was done.
 */
static inline void rcu_read_unlock(void)
{
	reader_barrier();
	/*
	 * Finish using rcu before decrementing the active readers count.
	 * See force_mb_all_threads().
	 */
	_STORE_SHARED(urcu_active_readers, urcu_active_readers - RCU_GP_COUNT);
}

/**
 * rcu_assign_pointer - assign (publicize) a pointer to a newly
 * initialized structure that will be dereferenced by RCU read-side
 * critical sections.  Returns the value assigned.
 *
 * Inserts memory barriers on architectures that require them
 * (pretty much all of them other than x86), and also prevents
 * the compiler from reordering the code that initializes the
 * structure after the pointer assignment.  More importantly, this
 * call documents which pointers will be dereferenced by RCU read-side
 * code.
 *
 * v is evaluated once, into a local that has the type of p; that local is
 * what gets stored and what the whole expression evaluates to. The wmb() is
 * skipped only when v is a compile-time constant equal to NULL, since there
 * is then no initialization to order before the store.
 */
#define rcu_assign_pointer(p, v) \
	({ \
		__typeof__(p) _________pv = (v); \
		if (!__builtin_constant_p(v) || \
		    ((v) != NULL)) \
			wmb(); \
		STORE_SHARED(p, _________pv); \
		_________pv; \
	})

/**
 * rcu_xchg_pointer - exchange an RCU-protected pointer.
 *
 * Issues wmb() unless v is a compile-time constant equal to NULL, then
 * evaluates to xchg(p, v). xchg() is not defined in this header.
 * NOTE(review): presumably xchg() comes from arch.h and returns the value
 * that was previously stored, which is how urcu_publish_content() uses the
 * result - confirm, including whether p must be a pointer to the slot.
 */
#define rcu_xchg_pointer(p, v) \
	({ \
		if (!__builtin_constant_p(v) || \
		    ((v) != NULL)) \
			wmb(); \
		xchg(p, v); \
	})

/*
 * Defined outside this header.
 * NOTE(review): judging by its use in urcu_publish_content(), it waits for a
 * quiescent state before returning - confirm against the implementation.
 */
extern void synchronize_rcu(void);

/*
 * Exchanges the pointer and waits for quiescent state.
 * The pointer returned can be freed.
 *
 * p and v are handed unchanged to rcu_xchg_pointer(); its result is kept in
 * a local, synchronize_rcu() is called, and the local (a void *) is the
 * value of the whole expression.
 *
 * The local carries a long underscore prefix, like the one used by
 * rcu_dereference(), so that an argument which itself mentions a variable
 * called "oldptr" is not captured by the macro's own declaration.
 */
#define urcu_publish_content(p, v) \
	({ \
		void *_________oldptr; \
		_________oldptr = rcu_xchg_pointer(p, v); \
		synchronize_rcu(); \
		_________oldptr; \
	})

/*
 * Reader thread registration.
 * Both functions are defined outside this header.
 * NOTE(review): presumably each reader thread calls urcu_register_thread()
 * before its first rcu_read_lock() and urcu_unregister_thread() before it
 * exits - confirm against the implementation.
 */
extern void urcu_register_thread(void);
extern void urcu_unregister_thread(void);

#endif /* _URCU_H */
Commit	Line	Data
	1	#ifndef _URCU_H
	2	#define _URCU_H
	3
	4	/*
	5	* urcu.h
	6	*
	7	* Userspace RCU header
	8	*
	9	* Copyright February 2009 - Mathieu Desnoyers <mathieu.desnoyers@polymtl.ca>
	10	*
	11	* Credits for Paul e. McKenney <paulmck@linux.vnet.ibm.com>
	12	* for inspiration coming from the Linux kernel RCU and rcu-preempt.
	13	*
	14	* The barrier, mb, rmb, wmb, atomic_inc, smp_read_barrier_depends, ACCESS_ONCE
	15	* and rcu_dereference primitives come from the Linux kernel.
	16	*
	17	* Distributed under GPLv2
	18	*/
	19
	20	#include <stdlib.h>
	21	#include <pthread.h>
	22
	23	/* The "volatile" is due to gcc bugs */
	24	#define barrier() __asm__ __volatile__("": : :"memory")
	25
	26	#define likely(x) __builtin_expect(!!(x), 1)
	27	#define unlikely(x) __builtin_expect(!!(x), 0)
	28
	29	/* Assume SMP machine, given we don't have this information */
	30	#define CONFIG_SMP 1
	31
	32
	33	#ifdef CONFIG_SMP
	34	#define smp_mb() mb()
	35	#define smp_rmb() rmb()
	36	#define smp_wmb() wmb()
	37	#define smp_mc() mc()
	38	#define smp_rmc() rmc()
	39	#define smp_wmc() wmc()
	40	#else
	41	#define smp_mb() barrier()
	42	#define smp_rmb() barrier()
	43	#define smp_wmb() barrier()
	44	#define smp_mc() barrier()
	45	#define smp_rmc() barrier()
	46	#define smp_wmc() barrier()
	47	#endif
	48
	49	#include "arch.h"
	50
	51	/* Nop everywhere except on alpha. */
	52	#define smp_read_barrier_depends()
	53
	54	/*
	55	* Prevent the compiler from merging or refetching accesses. The compiler
	56	* is also forbidden from reordering successive instances of ACCESS_ONCE(),
	57	* but only when the compiler is aware of some particular ordering. One way
	58	* to make the compiler aware of ordering is to put the two invocations of
	59	* ACCESS_ONCE() in different C statements.
	60	*
	61	* This macro does absolutely -nothing- to prevent the CPU from reordering,
	62	* merging, or refetching absolutely anything at any time. Its main intended
	63	* use is to mediate communication between process-level code and irq/NMI
	64	* handlers, all running on the same CPU.
	65	*/
	66	#define ACCESS_ONCE(x) (*(volatile typeof(x) *)&(x))
	67
	68	/*
	69	* Identify a shared load. A smp_rmc() or smp_mc() should come before the load.
	70	*/
	71	#define _LOAD_SHARED(p) ACCESS_ONCE(p)
	72
	73	/*
	74	* Load a data from shared memory, doing a cache flush if required.
	75	*/
	76	#define LOAD_SHARED(p) \
	77	({ \
	78	smp_rmc(); \
	79	_LOAD_SHARED(p); \
	80	})
	81
	82
	83	/*
	84	* Identify a shared store. A smp_wmc() or smp_mc() should follow the store.
	85	*/
	86	#define _STORE_SHARED(x, v) \
	87	do { \
	88	(x) = (v); \
	89	} while (0)
	90
	91	/*
	92	* Store v into x, where x is located in shared memory. Performs the required
	93	* cache flush after writing.
	94	*/
	95	#define STORE_SHARED(x, v) \
	96	do { \
	97	_STORE_SHARED(x, v); \
	98	smp_wmc(); \
	99	} while (0)
	100
	101	/**
	102	* rcu_dereference - fetch an RCU-protected pointer in an
	103	* RCU read-side critical section. This pointer may later
	104	* be safely dereferenced.
	105	*
	106	* Inserts memory barriers on architectures that require them
	107	* (currently only the Alpha), and, more importantly, documents
	108	* exactly which pointers are protected by RCU.
	109	*/
	110
	111	#define rcu_dereference(p) ({ \
	112	typeof(p) _________p1 = LOAD_SHARED(p); \
	113	smp_read_barrier_depends(); \
	114	(_________p1); \
	115	})
	116
	117	#define SIGURCU SIGUSR1
	118
	119	/*
	120	* If a reader is really non-cooperative and refuses to commit its
	121	* urcu_active_readers count to memory (there is no barrier in the reader
	122	* per-se), kick it after a few loops waiting for it.
	123	*/
	124	#define KICK_READER_LOOPS 10000
	125
	126	#ifdef DEBUG_YIELD
	127	#include <sched.h>
	128	#include <time.h>
	129	#include <pthread.h>
	130	#include <unistd.h>
	131
	132	#define YIELD_READ (1 << 0)
	133	#define YIELD_WRITE (1 << 1)
	134
	135	/* Updates without DEBUG_FULL_MB are much slower. Account this in the delay */
	136	#ifdef DEBUG_FULL_MB
	137	/* maximum sleep delay, in us */
	138	#define MAX_SLEEP 50
	139	#else
	140	#define MAX_SLEEP 30000
	141	#endif
	142
	143	extern unsigned int yield_active;
	144	extern unsigned int __thread rand_yield;
	145
	146	static inline void debug_yield_read(void)
	147	{
	148	if (yield_active & YIELD_READ)
	149	if (rand_r(&rand_yield) & 0x1)
	150	usleep(rand_r(&rand_yield) % MAX_SLEEP);
	151	}
	152
	153	static inline void debug_yield_write(void)
	154	{
	155	if (yield_active & YIELD_WRITE)
	156	if (rand_r(&rand_yield) & 0x1)
	157	usleep(rand_r(&rand_yield) % MAX_SLEEP);
	158	}
	159
	160	static inline void debug_yield_init(void)
	161	{
	162	rand_yield = time(NULL) ^ pthread_self();
	163	}
	164	#else
	165	static inline void debug_yield_read(void)
	166	{
	167	}
	168
	169	static inline void debug_yield_write(void)
	170	{
	171	}
	172
	173	static inline void debug_yield_init(void)
	174	{
	175
	176	}
	177	#endif
	178
	179	#ifdef DEBUG_FULL_MB
	180	static inline void reader_barrier()
	181	{
	182	smp_mb();
	183	}
	184	#else
	185	static inline void reader_barrier()
	186	{
	187	barrier();
	188	}
	189	#endif
	190
	191	/*
	192	* The trick here is that RCU_GP_CTR_BIT must be a multiple of 8 so we can use a
	193	* full 8-bits, 16-bits or 32-bits bitmask for the lower order bits.
	194	*/
	195	#define RCU_GP_COUNT (1UL << 0)
	196	/* Use the amount of bits equal to half of the architecture long size */
	197	#define RCU_GP_CTR_BIT (1UL << (sizeof(long) << 2))
	198	#define RCU_GP_CTR_NEST_MASK (RCU_GP_CTR_BIT - 1)
	199
	200	/*
	201	* Global quiescent period counter with low-order bits unused.
	202	* Using a int rather than a char to eliminate false register dependencies
	203	* causing stalls on some architectures.
	204	*/
	205	extern long urcu_gp_ctr;
	206
	207	extern long __thread urcu_active_readers;
	208
	209	static inline int rcu_old_gp_ongoing(long *value)
	210	{
	211	long v;
	212
	213	if (value == NULL)
	214	return 0;
	215	/*
	216	* Make sure both tests below are done on the same version of *value
	217	* to insure consistency.
	218	*/
	219	v = LOAD_SHARED(*value);
	220	return (v & RCU_GP_CTR_NEST_MASK) &&
	221	((v ^ urcu_gp_ctr) & RCU_GP_CTR_BIT);
	222	}
	223
	224	static inline void rcu_read_lock(void)
	225	{
	226	long tmp;
	227
	228	tmp = urcu_active_readers;
	229	/* urcu_gp_ctr = RCU_GP_COUNT | (~RCU_GP_CTR_BIT or RCU_GP_CTR_BIT) */
	230	/*
	231	* The data dependency "read urcu_gp_ctr, write urcu_active_readers",
	232	* serializes those two memory operations. The memory barrier in the
	233	* signal handler ensures we receive the proper memory commit barriers
	234	* required by _STORE_SHARED and _LOAD_SHARED whenever communication
	235	* with the writer is needed.
	236	*/
	237	if (likely(!(tmp & RCU_GP_CTR_NEST_MASK)))
	238	_STORE_SHARED(urcu_active_readers, _LOAD_SHARED(urcu_gp_ctr));
	239	else
	240	_STORE_SHARED(urcu_active_readers, tmp + RCU_GP_COUNT);
	241	/*
	242	* Increment active readers count before accessing the pointer.
	243	* See force_mb_all_threads().
	244	*/
	245	reader_barrier();
	246	}
	247
	248	static inline void rcu_read_unlock(void)
	249	{
	250	reader_barrier();
	251	/*
	252	* Finish using rcu before decrementing the pointer.
	253	* See force_mb_all_threads().
	254	*/
	255	_STORE_SHARED(urcu_active_readers, urcu_active_readers - RCU_GP_COUNT);
	256	}
	257
	258	/**
	259	* rcu_assign_pointer - assign (publicize) a pointer to a newly
	260	* initialized structure that will be dereferenced by RCU read-side
	261	* critical sections. Returns the value assigned.
	262	*
	263	* Inserts memory barriers on architectures that require them
	264	* (pretty much all of them other than x86), and also prevents
	265	* the compiler from reordering the code that initializes the
	266	* structure after the pointer assignment. More importantly, this
	267	* call documents which pointers will be dereferenced by RCU read-side
	268	* code.
	269	*/
	270
	271	#define rcu_assign_pointer(p, v) \
	272	({ \
	273	if (!__builtin_constant_p(v) || \
	274	((v) != NULL)) \
	275	wmb(); \
	276	STORE_SHARED(p, v); \
	277	})
	278
	279	#define rcu_xchg_pointer(p, v) \
	280	({ \
	281	if (!__builtin_constant_p(v) || \
	282	((v) != NULL)) \
	283	wmb(); \
	284	xchg(p, v); \
	285	})
	286
	287	extern void synchronize_rcu(void);
	288
	289	/*
	290	* Exchanges the pointer and waits for quiescent state.
	291	* The pointer returned can be freed.
	292	*/
	293	#define urcu_publish_content(p, v) \
	294	({ \
	295	void *oldptr; \
	296	oldptr = rcu_xchg_pointer(p, v); \
	297	synchronize_rcu(); \
	298	oldptr; \
	299	})
	300
	301	/*
	302	* Reader thread registration.
	303	*/
	304	extern void urcu_register_thread(void);
	305	extern void urcu_unregister_thread(void);
	306
	307	#endif /* _URCU_H */