Implement rcu_barrier()
author Mathieu Desnoyers <mathieu.desnoyers@efficios.com>
Fri, 31 May 2013 15:32:16 +0000 (11:32 -0400)
committer Mathieu Desnoyers <mathieu.desnoyers@efficios.com>
Fri, 14 Jun 2013 21:23:34 +0000 (17:23 -0400)
Waits for all in-flight call_rcu handlers to complete execution before
returning.

Signed-off-by: Mathieu Desnoyers <mathieu.desnoyers@efficios.com>
urcu-call-rcu-impl.h
urcu-call-rcu.h
urcu-flavor.h
urcu/map/urcu-bp.h
urcu/map/urcu-qsbr.h
urcu/map/urcu.h

index f7f0f71eeeb28fec5152a8a81194c141035cd550..fb3568f802f210d2015b9a42e9d20691ee59df4c 100644 (file)
@@ -64,6 +64,16 @@ struct call_rcu_data {
        struct cds_list_head list;
 } __attribute__((aligned(CAA_CACHE_LINE_SIZE)));
 
+struct call_rcu_completion {   /* shared state for one rcu_barrier() call */
+       int barrier_count;      /* completion callbacks that have not run yet */
+       int32_t futex;          /* rcu_barrier() sleeps on this while it is -1 */
+};
+
+struct call_rcu_completion_work {      /* one queued completion callback */
+       struct rcu_head head;   /* node handed to _call_rcu() */
+       struct call_rcu_completion *completion; /* state to signal when run */
+};
+
 /*
  * List of all call_rcu_data structures to keep valgrind happy.
  * Protected by call_rcu_mutex.
@@ -236,6 +246,26 @@ static void call_rcu_wake_up(struct call_rcu_data *crdp)
        }
 }
 
+static void call_rcu_completion_wait(struct call_rcu_completion *completion)
+{
+       /* Order the caller's read of barrier_count before reading futex. */
+       cmm_smp_mb();
+       if (uatomic_read(&completion->futex) == -1)
+               futex_async(&completion->futex, FUTEX_WAIT, -1,
+                     NULL, NULL, 0);
+}
+
+static void call_rcu_completion_wake_up(struct call_rcu_completion *completion)
+{
+       /* Order the caller's write to barrier_count before touching futex. */
+       cmm_smp_mb();
+       if (caa_unlikely(uatomic_read(&completion->futex) == -1)) {
+               uatomic_set(&completion->futex, 0);     /* reset before waking */
+               futex_async(&completion->futex, FUTEX_WAKE, 1,
+                     NULL, NULL, 0);
+       }
+}
+
 /* This is the code run by each call_rcu thread. */
 
 static void *call_rcu_thread(void *arg)
@@ -604,6 +634,17 @@ static void wake_call_rcu_thread(struct call_rcu_data *crdp)
                call_rcu_wake_up(crdp);
 }
 
+static void _call_rcu(struct rcu_head *head,
+                     void (*func)(struct rcu_head *head),
+                     struct call_rcu_data *crdp)
+{      /* Queue head (with callback func) on crdp, then call wake_call_rcu_thread(). */
+       cds_wfcq_node_init(&head->next);
+       head->func = func;      /* callback is stored in the head itself */
+       cds_wfcq_enqueue(&crdp->cbs_head, &crdp->cbs_tail, &head->next);
+       uatomic_inc(&crdp->qlen);       /* account for the newly queued callback */
+       wake_call_rcu_thread(crdp);
+}
+
 /*
  * Schedule a function to be invoked after a following grace period.
  * This is the only function that must be called -- the others are
@@ -618,20 +659,15 @@ static void wake_call_rcu_thread(struct call_rcu_data *crdp)
  *
  * call_rcu must be called by registered RCU read-side threads.
  */
-
 void call_rcu(struct rcu_head *head,
              void (*func)(struct rcu_head *head))
 {
        struct call_rcu_data *crdp;
 
-       cds_wfcq_node_init(&head->next);
-       head->func = func;
        /* Holding rcu read-side lock across use of per-cpu crdp */
        rcu_read_lock();
        crdp = get_call_rcu_data();
-       cds_wfcq_enqueue(&crdp->cbs_head, &crdp->cbs_tail, &head->next);
-       uatomic_inc(&crdp->qlen);
-       wake_call_rcu_thread(crdp);
+       _call_rcu(head, func, crdp);
        rcu_read_unlock();
 }
 
@@ -730,6 +766,89 @@ void free_all_cpu_call_rcu_data(void)
        free(crdp);
 }
 
+static
+void _rcu_barrier_complete(struct rcu_head *head)
+{      /* Callback queued by rcu_barrier(): signal the completion, free the work item. */
+       struct call_rcu_completion_work *work;
+       struct call_rcu_completion *completion;
+
+       work = caa_container_of(head, struct call_rcu_completion_work, head);
+       completion = work->completion;
+       uatomic_dec(&completion->barrier_count);        /* one fewer callback outstanding */
+       call_rcu_completion_wake_up(completion);        /* NOTE(review): *completion must still be live here - confirm */
+       free(work);
+}
+
+/*
+ * Wait for all in-flight call_rcu callbacks to complete execution.
+ * Must not be called from within an RCU read-side critical section.
+ */
+void rcu_barrier(void)
+{
+       struct call_rcu_data *crdp;
+       struct call_rcu_completion completion;
+       int count = 0, work_count = 0, was_online;
+
+       /* Put in offline state in QSBR. */
+       was_online = rcu_read_ongoing();
+       if (was_online)
+               rcu_thread_offline();
+       /*
+        * Calling a rcu_barrier() within a RCU read-side critical
+        * section is an error.
+        */
+       if (rcu_read_ongoing()) {
+               static int warned = 0;
+
+               if (!warned)
+                       fprintf(stderr, "[error] liburcu: rcu_barrier() called from within RCU read-side critical section.\n");
+               warned = 1;
+               goto online;
+       }
+
+       call_rcu_lock(&call_rcu_mutex);
+       cds_list_for_each_entry(crdp, &call_rcu_data_list, list)
+               count++;
+
+       completion.barrier_count = count;
+       /* The wait loop decrements futex and tests for -1: start it at 0. */
+       completion.futex = 0;
+
+       cds_list_for_each_entry(crdp, &call_rcu_data_list, list) {
+               struct call_rcu_completion_work *work;
+
+               work = calloc(1, sizeof(*work));
+               if (!work) {
+                       static int warned = 0;
+
+                       if (!warned)
+                               fprintf(stderr, "[error] liburcu: unable to allocate memory for rcu_barrier()\n");
+                       warned = 1;
+                       break;
+               }
+               work->completion = &completion;
+               _call_rcu(&work->head, _rcu_barrier_complete, crdp);
+               work_count++;
+       }
+       call_rcu_unlock(&call_rcu_mutex);
+
+       if (work_count != count)        /* allocation failed: drop the unqueued ones */
+               uatomic_sub(&completion.barrier_count, count - work_count);
+
+       /* Sleep until every queued completion callback has run. */
+       for (;;) {
+               uatomic_dec(&completion.futex);
+               /* Decrement futex before reading barrier_count */
+               cmm_smp_mb();
+               if (!uatomic_read(&completion.barrier_count))
+                       break;
+               call_rcu_completion_wait(&completion);
+       }
+online:
+       if (was_online)
+               rcu_thread_online();
+}
+
 /*
  * Acquire the call_rcu_mutex in order to ensure that the child sees
  * all of the call_rcu() data structures in a consistent state. Ensure
index 997bb2f19a7a0e1547f4cb009b48db8d42d4ee72..30388c5316776bac79722f541ccdf370ccbf7549 100644 (file)
@@ -92,6 +92,8 @@ void call_rcu_before_fork(void);
 void call_rcu_after_fork_parent(void);
 void call_rcu_after_fork_child(void);
 
+void rcu_barrier(void);
+
 #ifdef __cplusplus 
 }
 #endif
index c04f1db78ba1e113a7ff85e9d8552cfe08b342c8..5e7f292514fd389c2982c36c9d51e45265f5fa0d 100644 (file)
@@ -41,6 +41,8 @@ struct rcu_flavor_struct {
        void (*thread_online)(void);
        void (*register_thread)(void);
        void (*unregister_thread)(void);
+
+       void (*barrier)(void);
 };
 
 #define DEFINE_RCU_FLAVOR(x)                           \
@@ -56,6 +58,7 @@ const struct rcu_flavor_struct x = {                  \
        .thread_online          = rcu_thread_online,    \
        .register_thread        = rcu_register_thread,  \
        .unregister_thread      = rcu_unregister_thread,\
+       .barrier                = rcu_barrier,          \
 }
 
 extern const struct rcu_flavor_struct rcu_flavor;
index 92863fef257dfd3d5757c855a5afdf98cfa3a197..67ba5c3088fa6ebaee811367e485cc0be3c26859 100644 (file)
@@ -63,6 +63,7 @@
 #define call_rcu_before_fork           call_rcu_before_fork_bp
 #define call_rcu_after_fork_parent     call_rcu_after_fork_parent_bp
 #define call_rcu_after_fork_child      call_rcu_after_fork_child_bp
+#define rcu_barrier                    rcu_barrier_bp
 
 #define defer_rcu                      defer_rcu_bp
 #define rcu_defer_register_thread      rcu_defer_register_thread_bp
index e3261ff0c316b88efd309360d43b3d6fa2d7b33b..b89dd2487e34e35673e15879b7fe910b0e425679 100644 (file)
@@ -65,6 +65,7 @@
 #define call_rcu_before_fork           call_rcu_before_fork_qsbr
 #define call_rcu_after_fork_parent     call_rcu_after_fork_parent_qsbr
 #define call_rcu_after_fork_child      call_rcu_after_fork_child_qsbr
+#define rcu_barrier                    rcu_barrier_qsbr
 
 #define defer_rcu                      defer_rcu_qsbr
 #define rcu_defer_register_thread      rcu_defer_register_thread_qsbr
index 77b37215734bfa163fbe680a3582a5b8a0b2af66..8f04cafcde5df141f84bd4f9067e0485147fd1d7 100644 (file)
@@ -69,6 +69,7 @@
 #define call_rcu_before_fork           call_rcu_before_fork_memb
 #define call_rcu_after_fork_parent     call_rcu_after_fork_parent_memb
 #define call_rcu_after_fork_child      call_rcu_after_fork_child_memb
+#define rcu_barrier                    rcu_barrier_memb
 
 #define defer_rcu                      defer_rcu_memb
 #define rcu_defer_register_thread      rcu_defer_register_thread_memb
 #define call_rcu_before_fork           call_rcu_before_fork_sig
 #define call_rcu_after_fork_parent     call_rcu_after_fork_parent_sig
 #define call_rcu_after_fork_child      call_rcu_after_fork_child_sig
+#define rcu_barrier                    rcu_barrier_sig
 
 #define defer_rcu                      defer_rcu_sig
 #define rcu_defer_register_thread      rcu_defer_register_thread_sig
 #define call_rcu_before_fork           call_rcu_before_fork_mb
 #define call_rcu_after_fork_parent     call_rcu_after_fork_parent_mb
 #define call_rcu_after_fork_child      call_rcu_after_fork_child_mb
+#define rcu_barrier                    rcu_barrier_mb
 
 #define defer_rcu                      defer_rcu_mb
 #define rcu_defer_register_thread      rcu_defer_register_thread_mb
This page took 0.028912 seconds and 4 git commands to generate.