Commit 15fecf89 authored by Paul E. McKenney's avatar Paul E. McKenney

srcu: Abstract multi-tail callback list handling

RCU has only one multi-tail callback list, which is implemented via
the nxtlist, nxttail, nxtcompleted, qlen_lazy, and qlen fields in the
rcu_data structure, and whose operations are open-code throughout the
Tree RCU implementation.  This has been more or less OK in the past,
but upcoming callback-list optimizations in SRCU could really use
a multi-tail callback list there as well.

This commit therefore abstracts the multi-tail callback list handling
into a new kernel/rcu/rcu_segcblist.h file, and uses this new API.
The simple head-and-tail pointer callback list is also abstracted and
applied everywhere except for the NOCB callback-offload lists.  (Yes,
the plan is to apply them there as well, but this commit is already
bigger than would be good.)
Signed-off-by: default avatarPaul E. McKenney <paulmck@linux.vnet.ibm.com>
parent b8c78d3a
This diff is collapsed.
This diff is collapsed.
...@@ -30,6 +30,7 @@ ...@@ -30,6 +30,7 @@
#include <linux/seqlock.h> #include <linux/seqlock.h>
#include <linux/swait.h> #include <linux/swait.h>
#include <linux/stop_machine.h> #include <linux/stop_machine.h>
#include "rcu_segcblist.h"
/* /*
* Define shape of hierarchy based on NR_CPUS, CONFIG_RCU_FANOUT, and * Define shape of hierarchy based on NR_CPUS, CONFIG_RCU_FANOUT, and
...@@ -335,34 +336,9 @@ struct rcu_data { ...@@ -335,34 +336,9 @@ struct rcu_data {
/* period it is aware of. */ /* period it is aware of. */
/* 2) batch handling */ /* 2) batch handling */
/* struct rcu_segcblist cblist; /* Segmented callback list, with */
* If nxtlist is not NULL, it is partitioned as follows. /* different callbacks waiting for */
* Any of the partitions might be empty, in which case the /* different grace periods. */
* pointer to that partition will be equal to the pointer for
* the following partition. When the list is empty, all of
* the nxttail elements point to the ->nxtlist pointer itself,
* which in that case is NULL.
*
* [nxtlist, *nxttail[RCU_DONE_TAIL]):
* Entries that batch # <= ->completed
* The grace period for these entries has completed, and
* the other grace-period-completed entries may be moved
* here temporarily in rcu_process_callbacks().
* [*nxttail[RCU_DONE_TAIL], *nxttail[RCU_WAIT_TAIL]):
* Entries that batch # <= ->completed - 1: waiting for current GP
* [*nxttail[RCU_WAIT_TAIL], *nxttail[RCU_NEXT_READY_TAIL]):
* Entries known to have arrived before current GP ended
* [*nxttail[RCU_NEXT_READY_TAIL], *nxttail[RCU_NEXT_TAIL]):
* Entries that might have arrived after current GP ended
* Note that the value of *nxttail[RCU_NEXT_TAIL] will
* always be NULL, as this is the end of the list.
*/
struct rcu_head *nxtlist;
struct rcu_head **nxttail[RCU_NEXT_SIZE];
unsigned long nxtcompleted[RCU_NEXT_SIZE];
/* grace periods for sublists. */
long qlen_lazy; /* # of lazy queued callbacks */
long qlen; /* # of queued callbacks, incl lazy */
long qlen_last_fqs_check; long qlen_last_fqs_check;
/* qlen at last check for QS forcing */ /* qlen at last check for QS forcing */
unsigned long n_cbs_invoked; /* count of RCU cbs invoked. */ unsigned long n_cbs_invoked; /* count of RCU cbs invoked. */
...@@ -500,14 +476,11 @@ struct rcu_state { ...@@ -500,14 +476,11 @@ struct rcu_state {
raw_spinlock_t orphan_lock ____cacheline_internodealigned_in_smp; raw_spinlock_t orphan_lock ____cacheline_internodealigned_in_smp;
/* Protect following fields. */ /* Protect following fields. */
struct rcu_head *orphan_nxtlist; /* Orphaned callbacks that */ struct rcu_cblist orphan_pend; /* Orphaned callbacks that */
/* need a grace period. */ /* need a grace period. */
struct rcu_head **orphan_nxttail; /* Tail of above. */ struct rcu_cblist orphan_done; /* Orphaned callbacks that */
struct rcu_head *orphan_donelist; /* Orphaned callbacks that */
/* are ready to invoke. */ /* are ready to invoke. */
struct rcu_head **orphan_donetail; /* Tail of above. */ /* (Contains counts.) */
long qlen_lazy; /* Number of lazy callbacks. */
long qlen; /* Total number of callbacks. */
/* End of fields guarded by orphan_lock. */ /* End of fields guarded by orphan_lock. */
struct mutex barrier_mutex; /* Guards barrier fields. */ struct mutex barrier_mutex; /* Guards barrier fields. */
......
...@@ -1350,10 +1350,10 @@ static bool __maybe_unused rcu_try_advance_all_cbs(void) ...@@ -1350,10 +1350,10 @@ static bool __maybe_unused rcu_try_advance_all_cbs(void)
*/ */
if ((rdp->completed != rnp->completed || if ((rdp->completed != rnp->completed ||
unlikely(READ_ONCE(rdp->gpwrap))) && unlikely(READ_ONCE(rdp->gpwrap))) &&
rdp->nxttail[RCU_DONE_TAIL] != rdp->nxttail[RCU_NEXT_TAIL]) rcu_segcblist_pend_cbs(&rdp->cblist))
note_gp_changes(rsp, rdp); note_gp_changes(rsp, rdp);
if (cpu_has_callbacks_ready_to_invoke(rdp)) if (rcu_segcblist_ready_cbs(&rdp->cblist))
cbs_ready = true; cbs_ready = true;
} }
return cbs_ready; return cbs_ready;
...@@ -1461,7 +1461,7 @@ static void rcu_prepare_for_idle(void) ...@@ -1461,7 +1461,7 @@ static void rcu_prepare_for_idle(void)
rdtp->last_accelerate = jiffies; rdtp->last_accelerate = jiffies;
for_each_rcu_flavor(rsp) { for_each_rcu_flavor(rsp) {
rdp = this_cpu_ptr(rsp->rda); rdp = this_cpu_ptr(rsp->rda);
if (!*rdp->nxttail[RCU_DONE_TAIL]) if (rcu_segcblist_pend_cbs(&rdp->cblist))
continue; continue;
rnp = rdp->mynode; rnp = rdp->mynode;
raw_spin_lock_rcu_node(rnp); /* irqs already disabled. */ raw_spin_lock_rcu_node(rnp); /* irqs already disabled. */
...@@ -1529,7 +1529,7 @@ static void rcu_oom_notify_cpu(void *unused) ...@@ -1529,7 +1529,7 @@ static void rcu_oom_notify_cpu(void *unused)
for_each_rcu_flavor(rsp) { for_each_rcu_flavor(rsp) {
rdp = raw_cpu_ptr(rsp->rda); rdp = raw_cpu_ptr(rsp->rda);
if (rdp->qlen_lazy != 0) { if (rcu_segcblist_n_lazy_cbs(&rdp->cblist)) {
atomic_inc(&oom_callback_count); atomic_inc(&oom_callback_count);
rsp->call(&rdp->oom_head, rcu_oom_callback); rsp->call(&rdp->oom_head, rcu_oom_callback);
} }
...@@ -1934,30 +1934,26 @@ static bool __maybe_unused rcu_nocb_adopt_orphan_cbs(struct rcu_state *rsp, ...@@ -1934,30 +1934,26 @@ static bool __maybe_unused rcu_nocb_adopt_orphan_cbs(struct rcu_state *rsp,
struct rcu_data *rdp, struct rcu_data *rdp,
unsigned long flags) unsigned long flags)
{ {
long ql = rsp->qlen; long ql = rcu_cblist_n_cbs(&rsp->orphan_done);
long qll = rsp->qlen_lazy; long qll = rcu_cblist_n_lazy_cbs(&rsp->orphan_done);
/* If this is not a no-CBs CPU, tell the caller to do it the old way. */ /* If this is not a no-CBs CPU, tell the caller to do it the old way. */
if (!rcu_is_nocb_cpu(smp_processor_id())) if (!rcu_is_nocb_cpu(smp_processor_id()))
return false; return false;
rsp->qlen = 0;
rsp->qlen_lazy = 0;
/* First, enqueue the donelist, if any. This preserves CB ordering. */ /* First, enqueue the donelist, if any. This preserves CB ordering. */
if (rsp->orphan_donelist != NULL) { if (!rcu_cblist_empty(&rsp->orphan_done)) {
__call_rcu_nocb_enqueue(rdp, rsp->orphan_donelist, __call_rcu_nocb_enqueue(rdp, rcu_cblist_head(&rsp->orphan_done),
rsp->orphan_donetail, ql, qll, flags); rcu_cblist_tail(&rsp->orphan_done),
ql = qll = 0; ql, qll, flags);
rsp->orphan_donelist = NULL;
rsp->orphan_donetail = &rsp->orphan_donelist;
} }
if (rsp->orphan_nxtlist != NULL) { if (!rcu_cblist_empty(&rsp->orphan_pend)) {
__call_rcu_nocb_enqueue(rdp, rsp->orphan_nxtlist, __call_rcu_nocb_enqueue(rdp, rcu_cblist_head(&rsp->orphan_pend),
rsp->orphan_nxttail, ql, qll, flags); rcu_cblist_tail(&rsp->orphan_pend),
ql = qll = 0; ql, qll, flags);
rsp->orphan_nxtlist = NULL;
rsp->orphan_nxttail = &rsp->orphan_nxtlist;
} }
rcu_cblist_init(&rsp->orphan_done);
rcu_cblist_init(&rsp->orphan_pend);
return true; return true;
} }
...@@ -2399,16 +2395,16 @@ static bool init_nocb_callback_list(struct rcu_data *rdp) ...@@ -2399,16 +2395,16 @@ static bool init_nocb_callback_list(struct rcu_data *rdp)
return false; return false;
/* If there are early-boot callbacks, move them to nocb lists. */ /* If there are early-boot callbacks, move them to nocb lists. */
if (rdp->nxtlist) { if (!rcu_segcblist_empty(&rdp->cblist)) {
rdp->nocb_head = rdp->nxtlist; rdp->nocb_head = rcu_segcblist_head(&rdp->cblist);
rdp->nocb_tail = rdp->nxttail[RCU_NEXT_TAIL]; rdp->nocb_tail = rcu_segcblist_tail(&rdp->cblist);
atomic_long_set(&rdp->nocb_q_count, rdp->qlen); atomic_long_set(&rdp->nocb_q_count,
atomic_long_set(&rdp->nocb_q_count_lazy, rdp->qlen_lazy); rcu_segcblist_n_cbs(&rdp->cblist));
rdp->nxtlist = NULL; atomic_long_set(&rdp->nocb_q_count_lazy,
rdp->qlen = 0; rcu_segcblist_n_lazy_cbs(&rdp->cblist));
rdp->qlen_lazy = 0; rcu_segcblist_init(&rdp->cblist);
} }
rdp->nxttail[RCU_NEXT_TAIL] = NULL; rcu_segcblist_disable(&rdp->cblist);
return true; return true;
} }
......
...@@ -41,6 +41,7 @@ ...@@ -41,6 +41,7 @@
#include <linux/mutex.h> #include <linux/mutex.h>
#include <linux/debugfs.h> #include <linux/debugfs.h>
#include <linux/seq_file.h> #include <linux/seq_file.h>
#include <linux/prefetch.h>
#define RCU_TREE_NONCORE #define RCU_TREE_NONCORE
#include "tree.h" #include "tree.h"
...@@ -128,17 +129,15 @@ static void print_one_rcu_data(struct seq_file *m, struct rcu_data *rdp) ...@@ -128,17 +129,15 @@ static void print_one_rcu_data(struct seq_file *m, struct rcu_data *rdp)
rdp->dynticks_fqs); rdp->dynticks_fqs);
seq_printf(m, " of=%lu", rdp->offline_fqs); seq_printf(m, " of=%lu", rdp->offline_fqs);
rcu_nocb_q_lengths(rdp, &ql, &qll); rcu_nocb_q_lengths(rdp, &ql, &qll);
qll += rdp->qlen_lazy; qll += rcu_segcblist_n_lazy_cbs(&rdp->cblist);
ql += rdp->qlen; ql += rcu_segcblist_n_cbs(&rdp->cblist);
seq_printf(m, " ql=%ld/%ld qs=%c%c%c%c", seq_printf(m, " ql=%ld/%ld qs=%c%c%c%c",
qll, ql, qll, ql,
".N"[rdp->nxttail[RCU_NEXT_READY_TAIL] != ".N"[!rcu_segcblist_segempty(&rdp->cblist, RCU_NEXT_TAIL)],
rdp->nxttail[RCU_NEXT_TAIL]], ".R"[!rcu_segcblist_segempty(&rdp->cblist,
".R"[rdp->nxttail[RCU_WAIT_TAIL] != RCU_NEXT_READY_TAIL)],
rdp->nxttail[RCU_NEXT_READY_TAIL]], ".W"[!rcu_segcblist_segempty(&rdp->cblist, RCU_WAIT_TAIL)],
".W"[rdp->nxttail[RCU_DONE_TAIL] != ".D"[!rcu_segcblist_segempty(&rdp->cblist, RCU_DONE_TAIL)]);
rdp->nxttail[RCU_WAIT_TAIL]],
".D"[&rdp->nxtlist != rdp->nxttail[RCU_DONE_TAIL]]);
#ifdef CONFIG_RCU_BOOST #ifdef CONFIG_RCU_BOOST
seq_printf(m, " kt=%d/%c ktl=%x", seq_printf(m, " kt=%d/%c ktl=%x",
per_cpu(rcu_cpu_has_work, rdp->cpu), per_cpu(rcu_cpu_has_work, rdp->cpu),
...@@ -276,7 +275,9 @@ static void print_one_rcu_state(struct seq_file *m, struct rcu_state *rsp) ...@@ -276,7 +275,9 @@ static void print_one_rcu_state(struct seq_file *m, struct rcu_state *rsp)
seq_printf(m, "nfqs=%lu/nfqsng=%lu(%lu) fqlh=%lu oqlen=%ld/%ld\n", seq_printf(m, "nfqs=%lu/nfqsng=%lu(%lu) fqlh=%lu oqlen=%ld/%ld\n",
rsp->n_force_qs, rsp->n_force_qs_ngp, rsp->n_force_qs, rsp->n_force_qs_ngp,
rsp->n_force_qs - rsp->n_force_qs_ngp, rsp->n_force_qs - rsp->n_force_qs_ngp,
READ_ONCE(rsp->n_force_qs_lh), rsp->qlen_lazy, rsp->qlen); READ_ONCE(rsp->n_force_qs_lh),
rcu_cblist_n_lazy_cbs(&rsp->orphan_done),
rcu_cblist_n_cbs(&rsp->orphan_done));
for (rnp = &rsp->node[0]; rnp - &rsp->node[0] < rcu_num_nodes; rnp++) { for (rnp = &rsp->node[0]; rnp - &rsp->node[0] < rcu_num_nodes; rnp++) {
if (rnp->level != level) { if (rnp->level != level) {
seq_puts(m, "\n"); seq_puts(m, "\n");
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment