Blame view

kernel/rcutree.c 101 KB
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
  /*
   * Read-Copy Update mechanism for mutual exclusion
   *
   * This program is free software; you can redistribute it and/or modify
   * it under the terms of the GNU General Public License as published by
   * the Free Software Foundation; either version 2 of the License, or
   * (at your option) any later version.
   *
   * This program is distributed in the hope that it will be useful,
   * but WITHOUT ANY WARRANTY; without even the implied warranty of
   * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
   * GNU General Public License for more details.
   *
   * You should have received a copy of the GNU General Public License
   * along with this program; if not, write to the Free Software
   * Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
   *
   * Copyright IBM Corporation, 2008
   *
   * Authors: Dipankar Sarma <dipankar@in.ibm.com>
   *	    Manfred Spraul <manfred@colorfullife.com>
   *	    Paul E. McKenney <paulmck@linux.vnet.ibm.com> Hierarchical version
   *
   * Based on the original work by Paul McKenney <paulmck@us.ibm.com>
   * and inputs from Rusty Russell, Andrea Arcangeli and Andi Kleen.
   *
   * For detailed explanation of Read-Copy Update mechanism see -
a71fca58b   Paul E. McKenney   rcu: Fix whitespa...
28
   *	Documentation/RCU
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
29
30
31
32
33
34
35
36
37
   */
  #include <linux/types.h>
  #include <linux/kernel.h>
  #include <linux/init.h>
  #include <linux/spinlock.h>
  #include <linux/smp.h>
  #include <linux/rcupdate.h>
  #include <linux/interrupt.h>
  #include <linux/sched.h>
c1dc0b9c0   Ingo Molnar   debug lockups: Im...
38
  #include <linux/nmi.h>
8826f3b03   Paul E. McKenney   rcu: Avoid acquir...
39
  #include <linux/atomic.h>
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
40
  #include <linux/bitops.h>
9984de1a5   Paul Gortmaker   kernel: Map most ...
41
  #include <linux/export.h>
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
42
43
44
45
46
47
48
  #include <linux/completion.h>
  #include <linux/moduleparam.h>
  #include <linux/percpu.h>
  #include <linux/notifier.h>
  #include <linux/cpu.h>
  #include <linux/mutex.h>
  #include <linux/time.h>
bbad93798   Paul E. McKenney   rcu: slim down rc...
49
  #include <linux/kernel_stat.h>
a26ac2455   Paul E. McKenney   rcu: move TREE_RC...
50
51
  #include <linux/wait.h>
  #include <linux/kthread.h>
268bb0ce3   Linus Torvalds   sanitize <linux/p...
52
  #include <linux/prefetch.h>
3d3b7db0a   Paul E. McKenney   rcu: Move synchro...
53
54
  #include <linux/delay.h>
  #include <linux/stop_machine.h>
661a85dc0   Paul E. McKenney   rcu: Add random P...
55
  #include <linux/random.h>
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
56

9f77da9f4   Paul E. McKenney   rcu: Move private...
57
  #include "rcutree.h"
29c00b4a1   Paul E. McKenney   rcu: Add event-tr...
58
59
60
  #include <trace/events/rcu.h>
  
  #include "rcu.h"
9f77da9f4   Paul E. McKenney   rcu: Move private...
61

64db4cfff   Paul E. McKenney   "Tree RCU": scala...
62
  /* Data structures. */
f885b7f2b   Paul E. McKenney   rcu: Control RCU_...
63
  static struct lock_class_key rcu_node_class[RCU_NUM_LVLS];
394f2769a   Paul E. McKenney   rcu: Prevent forc...
64
  static struct lock_class_key rcu_fqs_class[RCU_NUM_LVLS];
88b91c7ca   Peter Zijlstra   rcu: Simplify cre...
65

a48898585   Paul E. McKenney   rcu: Distinguish ...
66
  /*
   * Static initializer for the struct rcu_state variable named sname##_state.
   *
   *  sname: flavor name; pasted to form the variable name and stringified
   *         into ->name.
   *  sabbr: value stored in ->abbr.
   *  cr:    value stored in ->call.
   *
   * Both ->gpnum and ->completed start at 0UL - 300UL, that is, 300 counts
   * short of unsigned-long wraparound.
   */
  #define RCU_STATE_INITIALIZER(sname, sabbr, cr) { \
  	.level = { &sname##_state.node[0] }, \
  	.call = cr, \
  	.fqs_state = RCU_GP_IDLE, \
  	.gpnum = 0UL - 300UL, \
  	.completed = 0UL - 300UL, \
  	.orphan_lock = __RAW_SPIN_LOCK_UNLOCKED(&sname##_state.orphan_lock), \
  	.orphan_nxttail = &sname##_state.orphan_nxtlist, \
  	.orphan_donetail = &sname##_state.orphan_donelist, \
  	.barrier_mutex = __MUTEX_INITIALIZER(sname##_state.barrier_mutex), \
  	.onoff_mutex = __MUTEX_INITIALIZER(sname##_state.onoff_mutex), \
  	.name = #sname, \
  	.abbr = sabbr, \
  }
037b64ed0   Paul E. McKenney   rcu: Place pointe...
80
  struct rcu_state rcu_sched_state =
a48898585   Paul E. McKenney   rcu: Distinguish ...
81
  	RCU_STATE_INITIALIZER(rcu_sched, 's', call_rcu_sched);
d6714c22b   Paul E. McKenney   rcu: Renamings to...
82
  DEFINE_PER_CPU(struct rcu_data, rcu_sched_data);
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
83

a48898585   Paul E. McKenney   rcu: Distinguish ...
84
  struct rcu_state rcu_bh_state = RCU_STATE_INITIALIZER(rcu_bh, 'b', call_rcu_bh);
6258c4fb5   Ingo Molnar   kmemtrace, rcu: f...
85
  DEFINE_PER_CPU(struct rcu_data, rcu_bh_data);
b1f77b058   Ingo Molnar   kmemtrace, rcu: f...
86

27f4d2805   Paul E. McKenney   rcu: priority boo...
87
  static struct rcu_state *rcu_state;
6ce75a232   Paul E. McKenney   rcu: Introduce fo...
88
  LIST_HEAD(rcu_struct_flavors);
27f4d2805   Paul E. McKenney   rcu: priority boo...
89

f885b7f2b   Paul E. McKenney   rcu: Control RCU_...
90
91
  /* Increase (but not decrease) the CONFIG_RCU_FANOUT_LEAF at boot time. */
  static int rcu_fanout_leaf = CONFIG_RCU_FANOUT_LEAF;
7e5c2dfb4   Paul E. McKenney   rcu: Make rcutree...
92
  module_param(rcu_fanout_leaf, int, 0444);
f885b7f2b   Paul E. McKenney   rcu: Control RCU_...
93
94
95
96
97
98
99
100
101
  int rcu_num_lvls __read_mostly = RCU_NUM_LVLS;
  static int num_rcu_lvl[] = {  /* Number of rcu_nodes at specified level. */
  	NUM_RCU_LVL_0,
  	NUM_RCU_LVL_1,
  	NUM_RCU_LVL_2,
  	NUM_RCU_LVL_3,
  	NUM_RCU_LVL_4,
  };
  int rcu_num_nodes __read_mostly = NUM_RCU_NODES; /* Total # rcu_nodes in use. */
b0d304172   Paul E. McKenney   rcu: Prevent RCU ...
102
103
104
105
  /*
   * The rcu_scheduler_active variable transitions from zero to one just
   * before the first task is spawned.  So when this variable is zero, RCU
   * can assume that there is but one task, allowing RCU to (for example)
b44f66562   Cody P Schafer   rcu: Correct 'opt...
106
   * optimize synchronize_sched() to a simple barrier().  When this variable
b0d304172   Paul E. McKenney   rcu: Prevent RCU ...
107
108
109
110
   * is one, RCU must actually do all the hard work required to detect real
   * grace periods.  This variable is also used to suppress boot-time false
   * positives from lockdep-RCU error checking.
   */
bbad93798   Paul E. McKenney   rcu: slim down rc...
111
112
  int rcu_scheduler_active __read_mostly;
  EXPORT_SYMBOL_GPL(rcu_scheduler_active);
b0d304172   Paul E. McKenney   rcu: Prevent RCU ...
113
114
115
116
117
118
119
120
121
122
123
124
125
  /*
   * The rcu_scheduler_fully_active variable transitions from zero to one
   * during the early_initcall() processing, which is after the scheduler
   * is capable of creating new tasks.  So RCU processing (for example,
   * creating tasks for RCU priority boosting) must be delayed until after
   * rcu_scheduler_fully_active transitions from zero to one.  We also
   * currently delay invocation of any RCU callbacks until after this point.
   *
   * It might later prove better for people registering RCU callbacks during
   * early boot to take responsibility for these callbacks, but one step at
   * a time.
   *
   * File-local and statically zero-initialized, so it reads as zero until
   * the transition described above.
   */
  static int rcu_scheduler_fully_active __read_mostly;
a46e0899e   Paul E. McKenney   rcu: use softirq ...
126
  #ifdef CONFIG_RCU_BOOST
  
  /*
   * Control variables for per-CPU and per-rcu_node kthreads.  These
   * handle all flavors of RCU and exist only when CONFIG_RCU_BOOST is set.
   */
  static DEFINE_PER_CPU(struct task_struct *, rcu_cpu_kthread_task);
  DEFINE_PER_CPU(unsigned int, rcu_cpu_kthread_status);
  DEFINE_PER_CPU(unsigned int, rcu_cpu_kthread_loops);
  DEFINE_PER_CPU(char, rcu_cpu_has_work);
  
  #endif /* #ifdef CONFIG_RCU_BOOST */
5d01bbd11   Thomas Gleixner   rcu: Yield simpler
137
  static void rcu_boost_kthread_setaffinity(struct rcu_node *rnp, int outgoingcpu);
a46e0899e   Paul E. McKenney   rcu: use softirq ...
138
139
  static void invoke_rcu_core(void);
  static void invoke_rcu_callbacks(struct rcu_state *rsp, struct rcu_data *rdp);
a26ac2455   Paul E. McKenney   rcu: move TREE_RC...
140

a26ac2455   Paul E. McKenney   rcu: move TREE_RC...
141
  /*
   * Track the rcutorture test sequence number and the update version
   * number within a given test.  rcutorture_testseq is incremented on
   * every rcutorture module load and unload, so it has an odd value while
   * a test is running.  rcutorture_vernum is set to zero when rcutorture
   * starts and is incremented on each rcutorture update.  Together these
   * variables allow rcutorture output to be correlated with the RCU
   * tracing information.
   */
  unsigned long rcutorture_testseq;
  unsigned long rcutorture_vernum;
  
  /*
   * Return true if an RCU grace period is in progress for @rsp, that is,
   * if ->completed and ->gpnum differ.  Both fields are sampled with
   * ACCESS_ONCE(), which permits this function to be invoked without
   * holding the root rcu_node structure's ->lock, but of course the
   * result can be out of date by the time the caller acts on it.
   */
  static int rcu_gp_in_progress(struct rcu_state *rsp)
  {
  	unsigned long completed = ACCESS_ONCE(rsp->completed);
  	unsigned long gpnum = ACCESS_ONCE(rsp->gpnum);
  
  	return completed != gpnum;
  }
  
  /*
d6714c22b   Paul E. McKenney   rcu: Renamings to...
164
   * Note a quiescent state.  Because we do not need to know
b1f77b058   Ingo Molnar   kmemtrace, rcu: f...
165
   * how many quiescent states passed, just if there was at least
d6714c22b   Paul E. McKenney   rcu: Renamings to...
166
   * one since the start of the grace period, this just sets a flag.
e4cc1f22b   Paul E. McKenney   rcu: Simplify qui...
167
   * The caller must have disabled preemption.
b1f77b058   Ingo Molnar   kmemtrace, rcu: f...
168
   */
d6714c22b   Paul E. McKenney   rcu: Renamings to...
169
  void rcu_sched_qs(int cpu)
b1f77b058   Ingo Molnar   kmemtrace, rcu: f...
170
  {
25502a6c1   Paul E. McKenney   rcu: refactor RCU...
171
  	struct rcu_data *rdp = &per_cpu(rcu_sched_data, cpu);
f41d911f8   Paul E. McKenney   rcu: Merge preemp...
172

e4cc1f22b   Paul E. McKenney   rcu: Simplify qui...
173
  	if (rdp->passed_quiesce == 0)
d4c08f2ac   Paul E. McKenney   rcu: Add grace-pe...
174
  		trace_rcu_grace_period("rcu_sched", rdp->gpnum, "cpuqs");
e4cc1f22b   Paul E. McKenney   rcu: Simplify qui...
175
  	rdp->passed_quiesce = 1;
b1f77b058   Ingo Molnar   kmemtrace, rcu: f...
176
  }
d6714c22b   Paul E. McKenney   rcu: Renamings to...
177
  void rcu_bh_qs(int cpu)
b1f77b058   Ingo Molnar   kmemtrace, rcu: f...
178
  {
25502a6c1   Paul E. McKenney   rcu: refactor RCU...
179
  	struct rcu_data *rdp = &per_cpu(rcu_bh_data, cpu);
f41d911f8   Paul E. McKenney   rcu: Merge preemp...
180

e4cc1f22b   Paul E. McKenney   rcu: Simplify qui...
181
  	if (rdp->passed_quiesce == 0)
d4c08f2ac   Paul E. McKenney   rcu: Add grace-pe...
182
  		trace_rcu_grace_period("rcu_bh", rdp->gpnum, "cpuqs");
e4cc1f22b   Paul E. McKenney   rcu: Simplify qui...
183
  	rdp->passed_quiesce = 1;
b1f77b058   Ingo Molnar   kmemtrace, rcu: f...
184
  }
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
185

25502a6c1   Paul E. McKenney   rcu: refactor RCU...
186
187
188
  /*
   * Note a context switch on the specified CPU.  A context switch is a
   * quiescent state for RCU-sched, and preemptible RCU needs its own
   * handling, which is delegated to rcu_preempt_note_context_switch().
   * The work is bracketed by "Start"/"End" utilization trace events.
   * The caller must have disabled preemption.
   */
  void rcu_note_context_switch(int cpu)
  {
  	trace_rcu_utilization("Start context switch");
  
  	rcu_sched_qs(cpu);
  	rcu_preempt_note_context_switch(cpu);
  
  	trace_rcu_utilization("End context switch");
  }
  EXPORT_SYMBOL_GPL(rcu_note_context_switch);
25502a6c1   Paul E. McKenney   rcu: refactor RCU...
199

90a4d2c01   Paul E. McKenney   rcu: make treercu...
200
  /*
   * Per-CPU dyntick-idle state.  ->dynticks starts at 1, an odd value:
   * rcu_eqs_enter_common() expects the counter to be even after its
   * increment, and rcu_eqs_exit_common() expects it to be odd after its
   * increment.  ->dynticks_nesting starts at DYNTICK_TASK_EXIT_IDLE, the
   * same value that rcu_eqs_exit() installs when leaving idle.
   */
  DEFINE_PER_CPU(struct rcu_dynticks, rcu_dynticks) = {
  	.dynticks_nesting = DYNTICK_TASK_EXIT_IDLE,
  	.dynticks = ATOMIC_INIT(1),
  };
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
204

878d7439d   Eric Dumazet   rcu: Fix batch-li...
205
206
207
  /* Callback-batching limits, exposed as read-only (0444) parameters. */
  static long blimit = 10;	/* Maximum callbacks per rcu_do_batch. */
  static long qhimark = 10000;	/* If this many pending, ignore blimit. */
  static long qlowmark = 100;	/* Once only this many pending, use blimit. */
  
  module_param(blimit, long, 0444);
  module_param(qhimark, long, 0444);
  module_param(qlowmark, long, 0444);
  
  /*
   * Delays, in jiffies, before the first and subsequent force-quiescent-state
   * passes; exposed as writable (0644) parameters.
   * NOTE(review): ULONG_MAX looks like a "not set" sentinel that is replaced
   * elsewhere -- confirm against the initialization code.
   */
  static ulong jiffies_till_first_fqs = ULONG_MAX;
  static ulong jiffies_till_next_fqs = ULONG_MAX;
  
  module_param(jiffies_till_first_fqs, ulong, 0644);
  module_param(jiffies_till_next_fqs, ulong, 0644);
910ee45db   Paul E. McKenney   rcu: Make rcu_acc...
218
219
  static void rcu_start_gp_advanced(struct rcu_state *rsp, struct rcu_node *rnp,
  				  struct rcu_data *rdp);
4cdfc175c   Paul E. McKenney   rcu: Move quiesce...
220
221
  static void force_qs_rnp(struct rcu_state *rsp, int (*f)(struct rcu_data *));
  static void force_quiescent_state(struct rcu_state *rsp);
a157229ca   Paul E. McKenney   rcu: Simplify rcu...
222
  static int rcu_pending(int cpu);
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
223
224
  
  /*
d6714c22b   Paul E. McKenney   rcu: Renamings to...
225
   * Return the number of RCU-sched batches processed thus far for debug & stats.
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
226
   */
d6714c22b   Paul E. McKenney   rcu: Renamings to...
227
  long rcu_batches_completed_sched(void)
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
228
  {
d6714c22b   Paul E. McKenney   rcu: Renamings to...
229
  	return rcu_sched_state.completed;
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
230
  }
d6714c22b   Paul E. McKenney   rcu: Renamings to...
231
  EXPORT_SYMBOL_GPL(rcu_batches_completed_sched);
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
232
233
234
235
236
237
238
239
240
241
242
  
  /*
   * Return the number of RCU BH batches processed thus far, for debug
   * and statistics purposes.  This is simply rcu_bh_state.completed,
   * read without any locking.
   */
  long rcu_batches_completed_bh(void)
  {
  	long batches = rcu_bh_state.completed;
  
  	return batches;
  }
  EXPORT_SYMBOL_GPL(rcu_batches_completed_bh);
  
  /*
bf66f18e7   Paul E. McKenney   rcu: Add force_qu...
243
244
245
246
   * Force a quiescent state for RCU BH.
   */
  void rcu_bh_force_quiescent_state(void)
  {
4cdfc175c   Paul E. McKenney   rcu: Move quiesce...
247
  	force_quiescent_state(&rcu_bh_state);
bf66f18e7   Paul E. McKenney   rcu: Add force_qu...
248
249
250
251
  }
  EXPORT_SYMBOL_GPL(rcu_bh_force_quiescent_state);
  
  /*
   * Record that an rcutorture test has been initiated or terminated by
   * bumping rcutorture_testseq and resetting rcutorture_vernum to zero.
   * Keeping this state here rather than in rcutorture itself allows the
   * debugfs tracing stats to be correlated to the rcutorture messages even
   * when the rcutorture module is being repeatedly loaded and unloaded.
   */
  void rcutorture_record_test_transition(void)
  {
  	rcutorture_testseq += 1;
  	rcutorture_vernum = 0;
  }
  EXPORT_SYMBOL_GPL(rcutorture_record_test_transition);
  
  /*
   * Record the number of writer passes through the current rcutorture test.
   * This is also used to correlate debugfs tracing stats with the rcutorture
   * messages.
   *
   * NOTE(review): the vernum argument is not used; each call simply
   * increments rcutorture_vernum by one.  Confirm that this is intentional.
   */
  void rcutorture_record_progress(unsigned long vernum)
  {
  	rcutorture_vernum++;
  }
  EXPORT_SYMBOL_GPL(rcutorture_record_progress);
  
  /*
bf66f18e7   Paul E. McKenney   rcu: Add force_qu...
277
278
279
280
   * Force a quiescent state for RCU-sched.
   */
  void rcu_sched_force_quiescent_state(void)
  {
4cdfc175c   Paul E. McKenney   rcu: Move quiesce...
281
  	force_quiescent_state(&rcu_sched_state);
bf66f18e7   Paul E. McKenney   rcu: Add force_qu...
282
283
284
285
  }
  EXPORT_SYMBOL_GPL(rcu_sched_force_quiescent_state);
  
  /*
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
286
287
288
289
290
   * Does the CPU have callbacks ready to be invoked?
   */
  static int
  cpu_has_callbacks_ready_to_invoke(struct rcu_data *rdp)
  {
3fbfbf7a3   Paul E. McKenney   rcu: Add callback...
291
292
  	return &rdp->nxtlist != rdp->nxttail[RCU_DONE_TAIL] &&
  	       rdp->nxttail[RCU_DONE_TAIL] != NULL;
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
293
294
295
  }
  
  /*
   * Does the current CPU require a not-yet-started grace period?
   * Returns 1 if so and 0 otherwise.  The caller must have disabled
   * interrupts to prevent races with normal callback registry.
   */
  static int
  cpu_needs_another_gp(struct rcu_state *rsp, struct rcu_data *rdp)
  {
  	int i;
  
  	if (rcu_gp_in_progress(rsp))
  		return 0;  /* No, a grace period is already in progress. */
  	if (rcu_nocb_needs_gp(rsp))
  		return 1;  /* Yes, a no-CBs CPU needs one. */
  	if (!rdp->nxttail[RCU_NEXT_TAIL])
  		return 0;  /* No, this is a no-CBs (or offline) CPU. */
  	if (*rdp->nxttail[RCU_NEXT_READY_TAIL])
  		return 1;  /* Yes, this CPU has newly registered callbacks. */
  
  	for (i = RCU_WAIT_TAIL; i < RCU_NEXT_TAIL; i++) {
  		/* Adjacent tail pointers are equal: nothing to check here. */
  		if (rdp->nxttail[i - 1] == rdp->nxttail[i])
  			continue;
  		if (ULONG_CMP_LT(ACCESS_ONCE(rsp->completed),
  				 rdp->nxtcompleted[i]))
  			return 1;  /* Yes, CBs for future grace period. */
  	}
  
  	return 0; /* No grace period needed. */
  }
  
  /*
   * Return the root node of the specified rcu_state structure, which is
   * the first element of its ->node array.
   */
  static struct rcu_node *rcu_get_root(struct rcu_state *rsp)
  {
  	return rsp->node;
  }
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
328
  /*
adf5091e6   Frederic Weisbecker   rcu: New rcu_user...
329
   * rcu_eqs_enter_common - current CPU is moving towards extended quiescent state
9b2e4f188   Paul E. McKenney   rcu: Track idlene...
330
331
332
333
334
   *
   * If the new value of the ->dynticks_nesting counter now is zero,
   * we really have entered idle, and must do the appropriate accounting.
   * The caller must have disabled interrupts.
   */
adf5091e6   Frederic Weisbecker   rcu: New rcu_user...
335
336
  static void rcu_eqs_enter_common(struct rcu_dynticks *rdtp, long long oldval,
  				bool user)
9b2e4f188   Paul E. McKenney   rcu: Track idlene...
337
  {
1bdc2b7d2   Li Zhong   rcu: Use new nest...
338
  	trace_rcu_dyntick("Start", oldval, rdtp->dynticks_nesting);
cb349ca95   Paul E. McKenney   rcu: Apply micro-...
339
  	if (!user && !is_idle_task(current)) {
0989cb467   Paul E. McKenney   rcu: Add more inf...
340
  		struct task_struct *idle = idle_task(smp_processor_id());
facc4e159   Frederic Weisbecker   rcu: Irq nesting ...
341
  		trace_rcu_dyntick("Error on entry: not idle task", oldval, 0);
bf1304e9c   Paul E. McKenney   rcu: Dump only th...
342
  		ftrace_dump(DUMP_ORIG);
0989cb467   Paul E. McKenney   rcu: Add more inf...
343
344
345
  		WARN_ONCE(1, "Current pid: %d comm: %s / Idle pid: %d comm: %s",
  			  current->pid, current->comm,
  			  idle->pid, idle->comm); /* must be idle task! */
9b2e4f188   Paul E. McKenney   rcu: Track idlene...
346
  	}
aea1b35e2   Paul E. McKenney   rcu: Allow dyntic...
347
  	rcu_prepare_for_idle(smp_processor_id());
9b2e4f188   Paul E. McKenney   rcu: Track idlene...
348
349
350
351
352
  	/* CPUs seeing atomic_inc() must see prior RCU read-side crit sects */
  	smp_mb__before_atomic_inc();  /* See above. */
  	atomic_inc(&rdtp->dynticks);
  	smp_mb__after_atomic_inc();  /* Force ordering with next sojourn. */
  	WARN_ON_ONCE(atomic_read(&rdtp->dynticks) & 0x1);
c44e2cdda   Paul E. McKenney   rcu: Check for id...
353
354
  
  	/*
adf5091e6   Frederic Weisbecker   rcu: New rcu_user...
355
  	 * It is illegal to enter an extended quiescent state while
c44e2cdda   Paul E. McKenney   rcu: Check for id...
356
357
358
359
360
361
362
363
  	 * in an RCU read-side critical section.
  	 */
  	rcu_lockdep_assert(!lock_is_held(&rcu_lock_map),
  			   "Illegal idle entry in RCU read-side critical section.");
  	rcu_lockdep_assert(!lock_is_held(&rcu_bh_lock_map),
  			   "Illegal idle entry in RCU-bh read-side critical section.");
  	rcu_lockdep_assert(!lock_is_held(&rcu_sched_lock_map),
  			   "Illegal idle entry in RCU-sched read-side critical section.");
9b2e4f188   Paul E. McKenney   rcu: Track idlene...
364
  }
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
365

adf5091e6   Frederic Weisbecker   rcu: New rcu_user...
366
367
368
  /*
   * Enter an RCU extended quiescent state, which can be either the
   * idle loop or adaptive-tickless usermode execution.
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
369
   */
adf5091e6   Frederic Weisbecker   rcu: New rcu_user...
370
  static void rcu_eqs_enter(bool user)
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
371
  {
4145fa7fb   Paul E. McKenney   rcu: Deconfuse dy...
372
  	long long oldval;
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
373
  	struct rcu_dynticks *rdtp;
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
374
  	rdtp = &__get_cpu_var(rcu_dynticks);
4145fa7fb   Paul E. McKenney   rcu: Deconfuse dy...
375
  	oldval = rdtp->dynticks_nesting;
29e37d814   Paul E. McKenney   rcu: Allow nestin...
376
377
378
379
380
  	WARN_ON_ONCE((oldval & DYNTICK_TASK_NEST_MASK) == 0);
  	if ((oldval & DYNTICK_TASK_NEST_MASK) == DYNTICK_TASK_NEST_VALUE)
  		rdtp->dynticks_nesting = 0;
  	else
  		rdtp->dynticks_nesting -= DYNTICK_TASK_NEST_VALUE;
adf5091e6   Frederic Weisbecker   rcu: New rcu_user...
381
  	rcu_eqs_enter_common(rdtp, oldval, user);
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
382
  }
adf5091e6   Frederic Weisbecker   rcu: New rcu_user...
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
  
  /**
   * rcu_idle_enter - inform RCU that current CPU is entering idle
   *
   * Enter idle mode, in other words, -leave- the mode in which RCU
   * read-side critical sections can occur.  (Though RCU read-side
   * critical sections can occur in irq handlers in idle, a possibility
   * handled by irq_enter() and irq_exit().)
   *
   * We crowbar the ->dynticks_nesting field to zero to allow for
   * the possibility of usermode upcalls having messed up our count
   * of interrupt nesting level during the prior busy period.
   */
  void rcu_idle_enter(void)
  {
c5d900bf6   Frederic Weisbecker   rcu: Allow rcu_us...
398
399
400
  	unsigned long flags;
  
  	local_irq_save(flags);
cb349ca95   Paul E. McKenney   rcu: Apply micro-...
401
  	rcu_eqs_enter(false);
c5d900bf6   Frederic Weisbecker   rcu: Allow rcu_us...
402
  	local_irq_restore(flags);
adf5091e6   Frederic Weisbecker   rcu: New rcu_user...
403
  }
8a2ecf474   Paul E. McKenney   rcu: Add RCU_NONI...
404
  EXPORT_SYMBOL_GPL(rcu_idle_enter);
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
405

2b1d5024e   Frederic Weisbecker   rcu: Settle confi...
406
  #ifdef CONFIG_RCU_USER_QS
9b2e4f188   Paul E. McKenney   rcu: Track idlene...
407
  /**
adf5091e6   Frederic Weisbecker   rcu: New rcu_user...
408
409
410
411
412
413
414
415
416
   * rcu_user_enter - inform RCU that we are resuming userspace.
   *
   * Enter RCU idle mode right before resuming userspace.  No use of RCU
   * is permitted between this call and rcu_user_exit(). This way the
   * CPU doesn't need to maintain the tick for RCU maintenance purposes
   * when the CPU runs in userspace.
   */
  void rcu_user_enter(void)
  {
91d1aa43d   Frederic Weisbecker   context_tracking:...
417
  	rcu_eqs_enter(1);
adf5091e6   Frederic Weisbecker   rcu: New rcu_user...
418
  }
adf5091e6   Frederic Weisbecker   rcu: New rcu_user...
419
  /**
   * rcu_user_enter_after_irq - inform RCU that we are going to resume userspace
   * after the current irq returns.
   *
   * This is similar to rcu_user_enter() but in the context of a non-nesting
   * irq.  ->dynticks_nesting is set to 1, so the decrement performed by
   * rcu_irq_exit() when the interrupt returns brings it to zero and RCU
   * enters idle mode at that point.
   */
  void rcu_user_enter_after_irq(void)
  {
  	unsigned long irqflags;
  	struct rcu_dynticks *rdtp;
  
  	local_irq_save(irqflags);
  	rdtp = &__get_cpu_var(rcu_dynticks);
  
  	/* Ensure this irq is interrupting a non-idle RCU state.  */
  	WARN_ON_ONCE((rdtp->dynticks_nesting & DYNTICK_TASK_MASK) == 0);
  	rdtp->dynticks_nesting = 1;
  
  	local_irq_restore(irqflags);
  }
2b1d5024e   Frederic Weisbecker   rcu: Settle confi...
439
  #endif /* CONFIG_RCU_USER_QS */
19dd1591f   Frederic Weisbecker   rcu: New rcu_user...
440
441
  
  /**
9b2e4f188   Paul E. McKenney   rcu: Track idlene...
442
443
444
445
446
   * rcu_irq_exit - inform RCU that current CPU is exiting irq towards idle
   *
   * Exit from an interrupt handler, which might possibly result in entering
   * idle mode, in other words, leaving the mode in which read-side critical
   * sections can occur.
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
447
   *
9b2e4f188   Paul E. McKenney   rcu: Track idlene...
448
449
450
451
452
453
454
455
   * This code assumes that the idle loop never does anything that might
   * result in unbalanced calls to irq_enter() and irq_exit().  If your
   * architecture violates this assumption, RCU will give you what you
   * deserve, good and hard.  But very infrequently and irreproducibly.
   *
   * Use things like work queues to work around this limitation.
   *
   * You have been warned.
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
456
   */
9b2e4f188   Paul E. McKenney   rcu: Track idlene...
457
  void rcu_irq_exit(void)
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
458
459
  {
  	unsigned long flags;
4145fa7fb   Paul E. McKenney   rcu: Deconfuse dy...
460
  	long long oldval;
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
461
462
463
464
  	struct rcu_dynticks *rdtp;
  
  	local_irq_save(flags);
  	rdtp = &__get_cpu_var(rcu_dynticks);
4145fa7fb   Paul E. McKenney   rcu: Deconfuse dy...
465
  	oldval = rdtp->dynticks_nesting;
9b2e4f188   Paul E. McKenney   rcu: Track idlene...
466
467
  	rdtp->dynticks_nesting--;
  	WARN_ON_ONCE(rdtp->dynticks_nesting < 0);
b6fc60201   Frederic Weisbecker   rcu: Don't check ...
468
469
470
  	if (rdtp->dynticks_nesting)
  		trace_rcu_dyntick("--=", oldval, rdtp->dynticks_nesting);
  	else
cb349ca95   Paul E. McKenney   rcu: Apply micro-...
471
  		rcu_eqs_enter_common(rdtp, oldval, true);
9b2e4f188   Paul E. McKenney   rcu: Track idlene...
472
473
474
475
  	local_irq_restore(flags);
  }
  
  /*
adf5091e6   Frederic Weisbecker   rcu: New rcu_user...
476
   * rcu_eqs_exit_common - current CPU moving away from extended quiescent state
9b2e4f188   Paul E. McKenney   rcu: Track idlene...
477
478
479
480
481
   *
   * If the new value of the ->dynticks_nesting counter was previously zero,
   * we really have exited idle, and must do the appropriate accounting.
   * The caller must have disabled interrupts.
   */
adf5091e6   Frederic Weisbecker   rcu: New rcu_user...
482
483
  static void rcu_eqs_exit_common(struct rcu_dynticks *rdtp, long long oldval,
  			       int user)
9b2e4f188   Paul E. McKenney   rcu: Track idlene...
484
  {
23b5c8fa0   Paul E. McKenney   rcu: Decrease mem...
485
486
487
488
489
  	smp_mb__before_atomic_inc();  /* Force ordering w/previous sojourn. */
  	atomic_inc(&rdtp->dynticks);
  	/* CPUs seeing atomic_inc() must see later RCU read-side crit sects */
  	smp_mb__after_atomic_inc();  /* See above. */
  	WARN_ON_ONCE(!(atomic_read(&rdtp->dynticks) & 0x1));
7cb924990   Paul E. McKenney   rcu: Permit dynti...
490
  	rcu_cleanup_after_idle(smp_processor_id());
4145fa7fb   Paul E. McKenney   rcu: Deconfuse dy...
491
  	trace_rcu_dyntick("End", oldval, rdtp->dynticks_nesting);
cb349ca95   Paul E. McKenney   rcu: Apply micro-...
492
  	if (!user && !is_idle_task(current)) {
0989cb467   Paul E. McKenney   rcu: Add more inf...
493
  		struct task_struct *idle = idle_task(smp_processor_id());
4145fa7fb   Paul E. McKenney   rcu: Deconfuse dy...
494
495
  		trace_rcu_dyntick("Error on exit: not idle task",
  				  oldval, rdtp->dynticks_nesting);
bf1304e9c   Paul E. McKenney   rcu: Dump only th...
496
  		ftrace_dump(DUMP_ORIG);
0989cb467   Paul E. McKenney   rcu: Add more inf...
497
498
499
  		WARN_ONCE(1, "Current pid: %d comm: %s / Idle pid: %d comm: %s",
  			  current->pid, current->comm,
  			  idle->pid, idle->comm); /* must be idle task! */
9b2e4f188   Paul E. McKenney   rcu: Track idlene...
500
501
  	}
  }
adf5091e6   Frederic Weisbecker   rcu: New rcu_user...
502
503
504
  /*
   * Exit an RCU extended quiescent state, which can be either the
   * idle loop or adaptive-tickless usermode execution.
9b2e4f188   Paul E. McKenney   rcu: Track idlene...
505
   */
adf5091e6   Frederic Weisbecker   rcu: New rcu_user...
506
  static void rcu_eqs_exit(bool user)
9b2e4f188   Paul E. McKenney   rcu: Track idlene...
507
  {
9b2e4f188   Paul E. McKenney   rcu: Track idlene...
508
509
  	struct rcu_dynticks *rdtp;
  	long long oldval;
9b2e4f188   Paul E. McKenney   rcu: Track idlene...
510
511
  	rdtp = &__get_cpu_var(rcu_dynticks);
  	oldval = rdtp->dynticks_nesting;
29e37d814   Paul E. McKenney   rcu: Allow nestin...
512
513
514
515
516
  	WARN_ON_ONCE(oldval < 0);
  	if (oldval & DYNTICK_TASK_NEST_MASK)
  		rdtp->dynticks_nesting += DYNTICK_TASK_NEST_VALUE;
  	else
  		rdtp->dynticks_nesting = DYNTICK_TASK_EXIT_IDLE;
adf5091e6   Frederic Weisbecker   rcu: New rcu_user...
517
  	rcu_eqs_exit_common(rdtp, oldval, user);
9b2e4f188   Paul E. McKenney   rcu: Track idlene...
518
  }
adf5091e6   Frederic Weisbecker   rcu: New rcu_user...
519
520
521
522
523
524
525
526
527
528
529
530
531
532
  
  /**
   * rcu_idle_exit - inform RCU that current CPU is leaving idle
   *
   * Exit idle mode, in other words, -enter- the mode in which RCU
   * read-side critical sections can occur.
   *
   * We crowbar the ->dynticks_nesting field to DYNTICK_TASK_EXIT_IDLE
   * (when no task-level nesting is already recorded) to allow for the
   * possibility of usermode upcalls messing up our count of interrupt
   * nesting level during the busy period that is just now starting.
   */
  void rcu_idle_exit(void)
  {
c5d900bf6   Frederic Weisbecker   rcu: Allow rcu_us...
533
534
535
  	unsigned long flags;
  
  	local_irq_save(flags);
cb349ca95   Paul E. McKenney   rcu: Apply micro-...
536
  	rcu_eqs_exit(false);
c5d900bf6   Frederic Weisbecker   rcu: Allow rcu_us...
537
  	local_irq_restore(flags);
adf5091e6   Frederic Weisbecker   rcu: New rcu_user...
538
  }
8a2ecf474   Paul E. McKenney   rcu: Add RCU_NONI...
539
  EXPORT_SYMBOL_GPL(rcu_idle_exit);
9b2e4f188   Paul E. McKenney   rcu: Track idlene...
540

2b1d5024e   Frederic Weisbecker   rcu: Settle confi...
541
  #ifdef CONFIG_RCU_USER_QS
9b2e4f188   Paul E. McKenney   rcu: Track idlene...
542
  /**
adf5091e6   Frederic Weisbecker   rcu: New rcu_user...
543
544
545
546
547
548
549
   * rcu_user_exit - inform RCU that we are exiting userspace.
   *
   * Exit RCU idle mode while entering the kernel because it can
   * run a RCU read side critical section anytime.
   */
  void rcu_user_exit(void)
  {
  	/*
  	 * rcu_eqs_exit() takes a bool "user" argument; pass true rather
  	 * than a bare 1 so this call reads the same way as the
  	 * rcu_eqs_exit(false) call made by rcu_idle_exit().
  	 */
  	rcu_eqs_exit(true);
  }
  
  /**
19dd1591f   Frederic Weisbecker   rcu: New rcu_user...
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
   * rcu_user_exit_after_irq - inform RCU that we won't resume to userspace
   * idle mode after the current non-nesting irq returns.
   *
   * This is similar to rcu_user_exit() but in the context of an irq.
   * This is called when the irq has interrupted a userspace RCU idle mode
   * context. When the current non-nesting interrupt returns after this call,
   * the CPU won't restore the RCU idle mode.
   */
  void rcu_user_exit_after_irq(void)
  {
  	struct rcu_dynticks *dt;
  	unsigned long irq_state;
  
  	local_irq_save(irq_state);
  	dt = &__get_cpu_var(rcu_dynticks);
  	/* The interrupted context must have been RCU-idle (no task nesting). */
  	WARN_ON_ONCE(dt->dynticks_nesting & DYNTICK_TASK_NEST_MASK);
  	/* Add the task-level "exit idle" amount on top of the irq count. */
  	dt->dynticks_nesting += DYNTICK_TASK_EXIT_IDLE;
  	local_irq_restore(irq_state);
  }
2b1d5024e   Frederic Weisbecker   rcu: Settle confi...
574
  #endif /* CONFIG_RCU_USER_QS */
19dd1591f   Frederic Weisbecker   rcu: New rcu_user...
575
576
  
  /**
9b2e4f188   Paul E. McKenney   rcu: Track idlene...
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
   * rcu_irq_enter - inform RCU that current CPU is entering irq away from idle
   *
   * Enter an interrupt handler, which might possibly result in exiting
   * idle mode, in other words, entering the mode in which read-side critical
   * sections can occur.
   *
   * Note that the Linux kernel is fully capable of entering an interrupt
   * handler that it never exits, for example when doing upcalls to
   * user mode!  This code assumes that the idle loop never does upcalls to
   * user mode.  If your architecture does do upcalls from the idle loop (or
   * does anything else that results in unbalanced calls to the irq_enter()
   * and irq_exit() functions), RCU will give you what you deserve, good
   * and hard.  But very infrequently and irreproducibly.
   *
   * Use things like work queues to work around this limitation.
   *
   * You have been warned.
   */
  void rcu_irq_enter(void)
  {
  	unsigned long flags;
  	struct rcu_dynticks *rdtp;
  	long long oldval;
  
  	local_irq_save(flags);
  	rdtp = &__get_cpu_var(rcu_dynticks);
  	oldval = rdtp->dynticks_nesting;
  	rdtp->dynticks_nesting++;
  	WARN_ON_ONCE(rdtp->dynticks_nesting == 0);
b6fc60201   Frederic Weisbecker   rcu: Don't check ...
606
607
608
  	if (oldval)
  		trace_rcu_dyntick("++=", oldval, rdtp->dynticks_nesting);
  	else
cb349ca95   Paul E. McKenney   rcu: Apply micro-...
609
  		rcu_eqs_exit_common(rdtp, oldval, true);
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
610
  	local_irq_restore(flags);
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
611
612
613
614
615
616
617
618
619
620
621
622
  }
  
  /**
   * rcu_nmi_enter - inform RCU of entry to NMI context
   *
   * If the CPU was idle with dynamic ticks active, and there is no
   * irq handler running, this increments rdtp->dynticks to let the
   * RCU grace-period handling know that the CPU is active.
   */
  void rcu_nmi_enter(void)
  {
  	struct rcu_dynticks *rdtp = &__get_cpu_var(rcu_dynticks);
  
  	/*
  	 * Nothing to do for an outermost NMI when ->dynticks is already
  	 * odd.  The counter is only sampled when the NMI nesting count
  	 * is zero.
  	 */
  	if (rdtp->dynticks_nmi_nesting == 0) {
  		if (atomic_read(&rdtp->dynticks) & 0x1)
  			return;
  	}
  	rdtp->dynticks_nmi_nesting++;
  	smp_mb__before_atomic_inc();  /* Force delay from prior write. */
  	atomic_inc(&rdtp->dynticks);
  	/* CPUs seeing atomic_inc() must see later RCU read-side crit sects */
  	smp_mb__after_atomic_inc();  /* See above. */
  	/* After the increment ->dynticks is expected to be odd. */
  	WARN_ON_ONCE(!(atomic_read(&rdtp->dynticks) & 0x1));
  }
  
  /**
   * rcu_nmi_exit - inform RCU of exit from NMI context
   *
   * If the CPU was idle with dynamic ticks active, and there is no
   * irq handler running, this increments rdtp->dynticks to let the
   * RCU grace-period handling know that the CPU is no longer active.
   */
  void rcu_nmi_exit(void)
  {
  	struct rcu_dynticks *rdtp = &__get_cpu_var(rcu_dynticks);
  
  	/* rcu_nmi_enter() took its early return: nothing to undo. */
  	if (rdtp->dynticks_nmi_nesting == 0)
  		return;
  	/* Still inside a nested NMI after dropping one level. */
  	if (--rdtp->dynticks_nmi_nesting != 0)
  		return;
  	/* CPUs seeing atomic_inc() must see prior RCU read-side crit sects */
  	smp_mb__before_atomic_inc();  /* See above. */
  	atomic_inc(&rdtp->dynticks);
  	smp_mb__after_atomic_inc();  /* Force delay to next write. */
  	/* After the increment ->dynticks is expected to be even. */
  	WARN_ON_ONCE(atomic_read(&rdtp->dynticks) & 0x1);
  }
  
  /**
9b2e4f188   Paul E. McKenney   rcu: Track idlene...
655
   * rcu_is_cpu_idle - see if RCU thinks that the current CPU is idle
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
656
   *
9b2e4f188   Paul E. McKenney   rcu: Track idlene...
657
   * If the current CPU is in its idle loop and is neither in an interrupt
34240697d   Paul E. McKenney   rcu: Disable pree...
658
   * nor NMI handler, return true.
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
659
   */
9b2e4f188   Paul E. McKenney   rcu: Track idlene...
660
  int rcu_is_cpu_idle(void)
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
661
  {
34240697d   Paul E. McKenney   rcu: Disable pree...
662
663
664
665
666
667
  	int ret;
  
  	preempt_disable();
  	ret = (atomic_read(&__get_cpu_var(rcu_dynticks).dynticks) & 0x1) == 0;
  	preempt_enable();
  	return ret;
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
668
  }
e6b80a3b0   Frederic Weisbecker   rcu: Detect illeg...
669
  EXPORT_SYMBOL(rcu_is_cpu_idle);
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
670

62fde6edf   Paul E. McKenney   rcu: Make __call_...
671
  #if defined(CONFIG_PROVE_RCU) && defined(CONFIG_HOTPLUG_CPU)
c0d6d01bf   Paul E. McKenney   rcu: Check for il...
672
673
674
675
676
677
678
  
  /*
   * Is the current CPU online?  Disable preemption to avoid false positives
   * that could otherwise happen due to the current CPU number being sampled,
   * this task being preempted, its old CPU being taken offline, resuming
   * on some other CPU, then determining that its old CPU is now offline.
   * It is OK to use RCU on an offline processor during initial boot, hence
2036d94a7   Paul E. McKenney   rcu: Rework detec...
679
680
681
682
683
684
685
686
687
688
689
   * the check for rcu_scheduler_fully_active.  Note also that it is OK
   * for a CPU coming online to use RCU for one jiffy prior to marking itself
   * online in the cpu_online_mask.  Similarly, it is OK for a CPU going
   * offline to continue to use RCU for one jiffy after marking itself
   * offline in the cpu_online_mask.  This leniency is necessary given the
   * non-atomic nature of the online and offline processing, for example,
   * the fact that a CPU enters the scheduler after completing the CPU_DYING
   * notifiers.
   *
   * This is also why RCU internally marks CPUs online during the
   * CPU_UP_PREPARE phase and offline during the CPU_DEAD phase.
c0d6d01bf   Paul E. McKenney   rcu: Check for il...
690
691
692
693
694
695
   *
   * Disable checking if in an NMI handler because we cannot safely report
   * errors from NMI handlers anyway.
   */
  bool rcu_lockdep_current_cpu_online(void)
  {
2036d94a7   Paul E. McKenney   rcu: Rework detec...
696
697
  	struct rcu_data *rdp;
  	struct rcu_node *rnp;
c0d6d01bf   Paul E. McKenney   rcu: Check for il...
698
699
700
701
702
  	bool ret;
  
  	if (in_nmi())
  		return 1;
  	preempt_disable();
2036d94a7   Paul E. McKenney   rcu: Rework detec...
703
704
705
  	rdp = &__get_cpu_var(rcu_sched_data);
  	rnp = rdp->mynode;
  	ret = (rdp->grpmask & rnp->qsmaskinit) ||
c0d6d01bf   Paul E. McKenney   rcu: Check for il...
706
707
708
709
710
  	      !rcu_scheduler_fully_active;
  	preempt_enable();
  	return ret;
  }
  EXPORT_SYMBOL_GPL(rcu_lockdep_current_cpu_online);
62fde6edf   Paul E. McKenney   rcu: Make __call_...
711
  #endif /* #if defined(CONFIG_PROVE_RCU) && defined(CONFIG_HOTPLUG_CPU) */
9b2e4f188   Paul E. McKenney   rcu: Track idlene...
712

64db4cfff   Paul E. McKenney   "Tree RCU": scala...
713
  /**
9b2e4f188   Paul E. McKenney   rcu: Track idlene...
714
   * rcu_is_cpu_rrupt_from_idle - see if idle or immediately interrupted from idle
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
715
   *
9b2e4f188   Paul E. McKenney   rcu: Track idlene...
716
717
718
   * If the current CPU is idle or running at a first-level (not nested)
   * interrupt from idle, return true.  The caller must have at least
   * disabled preemption.
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
719
   */
62e3cb143   Josh Triplett   rcu: Make rcu_is_...
720
  static int rcu_is_cpu_rrupt_from_idle(void)
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
721
  {
9b2e4f188   Paul E. McKenney   rcu: Track idlene...
722
  	return __get_cpu_var(rcu_dynticks).dynticks_nesting <= 1;
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
723
  }
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
724
  /*
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
725
726
   * Snapshot the specified CPU's dynticks counter so that we can later
   * credit them with an implicit quiescent state.  Return 1 if this CPU
1eba8f843   Paul E. McKenney   rcu: Clean up cod...
727
   * is in dynticks idle mode, which is an extended quiescent state.
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
728
729
730
   */
  static int dyntick_save_progress_counter(struct rcu_data *rdp)
  {
23b5c8fa0   Paul E. McKenney   rcu: Decrease mem...
731
  	rdp->dynticks_snap = atomic_add_return(0, &rdp->dynticks->dynticks);
f0e7c19db   Paul E. McKenney   rcu: Identify dyn...
732
  	return (rdp->dynticks_snap & 0x1) == 0;
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
733
734
735
736
737
738
  }
  
  /*
   * Return true if the specified CPU has passed through a quiescent
   * state by virtue of being in or having passed through a dynticks
   * idle state since the last call to dyntick_save_progress_counter()
a82dcc760   Paul E. McKenney   rcu: Make offline...
739
   * for this same CPU, or by virtue of having been offline.
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
740
741
742
   */
  static int rcu_implicit_dynticks_qs(struct rcu_data *rdp)
  {
7eb4f4553   Paul E. McKenney   rcu: Make rcu_imp...
743
744
  	unsigned int curr;
  	unsigned int snap;
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
745

7eb4f4553   Paul E. McKenney   rcu: Make rcu_imp...
746
747
  	curr = (unsigned int)atomic_add_return(0, &rdp->dynticks->dynticks);
  	snap = (unsigned int)rdp->dynticks_snap;
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
748
749
750
751
752
753
754
755
756
  
  	/*
  	 * If the CPU passed through or entered a dynticks idle phase with
  	 * no active irq/NMI handlers, then we can safely pretend that the CPU
  	 * already acknowledged the request to pass through a quiescent
  	 * state.  Either way, that CPU cannot possibly be in an RCU
  	 * read-side critical section that started before the beginning
  	 * of the current RCU grace period.
  	 */
7eb4f4553   Paul E. McKenney   rcu: Make rcu_imp...
757
  	if ((curr & 0x1) == 0 || UINT_CMP_GE(curr, snap + 2)) {
d4c08f2ac   Paul E. McKenney   rcu: Add grace-pe...
758
  		trace_rcu_fqs(rdp->rsp->name, rdp->gpnum, rdp->cpu, "dti");
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
759
760
761
  		rdp->dynticks_fqs++;
  		return 1;
  	}
a82dcc760   Paul E. McKenney   rcu: Make offline...
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
  	/*
  	 * Check for the CPU being offline, but only if the grace period
  	 * is old enough.  We don't need to worry about the CPU changing
  	 * state: If we see it offline even once, it has been through a
  	 * quiescent state.
  	 *
  	 * The reason for insisting that the grace period be at least
  	 * one jiffy old is that CPUs that are not quite online and that
  	 * have just gone offline can still execute RCU read-side critical
  	 * sections.
  	 */
  	if (ULONG_CMP_GE(rdp->rsp->gp_start + 2, jiffies))
  		return 0;  /* Grace period is not old enough. */
  	barrier();
  	if (cpu_is_offline(rdp->cpu)) {
  		trace_rcu_fqs(rdp->rsp->name, rdp->gpnum, rdp->cpu, "ofl");
  		rdp->offline_fqs++;
  		return 1;
  	}
65d798f0f   Paul E. McKenney   rcu: Kick adaptiv...
781
782
783
784
785
786
787
788
789
  
  	/*
  	 * There is a possibility that a CPU in adaptive-ticks state
  	 * might run in the kernel with the scheduling-clock tick disabled
  	 * for an extended time period.  Invoke rcu_kick_nohz_cpu() to
  	 * force the CPU to restart the scheduling-clock tick in this
  	 * CPU is in this state.
  	 */
  	rcu_kick_nohz_cpu(rdp->cpu);
a82dcc760   Paul E. McKenney   rcu: Make offline...
790
  	return 0;
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
791
  }
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
792
793
794
  /*
   * Record the current jiffies value in ->gp_start and set ->jiffies_stall,
   * the time that check_cpu_stall() compares against before printing
   * stall warnings.
   */
  static void record_gp_stall_check_time(struct rcu_state *rsp)
  {
  	rsp->gp_start = jiffies;
6bfc09e23   Paul E. McKenney   rcu: Provide RCU ...
795
  	/* Deadline: now plus the rcu_jiffies_till_stall_check() delay. */
  	rsp->jiffies_stall = jiffies + rcu_jiffies_till_stall_check();
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
796
  }
b637a328b   Paul E. McKenney   rcu: Print remote...
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
  /*
   * Dump stacks of all tasks running on stalled CPUs.  This is a fallback
   * for architectures that do not implement trigger_all_cpu_backtrace().
   * The NMI-triggered stack traces are more accurate because they are
   * printed by the target CPU.
   */
  static void rcu_dump_cpu_stacks(struct rcu_state *rsp)
  {
  	struct rcu_node *rnp;
  	unsigned long irq_state;
  	int bit;
  
  	rcu_for_each_leaf_node(rsp, rnp) {
  		raw_spin_lock_irqsave(&rnp->lock, irq_state);
  		if (rnp->qsmask != 0) {
  			/* Bit N of ->qsmask corresponds to CPU ->grplo + N. */
  			for (bit = 0; bit <= rnp->grphi - rnp->grplo; bit++) {
  				if (rnp->qsmask & (1UL << bit))
  					dump_cpu_task(rnp->grplo + bit);
  			}
  		}
  		raw_spin_unlock_irqrestore(&rnp->lock, irq_state);
  	}
  }
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
819
820
821
822
823
  static void print_other_cpu_stall(struct rcu_state *rsp)
  {
  	int cpu;
  	long delta;
  	unsigned long flags;
285fe2948   Paul E. McKenney   rcu: Fix detectio...
824
  	int ndetected = 0;
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
825
  	struct rcu_node *rnp = rcu_get_root(rsp);
53bb857c3   Paul E. McKenney   rcu: Dump number ...
826
  	long totqlen = 0;
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
827
828
  
  	/* Only let one CPU complain about others per time interval. */
1304afb22   Paul E. McKenney   rcu: Convert to r...
829
  	raw_spin_lock_irqsave(&rnp->lock, flags);
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
830
  	delta = jiffies - rsp->jiffies_stall;
fc2219d49   Paul E. McKenney   rcu: Clean up cod...
831
  	if (delta < RCU_STALL_RAT_DELAY || !rcu_gp_in_progress(rsp)) {
1304afb22   Paul E. McKenney   rcu: Convert to r...
832
  		raw_spin_unlock_irqrestore(&rnp->lock, flags);
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
833
834
  		return;
  	}
6bfc09e23   Paul E. McKenney   rcu: Provide RCU ...
835
  	rsp->jiffies_stall = jiffies + 3 * rcu_jiffies_till_stall_check() + 3;
1304afb22   Paul E. McKenney   rcu: Convert to r...
836
  	raw_spin_unlock_irqrestore(&rnp->lock, flags);
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
837

8cdd32a91   Paul E. McKenney   rcu: refer RCU CP...
838
839
840
841
842
  	/*
  	 * OK, time to rat on our buddy...
  	 * See Documentation/RCU/stallwarn.txt for info on how to debug
  	 * RCU CPU stall warnings.
  	 */
d7f3e2073   Paul E. McKenney   rcu: Convert rcut...
843
  	pr_err("INFO: %s detected stalls on CPUs/tasks:",
4300aa642   Paul E. McKenney   rcu: improve RCU ...
844
  	       rsp->name);
a858af287   Paul E. McKenney   rcu: Print schedu...
845
  	print_cpu_stall_info_begin();
a0b6c9a78   Paul E. McKenney   rcu: Clean up cod...
846
  	rcu_for_each_leaf_node(rsp, rnp) {
3acd9eb31   Paul E. McKenney   rcu: Fix deadlock...
847
  		raw_spin_lock_irqsave(&rnp->lock, flags);
9bc8b5586   Paul E. McKenney   rcu: Suppress NMI...
848
  		ndetected += rcu_print_task_stall(rnp);
c8020a67e   Paul E. McKenney   rcu: Protect rcu_...
849
850
851
852
853
854
855
856
  		if (rnp->qsmask != 0) {
  			for (cpu = 0; cpu <= rnp->grphi - rnp->grplo; cpu++)
  				if (rnp->qsmask & (1UL << cpu)) {
  					print_cpu_stall_info(rsp,
  							     rnp->grplo + cpu);
  					ndetected++;
  				}
  		}
3acd9eb31   Paul E. McKenney   rcu: Fix deadlock...
857
  		raw_spin_unlock_irqrestore(&rnp->lock, flags);
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
858
  	}
a858af287   Paul E. McKenney   rcu: Print schedu...
859
860
861
862
863
864
865
  
  	/*
  	 * Now rat on any tasks that got kicked up to the root rcu_node
  	 * due to CPU offlining.
  	 */
  	rnp = rcu_get_root(rsp);
  	raw_spin_lock_irqsave(&rnp->lock, flags);
285fe2948   Paul E. McKenney   rcu: Fix detectio...
866
  	ndetected += rcu_print_task_stall(rnp);
a858af287   Paul E. McKenney   rcu: Print schedu...
867
868
869
  	raw_spin_unlock_irqrestore(&rnp->lock, flags);
  
  	print_cpu_stall_info_end();
53bb857c3   Paul E. McKenney   rcu: Dump number ...
870
871
872
873
  	for_each_possible_cpu(cpu)
  		totqlen += per_cpu_ptr(rsp->rda, cpu)->qlen;
  	pr_cont("(detected by %d, t=%ld jiffies, g=%lu, c=%lu, q=%lu)
  ",
eee058826   Paul E. McKenney   rcu: Add grace-pe...
874
  	       smp_processor_id(), (long)(jiffies - rsp->gp_start),
53bb857c3   Paul E. McKenney   rcu: Dump number ...
875
  	       rsp->gpnum, rsp->completed, totqlen);
9bc8b5586   Paul E. McKenney   rcu: Suppress NMI...
876
  	if (ndetected == 0)
d7f3e2073   Paul E. McKenney   rcu: Convert rcut...
877
878
  		pr_err("INFO: Stall ended before state dump start
  ");
9bc8b5586   Paul E. McKenney   rcu: Suppress NMI...
879
  	else if (!trigger_all_cpu_backtrace())
b637a328b   Paul E. McKenney   rcu: Print remote...
880
  		rcu_dump_cpu_stacks(rsp);
c1dc0b9c0   Ingo Molnar   debug lockups: Im...
881

4cdfc175c   Paul E. McKenney   rcu: Move quiesce...
882
  	/* Complain about tasks blocking the grace period. */
1ed509a22   Paul E. McKenney   rcu: Add RCU_CPU_...
883
884
  
  	rcu_print_detail_task_stall(rsp);
4cdfc175c   Paul E. McKenney   rcu: Move quiesce...
885
  	force_quiescent_state(rsp);  /* Kick them all. */
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
886
887
888
889
  }
  
  static void print_cpu_stall(struct rcu_state *rsp)
  {
53bb857c3   Paul E. McKenney   rcu: Dump number ...
890
  	int cpu;
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
891
892
  	unsigned long flags;
  	struct rcu_node *rnp = rcu_get_root(rsp);
53bb857c3   Paul E. McKenney   rcu: Dump number ...
893
  	long totqlen = 0;
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
894

8cdd32a91   Paul E. McKenney   rcu: refer RCU CP...
895
896
897
898
899
  	/*
  	 * OK, time to rat on ourselves...
  	 * See Documentation/RCU/stallwarn.txt for info on how to debug
  	 * RCU CPU stall warnings.
  	 */
d7f3e2073   Paul E. McKenney   rcu: Convert rcut...
900
  	pr_err("INFO: %s self-detected stall on CPU", rsp->name);
a858af287   Paul E. McKenney   rcu: Print schedu...
901
902
903
  	print_cpu_stall_info_begin();
  	print_cpu_stall_info(rsp, smp_processor_id());
  	print_cpu_stall_info_end();
53bb857c3   Paul E. McKenney   rcu: Dump number ...
904
905
906
907
908
  	for_each_possible_cpu(cpu)
  		totqlen += per_cpu_ptr(rsp->rda, cpu)->qlen;
  	pr_cont(" (t=%lu jiffies g=%lu c=%lu q=%lu)
  ",
  		jiffies - rsp->gp_start, rsp->gpnum, rsp->completed, totqlen);
4627e240d   Paul E. McKenney   rcu: Dump local s...
909
910
  	if (!trigger_all_cpu_backtrace())
  		dump_stack();
c1dc0b9c0   Ingo Molnar   debug lockups: Im...
911

1304afb22   Paul E. McKenney   rcu: Convert to r...
912
  	raw_spin_lock_irqsave(&rnp->lock, flags);
20133cfce   Paul E. McKenney   rcu: Stop overflo...
913
  	if (ULONG_CMP_GE(jiffies, rsp->jiffies_stall))
13cfcca0e   Paul E. McKenney   rcu: Set RCU CPU ...
914
  		rsp->jiffies_stall = jiffies +
6bfc09e23   Paul E. McKenney   rcu: Provide RCU ...
915
  				     3 * rcu_jiffies_till_stall_check() + 3;
1304afb22   Paul E. McKenney   rcu: Convert to r...
916
  	raw_spin_unlock_irqrestore(&rnp->lock, flags);
c1dc0b9c0   Ingo Molnar   debug lockups: Im...
917

64db4cfff   Paul E. McKenney   "Tree RCU": scala...
918
919
920
921
922
  	set_need_resched();  /* kick ourselves to get things going. */
  }
  
  static void check_cpu_stall(struct rcu_state *rsp, struct rcu_data *rdp)
  {
bad6e1393   Paul E. McKenney   rcu: get rid of s...
923
924
  	unsigned long j;
  	unsigned long js;
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
925
  	struct rcu_node *rnp;
742734eea   Paul E. McKenney   rcu: add boot par...
926
  	if (rcu_cpu_stall_suppress)
c68de2097   Paul E. McKenney   rcu: disable CPU ...
927
  		return;
bad6e1393   Paul E. McKenney   rcu: get rid of s...
928
929
  	j = ACCESS_ONCE(jiffies);
  	js = ACCESS_ONCE(rsp->jiffies_stall);
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
930
  	rnp = rdp->mynode;
c96ea7cfd   Paul E. McKenney   rcu: Avoid spurio...
931
932
  	if (rcu_gp_in_progress(rsp) &&
  	    (ACCESS_ONCE(rnp->qsmask) & rdp->grpmask) && ULONG_CMP_GE(j, js)) {
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
933
934
935
  
  		/* We haven't checked in, so go dump stack. */
  		print_cpu_stall(rsp);
bad6e1393   Paul E. McKenney   rcu: get rid of s...
936
937
  	} else if (rcu_gp_in_progress(rsp) &&
  		   ULONG_CMP_GE(j, js + RCU_STALL_RAT_DELAY)) {
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
938

bad6e1393   Paul E. McKenney   rcu: get rid of s...
939
  		/* They had a few time units to dump stack, so complain. */
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
940
941
942
  		print_other_cpu_stall(rsp);
  	}
  }
53d84e004   Paul E. McKenney   rcu: permit suppr...
943
944
945
946
947
948
949
950
951
952
953
  /**
   * rcu_cpu_stall_reset - prevent further stall warnings in current grace period
   *
   * Set the stall-warning timeout way off into the future, thus preventing
   * any RCU CPU stall-warning messages from appearing in the current set of
   * RCU grace periods.
   *
   * The caller must disable hard irqs.
   */
  void rcu_cpu_stall_reset(void)
  {
6ce75a232   Paul E. McKenney   rcu: Introduce fo...
954
955
956
957
  	struct rcu_state *rsp;
  
  	for_each_rcu_flavor(rsp)
  		rsp->jiffies_stall = jiffies + ULONG_MAX / 2;
53d84e004   Paul E. McKenney   rcu: permit suppr...
958
  }
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
959
  /*
3f5d3ea64   Paul E. McKenney   rcu: Consolidate ...
960
961
962
963
964
   * Initialize the specified rcu_data structure's callback list to empty.
   */
  static void init_callback_list(struct rcu_data *rdp)
  {
  	int i;
34ed62461   Paul E. McKenney   rcu: Remove restr...
965
966
  	if (init_nocb_callback_list(rdp))
  		return;
3f5d3ea64   Paul E. McKenney   rcu: Consolidate ...
967
968
969
970
971
972
  	rdp->nxtlist = NULL;
  	for (i = 0; i < RCU_NEXT_SIZE; i++)
  		rdp->nxttail[i] = &rdp->nxtlist;
  }
  
  /*
dc35c8934   Paul E. McKenney   rcu: Tag callback...
973
974
975
976
977
978
979
980
981
982
983
984
985
986
987
988
989
990
991
992
993
994
995
996
997
998
999
1000
1001
   * Determine the value that ->completed will have at the end of the
   * next subsequent grace period.  This is used to tag callbacks so that
   * a CPU can invoke callbacks in a timely fashion even if that CPU has
   * been dyntick-idle for an extended period with callbacks under the
   * influence of RCU_FAST_NO_HZ.
   *
   * The caller must hold rnp->lock with interrupts disabled.
   */
  static unsigned long rcu_cbs_completed(struct rcu_state *rsp,
  				       struct rcu_node *rnp)
  {
  	/*
  	 * Unless we are looking at the root rcu_node structure and it
  	 * shows no grace period in progress, we cannot be sure that RCU
  	 * is idle: a new grace period might have started without yet
  	 * having initialized this non-root rcu_node structure.  In that
  	 * case wait for a possible partial grace period and then the
  	 * subsequent full grace period.
  	 */
  	if (rcu_get_root(rsp) != rnp || rnp->gpnum != rnp->completed)
  		return rnp->completed + 2;
  
  	/* RCU is known to be idle: the very next grace period will do. */
  	return rnp->completed + 1;
  }
  
  /*
0446be489   Paul E. McKenney   rcu: Abstract rcu...
1002
1003
1004
1005
1006
1007
1008
1009
1010
1011
1012
1013
1014
1015
1016
1017
1018
1019
1020
1021
1022
1023
1024
1025
1026
1027
1028
1029
1030
1031
1032
1033
1034
1035
1036
1037
1038
1039
1040
1041
1042
1043
1044
1045
1046
1047
1048
1049
1050
1051
1052
1053
1054
1055
1056
1057
1058
1059
1060
1061
1062
1063
1064
1065
1066
1067
1068
1069
1070
1071
1072
1073
1074
1075
1076
1077
1078
1079
1080
1081
1082
1083
1084
1085
1086
1087
   * Trace-event helper function for rcu_start_future_gp() and
   * rcu_nocb_wait_gp().
   */
  static void trace_rcu_future_gp(struct rcu_node *rnp, struct rcu_data *rdp,
  				unsigned long c, char *s)
  {
  	/*
  	 * Emit one trace event carrying the rcu_state name reached through
  	 * rdp, the rcu_node's ->gpnum, ->completed, ->level, ->grplo and
  	 * ->grphi, the grace-period number "c", and the event string "s".
  	 */
  	trace_rcu_future_grace_period(rdp->rsp->name, rnp->gpnum,
  				      rnp->completed, c, rnp->level,
  				      rnp->grplo, rnp->grphi, s);
  }
  
  /*
   * Start some future grace period, as needed to handle newly arrived
   * callbacks.  The required future grace periods are recorded in each
   * rcu_node structure's ->need_future_gp field.
   *
   * The caller must hold the specified rcu_node structure's ->lock.
   */
  static unsigned long __maybe_unused
  rcu_start_future_gp(struct rcu_node *rnp, struct rcu_data *rdp)
  {
  	unsigned long c;
  	int i;
  	struct rcu_node *rnp_root = rcu_get_root(rdp->rsp);
  
  	/*
  	 * Pick up grace-period number for new callbacks.  If this
  	 * grace period is already marked as needed, return to the caller.
  	 */
  	c = rcu_cbs_completed(rdp->rsp, rnp);
  	trace_rcu_future_gp(rnp, rdp, c, "Startleaf");
  	if (rnp->need_future_gp[c & 0x1]) {
  		trace_rcu_future_gp(rnp, rdp, c, "Prestartleaf");
  		return c;
  	}
  
  	/*
  	 * If either this rcu_node structure or the root rcu_node structure
  	 * believe that a grace period is in progress, then we must wait
  	 * for the one following, which is in "c".  Because our request
  	 * will be noticed at the end of the current grace period, we don't
  	 * need to explicitly start one.
  	 *
  	 * The caller holds rnp->lock, so rnp's fields are read directly.
  	 * The root's lock is not held at this point, so its fields are
  	 * sampled with ACCESS_ONCE().
  	 */
  	if (rnp->gpnum != rnp->completed ||
  	    ACCESS_ONCE(rnp_root->gpnum) != ACCESS_ONCE(rnp_root->completed)) {
  		rnp->need_future_gp[c & 0x1]++;
  		trace_rcu_future_gp(rnp, rdp, c, "Startedleaf");
  		return c;
  	}
  
  	/*
  	 * There might be no grace period in progress.  If we don't already
  	 * hold it, acquire the root rcu_node structure's lock in order to
  	 * start one (if needed).
  	 */
  	if (rnp != rnp_root)
  		raw_spin_lock(&rnp_root->lock);
  
  	/*
  	 * Get a new grace-period number.  If there really is no grace
  	 * period in progress, it will be smaller than the one we obtained
  	 * earlier.  Adjust callbacks as needed.  Note that even no-CBs
  	 * CPUs have a ->nxtcompleted[] array, so no no-CBs checks needed.
  	 */
  	c = rcu_cbs_completed(rdp->rsp, rnp_root);
  	for (i = RCU_DONE_TAIL; i < RCU_NEXT_TAIL; i++)
  		if (ULONG_CMP_LT(c, rdp->nxtcompleted[i]))
  			rdp->nxtcompleted[i] = c;
  
  	/*
  	 * If the need for the required grace period is already
  	 * recorded, trace and leave.
  	 */
  	if (rnp_root->need_future_gp[c & 0x1]) {
  		trace_rcu_future_gp(rnp, rdp, c, "Prestartedroot");
  		goto unlock_out;
  	}
  
  	/* Record the need for the future grace period. */
  	rnp_root->need_future_gp[c & 0x1]++;
  
  	/* If a grace period is not already in progress, start one. */
  	if (rnp_root->gpnum != rnp_root->completed) {
  		trace_rcu_future_gp(rnp, rdp, c, "Startedleafroot");
  	} else {
  		trace_rcu_future_gp(rnp, rdp, c, "Startedroot");
  		rcu_start_gp_advanced(rdp->rsp, rnp_root, rdp);
  	}
  unlock_out:
  	/* Drop the root lock only if it was taken above. */
  	if (rnp != rnp_root)
  		raw_spin_unlock(&rnp_root->lock);
  	return c;
  }
  
  /*
   * Clean up any old requests for the just-ended grace period.  Also return
   * whether any additional grace periods have been requested.  Also invoke
   * rcu_nocb_gp_cleanup() in order to wake up any no-callbacks kthreads
   * waiting for this grace period to complete.
   */
  static int rcu_future_gp_cleanup(struct rcu_state *rsp, struct rcu_node *rnp)
  {
  	/*
  	 * Hold ->completed in an unsigned long, matching the "c" parameter
  	 * of trace_rcu_future_gp(), so the traced value is not truncated
  	 * through an int and "c + 1" cannot overflow a signed type.
  	 */
  	unsigned long c = rnp->completed;
  	int needmore;
  	struct rcu_data *rdp = this_cpu_ptr(rsp->rda);
  
  	rcu_nocb_gp_cleanup(rsp, rnp);
  	/* Clear the request slot for the grace period numbered "c". */
  	rnp->need_future_gp[c & 0x1] = 0;
  	/* The other slot holds any request for the following one. */
  	needmore = rnp->need_future_gp[(c + 1) & 0x1];
  	trace_rcu_future_gp(rnp, rdp, c, needmore ? "CleanupMore" : "Cleanup");
  	return needmore;
  }
  
  /*
dc35c8934   Paul E. McKenney   rcu: Tag callback...
1116
1117
1118
1119
1120
1121
1122
1123
1124
1125
1126
1127
1128
1129
1130
1131
1132
1133
1134
1135
1136
1137
1138
1139
1140
1141
1142
1143
1144
1145
1146
1147
1148
1149
1150
1151
1152
1153
1154
1155
1156
1157
1158
1159
1160
1161
1162
1163
1164
1165
1166
1167
1168
1169
1170
1171
1172
1173
   * If there is room, assign a ->completed number to any callbacks on
   * this CPU that have not already been assigned.  Also accelerate any
   * callbacks that were previously assigned a ->completed number that has
   * since proven to be too conservative, which can happen if callbacks get
   * assigned a ->completed number while RCU is idle, but with reference to
   * a non-root rcu_node structure.  This function is idempotent, so it does
   * not hurt to call it repeatedly.
   *
   * The caller must hold rnp->lock with interrupts disabled.
   */
  static void rcu_accelerate_cbs(struct rcu_state *rsp, struct rcu_node *rnp,
  			       struct rcu_data *rdp)
  {
  	unsigned long c;
  	int i;
  
  	/* If the CPU has no callbacks, nothing to do. */
  	if (!rdp->nxttail[RCU_NEXT_TAIL] || !*rdp->nxttail[RCU_DONE_TAIL])
  		return;
  
  	/*
  	 * Starting from the sublist containing the callbacks most
  	 * recently assigned a ->completed number and working down, find the
  	 * first sublist that is not assignable to an upcoming grace period.
  	 * Such a sublist has something in it (first two tests) and has
  	 * a ->completed number assigned that will complete sooner than
  	 * the ->completed number for newly arrived callbacks (last test).
  	 *
  	 * The key point is that any later sublist can be assigned the
  	 * same ->completed number as the newly arrived callbacks, which
  	 * means that the callbacks in any of these later sublist can be
  	 * grouped into a single sublist, whether or not they have already
  	 * been assigned a ->completed number.
  	 */
  	c = rcu_cbs_completed(rsp, rnp);
  	for (i = RCU_NEXT_TAIL - 1; i > RCU_DONE_TAIL; i--)
  		if (rdp->nxttail[i] != rdp->nxttail[i - 1] &&
  		    !ULONG_CMP_GE(rdp->nxtcompleted[i], c))
  			break;
  
  	/*
  	 * If there are no sublist for unassigned callbacks, leave.
  	 * At the same time, advance "i" one sublist, so that "i" will
  	 * index into the sublist where all the remaining callbacks should
  	 * be grouped into.
  	 */
  	if (++i >= RCU_NEXT_TAIL)
  		return;
  
  	/*
  	 * Assign all subsequent callbacks' ->completed number to the next
  	 * full grace period and group them all in the sublist initially
  	 * indexed by "i".
  	 */
  	for (; i <= RCU_NEXT_TAIL; i++) {
  		rdp->nxttail[i] = rdp->nxttail[RCU_NEXT_TAIL];
  		rdp->nxtcompleted[i] = c;
  	}
910ee45db   Paul E. McKenney   rcu: Make rcu_acc...
1174
1175
  	/* Record any needed additional grace periods. */
  	rcu_start_future_gp(rnp, rdp);
6d4b418c7   Paul E. McKenney   rcu: Trace callba...
1176
1177
1178
1179
1180
1181
  
  	/* Trace depending on how much we were able to accelerate. */
  	if (!*rdp->nxttail[RCU_WAIT_TAIL])
  		trace_rcu_grace_period(rsp->name, rdp->gpnum, "AccWaitCB");
  	else
  		trace_rcu_grace_period(rsp->name, rdp->gpnum, "AccReadyCB");
dc35c8934   Paul E. McKenney   rcu: Tag callback...
1182
1183
1184
1185
1186
1187
1188
1189
1190
1191
1192
1193
1194
1195
1196
1197
1198
1199
1200
1201
1202
1203
1204
1205
1206
1207
1208
1209
1210
1211
1212
1213
1214
1215
1216
1217
1218
1219
1220
1221
1222
1223
1224
1225
1226
1227
  }
  
  /*
   * Promote every callback whose grace period has already completed into
   * the RCU_DONE_TAIL sublist, slide the remaining sublists down into the
   * slots that were vacated, and finally hand the RCU_NEXT_TAIL callbacks
   * to rcu_accelerate_cbs() so that they get ->completed numbers.  Calling
   * this repeatedly is harmless because it is idempotent, though it should
   * not be invoked -too- often.
   *
   * The caller must hold rnp->lock with interrupts disabled.
   */
  static void rcu_advance_cbs(struct rcu_state *rsp, struct rcu_node *rnp,
  			    struct rcu_data *rdp)
  {
  	int src;
  	int dst;
  
  	/* A CPU without callbacks has nothing to advance. */
  	if (!rdp->nxttail[RCU_NEXT_TAIL] || !*rdp->nxttail[RCU_DONE_TAIL])
  		return;
  
  	/*
  	 * Walk the sublists in order, folding each one whose ->completed
  	 * number has been reached into RCU_DONE_TAIL.  Stop at the first
  	 * sublist that still has to wait.
  	 */
  	src = RCU_WAIT_TAIL;
  	while (src < RCU_NEXT_TAIL &&
  	       !ULONG_CMP_LT(rnp->completed, rdp->nxtcompleted[src])) {
  		rdp->nxttail[RCU_DONE_TAIL] = rdp->nxttail[src];
  		src++;
  	}
  
  	/* The sublists just folded are now empty: point them at the done tail. */
  	for (dst = RCU_WAIT_TAIL; dst < src; dst++)
  		rdp->nxttail[dst] = rdp->nxttail[RCU_DONE_TAIL];
  
  	/* Slide the surviving sublists down into the emptied slots. */
  	dst = RCU_WAIT_TAIL;
  	while (src < RCU_NEXT_TAIL &&
  	       rdp->nxttail[dst] != rdp->nxttail[RCU_NEXT_TAIL]) {
  		rdp->nxttail[dst] = rdp->nxttail[src];
  		rdp->nxtcompleted[dst] = rdp->nxtcompleted[src];
  		src++;
  		dst++;
  	}
  
  	/* Whatever is left gets classified by the acceleration pass. */
  	rcu_accelerate_cbs(rsp, rnp, rdp);
  }
  
  /*
ba9fbe955   Paul E. McKenney   rcu: Merge __rcu_...
1228
1229
1230
   * Update CPU-local rcu_data state to record the beginnings and ends of
   * grace periods.  The caller must hold the ->lock of the leaf rcu_node
   * structure corresponding to the current CPU, and must have irqs disabled.
d09b62dfa   Paul E. McKenney   rcu: Fix synchron...
1231
   */
ba9fbe955   Paul E. McKenney   rcu: Merge __rcu_...
1232
  static void __note_gp_changes(struct rcu_state *rsp, struct rcu_node *rnp, struct rcu_data *rdp)
d09b62dfa   Paul E. McKenney   rcu: Fix synchron...
1233
  {
ba9fbe955   Paul E. McKenney   rcu: Merge __rcu_...
1234
  	/* Handle the ends of any preceding grace periods first. */
dc35c8934   Paul E. McKenney   rcu: Tag callback...
1235
  	if (rdp->completed == rnp->completed) {
d09b62dfa   Paul E. McKenney   rcu: Fix synchron...
1236

ba9fbe955   Paul E. McKenney   rcu: Merge __rcu_...
1237
  		/* No grace period end, so just accelerate recent callbacks. */
dc35c8934   Paul E. McKenney   rcu: Tag callback...
1238
  		rcu_accelerate_cbs(rsp, rnp, rdp);
d09b62dfa   Paul E. McKenney   rcu: Fix synchron...
1239

dc35c8934   Paul E. McKenney   rcu: Tag callback...
1240
1241
1242
1243
  	} else {
  
  		/* Advance callbacks. */
  		rcu_advance_cbs(rsp, rnp, rdp);
d09b62dfa   Paul E. McKenney   rcu: Fix synchron...
1244
1245
1246
  
  		/* Remember that we saw this grace-period completion. */
  		rdp->completed = rnp->completed;
d4c08f2ac   Paul E. McKenney   rcu: Add grace-pe...
1247
  		trace_rcu_grace_period(rsp->name, rdp->gpnum, "cpuend");
d09b62dfa   Paul E. McKenney   rcu: Fix synchron...
1248
  	}
398ebe600   Paul E. McKenney   rcu: Make __note_...
1249

6eaef633d   Paul E. McKenney   rcu: Move code to...
1250
1251
1252
1253
1254
1255
1256
1257
1258
1259
1260
1261
1262
  	if (rdp->gpnum != rnp->gpnum) {
  		/*
  		 * If the current grace period is waiting for this CPU,
  		 * set up to detect a quiescent state, otherwise don't
  		 * go looking for one.
  		 */
  		rdp->gpnum = rnp->gpnum;
  		trace_rcu_grace_period(rsp->name, rdp->gpnum, "cpustart");
  		rdp->passed_quiesce = 0;
  		rdp->qs_pending = !!(rnp->qsmask & rdp->grpmask);
  		zero_cpu_stall_ticks(rdp);
  	}
  }
d34ea3221   Paul E. McKenney   rcu: Rename note_...
1263
  static void note_gp_changes(struct rcu_state *rsp, struct rcu_data *rdp)
6eaef633d   Paul E. McKenney   rcu: Move code to...
1264
1265
1266
1267
1268
1269
  {
  	unsigned long flags;
  	struct rcu_node *rnp;
  
  	local_irq_save(flags);
  	rnp = rdp->mynode;
d34ea3221   Paul E. McKenney   rcu: Rename note_...
1270
1271
  	if ((rdp->gpnum == ACCESS_ONCE(rnp->gpnum) &&
  	     rdp->completed == ACCESS_ONCE(rnp->completed)) || /* w/out lock. */
6eaef633d   Paul E. McKenney   rcu: Move code to...
1272
1273
1274
1275
  	    !raw_spin_trylock(&rnp->lock)) { /* irqs already off, so later. */
  		local_irq_restore(flags);
  		return;
  	}
d34ea3221   Paul E. McKenney   rcu: Rename note_...
1276
  	__note_gp_changes(rsp, rnp, rdp);
6eaef633d   Paul E. McKenney   rcu: Move code to...
1277
1278
1279
1280
  	raw_spin_unlock_irqrestore(&rnp->lock, flags);
  }
  
  /*
7fdefc10e   Paul E. McKenney   rcu: Break up rcu...
1281
   * Initialize a new grace period.
b3dbec76e   Paul E. McKenney   rcu: Move RCU gra...
1282
   */
7fdefc10e   Paul E. McKenney   rcu: Break up rcu...
1283
  static int rcu_gp_init(struct rcu_state *rsp)
b3dbec76e   Paul E. McKenney   rcu: Move RCU gra...
1284
1285
  {
  	struct rcu_data *rdp;
7fdefc10e   Paul E. McKenney   rcu: Break up rcu...
1286
  	struct rcu_node *rnp = rcu_get_root(rsp);
b3dbec76e   Paul E. McKenney   rcu: Move RCU gra...
1287

7fdefc10e   Paul E. McKenney   rcu: Break up rcu...
1288
  	raw_spin_lock_irq(&rnp->lock);
4cdfc175c   Paul E. McKenney   rcu: Move quiesce...
1289
  	rsp->gp_flags = 0; /* Clear all flags: New grace period. */
b3dbec76e   Paul E. McKenney   rcu: Move RCU gra...
1290

7fdefc10e   Paul E. McKenney   rcu: Break up rcu...
1291
1292
1293
1294
1295
  	if (rcu_gp_in_progress(rsp)) {
  		/* Grace period already in progress, don't start another.  */
  		raw_spin_unlock_irq(&rnp->lock);
  		return 0;
  	}
7fdefc10e   Paul E. McKenney   rcu: Break up rcu...
1296
1297
1298
  	/* Advance to a new grace period and initialize state. */
  	rsp->gpnum++;
  	trace_rcu_grace_period(rsp->name, rsp->gpnum, "start");
7fdefc10e   Paul E. McKenney   rcu: Break up rcu...
1299
1300
1301
1302
  	record_gp_stall_check_time(rsp);
  	raw_spin_unlock_irq(&rnp->lock);
  
  	/* Exclude any concurrent CPU-hotplug operations. */
a4fbe35a1   Paul E. McKenney   rcu: Grace-period...
1303
  	mutex_lock(&rsp->onoff_mutex);
7fdefc10e   Paul E. McKenney   rcu: Break up rcu...
1304
1305
1306
1307
1308
1309
1310
1311
1312
1313
1314
1315
1316
1317
1318
  
  	/*
  	 * Set the quiescent-state-needed bits in all the rcu_node
  	 * structures for all currently online CPUs in breadth-first order,
  	 * starting from the root rcu_node structure, relying on the layout
  	 * of the tree within the rsp->node[] array.  Note that other CPUs
  	 * will access only the leaves of the hierarchy, thus seeing that no
  	 * grace period is in progress, at least until the corresponding
  	 * leaf node has been initialized.  In addition, we have excluded
  	 * CPU-hotplug operations.
  	 *
  	 * The grace period cannot complete until the initialization
  	 * process finishes, because this kthread handles both.
  	 */
  	rcu_for_each_node_breadth_first(rsp, rnp) {
b3dbec76e   Paul E. McKenney   rcu: Move RCU gra...
1319
  		raw_spin_lock_irq(&rnp->lock);
b3dbec76e   Paul E. McKenney   rcu: Move RCU gra...
1320
  		rdp = this_cpu_ptr(rsp->rda);
7fdefc10e   Paul E. McKenney   rcu: Break up rcu...
1321
1322
  		rcu_preempt_check_blocked_tasks(rnp);
  		rnp->qsmask = rnp->qsmaskinit;
0446be489   Paul E. McKenney   rcu: Abstract rcu...
1323
  		ACCESS_ONCE(rnp->gpnum) = rsp->gpnum;
25d30cf42   Paul E. McKenney   rcu: Adjust for u...
1324
  		WARN_ON_ONCE(rnp->completed != rsp->completed);
0446be489   Paul E. McKenney   rcu: Abstract rcu...
1325
  		ACCESS_ONCE(rnp->completed) = rsp->completed;
7fdefc10e   Paul E. McKenney   rcu: Break up rcu...
1326
  		if (rnp == rdp->mynode)
ce3d9c03d   Paul E. McKenney   rcu: Inline trivi...
1327
  			__note_gp_changes(rsp, rnp, rdp);
7fdefc10e   Paul E. McKenney   rcu: Break up rcu...
1328
1329
1330
1331
1332
  		rcu_preempt_boost_start_gp(rnp);
  		trace_rcu_grace_period_init(rsp->name, rnp->gpnum,
  					    rnp->level, rnp->grplo,
  					    rnp->grphi, rnp->qsmask);
  		raw_spin_unlock_irq(&rnp->lock);
661a85dc0   Paul E. McKenney   rcu: Add random P...
1333
  #ifdef CONFIG_PROVE_RCU_DELAY
971394f38   Paul E. McKenney   rcu: Fix deadlock...
1334
  		if ((prandom_u32() % (rcu_num_nodes + 1)) == 0 &&
81e59494a   Paul E. McKenney   rcu: Tone down de...
1335
  		    system_state == SYSTEM_RUNNING)
971394f38   Paul E. McKenney   rcu: Fix deadlock...
1336
  			udelay(200);
661a85dc0   Paul E. McKenney   rcu: Add random P...
1337
  #endif /* #ifdef CONFIG_PROVE_RCU_DELAY */
7fdefc10e   Paul E. McKenney   rcu: Break up rcu...
1338
1339
  		cond_resched();
  	}
b3dbec76e   Paul E. McKenney   rcu: Move RCU gra...
1340

a4fbe35a1   Paul E. McKenney   rcu: Grace-period...
1341
  	mutex_unlock(&rsp->onoff_mutex);
7fdefc10e   Paul E. McKenney   rcu: Break up rcu...
1342
1343
  	return 1;
  }
b3dbec76e   Paul E. McKenney   rcu: Move RCU gra...
1344

7fdefc10e   Paul E. McKenney   rcu: Break up rcu...
1345
  /*
4cdfc175c   Paul E. McKenney   rcu: Move quiesce...
1346
1347
1348
1349
1350
1351
1352
1353
1354
1355
1356
1357
1358
1359
1360
1361
1362
1363
1364
1365
1366
1367
1368
1369
1370
1371
   * Do one round of quiescent-state forcing.
   */
  int rcu_gp_fqs(struct rcu_state *rsp, int fqs_state_in)
  {
  	struct rcu_node *rnp_root = rcu_get_root(rsp);
  	int next_state = fqs_state_in;
  
  	rsp->n_force_qs++;
  	if (fqs_state_in != RCU_SAVE_DYNTICK) {
  		/* Later passes: handle dyntick-idle and offline CPUs. */
  		force_qs_rnp(rsp, rcu_implicit_dynticks_qs);
  	} else {
  		/* First pass: collect dyntick-idle snapshots, then move on. */
  		force_qs_rnp(rsp, dyntick_save_progress_counter);
  		next_state = RCU_FORCE_QS;
  	}
  
  	/* Nothing to clear unless a forcing request is currently flagged. */
  	if (!(ACCESS_ONCE(rsp->gp_flags) & RCU_GP_FLAG_FQS))
  		return next_state;
  
  	/* Clear the flag under the root lock to prevent immediate re-entry. */
  	raw_spin_lock_irq(&rnp_root->lock);
  	rsp->gp_flags &= ~RCU_GP_FLAG_FQS;
  	raw_spin_unlock_irq(&rnp_root->lock);
  	return next_state;
  }
  
  /*
7fdefc10e   Paul E. McKenney   rcu: Break up rcu...
1372
1373
   * Clean up after the old grace period.
   */
4cdfc175c   Paul E. McKenney   rcu: Move quiesce...
1374
  static void rcu_gp_cleanup(struct rcu_state *rsp)
7fdefc10e   Paul E. McKenney   rcu: Break up rcu...
1375
1376
  {
  	unsigned long gp_duration;
dae6e64d2   Paul E. McKenney   rcu: Introduce pr...
1377
  	int nocb = 0;
7fdefc10e   Paul E. McKenney   rcu: Break up rcu...
1378
1379
  	struct rcu_data *rdp;
  	struct rcu_node *rnp = rcu_get_root(rsp);
b3dbec76e   Paul E. McKenney   rcu: Move RCU gra...
1380

7fdefc10e   Paul E. McKenney   rcu: Break up rcu...
1381
1382
1383
1384
  	raw_spin_lock_irq(&rnp->lock);
  	gp_duration = jiffies - rsp->gp_start;
  	if (gp_duration > rsp->gp_max)
  		rsp->gp_max = gp_duration;
b3dbec76e   Paul E. McKenney   rcu: Move RCU gra...
1385

7fdefc10e   Paul E. McKenney   rcu: Break up rcu...
1386
1387
1388
1389
1390
1391
1392
  	/*
  	 * We know the grace period is complete, but to everyone else
  	 * it appears to still be ongoing.  But it is also the case
  	 * that to everyone else it looks like there is nothing that
  	 * they can do to advance the grace period.  It is therefore
  	 * safe for us to drop the lock in order to mark the grace
  	 * period as completed in all of the rcu_node structures.
7fdefc10e   Paul E. McKenney   rcu: Break up rcu...
1393
  	 */
5d4b86594   Paul E. McKenney   rcu: Fix day-zero...
1394
  	raw_spin_unlock_irq(&rnp->lock);
b3dbec76e   Paul E. McKenney   rcu: Move RCU gra...
1395

5d4b86594   Paul E. McKenney   rcu: Fix day-zero...
1396
1397
1398
1399
1400
1401
1402
1403
1404
1405
  	/*
  	 * Propagate new ->completed value to rcu_node structures so
  	 * that other CPUs don't have to wait until the start of the next
  	 * grace period to process their callbacks.  This also avoids
  	 * some nasty RCU grace-period initialization races by forcing
  	 * the end of the current grace period to be completely recorded in
  	 * all of the rcu_node structures before the beginning of the next
  	 * grace period is recorded in any of the rcu_node structures.
  	 */
  	rcu_for_each_node_breadth_first(rsp, rnp) {
755609a90   Paul E. McKenney   rcu: Allow RCU gr...
1406
  		raw_spin_lock_irq(&rnp->lock);
0446be489   Paul E. McKenney   rcu: Abstract rcu...
1407
  		ACCESS_ONCE(rnp->completed) = rsp->gpnum;
b11cc5760   Paul E. McKenney   rcu: Accelerate R...
1408
1409
  		rdp = this_cpu_ptr(rsp->rda);
  		if (rnp == rdp->mynode)
470716fc0   Paul E. McKenney   rcu: Switch calle...
1410
  			__note_gp_changes(rsp, rnp, rdp);
0446be489   Paul E. McKenney   rcu: Abstract rcu...
1411
  		nocb += rcu_future_gp_cleanup(rsp, rnp);
5d4b86594   Paul E. McKenney   rcu: Fix day-zero...
1412
1413
  		raw_spin_unlock_irq(&rnp->lock);
  		cond_resched();
7fdefc10e   Paul E. McKenney   rcu: Break up rcu...
1414
  	}
5d4b86594   Paul E. McKenney   rcu: Fix day-zero...
1415
1416
  	rnp = rcu_get_root(rsp);
  	raw_spin_lock_irq(&rnp->lock);
dae6e64d2   Paul E. McKenney   rcu: Introduce pr...
1417
  	rcu_nocb_gp_set(rnp, nocb);
7fdefc10e   Paul E. McKenney   rcu: Break up rcu...
1418
1419
1420
1421
  
  	rsp->completed = rsp->gpnum; /* Declare grace period done. */
  	trace_rcu_grace_period(rsp->name, rsp->completed, "end");
  	rsp->fqs_state = RCU_GP_IDLE;
5d4b86594   Paul E. McKenney   rcu: Fix day-zero...
1422
  	rdp = this_cpu_ptr(rsp->rda);
b11cc5760   Paul E. McKenney   rcu: Accelerate R...
1423
  	rcu_advance_cbs(rsp, rnp, rdp);  /* Reduce false positives below. */
7fdefc10e   Paul E. McKenney   rcu: Break up rcu...
1424
1425
1426
  	if (cpu_needs_another_gp(rsp, rdp))
  		rsp->gp_flags = 1;
  	raw_spin_unlock_irq(&rnp->lock);
7fdefc10e   Paul E. McKenney   rcu: Break up rcu...
1427
1428
1429
1430
1431
1432
1433
  }
  
  /*
   * Body of kthread that handles grace periods.
   *
   * Each pass of the outer loop handles one grace period: wait for and
   * perform initialization, repeatedly wait for either completion or the
   * need to force quiescent states, then clean up.  @arg is the rcu_state
   * structure this kthread serves.  Never returns.
   */
  static int __noreturn rcu_gp_kthread(void *arg)
  {
  	int fqs_state;
  	unsigned long j;
  	int ret;
  	struct rcu_state *rsp = arg;
  	struct rcu_node *rnp = rcu_get_root(rsp);
  
  	for (;;) {
  
  		/* Handle grace-period start. */
  		for (;;) {
  			wait_event_interruptible(rsp->gp_wq,
  						 rsp->gp_flags &
  						 RCU_GP_FLAG_INIT);
  			if ((rsp->gp_flags & RCU_GP_FLAG_INIT) &&
  			    rcu_gp_init(rsp))
  				break;
  			cond_resched();
  			flush_signals(current);
  		}
  
  		/* Handle quiescent-state forcing. */
  		fqs_state = RCU_SAVE_DYNTICK;
  		/* Clamp the first-forcing delay to at most HZ jiffies. */
  		j = jiffies_till_first_fqs;
  		if (j > HZ) {
  			j = HZ;
  			jiffies_till_first_fqs = HZ;
  		}
  		for (;;) {
  			rsp->jiffies_force_qs = jiffies + j;
  			ret = wait_event_interruptible_timeout(rsp->gp_wq,
  					(rsp->gp_flags & RCU_GP_FLAG_FQS) ||
  					(!ACCESS_ONCE(rnp->qsmask) &&
  					 !rcu_preempt_blocked_readers_cgp(rnp)),
  					j);
  			/* If grace period done, leave loop. */
  			if (!ACCESS_ONCE(rnp->qsmask) &&
  			    !rcu_preempt_blocked_readers_cgp(rnp))
  				break;
  			/* If time for quiescent-state forcing, do it. */
  			if (ret == 0 || (rsp->gp_flags & RCU_GP_FLAG_FQS)) {
  				fqs_state = rcu_gp_fqs(rsp, fqs_state);
  				cond_resched();
  			} else {
  				/* Deal with stray signal. */
  				cond_resched();
  				flush_signals(current);
  			}
  			/* Clamp the subsequent-forcing delay to [1, HZ] jiffies. */
  			j = jiffies_till_next_fqs;
  			if (j > HZ) {
  				j = HZ;
  				jiffies_till_next_fqs = HZ;
  			} else if (j < 1) {
  				j = 1;
  				jiffies_till_next_fqs = 1;
  			}
  		}
  
  		/* Handle grace-period end. */
  		rcu_gp_cleanup(rsp);
  	}
  }
016a8d5be   Steven Rostedt   rcu: Don't call w...
1495
1496
1497
1498
1499
1500
1501
  /*
   * irq_work handler: recover the rcu_state structure that embeds @work as
   * its ->wakeup_work field and wake up anything sleeping on its ->gp_wq
   * wait queue, so that rcu_gp_kthread() can start the grace period.
   */
  static void rsp_wakeup(struct irq_work *work)
  {
  	struct rcu_state *rsp;
  
  	rsp = container_of(work, struct rcu_state, wakeup_work);
  	wake_up(&rsp->gp_wq);
  }
b3dbec76e   Paul E. McKenney   rcu: Move RCU gra...
1502
  /*
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
1503
1504
   * Start a new RCU grace period if warranted, re-initializing the hierarchy
   * in preparation for detecting the next grace period.  The caller must hold
b8462084a   Paul E. McKenney   rcu: Push lock re...
1505
   * the root node's ->lock and hard irqs must be disabled.
e56014000   Paul E. McKenney   rcu: Simplify off...
1506
1507
1508
1509
   *
   * Note that it is legal for a dying CPU (which is marked as offline) to
   * invoke this function.  This can happen when the dying CPU reports its
   * quiescent state.
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
1510
1511
   */
  static void
910ee45db   Paul E. McKenney   rcu: Make rcu_acc...
1512
1513
  rcu_start_gp_advanced(struct rcu_state *rsp, struct rcu_node *rnp,
  		      struct rcu_data *rdp)
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
1514
  {
b8462084a   Paul E. McKenney   rcu: Push lock re...
1515
  	if (!rsp->gp_kthread || !cpu_needs_another_gp(rsp, rdp)) {
afe24b122   Paul E. McKenney   rcu: Move propaga...
1516
  		/*
b3dbec76e   Paul E. McKenney   rcu: Move RCU gra...
1517
  		 * Either we have not yet spawned the grace-period
62da19212   Paul E. McKenney   rcu: Accelerate c...
1518
1519
  		 * task, this CPU does not need another grace period,
  		 * or a grace period is already in progress.
b3dbec76e   Paul E. McKenney   rcu: Move RCU gra...
1520
  		 * Either way, don't start a new grace period.
afe24b122   Paul E. McKenney   rcu: Move propaga...
1521
  		 */
afe24b122   Paul E. McKenney   rcu: Move propaga...
1522
1523
  		return;
  	}
4cdfc175c   Paul E. McKenney   rcu: Move quiesce...
1524
  	rsp->gp_flags = RCU_GP_FLAG_INIT;
62da19212   Paul E. McKenney   rcu: Accelerate c...
1525

016a8d5be   Steven Rostedt   rcu: Don't call w...
1526
1527
1528
1529
1530
1531
  	/*
  	 * We can't do wakeups while holding the rnp->lock, as that
  	 * could cause possible deadlocks with the rq->lock. Deter
  	 * the wakeup to interrupt context.
  	 */
  	irq_work_queue(&rsp->wakeup_work);
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
1532
1533
1534
  }
  
  /*
910ee45db   Paul E. McKenney   rcu: Make rcu_acc...
1535
1536
1537
1538
1539
1540
1541
1542
1543
1544
1545
1546
1547
1548
1549
1550
1551
1552
1553
1554
1555
1556
1557
1558
1559
   * Similar to rcu_start_gp_advanced(), but also advance the calling CPU's
   * callbacks.  Note that rcu_start_gp_advanced() cannot do this because it
   * is invoked indirectly from rcu_advance_cbs(), which would result in
   * endless recursion -- or would do so if it wasn't for the self-deadlock
   * that is encountered beforehand.
   */
  static void
  rcu_start_gp(struct rcu_state *rsp)
  {
  	struct rcu_node *rnp_root = rcu_get_root(rsp);
  	struct rcu_data *rdp = this_cpu_ptr(rsp->rda);
  
  	/*
  	 * With no grace period currently in progress, every callback
  	 * queued so far will be covered by the next one.  Advancing the
  	 * callbacks first also makes cpu_needs_another_gp() less likely
  	 * to report a false positive, which would otherwise result in a
  	 * pointless grace period.  Hence: advance, then start.
  	 */
  	rcu_advance_cbs(rsp, rnp_root, rdp);
  	rcu_start_gp_advanced(rsp, rnp_root, rdp);
  }
  
  /*
d3f6bad39   Paul E. McKenney   rcu: Rename "quie...
1560
1561
1562
   * Report a full set of quiescent states to the specified rcu_state
   * data structure.  This involves cleaning up after the prior grace
   * period and letting rcu_start_gp() start up the next grace period
b8462084a   Paul E. McKenney   rcu: Push lock re...
1563
1564
   * if one is needed.  Note that the caller must hold rnp->lock, which
   * is released before return.
f41d911f8   Paul E. McKenney   rcu: Merge preemp...
1565
   */
d3f6bad39   Paul E. McKenney   rcu: Rename "quie...
1566
  static void rcu_report_qs_rsp(struct rcu_state *rsp, unsigned long flags)
fc2219d49   Paul E. McKenney   rcu: Clean up cod...
1567
  	__releases(rcu_get_root(rsp)->lock)
f41d911f8   Paul E. McKenney   rcu: Merge preemp...
1568
  {
fc2219d49   Paul E. McKenney   rcu: Clean up cod...
1569
  	WARN_ON_ONCE(!rcu_gp_in_progress(rsp));
cabc49c1f   Paul E. McKenney   rcu: Move RCU gra...
1570
1571
  	raw_spin_unlock_irqrestore(&rcu_get_root(rsp)->lock, flags);
  	wake_up(&rsp->gp_wq);  /* Memory barrier implied by wake_up() path. */
f41d911f8   Paul E. McKenney   rcu: Merge preemp...
1572
1573
1574
  }
  
  /*
d3f6bad39   Paul E. McKenney   rcu: Rename "quie...
1575
1576
1577
1578
1579
1580
   * Similar to rcu_report_qs_rdp(), for which it is a helper function.
   * Allows quiescent states for a group of CPUs to be reported at one go
   * to the specified rcu_node structure, though all the CPUs in the group
   * must be represented by the same rcu_node structure (which need not be
   * a leaf rcu_node structure, though it often will be).  That structure's
   * lock must be held upon entry, and it is released before return.
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
1581
1582
   */
  static void
d3f6bad39   Paul E. McKenney   rcu: Rename "quie...
1583
1584
  rcu_report_qs_rnp(unsigned long mask, struct rcu_state *rsp,
  		  struct rcu_node *rnp, unsigned long flags)
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
1585
1586
  	__releases(rnp->lock)
  {
28ecd5802   Paul E. McKenney   rcu: Add WARN_ON_...
1587
  	struct rcu_node *rnp_c;
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
1588
1589
1590
1591
1592
  	/* Walk up the rcu_node hierarchy. */
  	for (;;) {
  		if (!(rnp->qsmask & mask)) {
  
  			/* Our bit has already been cleared, so done. */
1304afb22   Paul E. McKenney   rcu: Convert to r...
1593
  			raw_spin_unlock_irqrestore(&rnp->lock, flags);
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
1594
1595
1596
  			return;
  		}
  		rnp->qsmask &= ~mask;
d4c08f2ac   Paul E. McKenney   rcu: Add grace-pe...
1597
1598
1599
1600
  		trace_rcu_quiescent_state_report(rsp->name, rnp->gpnum,
  						 mask, rnp->qsmask, rnp->level,
  						 rnp->grplo, rnp->grphi,
  						 !!rnp->gp_tasks);
27f4d2805   Paul E. McKenney   rcu: priority boo...
1601
  		if (rnp->qsmask != 0 || rcu_preempt_blocked_readers_cgp(rnp)) {
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
1602
1603
  
  			/* Other bits still set at this level, so done. */
1304afb22   Paul E. McKenney   rcu: Convert to r...
1604
  			raw_spin_unlock_irqrestore(&rnp->lock, flags);
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
1605
1606
1607
1608
1609
1610
1611
1612
1613
  			return;
  		}
  		mask = rnp->grpmask;
  		if (rnp->parent == NULL) {
  
  			/* No more levels.  Exit loop holding root lock. */
  
  			break;
  		}
1304afb22   Paul E. McKenney   rcu: Convert to r...
1614
  		raw_spin_unlock_irqrestore(&rnp->lock, flags);
28ecd5802   Paul E. McKenney   rcu: Add WARN_ON_...
1615
  		rnp_c = rnp;
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
1616
  		rnp = rnp->parent;
1304afb22   Paul E. McKenney   rcu: Convert to r...
1617
  		raw_spin_lock_irqsave(&rnp->lock, flags);
28ecd5802   Paul E. McKenney   rcu: Add WARN_ON_...
1618
  		WARN_ON_ONCE(rnp_c->qsmask);
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
1619
1620
1621
1622
  	}
  
  	/*
  	 * Get here if we are the last CPU to pass through a quiescent
d3f6bad39   Paul E. McKenney   rcu: Rename "quie...
1623
  	 * state for this grace period.  Invoke rcu_report_qs_rsp()
f41d911f8   Paul E. McKenney   rcu: Merge preemp...
1624
  	 * to clean up and start the next grace period if one is needed.
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
1625
  	 */
d3f6bad39   Paul E. McKenney   rcu: Rename "quie...
1626
  	rcu_report_qs_rsp(rsp, flags); /* releases rnp->lock. */
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
1627
1628
1629
  }
  
  /*
d3f6bad39   Paul E. McKenney   rcu: Rename "quie...
1630
1631
1632
1633
1634
1635
1636
   * Record a quiescent state for the specified CPU to that CPU's rcu_data
   * structure.  This must be either called from the specified CPU, or
   * called when the specified CPU is known to be offline (and when it is
   * also known that no other CPU is concurrently trying to help the offline
   * CPU).  The lastcomp argument is used to make sure we are still in the
   * grace period of interest.  We don't want to end the current grace period
   * based on quiescent states detected in an earlier grace period!
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
1637
1638
   */
  static void
d7d6a11e8   Paul E. McKenney   rcu: Simplify qui...
1639
  rcu_report_qs_rdp(int cpu, struct rcu_state *rsp, struct rcu_data *rdp)
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
1640
1641
1642
1643
1644
1645
  {
  	unsigned long flags;
  	unsigned long mask;
  	struct rcu_node *rnp;
  
  	rnp = rdp->mynode;
1304afb22   Paul E. McKenney   rcu: Convert to r...
1646
  	raw_spin_lock_irqsave(&rnp->lock, flags);
d7d6a11e8   Paul E. McKenney   rcu: Simplify qui...
1647
1648
  	if (rdp->passed_quiesce == 0 || rdp->gpnum != rnp->gpnum ||
  	    rnp->completed == rnp->gpnum) {
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
1649
1650
  
  		/*
e4cc1f22b   Paul E. McKenney   rcu: Simplify qui...
1651
1652
1653
1654
  		 * The grace period in which this quiescent state was
  		 * recorded has ended, so don't report it upwards.
  		 * We will instead need a new quiescent state that lies
  		 * within the current grace period.
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
1655
  		 */
e4cc1f22b   Paul E. McKenney   rcu: Simplify qui...
1656
  		rdp->passed_quiesce = 0;	/* need qs for new gp. */
1304afb22   Paul E. McKenney   rcu: Convert to r...
1657
  		raw_spin_unlock_irqrestore(&rnp->lock, flags);
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
1658
1659
1660
1661
  		return;
  	}
  	mask = rdp->grpmask;
  	if ((rnp->qsmask & mask) == 0) {
1304afb22   Paul E. McKenney   rcu: Convert to r...
1662
  		raw_spin_unlock_irqrestore(&rnp->lock, flags);
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
1663
1664
1665
1666
1667
1668
1669
  	} else {
  		rdp->qs_pending = 0;
  
  		/*
  		 * This GP can't end until cpu checks in, so all of our
  		 * callbacks can be processed during the next GP.
  		 */
dc35c8934   Paul E. McKenney   rcu: Tag callback...
1670
  		rcu_accelerate_cbs(rsp, rnp, rdp);
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
1671

d3f6bad39   Paul E. McKenney   rcu: Rename "quie...
1672
  		rcu_report_qs_rnp(mask, rsp, rnp, flags); /* rlses rnp->lock */
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
1673
1674
1675
1676
1677
1678
1679
1680
1681
1682
1683
1684
  	}
  }
  
  /*
   * Check to see if there is a new grace period of which this CPU
   * is not yet aware, and if so, set up local rcu_data state for it.
   * Otherwise, see if this CPU has just passed through its first
   * quiescent state for this grace period, and record that fact if so.
   */
  static void
  rcu_check_quiescent_state(struct rcu_state *rsp, struct rcu_data *rdp)
  {
05eb552bf   Paul E. McKenney   rcu: Move redunda...
1685
1686
  	/* Check for grace-period ends and beginnings. */
  	note_gp_changes(rsp, rdp);
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
1687
1688
1689
1690
1691
1692
1693
1694
1695
1696
1697
1698
  
  	/*
  	 * Does this CPU still need to do its part for current grace period?
  	 * If no, return and let the other CPUs do their part as well.
  	 */
  	if (!rdp->qs_pending)
  		return;
  
  	/*
  	 * Was there a quiescent state since the beginning of the grace
  	 * period? If no, then exit and wait for the next call.
  	 */
e4cc1f22b   Paul E. McKenney   rcu: Simplify qui...
1699
  	if (!rdp->passed_quiesce)
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
1700
  		return;
d3f6bad39   Paul E. McKenney   rcu: Rename "quie...
1701
1702
1703
1704
  	/*
  	 * Tell RCU we are done (but rcu_report_qs_rdp() will be the
  	 * judge of that).
  	 */
d7d6a11e8   Paul E. McKenney   rcu: Simplify qui...
1705
  	rcu_report_qs_rdp(rdp->cpu, rsp, rdp);
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
1706
1707
1708
1709
1710
  }
  
  #ifdef CONFIG_HOTPLUG_CPU
  
  /*
b1420f1c8   Paul E. McKenney   rcu: Make rcu_bar...
1711
1712
   * Send the specified CPU's RCU callbacks to the orphanage.  The
   * specified CPU must be offline, and the caller must hold the
7b2e6011f   Paul E. McKenney   rcu: Rename ->ono...
1713
   * ->orphan_lock.
e74f4c456   Paul E. McKenney   rcu: Make hot-unp...
1714
   */
b1420f1c8   Paul E. McKenney   rcu: Make rcu_bar...
1715
1716
1717
  static void
  rcu_send_cbs_to_orphanage(int cpu, struct rcu_state *rsp,
  			  struct rcu_node *rnp, struct rcu_data *rdp)
e74f4c456   Paul E. McKenney   rcu: Make hot-unp...
1718
  {
3fbfbf7a3   Paul E. McKenney   rcu: Add callback...
1719
  	/* No-CBs CPUs do not have orphanable callbacks. */
d1e43fa5f   Frederic Weisbecker   nohz: Ensure full...
1720
  	if (rcu_is_nocb_cpu(rdp->cpu))
3fbfbf7a3   Paul E. McKenney   rcu: Add callback...
1721
  		return;
b1420f1c8   Paul E. McKenney   rcu: Make rcu_bar...
1722
1723
  	/*
  	 * Orphan the callbacks.  First adjust the counts.  This is safe
abfd6e58a   Paul E. McKenney   rcu: Fix comment ...
1724
1725
  	 * because _rcu_barrier() excludes CPU-hotplug operations, so it
  	 * cannot be running now.  Thus no memory barrier is required.
b1420f1c8   Paul E. McKenney   rcu: Make rcu_bar...
1726
  	 */
a50c3af91   Paul E. McKenney   rcu: Don't make c...
1727
  	if (rdp->nxtlist != NULL) {
b1420f1c8   Paul E. McKenney   rcu: Make rcu_bar...
1728
1729
1730
  		rsp->qlen_lazy += rdp->qlen_lazy;
  		rsp->qlen += rdp->qlen;
  		rdp->n_cbs_orphaned += rdp->qlen;
a50c3af91   Paul E. McKenney   rcu: Don't make c...
1731
  		rdp->qlen_lazy = 0;
1d1fb395f   Paul E. McKenney   rcu: Add ACCESS_O...
1732
  		ACCESS_ONCE(rdp->qlen) = 0;
a50c3af91   Paul E. McKenney   rcu: Don't make c...
1733
1734
1735
  	}
  
  	/*
b1420f1c8   Paul E. McKenney   rcu: Make rcu_bar...
1736
1737
1738
1739
1740
1741
1742
  	 * Next, move those callbacks still needing a grace period to
  	 * the orphanage, where some other CPU will pick them up.
  	 * Some of the callbacks might have gone partway through a grace
  	 * period, but that is too bad.  They get to start over because we
  	 * cannot assume that grace periods are synchronized across CPUs.
  	 * We don't bother updating the ->nxttail[] array yet, instead
  	 * we just reset the whole thing later on.
a50c3af91   Paul E. McKenney   rcu: Don't make c...
1743
  	 */
b1420f1c8   Paul E. McKenney   rcu: Make rcu_bar...
1744
1745
1746
1747
  	if (*rdp->nxttail[RCU_DONE_TAIL] != NULL) {
  		*rsp->orphan_nxttail = *rdp->nxttail[RCU_DONE_TAIL];
  		rsp->orphan_nxttail = rdp->nxttail[RCU_NEXT_TAIL];
  		*rdp->nxttail[RCU_DONE_TAIL] = NULL;
a50c3af91   Paul E. McKenney   rcu: Don't make c...
1748
1749
1750
  	}
  
  	/*
b1420f1c8   Paul E. McKenney   rcu: Make rcu_bar...
1751
1752
1753
  	 * Then move the ready-to-invoke callbacks to the orphanage,
  	 * where some other CPU will pick them up.  These will not be
  	 * required to pass though another grace period: They are done.
a50c3af91   Paul E. McKenney   rcu: Don't make c...
1754
  	 */
e56014000   Paul E. McKenney   rcu: Simplify off...
1755
  	if (rdp->nxtlist != NULL) {
b1420f1c8   Paul E. McKenney   rcu: Make rcu_bar...
1756
1757
  		*rsp->orphan_donetail = rdp->nxtlist;
  		rsp->orphan_donetail = rdp->nxttail[RCU_DONE_TAIL];
e56014000   Paul E. McKenney   rcu: Simplify off...
1758
  	}
e74f4c456   Paul E. McKenney   rcu: Make hot-unp...
1759

b1420f1c8   Paul E. McKenney   rcu: Make rcu_bar...
1760
  	/* Finally, initialize the rcu_data structure's list to empty.  */
3f5d3ea64   Paul E. McKenney   rcu: Consolidate ...
1761
  	init_callback_list(rdp);
b1420f1c8   Paul E. McKenney   rcu: Make rcu_bar...
1762
1763
1764
1765
  }
  
  /*
   * Move every callback in the specified rcu_state structure's orphanage
   * onto the current CPU's callback list.  The caller must hold the
   * ->orphan_lock.
   */
  static void rcu_adopt_orphan_cbs(struct rcu_state *rsp)
  {
  	int i;
  	struct rcu_head **old_done_tail;
  	struct rcu_data *rdp = __this_cpu_ptr(rsp->rda);

  	/* No-CBs CPUs are handled specially. */
  	if (rcu_nocb_adopt_orphan_cbs(rsp, rdp))
  		return;

  	/* Accounting first: take over the orphanage's counts. */
  	rdp->qlen_lazy += rsp->qlen_lazy;
  	rdp->qlen += rsp->qlen;
  	rdp->n_cbs_adopted += rsp->qlen;
  	if (rsp->qlen_lazy != rsp->qlen)
  		rcu_idle_count_callbacks_posted();
  	rsp->qlen_lazy = 0;
  	rsp->qlen = 0;

  	/*
  	 * We do not need a memory barrier here because the only way we
  	 * can get here if there is an rcu_barrier() in flight is if
  	 * we are the task doing the rcu_barrier().
  	 */

  	/*
  	 * Splice the ready-to-invoke orphans in at the end of this CPU's
  	 * done segment, then move every tail pointer that referenced the
  	 * old end of that segment to the end of the spliced-in list.
  	 */
  	if (rsp->orphan_donelist) {
  		old_done_tail = rdp->nxttail[RCU_DONE_TAIL];
  		*rsp->orphan_donetail = *old_done_tail;
  		*old_done_tail = rsp->orphan_donelist;
  		for (i = RCU_DONE_TAIL; i < RCU_NEXT_SIZE; i++)
  			if (rdp->nxttail[i] == old_done_tail)
  				rdp->nxttail[i] = rsp->orphan_donetail;
  		rsp->orphan_donelist = NULL;
  		rsp->orphan_donetail = &rsp->orphan_donelist;
  	}

  	/* Orphans still needing a grace period go at the very end. */
  	if (rsp->orphan_nxtlist) {
  		*rdp->nxttail[RCU_NEXT_TAIL] = rsp->orphan_nxtlist;
  		rdp->nxttail[RCU_NEXT_TAIL] = rsp->orphan_nxttail;
  		rsp->orphan_nxtlist = NULL;
  		rsp->orphan_nxttail = &rsp->orphan_nxtlist;
  	}
  }
  
  /*
   * Trace the fact that this CPU is going offline.
   */
  static void rcu_cleanup_dying_cpu(struct rcu_state *rsp)
  {
  	RCU_TRACE(unsigned long mask);
  	RCU_TRACE(struct rcu_data *rdp = this_cpu_ptr(rsp->rda));
  	RCU_TRACE(struct rcu_node *rnp = rdp->mynode);
  
  	RCU_TRACE(mask = rdp->grpmask);
e56014000   Paul E. McKenney   rcu: Simplify off...
1820
1821
1822
  	trace_rcu_grace_period(rsp->name,
  			       rnp->gpnum + 1 - !!(rnp->qsmask & mask),
  			       "cpuofl");
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
1823
1824
1825
  }
  
  /*
e56014000   Paul E. McKenney   rcu: Simplify off...
1826
   * The CPU has been completely removed, and some other CPU is reporting
b1420f1c8   Paul E. McKenney   rcu: Make rcu_bar...
1827
1828
   * this fact from process context.  Do the remainder of the cleanup,
   * including orphaning the outgoing CPU's RCU callbacks, and also
1331e7a1b   Paul E. McKenney   rcu: Remove _rcu_...
1829
1830
   * adopting them.  There can only be one CPU hotplug operation at a time,
   * so no other CPU can be attempting to update rcu_cpu_kthread_task.
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
1831
   */
e56014000   Paul E. McKenney   rcu: Simplify off...
1832
  static void rcu_cleanup_dead_cpu(int cpu, struct rcu_state *rsp)
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
1833
  {
2036d94a7   Paul E. McKenney   rcu: Rework detec...
1834
1835
1836
  	unsigned long flags;
  	unsigned long mask;
  	int need_report = 0;
e56014000   Paul E. McKenney   rcu: Simplify off...
1837
  	struct rcu_data *rdp = per_cpu_ptr(rsp->rda, cpu);
b1420f1c8   Paul E. McKenney   rcu: Make rcu_bar...
1838
  	struct rcu_node *rnp = rdp->mynode;  /* Outgoing CPU's rdp & rnp. */
e56014000   Paul E. McKenney   rcu: Simplify off...
1839

2036d94a7   Paul E. McKenney   rcu: Rework detec...
1840
  	/* Adjust any no-longer-needed kthreads. */
5d01bbd11   Thomas Gleixner   rcu: Yield simpler
1841
  	rcu_boost_kthread_setaffinity(rnp, -1);
2036d94a7   Paul E. McKenney   rcu: Rework detec...
1842

b1420f1c8   Paul E. McKenney   rcu: Make rcu_bar...
1843
  	/* Remove the dead CPU from the bitmasks in the rcu_node hierarchy. */
2036d94a7   Paul E. McKenney   rcu: Rework detec...
1844
1845
  
  	/* Exclude any attempts to start a new grace period. */
a4fbe35a1   Paul E. McKenney   rcu: Grace-period...
1846
  	mutex_lock(&rsp->onoff_mutex);
7b2e6011f   Paul E. McKenney   rcu: Rename ->ono...
1847
  	raw_spin_lock_irqsave(&rsp->orphan_lock, flags);
2036d94a7   Paul E. McKenney   rcu: Rework detec...
1848

b1420f1c8   Paul E. McKenney   rcu: Make rcu_bar...
1849
1850
1851
  	/* Orphan the dead CPU's callbacks, and adopt them if appropriate. */
  	rcu_send_cbs_to_orphanage(cpu, rsp, rnp, rdp);
  	rcu_adopt_orphan_cbs(rsp);
2036d94a7   Paul E. McKenney   rcu: Rework detec...
1852
1853
1854
1855
1856
1857
1858
1859
1860
1861
1862
1863
1864
1865
1866
1867
1868
1869
1870
1871
1872
  	/* Remove the outgoing CPU from the masks in the rcu_node hierarchy. */
  	mask = rdp->grpmask;	/* rnp->grplo is constant. */
  	do {
  		raw_spin_lock(&rnp->lock);	/* irqs already disabled. */
  		rnp->qsmaskinit &= ~mask;
  		if (rnp->qsmaskinit != 0) {
  			if (rnp != rdp->mynode)
  				raw_spin_unlock(&rnp->lock); /* irqs remain disabled. */
  			break;
  		}
  		if (rnp == rdp->mynode)
  			need_report = rcu_preempt_offline_tasks(rsp, rnp, rdp);
  		else
  			raw_spin_unlock(&rnp->lock); /* irqs remain disabled. */
  		mask = rnp->grpmask;
  		rnp = rnp->parent;
  	} while (rnp != NULL);
  
  	/*
  	 * We still hold the leaf rcu_node structure lock here, and
  	 * irqs are still disabled.  The reason for this subterfuge is
7b2e6011f   Paul E. McKenney   rcu: Rename ->ono...
1873
  	 * because invoking rcu_report_unblock_qs_rnp() with ->orphan_lock
2036d94a7   Paul E. McKenney   rcu: Rework detec...
1874
1875
  	 * held leads to deadlock.
  	 */
7b2e6011f   Paul E. McKenney   rcu: Rename ->ono...
1876
  	raw_spin_unlock(&rsp->orphan_lock); /* irqs remain disabled. */
2036d94a7   Paul E. McKenney   rcu: Rework detec...
1877
1878
1879
1880
1881
1882
1883
  	rnp = rdp->mynode;
  	if (need_report & RCU_OFL_TASKS_NORM_GP)
  		rcu_report_unblock_qs_rnp(rnp, flags);
  	else
  		raw_spin_unlock_irqrestore(&rnp->lock, flags);
  	if (need_report & RCU_OFL_TASKS_EXP_GP)
  		rcu_report_exp_rnp(rsp, rnp, true);
cf01537ec   Paul E. McKenney   rcu: Add check fo...
1884
1885
1886
1887
  	WARN_ONCE(rdp->qlen != 0 || rdp->nxtlist != NULL,
  		  "rcu_cleanup_dead_cpu: Callbacks on offline CPU %d: qlen=%lu, nxtlist=%p
  ",
  		  cpu, rdp->qlen, rdp->nxtlist);
0d8ee37e2   Paul E. McKenney   rcu: Disallow cal...
1888
1889
1890
  	init_callback_list(rdp);
  	/* Disallow further callbacks on this CPU. */
  	rdp->nxttail[RCU_NEXT_TAIL] = NULL;
a4fbe35a1   Paul E. McKenney   rcu: Grace-period...
1891
  	mutex_unlock(&rsp->onoff_mutex);
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
1892
1893
1894
  }
  
  #else /* #ifdef CONFIG_HOTPLUG_CPU */
e56014000   Paul E. McKenney   rcu: Simplify off...
1895
  /* Variant built when CONFIG_HOTPLUG_CPU is not set: intentionally empty. */
  static void rcu_cleanup_dying_cpu(struct rcu_state *rsp)
e74f4c456   Paul E. McKenney   rcu: Make hot-unp...
1896
1897
  {
  }
e56014000   Paul E. McKenney   rcu: Simplify off...
1898
  /* Variant built when CONFIG_HOTPLUG_CPU is not set: intentionally empty. */
  static void rcu_cleanup_dead_cpu(int cpu, struct rcu_state *rsp)
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
1899
1900
1901
1902
1903
1904
1905
1906
1907
  {
  }
  
  #endif /* #else #ifdef CONFIG_HOTPLUG_CPU */
  
  /*
   * Invoke any RCU callbacks that have made it to the end of their grace
   * period.  Thottle as specified by rdp->blimit.
   */
37c72e56f   Paul E. McKenney   rcu: Prevent RCU ...
1908
  static void rcu_do_batch(struct rcu_state *rsp, struct rcu_data *rdp)
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
1909
1910
1911
  {
  	unsigned long flags;
  	struct rcu_head *next, *list, **tail;
878d7439d   Eric Dumazet   rcu: Fix batch-li...
1912
1913
  	long bl, count, count_lazy;
  	int i;
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
1914

dc35c8934   Paul E. McKenney   rcu: Tag callback...
1915
  	/* If no callbacks are ready, just return. */
29c00b4a1   Paul E. McKenney   rcu: Add event-tr...
1916
  	if (!cpu_has_callbacks_ready_to_invoke(rdp)) {
486e25934   Paul E. McKenney   rcu: Avoid waking...
1917
  		trace_rcu_batch_start(rsp->name, rdp->qlen_lazy, rdp->qlen, 0);
4968c300e   Paul E. McKenney   rcu: Augment rcu_...
1918
1919
1920
  		trace_rcu_batch_end(rsp->name, 0, !!ACCESS_ONCE(rdp->nxtlist),
  				    need_resched(), is_idle_task(current),
  				    rcu_is_callbacks_kthread());
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
1921
  		return;
29c00b4a1   Paul E. McKenney   rcu: Add event-tr...
1922
  	}
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
1923
1924
1925
1926
1927
1928
  
  	/*
  	 * Extract the list of ready callbacks, disabling to prevent
  	 * races with call_rcu() from interrupt handlers.
  	 */
  	local_irq_save(flags);
8146c4e2e   Paul E. McKenney   rcu: Check for ca...
1929
  	WARN_ON_ONCE(cpu_is_offline(smp_processor_id()));
29c00b4a1   Paul E. McKenney   rcu: Add event-tr...
1930
  	bl = rdp->blimit;
486e25934   Paul E. McKenney   rcu: Avoid waking...
1931
  	trace_rcu_batch_start(rsp->name, rdp->qlen_lazy, rdp->qlen, bl);
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
1932
1933
1934
1935
  	list = rdp->nxtlist;
  	rdp->nxtlist = *rdp->nxttail[RCU_DONE_TAIL];
  	*rdp->nxttail[RCU_DONE_TAIL] = NULL;
  	tail = rdp->nxttail[RCU_DONE_TAIL];
b41772abe   Paul E. McKenney   rcu: Stop rcu_do_...
1936
1937
1938
  	for (i = RCU_NEXT_SIZE - 1; i >= 0; i--)
  		if (rdp->nxttail[i] == rdp->nxttail[RCU_DONE_TAIL])
  			rdp->nxttail[i] = &rdp->nxtlist;
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
1939
1940
1941
  	local_irq_restore(flags);
  
  	/* Invoke callbacks. */
486e25934   Paul E. McKenney   rcu: Avoid waking...
1942
  	count = count_lazy = 0;
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
1943
1944
1945
  	while (list) {
  		next = list->next;
  		prefetch(next);
551d55a94   Mathieu Desnoyers   tree/tiny rcu: Ad...
1946
  		debug_rcu_head_unqueue(list);
486e25934   Paul E. McKenney   rcu: Avoid waking...
1947
1948
  		if (__rcu_reclaim(rsp->name, list))
  			count_lazy++;
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
1949
  		list = next;
dff1672d9   Paul E. McKenney   rcu: Keep invokin...
1950
1951
1952
1953
  		/* Stop only if limit reached and CPU has something to do. */
  		if (++count >= bl &&
  		    (need_resched() ||
  		     (!is_idle_task(current) && !rcu_is_callbacks_kthread())))
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
1954
1955
1956
1957
  			break;
  	}
  
  	local_irq_save(flags);
4968c300e   Paul E. McKenney   rcu: Augment rcu_...
1958
1959
1960
  	trace_rcu_batch_end(rsp->name, count, !!list, need_resched(),
  			    is_idle_task(current),
  			    rcu_is_callbacks_kthread());
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
1961
1962
  
  	/* Update count, and requeue any remaining callbacks. */
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
1963
1964
1965
  	if (list != NULL) {
  		*tail = rdp->nxtlist;
  		rdp->nxtlist = list;
b41772abe   Paul E. McKenney   rcu: Stop rcu_do_...
1966
1967
1968
  		for (i = 0; i < RCU_NEXT_SIZE; i++)
  			if (&rdp->nxtlist == rdp->nxttail[i])
  				rdp->nxttail[i] = tail;
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
1969
1970
1971
  			else
  				break;
  	}
b1420f1c8   Paul E. McKenney   rcu: Make rcu_bar...
1972
1973
  	smp_mb(); /* List handling before counting for rcu_barrier(). */
  	rdp->qlen_lazy -= count_lazy;
1d1fb395f   Paul E. McKenney   rcu: Add ACCESS_O...
1974
  	ACCESS_ONCE(rdp->qlen) -= count;
b1420f1c8   Paul E. McKenney   rcu: Make rcu_bar...
1975
  	rdp->n_cbs_invoked += count;
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
1976
1977
1978
1979
  
  	/* Reinstate batch limit if we have worked down the excess. */
  	if (rdp->blimit == LONG_MAX && rdp->qlen <= qlowmark)
  		rdp->blimit = blimit;
37c72e56f   Paul E. McKenney   rcu: Prevent RCU ...
1980
1981
1982
1983
1984
1985
  	/* Reset ->qlen_last_fqs_check trigger if enough CBs have drained. */
  	if (rdp->qlen == 0 && rdp->qlen_last_fqs_check != 0) {
  		rdp->qlen_last_fqs_check = 0;
  		rdp->n_force_qs_snap = rsp->n_force_qs;
  	} else if (rdp->qlen < rdp->qlen_last_fqs_check - qhimark)
  		rdp->qlen_last_fqs_check = rdp->qlen;
cfca92797   Paul E. McKenney   rcu: Introduce ch...
1986
  	WARN_ON_ONCE((rdp->nxtlist == NULL) != (rdp->qlen == 0));
37c72e56f   Paul E. McKenney   rcu: Prevent RCU ...
1987

64db4cfff   Paul E. McKenney   "Tree RCU": scala...
1988
  	local_irq_restore(flags);
e0f23060a   Paul E. McKenney   rcu: Update comme...
1989
  	/* Re-invoke RCU core processing if there are callbacks remaining. */
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
1990
  	if (cpu_has_callbacks_ready_to_invoke(rdp))
a46e0899e   Paul E. McKenney   rcu: use softirq ...
1991
  		invoke_rcu_core();
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
1992
1993
1994
1995
1996
  }
  
  /*
   * Check to see if this CPU is in a non-context-switch quiescent state
   * (user mode or idle loop for rcu, non-softirq execution for rcu_bh).
   * Also schedule RCU core processing.
   *
   * This function must be called from hardirq context.  It is normally
   * invoked from the scheduling-clock interrupt.  If rcu_pending returns
   * false, there is no point in invoking rcu_check_callbacks().
   */
  void rcu_check_callbacks(int cpu, int user)
  {
  	trace_rcu_utilization("Start scheduler-tick");
  	increment_cpu_stall_ticks();

  	if (user || rcu_is_cpu_rrupt_from_idle()) {
  		/*
  		 * The interrupt arrived from user mode or from the idle
  		 * loop and is not nested, so the CPU is in a quiescent
  		 * state for both flavors: note it.
  		 *
  		 * No memory barrier is required here because both
  		 * rcu_sched_qs() and rcu_bh_qs() reference only CPU-local
  		 * variables that other CPUs neither access nor modify,
  		 * at least not while the corresponding CPU is online.
  		 */
  		rcu_sched_qs(cpu);
  		rcu_bh_qs(cpu);
  	} else if (!in_softirq()) {
  		/*
  		 * The interrupt did not arrive from softirq, in other
  		 * words, it is not interrupting an rcu_bh read-side
  		 * critical section.  This is an rcu_bh quiescent state,
  		 * so note it.
  		 */
  		rcu_bh_qs(cpu);
  	}

  	rcu_preempt_check_callbacks(cpu);

  	/* Kick the RCU core only if there is something for it to do. */
  	if (rcu_pending(cpu))
  		invoke_rcu_core();
  	trace_rcu_utilization("End scheduler-tick");
  }
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2038
2039
2040
  /*
   * Scan the leaf rcu_node structures, processing dyntick state for any that
   * have not yet encountered a quiescent state, using the function specified.
27f4d2805   Paul E. McKenney   rcu: priority boo...
2041
2042
   * Also initiate boosting for any threads blocked on the root rcu_node.
   *
ee47eb9f4   Paul E. McKenney   rcu: Remove leg o...
2043
   * The caller must have suppressed start of new grace periods.
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2044
   */
45f014c52   Paul E. McKenney   rcu: Remove redun...
2045
  static void force_qs_rnp(struct rcu_state *rsp, int (*f)(struct rcu_data *))
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2046
2047
2048
2049
2050
  {
  	unsigned long bit;
  	int cpu;
  	unsigned long flags;
  	unsigned long mask;
a0b6c9a78   Paul E. McKenney   rcu: Clean up cod...
2051
  	struct rcu_node *rnp;
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2052

a0b6c9a78   Paul E. McKenney   rcu: Clean up cod...
2053
  	rcu_for_each_leaf_node(rsp, rnp) {
b4be093fe   Paul E. McKenney   rcu: Allow RCU qu...
2054
  		cond_resched();
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2055
  		mask = 0;
1304afb22   Paul E. McKenney   rcu: Convert to r...
2056
  		raw_spin_lock_irqsave(&rnp->lock, flags);
ee47eb9f4   Paul E. McKenney   rcu: Remove leg o...
2057
  		if (!rcu_gp_in_progress(rsp)) {
1304afb22   Paul E. McKenney   rcu: Convert to r...
2058
  			raw_spin_unlock_irqrestore(&rnp->lock, flags);
0f10dc826   Paul E. McKenney   rcu: Eliminate rc...
2059
  			return;
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2060
  		}
a0b6c9a78   Paul E. McKenney   rcu: Clean up cod...
2061
  		if (rnp->qsmask == 0) {
1217ed1ba   Paul E. McKenney   rcu: permit rcu_r...
2062
  			rcu_initiate_boost(rnp, flags); /* releases rnp->lock */
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2063
2064
  			continue;
  		}
a0b6c9a78   Paul E. McKenney   rcu: Clean up cod...
2065
  		cpu = rnp->grplo;
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2066
  		bit = 1;
a0b6c9a78   Paul E. McKenney   rcu: Clean up cod...
2067
  		for (; cpu <= rnp->grphi; cpu++, bit <<= 1) {
394f99a90   Lai Jiangshan   rcu: simplify the...
2068
2069
  			if ((rnp->qsmask & bit) != 0 &&
  			    f(per_cpu_ptr(rsp->rda, cpu)))
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2070
2071
  				mask |= bit;
  		}
45f014c52   Paul E. McKenney   rcu: Remove redun...
2072
  		if (mask != 0) {
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2073

d3f6bad39   Paul E. McKenney   rcu: Rename "quie...
2074
2075
  			/* rcu_report_qs_rnp() releases rnp->lock. */
  			rcu_report_qs_rnp(mask, rsp, rnp, flags);
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2076
2077
  			continue;
  		}
1304afb22   Paul E. McKenney   rcu: Convert to r...
2078
  		raw_spin_unlock_irqrestore(&rnp->lock, flags);
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2079
  	}
27f4d2805   Paul E. McKenney   rcu: priority boo...
2080
  	rnp = rcu_get_root(rsp);
1217ed1ba   Paul E. McKenney   rcu: permit rcu_r...
2081
2082
2083
2084
  	if (rnp->qsmask == 0) {
  		raw_spin_lock_irqsave(&rnp->lock, flags);
  		rcu_initiate_boost(rnp, flags); /* releases rnp->lock. */
  	}
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2085
2086
2087
2088
2089
2090
  }
  
  /*
   * Force quiescent states on reluctant CPUs, and also detect which
   * CPUs are in dyntick-idle mode.
   */
4cdfc175c   Paul E. McKenney   rcu: Move quiesce...
2091
  static void force_quiescent_state(struct rcu_state *rsp)
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2092
2093
  {
  	unsigned long flags;
394f2769a   Paul E. McKenney   rcu: Prevent forc...
2094
2095
2096
2097
2098
2099
2100
2101
2102
2103
2104
2105
2106
2107
2108
2109
2110
2111
  	bool ret;
  	struct rcu_node *rnp;
  	struct rcu_node *rnp_old = NULL;
  
  	/* Funnel through hierarchy to reduce memory contention. */
  	rnp = per_cpu_ptr(rsp->rda, raw_smp_processor_id())->mynode;
  	for (; rnp != NULL; rnp = rnp->parent) {
  		ret = (ACCESS_ONCE(rsp->gp_flags) & RCU_GP_FLAG_FQS) ||
  		      !raw_spin_trylock(&rnp->fqslock);
  		if (rnp_old != NULL)
  			raw_spin_unlock(&rnp_old->fqslock);
  		if (ret) {
  			rsp->n_force_qs_lh++;
  			return;
  		}
  		rnp_old = rnp;
  	}
  	/* rnp_old == rcu_get_root(rsp), rnp == NULL. */
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2112

394f2769a   Paul E. McKenney   rcu: Prevent forc...
2113
2114
2115
2116
2117
2118
  	/* Reached the root of the rcu_node tree, acquire lock. */
  	raw_spin_lock_irqsave(&rnp_old->lock, flags);
  	raw_spin_unlock(&rnp_old->fqslock);
  	if (ACCESS_ONCE(rsp->gp_flags) & RCU_GP_FLAG_FQS) {
  		rsp->n_force_qs_lh++;
  		raw_spin_unlock_irqrestore(&rnp_old->lock, flags);
4cdfc175c   Paul E. McKenney   rcu: Move quiesce...
2119
  		return;  /* Someone beat us to it. */
46a1e34ed   Paul E. McKenney   rcu: Make force_q...
2120
  	}
4cdfc175c   Paul E. McKenney   rcu: Move quiesce...
2121
  	rsp->gp_flags |= RCU_GP_FLAG_FQS;
394f2769a   Paul E. McKenney   rcu: Prevent forc...
2122
  	raw_spin_unlock_irqrestore(&rnp_old->lock, flags);
4cdfc175c   Paul E. McKenney   rcu: Move quiesce...
2123
  	wake_up(&rsp->gp_wq);  /* Memory barrier implied by wake_up() path. */
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2124
  }
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2125
  /*
e0f23060a   Paul E. McKenney   rcu: Update comme...
2126
2127
2128
   * This does the RCU core processing work for the specified rcu_state
   * and rcu_data structures.  This may be called only from the CPU to
   * whom the rdp belongs.
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2129
2130
   */
  static void
1bca8cf1a   Paul E. McKenney   rcu: Remove unnee...
2131
  __rcu_process_callbacks(struct rcu_state *rsp)
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2132
2133
  {
  	unsigned long flags;
1bca8cf1a   Paul E. McKenney   rcu: Remove unnee...
2134
  	struct rcu_data *rdp = __this_cpu_ptr(rsp->rda);
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2135

2e5975580   Paul E. McKenney   rcu: Simplify RCU...
2136
  	WARN_ON_ONCE(rdp->beenonline == 0);
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2137
2138
2139
2140
  	/* Update RCU state based on any recent quiescent states. */
  	rcu_check_quiescent_state(rsp, rdp);
  
  	/* Does this CPU require a not-yet-started grace period? */
dc35c8934   Paul E. McKenney   rcu: Tag callback...
2141
  	local_irq_save(flags);
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2142
  	if (cpu_needs_another_gp(rsp, rdp)) {
dc35c8934   Paul E. McKenney   rcu: Tag callback...
2143
  		raw_spin_lock(&rcu_get_root(rsp)->lock); /* irqs disabled. */
b8462084a   Paul E. McKenney   rcu: Push lock re...
2144
2145
  		rcu_start_gp(rsp);
  		raw_spin_unlock_irqrestore(&rcu_get_root(rsp)->lock, flags);
dc35c8934   Paul E. McKenney   rcu: Tag callback...
2146
2147
  	} else {
  		local_irq_restore(flags);
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2148
2149
2150
  	}
  
  	/* If there are callbacks ready, invoke them. */
09223371d   Shaohua Li   rcu: Use softirq ...
2151
  	if (cpu_has_callbacks_ready_to_invoke(rdp))
a46e0899e   Paul E. McKenney   rcu: use softirq ...
2152
  		invoke_rcu_callbacks(rsp, rdp);
09223371d   Shaohua Li   rcu: Use softirq ...
2153
  }
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2154
  /*
e0f23060a   Paul E. McKenney   rcu: Update comme...
2155
   * Do RCU core processing for the current CPU.
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2156
   */
09223371d   Shaohua Li   rcu: Use softirq ...
2157
  static void rcu_process_callbacks(struct softirq_action *unused)
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2158
  {
6ce75a232   Paul E. McKenney   rcu: Introduce fo...
2159
  	struct rcu_state *rsp;
bfa00b4c4   Paul E. McKenney   rcu: Prevent offl...
2160
2161
  	if (cpu_is_offline(smp_processor_id()))
  		return;
300df91ca   Paul E. McKenney   rcu: Event-trace ...
2162
  	trace_rcu_utilization("Start RCU core");
6ce75a232   Paul E. McKenney   rcu: Introduce fo...
2163
2164
  	for_each_rcu_flavor(rsp)
  		__rcu_process_callbacks(rsp);
300df91ca   Paul E. McKenney   rcu: Event-trace ...
2165
  	trace_rcu_utilization("End RCU core");
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2166
  }
a26ac2455   Paul E. McKenney   rcu: move TREE_RC...
2167
  /*
e0f23060a   Paul E. McKenney   rcu: Update comme...
2168
2169
2170
2171
2172
   * Schedule RCU callback invocation.  If the specified type of RCU
   * does not support RCU priority boosting, just do a direct call,
   * otherwise wake up the per-CPU kernel kthread.  Note that because we
   * are running on the current CPU with interrupts disabled, the
   * rcu_cpu_kthread_task cannot disappear out from under us.
a26ac2455   Paul E. McKenney   rcu: move TREE_RC...
2173
   */
a46e0899e   Paul E. McKenney   rcu: use softirq ...
2174
  static void invoke_rcu_callbacks(struct rcu_state *rsp, struct rcu_data *rdp)
a26ac2455   Paul E. McKenney   rcu: move TREE_RC...
2175
  {
b0d304172   Paul E. McKenney   rcu: Prevent RCU ...
2176
2177
  	if (unlikely(!ACCESS_ONCE(rcu_scheduler_fully_active)))
  		return;
a46e0899e   Paul E. McKenney   rcu: use softirq ...
2178
2179
  	if (likely(!rsp->boost)) {
  		rcu_do_batch(rsp, rdp);
a26ac2455   Paul E. McKenney   rcu: move TREE_RC...
2180
2181
  		return;
  	}
a46e0899e   Paul E. McKenney   rcu: use softirq ...
2182
  	invoke_rcu_callbacks_kthread();
a26ac2455   Paul E. McKenney   rcu: move TREE_RC...
2183
  }
a46e0899e   Paul E. McKenney   rcu: use softirq ...
2184
  static void invoke_rcu_core(void)
09223371d   Shaohua Li   rcu: Use softirq ...
2185
  {
b0f740360   Paul E. McKenney   rcu: Avoid invoki...
2186
2187
  	if (cpu_online(smp_processor_id()))
  		raise_softirq(RCU_SOFTIRQ);
09223371d   Shaohua Li   rcu: Use softirq ...
2188
  }
29154c57e   Paul E. McKenney   rcu: Split RCU co...
2189
2190
2191
2192
2193
  /*
   * Handle any core-RCU processing required by a call_rcu() invocation.
   */
  static void __call_rcu_core(struct rcu_state *rsp, struct rcu_data *rdp,
  			    struct rcu_head *head, unsigned long flags)
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2194
  {
62fde6edf   Paul E. McKenney   rcu: Make __call_...
2195
2196
2197
2198
  	/*
  	 * If called from an extended quiescent state, invoke the RCU
  	 * core in order to force a re-evaluation of RCU's idleness.
  	 */
a16b7a693   Paul E. McKenney   rcu: Prevent __ca...
2199
  	if (rcu_is_cpu_idle() && cpu_online(smp_processor_id()))
62fde6edf   Paul E. McKenney   rcu: Make __call_...
2200
  		invoke_rcu_core();
a16b7a693   Paul E. McKenney   rcu: Prevent __ca...
2201
  	/* If interrupts were disabled or CPU offline, don't invoke RCU core. */
29154c57e   Paul E. McKenney   rcu: Split RCU co...
2202
  	if (irqs_disabled_flags(flags) || cpu_is_offline(smp_processor_id()))
2655d57ef   Paul E. McKenney   rcu: prevent call...
2203
  		return;
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2204

37c72e56f   Paul E. McKenney   rcu: Prevent RCU ...
2205
2206
2207
2208
2209
2210
2211
  	/*
  	 * Force the grace period if too many callbacks or too long waiting.
  	 * Enforce hysteresis, and don't invoke force_quiescent_state()
  	 * if some other CPU has recently done so.  Also, don't bother
  	 * invoking force_quiescent_state() if the newly enqueued callback
  	 * is the only one waiting for a grace period to complete.
  	 */
2655d57ef   Paul E. McKenney   rcu: prevent call...
2212
  	if (unlikely(rdp->qlen > rdp->qlen_last_fqs_check + qhimark)) {
b52573d27   Paul E. McKenney   rcu: reduce __cal...
2213
2214
  
  		/* Are we ignoring a completed grace period? */
470716fc0   Paul E. McKenney   rcu: Switch calle...
2215
  		note_gp_changes(rsp, rdp);
b52573d27   Paul E. McKenney   rcu: reduce __cal...
2216
2217
2218
  
  		/* Start a new grace period if one not already started. */
  		if (!rcu_gp_in_progress(rsp)) {
b52573d27   Paul E. McKenney   rcu: reduce __cal...
2219
  			struct rcu_node *rnp_root = rcu_get_root(rsp);
b8462084a   Paul E. McKenney   rcu: Push lock re...
2220
2221
2222
  			raw_spin_lock(&rnp_root->lock);
  			rcu_start_gp(rsp);
  			raw_spin_unlock(&rnp_root->lock);
b52573d27   Paul E. McKenney   rcu: reduce __cal...
2223
2224
2225
2226
2227
  		} else {
  			/* Give the grace period a kick. */
  			rdp->blimit = LONG_MAX;
  			if (rsp->n_force_qs == rdp->n_force_qs_snap &&
  			    *rdp->nxttail[RCU_DONE_TAIL] != head)
4cdfc175c   Paul E. McKenney   rcu: Move quiesce...
2228
  				force_quiescent_state(rsp);
b52573d27   Paul E. McKenney   rcu: reduce __cal...
2229
2230
2231
  			rdp->n_force_qs_snap = rsp->n_force_qs;
  			rdp->qlen_last_fqs_check = rdp->qlen;
  		}
4cdfc175c   Paul E. McKenney   rcu: Move quiesce...
2232
  	}
29154c57e   Paul E. McKenney   rcu: Split RCU co...
2233
  }
3fbfbf7a3   Paul E. McKenney   rcu: Add callback...
2234
2235
2236
2237
2238
2239
  /*
   * Helper function for call_rcu() and friends.  The cpu argument will
   * normally be -1, indicating "currently running CPU".  It may specify
   * a CPU only if that CPU is a no-CBs CPU.  Currently, only _rcu_barrier()
   * is expected to specify a CPU.
   */
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2240
2241
  /*
   * @head: callback structure to queue; its ->func and ->next are set here.
   * @func: function stored in head->func.
   * @rsp:  RCU flavor whose per-CPU rcu_data receives the callback.
   * @cpu:  -1 for the running CPU, otherwise the CPU whose rcu_data is used.
   * @lazy: passed to __call_rcu_nocb(); when true the callback is also
   *        counted in ->qlen_lazy.
   */
  static void
  __call_rcu(struct rcu_head *head, void (*func)(struct rcu_head *rcu),
3fbfbf7a3   Paul E. McKenney   rcu: Add callback...
2242
  	   struct rcu_state *rsp, int cpu, bool lazy)
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2243
2244
2245
  {
  	unsigned long flags;
  	struct rcu_data *rdp;
0bb7b59d6   Paul E. McKenney   rcu: Add diagnost...
2246
  	WARN_ON_ONCE((unsigned long)head & 0x3); /* Misaligned rcu_head! */
551d55a94   Mathieu Desnoyers   tree/tiny rcu: Ad...
2247
  	debug_rcu_head_queue(head);
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2248
2249
  	/* The callback is appended at the tail below, so it has no successor. */
  	head->func = func;
  	head->next = NULL;
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2250
2251
2252
2253
2254
2255
2256
  	/*
  	 * Opportunistically note grace-period endings and beginnings.
  	 * Note that we might see a beginning right after we see an
  	 * end, but never vice versa, since this CPU has to pass through
  	 * a quiescent state betweentimes.
  	 */
  	local_irq_save(flags);
394f99a90   Lai Jiangshan   rcu: simplify the...
2257
  	rdp = this_cpu_ptr(rsp->rda);
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2258
2259
  
  	/* Add the callback to our list. */
3fbfbf7a3   Paul E. McKenney   rcu: Add callback...
2260
2261
2262
2263
2264
2265
2266
  	/*
  	 * A NULL ->nxttail[RCU_NEXT_TAIL] or an explicitly specified CPU
  	 * diverts the callback to __call_rcu_nocb() instead of this list.
  	 */
  	if (unlikely(rdp->nxttail[RCU_NEXT_TAIL] == NULL) || cpu != -1) {
  		int offline;
  
  		if (cpu != -1)
  			rdp = per_cpu_ptr(rsp->rda, cpu);
  		offline = !__call_rcu_nocb(rdp, head, lazy);
  		WARN_ON_ONCE(offline);
0d8ee37e2   Paul E. McKenney   rcu: Disallow cal...
2267
  		/* __call_rcu() is illegal on offline CPU; leak the callback. */
0d8ee37e2   Paul E. McKenney   rcu: Disallow cal...
2268
2269
2270
  		local_irq_restore(flags);
  		return;
  	}
29154c57e   Paul E. McKenney   rcu: Split RCU co...
2271
  	/* Bump the counts first; the smp_mb() below orders them before the enqueue. */
  	ACCESS_ONCE(rdp->qlen)++;
486e25934   Paul E. McKenney   rcu: Avoid waking...
2272
2273
  	if (lazy)
  		rdp->qlen_lazy++;
c57afe80d   Paul E. McKenney   rcu: Make RCU_FAS...
2274
2275
  	else
  		rcu_idle_count_callbacks_posted();
b1420f1c8   Paul E. McKenney   rcu: Make rcu_bar...
2276
2277
2278
  	smp_mb();  /* Count before adding callback for rcu_barrier(). */
  	*rdp->nxttail[RCU_NEXT_TAIL] = head;
  	rdp->nxttail[RCU_NEXT_TAIL] = &head->next;
2655d57ef   Paul E. McKenney   rcu: prevent call...
2279

d4c08f2ac   Paul E. McKenney   rcu: Add grace-pe...
2280
2281
  	/* Trace the enqueue; kfree_rcu()-style offsets get their own event. */
  	if (__is_kfree_rcu_offset((unsigned long)func))
  		trace_rcu_kfree_callback(rsp->name, head, (unsigned long)func,
486e25934   Paul E. McKenney   rcu: Avoid waking...
2282
  					 rdp->qlen_lazy, rdp->qlen);
d4c08f2ac   Paul E. McKenney   rcu: Add grace-pe...
2283
  	else
486e25934   Paul E. McKenney   rcu: Avoid waking...
2284
  		trace_rcu_callback(rsp->name, head, rdp->qlen_lazy, rdp->qlen);
d4c08f2ac   Paul E. McKenney   rcu: Add grace-pe...
2285

29154c57e   Paul E. McKenney   rcu: Split RCU co...
2286
2287
  	/* Go handle any RCU core processing required. */
  	__call_rcu_core(rsp, rdp, head, flags);
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2288
2289
2290
2291
  	local_irq_restore(flags);
  }
  
  /*
d6714c22b   Paul E. McKenney   rcu: Renamings to...
2292
   * Queue an RCU-sched callback for invocation after a grace period.
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2293
   */
d6714c22b   Paul E. McKenney   rcu: Renamings to...
2294
  void call_rcu_sched(struct rcu_head *head, void (*func)(struct rcu_head *rcu))
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2295
  {
3fbfbf7a3   Paul E. McKenney   rcu: Add callback...
2296
  	/* Queue on rcu_sched_state; cpu of -1 selects the running CPU, lazy is 0. */
  	__call_rcu(head, func, &rcu_sched_state, -1, 0);
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2297
  }
d6714c22b   Paul E. McKenney   rcu: Renamings to...
2298
  EXPORT_SYMBOL_GPL(call_rcu_sched);
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2299
2300
  
  /*
486e25934   Paul E. McKenney   rcu: Avoid waking...
2301
   * Queue an RCU callback for invocation after a quicker grace period.
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2302
2303
2304
   */
  void call_rcu_bh(struct rcu_head *head, void (*func)(struct rcu_head *rcu))
  {
3fbfbf7a3   Paul E. McKenney   rcu: Add callback...
2305
  	/* Queue on rcu_bh_state; cpu of -1 selects the running CPU, lazy is 0. */
  	__call_rcu(head, func, &rcu_bh_state, -1, 0);
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2306
2307
  }
  EXPORT_SYMBOL_GPL(call_rcu_bh);
6d8133919   Paul E. McKenney   rcu: Document why...
2308
2309
2310
2311
2312
2313
2314
2315
  /*
   * Because a context switch is a grace period for RCU-sched and RCU-bh,
   * any blocking grace-period wait automatically implies a grace period
   * if there is only one CPU online at any point in time during execution
   * of either synchronize_sched() or synchronize_rcu_bh().  It is OK to
   * occasionally incorrectly indicate that there are multiple CPUs online
   * when there was in fact only one the whole time, as this just adds
   * some overhead: RCU still operates correctly.
6d8133919   Paul E. McKenney   rcu: Document why...
2316
2317
2318
   */
  static inline int rcu_blocking_is_gp(void)
  {
95f0c1de3   Paul E. McKenney   rcu: Disable pree...
2319
  	int ret;
6d8133919   Paul E. McKenney   rcu: Document why...
2320
  	might_sleep();  /* Check for RCU read-side critical section. */
95f0c1de3   Paul E. McKenney   rcu: Disable pree...
2321
2322
2323
2324
  	/*
  	 * Sample the online-CPU count with preemption disabled; the
  	 * result is nonzero when at most one CPU is online.
  	 */
  	preempt_disable();
  	ret = num_online_cpus() <= 1;
  	preempt_enable();
  	return ret;
6d8133919   Paul E. McKenney   rcu: Document why...
2325
  }
6ebb237be   Paul E. McKenney   rcu: Re-arrange c...
2326
2327
2328
2329
2330
2331
2332
2333
2334
2335
2336
2337
  /**
   * synchronize_sched - wait until an rcu-sched grace period has elapsed.
   *
   * Control will return to the caller some time after a full rcu-sched
   * grace period has elapsed, in other words after all currently executing
   * rcu-sched read-side critical sections have completed.   These read-side
   * critical sections are delimited by rcu_read_lock_sched() and
   * rcu_read_unlock_sched(), and may be nested.  Note that preempt_disable(),
   * local_irq_disable(), and so on may be used in place of
   * rcu_read_lock_sched().
   *
   * This means that all preempt_disable code sequences, including NMI and
f0a0e6f28   Paul E. McKenney   rcu: Clarify memo...
2338
2339
2340
2341
2342
2343
2344
2345
2346
2347
2348
2349
2350
2351
2352
2353
2354
2355
2356
2357
2358
2359
   * non-threaded hardware-interrupt handlers, in progress on entry will
   * have completed before this primitive returns.  However, this does not
   * guarantee that softirq handlers will have completed, since in some
   * kernels, these handlers can run in process context, and can block.
   *
   * Note that this guarantee implies further memory-ordering guarantees.
   * On systems with more than one CPU, when synchronize_sched() returns,
   * each CPU is guaranteed to have executed a full memory barrier since the
   * end of its last RCU-sched read-side critical section whose beginning
   * preceded the call to synchronize_sched().  In addition, each CPU having
   * an RCU read-side critical section that extends beyond the return from
   * synchronize_sched() is guaranteed to have executed a full memory barrier
   * after the beginning of synchronize_sched() and before the beginning of
   * that RCU read-side critical section.  Note that these guarantees include
   * CPUs that are offline, idle, or executing in user mode, as well as CPUs
   * that are executing in the kernel.
   *
   * Furthermore, if CPU A invoked synchronize_sched(), which returned
   * to its caller on CPU B, then both CPU A and CPU B are guaranteed
   * to have executed a full memory barrier during the execution of
   * synchronize_sched() -- even if CPU A and CPU B are the same CPU (but
   * again only if the system has more than one CPU).
6ebb237be   Paul E. McKenney   rcu: Re-arrange c...
2360
2361
2362
2363
2364
2365
2366
2367
2368
   *
   * This primitive provides the guarantees made by the (now removed)
   * synchronize_kernel() API.  In contrast, synchronize_rcu() only
   * guarantees that rcu_read_lock() sections will have completed.
   * In "classic RCU", these two guarantees happen to be one and
   * the same, but can differ in realtime RCU implementations.
   */
  void synchronize_sched(void)
  {
fe15d706c   Paul E. McKenney   rcu: Add lockdep-...
2369
2370
2371
2372
  	/* Assert that none of the three RCU lockdep maps is held by the caller. */
  	rcu_lockdep_assert(!lock_is_held(&rcu_bh_lock_map) &&
  			   !lock_is_held(&rcu_lock_map) &&
  			   !lock_is_held(&rcu_sched_lock_map),
  			   "Illegal synchronize_sched() in RCU-sched read-side critical section");
6ebb237be   Paul E. McKenney   rcu: Re-arrange c...
2373
2374
  	/* rcu_blocking_is_gp() reports at most one CPU online: nothing to wait for. */
  	if (rcu_blocking_is_gp())
  		return;
3705b88db   Antti P Miettinen   rcu: Add a module...
2375
2376
2377
2378
  	/* rcu_expedited selects the expedited primitive over a callback-based wait. */
  	if (rcu_expedited)
  		synchronize_sched_expedited();
  	else
  		wait_rcu_gp(call_rcu_sched);
6ebb237be   Paul E. McKenney   rcu: Re-arrange c...
2379
2380
2381
2382
2383
2384
2385
2386
2387
2388
2389
  }
  EXPORT_SYMBOL_GPL(synchronize_sched);
  
  /**
   * synchronize_rcu_bh - wait until an rcu_bh grace period has elapsed.
   *
   * Control will return to the caller some time after a full rcu_bh grace
   * period has elapsed, in other words after all currently executing rcu_bh
   * read-side critical sections have completed.  RCU read-side critical
   * sections are delimited by rcu_read_lock_bh() and rcu_read_unlock_bh(),
   * and may be nested.
f0a0e6f28   Paul E. McKenney   rcu: Clarify memo...
2390
2391
2392
   *
   * See the description of synchronize_sched() for more detailed information
   * on memory ordering guarantees.
6ebb237be   Paul E. McKenney   rcu: Re-arrange c...
2393
2394
2395
   */
  void synchronize_rcu_bh(void)
  {
fe15d706c   Paul E. McKenney   rcu: Add lockdep-...
2396
2397
2398
2399
  	/* Assert that none of the three RCU lockdep maps is held by the caller. */
  	rcu_lockdep_assert(!lock_is_held(&rcu_bh_lock_map) &&
  			   !lock_is_held(&rcu_lock_map) &&
  			   !lock_is_held(&rcu_sched_lock_map),
  			   "Illegal synchronize_rcu_bh() in RCU-bh read-side critical section");
6ebb237be   Paul E. McKenney   rcu: Re-arrange c...
2400
2401
  	/* rcu_blocking_is_gp() reports at most one CPU online: nothing to wait for. */
  	if (rcu_blocking_is_gp())
  		return;
3705b88db   Antti P Miettinen   rcu: Add a module...
2402
2403
2404
2405
  	/* rcu_expedited selects the expedited primitive over a callback-based wait. */
  	if (rcu_expedited)
  		synchronize_rcu_bh_expedited();
  	else
  		wait_rcu_gp(call_rcu_bh);
6ebb237be   Paul E. McKenney   rcu: Re-arrange c...
2406
2407
  }
  EXPORT_SYMBOL_GPL(synchronize_rcu_bh);
3d3b7db0a   Paul E. McKenney   rcu: Move synchro...
2408
2409
2410
2411
2412
2413
2414
2415
2416
2417
2418
2419
2420
2421
2422
2423
  static int synchronize_sched_expedited_cpu_stop(void *data)
  {
  	/*
  	 * Each CPU stopped via try_stop_cpus() must execute a full
  	 * memory barrier at some point between the call to
  	 * try_stop_cpus() and its return.
  	 *
  	 * The current initial cpu_stop implementation already
  	 * satisfies that requirement by the time control gets here,
  	 * so the smp_mb() below is not strictly needed.  It is kept
  	 * both to document the requirement and to remain robust
  	 * should the cpu_stop implementation change in the future.
  	 */
  	smp_mb(); /* Explicit barrier; see the block comment above. */
  	return 0;
  }
236fefafe   Paul E. McKenney   rcu: Call out dan...
2424
2425
2426
2427
2428
2429
2430
2431
2432
2433
  /**
   * synchronize_sched_expedited - Brute-force RCU-sched grace period
   *
   * Wait for an RCU-sched grace period to elapse, but use a "big hammer"
   * approach to force the grace period to end quickly.  This consumes
   * significant time on all CPUs and is unfriendly to real-time workloads,
   * so is thus not recommended for any sort of common-case code.  In fact,
   * if you are using synchronize_sched_expedited() in a loop, please
   * restructure your code to batch your updates, and then use a single
   * synchronize_sched() instead.
3d3b7db0a   Paul E. McKenney   rcu: Move synchro...
2434
   *
236fefafe   Paul E. McKenney   rcu: Call out dan...
2435
2436
2437
2438
   * Note that it is illegal to call this function while holding any lock
   * that is acquired by a CPU-hotplug notifier.  And yes, it is also illegal
   * to call this function from a CPU-hotplug notifier.  Failing to observe
   * these restrictions will result in deadlock.
3d3b7db0a   Paul E. McKenney   rcu: Move synchro...
2439
2440
2441
2442
2443
2444
2445
2446
2447
2448
2449
2450
2451
2452
2453
2454
2455
2456
2457
2458
2459
2460
2461
2462
   *
   * This implementation can be thought of as an application of ticket
   * locking to RCU, with rsp->expedited_start and
   * rsp->expedited_done taking on the roles of the halves
   * of the ticket-lock word.  Each task atomically increments
   * rsp->expedited_start upon entry, snapshotting the returned value,
   * then attempts to stop all the CPUs.  If this succeeds, then each
   * CPU will have executed a context switch, resulting in an RCU-sched
   * grace period.  We are then done, so we use atomic_long_cmpxchg() to
   * update rsp->expedited_done to match our snapshot -- but
   * only if someone else has not already advanced past our snapshot.
   *
   * On the other hand, if try_stop_cpus() fails, we check the value
   * of rsp->expedited_done.  If it has advanced past our
   * initial snapshot, then someone else must have forced a grace period
   * some time after we took our snapshot.  In this case, our work is
   * done for us, and we can simply return.  Otherwise, we try again,
   * but keep our initial snapshot for purposes of checking for someone
   * doing our work for us.
   *
   * If we fail too many times in a row, we fall back to synchronize_sched().
   */
  void synchronize_sched_expedited(void)
  {
1924bcb02   Paul E. McKenney   rcu: Avoid counte...
2463
2464
  	long firstsnap, s, snap;
  	int trycount = 0;
40694d664   Paul E. McKenney   rcu: Move synchro...
2465
  	struct rcu_state *rsp = &rcu_sched_state;
3d3b7db0a   Paul E. McKenney   rcu: Move synchro...
2466

1924bcb02   Paul E. McKenney   rcu: Avoid counte...
2467
2468
2469
2470
2471
2472
2473
2474
  	/*
  	 * If we are in danger of counter wrap, just do synchronize_sched().
  	 * By allowing rsp->expedited_start to advance no more than
  	 * ULONG_MAX/8 ahead of rsp->expedited_done, we are ensuring
  	 * that more than 3.5 billion CPUs would be required to force a
  	 * counter wrap on a 32-bit system.  Quite a few more CPUs would of
  	 * course be required on a 64-bit system.
  	 */
40694d664   Paul E. McKenney   rcu: Move synchro...
2475
2476
  	if (ULONG_CMP_GE((ulong)atomic_long_read(&rsp->expedited_start),
  			 (ulong)atomic_long_read(&rsp->expedited_done) +
1924bcb02   Paul E. McKenney   rcu: Avoid counte...
2477
2478
  			 ULONG_MAX / 8)) {
  		synchronize_sched();
a30489c52   Paul E. McKenney   rcu: Instrument s...
2479
  		atomic_long_inc(&rsp->expedited_wrap);
1924bcb02   Paul E. McKenney   rcu: Avoid counte...
2480
2481
  		return;
  	}
3d3b7db0a   Paul E. McKenney   rcu: Move synchro...
2482

1924bcb02   Paul E. McKenney   rcu: Avoid counte...
2483
2484
2485
2486
  	/*
  	 * Take a ticket.  Note that atomic_long_inc_return() implies a
  	 * full memory barrier.
  	 */
40694d664   Paul E. McKenney   rcu: Move synchro...
2487
  	snap = atomic_long_inc_return(&rsp->expedited_start);
1924bcb02   Paul E. McKenney   rcu: Avoid counte...
2488
  	/* firstsnap is never updated; the retry loop may refresh snap. */
  	firstsnap = snap;
3d3b7db0a   Paul E. McKenney   rcu: Move synchro...
2489
  	get_online_cpus();
1cc85961e   Hugh Dickins   rcu: Stop spuriou...
2490
  	WARN_ON_ONCE(cpu_is_offline(raw_smp_processor_id()));
3d3b7db0a   Paul E. McKenney   rcu: Move synchro...
2491
2492
2493
2494
2495
2496
2497
2498
2499
  
  	/*
  	 * Each pass through the following loop attempts to force a
  	 * context switch on each CPU.
  	 */
  	while (try_stop_cpus(cpu_online_mask,
  			     synchronize_sched_expedited_cpu_stop,
  			     NULL) == -EAGAIN) {
  		/* Attempt failed: undo get_online_cpus() before backing off. */
  		put_online_cpus();
a30489c52   Paul E. McKenney   rcu: Instrument s...
2500
  		atomic_long_inc(&rsp->expedited_tryfail);
3d3b7db0a   Paul E. McKenney   rcu: Move synchro...
2501

1924bcb02   Paul E. McKenney   rcu: Avoid counte...
2502
  		/* Check to see if someone else did our work for us. */
40694d664   Paul E. McKenney   rcu: Move synchro...
2503
  		s = atomic_long_read(&rsp->expedited_done);
1924bcb02   Paul E. McKenney   rcu: Avoid counte...
2504
  		if (ULONG_CMP_GE((ulong)s, (ulong)firstsnap)) {
a30489c52   Paul E. McKenney   rcu: Instrument s...
2505
2506
2507
  			/* ensure test happens before caller kfree */
  			smp_mb__before_atomic_inc(); /* ^^^ */
  			atomic_long_inc(&rsp->expedited_workdone1);
1924bcb02   Paul E. McKenney   rcu: Avoid counte...
2508
2509
  			return;
  		}
3d3b7db0a   Paul E. McKenney   rcu: Move synchro...
2510
2511
  
  		/* No joy, try again later.  Or just synchronize_sched(). */
c701d5d9b   Paul E. McKenney   rcu: Fix code-sty...
2512
  		if (trycount++ < 10) {
3d3b7db0a   Paul E. McKenney   rcu: Move synchro...
2513
  			/* Delay grows with each retry and with the online-CPU count. */
  			udelay(trycount * num_online_cpus());
c701d5d9b   Paul E. McKenney   rcu: Fix code-sty...
2514
  		} else {
3705b88db   Antti P Miettinen   rcu: Add a module...
2515
  			/* Already backed off ten times: wait for a normal grace period. */
  			wait_rcu_gp(call_rcu_sched);
a30489c52   Paul E. McKenney   rcu: Instrument s...
2516
  			atomic_long_inc(&rsp->expedited_normal);
3d3b7db0a   Paul E. McKenney   rcu: Move synchro...
2517
2518
  			return;
  		}
1924bcb02   Paul E. McKenney   rcu: Avoid counte...
2519
  		/* Recheck to see if someone else did our work for us. */
40694d664   Paul E. McKenney   rcu: Move synchro...
2520
  		s = atomic_long_read(&rsp->expedited_done);
1924bcb02   Paul E. McKenney   rcu: Avoid counte...
2521
  		if (ULONG_CMP_GE((ulong)s, (ulong)firstsnap)) {
a30489c52   Paul E. McKenney   rcu: Instrument s...
2522
2523
2524
  			/* ensure test happens before caller kfree */
  			smp_mb__before_atomic_inc(); /* ^^^ */
  			atomic_long_inc(&rsp->expedited_workdone2);
3d3b7db0a   Paul E. McKenney   rcu: Move synchro...
2525
2526
2527
2528
2529
  			return;
  		}
  
  		/*
  		 * Refetching rsp->expedited_start allows later
1924bcb02   Paul E. McKenney   rcu: Avoid counte...
2530
2531
2532
2533
  		 * callers to piggyback on our grace period.  We retry
  		 * after they started, so our grace period works for them,
  		 * and they started after our first try, so their grace
  		 * period works for us.
3d3b7db0a   Paul E. McKenney   rcu: Move synchro...
2534
2535
  		 */
  		get_online_cpus();
40694d664   Paul E. McKenney   rcu: Move synchro...
2536
  		snap = atomic_long_read(&rsp->expedited_start);
3d3b7db0a   Paul E. McKenney   rcu: Move synchro...
2537
2538
  		smp_mb(); /* ensure read is before try_stop_cpus(). */
  	}
a30489c52   Paul E. McKenney   rcu: Instrument s...
2539
  	atomic_long_inc(&rsp->expedited_stoppedcpus);
3d3b7db0a   Paul E. McKenney   rcu: Move synchro...
2540
2541
2542
2543
2544
  
  	/*
  	 * Everyone up to our most recent fetch is covered by our grace
  	 * period.  Update the counter, but only if our work is still
  	 * relevant -- which it won't be if someone who started later
1924bcb02   Paul E. McKenney   rcu: Avoid counte...
2545
  	 * than we did has already done their update.
3d3b7db0a   Paul E. McKenney   rcu: Move synchro...
2546
2547
  	 */
  	do {
a30489c52   Paul E. McKenney   rcu: Instrument s...
2548
  		atomic_long_inc(&rsp->expedited_done_tries);
40694d664   Paul E. McKenney   rcu: Move synchro...
2549
  		s = atomic_long_read(&rsp->expedited_done);
1924bcb02   Paul E. McKenney   rcu: Avoid counte...
2550
  		if (ULONG_CMP_GE((ulong)s, (ulong)snap)) {
a30489c52   Paul E. McKenney   rcu: Instrument s...
2551
2552
2553
  			/* ensure test happens before caller kfree */
  			smp_mb__before_atomic_inc(); /* ^^^ */
  			atomic_long_inc(&rsp->expedited_done_lost);
3d3b7db0a   Paul E. McKenney   rcu: Move synchro...
2554
2555
  			break;
  		}
40694d664   Paul E. McKenney   rcu: Move synchro...
2556
  	} while (atomic_long_cmpxchg(&rsp->expedited_done, s, snap) != s);
a30489c52   Paul E. McKenney   rcu: Instrument s...
2557
  	atomic_long_inc(&rsp->expedited_done_exit);
3d3b7db0a   Paul E. McKenney   rcu: Move synchro...
2558
2559
2560
2561
  
  	/* Pairs with the get_online_cpus() preceding the successful attempt. */
  	put_online_cpus();
  }
  EXPORT_SYMBOL_GPL(synchronize_sched_expedited);
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2562
2563
2564
2565
2566
2567
2568
2569
2570
  /*
   * Check to see if there is any immediate RCU-related work to be done
   * by the current CPU, for the specified type of RCU, returning 1 if so.
   * The checks are in order of increasing expense: checks that can be
   * carried out against CPU-local state are performed first.  However,
   * we must check for CPU stalls first, else we might not get a chance.
   */
  static int __rcu_pending(struct rcu_state *rsp, struct rcu_data *rdp)
  {
2f51f9884   Paul E. McKenney   rcu: Eliminate __...
2571
  	struct rcu_node *rnp = rdp->mynode;
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2572
2573
2574
2575
2576
2577
  	/* Count every call; the n_rp_* counters below record which check fired. */
  	rdp->n_rcu_pending++;
  
  	/* Check for CPU stalls, if enabled. */
  	check_cpu_stall(rsp, rdp);
  
  	/* Is the RCU core waiting for a quiescent state from this CPU? */
5c51dd734   Paul E. McKenney   rcu: Prevent earl...
2578
2579
  	if (rcu_scheduler_fully_active &&
  	    rdp->qs_pending && !rdp->passed_quiesce) {
d21670aca   Paul E. McKenney   rcu: reduce the n...
2580
  		/* Only counted here; the remaining checks still run. */
  		rdp->n_rp_qs_pending++;
e4cc1f22b   Paul E. McKenney   rcu: Simplify qui...
2581
  	} else if (rdp->qs_pending && rdp->passed_quiesce) {
d21670aca   Paul E. McKenney   rcu: reduce the n...
2582
  		rdp->n_rp_report_qs++;
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2583
  		return 1;
7ba5c840e   Paul E. McKenney   rcu: Add __rcu_pe...
2584
  	}
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2585
2586
  
  	/* Does this CPU have callbacks ready to invoke? */
7ba5c840e   Paul E. McKenney   rcu: Add __rcu_pe...
2587
2588
  	if (cpu_has_callbacks_ready_to_invoke(rdp)) {
  		rdp->n_rp_cb_ready++;
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2589
  		return 1;
7ba5c840e   Paul E. McKenney   rcu: Add __rcu_pe...
2590
  	}
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2591
2592
  
  	/* Has RCU gone idle with this CPU needing another grace period? */
7ba5c840e   Paul E. McKenney   rcu: Add __rcu_pe...
2593
2594
  	if (cpu_needs_another_gp(rsp, rdp)) {
  		rdp->n_rp_cpu_needs_gp++;
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2595
  		return 1;
7ba5c840e   Paul E. McKenney   rcu: Add __rcu_pe...
2596
  	}
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2597
2598
  
  	/* Has another RCU grace period completed?  */
2f51f9884   Paul E. McKenney   rcu: Eliminate __...
2599
  	if (ACCESS_ONCE(rnp->completed) != rdp->completed) { /* outside lock */
7ba5c840e   Paul E. McKenney   rcu: Add __rcu_pe...
2600
  		rdp->n_rp_gp_completed++;
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2601
  		return 1;
7ba5c840e   Paul E. McKenney   rcu: Add __rcu_pe...
2602
  	}
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2603
2604
  
  	/* Has a new RCU grace period started? */
2f51f9884   Paul E. McKenney   rcu: Eliminate __...
2605
  	if (ACCESS_ONCE(rnp->gpnum) != rdp->gpnum) { /* outside lock */
7ba5c840e   Paul E. McKenney   rcu: Add __rcu_pe...
2606
  		rdp->n_rp_gp_started++;
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2607
  		return 1;
7ba5c840e   Paul E. McKenney   rcu: Add __rcu_pe...
2608
  	}
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2609

64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2610
  	/* nothing to do */
7ba5c840e   Paul E. McKenney   rcu: Add __rcu_pe...
2611
  	rdp->n_rp_need_nothing++;
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2612
2613
2614
2615
2616
2617
2618
2619
  	return 0;
  }
  
  /*
   * Check to see if there is any immediate RCU-related work to be done
   * by the current CPU, returning 1 if so.  This function is part of the
   * RCU implementation; it is -not- an exported member of the RCU API.
   */
a157229ca   Paul E. McKenney   rcu: Simplify rcu...
2620
  static int rcu_pending(int cpu)
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2621
  {
6ce75a232   Paul E. McKenney   rcu: Introduce fo...
2622
2623
2624
2625
2626
2627
  	struct rcu_state *rsp;
  
  	/* Stop at the first RCU flavor reporting work for this CPU's rcu_data. */
  	for_each_rcu_flavor(rsp)
  		if (__rcu_pending(rsp, per_cpu_ptr(rsp->rda, cpu)))
  			return 1;
  	return 0;
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2628
2629
2630
  }
  
  /*
c0f4dfd4f   Paul E. McKenney   rcu: Make RCU_FAS...
2631
2632
2633
   * Return true if the specified CPU has any callback.  If all_lazy is
   * non-NULL, store an indication of whether all callbacks are lazy.
   * (If there are no callbacks, all of them are deemed to be lazy.)
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2634
   */
c0f4dfd4f   Paul E. McKenney   rcu: Make RCU_FAS...
2635
  static int rcu_cpu_has_callbacks(int cpu, bool *all_lazy)
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2636
  {
c0f4dfd4f   Paul E. McKenney   rcu: Make RCU_FAS...
2637
2638
2639
  	bool al = true;		/* "all lazy": cleared if any flavor has a non-lazy callback */
  	bool hc = false;	/* "has callbacks": set if any flavor has a non-empty list */
  	struct rcu_data *rdp;
6ce75a232   Paul E. McKenney   rcu: Introduce fo...
2640
  	struct rcu_state *rsp;
c0f4dfd4f   Paul E. McKenney   rcu: Make RCU_FAS...
2641
2642
2643
2644
2645
2646
2647
2648
2649
2650
  	/* Scan every flavor; no early exit, since both results need all of them. */
  	for_each_rcu_flavor(rsp) {
  		rdp = per_cpu_ptr(rsp->rda, cpu);
  		if (rdp->qlen != rdp->qlen_lazy)
  			al = false;
  		if (rdp->nxtlist)
  			hc = true;
  	}
  	if (all_lazy)
  		*all_lazy = al;
  	return hc;
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2651
  }
b1420f1c8   Paul E. McKenney   rcu: Make rcu_bar...
2652
  /*
a83eff0a8   Paul E. McKenney   rcu: Add tracing ...
2653
2654
2655
2656
2657
2658
2659
2660
2661
2662
2663
   * Helper function for _rcu_barrier() tracing.  If tracing is disabled,
   * the compiler is expected to optimize this away.
   */
  static void _rcu_barrier_trace(struct rcu_state *rsp, char *s, int cpu,
  			       unsigned long done)
  {
  	/* The count is read inside the call so it can vanish with the trace. */
  	trace_rcu_barrier(rsp->name, s, cpu,
  			  atomic_read(&rsp->barrier_cpu_count),
  			  done);
  }
  
  /*
b1420f1c8   Paul E. McKenney   rcu: Make rcu_bar...
2664
2665
2666
   * RCU callback function for _rcu_barrier().  If we are last, wake
   * up the task executing _rcu_barrier().
   */
24ebbca8e   Paul E. McKenney   rcu: Move rcu_bar...
2667
  static void rcu_barrier_callback(struct rcu_head *rhp)
d0ec774cb   Paul E. McKenney   rcu: Move rcu_bar...
2668
  {
24ebbca8e   Paul E. McKenney   rcu: Move rcu_bar...
2669
2670
  	/* rhp is the ->barrier_head embedded in a per-CPU rcu_data. */
  	struct rcu_data *rdp = container_of(rhp, struct rcu_data, barrier_head);
  	struct rcu_state *rsp = rdp->rsp;
a83eff0a8   Paul E. McKenney   rcu: Add tracing ...
2671
2672
  	/* Whoever drops ->barrier_cpu_count to zero signals the completion. */
  	if (atomic_dec_and_test(&rsp->barrier_cpu_count)) {
  		_rcu_barrier_trace(rsp, "LastCB", -1, rsp->n_barrier_done);
7db74df88   Paul E. McKenney   rcu: Move rcu_bar...
2673
  		complete(&rsp->barrier_completion);
a83eff0a8   Paul E. McKenney   rcu: Add tracing ...
2674
2675
2676
  	} else {
  		_rcu_barrier_trace(rsp, "CB", -1, rsp->n_barrier_done);
  	}
d0ec774cb   Paul E. McKenney   rcu: Move rcu_bar...
2677
2678
2679
2680
2681
2682
2683
  }
  
  /*
   * Called with preemption disabled, and from cross-cpu IRQ context.
   */
  static void rcu_barrier_func(void *type)
  {
037b64ed0   Paul E. McKenney   rcu: Place pointe...
2684
  	/* @type carries the struct rcu_state pointer for the flavor in question. */
  	struct rcu_state *rsp = type;
06668efa9   Paul E. McKenney   rcu: Move _rcu_ba...
2685
  	struct rcu_data *rdp = __this_cpu_ptr(rsp->rda);
d0ec774cb   Paul E. McKenney   rcu: Move rcu_bar...
2686

a83eff0a8   Paul E. McKenney   rcu: Add tracing ...
2687
  	_rcu_barrier_trace(rsp, "IRQ", -1, rsp->n_barrier_done);
24ebbca8e   Paul E. McKenney   rcu: Move rcu_bar...
2688
  	/* Count this CPU's callback before posting it; the callback decrements. */
  	atomic_inc(&rsp->barrier_cpu_count);
06668efa9   Paul E. McKenney   rcu: Move _rcu_ba...
2689
  	rsp->call(&rdp->barrier_head, rcu_barrier_callback);
d0ec774cb   Paul E. McKenney   rcu: Move rcu_bar...
2690
  }
d0ec774cb   Paul E. McKenney   rcu: Move rcu_bar...
2691
2692
2693
2694
  /*
   * Orchestrate the specified type of RCU barrier, waiting for all
   * RCU callbacks of the specified type to complete.
   */
037b64ed0   Paul E. McKenney   rcu: Place pointe...
2695
  static void _rcu_barrier(struct rcu_state *rsp)
d0ec774cb   Paul E. McKenney   rcu: Move rcu_bar...
2696
  {
b1420f1c8   Paul E. McKenney   rcu: Make rcu_bar...
2697
  	int cpu;
b1420f1c8   Paul E. McKenney   rcu: Make rcu_bar...
2698
  	struct rcu_data *rdp;
cf3a9c484   Paul E. McKenney   rcu: Increase rcu...
2699
2700
  	unsigned long snap = ACCESS_ONCE(rsp->n_barrier_done);
  	unsigned long snap_done;
b1420f1c8   Paul E. McKenney   rcu: Make rcu_bar...
2701

a83eff0a8   Paul E. McKenney   rcu: Add tracing ...
2702
  	_rcu_barrier_trace(rsp, "Begin", -1, snap);
b1420f1c8   Paul E. McKenney   rcu: Make rcu_bar...
2703

e74f4c456   Paul E. McKenney   rcu: Make hot-unp...
2704
  	/* Take mutex to serialize concurrent rcu_barrier() requests. */
7be7f0be9   Paul E. McKenney   rcu: Move rcu_bar...
2705
  	mutex_lock(&rsp->barrier_mutex);
b1420f1c8   Paul E. McKenney   rcu: Make rcu_bar...
2706

cf3a9c484   Paul E. McKenney   rcu: Increase rcu...
2707
2708
2709
2710
2711
2712
2713
2714
2715
2716
2717
2718
2719
  	/*
  	 * Ensure that all prior references, including to ->n_barrier_done,
  	 * are ordered before the _rcu_barrier() machinery.
  	 */
  	smp_mb();  /* See above block comment. */
  
  	/*
  	 * Recheck ->n_barrier_done to see if others did our work for us.
  	 * This means checking ->n_barrier_done for an even-to-odd-to-even
  	 * transition.  The "if" expression below therefore rounds the old
  	 * value up to the next even number and adds two before comparing.
  	 */
  	snap_done = ACCESS_ONCE(rsp->n_barrier_done);
a83eff0a8   Paul E. McKenney   rcu: Add tracing ...
2720
  	_rcu_barrier_trace(rsp, "Check", -1, snap_done);
cf3a9c484   Paul E. McKenney   rcu: Increase rcu...
2721
  	if (ULONG_CMP_GE(snap_done, ((snap + 1) & ~0x1) + 2)) {
a83eff0a8   Paul E. McKenney   rcu: Add tracing ...
2722
  		_rcu_barrier_trace(rsp, "EarlyExit", -1, snap_done);
cf3a9c484   Paul E. McKenney   rcu: Increase rcu...
2723
2724
2725
2726
2727
2728
2729
2730
2731
2732
2733
2734
  		smp_mb(); /* caller's subsequent code after above check. */
  		mutex_unlock(&rsp->barrier_mutex);
  		return;
  	}
  
  	/*
  	 * Increment ->n_barrier_done to avoid duplicate work.  Use
  	 * ACCESS_ONCE() to prevent the compiler from speculating
  	 * the increment to precede the early-exit check.
  	 */
  	ACCESS_ONCE(rsp->n_barrier_done)++;
  	WARN_ON_ONCE((rsp->n_barrier_done & 0x1) != 1);
a83eff0a8   Paul E. McKenney   rcu: Add tracing ...
2735
  	_rcu_barrier_trace(rsp, "Inc1", -1, rsp->n_barrier_done);
cf3a9c484   Paul E. McKenney   rcu: Increase rcu...
2736
  	smp_mb(); /* Order ->n_barrier_done increment with below mechanism. */
b1420f1c8   Paul E. McKenney   rcu: Make rcu_bar...
2737

d0ec774cb   Paul E. McKenney   rcu: Move rcu_bar...
2738
  	/*
b1420f1c8   Paul E. McKenney   rcu: Make rcu_bar...
2739
2740
  	 * Initialize the count to one rather than to zero in order to
  	 * avoid a too-soon return to zero in case of a short grace period
1331e7a1b   Paul E. McKenney   rcu: Remove _rcu_...
2741
2742
  	 * (or preemption of this task).  Exclude CPU-hotplug operations
  	 * to ensure that no offline CPU has callbacks queued.
d0ec774cb   Paul E. McKenney   rcu: Move rcu_bar...
2743
  	 */
7db74df88   Paul E. McKenney   rcu: Move rcu_bar...
2744
  	init_completion(&rsp->barrier_completion);
24ebbca8e   Paul E. McKenney   rcu: Move rcu_bar...
2745
  	atomic_set(&rsp->barrier_cpu_count, 1);
1331e7a1b   Paul E. McKenney   rcu: Remove _rcu_...
2746
  	get_online_cpus();
b1420f1c8   Paul E. McKenney   rcu: Make rcu_bar...
2747
2748
  
  	/*
1331e7a1b   Paul E. McKenney   rcu: Remove _rcu_...
2749
2750
2751
  	 * Force each CPU with callbacks to register a new callback.
  	 * When that callback is invoked, we will know that all of the
  	 * corresponding CPU's preceding callbacks have been invoked.
b1420f1c8   Paul E. McKenney   rcu: Make rcu_bar...
2752
  	 */
3fbfbf7a3   Paul E. McKenney   rcu: Add callback...
2753
  	for_each_possible_cpu(cpu) {
d1e43fa5f   Frederic Weisbecker   nohz: Ensure full...
2754
  		if (!cpu_online(cpu) && !rcu_is_nocb_cpu(cpu))
3fbfbf7a3   Paul E. McKenney   rcu: Add callback...
2755
  			continue;
b1420f1c8   Paul E. McKenney   rcu: Make rcu_bar...
2756
  		rdp = per_cpu_ptr(rsp->rda, cpu);
d1e43fa5f   Frederic Weisbecker   nohz: Ensure full...
2757
  		if (rcu_is_nocb_cpu(cpu)) {
3fbfbf7a3   Paul E. McKenney   rcu: Add callback...
2758
2759
2760
2761
2762
2763
  			_rcu_barrier_trace(rsp, "OnlineNoCB", cpu,
  					   rsp->n_barrier_done);
  			atomic_inc(&rsp->barrier_cpu_count);
  			__call_rcu(&rdp->barrier_head, rcu_barrier_callback,
  				   rsp, cpu, 0);
  		} else if (ACCESS_ONCE(rdp->qlen)) {
a83eff0a8   Paul E. McKenney   rcu: Add tracing ...
2764
2765
  			_rcu_barrier_trace(rsp, "OnlineQ", cpu,
  					   rsp->n_barrier_done);
037b64ed0   Paul E. McKenney   rcu: Place pointe...
2766
  			smp_call_function_single(cpu, rcu_barrier_func, rsp, 1);
b1420f1c8   Paul E. McKenney   rcu: Make rcu_bar...
2767
  		} else {
a83eff0a8   Paul E. McKenney   rcu: Add tracing ...
2768
2769
  			_rcu_barrier_trace(rsp, "OnlineNQ", cpu,
  					   rsp->n_barrier_done);
b1420f1c8   Paul E. McKenney   rcu: Make rcu_bar...
2770
2771
  		}
  	}
1331e7a1b   Paul E. McKenney   rcu: Remove _rcu_...
2772
  	put_online_cpus();
b1420f1c8   Paul E. McKenney   rcu: Make rcu_bar...
2773
2774
2775
2776
2777
  
  	/*
  	 * Now that we have an rcu_barrier_callback() callback on each
  	 * CPU, and thus each counted, remove the initial count.
  	 */
24ebbca8e   Paul E. McKenney   rcu: Move rcu_bar...
2778
  	if (atomic_dec_and_test(&rsp->barrier_cpu_count))
7db74df88   Paul E. McKenney   rcu: Move rcu_bar...
2779
  		complete(&rsp->barrier_completion);
b1420f1c8   Paul E. McKenney   rcu: Make rcu_bar...
2780

cf3a9c484   Paul E. McKenney   rcu: Increase rcu...
2781
2782
2783
2784
  	/* Increment ->n_barrier_done to prevent duplicate work. */
  	smp_mb(); /* Keep increment after above mechanism. */
  	ACCESS_ONCE(rsp->n_barrier_done)++;
  	WARN_ON_ONCE((rsp->n_barrier_done & 0x1) != 0);
a83eff0a8   Paul E. McKenney   rcu: Add tracing ...
2785
  	_rcu_barrier_trace(rsp, "Inc2", -1, rsp->n_barrier_done);
cf3a9c484   Paul E. McKenney   rcu: Increase rcu...
2786
  	smp_mb(); /* Keep increment before caller's subsequent code. */
b1420f1c8   Paul E. McKenney   rcu: Make rcu_bar...
2787
  	/* Wait for all rcu_barrier_callback() callbacks to be invoked. */
7db74df88   Paul E. McKenney   rcu: Move rcu_bar...
2788
  	wait_for_completion(&rsp->barrier_completion);
b1420f1c8   Paul E. McKenney   rcu: Make rcu_bar...
2789
2790
  
  	/* Other rcu_barrier() invocations can now safely proceed. */
7be7f0be9   Paul E. McKenney   rcu: Move rcu_bar...
2791
  	mutex_unlock(&rsp->barrier_mutex);
d0ec774cb   Paul E. McKenney   rcu: Move rcu_bar...
2792
  }
d0ec774cb   Paul E. McKenney   rcu: Move rcu_bar...
2793
2794
2795
2796
2797
2798
  
  /**
   * rcu_barrier_bh - Wait until all in-flight call_rcu_bh() callbacks complete.
   */
  void rcu_barrier_bh(void)
  {
037b64ed0   Paul E. McKenney   rcu: Place pointe...
2799
  	_rcu_barrier(&rcu_bh_state);
d0ec774cb   Paul E. McKenney   rcu: Move rcu_bar...
2800
2801
2802
2803
2804
2805
2806
2807
  }
  EXPORT_SYMBOL_GPL(rcu_barrier_bh);
  
  /**
   * rcu_barrier_sched - Wait for in-flight call_rcu_sched() callbacks.
   */
  void rcu_barrier_sched(void)
  {
037b64ed0   Paul E. McKenney   rcu: Place pointe...
2808
  	_rcu_barrier(&rcu_sched_state);
d0ec774cb   Paul E. McKenney   rcu: Move rcu_bar...
2809
2810
  }
  EXPORT_SYMBOL_GPL(rcu_barrier_sched);
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2811
  /*
27569620c   Paul E. McKenney   rcu: Split hierar...
2812
   * Do boot-time initialization of a CPU's per-CPU RCU data.
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2813
   */
27569620c   Paul E. McKenney   rcu: Split hierar...
2814
2815
  static void __init
  rcu_boot_init_percpu_data(int cpu, struct rcu_state *rsp)
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2816
2817
  {
  	unsigned long flags;
394f99a90   Lai Jiangshan   rcu: simplify the...
2818
  	struct rcu_data *rdp = per_cpu_ptr(rsp->rda, cpu);
27569620c   Paul E. McKenney   rcu: Split hierar...
2819
2820
2821
  	struct rcu_node *rnp = rcu_get_root(rsp);
  
  	/* Set up local state, ensuring consistent view of global state. */
1304afb22   Paul E. McKenney   rcu: Convert to r...
2822
  	raw_spin_lock_irqsave(&rnp->lock, flags);
27569620c   Paul E. McKenney   rcu: Split hierar...
2823
  	rdp->grpmask = 1UL << (cpu - rdp->mynode->grplo);
3f5d3ea64   Paul E. McKenney   rcu: Consolidate ...
2824
  	init_callback_list(rdp);
486e25934   Paul E. McKenney   rcu: Avoid waking...
2825
  	rdp->qlen_lazy = 0;
1d1fb395f   Paul E. McKenney   rcu: Add ACCESS_O...
2826
  	ACCESS_ONCE(rdp->qlen) = 0;
27569620c   Paul E. McKenney   rcu: Split hierar...
2827
  	rdp->dynticks = &per_cpu(rcu_dynticks, cpu);
29e37d814   Paul E. McKenney   rcu: Allow nestin...
2828
  	WARN_ON_ONCE(rdp->dynticks->dynticks_nesting != DYNTICK_TASK_EXIT_IDLE);
9b2e4f188   Paul E. McKenney   rcu: Track idlene...
2829
  	WARN_ON_ONCE(atomic_read(&rdp->dynticks->dynticks) != 1);
27569620c   Paul E. McKenney   rcu: Split hierar...
2830
  	rdp->cpu = cpu;
d4c08f2ac   Paul E. McKenney   rcu: Add grace-pe...
2831
  	rdp->rsp = rsp;
3fbfbf7a3   Paul E. McKenney   rcu: Add callback...
2832
  	rcu_boot_init_nocb_percpu_data(rdp);
1304afb22   Paul E. McKenney   rcu: Convert to r...
2833
  	raw_spin_unlock_irqrestore(&rnp->lock, flags);
27569620c   Paul E. McKenney   rcu: Split hierar...
2834
2835
2836
2837
2838
2839
2840
  }
  
  /*
   * Initialize a CPU's per-CPU RCU data.  Note that only one online or
   * offline event can be happening at a given time.  Note also that we
   * can accept some slop in the rsp->completed access due to the fact
   * that this CPU cannot possibly have any RCU callbacks in flight yet.
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2841
   */
49fb4c629   Paul Gortmaker   rcu: delete __cpu...
2842
  static void
6cc68793e   Paul E. McKenney   rcu: fix spelling
2843
  rcu_init_percpu_data(int cpu, struct rcu_state *rsp, int preemptible)
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2844
2845
  {
  	unsigned long flags;
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2846
  	unsigned long mask;
394f99a90   Lai Jiangshan   rcu: simplify the...
2847
  	struct rcu_data *rdp = per_cpu_ptr(rsp->rda, cpu);
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2848
  	struct rcu_node *rnp = rcu_get_root(rsp);
a4fbe35a1   Paul E. McKenney   rcu: Grace-period...
2849
2850
  	/* Exclude new grace periods. */
  	mutex_lock(&rsp->onoff_mutex);
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2851
  	/* Set up local state, ensuring consistent view of global state. */
1304afb22   Paul E. McKenney   rcu: Convert to r...
2852
  	raw_spin_lock_irqsave(&rnp->lock, flags);
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2853
  	rdp->beenonline = 1;	 /* We have now been online. */
6cc68793e   Paul E. McKenney   rcu: fix spelling
2854
  	rdp->preemptible = preemptible;
37c72e56f   Paul E. McKenney   rcu: Prevent RCU ...
2855
2856
  	rdp->qlen_last_fqs_check = 0;
  	rdp->n_force_qs_snap = rsp->n_force_qs;
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2857
  	rdp->blimit = blimit;
0d8ee37e2   Paul E. McKenney   rcu: Disallow cal...
2858
  	init_callback_list(rdp);  /* Re-enable callbacks on this CPU. */
29e37d814   Paul E. McKenney   rcu: Allow nestin...
2859
  	rdp->dynticks->dynticks_nesting = DYNTICK_TASK_EXIT_IDLE;
c92b131bd   Paul E. McKenney   rcu: Remove dynti...
2860
2861
  	atomic_set(&rdp->dynticks->dynticks,
  		   (atomic_read(&rdp->dynticks->dynticks) & ~0x1) + 1);
1304afb22   Paul E. McKenney   rcu: Convert to r...
2862
  	raw_spin_unlock(&rnp->lock);		/* irqs remain disabled. */
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2863

64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2864
2865
2866
2867
2868
  	/* Add CPU to rcu_node bitmasks. */
  	rnp = rdp->mynode;
  	mask = rdp->grpmask;
  	do {
  		/* Exclude any attempts to start a new GP on small systems. */
1304afb22   Paul E. McKenney   rcu: Convert to r...
2869
  		raw_spin_lock(&rnp->lock);	/* irqs already disabled. */
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2870
2871
  		rnp->qsmaskinit |= mask;
  		mask = rnp->grpmask;
d09b62dfa   Paul E. McKenney   rcu: Fix synchron...
2872
  		if (rnp == rdp->mynode) {
06ae115a1   Paul E. McKenney   rcu: Avoid having...
2873
2874
2875
2876
2877
2878
  			/*
  			 * If there is a grace period in progress, we will
  			 * set up to wait for it next time we run the
  			 * RCU core code.
  			 */
  			rdp->gpnum = rnp->completed;
d09b62dfa   Paul E. McKenney   rcu: Fix synchron...
2879
  			rdp->completed = rnp->completed;
06ae115a1   Paul E. McKenney   rcu: Avoid having...
2880
2881
  			rdp->passed_quiesce = 0;
  			rdp->qs_pending = 0;
d4c08f2ac   Paul E. McKenney   rcu: Add grace-pe...
2882
  			trace_rcu_grace_period(rsp->name, rdp->gpnum, "cpuonl");
d09b62dfa   Paul E. McKenney   rcu: Fix synchron...
2883
  		}
1304afb22   Paul E. McKenney   rcu: Convert to r...
2884
  		raw_spin_unlock(&rnp->lock); /* irqs already disabled. */
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2885
2886
  		rnp = rnp->parent;
  	} while (rnp != NULL && !(rnp->qsmaskinit & mask));
a4fbe35a1   Paul E. McKenney   rcu: Grace-period...
2887
  	local_irq_restore(flags);
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2888

a4fbe35a1   Paul E. McKenney   rcu: Grace-period...
2889
  	mutex_unlock(&rsp->onoff_mutex);
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2890
  }
49fb4c629   Paul Gortmaker   rcu: delete __cpu...
2891
  static void rcu_prepare_cpu(int cpu)
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2892
  {
6ce75a232   Paul E. McKenney   rcu: Introduce fo...
2893
2894
2895
2896
2897
  	struct rcu_state *rsp;
  
  	for_each_rcu_flavor(rsp)
  		rcu_init_percpu_data(cpu, rsp,
  				     strcmp(rsp->name, "rcu_preempt") == 0);
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2898
2899
2900
  }
  
  /*
f41d911f8   Paul E. McKenney   rcu: Merge preemp...
2901
   * Handle CPU online/offline notification events.
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2902
   */
49fb4c629   Paul Gortmaker   rcu: delete __cpu...
2903
  static int rcu_cpu_notify(struct notifier_block *self,
9f680ab41   Paul E. McKenney   rcu: Eliminate un...
2904
  				    unsigned long action, void *hcpu)
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2905
2906
  {
  	long cpu = (long)hcpu;
27f4d2805   Paul E. McKenney   rcu: priority boo...
2907
  	struct rcu_data *rdp = per_cpu_ptr(rcu_state->rda, cpu);
a26ac2455   Paul E. McKenney   rcu: move TREE_RC...
2908
  	struct rcu_node *rnp = rdp->mynode;
6ce75a232   Paul E. McKenney   rcu: Introduce fo...
2909
  	struct rcu_state *rsp;
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2910

300df91ca   Paul E. McKenney   rcu: Event-trace ...
2911
  	trace_rcu_utilization("Start CPU hotplug");
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2912
2913
2914
  	switch (action) {
  	case CPU_UP_PREPARE:
  	case CPU_UP_PREPARE_FROZEN:
d72bce0e6   Peter Zijlstra   rcu: Cure load woes
2915
2916
  		rcu_prepare_cpu(cpu);
  		rcu_prepare_kthreads(cpu);
a26ac2455   Paul E. McKenney   rcu: move TREE_RC...
2917
2918
  		break;
  	case CPU_ONLINE:
0f962a5e7   Paul E. McKenney   rcu: Force per-rc...
2919
  	case CPU_DOWN_FAILED:
5d01bbd11   Thomas Gleixner   rcu: Yield simpler
2920
  		rcu_boost_kthread_setaffinity(rnp, -1);
0f962a5e7   Paul E. McKenney   rcu: Force per-rc...
2921
2922
  		break;
  	case CPU_DOWN_PREPARE:
34ed62461   Paul E. McKenney   rcu: Remove restr...
2923
  		rcu_boost_kthread_setaffinity(rnp, cpu);
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2924
  		break;
d0ec774cb   Paul E. McKenney   rcu: Move rcu_bar...
2925
2926
  	case CPU_DYING:
  	case CPU_DYING_FROZEN:
6ce75a232   Paul E. McKenney   rcu: Introduce fo...
2927
2928
  		for_each_rcu_flavor(rsp)
  			rcu_cleanup_dying_cpu(rsp);
d0ec774cb   Paul E. McKenney   rcu: Move rcu_bar...
2929
  		break;
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2930
2931
2932
2933
  	case CPU_DEAD:
  	case CPU_DEAD_FROZEN:
  	case CPU_UP_CANCELED:
  	case CPU_UP_CANCELED_FROZEN:
6ce75a232   Paul E. McKenney   rcu: Introduce fo...
2934
2935
  		for_each_rcu_flavor(rsp)
  			rcu_cleanup_dead_cpu(cpu, rsp);
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2936
2937
2938
2939
  		break;
  	default:
  		break;
  	}
300df91ca   Paul E. McKenney   rcu: Event-trace ...
2940
  	trace_rcu_utilization("End CPU hotplug");
34ed62461   Paul E. McKenney   rcu: Remove restr...
2941
  	return NOTIFY_OK;
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
2942
2943
2944
  }
  
  /*
   * Spawn one grace-period kthread per RCU flavor, named after the
   * flavor, and record it in ->gp_kthread under the root rcu_node's
   * lock.  Failure to create a kthread is fatal (BUG_ON).  The no-CBs
   * kthreads for the flavor are spawned right afterwards.
   *
   * Registered as an early_initcall; always returns 0.
   */
  static int __init rcu_spawn_gp_kthread(void)
  {
  	struct rcu_state *rsp;
  
  	for_each_rcu_flavor(rsp) {
  		struct rcu_node *root;
  		struct task_struct *gp_task;
  		unsigned long flags;
  
  		gp_task = kthread_run(rcu_gp_kthread, rsp, "%s", rsp->name);
  		BUG_ON(IS_ERR(gp_task));
  
  		root = rcu_get_root(rsp);
  		raw_spin_lock_irqsave(&root->lock, flags);
  		rsp->gp_kthread = gp_task;
  		raw_spin_unlock_irqrestore(&root->lock, flags);
  
  		rcu_spawn_nocb_kthreads(rsp);
  	}
  
  	return 0;
  }
  early_initcall(rcu_spawn_gp_kthread);
  
  /*
   * This function is invoked towards the end of the scheduler's
   * initialization process.  Before this is called, the idle task might
   * contain RCU read-side critical sections (during which time, this idle
   * task is booting the system).  After this function is called, the
   * idle tasks are prohibited from containing RCU read-side critical
   * sections.  This function also enables RCU lockdep checking.
   *
   * Warns if more than one CPU is online or if any context switch has
   * already taken place, then sets rcu_scheduler_active.
   */
  void rcu_scheduler_starting(void)
  {
  	/* Expected to run on the boot CPU before any context switch. */
  	WARN_ON(num_online_cpus() != 1);
  	WARN_ON(nr_context_switches() > 0);
  
  	rcu_scheduler_active = 1;
  }
  
  /*
   * Compute the per-level fanout, either using the exact fanout specified
   * or balancing the tree, depending on CONFIG_RCU_FANOUT_EXACT.
   *
   * ->levelspread[] is indexed the same way as ->level[] and ->levelcnt[]:
   * index 0 is the root of the rcu_node tree and index rcu_num_lvls - 1
   * is the leaf level, whose spread is the number of CPUs per leaf.
   */
  #ifdef CONFIG_RCU_FANOUT_EXACT
  static void __init rcu_init_levelspread(struct rcu_state *rsp)
  {
  	int i;
  
  	/*
  	 * The leaf fanout applies to the last (leaf) level, not to the
  	 * root; every level above the leaves uses CONFIG_RCU_FANOUT.
  	 * With a single-level tree the root is also the leaf level, so
  	 * it gets rcu_fanout_leaf.
  	 */
  	rsp->levelspread[rcu_num_lvls - 1] = rcu_fanout_leaf;
  	for (i = rcu_num_lvls - 2; i >= 0; i--)
  		rsp->levelspread[i] = CONFIG_RCU_FANOUT;
  }
  #else /* #ifdef CONFIG_RCU_FANOUT_EXACT */
  static void __init rcu_init_levelspread(struct rcu_state *rsp)
  {
  	int ccur;	/* Number of rcu_node structures at this level. */
  	int cprv;	/* Number of entities at the level below. */
  	int i;
  
  	/*
  	 * Walk from the leaves to the root, spreading the entities of
  	 * the level below (CPUs for the leaf level) evenly over this
  	 * level's nodes, rounding up.
  	 */
  	cprv = nr_cpu_ids;
  	for (i = rcu_num_lvls - 1; i >= 0; i--) {
  		ccur = rsp->levelcnt[i];
  		rsp->levelspread[i] = DIV_ROUND_UP(cprv, ccur);
  		cprv = ccur;
  	}
  }
  #endif /* #else #ifdef CONFIG_RCU_FANOUT_EXACT */
  
  /*
   * Helper function for rcu_init() that initializes one rcu_state structure.
   */
394f99a90   Lai Jiangshan   rcu: simplify the...
3012
3013
  static void __init rcu_init_one(struct rcu_state *rsp,
  		struct rcu_data __percpu *rda)
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
3014
  {
394f2769a   Paul E. McKenney   rcu: Prevent forc...
3015
3016
3017
3018
3019
3020
3021
3022
  	static char *buf[] = { "rcu_node_0",
  			       "rcu_node_1",
  			       "rcu_node_2",
  			       "rcu_node_3" };  /* Match MAX_RCU_LVLS */
  	static char *fqs[] = { "rcu_node_fqs_0",
  			       "rcu_node_fqs_1",
  			       "rcu_node_fqs_2",
  			       "rcu_node_fqs_3" };  /* Match MAX_RCU_LVLS */
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
3023
3024
3025
3026
  	int cpustride = 1;
  	int i;
  	int j;
  	struct rcu_node *rnp;
b6407e863   Paul E. McKenney   rcu: Give differe...
3027
  	BUILD_BUG_ON(MAX_RCU_LVLS > ARRAY_SIZE(buf));  /* Fix buf[] init! */
4930521ae   Paul E. McKenney   rcu: Silence comp...
3028
3029
3030
  	/* Silence gcc 4.8 warning about array index out of range. */
  	if (rcu_num_lvls > RCU_NUM_LVLS)
  		panic("rcu_init_one: rcu_num_lvls overflow");
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
3031
  	/* Initialize the level-tracking arrays. */
f885b7f2b   Paul E. McKenney   rcu: Control RCU_...
3032
3033
3034
  	for (i = 0; i < rcu_num_lvls; i++)
  		rsp->levelcnt[i] = num_rcu_lvl[i];
  	for (i = 1; i < rcu_num_lvls; i++)
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
3035
3036
3037
3038
  		rsp->level[i] = rsp->level[i - 1] + rsp->levelcnt[i - 1];
  	rcu_init_levelspread(rsp);
  
  	/* Initialize the elements themselves, starting from the leaves. */
f885b7f2b   Paul E. McKenney   rcu: Control RCU_...
3039
  	for (i = rcu_num_lvls - 1; i >= 0; i--) {
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
3040
3041
3042
  		cpustride *= rsp->levelspread[i];
  		rnp = rsp->level[i];
  		for (j = 0; j < rsp->levelcnt[i]; j++, rnp++) {
1304afb22   Paul E. McKenney   rcu: Convert to r...
3043
  			raw_spin_lock_init(&rnp->lock);
b6407e863   Paul E. McKenney   rcu: Give differe...
3044
3045
  			lockdep_set_class_and_name(&rnp->lock,
  						   &rcu_node_class[i], buf[i]);
394f2769a   Paul E. McKenney   rcu: Prevent forc...
3046
3047
3048
  			raw_spin_lock_init(&rnp->fqslock);
  			lockdep_set_class_and_name(&rnp->fqslock,
  						   &rcu_fqs_class[i], fqs[i]);
25d30cf42   Paul E. McKenney   rcu: Adjust for u...
3049
3050
  			rnp->gpnum = rsp->gpnum;
  			rnp->completed = rsp->completed;
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
3051
3052
3053
3054
3055
3056
3057
3058
3059
3060
3061
3062
3063
3064
3065
3066
3067
  			rnp->qsmask = 0;
  			rnp->qsmaskinit = 0;
  			rnp->grplo = j * cpustride;
  			rnp->grphi = (j + 1) * cpustride - 1;
  			if (rnp->grphi >= NR_CPUS)
  				rnp->grphi = NR_CPUS - 1;
  			if (i == 0) {
  				rnp->grpnum = 0;
  				rnp->grpmask = 0;
  				rnp->parent = NULL;
  			} else {
  				rnp->grpnum = j % rsp->levelspread[i - 1];
  				rnp->grpmask = 1UL << rnp->grpnum;
  				rnp->parent = rsp->level[i - 1] +
  					      j / rsp->levelspread[i - 1];
  			}
  			rnp->level = i;
12f5f524c   Paul E. McKenney   rcu: merge TREE_P...
3068
  			INIT_LIST_HEAD(&rnp->blkd_tasks);
dae6e64d2   Paul E. McKenney   rcu: Introduce pr...
3069
  			rcu_init_one_nocb(rnp);
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
3070
3071
  		}
  	}
0c34029ab   Lai Jiangshan   rcu: move some co...
3072

394f99a90   Lai Jiangshan   rcu: simplify the...
3073
  	rsp->rda = rda;
b3dbec76e   Paul E. McKenney   rcu: Move RCU gra...
3074
  	init_waitqueue_head(&rsp->gp_wq);
016a8d5be   Steven Rostedt   rcu: Don't call w...
3075
  	init_irq_work(&rsp->wakeup_work, rsp_wakeup);
f885b7f2b   Paul E. McKenney   rcu: Control RCU_...
3076
  	rnp = rsp->level[rcu_num_lvls - 1];
0c34029ab   Lai Jiangshan   rcu: move some co...
3077
  	for_each_possible_cpu(i) {
4a90a0681   Paul E. McKenney   rcu: permit disco...
3078
  		while (i > rnp->grphi)
0c34029ab   Lai Jiangshan   rcu: move some co...
3079
  			rnp++;
394f99a90   Lai Jiangshan   rcu: simplify the...
3080
  		per_cpu_ptr(rsp->rda, i)->mynode = rnp;
0c34029ab   Lai Jiangshan   rcu: move some co...
3081
3082
  		rcu_boot_init_percpu_data(i, rsp);
  	}
6ce75a232   Paul E. McKenney   rcu: Introduce fo...
3083
  	list_add(&rsp->flavors, &rcu_struct_flavors);
64db4cfff   Paul E. McKenney   "Tree RCU": scala...
3084
  }
f885b7f2b   Paul E. McKenney   rcu: Control RCU_...
3085
3086
3087
3088
3089
3090
3091
  /*
   * Compute the rcu_node tree geometry from kernel parameters.  This cannot
   * replace the definitions in rcutree.h because those are needed to size
   * the ->node array in the rcu_state structure.
   *
   * Also fills in any force-quiescent-state delays that were left at
   * ULONG_MAX.  On return, rcu_num_lvls, num_rcu_lvl[] and rcu_num_nodes
   * describe the tree, unless the compile-time values were kept.
   */
  static void __init rcu_init_geometry(void)
  {
  	ulong fqs_delay;
  	int lvl;
  	int j;
  	int ncpus = nr_cpu_ids;
  	int capacity[MAX_RCU_LVLS + 1];
  
  	/*
  	 * Initialize any unspecified boot parameters.
  	 * The default values of jiffies_till_first_fqs and
  	 * jiffies_till_next_fqs are set to the RCU_JIFFIES_TILL_FORCE_QS
  	 * value, which is a function of HZ, then adding one for each
  	 * RCU_JIFFIES_FQS_DIV CPUs that might be on the system.
  	 */
  	fqs_delay = RCU_JIFFIES_TILL_FORCE_QS +
  		    nr_cpu_ids / RCU_JIFFIES_FQS_DIV;
  	if (jiffies_till_first_fqs == ULONG_MAX)
  		jiffies_till_first_fqs = fqs_delay;
  	if (jiffies_till_next_fqs == ULONG_MAX)
  		jiffies_till_next_fqs = fqs_delay;
  
  	/* If the compile-time values are accurate, just leave. */
  	if (rcu_fanout_leaf == CONFIG_RCU_FANOUT_LEAF &&
  	    nr_cpu_ids == NR_CPUS)
  		return;
  
  	/*
  	 * Compute the number of CPUs that can be handled by an rcu_node
  	 * tree with the given number of levels.  Setting capacity[0]
  	 * makes some of the arithmetic below easier.
  	 */
  	capacity[0] = 1;
  	capacity[1] = rcu_fanout_leaf;
  	for (lvl = 2; lvl <= MAX_RCU_LVLS; lvl++)
  		capacity[lvl] = capacity[lvl - 1] * CONFIG_RCU_FANOUT;
  
  	/*
  	 * The boot-time rcu_fanout_leaf parameter is only permitted
  	 * to increase the leaf-level fanout, not decrease it.  Of course,
  	 * the leaf-level fanout cannot exceed the number of bits in
  	 * the rcu_node masks.  Finally, the tree must be able to accommodate
  	 * the configured number of CPUs.  Complain and fall back to the
  	 * compile-time values if these limits are exceeded.
  	 */
  	if (rcu_fanout_leaf < CONFIG_RCU_FANOUT_LEAF ||
  	    rcu_fanout_leaf > sizeof(unsigned long) * 8 ||
  	    ncpus > capacity[MAX_RCU_LVLS]) {
  		WARN_ON(1);
  		return;
  	}
  
  	/*
  	 * Calculate the number of rcu_nodes at each level of the tree,
  	 * using the shallowest tree that can hold all the CPUs.
  	 */
  	for (lvl = 1; lvl <= MAX_RCU_LVLS; lvl++) {
  		if (ncpus > capacity[lvl])
  			continue;	/* Too shallow, try one more level. */
  
  		/* Entry j == lvl divides by capacity[0], giving ncpus. */
  		for (j = 0; j <= lvl; j++)
  			num_rcu_lvl[j] = DIV_ROUND_UP(ncpus, capacity[lvl - j]);
  		rcu_num_lvls = lvl;
  
  		/* Unused deeper levels have no nodes. */
  		for (j = lvl + 1; j <= MAX_RCU_LVLS; j++)
  			num_rcu_lvl[j] = 0;
  		break;
  	}
  
  	/*
  	 * Calculate the total number of rcu_node structures.  The sum
  	 * includes the per-CPU entry filled in above, which is not an
  	 * rcu_node level, so subtract the CPU count again.
  	 */
  	rcu_num_nodes = 0;
  	for (lvl = 0; lvl <= MAX_RCU_LVLS; lvl++)
  		rcu_num_nodes += num_rcu_lvl[lvl];
  	rcu_num_nodes -= ncpus;
  }
9f680ab41   Paul E. McKenney   rcu: Eliminate un...
3157
  /*
   * Boot-time RCU initialization: announce the configuration, compute
   * the rcu_node tree geometry, initialize each RCU flavor, register
   * the RCU softirq handler and the CPU-hotplug notifier, and then
   * run the CPU_UP_PREPARE handling for every CPU already online.
   */
  void __init rcu_init(void)
  {
  	int cpu;
  
  	rcu_bootup_announce();
  	rcu_init_geometry();
  
  	rcu_init_one(&rcu_sched_state, &rcu_sched_data);
  	rcu_init_one(&rcu_bh_state, &rcu_bh_data);
  	__rcu_init_preempt();
  
  	open_softirq(RCU_SOFTIRQ, rcu_process_callbacks);
  
  	/*
  	 * We don't need protection against CPU-hotplug here because
  	 * this is called early in boot, before either interrupts
  	 * or the scheduler are operational.
  	 */
  	cpu_notifier(rcu_cpu_notify, 0);
  	for_each_online_cpu(cpu) {
  		void *hcpu = (void *)(long)cpu;
  
  		rcu_cpu_notify(NULL, CPU_UP_PREPARE, hcpu);
  	}
  }
1eba8f843   Paul E. McKenney   rcu: Clean up cod...
3177
  #include "rcutree_plugin.h"