rcu: Fix grace-period-stall bug on large systems with CPU hotplug
[linux-2.6-block.git] / kernel / rcutiny.c
CommitLineData
9b1d82fa
PM
1/*
2 * Read-Copy Update mechanism for mutual exclusion, the Bloatwatch edition.
3 *
4 * This program is free software; you can redistribute it and/or modify
5 * it under the terms of the GNU General Public License as published by
6 * the Free Software Foundation; either version 2 of the License, or
7 * (at your option) any later version.
8 *
9 * This program is distributed in the hope that it will be useful,
10 * but WITHOUT ANY WARRANTY; without even the implied warranty of
11 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12 * GNU General Public License for more details.
13 *
14 * You should have received a copy of the GNU General Public License
15 * along with this program; if not, write to the Free Software
16 * Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
17 *
18 * Copyright IBM Corporation, 2008
19 *
20 * Author: Paul E. McKenney <paulmck@linux.vnet.ibm.com>
21 *
22 * For detailed explanation of Read-Copy Update mechanism see -
4ce5b903 23 * Documentation/RCU
9b1d82fa 24 */
9b1d82fa 25#include <linux/moduleparam.h>
4ce5b903
IM
26#include <linux/completion.h>
27#include <linux/interrupt.h>
9b1d82fa 28#include <linux/notifier.h>
4ce5b903
IM
29#include <linux/rcupdate.h>
30#include <linux/kernel.h>
31#include <linux/module.h>
9b1d82fa 32#include <linux/mutex.h>
4ce5b903
IM
33#include <linux/sched.h>
34#include <linux/types.h>
35#include <linux/init.h>
9b1d82fa 36#include <linux/time.h>
4ce5b903 37#include <linux/cpu.h>
9b1d82fa
PM
38
/*
 * Per-flavor bookkeeping for queued RCU callbacks.  All callbacks live
 * on one singly linked list; the two tail pointers split it into the
 * "done" prefix (ready to invoke) and the remainder still waiting.
 */
struct rcu_ctrlblk {
	struct rcu_head *rcucblist;	/* Head of the pending-callback list. */
	struct rcu_head **donetail;	/* ->next slot of the last "done" callback. */
	struct rcu_head **curtail;	/* ->next slot of the last queued callback. */
};
45
46/* Definition for rcupdate control block. */
47static struct rcu_ctrlblk rcu_ctrlblk = {
4ce5b903
IM
48 .donetail = &rcu_ctrlblk.rcucblist,
49 .curtail = &rcu_ctrlblk.rcucblist,
9b1d82fa 50};
4ce5b903 51
9b1d82fa 52static struct rcu_ctrlblk rcu_bh_ctrlblk = {
4ce5b903
IM
53 .donetail = &rcu_bh_ctrlblk.rcucblist,
54 .curtail = &rcu_bh_ctrlblk.rcucblist,
9b1d82fa
PM
55};
56
57#ifdef CONFIG_NO_HZ
58
/*
 * Nesting count maintained by rcu_enter_nohz() (decrement) and
 * rcu_exit_nohz() (increment).  Starts at 1.
 */
static long rcu_dynticks_nesting = 1;
60
61/*
62 * Enter dynticks-idle mode, which is an extended quiescent state
63 * if we have fully entered that mode (i.e., if the new value of
64 * dynticks_nesting is zero).
65 */
66void rcu_enter_nohz(void)
67{
68 if (--rcu_dynticks_nesting == 0)
69 rcu_sched_qs(0); /* implies rcu_bh_qsctr_inc(0) */
70}
71
72/*
73 * Exit dynticks-idle mode, so that we are no longer in an extended
74 * quiescent state.
75 */
76void rcu_exit_nohz(void)
77{
78 rcu_dynticks_nesting++;
79}
80
81#endif /* #ifdef CONFIG_NO_HZ */
82
83/*
84 * Helper function for rcu_qsctr_inc() and rcu_bh_qsctr_inc().
4ce5b903
IM
85 * Also disable irqs to avoid confusion due to interrupt handlers
86 * invoking call_rcu().
9b1d82fa
PM
87 */
88static int rcu_qsctr_help(struct rcu_ctrlblk *rcp)
89{
90 unsigned long flags;
91
92 local_irq_save(flags);
93 if (rcp->rcucblist != NULL &&
94 rcp->donetail != rcp->curtail) {
95 rcp->donetail = rcp->curtail;
96 local_irq_restore(flags);
97 return 1;
98 }
99 local_irq_restore(flags);
4ce5b903 100
9b1d82fa
PM
101 return 0;
102}
103
104/*
105 * Record an rcu quiescent state. And an rcu_bh quiescent state while we
106 * are at it, given that any rcu quiescent state is also an rcu_bh
107 * quiescent state. Use "+" instead of "||" to defeat short circuiting.
108 */
109void rcu_sched_qs(int cpu)
110{
111 if (rcu_qsctr_help(&rcu_ctrlblk) + rcu_qsctr_help(&rcu_bh_ctrlblk))
112 raise_softirq(RCU_SOFTIRQ);
113}
114
115/*
116 * Record an rcu_bh quiescent state.
117 */
118void rcu_bh_qs(int cpu)
119{
120 if (rcu_qsctr_help(&rcu_bh_ctrlblk))
121 raise_softirq(RCU_SOFTIRQ);
122}
123
124/*
125 * Check to see if the scheduling-clock interrupt came from an extended
126 * quiescent state, and, if so, tell RCU about it.
127 */
128void rcu_check_callbacks(int cpu, int user)
129{
130 if (user ||
131 (idle_cpu(cpu) &&
132 !in_softirq() &&
133 hardirq_count() <= (1 << HARDIRQ_SHIFT)))
134 rcu_sched_qs(cpu);
135 else if (!in_softirq())
136 rcu_bh_qs(cpu);
137}
138
139/*
140 * Helper function for rcu_process_callbacks() that operates on the
141 * specified rcu_ctrlkblk structure.
142 */
143static void __rcu_process_callbacks(struct rcu_ctrlblk *rcp)
144{
9b1d82fa 145 struct rcu_head *next, *list;
4ce5b903 146 unsigned long flags;
9b1d82fa
PM
147
148 /* If no RCU callbacks ready to invoke, just return. */
149 if (&rcp->rcucblist == rcp->donetail)
150 return;
151
152 /* Move the ready-to-invoke callbacks to a local list. */
153 local_irq_save(flags);
154 list = rcp->rcucblist;
155 rcp->rcucblist = *rcp->donetail;
156 *rcp->donetail = NULL;
157 if (rcp->curtail == rcp->donetail)
158 rcp->curtail = &rcp->rcucblist;
159 rcp->donetail = &rcp->rcucblist;
160 local_irq_restore(flags);
161
162 /* Invoke the callbacks on the local list. */
163 while (list) {
164 next = list->next;
165 prefetch(next);
166 list->func(list);
167 list = next;
168 }
169}
170
171/*
172 * Invoke any callbacks whose grace period has completed.
173 */
174static void rcu_process_callbacks(struct softirq_action *unused)
175{
176 __rcu_process_callbacks(&rcu_ctrlblk);
177 __rcu_process_callbacks(&rcu_bh_ctrlblk);
178}
179
180/*
181 * Null function to handle CPU being onlined. Longer term, we want to
182 * make TINY_RCU avoid using rcupdate.c, but later...
183 */
4ce5b903 184int rcu_cpu_notify(struct notifier_block *self, unsigned long action, void *hcpu)
9b1d82fa
PM
185{
186 return NOTIFY_OK;
187}
188
/*
 * Wait for a grace period to elapse.
 *
 * It is illegal to invoke synchronize_sched() from within an RCU
 * read-side critical section, so any legal call to it is itself a
 * quiescent state.  On a UP system there is therefore nothing to wait
 * for.  The same reasoning covers synchronize_rcu_bh().  (Lai Jiangshan
 * points out the benefits of doing might_sleep() to reduce latency.)
 *
 * Cool, huh?  (Due to Josh Triplett.)
 *
 * But we want to make this a static inline later.
 */
void synchronize_sched(void)
{
	cond_resched();
}
EXPORT_SYMBOL_GPL(synchronize_sched);
206
/*
 * Wait for an rcu_bh grace period; simply defers to synchronize_sched().
 */
void synchronize_rcu_bh(void)
{
	synchronize_sched();
}
EXPORT_SYMBOL_GPL(synchronize_rcu_bh);
212
213/*
214 * Helper function for call_rcu() and call_rcu_bh().
215 */
216static void __call_rcu(struct rcu_head *head,
217 void (*func)(struct rcu_head *rcu),
218 struct rcu_ctrlblk *rcp)
219{
220 unsigned long flags;
221
222 head->func = func;
223 head->next = NULL;
4ce5b903 224
9b1d82fa
PM
225 local_irq_save(flags);
226 *rcp->curtail = head;
227 rcp->curtail = &head->next;
228 local_irq_restore(flags);
229}
230
231/*
232 * Post an RCU callback to be invoked after the end of an RCU grace
233 * period. But since we have but one CPU, that would be after any
234 * quiescent state.
235 */
4ce5b903 236void call_rcu(struct rcu_head *head, void (*func)(struct rcu_head *rcu))
9b1d82fa
PM
237{
238 __call_rcu(head, func, &rcu_ctrlblk);
239}
240EXPORT_SYMBOL_GPL(call_rcu);
241
242/*
243 * Post an RCU bottom-half callback to be invoked after any subsequent
244 * quiescent state.
245 */
4ce5b903 246void call_rcu_bh(struct rcu_head *head, void (*func)(struct rcu_head *rcu))
9b1d82fa
PM
247{
248 __call_rcu(head, func, &rcu_bh_ctrlblk);
249}
250EXPORT_SYMBOL_GPL(call_rcu_bh);
251
252void rcu_barrier(void)
253{
254 struct rcu_synchronize rcu;
255
256 init_completion(&rcu.completion);
257 /* Will wake me after RCU finished. */
258 call_rcu(&rcu.head, wakeme_after_rcu);
259 /* Wait for it. */
260 wait_for_completion(&rcu.completion);
261}
262EXPORT_SYMBOL_GPL(rcu_barrier);
263
264void rcu_barrier_bh(void)
265{
266 struct rcu_synchronize rcu;
267
268 init_completion(&rcu.completion);
269 /* Will wake me after RCU finished. */
270 call_rcu_bh(&rcu.head, wakeme_after_rcu);
271 /* Wait for it. */
272 wait_for_completion(&rcu.completion);
273}
274EXPORT_SYMBOL_GPL(rcu_barrier_bh);
275
276void rcu_barrier_sched(void)
277{
278 struct rcu_synchronize rcu;
279
280 init_completion(&rcu.completion);
281 /* Will wake me after RCU finished. */
282 call_rcu_sched(&rcu.head, wakeme_after_rcu);
283 /* Wait for it. */
284 wait_for_completion(&rcu.completion);
285}
286EXPORT_SYMBOL_GPL(rcu_barrier_sched);
287
288void __rcu_init(void)
289{
290 open_softirq(RCU_SOFTIRQ, rcu_process_callbacks);
291}