cpu-hotplug: convert cpu_hotplug_disabled to a counter
[linux-2.6-block.git] / kernel / cpu.c
CommitLineData
1da177e4
LT
1/* CPU control.
2 * (C) 2001, 2002, 2003, 2004 Rusty Russell
3 *
4 * This code is licenced under the GPL.
5 */
6#include <linux/proc_fs.h>
7#include <linux/smp.h>
8#include <linux/init.h>
9#include <linux/notifier.h>
10#include <linux/sched.h>
11#include <linux/unistd.h>
12#include <linux/cpu.h>
cb79295e
AV
13#include <linux/oom.h>
14#include <linux/rcupdate.h>
9984de1a 15#include <linux/export.h>
e4cc2f87 16#include <linux/bug.h>
1da177e4
LT
17#include <linux/kthread.h>
18#include <linux/stop_machine.h>
81615b62 19#include <linux/mutex.h>
5a0e3ad6 20#include <linux/gfp.h>
79cfbdfa 21#include <linux/suspend.h>
a19423b9 22#include <linux/lockdep.h>
345527b1 23#include <linux/tick.h>
a8994181 24#include <linux/irq.h>
bb3632c6 25#include <trace/events/power.h>
1da177e4 26
38498a67
TG
27#include "smpboot.h"
28
98a79d6a 29#ifdef CONFIG_SMP
/*
 * cpu_add_remove_lock - serializes the updates to cpu_online_mask and
 * cpu_present_mask. Taken by cpu_maps_update_begin() and dropped by
 * cpu_maps_update_done().
 */
static DEFINE_MUTEX(cpu_add_remove_lock);
1da177e4 32
79a6cdeb 33/*
93ae4f97
SB
34 * The following two APIs (cpu_maps_update_begin/done) must be used when
35 * attempting to serialize the updates to cpu_online_mask & cpu_present_mask.
36 * The APIs cpu_notifier_register_begin/done() must be used to protect CPU
37 * hotplug callback (un)registration performed using __register_cpu_notifier()
38 * or __unregister_cpu_notifier().
79a6cdeb
LJ
39 */
40void cpu_maps_update_begin(void)
41{
42 mutex_lock(&cpu_add_remove_lock);
43}
93ae4f97 44EXPORT_SYMBOL(cpu_notifier_register_begin);
79a6cdeb
LJ
45
46void cpu_maps_update_done(void)
47{
48 mutex_unlock(&cpu_add_remove_lock);
49}
93ae4f97 50EXPORT_SYMBOL(cpu_notifier_register_done);
79a6cdeb 51
/*
 * Raw notifier chain that __cpu_notify() walks. Notifier blocks are added
 * and removed by the (__)register_cpu_notifier() and
 * (__)unregister_cpu_notifier() helpers in this file.
 */
static RAW_NOTIFIER_HEAD(cpu_chain);
1da177e4 53
e3920fb4
RW
/*
 * Counter of outstanding "disable CPU hotplug" requests. While it is
 * non-zero, cpu_up() and cpu_down() return -EBUSY and do nothing.
 * Should always be manipulated under cpu_add_remove_lock.
 */
static int cpu_hotplug_disabled;
58
79a6cdeb
LJ
59#ifdef CONFIG_HOTPLUG_CPU
60
d221938c
GS
61static struct {
62 struct task_struct *active_writer;
87af9e7f
DH
63 /* wait queue to wake up the active_writer */
64 wait_queue_head_t wq;
65 /* verifies that no writer will get active while readers are active */
66 struct mutex lock;
d221938c
GS
67 /*
68 * Also blocks the new readers during
69 * an ongoing cpu hotplug operation.
70 */
87af9e7f 71 atomic_t refcount;
a19423b9
GS
72
73#ifdef CONFIG_DEBUG_LOCK_ALLOC
74 struct lockdep_map dep_map;
75#endif
31950eb6
LT
76} cpu_hotplug = {
77 .active_writer = NULL,
87af9e7f 78 .wq = __WAIT_QUEUE_HEAD_INITIALIZER(cpu_hotplug.wq),
31950eb6 79 .lock = __MUTEX_INITIALIZER(cpu_hotplug.lock),
a19423b9
GS
80#ifdef CONFIG_DEBUG_LOCK_ALLOC
81 .dep_map = {.name = "cpu_hotplug.lock" },
82#endif
31950eb6 83};
d221938c 84
a19423b9
GS
/*
 * Lockdep annotations for the reader side (get/try_get/put_online_cpus())
 * and the writer side (cpu_hotplug_begin()/cpu_hotplug_done()). They all
 * operate on cpu_hotplug.dep_map.
 */
#define cpuhp_lock_acquire_read() lock_map_acquire_read(&cpu_hotplug.dep_map)
#define cpuhp_lock_acquire_tryread() \
				  lock_map_acquire_tryread(&cpu_hotplug.dep_map)
#define cpuhp_lock_acquire()      lock_map_acquire(&cpu_hotplug.dep_map)
#define cpuhp_lock_release()      lock_map_release(&cpu_hotplug.dep_map)
91
62db99f4 92
86ef5c9a 93void get_online_cpus(void)
a9d9baa1 94{
d221938c
GS
95 might_sleep();
96 if (cpu_hotplug.active_writer == current)
aa953877 97 return;
a19423b9 98 cpuhp_lock_acquire_read();
d221938c 99 mutex_lock(&cpu_hotplug.lock);
87af9e7f 100 atomic_inc(&cpu_hotplug.refcount);
d221938c 101 mutex_unlock(&cpu_hotplug.lock);
a9d9baa1 102}
86ef5c9a 103EXPORT_SYMBOL_GPL(get_online_cpus);
90d45d17 104
dd56af42
PM
105bool try_get_online_cpus(void)
106{
107 if (cpu_hotplug.active_writer == current)
108 return true;
109 if (!mutex_trylock(&cpu_hotplug.lock))
110 return false;
111 cpuhp_lock_acquire_tryread();
87af9e7f 112 atomic_inc(&cpu_hotplug.refcount);
dd56af42
PM
113 mutex_unlock(&cpu_hotplug.lock);
114 return true;
115}
116EXPORT_SYMBOL_GPL(try_get_online_cpus);
117
86ef5c9a 118void put_online_cpus(void)
a9d9baa1 119{
87af9e7f
DH
120 int refcount;
121
d221938c 122 if (cpu_hotplug.active_writer == current)
aa953877 123 return;
075663d1 124
87af9e7f
DH
125 refcount = atomic_dec_return(&cpu_hotplug.refcount);
126 if (WARN_ON(refcount < 0)) /* try to fix things up */
127 atomic_inc(&cpu_hotplug.refcount);
128
129 if (refcount <= 0 && waitqueue_active(&cpu_hotplug.wq))
130 wake_up(&cpu_hotplug.wq);
075663d1 131
a19423b9 132 cpuhp_lock_release();
d221938c 133
a9d9baa1 134}
86ef5c9a 135EXPORT_SYMBOL_GPL(put_online_cpus);
a9d9baa1 136
d221938c
GS
137/*
138 * This ensures that the hotplug operation can begin only when the
139 * refcount goes to zero.
140 *
141 * Note that during a cpu-hotplug operation, the new readers, if any,
142 * will be blocked by the cpu_hotplug.lock
143 *
d2ba7e2a
ON
144 * Since cpu_hotplug_begin() is always called after invoking
145 * cpu_maps_update_begin(), we can be sure that only one writer is active.
d221938c
GS
146 *
147 * Note that theoretically, there is a possibility of a livelock:
148 * - Refcount goes to zero, last reader wakes up the sleeping
149 * writer.
150 * - Last reader unlocks the cpu_hotplug.lock.
151 * - A new reader arrives at this moment, bumps up the refcount.
152 * - The writer acquires the cpu_hotplug.lock finds the refcount
153 * non zero and goes to sleep again.
154 *
155 * However, this is very difficult to achieve in practice since
86ef5c9a 156 * get_online_cpus() not an api which is called all that often.
d221938c
GS
157 *
158 */
b9d10be7 159void cpu_hotplug_begin(void)
d221938c 160{
87af9e7f 161 DEFINE_WAIT(wait);
d2ba7e2a 162
87af9e7f 163 cpu_hotplug.active_writer = current;
a19423b9 164 cpuhp_lock_acquire();
87af9e7f 165
d2ba7e2a
ON
166 for (;;) {
167 mutex_lock(&cpu_hotplug.lock);
87af9e7f
DH
168 prepare_to_wait(&cpu_hotplug.wq, &wait, TASK_UNINTERRUPTIBLE);
169 if (likely(!atomic_read(&cpu_hotplug.refcount)))
170 break;
d221938c
GS
171 mutex_unlock(&cpu_hotplug.lock);
172 schedule();
d221938c 173 }
87af9e7f 174 finish_wait(&cpu_hotplug.wq, &wait);
d221938c
GS
175}
176
b9d10be7 177void cpu_hotplug_done(void)
d221938c
GS
178{
179 cpu_hotplug.active_writer = NULL;
180 mutex_unlock(&cpu_hotplug.lock);
a19423b9 181 cpuhp_lock_release();
d221938c 182}
79a6cdeb 183
16e53dbf
SB
184/*
185 * Wait for currently running CPU hotplug operations to complete (if any) and
186 * disable future CPU hotplug (from sysfs). The 'cpu_add_remove_lock' protects
187 * the 'cpu_hotplug_disabled' flag. The same lock is also acquired by the
188 * hotplug path before performing hotplug operations. So acquiring that lock
189 * guarantees mutual exclusion from any currently running hotplug operations.
190 */
191void cpu_hotplug_disable(void)
192{
193 cpu_maps_update_begin();
89af7ba5 194 cpu_hotplug_disabled++;
16e53dbf
SB
195 cpu_maps_update_done();
196}
197
198void cpu_hotplug_enable(void)
199{
200 cpu_maps_update_begin();
89af7ba5 201 WARN_ON(--cpu_hotplug_disabled < 0);
16e53dbf
SB
202 cpu_maps_update_done();
203}
204
b9d10be7 205#endif /* CONFIG_HOTPLUG_CPU */
79a6cdeb 206
1da177e4 207/* Need to know about CPUs going up/down? */
f7b16c10 208int __ref register_cpu_notifier(struct notifier_block *nb)
1da177e4 209{
bd5349cf 210 int ret;
d221938c 211 cpu_maps_update_begin();
bd5349cf 212 ret = raw_notifier_chain_register(&cpu_chain, nb);
d221938c 213 cpu_maps_update_done();
bd5349cf 214 return ret;
1da177e4 215}
65edc68c 216
93ae4f97
SB
217int __ref __register_cpu_notifier(struct notifier_block *nb)
218{
219 return raw_notifier_chain_register(&cpu_chain, nb);
220}
221
e9fb7631
AM
222static int __cpu_notify(unsigned long val, void *v, int nr_to_call,
223 int *nr_calls)
224{
e6bde73b
AM
225 int ret;
226
227 ret = __raw_notifier_call_chain(&cpu_chain, val, v, nr_to_call,
e9fb7631 228 nr_calls);
e6bde73b
AM
229
230 return notifier_to_errno(ret);
e9fb7631
AM
231}
232
233static int cpu_notify(unsigned long val, void *v)
234{
235 return __cpu_notify(val, v, -1, NULL);
236}
237
00b9b0af
LT
238#ifdef CONFIG_HOTPLUG_CPU
239
e9fb7631
AM
/*
 * cpu_notify_nofail - notify for an event that is not allowed to fail:
 * a non-zero result from cpu_notify() is a BUG.
 */
static void cpu_notify_nofail(unsigned long val, void *v)
{
	BUG_ON(cpu_notify(val, v));
}
/* exports for the registration helpers defined earlier in this file */
EXPORT_SYMBOL(register_cpu_notifier);
EXPORT_SYMBOL(__register_cpu_notifier);
1da177e4 246
9647155f 247void __ref unregister_cpu_notifier(struct notifier_block *nb)
1da177e4 248{
d221938c 249 cpu_maps_update_begin();
bd5349cf 250 raw_notifier_chain_unregister(&cpu_chain, nb);
d221938c 251 cpu_maps_update_done();
1da177e4
LT
252}
253EXPORT_SYMBOL(unregister_cpu_notifier);
254
93ae4f97
SB
255void __ref __unregister_cpu_notifier(struct notifier_block *nb)
256{
257 raw_notifier_chain_unregister(&cpu_chain, nb);
258}
259EXPORT_SYMBOL(__unregister_cpu_notifier);
260
e4cc2f87
AV
261/**
262 * clear_tasks_mm_cpumask - Safely clear tasks' mm_cpumask for a CPU
263 * @cpu: a CPU id
264 *
265 * This function walks all processes, finds a valid mm struct for each one and
266 * then clears a corresponding bit in mm's cpumask. While this all sounds
267 * trivial, there are various non-obvious corner cases, which this function
268 * tries to solve in a safe manner.
269 *
270 * Also note that the function uses a somewhat relaxed locking scheme, so it may
271 * be called only for an already offlined CPU.
272 */
cb79295e
AV
273void clear_tasks_mm_cpumask(int cpu)
274{
275 struct task_struct *p;
276
277 /*
278 * This function is called after the cpu is taken down and marked
279 * offline, so its not like new tasks will ever get this cpu set in
280 * their mm mask. -- Peter Zijlstra
281 * Thus, we may use rcu_read_lock() here, instead of grabbing
282 * full-fledged tasklist_lock.
283 */
e4cc2f87 284 WARN_ON(cpu_online(cpu));
cb79295e
AV
285 rcu_read_lock();
286 for_each_process(p) {
287 struct task_struct *t;
288
e4cc2f87
AV
289 /*
290 * Main thread might exit, but other threads may still have
291 * a valid mm. Find one.
292 */
cb79295e
AV
293 t = find_lock_task_mm(p);
294 if (!t)
295 continue;
296 cpumask_clear_cpu(cpu, mm_cpumask(t->mm));
297 task_unlock(t);
298 }
299 rcu_read_unlock();
300}
301
b728ca06 302static inline void check_for_tasks(int dead_cpu)
1da177e4 303{
b728ca06 304 struct task_struct *g, *p;
1da177e4 305
b728ca06
KT
306 read_lock_irq(&tasklist_lock);
307 do_each_thread(g, p) {
308 if (!p->on_rq)
309 continue;
310 /*
311 * We do the check with unlocked task_rq(p)->lock.
312 * Order the reading to do not warn about a task,
313 * which was running on this cpu in the past, and
314 * it's just been woken on another cpu.
315 */
316 rmb();
317 if (task_cpu(p) != dead_cpu)
318 continue;
319
320 pr_warn("Task %s (pid=%d) is on cpu %d (state=%ld, flags=%x)\n",
321 p->comm, task_pid_nr(p), dead_cpu, p->state, p->flags);
322 } while_each_thread(g, p);
323 read_unlock_irq(&tasklist_lock);
1da177e4
LT
324}
325
db912f96
AK
/* Argument bundle handed from _cpu_down() to take_cpu_down(). */
struct take_cpu_down_param {
	unsigned long mod;	/* OR-ed into the CPU_DYING event code */
	void *hcpu;		/* CPU number, cast to a pointer for the notifiers */
};
330
1da177e4 331/* Take this CPU down. */
514a20a5 332static int __ref take_cpu_down(void *_param)
1da177e4 333{
db912f96 334 struct take_cpu_down_param *param = _param;
1da177e4
LT
335 int err;
336
1da177e4
LT
337 /* Ensure this CPU doesn't handle any more interrupts. */
338 err = __cpu_disable();
339 if (err < 0)
f3705136 340 return err;
1da177e4 341
e9fb7631 342 cpu_notify(CPU_DYING | param->mod, param->hcpu);
52c063d1
TG
343 /* Give up timekeeping duties */
344 tick_handover_do_timer();
14e568e7
TG
345 /* Park the stopper thread */
346 kthread_park(current);
f3705136 347 return 0;
1da177e4
LT
348}
349
e3920fb4 350/* Requires cpu_add_remove_lock to be held */
514a20a5 351static int __ref _cpu_down(unsigned int cpu, int tasks_frozen)
1da177e4 352{
e7407dcc 353 int err, nr_calls = 0;
e7407dcc 354 void *hcpu = (void *)(long)cpu;
8bb78442 355 unsigned long mod = tasks_frozen ? CPU_TASKS_FROZEN : 0;
db912f96
AK
356 struct take_cpu_down_param tcd_param = {
357 .mod = mod,
358 .hcpu = hcpu,
359 };
1da177e4 360
e3920fb4
RW
361 if (num_online_cpus() == 1)
362 return -EBUSY;
1da177e4 363
e3920fb4
RW
364 if (!cpu_online(cpu))
365 return -EINVAL;
1da177e4 366
d221938c 367 cpu_hotplug_begin();
4d51985e 368
e9fb7631 369 err = __cpu_notify(CPU_DOWN_PREPARE | mod, hcpu, -1, &nr_calls);
e6bde73b 370 if (err) {
a0d8cdb6 371 nr_calls--;
e9fb7631 372 __cpu_notify(CPU_DOWN_FAILED | mod, hcpu, nr_calls, NULL);
84117da5
FF
373 pr_warn("%s: attempt to take down CPU %u failed\n",
374 __func__, cpu);
baaca49f 375 goto out_release;
1da177e4
LT
376 }
377
6acce3ef
PZ
378 /*
379 * By now we've cleared cpu_active_mask, wait for all preempt-disabled
380 * and RCU users of this state to go away such that all new such users
381 * will observe it.
382 *
383 * For CONFIG_PREEMPT we have preemptible RCU and its sync_rcu() might
384 * not imply sync_sched(), so explicitly call both.
106dd5af
M
385 *
386 * Do sync before park smpboot threads to take care the rcu boost case.
6acce3ef
PZ
387 */
388#ifdef CONFIG_PREEMPT
389 synchronize_sched();
390#endif
391 synchronize_rcu();
392
106dd5af
M
393 smpboot_park_threads(cpu);
394
6acce3ef 395 /*
a8994181
TG
396 * Prevent irq alloc/free while the dying cpu reorganizes the
397 * interrupt affinities.
6acce3ef 398 */
a8994181 399 irq_lock_sparse();
6acce3ef 400
a8994181
TG
401 /*
402 * So now all preempt/rcu users must observe !cpu_active().
403 */
e0b582ec 404 err = __stop_machine(take_cpu_down, &tcd_param, cpumask_of(cpu));
04321587 405 if (err) {
1da177e4 406 /* CPU didn't die: tell everyone. Can't complain. */
e9fb7631 407 cpu_notify_nofail(CPU_DOWN_FAILED | mod, hcpu);
a8994181 408 irq_unlock_sparse();
6a1bdc1b 409 goto out_release;
8fa1d7d3 410 }
04321587 411 BUG_ON(cpu_online(cpu));
1da177e4 412
48c5ccae
PZ
413 /*
414 * The migration_call() CPU_DYING callback will have removed all
415 * runnable tasks from the cpu, there's only the idle task left now
416 * that the migration thread is done doing the stop_machine thing.
51a96c77
PZ
417 *
418 * Wait for the stop thread to go away.
48c5ccae 419 */
528a25b0 420 while (!per_cpu(cpu_dead_idle, cpu))
51a96c77 421 cpu_relax();
528a25b0
PM
422 smp_mb(); /* Read from cpu_dead_idle before __cpu_die(). */
423 per_cpu(cpu_dead_idle, cpu) = false;
1da177e4 424
a8994181
TG
425 /* Interrupts are moved away from the dying cpu, reenable alloc/free */
426 irq_unlock_sparse();
427
345527b1 428 hotplug_cpu__broadcast_tick_pull(cpu);
1da177e4
LT
429 /* This actually kills the CPU. */
430 __cpu_die(cpu);
431
1da177e4 432 /* CPU is completely dead: tell everyone. Too late to complain. */
a49b116d 433 tick_cleanup_dead_cpu(cpu);
e9fb7631 434 cpu_notify_nofail(CPU_DEAD | mod, hcpu);
1da177e4
LT
435
436 check_for_tasks(cpu);
437
baaca49f 438out_release:
d221938c 439 cpu_hotplug_done();
e9fb7631
AM
440 if (!err)
441 cpu_notify_nofail(CPU_POST_DEAD | mod, hcpu);
e3920fb4
RW
442 return err;
443}
444
514a20a5 445int __ref cpu_down(unsigned int cpu)
e3920fb4 446{
9ea09af3 447 int err;
e3920fb4 448
d221938c 449 cpu_maps_update_begin();
e761b772
MK
450
451 if (cpu_hotplug_disabled) {
e3920fb4 452 err = -EBUSY;
e761b772
MK
453 goto out;
454 }
455
e761b772 456 err = _cpu_down(cpu, 0);
e3920fb4 457
e761b772 458out:
d221938c 459 cpu_maps_update_done();
1da177e4
LT
460 return err;
461}
b62b8ef9 462EXPORT_SYMBOL(cpu_down);
1da177e4
LT
463#endif /*CONFIG_HOTPLUG_CPU*/
464
00df35f9
PM
465/*
466 * Unpark per-CPU smpboot kthreads at CPU-online time.
467 */
468static int smpboot_thread_call(struct notifier_block *nfb,
469 unsigned long action, void *hcpu)
470{
471 int cpu = (long)hcpu;
472
473 switch (action & ~CPU_TASKS_FROZEN) {
474
64eaf974 475 case CPU_DOWN_FAILED:
00df35f9
PM
476 case CPU_ONLINE:
477 smpboot_unpark_threads(cpu);
478 break;
479
480 default:
481 break;
482 }
483
484 return NOTIFY_OK;
485}
486
487static struct notifier_block smpboot_thread_notifier = {
488 .notifier_call = smpboot_thread_call,
489 .priority = CPU_PRI_SMPBOOT,
490};
491
927da9df 492void smpboot_thread_init(void)
00df35f9
PM
493{
494 register_cpu_notifier(&smpboot_thread_notifier);
495}
496
e3920fb4 497/* Requires cpu_add_remove_lock to be held */
0db0628d 498static int _cpu_up(unsigned int cpu, int tasks_frozen)
1da177e4 499{
baaca49f 500 int ret, nr_calls = 0;
1da177e4 501 void *hcpu = (void *)(long)cpu;
8bb78442 502 unsigned long mod = tasks_frozen ? CPU_TASKS_FROZEN : 0;
3bb5d2ee 503 struct task_struct *idle;
1da177e4 504
d221938c 505 cpu_hotplug_begin();
38498a67 506
5e5041f3
YI
507 if (cpu_online(cpu) || !cpu_present(cpu)) {
508 ret = -EINVAL;
509 goto out;
510 }
511
3bb5d2ee
SS
512 idle = idle_thread_get(cpu);
513 if (IS_ERR(idle)) {
514 ret = PTR_ERR(idle);
38498a67 515 goto out;
3bb5d2ee 516 }
38498a67 517
f97f8f06
TG
518 ret = smpboot_create_threads(cpu);
519 if (ret)
520 goto out;
521
e9fb7631 522 ret = __cpu_notify(CPU_UP_PREPARE | mod, hcpu, -1, &nr_calls);
e6bde73b 523 if (ret) {
a0d8cdb6 524 nr_calls--;
84117da5
FF
525 pr_warn("%s: attempt to bring up CPU %u failed\n",
526 __func__, cpu);
1da177e4
LT
527 goto out_notify;
528 }
529
530 /* Arch-specific enabling code. */
3bb5d2ee 531 ret = __cpu_up(cpu, idle);
a8994181 532
1da177e4
LT
533 if (ret != 0)
534 goto out_notify;
6978c705 535 BUG_ON(!cpu_online(cpu));
1da177e4
LT
536
537 /* Now call notifier in preparation. */
e9fb7631 538 cpu_notify(CPU_ONLINE | mod, hcpu);
1da177e4
LT
539
540out_notify:
541 if (ret != 0)
e9fb7631 542 __cpu_notify(CPU_UP_CANCELED | mod, hcpu, nr_calls, NULL);
38498a67 543out:
d221938c 544 cpu_hotplug_done();
e3920fb4
RW
545
546 return ret;
547}
548
0db0628d 549int cpu_up(unsigned int cpu)
e3920fb4
RW
550{
551 int err = 0;
cf23422b 552
e0b582ec 553 if (!cpu_possible(cpu)) {
84117da5
FF
554 pr_err("can't online cpu %d because it is not configured as may-hotadd at boot time\n",
555 cpu);
87d5e023 556#if defined(CONFIG_IA64)
84117da5 557 pr_err("please check additional_cpus= boot parameter\n");
73e753a5
KH
558#endif
559 return -EINVAL;
560 }
e3920fb4 561
01b0f197
TK
562 err = try_online_node(cpu_to_node(cpu));
563 if (err)
564 return err;
cf23422b 565
d221938c 566 cpu_maps_update_begin();
e761b772
MK
567
568 if (cpu_hotplug_disabled) {
e3920fb4 569 err = -EBUSY;
e761b772
MK
570 goto out;
571 }
572
573 err = _cpu_up(cpu, 0);
574
e761b772 575out:
d221938c 576 cpu_maps_update_done();
e3920fb4
RW
577 return err;
578}
a513f6ba 579EXPORT_SYMBOL_GPL(cpu_up);
e3920fb4 580
f3de4be9 581#ifdef CONFIG_PM_SLEEP_SMP
e0b582ec 582static cpumask_var_t frozen_cpus;
e3920fb4
RW
583
584int disable_nonboot_cpus(void)
585{
e9a5f426 586 int cpu, first_cpu, error = 0;
e3920fb4 587
d221938c 588 cpu_maps_update_begin();
e0b582ec 589 first_cpu = cpumask_first(cpu_online_mask);
9ee349ad
XF
590 /*
591 * We take down all of the non-boot CPUs in one shot to avoid races
e3920fb4
RW
592 * with the userspace trying to use the CPU hotplug at the same time
593 */
e0b582ec 594 cpumask_clear(frozen_cpus);
6ad4c188 595
84117da5 596 pr_info("Disabling non-boot CPUs ...\n");
e3920fb4
RW
597 for_each_online_cpu(cpu) {
598 if (cpu == first_cpu)
599 continue;
bb3632c6 600 trace_suspend_resume(TPS("CPU_OFF"), cpu, true);
8bb78442 601 error = _cpu_down(cpu, 1);
bb3632c6 602 trace_suspend_resume(TPS("CPU_OFF"), cpu, false);
feae3203 603 if (!error)
e0b582ec 604 cpumask_set_cpu(cpu, frozen_cpus);
feae3203 605 else {
84117da5 606 pr_err("Error taking CPU%d down: %d\n", cpu, error);
e3920fb4
RW
607 break;
608 }
609 }
86886e55 610
89af7ba5 611 if (!error)
e3920fb4 612 BUG_ON(num_online_cpus() > 1);
89af7ba5 613 else
84117da5 614 pr_err("Non-boot CPUs are not disabled\n");
89af7ba5
VK
615
616 /*
617 * Make sure the CPUs won't be enabled by someone else. We need to do
618 * this even in case of failure as all disable_nonboot_cpus() users are
619 * supposed to do enable_nonboot_cpus() on the failure path.
620 */
621 cpu_hotplug_disabled++;
622
d221938c 623 cpu_maps_update_done();
e3920fb4
RW
624 return error;
625}
626
d0af9eed
SS
627void __weak arch_enable_nonboot_cpus_begin(void)
628{
629}
630
631void __weak arch_enable_nonboot_cpus_end(void)
632{
633}
634
fa7303e2 635void __ref enable_nonboot_cpus(void)
e3920fb4
RW
636{
637 int cpu, error;
638
639 /* Allow everyone to use the CPU hotplug again */
d221938c 640 cpu_maps_update_begin();
89af7ba5 641 WARN_ON(--cpu_hotplug_disabled < 0);
e0b582ec 642 if (cpumask_empty(frozen_cpus))
1d64b9cb 643 goto out;
e3920fb4 644
84117da5 645 pr_info("Enabling non-boot CPUs ...\n");
d0af9eed
SS
646
647 arch_enable_nonboot_cpus_begin();
648
e0b582ec 649 for_each_cpu(cpu, frozen_cpus) {
bb3632c6 650 trace_suspend_resume(TPS("CPU_ON"), cpu, true);
8bb78442 651 error = _cpu_up(cpu, 1);
bb3632c6 652 trace_suspend_resume(TPS("CPU_ON"), cpu, false);
e3920fb4 653 if (!error) {
84117da5 654 pr_info("CPU%d is up\n", cpu);
e3920fb4
RW
655 continue;
656 }
84117da5 657 pr_warn("Error taking CPU%d up: %d\n", cpu, error);
e3920fb4 658 }
d0af9eed
SS
659
660 arch_enable_nonboot_cpus_end();
661
e0b582ec 662 cpumask_clear(frozen_cpus);
1d64b9cb 663out:
d221938c 664 cpu_maps_update_done();
1da177e4 665}
e0b582ec 666
d7268a31 667static int __init alloc_frozen_cpus(void)
e0b582ec
RR
668{
669 if (!alloc_cpumask_var(&frozen_cpus, GFP_KERNEL|__GFP_ZERO))
670 return -ENOMEM;
671 return 0;
672}
673core_initcall(alloc_frozen_cpus);
79cfbdfa 674
79cfbdfa
SB
675/*
676 * When callbacks for CPU hotplug notifications are being executed, we must
677 * ensure that the state of the system with respect to the tasks being frozen
678 * or not, as reported by the notification, remains unchanged *throughout the
679 * duration* of the execution of the callbacks.
680 * Hence we need to prevent the freezer from racing with regular CPU hotplug.
681 *
682 * This synchronization is implemented by mutually excluding regular CPU
683 * hotplug and Suspend/Hibernate call paths by hooking onto the Suspend/
684 * Hibernate notifications.
685 */
686static int
687cpu_hotplug_pm_callback(struct notifier_block *nb,
688 unsigned long action, void *ptr)
689{
690 switch (action) {
691
692 case PM_SUSPEND_PREPARE:
693 case PM_HIBERNATION_PREPARE:
16e53dbf 694 cpu_hotplug_disable();
79cfbdfa
SB
695 break;
696
697 case PM_POST_SUSPEND:
698 case PM_POST_HIBERNATION:
16e53dbf 699 cpu_hotplug_enable();
79cfbdfa
SB
700 break;
701
702 default:
703 return NOTIFY_DONE;
704 }
705
706 return NOTIFY_OK;
707}
708
709
d7268a31 710static int __init cpu_hotplug_pm_sync_init(void)
79cfbdfa 711{
6e32d479
FY
712 /*
713 * cpu_hotplug_pm_callback has higher priority than x86
714 * bsp_pm_callback which depends on cpu_hotplug_pm_callback
715 * to disable cpu hotplug to avoid cpu hotplug race.
716 */
79cfbdfa
SB
717 pm_notifier(cpu_hotplug_pm_callback, 0);
718 return 0;
719}
720core_initcall(cpu_hotplug_pm_sync_init);
721
f3de4be9 722#endif /* CONFIG_PM_SLEEP_SMP */
68f4f1ec 723
e545a614
MS
724/**
725 * notify_cpu_starting(cpu) - call the CPU_STARTING notifiers
726 * @cpu: cpu that just started
727 *
728 * This function calls the cpu_chain notifiers with CPU_STARTING.
729 * It must be called by the arch code on the new cpu, before the new cpu
730 * enables interrupts and before the "boot" cpu returns from __cpu_up().
731 */
0db0628d 732void notify_cpu_starting(unsigned int cpu)
e545a614
MS
733{
734 unsigned long val = CPU_STARTING;
735
736#ifdef CONFIG_PM_SLEEP_SMP
e0b582ec 737 if (frozen_cpus != NULL && cpumask_test_cpu(cpu, frozen_cpus))
e545a614
MS
738 val = CPU_STARTING_FROZEN;
739#endif /* CONFIG_PM_SLEEP_SMP */
e9fb7631 740 cpu_notify(val, (void *)(long)cpu);
e545a614
MS
741}
742
68f4f1ec 743#endif /* CONFIG_SMP */
b8d317d1 744
e56b3bc7
LT
745/*
746 * cpu_bit_bitmap[] is a special, "compressed" data structure that
747 * represents all NR_CPUS bits binary values of 1<<nr.
748 *
e0b582ec 749 * It is used by cpumask_of() to get a constant address to a CPU
e56b3bc7
LT
750 * mask value that has a single bit set only.
751 */
b8d317d1 752
e56b3bc7 753/* cpu_bit_bitmap[0] is empty - so we can back into it */
4d51985e 754#define MASK_DECLARE_1(x) [x+1][0] = (1UL << (x))
e56b3bc7
LT
755#define MASK_DECLARE_2(x) MASK_DECLARE_1(x), MASK_DECLARE_1(x+1)
756#define MASK_DECLARE_4(x) MASK_DECLARE_2(x), MASK_DECLARE_2(x+2)
757#define MASK_DECLARE_8(x) MASK_DECLARE_4(x), MASK_DECLARE_4(x+4)
b8d317d1 758
e56b3bc7
LT
759const unsigned long cpu_bit_bitmap[BITS_PER_LONG+1][BITS_TO_LONGS(NR_CPUS)] = {
760
761 MASK_DECLARE_8(0), MASK_DECLARE_8(8),
762 MASK_DECLARE_8(16), MASK_DECLARE_8(24),
763#if BITS_PER_LONG > 32
764 MASK_DECLARE_8(32), MASK_DECLARE_8(40),
765 MASK_DECLARE_8(48), MASK_DECLARE_8(56),
b8d317d1
MT
766#endif
767};
e56b3bc7 768EXPORT_SYMBOL_GPL(cpu_bit_bitmap);
2d3854a3
RR
769
770const DECLARE_BITMAP(cpu_all_bits, NR_CPUS) = CPU_BITS_ALL;
771EXPORT_SYMBOL(cpu_all_bits);
b3199c02
RR
772
773#ifdef CONFIG_INIT_ALL_POSSIBLE
774static DECLARE_BITMAP(cpu_possible_bits, CONFIG_NR_CPUS) __read_mostly
775 = CPU_BITS_ALL;
776#else
777static DECLARE_BITMAP(cpu_possible_bits, CONFIG_NR_CPUS) __read_mostly;
778#endif
779const struct cpumask *const cpu_possible_mask = to_cpumask(cpu_possible_bits);
780EXPORT_SYMBOL(cpu_possible_mask);
781
782static DECLARE_BITMAP(cpu_online_bits, CONFIG_NR_CPUS) __read_mostly;
783const struct cpumask *const cpu_online_mask = to_cpumask(cpu_online_bits);
784EXPORT_SYMBOL(cpu_online_mask);
785
786static DECLARE_BITMAP(cpu_present_bits, CONFIG_NR_CPUS) __read_mostly;
787const struct cpumask *const cpu_present_mask = to_cpumask(cpu_present_bits);
788EXPORT_SYMBOL(cpu_present_mask);
789
790static DECLARE_BITMAP(cpu_active_bits, CONFIG_NR_CPUS) __read_mostly;
791const struct cpumask *const cpu_active_mask = to_cpumask(cpu_active_bits);
792EXPORT_SYMBOL(cpu_active_mask);
3fa41520
RR
793
794void set_cpu_possible(unsigned int cpu, bool possible)
795{
796 if (possible)
797 cpumask_set_cpu(cpu, to_cpumask(cpu_possible_bits));
798 else
799 cpumask_clear_cpu(cpu, to_cpumask(cpu_possible_bits));
800}
801
802void set_cpu_present(unsigned int cpu, bool present)
803{
804 if (present)
805 cpumask_set_cpu(cpu, to_cpumask(cpu_present_bits));
806 else
807 cpumask_clear_cpu(cpu, to_cpumask(cpu_present_bits));
808}
809
810void set_cpu_online(unsigned int cpu, bool online)
811{
6acbfb96 812 if (online) {
3fa41520 813 cpumask_set_cpu(cpu, to_cpumask(cpu_online_bits));
6acbfb96
LJ
814 cpumask_set_cpu(cpu, to_cpumask(cpu_active_bits));
815 } else {
3fa41520 816 cpumask_clear_cpu(cpu, to_cpumask(cpu_online_bits));
6acbfb96 817 }
3fa41520
RR
818}
819
820void set_cpu_active(unsigned int cpu, bool active)
821{
822 if (active)
823 cpumask_set_cpu(cpu, to_cpumask(cpu_active_bits));
824 else
825 cpumask_clear_cpu(cpu, to_cpumask(cpu_active_bits));
826}
827
828void init_cpu_present(const struct cpumask *src)
829{
830 cpumask_copy(to_cpumask(cpu_present_bits), src);
831}
832
833void init_cpu_possible(const struct cpumask *src)
834{
835 cpumask_copy(to_cpumask(cpu_possible_bits), src);
836}
837
838void init_cpu_online(const struct cpumask *src)
839{
840 cpumask_copy(to_cpumask(cpu_online_bits), src);
841}