cgroup: add css_parent()
[linux-2.6-block.git] / kernel / cgroup_freezer.c
CommitLineData
dc52ddc0
MH
/*
 * cgroup_freezer.c - control group freezer subsystem
 *
 * Copyright IBM Corporation, 2007
 *
 * Author : Cedric Le Goater <clg@fr.ibm.com>
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms of version 2.1 of the GNU Lesser General Public License
 * as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it would be useful, but
 * WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
 */
16
9984de1a 17#include <linux/export.h>
5a0e3ad6 18#include <linux/slab.h>
dc52ddc0
MH
19#include <linux/cgroup.h>
20#include <linux/fs.h>
21#include <linux/uaccess.h>
22#include <linux/freezer.h>
23#include <linux/seq_file.h>
24
ef9fe980
TH
/*
 * A cgroup is freezing if any FREEZING flags are set.  FREEZING_SELF is
 * set if "FROZEN" is written to freezer.state cgroupfs file, and cleared
 * for "THAWED".  FREEZING_PARENT is set if the parent freezer is FREEZING
 * for whatever reason.  IOW, a cgroup has FREEZING_PARENT set if one of
 * its ancestors has FREEZING_SELF set.
 */
enum freezer_state_flags {
	CGROUP_FREEZER_ONLINE	= (1 << 0), /* freezer is fully online */
	CGROUP_FREEZING_SELF	= (1 << 1), /* this freezer is freezing */
	CGROUP_FREEZING_PARENT	= (1 << 2), /* the parent freezer is freezing */
	CGROUP_FROZEN		= (1 << 3), /* this and its descendants frozen */

	/* mask for all FREEZING flags */
	CGROUP_FREEZING		= CGROUP_FREEZING_SELF | CGROUP_FREEZING_PARENT,
};
41
42struct freezer {
bcd66c89 43 struct cgroup_subsys_state css;
d6a2fe13 44 unsigned int state;
bcd66c89 45 spinlock_t lock;
dc52ddc0
MH
46};
47
a7c6d554
TH
48static inline struct freezer *css_freezer(struct cgroup_subsys_state *css)
49{
50 return css ? container_of(css, struct freezer, css) : NULL;
51}
52
bcd66c89 53static inline struct freezer *cgroup_freezer(struct cgroup *cgroup)
dc52ddc0 54{
a7c6d554 55 return css_freezer(cgroup_css(cgroup, freezer_subsys_id));
dc52ddc0
MH
56}
57
58static inline struct freezer *task_freezer(struct task_struct *task)
59{
a7c6d554 60 return css_freezer(task_css(task, freezer_subsys_id));
dc52ddc0
MH
61}
62
ef9fe980
TH
63static struct freezer *parent_freezer(struct freezer *freezer)
64{
63876986 65 return css_freezer(css_parent(&freezer->css));
ef9fe980
TH
66}
67
22b4e111 68bool cgroup_freezing(struct task_struct *task)
dc52ddc0 69{
22b4e111 70 bool ret;
dc52ddc0 71
22b4e111 72 rcu_read_lock();
d6a2fe13 73 ret = task_freezer(task)->state & CGROUP_FREEZING;
22b4e111
TH
74 rcu_read_unlock();
75
76 return ret;
dc52ddc0
MH
77}
78
79/*
80 * cgroups_write_string() limits the size of freezer state strings to
81 * CGROUP_LOCAL_BUFFER_SIZE
82 */
d6a2fe13
TH
83static const char *freezer_state_strs(unsigned int state)
84{
85 if (state & CGROUP_FROZEN)
86 return "FROZEN";
87 if (state & CGROUP_FREEZING)
88 return "FREEZING";
89 return "THAWED";
dc52ddc0
MH
90};
91
dc52ddc0
MH
92struct cgroup_subsys freezer_subsys;
93
92fb9748 94static struct cgroup_subsys_state *freezer_css_alloc(struct cgroup *cgroup)
dc52ddc0
MH
95{
96 struct freezer *freezer;
97
98 freezer = kzalloc(sizeof(struct freezer), GFP_KERNEL);
99 if (!freezer)
100 return ERR_PTR(-ENOMEM);
101
102 spin_lock_init(&freezer->lock);
dc52ddc0
MH
103 return &freezer->css;
104}
105
5300a9b3 106/**
92fb9748 107 * freezer_css_online - commit creation of a freezer cgroup
5300a9b3
TH
108 * @cgroup: cgroup being created
109 *
ef9fe980
TH
110 * We're committing to creation of @cgroup. Mark it online and inherit
111 * parent's freezing state while holding both parent's and our
112 * freezer->lock.
5300a9b3 113 */
92fb9748 114static int freezer_css_online(struct cgroup *cgroup)
dc52ddc0 115{
a3201227 116 struct freezer *freezer = cgroup_freezer(cgroup);
ef9fe980
TH
117 struct freezer *parent = parent_freezer(freezer);
118
119 /*
120 * The following double locking and freezing state inheritance
121 * guarantee that @cgroup can never escape ancestors' freezing
122 * states. See cgroup_for_each_descendant_pre() for details.
123 */
124 if (parent)
125 spin_lock_irq(&parent->lock);
126 spin_lock_nested(&freezer->lock, SINGLE_DEPTH_NESTING);
a3201227 127
5300a9b3 128 freezer->state |= CGROUP_FREEZER_ONLINE;
ef9fe980
TH
129
130 if (parent && (parent->state & CGROUP_FREEZING)) {
131 freezer->state |= CGROUP_FREEZING_PARENT | CGROUP_FROZEN;
132 atomic_inc(&system_freezing_cnt);
133 }
134
135 spin_unlock(&freezer->lock);
136 if (parent)
137 spin_unlock_irq(&parent->lock);
b1929db4
TH
138
139 return 0;
5300a9b3
TH
140}
141
142/**
92fb9748 143 * freezer_css_offline - initiate destruction of @cgroup
5300a9b3
TH
144 * @cgroup: cgroup being destroyed
145 *
146 * @cgroup is going away. Mark it dead and decrement system_freezing_count
147 * if it was holding one.
148 */
92fb9748 149static void freezer_css_offline(struct cgroup *cgroup)
5300a9b3
TH
150{
151 struct freezer *freezer = cgroup_freezer(cgroup);
152
153 spin_lock_irq(&freezer->lock);
154
d6a2fe13 155 if (freezer->state & CGROUP_FREEZING)
a3201227 156 atomic_dec(&system_freezing_cnt);
5300a9b3
TH
157
158 freezer->state = 0;
159
160 spin_unlock_irq(&freezer->lock);
161}
162
/* Release the freezer that freezer_css_alloc() allocated for @cgroup. */
static void freezer_css_free(struct cgroup *cgroup)
{
	kfree(cgroup_freezer(cgroup));
}
167
957a4eea 168/*
ead5c473
TH
169 * Tasks can be migrated into a different freezer anytime regardless of its
170 * current state. freezer_attach() is responsible for making new tasks
171 * conform to the current state.
172 *
173 * Freezer state changes and task migration are synchronized via
174 * @freezer->lock. freezer_attach() makes the new tasks conform to the
175 * current state and all following state changes can see the new tasks.
957a4eea 176 */
8755ade6 177static void freezer_attach(struct cgroup *new_cgrp, struct cgroup_taskset *tset)
dc52ddc0 178{
8755ade6 179 struct freezer *freezer = cgroup_freezer(new_cgrp);
bb9d97b6 180 struct task_struct *task;
ef9fe980 181 bool clear_frozen = false;
957a4eea 182
8755ade6
TH
183 spin_lock_irq(&freezer->lock);
184
80a6a2cf 185 /*
8755ade6
TH
186 * Make the new tasks conform to the current state of @new_cgrp.
187 * For simplicity, when migrating any task to a FROZEN cgroup, we
188 * revert it to FREEZING and let update_if_frozen() determine the
189 * correct state later.
190 *
191 * Tasks in @tset are on @new_cgrp but may not conform to its
192 * current state before executing the following - !frozen tasks may
193 * be visible in a FROZEN cgroup and frozen tasks in a THAWED one.
80a6a2cf 194 */
8755ade6 195 cgroup_taskset_for_each(task, new_cgrp, tset) {
d6a2fe13 196 if (!(freezer->state & CGROUP_FREEZING)) {
8755ade6
TH
197 __thaw_task(task);
198 } else {
199 freeze_task(task);
d6a2fe13 200 freezer->state &= ~CGROUP_FROZEN;
ef9fe980 201 clear_frozen = true;
8755ade6
TH
202 }
203 }
dc52ddc0 204
8755ade6 205 spin_unlock_irq(&freezer->lock);
ef9fe980
TH
206
207 /*
208 * Propagate FROZEN clearing upwards. We may race with
209 * update_if_frozen(), but as long as both work bottom-up, either
210 * update_if_frozen() sees child's FROZEN cleared or we clear the
211 * parent's FROZEN later. No parent w/ !FROZEN children can be
212 * left FROZEN.
213 */
214 while (clear_frozen && (freezer = parent_freezer(freezer))) {
215 spin_lock_irq(&freezer->lock);
216 freezer->state &= ~CGROUP_FROZEN;
217 clear_frozen = freezer->state & CGROUP_FREEZING;
218 spin_unlock_irq(&freezer->lock);
219 }
f780bdb7
BB
220}
221
761b3ef5 222static void freezer_fork(struct task_struct *task)
dc52ddc0
MH
223{
224 struct freezer *freezer;
225
8b46f880 226 rcu_read_lock();
dc52ddc0 227 freezer = task_freezer(task);
dc52ddc0 228
3b1b3f6e
LZ
229 /*
230 * The root cgroup is non-freezable, so we can skip the
231 * following check.
232 */
63876986 233 if (!parent_freezer(freezer))
5edee61e 234 goto out;
3b1b3f6e 235
dc52ddc0 236 spin_lock_irq(&freezer->lock);
d6a2fe13 237 if (freezer->state & CGROUP_FREEZING)
839e3407 238 freeze_task(task);
dc52ddc0 239 spin_unlock_irq(&freezer->lock);
5edee61e
TH
240out:
241 rcu_read_unlock();
dc52ddc0
MH
242}
243
ef9fe980
TH
244/**
245 * update_if_frozen - update whether a cgroup finished freezing
246 * @cgroup: cgroup of interest
247 *
248 * Once FREEZING is initiated, transition to FROZEN is lazily updated by
249 * calling this function. If the current state is FREEZING but not FROZEN,
250 * this function checks whether all tasks of this cgroup and the descendant
251 * cgroups finished freezing and, if so, sets FROZEN.
252 *
253 * The caller is responsible for grabbing RCU read lock and calling
254 * update_if_frozen() on all descendants prior to invoking this function.
b4d18311
TH
255 *
256 * Task states and freezer state might disagree while tasks are being
ead5c473
TH
257 * migrated into or out of @cgroup, so we can't verify task states against
258 * @freezer state here. See freezer_attach() for details.
dc52ddc0 259 */
ef9fe980 260static void update_if_frozen(struct cgroup *cgroup)
dc52ddc0 261{
ef9fe980
TH
262 struct freezer *freezer = cgroup_freezer(cgroup);
263 struct cgroup *pos;
dc52ddc0
MH
264 struct cgroup_iter it;
265 struct task_struct *task;
b4d18311 266
ef9fe980
TH
267 WARN_ON_ONCE(!rcu_read_lock_held());
268
269 spin_lock_irq(&freezer->lock);
270
d6a2fe13
TH
271 if (!(freezer->state & CGROUP_FREEZING) ||
272 (freezer->state & CGROUP_FROZEN))
ef9fe980
TH
273 goto out_unlock;
274
275 /* are all (live) children frozen? */
276 cgroup_for_each_child(pos, cgroup) {
277 struct freezer *child = cgroup_freezer(pos);
dc52ddc0 278
ef9fe980
TH
279 if ((child->state & CGROUP_FREEZER_ONLINE) &&
280 !(child->state & CGROUP_FROZEN))
281 goto out_unlock;
282 }
283
284 /* are all tasks frozen? */
dc52ddc0 285 cgroup_iter_start(cgroup, &it);
b4d18311 286
dc52ddc0 287 while ((task = cgroup_iter_next(cgroup, &it))) {
3c426d5e 288 if (freezing(task)) {
3c426d5e
TH
289 /*
290 * freezer_should_skip() indicates that the task
291 * should be skipped when determining freezing
292 * completion. Consider it frozen in addition to
293 * the usual frozen condition.
294 */
5d8f72b5 295 if (!frozen(task) && !freezer_should_skip(task))
ef9fe980 296 goto out_iter_end;
3c426d5e 297 }
dc52ddc0
MH
298 }
299
d6a2fe13 300 freezer->state |= CGROUP_FROZEN;
ef9fe980 301out_iter_end:
dc52ddc0 302 cgroup_iter_end(cgroup, &it);
ef9fe980
TH
303out_unlock:
304 spin_unlock_irq(&freezer->lock);
dc52ddc0
MH
305}
306
307static int freezer_read(struct cgroup *cgroup, struct cftype *cft,
308 struct seq_file *m)
309{
ef9fe980 310 struct cgroup *pos;
dc52ddc0 311
ef9fe980 312 rcu_read_lock();
dc52ddc0 313
ef9fe980
TH
314 /* update states bottom-up */
315 cgroup_for_each_descendant_post(pos, cgroup)
316 update_if_frozen(pos);
317 update_if_frozen(cgroup);
318
319 rcu_read_unlock();
320
321 seq_puts(m, freezer_state_strs(cgroup_freezer(cgroup)->state));
dc52ddc0
MH
322 seq_putc(m, '\n');
323 return 0;
324}
325
bcd66c89 326static void freeze_cgroup(struct freezer *freezer)
dc52ddc0 327{
bcd66c89 328 struct cgroup *cgroup = freezer->css.cgroup;
dc52ddc0
MH
329 struct cgroup_iter it;
330 struct task_struct *task;
dc52ddc0 331
dc52ddc0 332 cgroup_iter_start(cgroup, &it);
51f246ed
TH
333 while ((task = cgroup_iter_next(cgroup, &it)))
334 freeze_task(task);
dc52ddc0 335 cgroup_iter_end(cgroup, &it);
dc52ddc0
MH
336}
337
bcd66c89 338static void unfreeze_cgroup(struct freezer *freezer)
dc52ddc0 339{
bcd66c89 340 struct cgroup *cgroup = freezer->css.cgroup;
dc52ddc0
MH
341 struct cgroup_iter it;
342 struct task_struct *task;
343
344 cgroup_iter_start(cgroup, &it);
a5be2d0d
TH
345 while ((task = cgroup_iter_next(cgroup, &it)))
346 __thaw_task(task);
dc52ddc0 347 cgroup_iter_end(cgroup, &it);
dc52ddc0
MH
348}
349
04a4ec32
TH
350/**
351 * freezer_apply_state - apply state change to a single cgroup_freezer
352 * @freezer: freezer to apply state change to
353 * @freeze: whether to freeze or unfreeze
a2252180
TH
354 * @state: CGROUP_FREEZING_* flag to set or clear
355 *
356 * Set or clear @state on @cgroup according to @freeze, and perform
357 * freezing or thawing as necessary.
04a4ec32 358 */
a2252180
TH
359static void freezer_apply_state(struct freezer *freezer, bool freeze,
360 unsigned int state)
dc52ddc0 361{
ead5c473 362 /* also synchronizes against task migration, see freezer_attach() */
04a4ec32 363 lockdep_assert_held(&freezer->lock);
51308ee5 364
5300a9b3
TH
365 if (!(freezer->state & CGROUP_FREEZER_ONLINE))
366 return;
367
04a4ec32 368 if (freeze) {
d6a2fe13 369 if (!(freezer->state & CGROUP_FREEZING))
a3201227 370 atomic_inc(&system_freezing_cnt);
a2252180 371 freezer->state |= state;
bcd66c89 372 freeze_cgroup(freezer);
04a4ec32 373 } else {
a2252180
TH
374 bool was_freezing = freezer->state & CGROUP_FREEZING;
375
376 freezer->state &= ~state;
377
378 if (!(freezer->state & CGROUP_FREEZING)) {
379 if (was_freezing)
380 atomic_dec(&system_freezing_cnt);
381 freezer->state &= ~CGROUP_FROZEN;
382 unfreeze_cgroup(freezer);
383 }
dc52ddc0 384 }
04a4ec32 385}
22b4e111 386
04a4ec32
TH
387/**
388 * freezer_change_state - change the freezing state of a cgroup_freezer
389 * @freezer: freezer of interest
390 * @freeze: whether to freeze or thaw
391 *
ef9fe980
TH
392 * Freeze or thaw @freezer according to @freeze. The operations are
393 * recursive - all descendants of @freezer will be affected.
04a4ec32
TH
394 */
395static void freezer_change_state(struct freezer *freezer, bool freeze)
396{
ef9fe980
TH
397 struct cgroup *pos;
398
04a4ec32
TH
399 /* update @freezer */
400 spin_lock_irq(&freezer->lock);
a2252180 401 freezer_apply_state(freezer, freeze, CGROUP_FREEZING_SELF);
dc52ddc0 402 spin_unlock_irq(&freezer->lock);
ef9fe980
TH
403
404 /*
405 * Update all its descendants in pre-order traversal. Each
406 * descendant will try to inherit its parent's FREEZING state as
407 * CGROUP_FREEZING_PARENT.
408 */
409 rcu_read_lock();
410 cgroup_for_each_descendant_pre(pos, freezer->css.cgroup) {
411 struct freezer *pos_f = cgroup_freezer(pos);
412 struct freezer *parent = parent_freezer(pos_f);
413
414 /*
415 * Our update to @parent->state is already visible which is
416 * all we need. No need to lock @parent. For more info on
417 * synchronization, see freezer_post_create().
418 */
419 spin_lock_irq(&pos_f->lock);
420 freezer_apply_state(pos_f, parent->state & CGROUP_FREEZING,
421 CGROUP_FREEZING_PARENT);
422 spin_unlock_irq(&pos_f->lock);
423 }
424 rcu_read_unlock();
dc52ddc0
MH
425}
426
bcd66c89 427static int freezer_write(struct cgroup *cgroup, struct cftype *cft,
dc52ddc0
MH
428 const char *buffer)
429{
04a4ec32 430 bool freeze;
dc52ddc0 431
d6a2fe13 432 if (strcmp(buffer, freezer_state_strs(0)) == 0)
04a4ec32 433 freeze = false;
d6a2fe13 434 else if (strcmp(buffer, freezer_state_strs(CGROUP_FROZEN)) == 0)
04a4ec32 435 freeze = true;
dc52ddc0 436 else
3b1b3f6e 437 return -EINVAL;
dc52ddc0 438
04a4ec32 439 freezer_change_state(cgroup_freezer(cgroup), freeze);
51f246ed 440 return 0;
dc52ddc0
MH
441}
442
a2252180
TH
443static u64 freezer_self_freezing_read(struct cgroup *cgroup, struct cftype *cft)
444{
445 struct freezer *freezer = cgroup_freezer(cgroup);
446
447 return (bool)(freezer->state & CGROUP_FREEZING_SELF);
448}
449
450static u64 freezer_parent_freezing_read(struct cgroup *cgroup, struct cftype *cft)
451{
452 struct freezer *freezer = cgroup_freezer(cgroup);
453
454 return (bool)(freezer->state & CGROUP_FREEZING_PARENT);
455}
456
dc52ddc0
MH
457static struct cftype files[] = {
458 {
459 .name = "state",
4baf6e33 460 .flags = CFTYPE_NOT_ON_ROOT,
dc52ddc0
MH
461 .read_seq_string = freezer_read,
462 .write_string = freezer_write,
463 },
a2252180
TH
464 {
465 .name = "self_freezing",
466 .flags = CFTYPE_NOT_ON_ROOT,
467 .read_u64 = freezer_self_freezing_read,
468 },
469 {
470 .name = "parent_freezing",
471 .flags = CFTYPE_NOT_ON_ROOT,
472 .read_u64 = freezer_parent_freezing_read,
473 },
4baf6e33 474 { } /* terminate */
dc52ddc0
MH
475};
476
dc52ddc0
MH
477struct cgroup_subsys freezer_subsys = {
478 .name = "freezer",
92fb9748
TH
479 .css_alloc = freezer_css_alloc,
480 .css_online = freezer_css_online,
481 .css_offline = freezer_css_offline,
482 .css_free = freezer_css_free,
dc52ddc0 483 .subsys_id = freezer_subsys_id,
8755ade6 484 .attach = freezer_attach,
dc52ddc0 485 .fork = freezer_fork,
4baf6e33 486 .base_cftypes = files,
dc52ddc0 487};