cgroup: implement generic child / descendant walk macros
[linux-2.6-block.git] / kernel / cgroup_freezer.c
CommitLineData
dc52ddc0
MH
1/*
2 * cgroup_freezer.c - control group freezer subsystem
3 *
4 * Copyright IBM Corporation, 2007
5 *
6 * Author : Cedric Le Goater <clg@fr.ibm.com>
7 *
8 * This program is free software; you can redistribute it and/or modify it
9 * under the terms of version 2.1 of the GNU Lesser General Public License
10 * as published by the Free Software Foundation.
11 *
12 * This program is distributed in the hope that it would be useful, but
13 * WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
15 */
16
9984de1a 17#include <linux/export.h>
5a0e3ad6 18#include <linux/slab.h>
dc52ddc0
MH
19#include <linux/cgroup.h>
20#include <linux/fs.h>
21#include <linux/uaccess.h>
22#include <linux/freezer.h>
23#include <linux/seq_file.h>
24
/*
 * Freezer state of a cgroup.  The numeric values double as indices into
 * freezer_state_strs[], so the two must be kept in the same order.
 */
enum freezer_state {
	CGROUP_THAWED	= 0,	/* no freeze requested */
	CGROUP_FREEZING	= 1,	/* freeze requested, completion not yet confirmed */
	CGROUP_FROZEN	= 2,	/* update_if_frozen() saw no unfrozen task */
};
30
31struct freezer {
32 struct cgroup_subsys_state css;
33 enum freezer_state state;
34 spinlock_t lock; /* protects _writes_ to state */
35};
36
37static inline struct freezer *cgroup_freezer(
38 struct cgroup *cgroup)
39{
40 return container_of(
41 cgroup_subsys_state(cgroup, freezer_subsys_id),
42 struct freezer, css);
43}
44
45static inline struct freezer *task_freezer(struct task_struct *task)
46{
47 return container_of(task_subsys_state(task, freezer_subsys_id),
48 struct freezer, css);
49}
50
22b4e111 51bool cgroup_freezing(struct task_struct *task)
dc52ddc0 52{
22b4e111
TH
53 enum freezer_state state;
54 bool ret;
dc52ddc0 55
22b4e111
TH
56 rcu_read_lock();
57 state = task_freezer(task)->state;
58 ret = state == CGROUP_FREEZING || state == CGROUP_FROZEN;
59 rcu_read_unlock();
60
61 return ret;
dc52ddc0
MH
62}
63
64/*
65 * cgroups_write_string() limits the size of freezer state strings to
66 * CGROUP_LOCAL_BUFFER_SIZE
67 */
/*
 * Names of the freezer states as read from and written to the "state"
 * file.  Indexed by enum freezer_state, so the order here must match the
 * enumerator order.  Both the strings and the table itself are read-only.
 */
static const char * const freezer_state_strs[] = {
	"THAWED",
	"FREEZING",
	"FROZEN",
};
73
74/*
75 * State diagram
76 * Transitions are caused by userspace writes to the freezer.state file.
77 * The values in parentheses are state labels. The rest are edge labels.
78 *
81dcf33c
MH
79 * (THAWED) --FROZEN--> (FREEZING) --FROZEN--> (FROZEN)
80 *    ^ ^                    |                     |
81 *    | \_______THAWED_______/                     |
82 *    \__________________________THAWED____________/
dc52ddc0
MH
83 */
84
85struct cgroup_subsys freezer_subsys;
86
761b3ef5 87static struct cgroup_subsys_state *freezer_create(struct cgroup *cgroup)
dc52ddc0
MH
88{
89 struct freezer *freezer;
90
91 freezer = kzalloc(sizeof(struct freezer), GFP_KERNEL);
92 if (!freezer)
93 return ERR_PTR(-ENOMEM);
94
95 spin_lock_init(&freezer->lock);
81dcf33c 96 freezer->state = CGROUP_THAWED;
dc52ddc0
MH
97 return &freezer->css;
98}
99
761b3ef5 100static void freezer_destroy(struct cgroup *cgroup)
dc52ddc0 101{
a3201227
TH
102 struct freezer *freezer = cgroup_freezer(cgroup);
103
104 if (freezer->state != CGROUP_THAWED)
105 atomic_dec(&system_freezing_cnt);
106 kfree(freezer);
dc52ddc0
MH
107}
108
957a4eea 109/*
ead5c473
TH
110 * Tasks can be migrated into a different freezer anytime regardless of its
111 * current state. freezer_attach() is responsible for making new tasks
112 * conform to the current state.
113 *
114 * Freezer state changes and task migration are synchronized via
115 * @freezer->lock. freezer_attach() makes the new tasks conform to the
116 * current state and all following state changes can see the new tasks.
957a4eea 117 */
8755ade6 118static void freezer_attach(struct cgroup *new_cgrp, struct cgroup_taskset *tset)
dc52ddc0 119{
8755ade6 120 struct freezer *freezer = cgroup_freezer(new_cgrp);
bb9d97b6 121 struct task_struct *task;
957a4eea 122
8755ade6
TH
123 spin_lock_irq(&freezer->lock);
124
80a6a2cf 125 /*
8755ade6
TH
126 * Make the new tasks conform to the current state of @new_cgrp.
127 * For simplicity, when migrating any task to a FROZEN cgroup, we
128 * revert it to FREEZING and let update_if_frozen() determine the
129 * correct state later.
130 *
131 * Tasks in @tset are on @new_cgrp but may not conform to its
132 * current state before executing the following - !frozen tasks may
133 * be visible in a FROZEN cgroup and frozen tasks in a THAWED one.
134 * This means that, to determine whether to freeze, one should test
135 * whether the state equals THAWED.
80a6a2cf 136 */
8755ade6
TH
137 cgroup_taskset_for_each(task, new_cgrp, tset) {
138 if (freezer->state == CGROUP_THAWED) {
139 __thaw_task(task);
140 } else {
141 freeze_task(task);
142 freezer->state = CGROUP_FREEZING;
143 }
144 }
dc52ddc0 145
8755ade6 146 spin_unlock_irq(&freezer->lock);
f780bdb7
BB
147}
148
761b3ef5 149static void freezer_fork(struct task_struct *task)
dc52ddc0
MH
150{
151 struct freezer *freezer;
152
8b46f880 153 rcu_read_lock();
dc52ddc0 154 freezer = task_freezer(task);
dc52ddc0 155
3b1b3f6e
LZ
156 /*
157 * The root cgroup is non-freezable, so we can skip the
158 * following check.
159 */
160 if (!freezer->css.cgroup->parent)
5edee61e 161 goto out;
3b1b3f6e 162
dc52ddc0 163 spin_lock_irq(&freezer->lock);
8755ade6
TH
164 /*
165 * @task might have been just migrated into a FROZEN cgroup. Test
166 * equality with THAWED. Read the comment in freezer_attach().
167 */
168 if (freezer->state != CGROUP_THAWED)
839e3407 169 freeze_task(task);
dc52ddc0 170 spin_unlock_irq(&freezer->lock);
5edee61e
TH
171out:
172 rcu_read_unlock();
dc52ddc0
MH
173}
174
175/*
b4d18311
TH
176 * We change from FREEZING to FROZEN lazily if the cgroup was only
177 * partially frozen when we exitted write. Caller must hold freezer->lock.
178 *
179 * Task states and freezer state might disagree while tasks are being
ead5c473
TH
180 * migrated into or out of @cgroup, so we can't verify task states against
181 * @freezer state here. See freezer_attach() for details.
dc52ddc0 182 */
b4d18311 183static void update_if_frozen(struct cgroup *cgroup, struct freezer *freezer)
dc52ddc0
MH
184{
185 struct cgroup_iter it;
186 struct task_struct *task;
b4d18311
TH
187
188 if (freezer->state != CGROUP_FREEZING)
189 return;
dc52ddc0
MH
190
191 cgroup_iter_start(cgroup, &it);
b4d18311 192
dc52ddc0 193 while ((task = cgroup_iter_next(cgroup, &it))) {
3c426d5e 194 if (freezing(task)) {
3c426d5e
TH
195 /*
196 * freezer_should_skip() indicates that the task
197 * should be skipped when determining freezing
198 * completion. Consider it frozen in addition to
199 * the usual frozen condition.
200 */
5d8f72b5 201 if (!frozen(task) && !freezer_should_skip(task))
b4d18311 202 goto notyet;
3c426d5e 203 }
dc52ddc0
MH
204 }
205
b4d18311
TH
206 freezer->state = CGROUP_FROZEN;
207notyet:
dc52ddc0
MH
208 cgroup_iter_end(cgroup, &it);
209}
210
211static int freezer_read(struct cgroup *cgroup, struct cftype *cft,
212 struct seq_file *m)
213{
214 struct freezer *freezer;
215 enum freezer_state state;
216
dc52ddc0
MH
217 freezer = cgroup_freezer(cgroup);
218 spin_lock_irq(&freezer->lock);
b4d18311 219 update_if_frozen(cgroup, freezer);
dc52ddc0 220 state = freezer->state;
dc52ddc0 221 spin_unlock_irq(&freezer->lock);
dc52ddc0
MH
222
223 seq_puts(m, freezer_state_strs[state]);
224 seq_putc(m, '\n');
225 return 0;
226}
227
51f246ed 228static void freeze_cgroup(struct cgroup *cgroup, struct freezer *freezer)
dc52ddc0
MH
229{
230 struct cgroup_iter it;
231 struct task_struct *task;
dc52ddc0 232
dc52ddc0 233 cgroup_iter_start(cgroup, &it);
51f246ed
TH
234 while ((task = cgroup_iter_next(cgroup, &it)))
235 freeze_task(task);
dc52ddc0 236 cgroup_iter_end(cgroup, &it);
dc52ddc0
MH
237}
238
00c2e63c 239static void unfreeze_cgroup(struct cgroup *cgroup, struct freezer *freezer)
dc52ddc0
MH
240{
241 struct cgroup_iter it;
242 struct task_struct *task;
243
244 cgroup_iter_start(cgroup, &it);
a5be2d0d
TH
245 while ((task = cgroup_iter_next(cgroup, &it)))
246 __thaw_task(task);
dc52ddc0 247 cgroup_iter_end(cgroup, &it);
dc52ddc0
MH
248}
249
51f246ed
TH
250static void freezer_change_state(struct cgroup *cgroup,
251 enum freezer_state goal_state)
dc52ddc0 252{
51f246ed 253 struct freezer *freezer = cgroup_freezer(cgroup);
51308ee5 254
ead5c473 255 /* also synchronizes against task migration, see freezer_attach() */
dc52ddc0 256 spin_lock_irq(&freezer->lock);
51308ee5 257
51308ee5 258 switch (goal_state) {
81dcf33c 259 case CGROUP_THAWED:
a3201227
TH
260 if (freezer->state != CGROUP_THAWED)
261 atomic_dec(&system_freezing_cnt);
22b4e111 262 freezer->state = CGROUP_THAWED;
51308ee5 263 unfreeze_cgroup(cgroup, freezer);
dc52ddc0 264 break;
81dcf33c 265 case CGROUP_FROZEN:
a3201227
TH
266 if (freezer->state == CGROUP_THAWED)
267 atomic_inc(&system_freezing_cnt);
22b4e111 268 freezer->state = CGROUP_FREEZING;
51f246ed 269 freeze_cgroup(cgroup, freezer);
dc52ddc0
MH
270 break;
271 default:
51308ee5 272 BUG();
dc52ddc0 273 }
22b4e111 274
dc52ddc0 275 spin_unlock_irq(&freezer->lock);
dc52ddc0
MH
276}
277
278static int freezer_write(struct cgroup *cgroup,
279 struct cftype *cft,
280 const char *buffer)
281{
dc52ddc0
MH
282 enum freezer_state goal_state;
283
81dcf33c
MH
284 if (strcmp(buffer, freezer_state_strs[CGROUP_THAWED]) == 0)
285 goal_state = CGROUP_THAWED;
286 else if (strcmp(buffer, freezer_state_strs[CGROUP_FROZEN]) == 0)
287 goal_state = CGROUP_FROZEN;
dc52ddc0 288 else
3b1b3f6e 289 return -EINVAL;
dc52ddc0 290
51f246ed 291 freezer_change_state(cgroup, goal_state);
51f246ed 292 return 0;
dc52ddc0
MH
293}
294
295static struct cftype files[] = {
296 {
297 .name = "state",
4baf6e33 298 .flags = CFTYPE_NOT_ON_ROOT,
dc52ddc0
MH
299 .read_seq_string = freezer_read,
300 .write_string = freezer_write,
301 },
4baf6e33 302 { } /* terminate */
dc52ddc0
MH
303};
304
dc52ddc0
MH
305struct cgroup_subsys freezer_subsys = {
306 .name = "freezer",
307 .create = freezer_create,
308 .destroy = freezer_destroy,
dc52ddc0 309 .subsys_id = freezer_subsys_id,
8755ade6 310 .attach = freezer_attach,
dc52ddc0 311 .fork = freezer_fork,
4baf6e33 312 .base_cftypes = files,
8c7f6edb
TH
313
314 /*
315 * freezer subsys doesn't handle hierarchy at all. Frozen state
316 * should be inherited through the hierarchy - if a parent is
317 * frozen, all its children should be frozen. Fix it and remove
318 * the following.
319 */
320 .broken_hierarchy = true,
dc52ddc0 321};