Merge tag 'pm-6.16-rc5' of git://git.kernel.org/pub/scm/linux/kernel/git/rafael/linux-pm
[linux-2.6-block.git] / kernel / cgroup / legacy_freezer.c
CommitLineData
dc52ddc0
MH
1/*
2 * cgroup_freezer.c - control group freezer subsystem
3 *
4 * Copyright IBM Corporation, 2007
5 *
6 * Author : Cedric Le Goater <clg@fr.ibm.com>
7 *
8 * This program is free software; you can redistribute it and/or modify it
9 * under the terms of version 2.1 of the GNU Lesser General Public License
10 * as published by the Free Software Foundation.
11 *
12 * This program is distributed in the hope that it would be useful, but
13 * WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
15 */
16
9984de1a 17#include <linux/export.h>
5a0e3ad6 18#include <linux/slab.h>
dc52ddc0
MH
19#include <linux/cgroup.h>
20#include <linux/fs.h>
21#include <linux/uaccess.h>
22#include <linux/freezer.h>
23#include <linux/seq_file.h>
e5ced8eb 24#include <linux/mutex.h>
57dcd64c 25#include <linux/cpu.h>
dc52ddc0 26
ef9fe980
TH
/*
 * State bits stored in freezer->state.
 *
 * A cgroup is freezing if any FREEZING flag is set.  FREEZING_SELF is set
 * when "FROZEN" is written to the freezer.state cgroupfs file and cleared
 * again for "THAWED".  FREEZING_PARENT is set while the parent freezer is
 * FREEZING for whatever reason.  IOW, a cgroup has FREEZING_PARENT set if
 * one of its ancestors has FREEZING_SELF set.
 */
enum freezer_state_flags {
	/* freezer is fully online */
	CGROUP_FREEZER_ONLINE	= (1 << 0),
	/* this freezer is freezing */
	CGROUP_FREEZING_SELF	= (1 << 1),
	/* the parent freezer is freezing */
	CGROUP_FREEZING_PARENT	= (1 << 2),
	/* this and its descendants frozen */
	CGROUP_FROZEN		= (1 << 3),

	/* mask for all FREEZING flags */
	CGROUP_FREEZING		= CGROUP_FREEZING_SELF | CGROUP_FREEZING_PARENT,
};
43
44struct freezer {
bcd66c89 45 struct cgroup_subsys_state css;
d6a2fe13 46 unsigned int state;
dc52ddc0
MH
47};
48
e5ced8eb
TH
/*
 * Taken by the css online/offline callbacks, task attach and fork handling,
 * and the freezer.state read and write paths in this file.
 */
static DEFINE_MUTEX(freezer_mutex);
50
a7c6d554
TH
51static inline struct freezer *css_freezer(struct cgroup_subsys_state *css)
52{
53 return css ? container_of(css, struct freezer, css) : NULL;
54}
55
dc52ddc0
MH
56static inline struct freezer *task_freezer(struct task_struct *task)
57{
073219e9 58 return css_freezer(task_css(task, freezer_cgrp_id));
dc52ddc0
MH
59}
60
ef9fe980
TH
61static struct freezer *parent_freezer(struct freezer *freezer)
62{
5c9d535b 63 return css_freezer(freezer->css.parent);
ef9fe980
TH
64}
65
22b4e111 66bool cgroup_freezing(struct task_struct *task)
dc52ddc0 67{
22b4e111 68 bool ret;
cff5f49d 69 unsigned int state;
dc52ddc0 70
22b4e111 71 rcu_read_lock();
cff5f49d
TVP
72 /* Check if the cgroup is still FREEZING, but not FROZEN. The extra
73 * !FROZEN check is required, because the FREEZING bit is not cleared
74 * when the state FROZEN is reached.
75 */
76 state = task_freezer(task)->state;
77 ret = (state & CGROUP_FREEZING) && !(state & CGROUP_FROZEN);
22b4e111
TH
78 rcu_read_unlock();
79
80 return ret;
dc52ddc0
MH
81}
82
d6a2fe13
TH
83static const char *freezer_state_strs(unsigned int state)
84{
85 if (state & CGROUP_FROZEN)
86 return "FROZEN";
87 if (state & CGROUP_FREEZING)
88 return "FREEZING";
89 return "THAWED";
dc52ddc0
MH
90};
91
eb95419b
TH
92static struct cgroup_subsys_state *
93freezer_css_alloc(struct cgroup_subsys_state *parent_css)
dc52ddc0
MH
94{
95 struct freezer *freezer;
96
97 freezer = kzalloc(sizeof(struct freezer), GFP_KERNEL);
98 if (!freezer)
99 return ERR_PTR(-ENOMEM);
100
dc52ddc0
MH
101 return &freezer->css;
102}
103
5300a9b3 104/**
eb95419b
TH
105 * freezer_css_online - commit creation of a freezer css
106 * @css: css being created
5300a9b3 107 *
eb95419b 108 * We're committing to creation of @css. Mark it online and inherit
a6b8daba 109 * parent's freezing state while holding cpus read lock and freezer_mutex.
5300a9b3 110 */
eb95419b 111static int freezer_css_online(struct cgroup_subsys_state *css)
dc52ddc0 112{
eb95419b 113 struct freezer *freezer = css_freezer(css);
ef9fe980
TH
114 struct freezer *parent = parent_freezer(freezer);
115
f0cc7492 116 cpus_read_lock();
e5ced8eb 117 mutex_lock(&freezer_mutex);
a3201227 118
5300a9b3 119 freezer->state |= CGROUP_FREEZER_ONLINE;
ef9fe980
TH
120
121 if (parent && (parent->state & CGROUP_FREEZING)) {
122 freezer->state |= CGROUP_FREEZING_PARENT | CGROUP_FROZEN;
f0cc7492 123 static_branch_inc_cpuslocked(&freezer_active);
ef9fe980
TH
124 }
125
e5ced8eb 126 mutex_unlock(&freezer_mutex);
f0cc7492 127 cpus_read_unlock();
b1929db4 128 return 0;
5300a9b3
TH
129}
130
131/**
eb95419b
TH
132 * freezer_css_offline - initiate destruction of a freezer css
133 * @css: css being destroyed
5300a9b3 134 *
f71bfbe1 135 * @css is going away. Mark it dead and decrement freezer_active if
eb95419b 136 * it was holding one.
5300a9b3 137 */
eb95419b 138static void freezer_css_offline(struct cgroup_subsys_state *css)
5300a9b3 139{
eb95419b 140 struct freezer *freezer = css_freezer(css);
5300a9b3 141
f0cc7492 142 cpus_read_lock();
e5ced8eb 143 mutex_lock(&freezer_mutex);
5300a9b3 144
d6a2fe13 145 if (freezer->state & CGROUP_FREEZING)
f0cc7492 146 static_branch_dec_cpuslocked(&freezer_active);
5300a9b3
TH
147
148 freezer->state = 0;
149
e5ced8eb 150 mutex_unlock(&freezer_mutex);
f0cc7492 151 cpus_read_unlock();
5300a9b3
TH
152}
153
/* Release the freezer that embeds @css. */
static void freezer_css_free(struct cgroup_subsys_state *css)
{
	struct freezer *freezer = css_freezer(css);

	kfree(freezer);
}
158
957a4eea 159/*
ead5c473
TH
160 * Tasks can be migrated into a different freezer anytime regardless of its
161 * current state. freezer_attach() is responsible for making new tasks
162 * conform to the current state.
163 *
164 * Freezer state changes and task migration are synchronized via
165 * @freezer->lock. freezer_attach() makes the new tasks conform to the
166 * current state and all following state changes can see the new tasks.
957a4eea 167 */
1f7dd3e5 168static void freezer_attach(struct cgroup_taskset *tset)
dc52ddc0 169{
bb9d97b6 170 struct task_struct *task;
1f7dd3e5 171 struct cgroup_subsys_state *new_css;
957a4eea 172
e5ced8eb 173 mutex_lock(&freezer_mutex);
8755ade6 174
80a6a2cf 175 /*
eb95419b 176 * Make the new tasks conform to the current state of @new_css.
8755ade6
TH
177 * For simplicity, when migrating any task to a FROZEN cgroup, we
178 * revert it to FREEZING and let update_if_frozen() determine the
179 * correct state later.
180 *
eb95419b 181 * Tasks in @tset are on @new_css but may not conform to its
8755ade6
TH
182 * current state before executing the following - !frozen tasks may
183 * be visible in a FROZEN cgroup and frozen tasks in a THAWED one.
80a6a2cf 184 */
1f7dd3e5 185 cgroup_taskset_for_each(task, new_css, tset) {
599c963a
TH
186 struct freezer *freezer = css_freezer(new_css);
187
d6a2fe13 188 if (!(freezer->state & CGROUP_FREEZING)) {
8755ade6
TH
189 __thaw_task(task);
190 } else {
599c963a
TH
191 /* clear FROZEN and propagate upwards */
192 while (freezer && (freezer->state & CGROUP_FROZEN)) {
193 freezer->state &= ~CGROUP_FROZEN;
194 freezer = parent_freezer(freezer);
195 }
37fb58a7 196 freeze_task(task);
8755ade6
TH
197 }
198 }
dc52ddc0 199
e5ced8eb 200 mutex_unlock(&freezer_mutex);
f780bdb7
BB
201}
202
a60bed29
TH
203/**
204 * freezer_fork - cgroup post fork callback
205 * @task: a task which has just been forked
206 *
207 * @task has just been created and should conform to the current state of
208 * the cgroup_freezer it belongs to. This function may race against
209 * freezer_attach(). Losing to freezer_attach() means that we don't have
210 * to do anything as freezer_attach() will put @task into the appropriate
211 * state.
212 */
b53202e6 213static void freezer_fork(struct task_struct *task)
dc52ddc0
MH
214{
215 struct freezer *freezer;
216
3b1b3f6e 217 /*
a60bed29
TH
218 * The root cgroup is non-freezable, so we can skip locking the
219 * freezer. This is safe regardless of race with task migration.
220 * If we didn't race or won, skipping is obviously the right thing
221 * to do. If we lost and root is the new cgroup, noop is still the
222 * right thing to do.
3b1b3f6e 223 */
e5ced8eb
TH
224 if (task_css_is_root(task, freezer_cgrp_id))
225 return;
3b1b3f6e 226
e5ced8eb
TH
227 mutex_lock(&freezer_mutex);
228 rcu_read_lock();
229
230 freezer = task_freezer(task);
231 if (freezer->state & CGROUP_FREEZING)
839e3407 232 freeze_task(task);
e5ced8eb 233
5edee61e 234 rcu_read_unlock();
e5ced8eb 235 mutex_unlock(&freezer_mutex);
dc52ddc0
MH
236}
237
ef9fe980
TH
238/**
239 * update_if_frozen - update whether a cgroup finished freezing
182446d0 240 * @css: css of interest
ef9fe980
TH
241 *
242 * Once FREEZING is initiated, transition to FROZEN is lazily updated by
243 * calling this function. If the current state is FREEZING but not FROZEN,
244 * this function checks whether all tasks of this cgroup and the descendant
245 * cgroups finished freezing and, if so, sets FROZEN.
246 *
247 * The caller is responsible for grabbing RCU read lock and calling
248 * update_if_frozen() on all descendants prior to invoking this function.
b4d18311
TH
249 *
250 * Task states and freezer state might disagree while tasks are being
182446d0 251 * migrated into or out of @css, so we can't verify task states against
ead5c473 252 * @freezer state here. See freezer_attach() for details.
dc52ddc0 253 */
182446d0 254static void update_if_frozen(struct cgroup_subsys_state *css)
dc52ddc0 255{
182446d0 256 struct freezer *freezer = css_freezer(css);
492eb21b 257 struct cgroup_subsys_state *pos;
72ec7029 258 struct css_task_iter it;
dc52ddc0 259 struct task_struct *task;
b4d18311 260
e5ced8eb 261 lockdep_assert_held(&freezer_mutex);
ef9fe980 262
d6a2fe13
TH
263 if (!(freezer->state & CGROUP_FREEZING) ||
264 (freezer->state & CGROUP_FROZEN))
e5ced8eb 265 return;
ef9fe980
TH
266
267 /* are all (live) children frozen? */
e5ced8eb 268 rcu_read_lock();
492eb21b
TH
269 css_for_each_child(pos, css) {
270 struct freezer *child = css_freezer(pos);
dc52ddc0 271
ef9fe980 272 if ((child->state & CGROUP_FREEZER_ONLINE) &&
36e9d2eb
TH
273 !(child->state & CGROUP_FROZEN)) {
274 rcu_read_unlock();
e5ced8eb 275 return;
36e9d2eb 276 }
ef9fe980 277 }
e5ced8eb 278 rcu_read_unlock();
ef9fe980
TH
279
280 /* are all tasks frozen? */
bc2fb7ed 281 css_task_iter_start(css, 0, &it);
b4d18311 282
72ec7029 283 while ((task = css_task_iter_next(&it))) {
f5d39b02
PZ
284 if (freezing(task) && !frozen(task))
285 goto out_iter_end;
dc52ddc0
MH
286 }
287
d6a2fe13 288 freezer->state |= CGROUP_FROZEN;
ef9fe980 289out_iter_end:
72ec7029 290 css_task_iter_end(&it);
dc52ddc0
MH
291}
292
2da8ca82 293static int freezer_read(struct seq_file *m, void *v)
dc52ddc0 294{
2da8ca82 295 struct cgroup_subsys_state *css = seq_css(m), *pos;
dc52ddc0 296
e5ced8eb 297 mutex_lock(&freezer_mutex);
ef9fe980 298 rcu_read_lock();
dc52ddc0 299
ef9fe980 300 /* update states bottom-up */
e5ced8eb 301 css_for_each_descendant_post(pos, css) {
ec903c0c 302 if (!css_tryget_online(pos))
e5ced8eb
TH
303 continue;
304 rcu_read_unlock();
305
492eb21b 306 update_if_frozen(pos);
ef9fe980 307
e5ced8eb
TH
308 rcu_read_lock();
309 css_put(pos);
310 }
311
ef9fe980 312 rcu_read_unlock();
e5ced8eb 313 mutex_unlock(&freezer_mutex);
ef9fe980 314
182446d0 315 seq_puts(m, freezer_state_strs(css_freezer(css)->state));
dc52ddc0
MH
316 seq_putc(m, '\n');
317 return 0;
318}
319
bcd66c89 320static void freeze_cgroup(struct freezer *freezer)
dc52ddc0 321{
72ec7029 322 struct css_task_iter it;
dc52ddc0 323 struct task_struct *task;
dc52ddc0 324
bc2fb7ed 325 css_task_iter_start(&freezer->css, 0, &it);
72ec7029 326 while ((task = css_task_iter_next(&it)))
51f246ed 327 freeze_task(task);
72ec7029 328 css_task_iter_end(&it);
dc52ddc0
MH
329}
330
bcd66c89 331static void unfreeze_cgroup(struct freezer *freezer)
dc52ddc0 332{
72ec7029 333 struct css_task_iter it;
dc52ddc0
MH
334 struct task_struct *task;
335
bc2fb7ed 336 css_task_iter_start(&freezer->css, 0, &it);
72ec7029 337 while ((task = css_task_iter_next(&it)))
a5be2d0d 338 __thaw_task(task);
72ec7029 339 css_task_iter_end(&it);
dc52ddc0
MH
340}
341
04a4ec32
TH
342/**
343 * freezer_apply_state - apply state change to a single cgroup_freezer
344 * @freezer: freezer to apply state change to
345 * @freeze: whether to freeze or unfreeze
a2252180
TH
346 * @state: CGROUP_FREEZING_* flag to set or clear
347 *
348 * Set or clear @state on @cgroup according to @freeze, and perform
349 * freezing or thawing as necessary.
04a4ec32 350 */
a2252180
TH
351static void freezer_apply_state(struct freezer *freezer, bool freeze,
352 unsigned int state)
dc52ddc0 353{
ead5c473 354 /* also synchronizes against task migration, see freezer_attach() */
e5ced8eb 355 lockdep_assert_held(&freezer_mutex);
51308ee5 356
5300a9b3
TH
357 if (!(freezer->state & CGROUP_FREEZER_ONLINE))
358 return;
359
04a4ec32 360 if (freeze) {
d6a2fe13 361 if (!(freezer->state & CGROUP_FREEZING))
57dcd64c 362 static_branch_inc_cpuslocked(&freezer_active);
a2252180 363 freezer->state |= state;
bcd66c89 364 freeze_cgroup(freezer);
04a4ec32 365 } else {
a2252180
TH
366 bool was_freezing = freezer->state & CGROUP_FREEZING;
367
368 freezer->state &= ~state;
369
370 if (!(freezer->state & CGROUP_FREEZING)) {
a2252180 371 freezer->state &= ~CGROUP_FROZEN;
f5d39b02 372 if (was_freezing)
57dcd64c 373 static_branch_dec_cpuslocked(&freezer_active);
a2252180
TH
374 unfreeze_cgroup(freezer);
375 }
dc52ddc0 376 }
04a4ec32 377}
22b4e111 378
04a4ec32
TH
379/**
380 * freezer_change_state - change the freezing state of a cgroup_freezer
381 * @freezer: freezer of interest
382 * @freeze: whether to freeze or thaw
383 *
ef9fe980
TH
384 * Freeze or thaw @freezer according to @freeze. The operations are
385 * recursive - all descendants of @freezer will be affected.
04a4ec32
TH
386 */
387static void freezer_change_state(struct freezer *freezer, bool freeze)
388{
492eb21b 389 struct cgroup_subsys_state *pos;
ef9fe980 390
57dcd64c 391 cpus_read_lock();
ef9fe980
TH
392 /*
393 * Update all its descendants in pre-order traversal. Each
394 * descendant will try to inherit its parent's FREEZING state as
395 * CGROUP_FREEZING_PARENT.
396 */
e5ced8eb 397 mutex_lock(&freezer_mutex);
ef9fe980 398 rcu_read_lock();
492eb21b
TH
399 css_for_each_descendant_pre(pos, &freezer->css) {
400 struct freezer *pos_f = css_freezer(pos);
ef9fe980
TH
401 struct freezer *parent = parent_freezer(pos_f);
402
ec903c0c 403 if (!css_tryget_online(pos))
e5ced8eb
TH
404 continue;
405 rcu_read_unlock();
bd8815a6 406
e5ced8eb 407 if (pos_f == freezer)
bd8815a6
TH
408 freezer_apply_state(pos_f, freeze,
409 CGROUP_FREEZING_SELF);
e5ced8eb 410 else
bd8815a6
TH
411 freezer_apply_state(pos_f,
412 parent->state & CGROUP_FREEZING,
413 CGROUP_FREEZING_PARENT);
bd8815a6 414
e5ced8eb
TH
415 rcu_read_lock();
416 css_put(pos);
ef9fe980
TH
417 }
418 rcu_read_unlock();
e5ced8eb 419 mutex_unlock(&freezer_mutex);
57dcd64c 420 cpus_read_unlock();
dc52ddc0
MH
421}
422
451af504
TH
423static ssize_t freezer_write(struct kernfs_open_file *of,
424 char *buf, size_t nbytes, loff_t off)
dc52ddc0 425{
04a4ec32 426 bool freeze;
dc52ddc0 427
451af504
TH
428 buf = strstrip(buf);
429
430 if (strcmp(buf, freezer_state_strs(0)) == 0)
04a4ec32 431 freeze = false;
78f6519e
MK
432 else if (strcmp(buf, freezer_state_strs(CGROUP_FROZEN)) == 0) {
433 pr_info_once("Freezing with imperfect legacy cgroup freezer. "
434 "See cgroup.freeze of cgroup v2\n");
04a4ec32 435 freeze = true;
78f6519e 436 } else
3b1b3f6e 437 return -EINVAL;
dc52ddc0 438
451af504
TH
439 freezer_change_state(css_freezer(of_css(of)), freeze);
440 return nbytes;
dc52ddc0
MH
441}
442
182446d0
TH
443static u64 freezer_self_freezing_read(struct cgroup_subsys_state *css,
444 struct cftype *cft)
a2252180 445{
182446d0 446 struct freezer *freezer = css_freezer(css);
a2252180
TH
447
448 return (bool)(freezer->state & CGROUP_FREEZING_SELF);
449}
450
182446d0
TH
451static u64 freezer_parent_freezing_read(struct cgroup_subsys_state *css,
452 struct cftype *cft)
a2252180 453{
182446d0 454 struct freezer *freezer = css_freezer(css);
a2252180
TH
455
456 return (bool)(freezer->state & CGROUP_FREEZING_PARENT);
457}
458
dc52ddc0
MH
459static struct cftype files[] = {
460 {
461 .name = "state",
4baf6e33 462 .flags = CFTYPE_NOT_ON_ROOT,
2da8ca82 463 .seq_show = freezer_read,
451af504 464 .write = freezer_write,
dc52ddc0 465 },
a2252180
TH
466 {
467 .name = "self_freezing",
468 .flags = CFTYPE_NOT_ON_ROOT,
469 .read_u64 = freezer_self_freezing_read,
470 },
471 {
472 .name = "parent_freezing",
473 .flags = CFTYPE_NOT_ON_ROOT,
474 .read_u64 = freezer_parent_freezing_read,
475 },
4baf6e33 476 { } /* terminate */
dc52ddc0
MH
477};
478
073219e9 479struct cgroup_subsys freezer_cgrp_subsys = {
92fb9748
TH
480 .css_alloc = freezer_css_alloc,
481 .css_online = freezer_css_online,
482 .css_offline = freezer_css_offline,
483 .css_free = freezer_css_free,
8755ade6 484 .attach = freezer_attach,
dc52ddc0 485 .fork = freezer_fork,
5577964e 486 .legacy_cftypes = files,
dc52ddc0 487};