Merge tag 'net-6.17-rc7' of git://git.kernel.org/pub/scm/linux/kernel/git/netdev/net
[linux-2.6-block.git] / kernel / cgroup / legacy_freezer.c
CommitLineData
dc52ddc0
MH
1/*
2 * cgroup_freezer.c - control group freezer subsystem
3 *
4 * Copyright IBM Corporation, 2007
5 *
6 * Author : Cedric Le Goater <clg@fr.ibm.com>
7 *
8 * This program is free software; you can redistribute it and/or modify it
9 * under the terms of version 2.1 of the GNU Lesser General Public License
10 * as published by the Free Software Foundation.
11 *
12 * This program is distributed in the hope that it would be useful, but
13 * WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
15 */
16
9984de1a 17#include <linux/export.h>
5a0e3ad6 18#include <linux/slab.h>
dc52ddc0
MH
19#include <linux/cgroup.h>
20#include <linux/fs.h>
21#include <linux/uaccess.h>
22#include <linux/freezer.h>
23#include <linux/seq_file.h>
e5ced8eb 24#include <linux/mutex.h>
57dcd64c 25#include <linux/cpu.h>
dc52ddc0 26
ef9fe980
TH
/*
 * State bits kept in freezer->state.
 *
 * A cgroup counts as "freezing" while at least one FREEZING bit is set.
 * FREEZING_SELF is set when "FROZEN" is written to the cgroup's
 * freezer.state file and cleared again by "THAWED".  FREEZING_PARENT is
 * set while the parent freezer is FREEZING for any reason, i.e. while
 * some ancestor has FREEZING_SELF set.
 */
enum freezer_state_flags {
	/* freezer is fully online */
	CGROUP_FREEZER_ONLINE	= 1 << 0,
	/* this freezer is freezing */
	CGROUP_FREEZING_SELF	= 1 << 1,
	/* the parent freezer is freezing */
	CGROUP_FREEZING_PARENT	= 1 << 2,
	/* this and its descendants frozen */
	CGROUP_FROZEN		= 1 << 3,

	/* union of every FREEZING bit */
	CGROUP_FREEZING		= CGROUP_FREEZING_PARENT | CGROUP_FREEZING_SELF,
};
43
44struct freezer {
bcd66c89 45 struct cgroup_subsys_state css;
d6a2fe13 46 unsigned int state;
dc52ddc0
MH
47};
48
e5ced8eb
TH
/* Held around every modification of freezer->state made in this file. */
static DEFINE_MUTEX(freezer_mutex);
50
a7c6d554
TH
51static inline struct freezer *css_freezer(struct cgroup_subsys_state *css)
52{
53 return css ? container_of(css, struct freezer, css) : NULL;
54}
55
dc52ddc0
MH
56static inline struct freezer *task_freezer(struct task_struct *task)
57{
073219e9 58 return css_freezer(task_css(task, freezer_cgrp_id));
dc52ddc0
MH
59}
60
ef9fe980
TH
61static struct freezer *parent_freezer(struct freezer *freezer)
62{
5c9d535b 63 return css_freezer(freezer->css.parent);
ef9fe980
TH
64}
65
22b4e111 66bool cgroup_freezing(struct task_struct *task)
dc52ddc0 67{
22b4e111 68 bool ret;
dc52ddc0 69
22b4e111 70 rcu_read_lock();
14a67b42 71 ret = task_freezer(task)->state & CGROUP_FREEZING;
22b4e111
TH
72 rcu_read_unlock();
73
74 return ret;
dc52ddc0
MH
75}
76
d6a2fe13
TH
77static const char *freezer_state_strs(unsigned int state)
78{
79 if (state & CGROUP_FROZEN)
80 return "FROZEN";
81 if (state & CGROUP_FREEZING)
82 return "FREEZING";
83 return "THAWED";
dc52ddc0
MH
84};
85
eb95419b
TH
86static struct cgroup_subsys_state *
87freezer_css_alloc(struct cgroup_subsys_state *parent_css)
dc52ddc0
MH
88{
89 struct freezer *freezer;
90
91 freezer = kzalloc(sizeof(struct freezer), GFP_KERNEL);
92 if (!freezer)
93 return ERR_PTR(-ENOMEM);
94
dc52ddc0
MH
95 return &freezer->css;
96}
97
5300a9b3 98/**
eb95419b
TH
99 * freezer_css_online - commit creation of a freezer css
100 * @css: css being created
5300a9b3 101 *
eb95419b 102 * We're committing to creation of @css. Mark it online and inherit
a6b8daba 103 * parent's freezing state while holding cpus read lock and freezer_mutex.
5300a9b3 104 */
eb95419b 105static int freezer_css_online(struct cgroup_subsys_state *css)
dc52ddc0 106{
eb95419b 107 struct freezer *freezer = css_freezer(css);
ef9fe980
TH
108 struct freezer *parent = parent_freezer(freezer);
109
f0cc7492 110 cpus_read_lock();
e5ced8eb 111 mutex_lock(&freezer_mutex);
a3201227 112
5300a9b3 113 freezer->state |= CGROUP_FREEZER_ONLINE;
ef9fe980
TH
114
115 if (parent && (parent->state & CGROUP_FREEZING)) {
116 freezer->state |= CGROUP_FREEZING_PARENT | CGROUP_FROZEN;
f0cc7492 117 static_branch_inc_cpuslocked(&freezer_active);
ef9fe980
TH
118 }
119
e5ced8eb 120 mutex_unlock(&freezer_mutex);
f0cc7492 121 cpus_read_unlock();
b1929db4 122 return 0;
5300a9b3
TH
123}
124
125/**
eb95419b
TH
126 * freezer_css_offline - initiate destruction of a freezer css
127 * @css: css being destroyed
5300a9b3 128 *
f71bfbe1 129 * @css is going away. Mark it dead and decrement freezer_active if
eb95419b 130 * it was holding one.
5300a9b3 131 */
eb95419b 132static void freezer_css_offline(struct cgroup_subsys_state *css)
5300a9b3 133{
eb95419b 134 struct freezer *freezer = css_freezer(css);
5300a9b3 135
f0cc7492 136 cpus_read_lock();
e5ced8eb 137 mutex_lock(&freezer_mutex);
5300a9b3 138
d6a2fe13 139 if (freezer->state & CGROUP_FREEZING)
f0cc7492 140 static_branch_dec_cpuslocked(&freezer_active);
5300a9b3
TH
141
142 freezer->state = 0;
143
e5ced8eb 144 mutex_unlock(&freezer_mutex);
f0cc7492 145 cpus_read_unlock();
5300a9b3
TH
146}
147
/* Release the freezer that embeds @css. */
static void freezer_css_free(struct cgroup_subsys_state *css)
{
	struct freezer *freezer = css_freezer(css);

	kfree(freezer);
}
152
957a4eea 153/*
ead5c473
TH
154 * Tasks can be migrated into a different freezer anytime regardless of its
155 * current state. freezer_attach() is responsible for making new tasks
156 * conform to the current state.
157 *
158 * Freezer state changes and task migration are synchronized via
159 * @freezer->lock. freezer_attach() makes the new tasks conform to the
160 * current state and all following state changes can see the new tasks.
957a4eea 161 */
1f7dd3e5 162static void freezer_attach(struct cgroup_taskset *tset)
dc52ddc0 163{
bb9d97b6 164 struct task_struct *task;
1f7dd3e5 165 struct cgroup_subsys_state *new_css;
957a4eea 166
e5ced8eb 167 mutex_lock(&freezer_mutex);
8755ade6 168
80a6a2cf 169 /*
eb95419b 170 * Make the new tasks conform to the current state of @new_css.
8755ade6
TH
171 * For simplicity, when migrating any task to a FROZEN cgroup, we
172 * revert it to FREEZING and let update_if_frozen() determine the
173 * correct state later.
174 *
eb95419b 175 * Tasks in @tset are on @new_css but may not conform to its
8755ade6
TH
176 * current state before executing the following - !frozen tasks may
177 * be visible in a FROZEN cgroup and frozen tasks in a THAWED one.
80a6a2cf 178 */
1f7dd3e5 179 cgroup_taskset_for_each(task, new_css, tset) {
599c963a
TH
180 struct freezer *freezer = css_freezer(new_css);
181
d6a2fe13 182 if (!(freezer->state & CGROUP_FREEZING)) {
8755ade6
TH
183 __thaw_task(task);
184 } else {
599c963a
TH
185 /* clear FROZEN and propagate upwards */
186 while (freezer && (freezer->state & CGROUP_FROZEN)) {
187 freezer->state &= ~CGROUP_FROZEN;
188 freezer = parent_freezer(freezer);
189 }
37fb58a7 190 freeze_task(task);
8755ade6
TH
191 }
192 }
dc52ddc0 193
e5ced8eb 194 mutex_unlock(&freezer_mutex);
f780bdb7
BB
195}
196
a60bed29
TH
197/**
198 * freezer_fork - cgroup post fork callback
199 * @task: a task which has just been forked
200 *
201 * @task has just been created and should conform to the current state of
202 * the cgroup_freezer it belongs to. This function may race against
203 * freezer_attach(). Losing to freezer_attach() means that we don't have
204 * to do anything as freezer_attach() will put @task into the appropriate
205 * state.
206 */
b53202e6 207static void freezer_fork(struct task_struct *task)
dc52ddc0
MH
208{
209 struct freezer *freezer;
210
3b1b3f6e 211 /*
a60bed29
TH
212 * The root cgroup is non-freezable, so we can skip locking the
213 * freezer. This is safe regardless of race with task migration.
214 * If we didn't race or won, skipping is obviously the right thing
215 * to do. If we lost and root is the new cgroup, noop is still the
216 * right thing to do.
3b1b3f6e 217 */
e5ced8eb
TH
218 if (task_css_is_root(task, freezer_cgrp_id))
219 return;
3b1b3f6e 220
e5ced8eb
TH
221 mutex_lock(&freezer_mutex);
222 rcu_read_lock();
223
224 freezer = task_freezer(task);
225 if (freezer->state & CGROUP_FREEZING)
839e3407 226 freeze_task(task);
e5ced8eb 227
5edee61e 228 rcu_read_unlock();
e5ced8eb 229 mutex_unlock(&freezer_mutex);
dc52ddc0
MH
230}
231
ef9fe980
TH
232/**
233 * update_if_frozen - update whether a cgroup finished freezing
182446d0 234 * @css: css of interest
ef9fe980
TH
235 *
236 * Once FREEZING is initiated, transition to FROZEN is lazily updated by
237 * calling this function. If the current state is FREEZING but not FROZEN,
238 * this function checks whether all tasks of this cgroup and the descendant
239 * cgroups finished freezing and, if so, sets FROZEN.
240 *
241 * The caller is responsible for grabbing RCU read lock and calling
242 * update_if_frozen() on all descendants prior to invoking this function.
b4d18311
TH
243 *
244 * Task states and freezer state might disagree while tasks are being
182446d0 245 * migrated into or out of @css, so we can't verify task states against
ead5c473 246 * @freezer state here. See freezer_attach() for details.
dc52ddc0 247 */
182446d0 248static void update_if_frozen(struct cgroup_subsys_state *css)
dc52ddc0 249{
182446d0 250 struct freezer *freezer = css_freezer(css);
492eb21b 251 struct cgroup_subsys_state *pos;
72ec7029 252 struct css_task_iter it;
dc52ddc0 253 struct task_struct *task;
b4d18311 254
e5ced8eb 255 lockdep_assert_held(&freezer_mutex);
ef9fe980 256
d6a2fe13
TH
257 if (!(freezer->state & CGROUP_FREEZING) ||
258 (freezer->state & CGROUP_FROZEN))
e5ced8eb 259 return;
ef9fe980
TH
260
261 /* are all (live) children frozen? */
e5ced8eb 262 rcu_read_lock();
492eb21b
TH
263 css_for_each_child(pos, css) {
264 struct freezer *child = css_freezer(pos);
dc52ddc0 265
ef9fe980 266 if ((child->state & CGROUP_FREEZER_ONLINE) &&
36e9d2eb
TH
267 !(child->state & CGROUP_FROZEN)) {
268 rcu_read_unlock();
e5ced8eb 269 return;
36e9d2eb 270 }
ef9fe980 271 }
e5ced8eb 272 rcu_read_unlock();
ef9fe980
TH
273
274 /* are all tasks frozen? */
bc2fb7ed 275 css_task_iter_start(css, 0, &it);
b4d18311 276
72ec7029 277 while ((task = css_task_iter_next(&it))) {
f5d39b02
PZ
278 if (freezing(task) && !frozen(task))
279 goto out_iter_end;
dc52ddc0
MH
280 }
281
d6a2fe13 282 freezer->state |= CGROUP_FROZEN;
ef9fe980 283out_iter_end:
72ec7029 284 css_task_iter_end(&it);
dc52ddc0
MH
285}
286
2da8ca82 287static int freezer_read(struct seq_file *m, void *v)
dc52ddc0 288{
2da8ca82 289 struct cgroup_subsys_state *css = seq_css(m), *pos;
dc52ddc0 290
e5ced8eb 291 mutex_lock(&freezer_mutex);
ef9fe980 292 rcu_read_lock();
dc52ddc0 293
ef9fe980 294 /* update states bottom-up */
e5ced8eb 295 css_for_each_descendant_post(pos, css) {
ec903c0c 296 if (!css_tryget_online(pos))
e5ced8eb
TH
297 continue;
298 rcu_read_unlock();
299
492eb21b 300 update_if_frozen(pos);
ef9fe980 301
e5ced8eb
TH
302 rcu_read_lock();
303 css_put(pos);
304 }
305
ef9fe980 306 rcu_read_unlock();
e5ced8eb 307 mutex_unlock(&freezer_mutex);
ef9fe980 308
182446d0 309 seq_puts(m, freezer_state_strs(css_freezer(css)->state));
dc52ddc0
MH
310 seq_putc(m, '\n');
311 return 0;
312}
313
bcd66c89 314static void freeze_cgroup(struct freezer *freezer)
dc52ddc0 315{
72ec7029 316 struct css_task_iter it;
dc52ddc0 317 struct task_struct *task;
dc52ddc0 318
bc2fb7ed 319 css_task_iter_start(&freezer->css, 0, &it);
72ec7029 320 while ((task = css_task_iter_next(&it)))
51f246ed 321 freeze_task(task);
72ec7029 322 css_task_iter_end(&it);
dc52ddc0
MH
323}
324
bcd66c89 325static void unfreeze_cgroup(struct freezer *freezer)
dc52ddc0 326{
72ec7029 327 struct css_task_iter it;
dc52ddc0
MH
328 struct task_struct *task;
329
bc2fb7ed 330 css_task_iter_start(&freezer->css, 0, &it);
72ec7029 331 while ((task = css_task_iter_next(&it)))
a5be2d0d 332 __thaw_task(task);
72ec7029 333 css_task_iter_end(&it);
dc52ddc0
MH
334}
335
04a4ec32
TH
336/**
337 * freezer_apply_state - apply state change to a single cgroup_freezer
338 * @freezer: freezer to apply state change to
339 * @freeze: whether to freeze or unfreeze
a2252180
TH
340 * @state: CGROUP_FREEZING_* flag to set or clear
341 *
342 * Set or clear @state on @cgroup according to @freeze, and perform
343 * freezing or thawing as necessary.
04a4ec32 344 */
a2252180
TH
345static void freezer_apply_state(struct freezer *freezer, bool freeze,
346 unsigned int state)
dc52ddc0 347{
ead5c473 348 /* also synchronizes against task migration, see freezer_attach() */
e5ced8eb 349 lockdep_assert_held(&freezer_mutex);
51308ee5 350
5300a9b3
TH
351 if (!(freezer->state & CGROUP_FREEZER_ONLINE))
352 return;
353
04a4ec32 354 if (freeze) {
d6a2fe13 355 if (!(freezer->state & CGROUP_FREEZING))
57dcd64c 356 static_branch_inc_cpuslocked(&freezer_active);
a2252180 357 freezer->state |= state;
bcd66c89 358 freeze_cgroup(freezer);
04a4ec32 359 } else {
a2252180
TH
360 bool was_freezing = freezer->state & CGROUP_FREEZING;
361
362 freezer->state &= ~state;
363
364 if (!(freezer->state & CGROUP_FREEZING)) {
a2252180 365 freezer->state &= ~CGROUP_FROZEN;
f5d39b02 366 if (was_freezing)
57dcd64c 367 static_branch_dec_cpuslocked(&freezer_active);
a2252180
TH
368 unfreeze_cgroup(freezer);
369 }
dc52ddc0 370 }
04a4ec32 371}
22b4e111 372
04a4ec32
TH
373/**
374 * freezer_change_state - change the freezing state of a cgroup_freezer
375 * @freezer: freezer of interest
376 * @freeze: whether to freeze or thaw
377 *
ef9fe980
TH
378 * Freeze or thaw @freezer according to @freeze. The operations are
379 * recursive - all descendants of @freezer will be affected.
04a4ec32
TH
380 */
381static void freezer_change_state(struct freezer *freezer, bool freeze)
382{
492eb21b 383 struct cgroup_subsys_state *pos;
ef9fe980 384
57dcd64c 385 cpus_read_lock();
ef9fe980
TH
386 /*
387 * Update all its descendants in pre-order traversal. Each
388 * descendant will try to inherit its parent's FREEZING state as
389 * CGROUP_FREEZING_PARENT.
390 */
e5ced8eb 391 mutex_lock(&freezer_mutex);
ef9fe980 392 rcu_read_lock();
492eb21b
TH
393 css_for_each_descendant_pre(pos, &freezer->css) {
394 struct freezer *pos_f = css_freezer(pos);
ef9fe980
TH
395 struct freezer *parent = parent_freezer(pos_f);
396
ec903c0c 397 if (!css_tryget_online(pos))
e5ced8eb
TH
398 continue;
399 rcu_read_unlock();
bd8815a6 400
e5ced8eb 401 if (pos_f == freezer)
bd8815a6
TH
402 freezer_apply_state(pos_f, freeze,
403 CGROUP_FREEZING_SELF);
e5ced8eb 404 else
bd8815a6
TH
405 freezer_apply_state(pos_f,
406 parent->state & CGROUP_FREEZING,
407 CGROUP_FREEZING_PARENT);
bd8815a6 408
e5ced8eb
TH
409 rcu_read_lock();
410 css_put(pos);
ef9fe980
TH
411 }
412 rcu_read_unlock();
e5ced8eb 413 mutex_unlock(&freezer_mutex);
57dcd64c 414 cpus_read_unlock();
dc52ddc0
MH
415}
416
451af504
TH
417static ssize_t freezer_write(struct kernfs_open_file *of,
418 char *buf, size_t nbytes, loff_t off)
dc52ddc0 419{
04a4ec32 420 bool freeze;
dc52ddc0 421
451af504
TH
422 buf = strstrip(buf);
423
424 if (strcmp(buf, freezer_state_strs(0)) == 0)
04a4ec32 425 freeze = false;
78f6519e
MK
426 else if (strcmp(buf, freezer_state_strs(CGROUP_FROZEN)) == 0) {
427 pr_info_once("Freezing with imperfect legacy cgroup freezer. "
428 "See cgroup.freeze of cgroup v2\n");
04a4ec32 429 freeze = true;
78f6519e 430 } else
3b1b3f6e 431 return -EINVAL;
dc52ddc0 432
451af504
TH
433 freezer_change_state(css_freezer(of_css(of)), freeze);
434 return nbytes;
dc52ddc0
MH
435}
436
182446d0
TH
437static u64 freezer_self_freezing_read(struct cgroup_subsys_state *css,
438 struct cftype *cft)
a2252180 439{
182446d0 440 struct freezer *freezer = css_freezer(css);
a2252180
TH
441
442 return (bool)(freezer->state & CGROUP_FREEZING_SELF);
443}
444
182446d0
TH
445static u64 freezer_parent_freezing_read(struct cgroup_subsys_state *css,
446 struct cftype *cft)
a2252180 447{
182446d0 448 struct freezer *freezer = css_freezer(css);
a2252180
TH
449
450 return (bool)(freezer->state & CGROUP_FREEZING_PARENT);
451}
452
dc52ddc0
MH
453static struct cftype files[] = {
454 {
455 .name = "state",
4baf6e33 456 .flags = CFTYPE_NOT_ON_ROOT,
2da8ca82 457 .seq_show = freezer_read,
451af504 458 .write = freezer_write,
dc52ddc0 459 },
a2252180
TH
460 {
461 .name = "self_freezing",
462 .flags = CFTYPE_NOT_ON_ROOT,
463 .read_u64 = freezer_self_freezing_read,
464 },
465 {
466 .name = "parent_freezing",
467 .flags = CFTYPE_NOT_ON_ROOT,
468 .read_u64 = freezer_parent_freezing_read,
469 },
4baf6e33 470 { } /* terminate */
dc52ddc0
MH
471};
472
073219e9 473struct cgroup_subsys freezer_cgrp_subsys = {
92fb9748
TH
474 .css_alloc = freezer_css_alloc,
475 .css_online = freezer_css_online,
476 .css_offline = freezer_css_offline,
477 .css_free = freezer_css_free,
8755ade6 478 .attach = freezer_attach,
dc52ddc0 479 .fork = freezer_fork,
5577964e 480 .legacy_cftypes = files,
dc52ddc0 481};