2 * cgroup_freezer.c - control group freezer subsystem
4 * Copyright IBM Corporation, 2007
6 * Author : Cedric Le Goater <clg@fr.ibm.com>
8 * This program is free software; you can redistribute it and/or modify it
9 * under the terms of version 2.1 of the GNU Lesser General Public License
10 * as published by the Free Software Foundation.
12 * This program is distributed in the hope that it would be useful, but
13 * WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
17 #include <linux/export.h>
18 #include <linux/slab.h>
19 #include <linux/cgroup.h>
21 #include <linux/uaccess.h>
22 #include <linux/freezer.h>
23 #include <linux/seq_file.h>
26 * A cgroup is freezing if any FREEZING flags are set. FREEZING_SELF is
27 * set if "FROZEN" is written to freezer.state cgroupfs file, and cleared
28 * for "THAWED". FREEZING_PARENT is set if the parent freezer is FREEZING
29 * for whatever reason. IOW, a cgroup has FREEZING_PARENT set if one of
30 * its ancestors has FREEZING_SELF set.
32 enum freezer_state_flags {
33 CGROUP_FREEZER_ONLINE = (1 << 0), /* freezer is fully online */
34 CGROUP_FREEZING_SELF = (1 << 1), /* this freezer is freezing */
35 CGROUP_FREEZING_PARENT = (1 << 2), /* the parent freezer is freezing */
36 CGROUP_FROZEN = (1 << 3), /* this and its descendants frozen */
38 /* mask for all FREEZING flags */
39 CGROUP_FREEZING = CGROUP_FREEZING_SELF | CGROUP_FREEZING_PARENT,
43 struct cgroup_subsys_state css;
48 static inline struct freezer *cgroup_freezer(struct cgroup *cgroup)
50 return container_of(cgroup_subsys_state(cgroup, freezer_subsys_id),
54 static inline struct freezer *task_freezer(struct task_struct *task)
56 return container_of(task_subsys_state(task, freezer_subsys_id),
60 static struct freezer *parent_freezer(struct freezer *freezer)
62 struct cgroup *pcg = freezer->css.cgroup->parent;
65 return cgroup_freezer(pcg);
69 bool cgroup_freezing(struct task_struct *task)
74 ret = task_freezer(task)->state & CGROUP_FREEZING;
81 * cgroups_write_string() limits the size of freezer state strings to
82 * CGROUP_LOCAL_BUFFER_SIZE
84 static const char *freezer_state_strs(unsigned int state)
86 if (state & CGROUP_FROZEN)
88 if (state & CGROUP_FREEZING)
93 struct cgroup_subsys freezer_subsys;
95 static struct cgroup_subsys_state *freezer_css_alloc(struct cgroup *cgroup)
97 struct freezer *freezer;
99 freezer = kzalloc(sizeof(struct freezer), GFP_KERNEL);
101 return ERR_PTR(-ENOMEM);
103 spin_lock_init(&freezer->lock);
104 return &freezer->css;
108 * freezer_css_online - commit creation of a freezer cgroup
109 * @cgroup: cgroup being created
111 * We're committing to creation of @cgroup. Mark it online and inherit
112 * parent's freezing state while holding both parent's and our
115 static int freezer_css_online(struct cgroup *cgroup)
117 struct freezer *freezer = cgroup_freezer(cgroup);
118 struct freezer *parent = parent_freezer(freezer);
121 * The following double locking and freezing state inheritance
122 * guarantee that @cgroup can never escape ancestors' freezing
123 * states. See cgroup_for_each_descendant_pre() for details.
126 spin_lock_irq(&parent->lock);
127 spin_lock_nested(&freezer->lock, SINGLE_DEPTH_NESTING);
129 freezer->state |= CGROUP_FREEZER_ONLINE;
131 if (parent && (parent->state & CGROUP_FREEZING)) {
132 freezer->state |= CGROUP_FREEZING_PARENT | CGROUP_FROZEN;
133 atomic_inc(&system_freezing_cnt);
136 spin_unlock(&freezer->lock);
138 spin_unlock_irq(&parent->lock);
144 * freezer_css_offline - initiate destruction of @cgroup
145 * @cgroup: cgroup being destroyed
147 * @cgroup is going away. Mark it dead and decrement system_freezing_count
148 * if it was holding one.
150 static void freezer_css_offline(struct cgroup *cgroup)
152 struct freezer *freezer = cgroup_freezer(cgroup);
154 spin_lock_irq(&freezer->lock);
156 if (freezer->state & CGROUP_FREEZING)
157 atomic_dec(&system_freezing_cnt);
161 spin_unlock_irq(&freezer->lock);
164 static void freezer_css_free(struct cgroup *cgroup)
166 kfree(cgroup_freezer(cgroup));
170 * Tasks can be migrated into a different freezer anytime regardless of its
171 * current state. freezer_attach() is responsible for making new tasks
172 * conform to the current state.
174 * Freezer state changes and task migration are synchronized via
175 * @freezer->lock. freezer_attach() makes the new tasks conform to the
176 * current state and all following state changes can see the new tasks.
178 static void freezer_attach(struct cgroup *new_cgrp, struct cgroup_taskset *tset)
180 struct freezer *freezer = cgroup_freezer(new_cgrp);
181 struct task_struct *task;
182 bool clear_frozen = false;
184 spin_lock_irq(&freezer->lock);
187 * Make the new tasks conform to the current state of @new_cgrp.
188 * For simplicity, when migrating any task to a FROZEN cgroup, we
189 * revert it to FREEZING and let update_if_frozen() determine the
190 * correct state later.
192 * Tasks in @tset are on @new_cgrp but may not conform to its
193 * current state before executing the following - !frozen tasks may
194 * be visible in a FROZEN cgroup and frozen tasks in a THAWED one.
196 cgroup_taskset_for_each(task, new_cgrp, tset) {
197 if (!(freezer->state & CGROUP_FREEZING)) {
201 freezer->state &= ~CGROUP_FROZEN;
206 spin_unlock_irq(&freezer->lock);
209 * Propagate FROZEN clearing upwards. We may race with
210 * update_if_frozen(), but as long as both work bottom-up, either
211 * update_if_frozen() sees child's FROZEN cleared or we clear the
212 * parent's FROZEN later. No parent w/ !FROZEN children can be
215 while (clear_frozen && (freezer = parent_freezer(freezer))) {
216 spin_lock_irq(&freezer->lock);
217 freezer->state &= ~CGROUP_FROZEN;
218 clear_frozen = freezer->state & CGROUP_FREEZING;
219 spin_unlock_irq(&freezer->lock);
223 static void freezer_fork(struct task_struct *task)
225 struct freezer *freezer;
228 freezer = task_freezer(task);
231 * The root cgroup is non-freezable, so we can skip the
234 if (!freezer->css.cgroup->parent)
237 spin_lock_irq(&freezer->lock);
238 if (freezer->state & CGROUP_FREEZING)
240 spin_unlock_irq(&freezer->lock);
246 * update_if_frozen - update whether a cgroup finished freezing
247 * @cgroup: cgroup of interest
249 * Once FREEZING is initiated, transition to FROZEN is lazily updated by
250 * calling this function. If the current state is FREEZING but not FROZEN,
251 * this function checks whether all tasks of this cgroup and the descendant
252 * cgroups finished freezing and, if so, sets FROZEN.
254 * The caller is responsible for grabbing RCU read lock and calling
255 * update_if_frozen() on all descendants prior to invoking this function.
257 * Task states and freezer state might disagree while tasks are being
258 * migrated into or out of @cgroup, so we can't verify task states against
259 * @freezer state here. See freezer_attach() for details.
261 static void update_if_frozen(struct cgroup *cgroup)
263 struct freezer *freezer = cgroup_freezer(cgroup);
265 struct cgroup_iter it;
266 struct task_struct *task;
268 WARN_ON_ONCE(!rcu_read_lock_held());
270 spin_lock_irq(&freezer->lock);
272 if (!(freezer->state & CGROUP_FREEZING) ||
273 (freezer->state & CGROUP_FROZEN))
276 /* are all (live) children frozen? */
277 cgroup_for_each_child(pos, cgroup) {
278 struct freezer *child = cgroup_freezer(pos);
280 if ((child->state & CGROUP_FREEZER_ONLINE) &&
281 !(child->state & CGROUP_FROZEN))
285 /* are all tasks frozen? */
286 cgroup_iter_start(cgroup, &it);
288 while ((task = cgroup_iter_next(cgroup, &it))) {
289 if (freezing(task)) {
291 * freezer_should_skip() indicates that the task
292 * should be skipped when determining freezing
293 * completion. Consider it frozen in addition to
294 * the usual frozen condition.
296 if (!frozen(task) && !freezer_should_skip(task))
301 freezer->state |= CGROUP_FROZEN;
303 cgroup_iter_end(cgroup, &it);
305 spin_unlock_irq(&freezer->lock);
308 static int freezer_read(struct cgroup *cgroup, struct cftype *cft,
315 /* update states bottom-up */
316 cgroup_for_each_descendant_post(pos, cgroup)
317 update_if_frozen(pos);
318 update_if_frozen(cgroup);
322 seq_puts(m, freezer_state_strs(cgroup_freezer(cgroup)->state));
327 static void freeze_cgroup(struct freezer *freezer)
329 struct cgroup *cgroup = freezer->css.cgroup;
330 struct cgroup_iter it;
331 struct task_struct *task;
333 cgroup_iter_start(cgroup, &it);
334 while ((task = cgroup_iter_next(cgroup, &it)))
336 cgroup_iter_end(cgroup, &it);
339 static void unfreeze_cgroup(struct freezer *freezer)
341 struct cgroup *cgroup = freezer->css.cgroup;
342 struct cgroup_iter it;
343 struct task_struct *task;
345 cgroup_iter_start(cgroup, &it);
346 while ((task = cgroup_iter_next(cgroup, &it)))
348 cgroup_iter_end(cgroup, &it);
352 * freezer_apply_state - apply state change to a single cgroup_freezer
353 * @freezer: freezer to apply state change to
354 * @freeze: whether to freeze or unfreeze
355 * @state: CGROUP_FREEZING_* flag to set or clear
357 * Set or clear @state on @cgroup according to @freeze, and perform
358 * freezing or thawing as necessary.
360 static void freezer_apply_state(struct freezer *freezer, bool freeze,
363 /* also synchronizes against task migration, see freezer_attach() */
364 lockdep_assert_held(&freezer->lock);
366 if (!(freezer->state & CGROUP_FREEZER_ONLINE))
370 if (!(freezer->state & CGROUP_FREEZING))
371 atomic_inc(&system_freezing_cnt);
372 freezer->state |= state;
373 freeze_cgroup(freezer);
375 bool was_freezing = freezer->state & CGROUP_FREEZING;
377 freezer->state &= ~state;
379 if (!(freezer->state & CGROUP_FREEZING)) {
381 atomic_dec(&system_freezing_cnt);
382 freezer->state &= ~CGROUP_FROZEN;
383 unfreeze_cgroup(freezer);
389 * freezer_change_state - change the freezing state of a cgroup_freezer
390 * @freezer: freezer of interest
391 * @freeze: whether to freeze or thaw
393 * Freeze or thaw @freezer according to @freeze. The operations are
394 * recursive - all descendants of @freezer will be affected.
396 static void freezer_change_state(struct freezer *freezer, bool freeze)
400 /* update @freezer */
401 spin_lock_irq(&freezer->lock);
402 freezer_apply_state(freezer, freeze, CGROUP_FREEZING_SELF);
403 spin_unlock_irq(&freezer->lock);
406 * Update all its descendants in pre-order traversal. Each
407 * descendant will try to inherit its parent's FREEZING state as
408 * CGROUP_FREEZING_PARENT.
411 cgroup_for_each_descendant_pre(pos, freezer->css.cgroup) {
412 struct freezer *pos_f = cgroup_freezer(pos);
413 struct freezer *parent = parent_freezer(pos_f);
416 * Our update to @parent->state is already visible which is
417 * all we need. No need to lock @parent. For more info on
418 * synchronization, see freezer_post_create().
420 spin_lock_irq(&pos_f->lock);
421 freezer_apply_state(pos_f, parent->state & CGROUP_FREEZING,
422 CGROUP_FREEZING_PARENT);
423 spin_unlock_irq(&pos_f->lock);
428 static int freezer_write(struct cgroup *cgroup, struct cftype *cft,
433 if (strcmp(buffer, freezer_state_strs(0)) == 0)
435 else if (strcmp(buffer, freezer_state_strs(CGROUP_FROZEN)) == 0)
440 freezer_change_state(cgroup_freezer(cgroup), freeze);
444 static u64 freezer_self_freezing_read(struct cgroup *cgroup, struct cftype *cft)
446 struct freezer *freezer = cgroup_freezer(cgroup);
448 return (bool)(freezer->state & CGROUP_FREEZING_SELF);
451 static u64 freezer_parent_freezing_read(struct cgroup *cgroup, struct cftype *cft)
453 struct freezer *freezer = cgroup_freezer(cgroup);
455 return (bool)(freezer->state & CGROUP_FREEZING_PARENT);
458 static struct cftype files[] = {
461 .flags = CFTYPE_NOT_ON_ROOT,
462 .read_seq_string = freezer_read,
463 .write_string = freezer_write,
466 .name = "self_freezing",
467 .flags = CFTYPE_NOT_ON_ROOT,
468 .read_u64 = freezer_self_freezing_read,
471 .name = "parent_freezing",
472 .flags = CFTYPE_NOT_ON_ROOT,
473 .read_u64 = freezer_parent_freezing_read,
478 struct cgroup_subsys freezer_subsys = {
480 .css_alloc = freezer_css_alloc,
481 .css_online = freezer_css_online,
482 .css_offline = freezer_css_offline,
483 .css_free = freezer_css_free,
484 .subsys_id = freezer_subsys_id,
485 .attach = freezer_attach,
486 .fork = freezer_fork,
487 .base_cftypes = files,