cgroup_freezer.c 12.9 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16
/*
 * cgroup_freezer.c -  control group freezer subsystem
 *
 * Copyright IBM Corporation, 2007
 *
 * Author : Cedric Le Goater <clg@fr.ibm.com>
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms of version 2.1 of the GNU Lesser General Public License
 * as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it would be useful, but
 * WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
 */

17
#include <linux/export.h>
18
#include <linux/slab.h>
19 20 21 22 23 24
#include <linux/cgroup.h>
#include <linux/fs.h>
#include <linux/uaccess.h>
#include <linux/freezer.h>
#include <linux/seq_file.h>

25 26 27 28 29 30 31
/*
 * A cgroup is freezing if any FREEZING flags are set.  FREEZING_SELF is
 * set if "FROZEN" is written to freezer.state cgroupfs file, and cleared
 * for "THAWED".  FREEZING_PARENT is set if the parent freezer is FREEZING
 * for whatever reason.  IOW, a cgroup has FREEZING_PARENT set if one of
 * its ancestors has FREEZING_SELF set.
 *
 * The flags are independent bits stored together in freezer->state.
 */
enum freezer_state_flags {
	CGROUP_FREEZER_ONLINE	= (1 << 0), /* freezer is fully online */
	CGROUP_FREEZING_SELF	= (1 << 1), /* this freezer is freezing */
	CGROUP_FREEZING_PARENT	= (1 << 2), /* the parent freezer is freezing */
	CGROUP_FROZEN		= (1 << 3), /* this and its descendants frozen */

	/* mask for all FREEZING flags */
	CGROUP_FREEZING		= CGROUP_FREEZING_SELF | CGROUP_FREEZING_PARENT,
};

struct freezer {
T
Tejun Heo 已提交
43
	struct cgroup_subsys_state	css;
44
	unsigned int			state;
T
Tejun Heo 已提交
45
	spinlock_t			lock;
46 47
};

48 49 50 51 52
/* Convert @css to the freezer embedding it; a NULL @css yields NULL. */
static inline struct freezer *css_freezer(struct cgroup_subsys_state *css)
{
	if (!css)
		return NULL;

	return container_of(css, struct freezer, css);
}

T
Tejun Heo 已提交
53
static inline struct freezer *cgroup_freezer(struct cgroup *cgroup)
54
{
55
	return css_freezer(cgroup_css(cgroup, freezer_subsys_id));
56 57 58 59
}

static inline struct freezer *task_freezer(struct task_struct *task)
{
60
	return css_freezer(task_css(task, freezer_subsys_id));
61 62
}

63 64
static struct freezer *parent_freezer(struct freezer *freezer)
{
T
Tejun Heo 已提交
65
	return css_freezer(css_parent(&freezer->css));
66 67
}

68
bool cgroup_freezing(struct task_struct *task)
69
{
70
	bool ret;
71

72
	rcu_read_lock();
73
	ret = task_freezer(task)->state & CGROUP_FREEZING;
74 75 76
	rcu_read_unlock();

	return ret;
77 78 79 80 81 82
}

/*
 * cgroups_write_string() limits the size of freezer state strings to
 * CGROUP_LOCAL_BUFFER_SIZE
 */
83 84 85 86 87 88 89
static const char *freezer_state_strs(unsigned int state)
{
	if (state & CGROUP_FROZEN)
		return "FROZEN";
	if (state & CGROUP_FREEZING)
		return "FREEZING";
	return "THAWED";
90 91 92 93
};

struct cgroup_subsys freezer_subsys;

94
static struct cgroup_subsys_state *freezer_css_alloc(struct cgroup *cgroup)
95 96 97 98 99 100 101 102 103 104 105
{
	struct freezer *freezer;

	freezer = kzalloc(sizeof(struct freezer), GFP_KERNEL);
	if (!freezer)
		return ERR_PTR(-ENOMEM);

	spin_lock_init(&freezer->lock);
	return &freezer->css;
}

106
/**
107
 * freezer_css_online - commit creation of a freezer cgroup
108 109
 * @cgroup: cgroup being created
 *
110 111 112
 * We're committing to creation of @cgroup.  Mark it online and inherit
 * parent's freezing state while holding both parent's and our
 * freezer->lock.
113
 */
114
static int freezer_css_online(struct cgroup *cgroup)
115
{
116
	struct freezer *freezer = cgroup_freezer(cgroup);
117 118 119 120 121 122 123 124 125 126
	struct freezer *parent = parent_freezer(freezer);

	/*
	 * The following double locking and freezing state inheritance
	 * guarantee that @cgroup can never escape ancestors' freezing
	 * states.  See cgroup_for_each_descendant_pre() for details.
	 */
	if (parent)
		spin_lock_irq(&parent->lock);
	spin_lock_nested(&freezer->lock, SINGLE_DEPTH_NESTING);
127

128
	freezer->state |= CGROUP_FREEZER_ONLINE;
129 130 131 132 133 134 135 136 137

	if (parent && (parent->state & CGROUP_FREEZING)) {
		freezer->state |= CGROUP_FREEZING_PARENT | CGROUP_FROZEN;
		atomic_inc(&system_freezing_cnt);
	}

	spin_unlock(&freezer->lock);
	if (parent)
		spin_unlock_irq(&parent->lock);
T
Tejun Heo 已提交
138 139

	return 0;
140 141 142
}

/**
143
 * freezer_css_offline - initiate destruction of @cgroup
144 145 146 147 148
 * @cgroup: cgroup being destroyed
 *
 * @cgroup is going away.  Mark it dead and decrement system_freezing_count
 * if it was holding one.
 */
149
static void freezer_css_offline(struct cgroup *cgroup)
150 151 152 153 154
{
	struct freezer *freezer = cgroup_freezer(cgroup);

	spin_lock_irq(&freezer->lock);

155
	if (freezer->state & CGROUP_FREEZING)
156
		atomic_dec(&system_freezing_cnt);
157 158 159 160 161 162

	freezer->state = 0;

	spin_unlock_irq(&freezer->lock);
}

163
/* Release the freezer allocated by freezer_css_alloc() for @cgroup. */
static void freezer_css_free(struct cgroup *cgroup)
{
	kfree(cgroup_freezer(cgroup));
}

168
/*
169 170 171 172 173 174 175
 * Tasks can be migrated into a different freezer anytime regardless of its
 * current state.  freezer_attach() is responsible for making new tasks
 * conform to the current state.
 *
 * Freezer state changes and task migration are synchronized via
 * @freezer->lock.  freezer_attach() makes the new tasks conform to the
 * current state and all following state changes can see the new tasks.
176
 */
177
static void freezer_attach(struct cgroup *new_cgrp, struct cgroup_taskset *tset)
178
{
179
	struct freezer *freezer = cgroup_freezer(new_cgrp);
180
	struct task_struct *task;
181
	bool clear_frozen = false;
182

183 184
	spin_lock_irq(&freezer->lock);

185
	/*
186 187 188 189 190 191 192 193
	 * Make the new tasks conform to the current state of @new_cgrp.
	 * For simplicity, when migrating any task to a FROZEN cgroup, we
	 * revert it to FREEZING and let update_if_frozen() determine the
	 * correct state later.
	 *
	 * Tasks in @tset are on @new_cgrp but may not conform to its
	 * current state before executing the following - !frozen tasks may
	 * be visible in a FROZEN cgroup and frozen tasks in a THAWED one.
194
	 */
195
	cgroup_taskset_for_each(task, new_cgrp, tset) {
196
		if (!(freezer->state & CGROUP_FREEZING)) {
197 198 199
			__thaw_task(task);
		} else {
			freeze_task(task);
200
			freezer->state &= ~CGROUP_FROZEN;
201
			clear_frozen = true;
202 203
		}
	}
204

205
	spin_unlock_irq(&freezer->lock);
206 207 208 209 210 211 212 213 214 215 216 217 218 219

	/*
	 * Propagate FROZEN clearing upwards.  We may race with
	 * update_if_frozen(), but as long as both work bottom-up, either
	 * update_if_frozen() sees child's FROZEN cleared or we clear the
	 * parent's FROZEN later.  No parent w/ !FROZEN children can be
	 * left FROZEN.
	 */
	while (clear_frozen && (freezer = parent_freezer(freezer))) {
		spin_lock_irq(&freezer->lock);
		freezer->state &= ~CGROUP_FROZEN;
		clear_frozen = freezer->state & CGROUP_FREEZING;
		spin_unlock_irq(&freezer->lock);
	}
220 221
}

222
static void freezer_fork(struct task_struct *task)
223 224 225
{
	struct freezer *freezer;

226
	rcu_read_lock();
227 228
	freezer = task_freezer(task);

229 230 231 232
	/*
	 * The root cgroup is non-freezable, so we can skip the
	 * following check.
	 */
T
Tejun Heo 已提交
233
	if (!parent_freezer(freezer))
234
		goto out;
235

236
	spin_lock_irq(&freezer->lock);
237
	if (freezer->state & CGROUP_FREEZING)
238
		freeze_task(task);
239
	spin_unlock_irq(&freezer->lock);
240 241
out:
	rcu_read_unlock();
242 243
}

244 245 246 247 248 249 250 251 252 253 254
/**
 * update_if_frozen - update whether a cgroup finished freezing
 * @cgroup: cgroup of interest
 *
 * Once FREEZING is initiated, transition to FROZEN is lazily updated by
 * calling this function.  If the current state is FREEZING but not FROZEN,
 * this function checks whether all tasks of this cgroup and the descendant
 * cgroups finished freezing and, if so, sets FROZEN.
 *
 * The caller is responsible for grabbing RCU read lock and calling
 * update_if_frozen() on all descendants prior to invoking this function.
255 256
 *
 * Task states and freezer state might disagree while tasks are being
257 258
 * migrated into or out of @cgroup, so we can't verify task states against
 * @freezer state here.  See freezer_attach() for details.
259
 */
260
static void update_if_frozen(struct cgroup *cgroup)
261
{
262 263
	struct freezer *freezer = cgroup_freezer(cgroup);
	struct cgroup *pos;
264 265
	struct cgroup_iter it;
	struct task_struct *task;
266

267 268 269 270
	WARN_ON_ONCE(!rcu_read_lock_held());

	spin_lock_irq(&freezer->lock);

271 272
	if (!(freezer->state & CGROUP_FREEZING) ||
	    (freezer->state & CGROUP_FROZEN))
273 274 275 276 277
		goto out_unlock;

	/* are all (live) children frozen? */
	cgroup_for_each_child(pos, cgroup) {
		struct freezer *child = cgroup_freezer(pos);
278

279 280 281 282 283 284
		if ((child->state & CGROUP_FREEZER_ONLINE) &&
		    !(child->state & CGROUP_FROZEN))
			goto out_unlock;
	}

	/* are all tasks frozen? */
285
	cgroup_iter_start(cgroup, &it);
286

287
	while ((task = cgroup_iter_next(cgroup, &it))) {
288 289 290 291 292 293 294
		if (freezing(task)) {
			/*
			 * freezer_should_skip() indicates that the task
			 * should be skipped when determining freezing
			 * completion.  Consider it frozen in addition to
			 * the usual frozen condition.
			 */
295
			if (!frozen(task) && !freezer_should_skip(task))
296
				goto out_iter_end;
297
		}
298 299
	}

300
	freezer->state |= CGROUP_FROZEN;
301
out_iter_end:
302
	cgroup_iter_end(cgroup, &it);
303 304
out_unlock:
	spin_unlock_irq(&freezer->lock);
305 306 307 308 309
}

static int freezer_read(struct cgroup *cgroup, struct cftype *cft,
			struct seq_file *m)
{
310
	struct cgroup *pos;
311

312
	rcu_read_lock();
313

314 315 316 317 318 319 320 321
	/* update states bottom-up */
	cgroup_for_each_descendant_post(pos, cgroup)
		update_if_frozen(pos);
	update_if_frozen(cgroup);

	rcu_read_unlock();

	seq_puts(m, freezer_state_strs(cgroup_freezer(cgroup)->state));
322 323 324 325
	seq_putc(m, '\n');
	return 0;
}

T
Tejun Heo 已提交
326
static void freeze_cgroup(struct freezer *freezer)
327
{
T
Tejun Heo 已提交
328
	struct cgroup *cgroup = freezer->css.cgroup;
329 330 331 332
	struct cgroup_iter it;
	struct task_struct *task;

	cgroup_iter_start(cgroup, &it);
333 334
	while ((task = cgroup_iter_next(cgroup, &it)))
		freeze_task(task);
335 336 337
	cgroup_iter_end(cgroup, &it);
}

T
Tejun Heo 已提交
338
static void unfreeze_cgroup(struct freezer *freezer)
339
{
T
Tejun Heo 已提交
340
	struct cgroup *cgroup = freezer->css.cgroup;
341 342 343 344
	struct cgroup_iter it;
	struct task_struct *task;

	cgroup_iter_start(cgroup, &it);
345 346
	while ((task = cgroup_iter_next(cgroup, &it)))
		__thaw_task(task);
347 348 349
	cgroup_iter_end(cgroup, &it);
}

350 351 352 353
/**
 * freezer_apply_state - apply state change to a single cgroup_freezer
 * @freezer: freezer to apply state change to
 * @freeze: whether to freeze or unfreeze
354 355 356 357
 * @state: CGROUP_FREEZING_* flag to set or clear
 *
 * Set or clear @state on @cgroup according to @freeze, and perform
 * freezing or thawing as necessary.
358
 */
359 360
static void freezer_apply_state(struct freezer *freezer, bool freeze,
				unsigned int state)
361
{
362
	/* also synchronizes against task migration, see freezer_attach() */
363
	lockdep_assert_held(&freezer->lock);
364

365 366 367
	if (!(freezer->state & CGROUP_FREEZER_ONLINE))
		return;

368
	if (freeze) {
369
		if (!(freezer->state & CGROUP_FREEZING))
370
			atomic_inc(&system_freezing_cnt);
371
		freezer->state |= state;
T
Tejun Heo 已提交
372
		freeze_cgroup(freezer);
373
	} else {
374 375 376 377 378 379 380 381 382 383
		bool was_freezing = freezer->state & CGROUP_FREEZING;

		freezer->state &= ~state;

		if (!(freezer->state & CGROUP_FREEZING)) {
			if (was_freezing)
				atomic_dec(&system_freezing_cnt);
			freezer->state &= ~CGROUP_FROZEN;
			unfreeze_cgroup(freezer);
		}
384
	}
385
}
386

387 388 389 390 391
/**
 * freezer_change_state - change the freezing state of a cgroup_freezer
 * @freezer: freezer of interest
 * @freeze: whether to freeze or thaw
 *
392 393
 * Freeze or thaw @freezer according to @freeze.  The operations are
 * recursive - all descendants of @freezer will be affected.
394 395 396
 */
static void freezer_change_state(struct freezer *freezer, bool freeze)
{
397 398
	struct cgroup *pos;

399 400
	/* update @freezer */
	spin_lock_irq(&freezer->lock);
401
	freezer_apply_state(freezer, freeze, CGROUP_FREEZING_SELF);
402
	spin_unlock_irq(&freezer->lock);
403 404 405 406 407 408 409 410 411 412 413 414 415 416 417 418 419 420 421 422 423 424

	/*
	 * Update all its descendants in pre-order traversal.  Each
	 * descendant will try to inherit its parent's FREEZING state as
	 * CGROUP_FREEZING_PARENT.
	 */
	rcu_read_lock();
	cgroup_for_each_descendant_pre(pos, freezer->css.cgroup) {
		struct freezer *pos_f = cgroup_freezer(pos);
		struct freezer *parent = parent_freezer(pos_f);

		/*
		 * Our update to @parent->state is already visible which is
		 * all we need.  No need to lock @parent.  For more info on
		 * synchronization, see freezer_post_create().
		 */
		spin_lock_irq(&pos_f->lock);
		freezer_apply_state(pos_f, parent->state & CGROUP_FREEZING,
				    CGROUP_FREEZING_PARENT);
		spin_unlock_irq(&pos_f->lock);
	}
	rcu_read_unlock();
425 426
}

T
Tejun Heo 已提交
427
static int freezer_write(struct cgroup *cgroup, struct cftype *cft,
428 429
			 const char *buffer)
{
430
	bool freeze;
431

432
	if (strcmp(buffer, freezer_state_strs(0)) == 0)
433
		freeze = false;
434
	else if (strcmp(buffer, freezer_state_strs(CGROUP_FROZEN)) == 0)
435
		freeze = true;
436
	else
437
		return -EINVAL;
438

439
	freezer_change_state(cgroup_freezer(cgroup), freeze);
440
	return 0;
441 442
}

443 444 445 446 447 448 449 450 451 452 453 454 455 456
static u64 freezer_self_freezing_read(struct cgroup *cgroup, struct cftype *cft)
{
	struct freezer *freezer = cgroup_freezer(cgroup);

	return (bool)(freezer->state & CGROUP_FREEZING_SELF);
}

static u64 freezer_parent_freezing_read(struct cgroup *cgroup, struct cftype *cft)
{
	struct freezer *freezer = cgroup_freezer(cgroup);

	return (bool)(freezer->state & CGROUP_FREEZING_PARENT);
}

457 458 459
static struct cftype files[] = {
	{
		.name = "state",
460
		.flags = CFTYPE_NOT_ON_ROOT,
461 462 463
		.read_seq_string = freezer_read,
		.write_string = freezer_write,
	},
464 465 466 467 468 469 470 471 472 473
	{
		.name = "self_freezing",
		.flags = CFTYPE_NOT_ON_ROOT,
		.read_u64 = freezer_self_freezing_read,
	},
	{
		.name = "parent_freezing",
		.flags = CFTYPE_NOT_ON_ROOT,
		.read_u64 = freezer_parent_freezing_read,
	},
474
	{ }	/* terminate */
475 476 477 478
};

struct cgroup_subsys freezer_subsys = {
	.name		= "freezer",
479 480 481 482
	.css_alloc	= freezer_css_alloc,
	.css_online	= freezer_css_online,
	.css_offline	= freezer_css_offline,
	.css_free	= freezer_css_free,
483
	.subsys_id	= freezer_subsys_id,
484
	.attach		= freezer_attach,
485
	.fork		= freezer_fork,
486
	.base_cftypes	= files,
487
};