freezer.c 12.4 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16
/*
 * cgroup_freezer.c -  control group freezer subsystem
 *
 * Copyright IBM Corporation, 2007
 *
 * Author : Cedric Le Goater <clg@fr.ibm.com>
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms of version 2.1 of the GNU Lesser General Public License
 * as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it would be useful, but
 * WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
 */

17
#include <linux/export.h>
18
#include <linux/slab.h>
19 20 21 22 23
#include <linux/cgroup.h>
#include <linux/fs.h>
#include <linux/uaccess.h>
#include <linux/freezer.h>
#include <linux/seq_file.h>
24
#include <linux/mutex.h>
25

26 27 28 29 30 31 32
/*
 * A cgroup is freezing if any FREEZING flags are set.  FREEZING_SELF is
 * set if "FROZEN" is written to freezer.state cgroupfs file, and cleared
 * for "THAWED".  FREEZING_PARENT is set if the parent freezer is FREEZING
 * for whatever reason.  IOW, a cgroup has FREEZING_PARENT set if one of
 * its ancestors has FREEZING_SELF set.
 *
 * The flags are independent bits stored together in freezer->state.
 */
enum freezer_state_flags {
	CGROUP_FREEZER_ONLINE	= (1 << 0), /* freezer is fully online */
	CGROUP_FREEZING_SELF	= (1 << 1), /* this freezer is freezing */
	CGROUP_FREEZING_PARENT	= (1 << 2), /* the parent freezer is freezing */
	CGROUP_FROZEN		= (1 << 3), /* this and its descendants frozen */

	/* mask for all FREEZING flags */
	CGROUP_FREEZING		= CGROUP_FREEZING_SELF | CGROUP_FREEZING_PARENT,
};

struct freezer {
T
Tejun Heo 已提交
44
	struct cgroup_subsys_state	css;
45
	unsigned int			state;
46 47
};

48 49
/*
 * Serializes freezer state changes against each other and against task
 * migration (see freezer_attach()).
 */
static DEFINE_MUTEX(freezer_mutex);

50 51 52 53 54
/* Map @css back to the freezer embedding it; a NULL @css yields NULL. */
static inline struct freezer *css_freezer(struct cgroup_subsys_state *css)
{
	if (!css)
		return NULL;

	return container_of(css, struct freezer, css);
}

55 56
static inline struct freezer *task_freezer(struct task_struct *task)
{
57
	return css_freezer(task_css(task, freezer_cgrp_id));
58 59
}

60 61
static struct freezer *parent_freezer(struct freezer *freezer)
{
T
Tejun Heo 已提交
62
	return css_freezer(freezer->css.parent);
63 64
}

65
bool cgroup_freezing(struct task_struct *task)
66
{
67
	bool ret;
68

69
	rcu_read_lock();
70
	ret = task_freezer(task)->state & CGROUP_FREEZING;
71 72 73
	rcu_read_unlock();

	return ret;
74 75
}

76 77 78 79 80 81 82
/*
 * Translate a freezer state bitmask into the string shown in the "state"
 * file.  FROZEN takes precedence over FREEZING; a mask with neither set
 * is reported as "THAWED".
 */
static const char *freezer_state_strs(unsigned int state)
{
	if (state & CGROUP_FROZEN)
		return "FROZEN";
	if (state & CGROUP_FREEZING)
		return "FREEZING";
	return "THAWED";
}

85 86
static struct cgroup_subsys_state *
freezer_css_alloc(struct cgroup_subsys_state *parent_css)
87 88 89 90 91 92 93 94 95 96
{
	struct freezer *freezer;

	freezer = kzalloc(sizeof(struct freezer), GFP_KERNEL);
	if (!freezer)
		return ERR_PTR(-ENOMEM);

	return &freezer->css;
}

97
/**
98 99
 * freezer_css_online - commit creation of a freezer css
 * @css: css being created
100
 *
101
 * We're committing to creation of @css.  Mark it online and inherit
102 103
 * parent's freezing state while holding both parent's and our
 * freezer->lock.
104
 */
105
static int freezer_css_online(struct cgroup_subsys_state *css)
106
{
107
	struct freezer *freezer = css_freezer(css);
108 109
	struct freezer *parent = parent_freezer(freezer);

110
	mutex_lock(&freezer_mutex);
111

112
	freezer->state |= CGROUP_FREEZER_ONLINE;
113 114 115 116 117 118

	if (parent && (parent->state & CGROUP_FREEZING)) {
		freezer->state |= CGROUP_FREEZING_PARENT | CGROUP_FROZEN;
		atomic_inc(&system_freezing_cnt);
	}

119
	mutex_unlock(&freezer_mutex);
T
Tejun Heo 已提交
120
	return 0;
121 122 123
}

/**
124 125
 * freezer_css_offline - initiate destruction of a freezer css
 * @css: css being destroyed
126
 *
127 128
 * @css is going away.  Mark it dead and decrement system_freezing_count if
 * it was holding one.
129
 */
130
static void freezer_css_offline(struct cgroup_subsys_state *css)
131
{
132
	struct freezer *freezer = css_freezer(css);
133

134
	mutex_lock(&freezer_mutex);
135

136
	if (freezer->state & CGROUP_FREEZING)
137
		atomic_dec(&system_freezing_cnt);
138 139 140

	freezer->state = 0;

141
	mutex_unlock(&freezer_mutex);
142 143
}

144
/* Free the freezer that embeds @css. */
static void freezer_css_free(struct cgroup_subsys_state *css)
{
	kfree(css_freezer(css));
}

149
/*
150 151 152 153 154 155 156
 * Tasks can be migrated into a different freezer anytime regardless of its
 * current state.  freezer_attach() is responsible for making new tasks
 * conform to the current state.
 *
 * Freezer state changes and task migration are synchronized via
 * @freezer->lock.  freezer_attach() makes the new tasks conform to the
 * current state and all following state changes can see the new tasks.
157
 */
158
static void freezer_attach(struct cgroup_taskset *tset)
159
{
160
	struct task_struct *task;
161
	struct cgroup_subsys_state *new_css;
162

163
	mutex_lock(&freezer_mutex);
164

165
	/*
166
	 * Make the new tasks conform to the current state of @new_css.
167 168 169 170
	 * For simplicity, when migrating any task to a FROZEN cgroup, we
	 * revert it to FREEZING and let update_if_frozen() determine the
	 * correct state later.
	 *
171
	 * Tasks in @tset are on @new_css but may not conform to its
172 173
	 * current state before executing the following - !frozen tasks may
	 * be visible in a FROZEN cgroup and frozen tasks in a THAWED one.
174
	 */
175
	cgroup_taskset_for_each(task, new_css, tset) {
176 177
		struct freezer *freezer = css_freezer(new_css);

178
		if (!(freezer->state & CGROUP_FREEZING)) {
179 180 181
			__thaw_task(task);
		} else {
			freeze_task(task);
182 183 184 185 186
			/* clear FROZEN and propagate upwards */
			while (freezer && (freezer->state & CGROUP_FROZEN)) {
				freezer->state &= ~CGROUP_FROZEN;
				freezer = parent_freezer(freezer);
			}
187 188
		}
	}
189

190
	mutex_unlock(&freezer_mutex);
191 192
}

193 194 195 196 197 198 199 200 201 202
/**
 * freezer_fork - cgroup post fork callback
 * @task: a task which has just been forked
 *
 * @task has just been created and should conform to the current state of
 * the cgroup_freezer it belongs to.  This function may race against
 * freezer_attach().  Losing to freezer_attach() means that we don't have
 * to do anything as freezer_attach() will put @task into the appropriate
 * state.
 */
203
static void freezer_fork(struct task_struct *task)
204 205 206
{
	struct freezer *freezer;

207
	/*
208 209 210 211 212
	 * The root cgroup is non-freezable, so we can skip locking the
	 * freezer.  This is safe regardless of race with task migration.
	 * If we didn't race or won, skipping is obviously the right thing
	 * to do.  If we lost and root is the new cgroup, noop is still the
	 * right thing to do.
213
	 */
214 215
	if (task_css_is_root(task, freezer_cgrp_id))
		return;
216

217 218 219 220 221
	mutex_lock(&freezer_mutex);
	rcu_read_lock();

	freezer = task_freezer(task);
	if (freezer->state & CGROUP_FREEZING)
222
		freeze_task(task);
223

224
	rcu_read_unlock();
225
	mutex_unlock(&freezer_mutex);
226 227
}

228 229
/**
 * update_if_frozen - update whether a cgroup finished freezing
230
 * @css: css of interest
231 232 233 234 235 236 237 238
 *
 * Once FREEZING is initiated, transition to FROZEN is lazily updated by
 * calling this function.  If the current state is FREEZING but not FROZEN,
 * this function checks whether all tasks of this cgroup and the descendant
 * cgroups finished freezing and, if so, sets FROZEN.
 *
 * The caller is responsible for grabbing RCU read lock and calling
 * update_if_frozen() on all descendants prior to invoking this function.
239 240
 *
 * Task states and freezer state might disagree while tasks are being
241
 * migrated into or out of @css, so we can't verify task states against
242
 * @freezer state here.  See freezer_attach() for details.
243
 */
244
static void update_if_frozen(struct cgroup_subsys_state *css)
245
{
246
	struct freezer *freezer = css_freezer(css);
247
	struct cgroup_subsys_state *pos;
248
	struct css_task_iter it;
249
	struct task_struct *task;
250

251
	lockdep_assert_held(&freezer_mutex);
252

253 254
	if (!(freezer->state & CGROUP_FREEZING) ||
	    (freezer->state & CGROUP_FROZEN))
255
		return;
256 257

	/* are all (live) children frozen? */
258
	rcu_read_lock();
259 260
	css_for_each_child(pos, css) {
		struct freezer *child = css_freezer(pos);
261

262
		if ((child->state & CGROUP_FREEZER_ONLINE) &&
263 264
		    !(child->state & CGROUP_FROZEN)) {
			rcu_read_unlock();
265
			return;
266
		}
267
	}
268
	rcu_read_unlock();
269 270

	/* are all tasks frozen? */
271
	css_task_iter_start(css, &it);
272

273
	while ((task = css_task_iter_next(&it))) {
274 275 276 277 278 279 280
		if (freezing(task)) {
			/*
			 * freezer_should_skip() indicates that the task
			 * should be skipped when determining freezing
			 * completion.  Consider it frozen in addition to
			 * the usual frozen condition.
			 */
281
			if (!frozen(task) && !freezer_should_skip(task))
282
				goto out_iter_end;
283
		}
284 285
	}

286
	freezer->state |= CGROUP_FROZEN;
287
out_iter_end:
288
	css_task_iter_end(&it);
289 290
}

291
static int freezer_read(struct seq_file *m, void *v)
292
{
293
	struct cgroup_subsys_state *css = seq_css(m), *pos;
294

295
	mutex_lock(&freezer_mutex);
296
	rcu_read_lock();
297

298
	/* update states bottom-up */
299
	css_for_each_descendant_post(pos, css) {
300
		if (!css_tryget_online(pos))
301 302 303
			continue;
		rcu_read_unlock();

304
		update_if_frozen(pos);
305

306 307 308 309
		rcu_read_lock();
		css_put(pos);
	}

310
	rcu_read_unlock();
311
	mutex_unlock(&freezer_mutex);
312

313
	seq_puts(m, freezer_state_strs(css_freezer(css)->state));
314 315 316 317
	seq_putc(m, '\n');
	return 0;
}

T
Tejun Heo 已提交
318
static void freeze_cgroup(struct freezer *freezer)
319
{
320
	struct css_task_iter it;
321 322
	struct task_struct *task;

323 324
	css_task_iter_start(&freezer->css, &it);
	while ((task = css_task_iter_next(&it)))
325
		freeze_task(task);
326
	css_task_iter_end(&it);
327 328
}

T
Tejun Heo 已提交
329
static void unfreeze_cgroup(struct freezer *freezer)
330
{
331
	struct css_task_iter it;
332 333
	struct task_struct *task;

334 335
	css_task_iter_start(&freezer->css, &it);
	while ((task = css_task_iter_next(&it)))
336
		__thaw_task(task);
337
	css_task_iter_end(&it);
338 339
}

340 341 342 343
/**
 * freezer_apply_state - apply state change to a single cgroup_freezer
 * @freezer: freezer to apply state change to
 * @freeze: whether to freeze or unfreeze
344 345 346 347
 * @state: CGROUP_FREEZING_* flag to set or clear
 *
 * Set or clear @state on @cgroup according to @freeze, and perform
 * freezing or thawing as necessary.
348
 */
349 350
static void freezer_apply_state(struct freezer *freezer, bool freeze,
				unsigned int state)
351
{
352
	/* also synchronizes against task migration, see freezer_attach() */
353
	lockdep_assert_held(&freezer_mutex);
354

355 356 357
	if (!(freezer->state & CGROUP_FREEZER_ONLINE))
		return;

358
	if (freeze) {
359
		if (!(freezer->state & CGROUP_FREEZING))
360
			atomic_inc(&system_freezing_cnt);
361
		freezer->state |= state;
T
Tejun Heo 已提交
362
		freeze_cgroup(freezer);
363
	} else {
364 365 366 367 368 369 370 371 372 373
		bool was_freezing = freezer->state & CGROUP_FREEZING;

		freezer->state &= ~state;

		if (!(freezer->state & CGROUP_FREEZING)) {
			if (was_freezing)
				atomic_dec(&system_freezing_cnt);
			freezer->state &= ~CGROUP_FROZEN;
			unfreeze_cgroup(freezer);
		}
374
	}
375
}
376

377 378 379 380 381
/**
 * freezer_change_state - change the freezing state of a cgroup_freezer
 * @freezer: freezer of interest
 * @freeze: whether to freeze or thaw
 *
 * Freeze or thaw @freezer according to @freeze.  The operations are
 * recursive - all descendants of @freezer will be affected.
 */
static void freezer_change_state(struct freezer *freezer, bool freeze)
{
	struct cgroup_subsys_state *pos;

	/*
	 * Update all its descendants in pre-order traversal.  Each
	 * descendant will try to inherit its parent's FREEZING state as
	 * CGROUP_FREEZING_PARENT.
	 */
	mutex_lock(&freezer_mutex);
	rcu_read_lock();
	css_for_each_descendant_pre(pos, &freezer->css) {
		struct freezer *pos_f = css_freezer(pos);
		struct freezer *parent = parent_freezer(pos_f);

		/*
		 * Hold a reference on @pos while the RCU read lock is
		 * dropped around freezer_apply_state().
		 */
		if (!css_tryget_online(pos))
			continue;
		rcu_read_unlock();

		if (pos_f == freezer)
			freezer_apply_state(pos_f, freeze,
					    CGROUP_FREEZING_SELF);
		else
			freezer_apply_state(pos_f,
					    parent->state & CGROUP_FREEZING,
					    CGROUP_FREEZING_PARENT);

		rcu_read_lock();
		css_put(pos);
	}
	rcu_read_unlock();
	mutex_unlock(&freezer_mutex);
}

419 420
/*
 * Write handler for the "state" file.
 *
 * After stripping surrounding whitespace, @buf must be exactly "THAWED"
 * or "FROZEN"; anything else is rejected with -EINVAL.  On success the
 * freezer behind @of is thawed or frozen and @nbytes is returned.  @off
 * is not used.
 */
static ssize_t freezer_write(struct kernfs_open_file *of,
			     char *buf, size_t nbytes, loff_t off)
{
	bool freeze;

	buf = strstrip(buf);

	/* compare against the same strings freezer_read() reports */
	if (strcmp(buf, freezer_state_strs(0)) == 0)
		freeze = false;
	else if (strcmp(buf, freezer_state_strs(CGROUP_FROZEN)) == 0)
		freeze = true;
	else
		return -EINVAL;

	freezer_change_state(css_freezer(of_css(of)), freeze);
	return nbytes;
}

437 438
static u64 freezer_self_freezing_read(struct cgroup_subsys_state *css,
				      struct cftype *cft)
439
{
440
	struct freezer *freezer = css_freezer(css);
441 442 443 444

	return (bool)(freezer->state & CGROUP_FREEZING_SELF);
}

445 446
static u64 freezer_parent_freezing_read(struct cgroup_subsys_state *css,
					struct cftype *cft)
447
{
448
	struct freezer *freezer = css_freezer(css);
449 450 451 452

	return (bool)(freezer->state & CGROUP_FREEZING_PARENT);
}

453 454 455
static struct cftype files[] = {
	{
		.name = "state",
456
		.flags = CFTYPE_NOT_ON_ROOT,
457
		.seq_show = freezer_read,
458
		.write = freezer_write,
459
	},
460 461 462 463 464 465 466 467 468 469
	{
		.name = "self_freezing",
		.flags = CFTYPE_NOT_ON_ROOT,
		.read_u64 = freezer_self_freezing_read,
	},
	{
		.name = "parent_freezing",
		.flags = CFTYPE_NOT_ON_ROOT,
		.read_u64 = freezer_parent_freezing_read,
	},
470
	{ }	/* terminate */
471 472
};

473
struct cgroup_subsys freezer_cgrp_subsys = {
474 475 476 477
	.css_alloc	= freezer_css_alloc,
	.css_online	= freezer_css_online,
	.css_offline	= freezer_css_offline,
	.css_free	= freezer_css_free,
478
	.attach		= freezer_attach,
479
	.fork		= freezer_fork,
480
	.legacy_cftypes	= files,
481
};