cpuset: use css_task_iter_start/next/end() instead of css_scan_tasks()
[deliverable/linux.git] / kernel / cgroup_freezer.c
1 /*
2 * cgroup_freezer.c - control group freezer subsystem
3 *
4 * Copyright IBM Corporation, 2007
5 *
6 * Author : Cedric Le Goater <clg@fr.ibm.com>
7 *
8 * This program is free software; you can redistribute it and/or modify it
9 * under the terms of version 2.1 of the GNU Lesser General Public License
10 * as published by the Free Software Foundation.
11 *
12 * This program is distributed in the hope that it would be useful, but
13 * WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
15 */
16
17 #include <linux/export.h>
18 #include <linux/slab.h>
19 #include <linux/cgroup.h>
20 #include <linux/fs.h>
21 #include <linux/uaccess.h>
22 #include <linux/freezer.h>
23 #include <linux/seq_file.h>
24
/*
 * Bits stored in freezer->state.
 *
 * A cgroup counts as "freezing" whenever at least one FREEZING bit is set.
 * FREEZING_SELF is set when "FROZEN" is written to the freezer.state
 * cgroupfs file and cleared again for "THAWED".  FREEZING_PARENT is set
 * while the parent freezer is FREEZING for whatever reason; in other words
 * a cgroup carries FREEZING_PARENT when one of its ancestors has
 * FREEZING_SELF set.
 */
enum freezer_state_flags {
	CGROUP_FREEZER_ONLINE	= (1 << 0),	/* freezer is fully online */
	CGROUP_FREEZING_SELF	= (1 << 1),	/* this freezer is freezing */
	CGROUP_FREEZING_PARENT	= (1 << 2),	/* the parent freezer is freezing */
	CGROUP_FROZEN		= (1 << 3),	/* this and its descendants frozen */

	/* union of every FREEZING bit */
	CGROUP_FREEZING		= (CGROUP_FREEZING_SELF | CGROUP_FREEZING_PARENT),
};
41
42 struct freezer {
43 struct cgroup_subsys_state css;
44 unsigned int state;
45 spinlock_t lock;
46 };
47
48 static inline struct freezer *css_freezer(struct cgroup_subsys_state *css)
49 {
50 return css ? container_of(css, struct freezer, css) : NULL;
51 }
52
53 static inline struct freezer *task_freezer(struct task_struct *task)
54 {
55 return css_freezer(task_css(task, freezer_cgrp_id));
56 }
57
58 static struct freezer *parent_freezer(struct freezer *freezer)
59 {
60 return css_freezer(css_parent(&freezer->css));
61 }
62
63 bool cgroup_freezing(struct task_struct *task)
64 {
65 bool ret;
66
67 rcu_read_lock();
68 ret = task_freezer(task)->state & CGROUP_FREEZING;
69 rcu_read_unlock();
70
71 return ret;
72 }
73
74 /*
75 * cgroups_write_string() limits the size of freezer state strings to
76 * CGROUP_LOCAL_BUFFER_SIZE
77 */
78 static const char *freezer_state_strs(unsigned int state)
79 {
80 if (state & CGROUP_FROZEN)
81 return "FROZEN";
82 if (state & CGROUP_FREEZING)
83 return "FREEZING";
84 return "THAWED";
85 };
86
87 static struct cgroup_subsys_state *
88 freezer_css_alloc(struct cgroup_subsys_state *parent_css)
89 {
90 struct freezer *freezer;
91
92 freezer = kzalloc(sizeof(struct freezer), GFP_KERNEL);
93 if (!freezer)
94 return ERR_PTR(-ENOMEM);
95
96 spin_lock_init(&freezer->lock);
97 return &freezer->css;
98 }
99
100 /**
101 * freezer_css_online - commit creation of a freezer css
102 * @css: css being created
103 *
104 * We're committing to creation of @css. Mark it online and inherit
105 * parent's freezing state while holding both parent's and our
106 * freezer->lock.
107 */
108 static int freezer_css_online(struct cgroup_subsys_state *css)
109 {
110 struct freezer *freezer = css_freezer(css);
111 struct freezer *parent = parent_freezer(freezer);
112
113 /*
114 * The following double locking and freezing state inheritance
115 * guarantee that @cgroup can never escape ancestors' freezing
116 * states. See css_for_each_descendant_pre() for details.
117 */
118 if (parent)
119 spin_lock_irq(&parent->lock);
120 spin_lock_nested(&freezer->lock, SINGLE_DEPTH_NESTING);
121
122 freezer->state |= CGROUP_FREEZER_ONLINE;
123
124 if (parent && (parent->state & CGROUP_FREEZING)) {
125 freezer->state |= CGROUP_FREEZING_PARENT | CGROUP_FROZEN;
126 atomic_inc(&system_freezing_cnt);
127 }
128
129 spin_unlock(&freezer->lock);
130 if (parent)
131 spin_unlock_irq(&parent->lock);
132
133 return 0;
134 }
135
136 /**
137 * freezer_css_offline - initiate destruction of a freezer css
138 * @css: css being destroyed
139 *
140 * @css is going away. Mark it dead and decrement system_freezing_count if
141 * it was holding one.
142 */
143 static void freezer_css_offline(struct cgroup_subsys_state *css)
144 {
145 struct freezer *freezer = css_freezer(css);
146
147 spin_lock_irq(&freezer->lock);
148
149 if (freezer->state & CGROUP_FREEZING)
150 atomic_dec(&system_freezing_cnt);
151
152 freezer->state = 0;
153
154 spin_unlock_irq(&freezer->lock);
155 }
156
/* Release the memory of the freezer that embeds @css. */
static void freezer_css_free(struct cgroup_subsys_state *css)
{
	struct freezer *freezer = css_freezer(css);

	kfree(freezer);
}
161
162 /*
163 * Tasks can be migrated into a different freezer anytime regardless of its
164 * current state. freezer_attach() is responsible for making new tasks
165 * conform to the current state.
166 *
167 * Freezer state changes and task migration are synchronized via
168 * @freezer->lock. freezer_attach() makes the new tasks conform to the
169 * current state and all following state changes can see the new tasks.
170 */
171 static void freezer_attach(struct cgroup_subsys_state *new_css,
172 struct cgroup_taskset *tset)
173 {
174 struct freezer *freezer = css_freezer(new_css);
175 struct task_struct *task;
176 bool clear_frozen = false;
177
178 spin_lock_irq(&freezer->lock);
179
180 /*
181 * Make the new tasks conform to the current state of @new_css.
182 * For simplicity, when migrating any task to a FROZEN cgroup, we
183 * revert it to FREEZING and let update_if_frozen() determine the
184 * correct state later.
185 *
186 * Tasks in @tset are on @new_css but may not conform to its
187 * current state before executing the following - !frozen tasks may
188 * be visible in a FROZEN cgroup and frozen tasks in a THAWED one.
189 */
190 cgroup_taskset_for_each(task, new_css, tset) {
191 if (!(freezer->state & CGROUP_FREEZING)) {
192 __thaw_task(task);
193 } else {
194 freeze_task(task);
195 freezer->state &= ~CGROUP_FROZEN;
196 clear_frozen = true;
197 }
198 }
199
200 spin_unlock_irq(&freezer->lock);
201
202 /*
203 * Propagate FROZEN clearing upwards. We may race with
204 * update_if_frozen(), but as long as both work bottom-up, either
205 * update_if_frozen() sees child's FROZEN cleared or we clear the
206 * parent's FROZEN later. No parent w/ !FROZEN children can be
207 * left FROZEN.
208 */
209 while (clear_frozen && (freezer = parent_freezer(freezer))) {
210 spin_lock_irq(&freezer->lock);
211 freezer->state &= ~CGROUP_FROZEN;
212 clear_frozen = freezer->state & CGROUP_FREEZING;
213 spin_unlock_irq(&freezer->lock);
214 }
215 }
216
217 static void freezer_fork(struct task_struct *task)
218 {
219 struct freezer *freezer;
220
221 rcu_read_lock();
222 freezer = task_freezer(task);
223
224 /*
225 * The root cgroup is non-freezable, so we can skip the
226 * following check.
227 */
228 if (!parent_freezer(freezer))
229 goto out;
230
231 spin_lock_irq(&freezer->lock);
232 if (freezer->state & CGROUP_FREEZING)
233 freeze_task(task);
234 spin_unlock_irq(&freezer->lock);
235 out:
236 rcu_read_unlock();
237 }
238
239 /**
240 * update_if_frozen - update whether a cgroup finished freezing
241 * @css: css of interest
242 *
243 * Once FREEZING is initiated, transition to FROZEN is lazily updated by
244 * calling this function. If the current state is FREEZING but not FROZEN,
245 * this function checks whether all tasks of this cgroup and the descendant
246 * cgroups finished freezing and, if so, sets FROZEN.
247 *
248 * The caller is responsible for grabbing RCU read lock and calling
249 * update_if_frozen() on all descendants prior to invoking this function.
250 *
251 * Task states and freezer state might disagree while tasks are being
252 * migrated into or out of @css, so we can't verify task states against
253 * @freezer state here. See freezer_attach() for details.
254 */
255 static void update_if_frozen(struct cgroup_subsys_state *css)
256 {
257 struct freezer *freezer = css_freezer(css);
258 struct cgroup_subsys_state *pos;
259 struct css_task_iter it;
260 struct task_struct *task;
261
262 WARN_ON_ONCE(!rcu_read_lock_held());
263
264 spin_lock_irq(&freezer->lock);
265
266 if (!(freezer->state & CGROUP_FREEZING) ||
267 (freezer->state & CGROUP_FROZEN))
268 goto out_unlock;
269
270 /* are all (live) children frozen? */
271 css_for_each_child(pos, css) {
272 struct freezer *child = css_freezer(pos);
273
274 if ((child->state & CGROUP_FREEZER_ONLINE) &&
275 !(child->state & CGROUP_FROZEN))
276 goto out_unlock;
277 }
278
279 /* are all tasks frozen? */
280 css_task_iter_start(css, &it);
281
282 while ((task = css_task_iter_next(&it))) {
283 if (freezing(task)) {
284 /*
285 * freezer_should_skip() indicates that the task
286 * should be skipped when determining freezing
287 * completion. Consider it frozen in addition to
288 * the usual frozen condition.
289 */
290 if (!frozen(task) && !freezer_should_skip(task))
291 goto out_iter_end;
292 }
293 }
294
295 freezer->state |= CGROUP_FROZEN;
296 out_iter_end:
297 css_task_iter_end(&it);
298 out_unlock:
299 spin_unlock_irq(&freezer->lock);
300 }
301
302 static int freezer_read(struct seq_file *m, void *v)
303 {
304 struct cgroup_subsys_state *css = seq_css(m), *pos;
305
306 rcu_read_lock();
307
308 /* update states bottom-up */
309 css_for_each_descendant_post(pos, css)
310 update_if_frozen(pos);
311
312 rcu_read_unlock();
313
314 seq_puts(m, freezer_state_strs(css_freezer(css)->state));
315 seq_putc(m, '\n');
316 return 0;
317 }
318
319 static void freeze_cgroup(struct freezer *freezer)
320 {
321 struct css_task_iter it;
322 struct task_struct *task;
323
324 css_task_iter_start(&freezer->css, &it);
325 while ((task = css_task_iter_next(&it)))
326 freeze_task(task);
327 css_task_iter_end(&it);
328 }
329
330 static void unfreeze_cgroup(struct freezer *freezer)
331 {
332 struct css_task_iter it;
333 struct task_struct *task;
334
335 css_task_iter_start(&freezer->css, &it);
336 while ((task = css_task_iter_next(&it)))
337 __thaw_task(task);
338 css_task_iter_end(&it);
339 }
340
341 /**
342 * freezer_apply_state - apply state change to a single cgroup_freezer
343 * @freezer: freezer to apply state change to
344 * @freeze: whether to freeze or unfreeze
345 * @state: CGROUP_FREEZING_* flag to set or clear
346 *
347 * Set or clear @state on @cgroup according to @freeze, and perform
348 * freezing or thawing as necessary.
349 */
350 static void freezer_apply_state(struct freezer *freezer, bool freeze,
351 unsigned int state)
352 {
353 /* also synchronizes against task migration, see freezer_attach() */
354 lockdep_assert_held(&freezer->lock);
355
356 if (!(freezer->state & CGROUP_FREEZER_ONLINE))
357 return;
358
359 if (freeze) {
360 if (!(freezer->state & CGROUP_FREEZING))
361 atomic_inc(&system_freezing_cnt);
362 freezer->state |= state;
363 freeze_cgroup(freezer);
364 } else {
365 bool was_freezing = freezer->state & CGROUP_FREEZING;
366
367 freezer->state &= ~state;
368
369 if (!(freezer->state & CGROUP_FREEZING)) {
370 if (was_freezing)
371 atomic_dec(&system_freezing_cnt);
372 freezer->state &= ~CGROUP_FROZEN;
373 unfreeze_cgroup(freezer);
374 }
375 }
376 }
377
378 /**
379 * freezer_change_state - change the freezing state of a cgroup_freezer
380 * @freezer: freezer of interest
381 * @freeze: whether to freeze or thaw
382 *
383 * Freeze or thaw @freezer according to @freeze. The operations are
384 * recursive - all descendants of @freezer will be affected.
385 */
386 static void freezer_change_state(struct freezer *freezer, bool freeze)
387 {
388 struct cgroup_subsys_state *pos;
389
390 /*
391 * Update all its descendants in pre-order traversal. Each
392 * descendant will try to inherit its parent's FREEZING state as
393 * CGROUP_FREEZING_PARENT.
394 */
395 rcu_read_lock();
396 css_for_each_descendant_pre(pos, &freezer->css) {
397 struct freezer *pos_f = css_freezer(pos);
398 struct freezer *parent = parent_freezer(pos_f);
399
400 spin_lock_irq(&pos_f->lock);
401
402 if (pos_f == freezer) {
403 freezer_apply_state(pos_f, freeze,
404 CGROUP_FREEZING_SELF);
405 } else {
406 /*
407 * Our update to @parent->state is already visible
408 * which is all we need. No need to lock @parent.
409 * For more info on synchronization, see
410 * freezer_post_create().
411 */
412 freezer_apply_state(pos_f,
413 parent->state & CGROUP_FREEZING,
414 CGROUP_FREEZING_PARENT);
415 }
416
417 spin_unlock_irq(&pos_f->lock);
418 }
419 rcu_read_unlock();
420 }
421
422 static int freezer_write(struct cgroup_subsys_state *css, struct cftype *cft,
423 const char *buffer)
424 {
425 bool freeze;
426
427 if (strcmp(buffer, freezer_state_strs(0)) == 0)
428 freeze = false;
429 else if (strcmp(buffer, freezer_state_strs(CGROUP_FROZEN)) == 0)
430 freeze = true;
431 else
432 return -EINVAL;
433
434 freezer_change_state(css_freezer(css), freeze);
435 return 0;
436 }
437
438 static u64 freezer_self_freezing_read(struct cgroup_subsys_state *css,
439 struct cftype *cft)
440 {
441 struct freezer *freezer = css_freezer(css);
442
443 return (bool)(freezer->state & CGROUP_FREEZING_SELF);
444 }
445
446 static u64 freezer_parent_freezing_read(struct cgroup_subsys_state *css,
447 struct cftype *cft)
448 {
449 struct freezer *freezer = css_freezer(css);
450
451 return (bool)(freezer->state & CGROUP_FREEZING_PARENT);
452 }
453
454 static struct cftype files[] = {
455 {
456 .name = "state",
457 .flags = CFTYPE_NOT_ON_ROOT,
458 .seq_show = freezer_read,
459 .write_string = freezer_write,
460 },
461 {
462 .name = "self_freezing",
463 .flags = CFTYPE_NOT_ON_ROOT,
464 .read_u64 = freezer_self_freezing_read,
465 },
466 {
467 .name = "parent_freezing",
468 .flags = CFTYPE_NOT_ON_ROOT,
469 .read_u64 = freezer_parent_freezing_read,
470 },
471 { } /* terminate */
472 };
473
474 struct cgroup_subsys freezer_cgrp_subsys = {
475 .css_alloc = freezer_css_alloc,
476 .css_online = freezer_css_online,
477 .css_offline = freezer_css_offline,
478 .css_free = freezer_css_free,
479 .attach = freezer_attach,
480 .fork = freezer_fork,
481 .base_cftypes = files,
482 };
This page took 0.058085 seconds and 5 git commands to generate.