cgroup_freezer.c 13 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488
  1. /*
  2. * cgroup_freezer.c - control group freezer subsystem
  3. *
  4. * Copyright IBM Corporation, 2007
  5. *
  6. * Author : Cedric Le Goater <clg@fr.ibm.com>
  7. *
  8. * This program is free software; you can redistribute it and/or modify it
  9. * under the terms of version 2.1 of the GNU Lesser General Public License
  10. * as published by the Free Software Foundation.
  11. *
  12. * This program is distributed in the hope that it would be useful, but
  13. * WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
  15. */
  16. #include <linux/export.h>
  17. #include <linux/slab.h>
  18. #include <linux/cgroup.h>
  19. #include <linux/fs.h>
  20. #include <linux/uaccess.h>
  21. #include <linux/freezer.h>
  22. #include <linux/seq_file.h>
  /*
   * Per-freezer state bits.
   *
   * A cgroup is freezing if any FREEZING flag is set.  FREEZING_SELF is set
   * when "FROZEN" is written to the freezer.state cgroupfs file and cleared
   * for "THAWED".  FREEZING_PARENT is set if the parent freezer is FREEZING
   * for whatever reason; IOW, a cgroup has FREEZING_PARENT set if one of its
   * ancestors has FREEZING_SELF set.
   */
  enum freezer_state_flags {
  	/* freezer is fully online */
  	CGROUP_FREEZER_ONLINE	= (1 << 0),
  	/* this freezer is freezing */
  	CGROUP_FREEZING_SELF	= (1 << 1),
  	/* the parent freezer is freezing */
  	CGROUP_FREEZING_PARENT	= (1 << 2),
  	/* this and its descendants frozen */
  	CGROUP_FROZEN		= (1 << 3),

  	/* mask for all FREEZING flags */
  	CGROUP_FREEZING		= CGROUP_FREEZING_SELF | CGROUP_FREEZING_PARENT,
  };
  38. struct freezer {
  39. struct cgroup_subsys_state css;
  40. unsigned int state;
  41. spinlock_t lock;
  42. };
  43. static inline struct freezer *cgroup_freezer(struct cgroup *cgroup)
  44. {
  45. return container_of(cgroup_subsys_state(cgroup, freezer_subsys_id),
  46. struct freezer, css);
  47. }
  48. static inline struct freezer *task_freezer(struct task_struct *task)
  49. {
  50. return container_of(task_subsys_state(task, freezer_subsys_id),
  51. struct freezer, css);
  52. }
  53. static struct freezer *parent_freezer(struct freezer *freezer)
  54. {
  55. struct cgroup *pcg = freezer->css.cgroup->parent;
  56. if (pcg)
  57. return cgroup_freezer(pcg);
  58. return NULL;
  59. }
  60. bool cgroup_freezing(struct task_struct *task)
  61. {
  62. bool ret;
  63. rcu_read_lock();
  64. ret = task_freezer(task)->state & CGROUP_FREEZING;
  65. rcu_read_unlock();
  66. return ret;
  67. }
  68. /*
  69. * cgroups_write_string() limits the size of freezer state strings to
  70. * CGROUP_LOCAL_BUFFER_SIZE
  71. */
  72. static const char *freezer_state_strs(unsigned int state)
  73. {
  74. if (state & CGROUP_FROZEN)
  75. return "FROZEN";
  76. if (state & CGROUP_FREEZING)
  77. return "FREEZING";
  78. return "THAWED";
  79. };
  80. struct cgroup_subsys freezer_subsys;
  81. static struct cgroup_subsys_state *freezer_css_alloc(struct cgroup *cgroup)
  82. {
  83. struct freezer *freezer;
  84. freezer = kzalloc(sizeof(struct freezer), GFP_KERNEL);
  85. if (!freezer)
  86. return ERR_PTR(-ENOMEM);
  87. spin_lock_init(&freezer->lock);
  88. return &freezer->css;
  89. }
  90. /**
  91. * freezer_css_online - commit creation of a freezer cgroup
  92. * @cgroup: cgroup being created
  93. *
  94. * We're committing to creation of @cgroup. Mark it online and inherit
  95. * parent's freezing state while holding both parent's and our
  96. * freezer->lock.
  97. */
  98. static int freezer_css_online(struct cgroup *cgroup)
  99. {
  100. struct freezer *freezer = cgroup_freezer(cgroup);
  101. struct freezer *parent = parent_freezer(freezer);
  102. /*
  103. * The following double locking and freezing state inheritance
  104. * guarantee that @cgroup can never escape ancestors' freezing
  105. * states. See cgroup_for_each_descendant_pre() for details.
  106. */
  107. if (parent)
  108. spin_lock_irq(&parent->lock);
  109. spin_lock_nested(&freezer->lock, SINGLE_DEPTH_NESTING);
  110. freezer->state |= CGROUP_FREEZER_ONLINE;
  111. if (parent && (parent->state & CGROUP_FREEZING)) {
  112. freezer->state |= CGROUP_FREEZING_PARENT | CGROUP_FROZEN;
  113. atomic_inc(&system_freezing_cnt);
  114. }
  115. spin_unlock(&freezer->lock);
  116. if (parent)
  117. spin_unlock_irq(&parent->lock);
  118. return 0;
  119. }
  120. /**
  121. * freezer_css_offline - initiate destruction of @cgroup
  122. * @cgroup: cgroup being destroyed
  123. *
  124. * @cgroup is going away. Mark it dead and decrement system_freezing_count
  125. * if it was holding one.
  126. */
  127. static void freezer_css_offline(struct cgroup *cgroup)
  128. {
  129. struct freezer *freezer = cgroup_freezer(cgroup);
  130. spin_lock_irq(&freezer->lock);
  131. if (freezer->state & CGROUP_FREEZING)
  132. atomic_dec(&system_freezing_cnt);
  133. freezer->state = 0;
  134. spin_unlock_irq(&freezer->lock);
  135. }
  /*
   * Release the freezer that freezer_css_alloc() allocated for @cgroup.
   */
  static void freezer_css_free(struct cgroup *cgroup)
  {
  	struct freezer *freezer = cgroup_freezer(cgroup);

  	kfree(freezer);
  }
  140. /*
  141. * Tasks can be migrated into a different freezer anytime regardless of its
  142. * current state. freezer_attach() is responsible for making new tasks
  143. * conform to the current state.
  144. *
  145. * Freezer state changes and task migration are synchronized via
  146. * @freezer->lock. freezer_attach() makes the new tasks conform to the
  147. * current state and all following state changes can see the new tasks.
  148. */
  149. static void freezer_attach(struct cgroup *new_cgrp, struct cgroup_taskset *tset)
  150. {
  151. struct freezer *freezer = cgroup_freezer(new_cgrp);
  152. struct task_struct *task;
  153. bool clear_frozen = false;
  154. spin_lock_irq(&freezer->lock);
  155. /*
  156. * Make the new tasks conform to the current state of @new_cgrp.
  157. * For simplicity, when migrating any task to a FROZEN cgroup, we
  158. * revert it to FREEZING and let update_if_frozen() determine the
  159. * correct state later.
  160. *
  161. * Tasks in @tset are on @new_cgrp but may not conform to its
  162. * current state before executing the following - !frozen tasks may
  163. * be visible in a FROZEN cgroup and frozen tasks in a THAWED one.
  164. */
  165. cgroup_taskset_for_each(task, new_cgrp, tset) {
  166. if (!(freezer->state & CGROUP_FREEZING)) {
  167. __thaw_task(task);
  168. } else {
  169. freeze_task(task);
  170. freezer->state &= ~CGROUP_FROZEN;
  171. clear_frozen = true;
  172. }
  173. }
  174. spin_unlock_irq(&freezer->lock);
  175. /*
  176. * Propagate FROZEN clearing upwards. We may race with
  177. * update_if_frozen(), but as long as both work bottom-up, either
  178. * update_if_frozen() sees child's FROZEN cleared or we clear the
  179. * parent's FROZEN later. No parent w/ !FROZEN children can be
  180. * left FROZEN.
  181. */
  182. while (clear_frozen && (freezer = parent_freezer(freezer))) {
  183. spin_lock_irq(&freezer->lock);
  184. freezer->state &= ~CGROUP_FROZEN;
  185. clear_frozen = freezer->state & CGROUP_FREEZING;
  186. spin_unlock_irq(&freezer->lock);
  187. }
  188. }
  189. static void freezer_fork(struct task_struct *task)
  190. {
  191. struct freezer *freezer;
  192. rcu_read_lock();
  193. freezer = task_freezer(task);
  194. /*
  195. * The root cgroup is non-freezable, so we can skip the
  196. * following check.
  197. */
  198. if (!freezer->css.cgroup->parent)
  199. goto out;
  200. spin_lock_irq(&freezer->lock);
  201. if (freezer->state & CGROUP_FREEZING)
  202. freeze_task(task);
  203. spin_unlock_irq(&freezer->lock);
  204. out:
  205. rcu_read_unlock();
  206. }
  207. /**
  208. * update_if_frozen - update whether a cgroup finished freezing
  209. * @cgroup: cgroup of interest
  210. *
  211. * Once FREEZING is initiated, transition to FROZEN is lazily updated by
  212. * calling this function. If the current state is FREEZING but not FROZEN,
  213. * this function checks whether all tasks of this cgroup and the descendant
  214. * cgroups finished freezing and, if so, sets FROZEN.
  215. *
  216. * The caller is responsible for grabbing RCU read lock and calling
  217. * update_if_frozen() on all descendants prior to invoking this function.
  218. *
  219. * Task states and freezer state might disagree while tasks are being
  220. * migrated into or out of @cgroup, so we can't verify task states against
  221. * @freezer state here. See freezer_attach() for details.
  222. */
  223. static void update_if_frozen(struct cgroup *cgroup)
  224. {
  225. struct freezer *freezer = cgroup_freezer(cgroup);
  226. struct cgroup *pos;
  227. struct cgroup_iter it;
  228. struct task_struct *task;
  229. WARN_ON_ONCE(!rcu_read_lock_held());
  230. spin_lock_irq(&freezer->lock);
  231. if (!(freezer->state & CGROUP_FREEZING) ||
  232. (freezer->state & CGROUP_FROZEN))
  233. goto out_unlock;
  234. /* are all (live) children frozen? */
  235. cgroup_for_each_child(pos, cgroup) {
  236. struct freezer *child = cgroup_freezer(pos);
  237. if ((child->state & CGROUP_FREEZER_ONLINE) &&
  238. !(child->state & CGROUP_FROZEN))
  239. goto out_unlock;
  240. }
  241. /* are all tasks frozen? */
  242. cgroup_iter_start(cgroup, &it);
  243. while ((task = cgroup_iter_next(cgroup, &it))) {
  244. if (freezing(task)) {
  245. /*
  246. * freezer_should_skip() indicates that the task
  247. * should be skipped when determining freezing
  248. * completion. Consider it frozen in addition to
  249. * the usual frozen condition.
  250. */
  251. if (!frozen(task) && !freezer_should_skip(task))
  252. goto out_iter_end;
  253. }
  254. }
  255. freezer->state |= CGROUP_FROZEN;
  256. out_iter_end:
  257. cgroup_iter_end(cgroup, &it);
  258. out_unlock:
  259. spin_unlock_irq(&freezer->lock);
  260. }
  261. static int freezer_read(struct cgroup *cgroup, struct cftype *cft,
  262. struct seq_file *m)
  263. {
  264. struct cgroup *pos;
  265. rcu_read_lock();
  266. /* update states bottom-up */
  267. cgroup_for_each_descendant_post(pos, cgroup)
  268. update_if_frozen(pos);
  269. update_if_frozen(cgroup);
  270. rcu_read_unlock();
  271. seq_puts(m, freezer_state_strs(cgroup_freezer(cgroup)->state));
  272. seq_putc(m, '\n');
  273. return 0;
  274. }
  275. static void freeze_cgroup(struct freezer *freezer)
  276. {
  277. struct cgroup *cgroup = freezer->css.cgroup;
  278. struct cgroup_iter it;
  279. struct task_struct *task;
  280. cgroup_iter_start(cgroup, &it);
  281. while ((task = cgroup_iter_next(cgroup, &it)))
  282. freeze_task(task);
  283. cgroup_iter_end(cgroup, &it);
  284. }
  285. static void unfreeze_cgroup(struct freezer *freezer)
  286. {
  287. struct cgroup *cgroup = freezer->css.cgroup;
  288. struct cgroup_iter it;
  289. struct task_struct *task;
  290. cgroup_iter_start(cgroup, &it);
  291. while ((task = cgroup_iter_next(cgroup, &it)))
  292. __thaw_task(task);
  293. cgroup_iter_end(cgroup, &it);
  294. }
  295. /**
  296. * freezer_apply_state - apply state change to a single cgroup_freezer
  297. * @freezer: freezer to apply state change to
  298. * @freeze: whether to freeze or unfreeze
  299. * @state: CGROUP_FREEZING_* flag to set or clear
  300. *
  301. * Set or clear @state on @cgroup according to @freeze, and perform
  302. * freezing or thawing as necessary.
  303. */
  304. static void freezer_apply_state(struct freezer *freezer, bool freeze,
  305. unsigned int state)
  306. {
  307. /* also synchronizes against task migration, see freezer_attach() */
  308. lockdep_assert_held(&freezer->lock);
  309. if (!(freezer->state & CGROUP_FREEZER_ONLINE))
  310. return;
  311. if (freeze) {
  312. if (!(freezer->state & CGROUP_FREEZING))
  313. atomic_inc(&system_freezing_cnt);
  314. freezer->state |= state;
  315. freeze_cgroup(freezer);
  316. } else {
  317. bool was_freezing = freezer->state & CGROUP_FREEZING;
  318. freezer->state &= ~state;
  319. if (!(freezer->state & CGROUP_FREEZING)) {
  320. if (was_freezing)
  321. atomic_dec(&system_freezing_cnt);
  322. freezer->state &= ~CGROUP_FROZEN;
  323. unfreeze_cgroup(freezer);
  324. }
  325. }
  326. }
  327. /**
  328. * freezer_change_state - change the freezing state of a cgroup_freezer
  329. * @freezer: freezer of interest
  330. * @freeze: whether to freeze or thaw
  331. *
  332. * Freeze or thaw @freezer according to @freeze. The operations are
  333. * recursive - all descendants of @freezer will be affected.
  334. */
  335. static void freezer_change_state(struct freezer *freezer, bool freeze)
  336. {
  337. struct cgroup *pos;
  338. /* update @freezer */
  339. spin_lock_irq(&freezer->lock);
  340. freezer_apply_state(freezer, freeze, CGROUP_FREEZING_SELF);
  341. spin_unlock_irq(&freezer->lock);
  342. /*
  343. * Update all its descendants in pre-order traversal. Each
  344. * descendant will try to inherit its parent's FREEZING state as
  345. * CGROUP_FREEZING_PARENT.
  346. */
  347. rcu_read_lock();
  348. cgroup_for_each_descendant_pre(pos, freezer->css.cgroup) {
  349. struct freezer *pos_f = cgroup_freezer(pos);
  350. struct freezer *parent = parent_freezer(pos_f);
  351. /*
  352. * Our update to @parent->state is already visible which is
  353. * all we need. No need to lock @parent. For more info on
  354. * synchronization, see freezer_post_create().
  355. */
  356. spin_lock_irq(&pos_f->lock);
  357. freezer_apply_state(pos_f, parent->state & CGROUP_FREEZING,
  358. CGROUP_FREEZING_PARENT);
  359. spin_unlock_irq(&pos_f->lock);
  360. }
  361. rcu_read_unlock();
  362. }
  363. static int freezer_write(struct cgroup *cgroup, struct cftype *cft,
  364. const char *buffer)
  365. {
  366. bool freeze;
  367. if (strcmp(buffer, freezer_state_strs(0)) == 0)
  368. freeze = false;
  369. else if (strcmp(buffer, freezer_state_strs(CGROUP_FROZEN)) == 0)
  370. freeze = true;
  371. else
  372. return -EINVAL;
  373. freezer_change_state(cgroup_freezer(cgroup), freeze);
  374. return 0;
  375. }
  376. static u64 freezer_self_freezing_read(struct cgroup *cgroup, struct cftype *cft)
  377. {
  378. struct freezer *freezer = cgroup_freezer(cgroup);
  379. return (bool)(freezer->state & CGROUP_FREEZING_SELF);
  380. }
  381. static u64 freezer_parent_freezing_read(struct cgroup *cgroup, struct cftype *cft)
  382. {
  383. struct freezer *freezer = cgroup_freezer(cgroup);
  384. return (bool)(freezer->state & CGROUP_FREEZING_PARENT);
  385. }
  386. static struct cftype files[] = {
  387. {
  388. .name = "state",
  389. .flags = CFTYPE_NOT_ON_ROOT,
  390. .read_seq_string = freezer_read,
  391. .write_string = freezer_write,
  392. },
  393. {
  394. .name = "self_freezing",
  395. .flags = CFTYPE_NOT_ON_ROOT,
  396. .read_u64 = freezer_self_freezing_read,
  397. },
  398. {
  399. .name = "parent_freezing",
  400. .flags = CFTYPE_NOT_ON_ROOT,
  401. .read_u64 = freezer_parent_freezing_read,
  402. },
  403. { } /* terminate */
  404. };
  405. struct cgroup_subsys freezer_subsys = {
  406. .name = "freezer",
  407. .css_alloc = freezer_css_alloc,
  408. .css_online = freezer_css_online,
  409. .css_offline = freezer_css_offline,
  410. .css_free = freezer_css_free,
  411. .subsys_id = freezer_subsys_id,
  412. .attach = freezer_attach,
  413. .fork = freezer_fork,
  414. .base_cftypes = files,
  415. };