auto_group.c 6.5 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272
  #include "sched.h"
  #include <linux/proc_fs.h>
  #include <linux/seq_file.h>
  #include <linux/kallsyms.h>
  #include <linux/utsname.h>
  #include <linux/security.h>
  #include <linux/export.h>
  #include <linux/nospec.h>
  8. unsigned int __read_mostly sysctl_sched_autogroup_enabled = 1;
  9. static struct autogroup autogroup_default;
  10. static atomic_t autogroup_seq_nr;
  11. void __init autogroup_init(struct task_struct *init_task)
  12. {
  13. autogroup_default.tg = &root_task_group;
  14. kref_init(&autogroup_default.kref);
  15. init_rwsem(&autogroup_default.lock);
  16. init_task->signal->autogroup = &autogroup_default;
  17. }
  18. void autogroup_free(struct task_group *tg)
  19. {
  20. kfree(tg->autogroup);
  21. }
  22. static inline void autogroup_destroy(struct kref *kref)
  23. {
  24. struct autogroup *ag = container_of(kref, struct autogroup, kref);
  25. #ifdef CONFIG_RT_GROUP_SCHED
  26. /* We've redirected RT tasks to the root task group... */
  27. ag->tg->rt_se = NULL;
  28. ag->tg->rt_rq = NULL;
  29. #endif
  30. sched_offline_group(ag->tg);
  31. sched_destroy_group(ag->tg);
  32. }
  33. static inline void autogroup_kref_put(struct autogroup *ag)
  34. {
  35. kref_put(&ag->kref, autogroup_destroy);
  36. }
  37. static inline struct autogroup *autogroup_kref_get(struct autogroup *ag)
  38. {
  39. kref_get(&ag->kref);
  40. return ag;
  41. }
  42. static inline struct autogroup *autogroup_task_get(struct task_struct *p)
  43. {
  44. struct autogroup *ag;
  45. unsigned long flags;
  46. if (!lock_task_sighand(p, &flags))
  47. return autogroup_kref_get(&autogroup_default);
  48. ag = autogroup_kref_get(p->signal->autogroup);
  49. unlock_task_sighand(p, &flags);
  50. return ag;
  51. }
  52. static inline struct autogroup *autogroup_create(void)
  53. {
  54. struct autogroup *ag = kzalloc(sizeof(*ag), GFP_KERNEL);
  55. struct task_group *tg;
  56. if (!ag)
  57. goto out_fail;
  58. tg = sched_create_group(&root_task_group);
  59. if (IS_ERR(tg))
  60. goto out_free;
  61. kref_init(&ag->kref);
  62. init_rwsem(&ag->lock);
  63. ag->id = atomic_inc_return(&autogroup_seq_nr);
  64. ag->tg = tg;
  65. #ifdef CONFIG_RT_GROUP_SCHED
  66. /*
  67. * Autogroup RT tasks are redirected to the root task group
  68. * so we don't have to move tasks around upon policy change,
  69. * or flail around trying to allocate bandwidth on the fly.
  70. * A bandwidth exception in __sched_setscheduler() allows
  71. * the policy change to proceed.
  72. */
  73. free_rt_sched_group(tg);
  74. tg->rt_se = root_task_group.rt_se;
  75. tg->rt_rq = root_task_group.rt_rq;
  76. #endif
  77. tg->autogroup = ag;
  78. sched_online_group(tg, &root_task_group);
  79. return ag;
  80. out_free:
  81. kfree(ag);
  82. out_fail:
  83. if (printk_ratelimit()) {
  84. printk(KERN_WARNING "autogroup_create: %s failure.\n",
  85. ag ? "sched_create_group()" : "kmalloc()");
  86. }
  87. return autogroup_kref_get(&autogroup_default);
  88. }
  89. bool task_wants_autogroup(struct task_struct *p, struct task_group *tg)
  90. {
  91. if (tg != &root_task_group)
  92. return false;
  93. /*
  94. * If we race with autogroup_move_group() the caller can use the old
  95. * value of signal->autogroup but in this case sched_move_task() will
  96. * be called again before autogroup_kref_put().
  97. *
  98. * However, there is no way sched_autogroup_exit_task() could tell us
  99. * to avoid autogroup->tg, so we abuse PF_EXITING flag for this case.
  100. */
  101. if (p->flags & PF_EXITING)
  102. return false;
  103. return true;
  104. }
  /*
   * Exit-path hook for task @p: re-evaluates the task's scheduling group
   * through sched_move_task().
   */
  void sched_autogroup_exit_task(struct task_struct *p)
  {
      /*
       * exit_notify() is about to run, after which autogroup_move_group()
       * can no longer see this thread, so signal->autogroup must not be
       * used from here on.  The PF_EXITING test in task_wants_autogroup()
       * is the other half of this arrangement.
       */
      sched_move_task(p);
  }
  114. static void
  115. autogroup_move_group(struct task_struct *p, struct autogroup *ag)
  116. {
  117. struct autogroup *prev;
  118. struct task_struct *t;
  119. unsigned long flags;
  120. BUG_ON(!lock_task_sighand(p, &flags));
  121. prev = p->signal->autogroup;
  122. if (prev == ag) {
  123. unlock_task_sighand(p, &flags);
  124. return;
  125. }
  126. p->signal->autogroup = autogroup_kref_get(ag);
  127. /*
  128. * We can't avoid sched_move_task() after we changed signal->autogroup,
  129. * this process can already run with task_group() == prev->tg or we can
  130. * race with cgroup code which can read autogroup = prev under rq->lock.
  131. * In the latter case for_each_thread() can not miss a migrating thread,
  132. * cpu_cgroup_attach() must not be possible after cgroup_exit() and it
  133. * can't be removed from thread list, we hold ->siglock.
  134. *
  135. * If an exiting thread was already removed from thread list we rely on
  136. * sched_autogroup_exit_task().
  137. */
  138. for_each_thread(p, t)
  139. sched_move_task(t);
  140. unlock_task_sighand(p, &flags);
  141. autogroup_kref_put(prev);
  142. }
  /*
   * Create a fresh autogroup and move the process of @p into it.
   *
   * Allocates GFP_KERNEL, cannot be called under any spinlock.
   */
  void sched_autogroup_create_attach(struct task_struct *p)
  {
      struct autogroup *fresh = autogroup_create();

      autogroup_move_group(p, fresh);

      /* autogroup_create() handed us a reference of our own; release it */
      autogroup_kref_put(fresh);
  }
  EXPORT_SYMBOL(sched_autogroup_create_attach);
  152. /* Cannot be called under siglock. Currently has no users */
  153. void sched_autogroup_detach(struct task_struct *p)
  154. {
  155. autogroup_move_group(p, &autogroup_default);
  156. }
  157. EXPORT_SYMBOL(sched_autogroup_detach);
  158. void sched_autogroup_fork(struct signal_struct *sig)
  159. {
  160. sig->autogroup = autogroup_task_get(current);
  161. }
  162. void sched_autogroup_exit(struct signal_struct *sig)
  163. {
  164. autogroup_kref_put(sig->autogroup);
  165. }
  166. static int __init setup_autogroup(char *str)
  167. {
  168. sysctl_sched_autogroup_enabled = 0;
  169. return 1;
  170. }
  171. __setup("noautogroup", setup_autogroup);
  172. #ifdef CONFIG_PROC_FS
  173. int proc_sched_autogroup_set_nice(struct task_struct *p, int nice)
  174. {
  175. static unsigned long next = INITIAL_JIFFIES;
  176. struct autogroup *ag;
  177. unsigned long shares;
  178. int err;
  179. if (nice < MIN_NICE || nice > MAX_NICE)
  180. return -EINVAL;
  181. err = security_task_setnice(current, nice);
  182. if (err)
  183. return err;
  184. if (nice < 0 && !can_nice(current, nice))
  185. return -EPERM;
  186. /* this is a heavy operation taking global locks.. */
  187. if (!capable(CAP_SYS_ADMIN) && time_before(jiffies, next))
  188. return -EAGAIN;
  189. next = HZ / 10 + jiffies;
  190. ag = autogroup_task_get(p);
  191. shares = scale_load(sched_prio_to_weight[nice + 20]);
  192. down_write(&ag->lock);
  193. err = sched_group_set_shares(ag->tg, shares);
  194. if (!err)
  195. ag->nice = nice;
  196. up_write(&ag->lock);
  197. autogroup_kref_put(ag);
  198. return err;
  199. }
  200. void proc_sched_autogroup_show_task(struct task_struct *p, struct seq_file *m)
  201. {
  202. struct autogroup *ag = autogroup_task_get(p);
  203. if (!task_group_is_autogroup(ag->tg))
  204. goto out;
  205. down_read(&ag->lock);
  206. seq_printf(m, "/autogroup-%ld nice %d\n", ag->id, ag->nice);
  207. up_read(&ag->lock);
  208. out:
  209. autogroup_kref_put(ag);
  210. }
  211. #endif /* CONFIG_PROC_FS */
  212. #ifdef CONFIG_SCHED_DEBUG
  213. int autogroup_path(struct task_group *tg, char *buf, int buflen)
  214. {
  215. if (!task_group_is_autogroup(tg))
  216. return 0;
  217. return snprintf(buf, buflen, "%s-%ld", "/autogroup", tg->autogroup->id);
  218. }
  219. #endif /* CONFIG_SCHED_DEBUG */