cgroup: Fix task counter common ancestor logic
author Frederic Weisbecker <fweisbec@gmail.com>
Thu, 8 Dec 2011 04:42:38 +0000 (15:42 +1100)
committer Stephen Rothwell <sfr@canb.auug.org.au>
Fri, 9 Dec 2011 04:57:58 +0000 (15:57 +1100)
The task counter subsystem has been written assuming that
can_attach_task/attach_task/cancel_attach_task calls are serialized per
task.  This is true when we attach only one task but not when we attach a
whole thread group, in which case the sequence is:

	for each thread
		if (can_attach_task() < 0)
			goto rollback

	for each thread
		attach_task()

rollback:
	for each thread
		cancel_attach_task()

The common ancestor, looked up in task_counter_can_attach_task(), can thus
change between each of these calls for a given task.  This breaks if the
tasks in the thread group do not all originate from the same cgroup: the
uncharge made in attach_task(), or the rollback made in
cancel_attach_task(), would then propagate up to the wrong ancestor in the
hierarchy.
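
For context, the subsystem cached that ancestor in a single variable shared
across the whole attach sequence.  The sketch below is reconstructed from the
lines removed further down in kernel/cgroup_task_counter.c and is illustrative
only (the charging done in can_attach_task() is elided); it shows why the
per-thread calls stomp on each other:

	/* One ancestor for every thread of the group, protected by cgroup_mutex */
	static struct res_counter *common_ancestor;

	static int task_counter_can_attach_task(struct cgroup *cgrp,
						struct cgroup *old_cgrp,
						struct task_struct *tsk)
	{
		/* Overwrites the value computed for the previous thread */
		common_ancestor = res_counter_common_ancestor(
					cgroup_task_res_counter(cgrp),
					cgroup_task_res_counter(old_cgrp));

		/* ... charge the destination up to common_ancestor (elided) ... */
		return 0;
	}

	static void task_counter_attach_task(struct cgroup *cgrp,
					     struct cgroup *old_cgrp,
					     struct task_struct *tsk)
	{
		/*
		 * common_ancestor now belongs to whichever thread was probed
		 * last: if tsk started from a different cgroup, the wrong
		 * subtree gets uncharged, or a NULL counter as in the oops
		 * below.
		 */
		res_counter_uncharge_until(cgroup_task_res_counter(old_cgrp),
					   common_ancestor, 1);
	}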

This can even break seriously in some scenarios.  For example, with $PID
being the pid of a multithreaded process:

mkdir /dev/cgroup/cgroup0
echo $PID > /dev/cgroup/cgroup0/cgroup.procs
echo $PID > /dev/cgroup/tasks
echo $PID > /dev/cgroup/cgroup0/cgroup.procs

On the last move, attach_task() is called on the thread leader with
the wrong common_ancestor, leading to a crash because we uncharge
a res_counter that doesn't exist:

[  149.805063] BUG: unable to handle kernel NULL pointer dereference at 0000000000000040
[  149.806013] IP: [<ffffffff810a0172>] __lock_acquire+0x62/0x15d0
[  149.806013] PGD 51d38067 PUD 5119e067 PMD 0
[  149.806013] Oops: 0000 [#1] PREEMPT SMP
[  149.806013] Dumping ftrace buffer:
[  149.806013]    (ftrace buffer empty)
[  149.806013] CPU 3
[  149.806013] Modules linked in:
[  149.806013]
[  149.806013] Pid: 1111, comm: spread_thread_g Not tainted 3.1.0-rc3+ #165 FUJITSU SIEMENS AMD690VM-FMH/AMD690VM-FMH
[  149.806013] RIP: 0010:[<ffffffff810a0172>]  [<ffffffff810a0172>] __lock_acquire+0x62/0x15d0
[  149.806013] RSP: 0018:ffff880051479b38  EFLAGS: 00010046
[  149.806013] RAX: 0000000000000046 RBX: 0000000000000040 RCX: 0000000000000000
[  149.868002] RDX: 0000000000000001 RSI: 0000000000000000 RDI: 0000000000000040
[  149.868002] RBP: ffff880051479c08 R08: 0000000000000002 R09: 0000000000000001
[  149.868002] R10: 0000000000000000 R11: 0000000000000000 R12: 0000000000000002
[  149.868002] R13: 0000000000000000 R14: 0000000000000000 R15: ffff880051f120a0
[  149.868002] FS:  00007f1e01dd7700(0000) GS:ffff880057d80000(0000) knlGS:0000000000000000
[  149.868002] CS:  0010 DS: 0000 ES: 0000 CR0: 0000000080050033
[  149.868002] CR2: 0000000000000040 CR3: 0000000051c59000 CR4: 00000000000006e0
[  149.868002] DR0: 0000000000000000 DR1: 0000000000000000 DR2: 0000000000000000
[  149.868002] DR3: 0000000000000000 DR6: 00000000ffff0ff0 DR7: 0000000000000400
[  149.868002] Process spread_thread_g (pid: 1111, threadinfo ffff880051478000, task ffff880051f120a0)
[  149.868002] Stack:
[  149.868002]  0000000000000000 0000000000000000 0000000000000000 0000000000000000
[  149.868002]  0000000000000000 0000000000000000 0000000000000000 0000000000000000
[  149.868002]  0000000000000000 0000000000000000 0000000000000000 0000000000000000
[  149.868002] Call Trace:
[  149.868002]  [<ffffffff810a1d32>] lock_acquire+0xa2/0x1a0
[  149.868002]  [<ffffffff810c373c>] ? res_counter_uncharge_until+0x4c/0xb0
[  149.868002]  [<ffffffff8180802b>] _raw_spin_lock+0x3b/0x50
[  149.868002]  [<ffffffff810c373c>] ? res_counter_uncharge_until+0x4c/0xb0
[  149.868002]  [<ffffffff810c373c>] res_counter_uncharge_until+0x4c/0xb0
[  149.868002]  [<ffffffff810c26c4>] task_counter_attach_task+0x44/0x50
[  149.868002]  [<ffffffff810bffcd>] cgroup_attach_proc+0x5ad/0x720
[  149.868002]  [<ffffffff810bfa99>] ? cgroup_attach_proc+0x79/0x720
[  149.868002]  [<ffffffff810c01cf>] attach_task_by_pid+0x8f/0x220
[  149.868002]  [<ffffffff810c0230>] ? attach_task_by_pid+0xf0/0x220
[  149.868002]  [<ffffffff810c0230>] ? attach_task_by_pid+0xf0/0x220
[  149.868002]  [<ffffffff810c0388>] cgroup_procs_write+0x28/0x40
[  149.868002]  [<ffffffff810c0bd9>] cgroup_file_write+0x209/0x2f0
[  149.868002]  [<ffffffff812b8d08>] ? apparmor_file_permission+0x18/0x20
[  149.868002]  [<ffffffff8127ef43>] ? security_file_permission+0x23/0x90
[  149.868002]  [<ffffffff81157038>] vfs_write+0xc8/0x190
[  149.868002]  [<ffffffff811571f1>] sys_write+0x51/0x90
[  149.868002]  [<ffffffff818102c2>] system_call_fastpath+0x16/0x1b

To solve this, cache the original cgroup of each thread in the thread
group in the flex array and pass it to can_attach_task(), attach_task()
and cancel_attach_task(), so that the correct common ancestor between the
old and the new cgroup can be safely retrieved for each task.
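
A condensed sketch of what the hunks below implement (all helpers are the
ones visible in the diff): each thread's origin cgroup is recorded once,
while cgroup_attach_proc() fills the flex array, and every callback derives
the ancestor from its own (new, old) cgroup pair instead of relying on
shared state.

	/* Each flex array slot now carries the thread and its origin cgroup */
	struct task_cgroup {
		struct task_struct *tsk;
		struct cgroup *oldcgrp;	/* task_cgroup_from_root(tsk, root) */
	};

	/* The ancestor is recomputed per task, from that task's own origin */
	static void task_counter_attach_task(struct cgroup *cgrp,
					     struct cgroup *old_cgrp,
					     struct task_struct *tsk)
	{
		struct res_counter *res = cgroup_task_res_counter(cgrp);
		struct res_counter *old_res = cgroup_task_res_counter(old_cgrp);
		struct res_counter *common_ancestor;

		common_ancestor = res_counter_common_ancestor(res, old_res);
		res_counter_uncharge_until(old_res, common_ancestor, 1);
	}

cancel_attach_task() follows the same pattern, uncharging the destination
counter up to the ancestor it recomputes for that task.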

This is inspired by a previous patch from Li Zefan:
"[PATCH] cgroups: don't cache common ancestor in task counter subsys".

Reported-by: Ben Blum <bblum@andrew.cmu.edu>
Reported-by: Li Zefan <lizf@cn.fujitsu.com>
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Cc: Paul Menage <paul@paulmenage.org>
Cc: Tim Hockin <thockin@hockin.org>
Cc: Tejun Heo <htejun@gmail.com>
Cc: KAMEZAWA Hiroyuki <kamezawa.hiroyu@jp.fujitsu.com>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
Documentation/cgroups/cgroups.txt
include/linux/cgroup.h
kernel/cgroup.c
kernel/cgroup_task_counter.c

index 3fa646f6c6d68a3b05f2fa5f2a62e415d6c671fb..7df0e5b6f4cda841b0a8d429bcf66417bd235f76 100644 (file)
@@ -623,7 +623,8 @@ function, so that the subsystem can implement a rollback. If not, not necessary.
 This will be called only about subsystems whose can_attach() operation have
 succeeded.
 
-void cancel_attach_task(struct cgroup *cgrp, struct task_struct *tsk)
+void cancel_attach_task(struct cgroup *cgrp, struct cgroup *old_cgrp,
+                       struct task_struct *tsk)
 (cgroup_mutex held by caller)
 
 As cancel_attach, but for operations that must be cancelled once per
index ddc13eb76b09eafe813388d35a28dd1bd14157f3..8dada1dbc73e5339887d7bd422b338fd9d2e1b71 100644 (file)
@@ -475,7 +475,7 @@ struct cgroup_subsys {
                               struct task_struct *tsk);
        void (*cancel_attach)(struct cgroup_subsys *ss, struct cgroup *cgrp,
                              struct task_struct *tsk);
-       void (*cancel_attach_task)(struct cgroup *cgrp,
+       void (*cancel_attach_task)(struct cgroup *cgrp, struct cgroup *old_cgrp,
                                   struct task_struct *tsk);
        void (*pre_attach)(struct cgroup *cgrp);
        void (*attach_task)(struct cgroup *cgrp, struct cgroup *old_cgrp,
index 893fc3d5c87604d738c9a5cbee461671212d4858..19a4faff23316166ee4bcde12bf71640eda0eae3 100644 (file)
@@ -1885,7 +1885,7 @@ out:
                                break;
 
                        if (ss->cancel_attach_task)
-                               ss->cancel_attach_task(cgrp, tsk);
+                               ss->cancel_attach_task(cgrp, oldcgrp, tsk);
                        if (ss->cancel_attach)
                                ss->cancel_attach(ss, cgrp, tsk);
                }
@@ -1983,6 +1983,11 @@ static int css_set_prefetch(struct cgroup *cgrp, struct css_set *cg,
        return 0;
 }
 
+struct task_cgroup {
+       struct task_struct *tsk;
+       struct cgroup *oldcgrp;
+};
+
 /**
  * cgroup_attach_proc - attach all threads in a threadgroup to a cgroup
  * @cgrp: the cgroup to attach to
@@ -2003,6 +2008,7 @@ int cgroup_attach_proc(struct cgroup *cgrp, struct task_struct *leader)
        /* threadgroup list cursor and array */
        struct task_struct *tsk;
        struct flex_array *group;
+       struct task_cgroup *tc;
        /*
         * we need to make sure we have css_sets for all the tasks we're
         * going to move -before- we actually start moving them, so that in
@@ -2020,7 +2026,7 @@ int cgroup_attach_proc(struct cgroup *cgrp, struct task_struct *leader)
         */
        group_size = get_nr_threads(leader);
        /* flex_array supports very large thread-groups better than kmalloc. */
-       group = flex_array_alloc(sizeof(struct task_struct *), group_size,
+       group = flex_array_alloc(sizeof(struct task_cgroup), group_size,
                                 GFP_KERNEL);
        if (!group)
                return -ENOMEM;
@@ -2047,14 +2053,18 @@ int cgroup_attach_proc(struct cgroup *cgrp, struct task_struct *leader)
        tsk = leader;
        i = 0;
        do {
+               struct task_cgroup tsk_cgrp;
+
                /* as per above, nr_threads may decrease, but not increase. */
                BUG_ON(i >= group_size);
                get_task_struct(tsk);
+               tsk_cgrp.tsk = tsk;
+               tsk_cgrp.oldcgrp = task_cgroup_from_root(tsk, root);
                /*
                 * saying GFP_ATOMIC has no effect here because we did prealloc
                 * earlier, but it's good form to communicate our expectations.
                 */
-               retval = flex_array_put_ptr(group, i, tsk, GFP_ATOMIC);
+               retval = flex_array_put(group, i, &tsk_cgrp, GFP_ATOMIC);
                BUG_ON(retval != 0);
                i++;
        } while_each_thread(leader, tsk);
@@ -2077,14 +2087,13 @@ int cgroup_attach_proc(struct cgroup *cgrp, struct task_struct *leader)
                if (ss->can_attach_task) {
                        /* run on each task in the threadgroup. */
                        for (i = 0; i < group_size; i++) {
-                               tsk = flex_array_get_ptr(group, i);
-                               oldcgrp = task_cgroup_from_root(tsk, root);
-
+                               tc = flex_array_get(group, i);
                                retval = ss->can_attach_task(cgrp,
-                                                            oldcgrp, tsk);
+                                                            tc->oldcgrp,
+                                                            tc->tsk);
                                if (retval) {
                                        failed_ss = ss;
-                                       failed_task = tsk;
+                                       failed_task = tc->tsk;
                                        goto out_cancel_attach;
                                }
                        }
@@ -2097,10 +2106,10 @@ int cgroup_attach_proc(struct cgroup *cgrp, struct task_struct *leader)
         */
        INIT_LIST_HEAD(&newcg_list);
        for (i = 0; i < group_size; i++) {
-               tsk = flex_array_get_ptr(group, i);
+               tc = flex_array_get(group, i);
+               tsk = tc->tsk;
                /* nothing to do if this task is already in the cgroup */
-               oldcgrp = task_cgroup_from_root(tsk, root);
-               if (cgrp == oldcgrp)
+               if (cgrp == tc->oldcgrp)
                        continue;
                /* get old css_set pointer */
                task_lock(tsk);
@@ -2136,9 +2145,10 @@ int cgroup_attach_proc(struct cgroup *cgrp, struct task_struct *leader)
                        ss->pre_attach(cgrp);
        }
        for (i = 0; i < group_size; i++) {
-               tsk = flex_array_get_ptr(group, i);
+               tc = flex_array_get(group, i);
+               tsk = tc->tsk;
+               oldcgrp = tc->oldcgrp;
                /* leave current thread as it is if it's already there */
-               oldcgrp = task_cgroup_from_root(tsk, root);
                if (cgrp == oldcgrp)
                        continue;
                /* if the thread is PF_EXITING, it can just get skipped. */
@@ -2151,7 +2161,7 @@ int cgroup_attach_proc(struct cgroup *cgrp, struct task_struct *leader)
                        }
                } else if (retval == -ESRCH) {
                        if (ss->cancel_attach_task)
-                               ss->cancel_attach_task(cgrp, tsk);
+                               ss->cancel_attach_task(cgrp, oldcgrp, tsk);
                } else {
                        BUG_ON(1);
                }
@@ -2188,10 +2198,10 @@ out_cancel_attach:
                        if (ss->cancel_attach_task && (ss != failed_ss ||
                                                       failed_task)) {
                                for (i = 0; i < group_size; i++) {
-                                       tsk = flex_array_get_ptr(group, i);
-                                       if (tsk == failed_task)
+                                       tc = flex_array_get(group, i);
+                                       if (tc->tsk == failed_task)
                                                break;
-                                       ss->cancel_attach_task(cgrp, tsk);
+                                       ss->cancel_attach_task(cgrp, tc->oldcgrp, tc->tsk);
                                }
                        }
 
@@ -2206,8 +2216,8 @@ out_cancel_attach:
        }
        /* clean up the array of referenced threads in the group. */
        for (i = 0; i < group_size; i++) {
-               tsk = flex_array_get_ptr(group, i);
-               put_task_struct(tsk);
+               tc = flex_array_get(group, i);
+               put_task_struct(tc->tsk);
        }
 out_free_group_list:
        flex_array_free(group);
index d3b2a8290fef57c3d9c8b2c5d2fe14e12a38c79b..c04340d0ef9861d71f25ab8fd4986118d6fa0922 100644 (file)
@@ -94,12 +94,6 @@ static void task_counter_exit(struct cgroup_subsys *ss, struct cgroup *cgrp,
                res_counter_uncharge(cgroup_task_res_counter(old_cgrp), 1);
 }
 
-/*
- * Protected amongst can_attach_task/attach_task/cancel_attach_task by
- * cgroup mutex
- */
-static struct res_counter *common_ancestor;
-
 /*
  * This does more than just probing the ability to attach to the dest cgroup.
  * We can not just _check_ if we can attach to the destination and do the real
@@ -111,9 +105,10 @@ static int task_counter_can_attach_task(struct cgroup *cgrp,
                                        struct cgroup *old_cgrp,
                                        struct task_struct *tsk)
 {
+       int err;
+       struct res_counter *common_ancestor;
        struct res_counter *res = cgroup_task_res_counter(cgrp);
        struct res_counter *old_res = cgroup_task_res_counter(old_cgrp);
-       int err;
 
        /*
         * When moving a task from a cgroup to another, we don't want
@@ -138,10 +133,15 @@ static int task_counter_can_attach_task(struct cgroup *cgrp,
 
 /* Uncharge the dest cgroup that we charged in task_counter_can_attach_task() */
 static void task_counter_cancel_attach_task(struct cgroup *cgrp,
+                                           struct cgroup *old_cgrp,
                                            struct task_struct *tsk)
 {
-       res_counter_uncharge_until(cgroup_task_res_counter(cgrp),
-                                  common_ancestor, 1);
+       struct res_counter *common_ancestor;
+       struct res_counter *res = cgroup_task_res_counter(cgrp);
+       struct res_counter *old_res = cgroup_task_res_counter(old_cgrp);
+
+       common_ancestor = res_counter_common_ancestor(res, old_res);
+       res_counter_uncharge_until(res, common_ancestor, 1);
 }
 
 /*
@@ -155,8 +155,12 @@ static void task_counter_attach_task(struct cgroup *cgrp,
                                     struct cgroup *old_cgrp,
                                     struct task_struct *tsk)
 {
-       res_counter_uncharge_until(cgroup_task_res_counter(old_cgrp),
-                                  common_ancestor, 1);
+       struct res_counter *common_ancestor;
+       struct res_counter *res = cgroup_task_res_counter(cgrp);
+       struct res_counter *old_res = cgroup_task_res_counter(old_cgrp);
+
+       common_ancestor = res_counter_common_ancestor(res, old_res);
+       res_counter_uncharge_until(old_res, common_ancestor, 1);
 }
 
 static u64 task_counter_read_u64(struct cgroup *cgrp, struct cftype *cft)