sched/numa: Fix use-after-free bug in the task_numa_compare

author Gavin Guo <gavin.guo@canonical.com>

Wed, 20 Jan 2016 04:36:58 +0000 (12:36 +0800)

committer Greg Kroah-Hartman <gregkh@linuxfoundation.org>

Thu, 15 Sep 2016 06:27:45 +0000 (08:27 +0200)
author Gavin Guo <gavin.guo@canonical.com>
Wed, 20 Jan 2016 04:36:58 +0000 (12:36 +0800)
committer Greg Kroah-Hartman <gregkh@linuxfoundation.org>
Thu, 15 Sep 2016 06:27:45 +0000 (08:27 +0200)
diff --git a/kernel/sched/fair.c b/kernel/sched/fair.c

index b8b516c37bf1c282f9b0bcbb0acdbb2a23a1f6bc..8f258f437ac2c12d566e87aaed751d7d7387fb4e 100644 (file)
--- a/kernel/sched/fair.c
+++ b/kernel/sched/fair.c
@@ -1191,8 +1191,6 @@ static void task_numa_assign(struct task_numa_env *env,
  {
         if (env->best_task)
                 put_task_struct(env->best_task);
-       if (p)
-               get_task_struct(p);
  
         env->best_task = p;
         env->best_imp = imp;
@@ -1260,20 +1258,30 @@ static void task_numa_compare(struct task_numa_env *env,
         long imp = env->p->numa_group ? groupimp : taskimp;
         long moveimp = imp;
         int dist = env->dist;
+       bool assigned = false;
  
         rcu_read_lock();
  
         raw_spin_lock_irq(&dst_rq->lock);
         cur = dst_rq->curr;
         /*
-        * No need to move the exiting task, and this ensures that ->curr
-        * wasn't reaped and thus get_task_struct() in task_numa_assign()
-        * is safe under RCU read lock.
-        * Note that rcu_read_lock() itself can't protect from the final
-        * put_task_struct() after the last schedule().
+        * No need to move the exiting task or idle task.
          */
         if ((cur->flags & PF_EXITING) || is_idle_task(cur))
                 cur = NULL;
+       else {
+               /*
+                * The task_struct must be protected here to protect the
+                * p->numa_faults access in the task_weight since the
+                * numa_faults could already be freed in the following path:
+                * finish_task_switch()
+                *     --> put_task_struct()
+                *         --> __put_task_struct()
+                *             --> task_numa_free()
+                */
+               get_task_struct(cur);
+       }
+
         raw_spin_unlock_irq(&dst_rq->lock);
  
         /*
@@ -1357,6 +1365,7 @@ balance:
                  */
                 if (!load_too_imbalanced(src_load, dst_load, env)) {
                         imp = moveimp - 1;
+                       put_task_struct(cur);
                         cur = NULL;
                         goto assign;
                 }
@@ -1382,9 +1391,16 @@ balance:
                 env->dst_cpu = select_idle_sibling(env->p, env->dst_cpu);
  
  assign:
+       assigned = true;
         task_numa_assign(env, cur, imp);
  unlock:
         rcu_read_unlock();
+       /*
+        * The dst_rq->curr isn't assigned. The protection for task_struct is
+        * finished.
+        */
+       if (cur && !assigned)
+               put_task_struct(cur);
  }
  
  static void task_numa_find_cpu(struct task_numa_env *env,
author	Gavin Guo <gavin.guo@canonical.com>
	Wed, 20 Jan 2016 04:36:58 +0000 (12:36 +0800)
committer	Greg Kroah-Hartman <gregkh@linuxfoundation.org>
	Thu, 15 Sep 2016 06:27:45 +0000 (08:27 +0200)