sched/core: Fix an SMP ordering race in try_to_wake_up() vs. schedule()

author Peter Zijlstra <peterz@infradead.org>

Wed, 7 Oct 2015 12:14:13 +0000 (14:14 +0200)

committer Ingo Molnar <mingo@kernel.org>

Fri, 4 Dec 2015 09:26:43 +0000 (10:26 +0100)
author Peter Zijlstra <peterz@infradead.org>
Wed, 7 Oct 2015 12:14:13 +0000 (14:14 +0200)
committer Ingo Molnar <mingo@kernel.org>
Fri, 4 Dec 2015 09:26:43 +0000 (10:26 +0100)
diff --git a/kernel/sched/core.c b/kernel/sched/core.c
index b64f163d512cbc4adb1477d7d493fd78b3571be2..7063c6a0744055c367eb82159677cfe6522b6c60 100644
--- a/kernel/sched/core.c
+++ b/kernel/sched/core.c
@@ -1946,6 +1946,25 @@ try_to_wake_up(struct task_struct *p, unsigned int state, int wake_flags)
                 goto stat;
  
  #ifdef CONFIG_SMP
+       /*
+        * Ensure we load p->on_cpu _after_ p->on_rq, otherwise it would be
+        * possible to, falsely, observe p->on_cpu == 0.
+        *
+        * One must be running (->on_cpu == 1) in order to remove oneself
+        * from the runqueue.
+        *
+        *  [S] ->on_cpu = 1;   [L] ->on_rq
+        *      UNLOCK rq->lock
+        *                      RMB
+        *      LOCK   rq->lock
+        *  [S] ->on_rq = 0;    [L] ->on_cpu
+        *
+        * Pairs with the full barrier implied in the UNLOCK+LOCK on rq->lock
+        * from the consecutive calls to schedule(); the first switching to our
+        * task, the second putting it to sleep.
+        */
+       smp_rmb();
+
         /*
          * If the owning (remote) cpu is still in the middle of schedule() with
          * this task as prev, wait until it's done referencing the task.
author	Peter Zijlstra <peterz@infradead.org>
	Wed, 7 Oct 2015 12:14:13 +0000 (14:14 +0200)
committer	Ingo Molnar <mingo@kernel.org>
	Fri, 4 Dec 2015 09:26:43 +0000 (10:26 +0100)