On Tue, Jun 05, 2018 at 05:22:12PM +0200, Peter Zijlstra wrote:

> > OK, but __kthread_parkme() can be preempted before it calls schedule(), so 
> > the
> > caller still can be migrated? Plus kthread_park_complete() can be called 
> > twice.
> 
> Argh... I forgot TASK_DEAD does the whole thing with preempt_disable().
> Let me stare at that a bit.

This should ensure we only ever complete when we read PARKED, right?

diff --git a/kernel/sched/core.c b/kernel/sched/core.c
index 8d59b259af4a..e513b4600796 100644
--- a/kernel/sched/core.c
+++ b/kernel/sched/core.c
@@ -2641,7 +2641,7 @@ prepare_task_switch(struct rq *rq, struct task_struct 
*prev,
  * past. prev == current is still correct but we need to recalculate this_rq
  * because prev may have moved to another CPU.
  */
-static struct rq *finish_task_switch(struct task_struct *prev)
+static struct rq *finish_task_switch(struct task_struct *prev, bool preempt)
        __releases(rq->lock)
 {
        struct rq *rq = this_rq();
@@ -2674,7 +2674,7 @@ static struct rq *finish_task_switch(struct task_struct 
*prev)
         *
         * We must observe prev->state before clearing prev->on_cpu (in
         * finish_task), otherwise a concurrent wakeup can get prev
-        * running on another CPU and we could rave with its RUNNING -> DEAD
+        * running on another CPU and we could race with its RUNNING -> DEAD
         * transition, resulting in a double drop.
         */
        prev_state = prev->state;
@@ -2720,7 +2720,8 @@ static struct rq *finish_task_switch(struct task_struct 
*prev)
                        break;
 
                case TASK_PARKED:
-                       kthread_park_complete(prev);
+                       if (!preempt)
+                               kthread_park_complete(prev);
                        break;
                }
        }
@@ -2784,7 +2785,7 @@ asmlinkage __visible void schedule_tail(struct 
task_struct *prev)
         * PREEMPT_COUNT kernels).
         */
 
-       rq = finish_task_switch(prev);
+       rq = finish_task_switch(prev, false);
        balance_callback(rq);
        preempt_enable();
 
@@ -2797,7 +2798,7 @@ asmlinkage __visible void schedule_tail(struct 
task_struct *prev)
  */
 static __always_inline struct rq *
 context_switch(struct rq *rq, struct task_struct *prev,
-              struct task_struct *next, struct rq_flags *rf)
+              struct task_struct *next, bool preempt, struct rq_flags *rf)
 {
        struct mm_struct *mm, *oldmm;
 
@@ -2839,7 +2840,7 @@ context_switch(struct rq *rq, struct task_struct *prev,
        switch_to(prev, next, prev);
        barrier();
 
-       return finish_task_switch(prev);
+       return finish_task_switch(prev, preempt);
 }
 
 /*
@@ -3478,7 +3479,7 @@ static void __sched notrace __schedule(bool preempt)
                trace_sched_switch(preempt, prev, next);
 
                /* Also unlocks the rq: */
-               rq = context_switch(rq, prev, next, &rf);
+               rq = context_switch(rq, prev, next, preempt, &rf);
        } else {
                rq->clock_update_flags &= ~(RQCF_ACT_SKIP|RQCF_REQ_SKIP);
                rq_unlock_irq(rq, &rf);
@@ -3487,6 +3488,7 @@ static void __sched notrace __schedule(bool preempt)
        balance_callback(rq);
 }
 
+/* called with preemption disabled */
 void __noreturn do_task_dead(void)
 {
        /* Causes final put_task_struct in finish_task_switch(): */

Reply via email to