On Tue, Jun 05, 2018 at 05:22:12PM +0200, Peter Zijlstra wrote:
> > OK, but __kthread_parkme() can be preempted before it calls schedule(), so the
> > caller still can be migrated? Plus kthread_park_complete() can be called twice.
>
> Argh... I forgot TASK_DEAD does the whole thing with preempt_disable().
> Let me stare at that a bit.

This should ensure we only ever complete when we read PARKED, right?

diff --git a/kernel/sched/core.c b/kernel/sched/core.c
index 8d59b259af4a..e513b4600796 100644
--- a/kernel/sched/core.c
+++ b/kernel/sched/core.c
@@ -2641,7 +2641,7 @@ prepare_task_switch(struct rq *rq, struct task_struct *prev,
  * past. prev == current is still correct but we need to recalculate this_rq
  * because prev may have moved to another CPU.
  */
-static struct rq *finish_task_switch(struct task_struct *prev)
+static struct rq *finish_task_switch(struct task_struct *prev, bool preempt)
 	__releases(rq->lock)
 {
 	struct rq *rq = this_rq();
@@ -2674,7 +2674,7 @@ static struct rq *finish_task_switch(struct task_struct *prev)
 	 *
 	 * We must observe prev->state before clearing prev->on_cpu (in
 	 * finish_task), otherwise a concurrent wakeup can get prev
-	 * running on another CPU and we could rave with its RUNNING -> DEAD
+	 * running on another CPU and we could race with its RUNNING -> DEAD
 	 * transition, resulting in a double drop.
 	 */
 	prev_state = prev->state;
@@ -2720,7 +2720,8 @@ static struct rq *finish_task_switch(struct task_struct *prev)
 			break;

 		case TASK_PARKED:
-			kthread_park_complete(prev);
+			if (!preempt)
+				kthread_park_complete(prev);
 			break;
 		}
 	}
@@ -2784,7 +2785,7 @@ asmlinkage __visible void schedule_tail(struct task_struct *prev)
 	 * PREEMPT_COUNT kernels).
 	 */

-	rq = finish_task_switch(prev);
+	rq = finish_task_switch(prev, false);
 	balance_callback(rq);
 	preempt_enable();

@@ -2797,7 +2798,7 @@ asmlinkage __visible void schedule_tail(struct task_struct *prev)
  */
 static __always_inline struct rq *
 context_switch(struct rq *rq, struct task_struct *prev,
-	       struct task_struct *next, struct rq_flags *rf)
+	       struct task_struct *next, bool preempt, struct rq_flags *rf)
 {
 	struct mm_struct *mm, *oldmm;

@@ -2839,7 +2840,7 @@ context_switch(struct rq *rq, struct task_struct *prev,
 	switch_to(prev, next, prev);
 	barrier();

-	return finish_task_switch(prev);
+	return finish_task_switch(prev, preempt);
 }

 /*
@@ -3478,7 +3479,7 @@ static void __sched notrace __schedule(bool preempt)
 		trace_sched_switch(preempt, prev, next);

 		/* Also unlocks the rq: */
-		rq = context_switch(rq, prev, next, &rf);
+		rq = context_switch(rq, prev, next, preempt, &rf);
 	} else {
 		rq->clock_update_flags &= ~(RQCF_ACT_SKIP|RQCF_REQ_SKIP);
 		rq_unlock_irq(rq, &rf);
@@ -3487,6 +3488,7 @@ static void __sched notrace __schedule(bool preempt)
 	balance_callback(rq);
 }

+/* called with preemption disabled */
 void __noreturn do_task_dead(void)
 {
 	/* Causes final put_task_struct in finish_task_switch(): */
--
To unsubscribe from this list: send the line "unsubscribe linux-arm-msm" in
the body of a message to majordomo@xxxxxxxxxxxxxxx
More majordomo info at http://vger.kernel.org/majordomo-info.html