ptrace: fix ptrace vs tasklist_lock race

As explained by Alexander Fyodorov <halcy@yandex.ru>:

|read_lock(&tasklist_lock) in ptrace_stop() is converted to mutex on RT kernel,
|and it can remove __TASK_TRACED from task->state (by moving it to
|task->saved_state). If parent does wait() on child followed by a sys_ptrace
|call, the following race can happen:
|
|- child sets __TASK_TRACED in ptrace_stop()
|- parent does wait() which eventually calls wait_task_stopped() and returns
|  child's pid
|- child blocks on read_lock(&tasklist_lock) in ptrace_stop() and moves
|  __TASK_TRACED flag to saved_state
|- parent calls sys_ptrace, which calls ptrace_check_attach() and wait_task_inactive()
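
For context, the RT sleeping-lock slow path parks and restores the task
state roughly like this (a simplified sketch of the rtmutex slow path,
not code from this patch):

	/* going to sleep on the converted "read_lock" */
	raw_spin_lock_irqsave(&current->pi_lock, flags);
	current->saved_state = current->state;	/* __TASK_TRACED parked here */
	current->state = TASK_UNINTERRUPTIBLE;	/* ...while blocked on the lock */
	raw_spin_unlock_irqrestore(&current->pi_lock, flags);

	/* ... block until the lock is available ... */

	/* woken up, lock acquired */
	raw_spin_lock_irqsave(&current->pi_lock, flags);
	current->state = current->saved_state;	/* __TASK_TRACED reappears */
	current->saved_state = TASK_RUNNING;
	raw_spin_unlock_irqrestore(&current->pi_lock, flags);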

The patch is based on his initial patch, with an additional check for
the case where __TASK_TRACED has been moved to ->saved_state. The
->pi_lock is held across the check so the task cannot move the flag
between ->state and ->saved_state while the caller is looking at them.

Signed-off-by: Sebastian Andrzej Siewior <bigeasy@linutronix.de>
Author:    Sebastian Andrzej Siewior, 2013-08-29 18:21:04 +02:00
Committer: Alibek Omarov
parent 9d05b17470
commit 76aef5dded

3 changed files with 67 additions and 7 deletions

--- a/include/linux/sched.h
+++ b/include/linux/sched.h

@@ -236,10 +236,7 @@ extern char ___assert_task_state[1 - 2*!!(
 				 TASK_UNINTERRUPTIBLE | __TASK_STOPPED | \
 				 __TASK_TRACED | EXIT_ZOMBIE | EXIT_DEAD)
 
-#define task_is_traced(task)	((task->state & __TASK_TRACED) != 0)
 #define task_is_stopped(task)	((task->state & __TASK_STOPPED) != 0)
-#define task_is_stopped_or_traced(task)	\
-			((task->state & (__TASK_STOPPED | __TASK_TRACED)) != 0)
 #define task_contributes_to_load(task)	\
 		((task->state & TASK_UNINTERRUPTIBLE) != 0 && \
 		 (task->flags & PF_FROZEN) == 0)
@@ -2635,6 +2632,51 @@ static inline int signal_pending_state(long state, struct task_struct *p)
 	return (state & TASK_INTERRUPTIBLE) || __fatal_signal_pending(p);
 }
 
+static inline bool __task_is_stopped_or_traced(struct task_struct *task)
+{
+	if (task->state & (__TASK_STOPPED | __TASK_TRACED))
+		return true;
+#ifdef CONFIG_PREEMPT_RT_FULL
+	if (task->saved_state & (__TASK_STOPPED | __TASK_TRACED))
+		return true;
+#endif
+	return false;
+}
+
+static inline bool task_is_stopped_or_traced(struct task_struct *task)
+{
+	bool traced_stopped;
+
+#ifdef CONFIG_PREEMPT_RT_FULL
+	unsigned long flags;
+
+	raw_spin_lock_irqsave(&task->pi_lock, flags);
+	traced_stopped = __task_is_stopped_or_traced(task);
+	raw_spin_unlock_irqrestore(&task->pi_lock, flags);
+#else
+	traced_stopped = __task_is_stopped_or_traced(task);
+#endif
+	return traced_stopped;
+}
+
+static inline bool task_is_traced(struct task_struct *task)
+{
+	bool traced = false;
+
+	if (task->state & __TASK_TRACED)
+		return true;
+#ifdef CONFIG_PREEMPT_RT_FULL
+	/* in case the task is sleeping on tasklist_lock */
+	raw_spin_lock_irq(&task->pi_lock);
+	if (task->state & __TASK_TRACED)
+		traced = true;
+	else if (task->saved_state & __TASK_TRACED)
+		traced = true;
+	raw_spin_unlock_irq(&task->pi_lock);
+#endif
+	return traced;
+}
+
 /*
  * cond_resched() and cond_resched_lock(): latency reduction via
  * explicit rescheduling in places that are safe. The return
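
The split into two helpers is deliberate: task_is_stopped_or_traced()
takes ->pi_lock so that ->state and ->saved_state are read as one
consistent pair, while the lockless __task_is_stopped_or_traced() is a
best-effort variant kept for the purely diagnostic WARN_ON() in
wake_up_process() (last hunk below). An illustrative timeline of the
interleaving the lock rules out (not taken from the patch):

	/*
	 * Unlocked checker racing with the RT slow path (which moves the
	 * state under ->pi_lock):
	 *
	 *   checker                      tracee
	 *   read ->state                 (sleeping, TASK_UNINTERRUPTIBLE)
	 *     -> no __TASK_TRACED
	 *                                ->state = ->saved_state;
	 *                                ->saved_state = TASK_RUNNING;
	 *   read ->saved_state
	 *     -> no __TASK_TRACED either, though the task was traced all along
	 *
	 * Holding ->pi_lock across both reads excludes this interleaving.
	 */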

--- a/kernel/ptrace.c
+++ b/kernel/ptrace.c

@@ -135,7 +135,12 @@ static bool ptrace_freeze_traced(struct task_struct *task)
 
 	spin_lock_irq(&task->sighand->siglock);
 	if (task_is_traced(task) && !__fatal_signal_pending(task)) {
-		task->state = __TASK_TRACED;
+		raw_spin_lock_irq(&task->pi_lock);
+		if (task->state & __TASK_TRACED)
+			task->state = __TASK_TRACED;
+		else
+			task->saved_state = __TASK_TRACED;
+		raw_spin_unlock_irq(&task->pi_lock);
 		ret = true;
 	}
 	spin_unlock_irq(&task->sighand->siglock);
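
For orientation, ptrace_freeze_traced() reads roughly as follows after
this change (reconstructed from a 3.x-era tree, so details outside the
hunk may differ):

	static bool ptrace_freeze_traced(struct task_struct *task)
	{
		bool ret = false;

		/* Lockless, nobody but us can set this flag */
		if (task->ptrace & PT_SEIZED)
			return ret;

		spin_lock_irq(&task->sighand->siglock);
		if (task_is_traced(task) && !__fatal_signal_pending(task)) {
			/* Freeze whichever field currently holds the traced
			 * state; ->pi_lock pairs with the save/restore in
			 * the RT lock slow path. */
			raw_spin_lock_irq(&task->pi_lock);
			if (task->state & __TASK_TRACED)
				task->state = __TASK_TRACED;
			else
				task->saved_state = __TASK_TRACED;
			raw_spin_unlock_irq(&task->pi_lock);
			ret = true;
		}
		spin_unlock_irq(&task->sighand->siglock);

		return ret;
	}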

--- a/kernel/sched/core.c
+++ b/kernel/sched/core.c

@@ -1122,6 +1122,18 @@ struct migration_arg {
 
 static int migration_cpu_stop(void *data);
 
+static bool check_task_state(struct task_struct *p, long match_state)
+{
+	bool match = false;
+
+	raw_spin_lock_irq(&p->pi_lock);
+	if (p->state == match_state || p->saved_state == match_state)
+		match = true;
+	raw_spin_unlock_irq(&p->pi_lock);
+
+	return match;
+}
+
 /*
  * wait_task_inactive - wait for a thread to unschedule.
  *
@@ -1166,7 +1178,7 @@ unsigned long wait_task_inactive(struct task_struct *p, long match_state)
 		 * is actually now running somewhere else!
 		 */
 		while (task_running(rq, p)) {
-			if (match_state && unlikely(p->state != match_state))
+			if (match_state && !check_task_state(p, match_state))
 				return 0;
 			cpu_relax();
 		}
@@ -1181,7 +1193,8 @@ unsigned long wait_task_inactive(struct task_struct *p, long match_state)
 		running = task_running(rq, p);
 		on_rq = p->on_rq;
 		ncsw = 0;
-		if (!match_state || p->state == match_state)
+		if (!match_state || p->state == match_state
+		    || p->saved_state == match_state)
 			ncsw = p->nvcsw | LONG_MIN; /* sets MSB */
 		task_rq_unlock(rq, p, &flags);
 
@@ -1685,7 +1698,7 @@ out:
  */
 int wake_up_process(struct task_struct *p)
 {
-	WARN_ON(task_is_stopped_or_traced(p));
+	WARN_ON(__task_is_stopped_or_traced(p));
 	return try_to_wake_up(p, TASK_NORMAL, 0);
 }
 EXPORT_SYMBOL(wake_up_process);
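
Taken together, the call chain this patch repairs looks like this
(simplified sketch; intermediate helpers elided):

	/*
	 * sys_ptrace()
	 *   ptrace_check_attach(child, ...)
	 *     ptrace_freeze_traced(child)  -- may now set ->saved_state
	 *     wait_task_inactive(child, __TASK_TRACED)
	 *       check_task_state(child, __TASK_TRACED)
	 *         -- matches __TASK_TRACED in either ->state or
	 *            ->saved_state, so the parent no longer fails while
	 *            the child sleeps on the converted tasklist_lock
	 */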