Revert "timers: do not raise softirq unconditionally"

This reverts commit 891f510568343d93c5aa2f477b6bebe009b48f05.

An issue arose where, if an rt_mutex (a spin_lock converted to a mutex
in PREEMPT_RT) is taken in hard interrupt context, it can cause a false
deadlock detection and trigger a BUG_ON() from the return value of
task_blocks_on_rt_mutex() in rt_spin_lock_slowlock().

The problem is this:

	CPU0				CPU1
	----				----
  spin_lock(A)
				spin_lock(A)
				[ blocks, but spins as owner
				  on CPU 0 is running ]
				<interrupt>
				spin_trylock(B)
				[ succeeds ]
  spin_lock(B)
  <blocks>

Now the deadlock detection triggers and follows the locking:

  Task X (on CPU0) is blocked on spinlock B, owned by task Y on CPU1
  (via the interrupt taking it with a try lock).

  The owner of B (Y) is blocked on spin_lock A (still spinning).

  A is owned by task X (self). DEADLOCK detected! BUG_ON() triggered.

This was caused by the code that tries not to raise the timer softirq
unconditionally, which was added to let NO_HZ_FULL work. Unfortunately,
reverting that patch breaks NO_HZ_FULL again, but that is still better
than triggering a BUG_ON().

Signed-off-by: Steven Rostedt <rostedt@goodmis.org>

Conflicts:
	kernel/timer.c
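
For illustration only, here is a minimal C sketch of the interleaving
described above. It is not part of this patch; the lock names, task
functions and irq handler below are hypothetical stand-ins. In the
reverted code, the hard-interrupt trylock is the spin_do_trylock() on
the per-CPU timer base->lock in run_local_timers(), so lock B plays the
role of that timer base lock and lock A is whatever lock the
interrupted task happens to be spinning on.

	/* Illustrative sketch, not kernel code from this patch. */
	#include <linux/spinlock.h>
	#include <linux/interrupt.h>

	static DEFINE_SPINLOCK(lock_a);	/* "A": an rt_mutex on PREEMPT_RT */
	static DEFINE_SPINLOCK(lock_b);	/* "B": an rt_mutex on PREEMPT_RT */

	/* Task X on CPU0: owns A, then blocks on B. */
	static void task_x(void)
	{
		spin_lock(&lock_a);	/* X is now the owner of A */
		spin_lock(&lock_b);	/* B is "owned" by Y via the hardirq
					 * trylock on CPU1, so X blocks; the
					 * chain walk sees X -> B -> Y -> A -> X
					 * and the BUG_ON() in
					 * rt_spin_lock_slowlock() fires */
		spin_unlock(&lock_b);
		spin_unlock(&lock_a);
	}

	/* Task Y on CPU1: blocks on A and spins while the owner X runs. */
	static void task_y(void)
	{
		spin_lock(&lock_a);
		spin_unlock(&lock_a);
	}

	/* Hard interrupt arriving on CPU1 on top of the spinning task Y. */
	static irqreturn_t timer_hardirq(int irq, void *dev_id)
	{
		if (spin_trylock(&lock_b)) {	/* succeeds; rt_mutex ownership
						 * is recorded for current,
						 * i.e. task Y */
			spin_unlock(&lock_b);
		}
		return IRQ_HANDLED;
	}

On PREEMPT_RT both locks are rt_mutexes, so a trylock from hard
interrupt context records rt_mutex ownership for whatever task happens
to be current on that CPU; that is what makes the chain walk above find
a cycle even though no real deadlock exists.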
--- a/include/linux/hrtimer.h
+++ b/include/linux/hrtimer.h
@@ -461,8 +461,9 @@ extern int schedule_hrtimeout_range_clock(ktime_t *expires,
 		unsigned long delta, const enum hrtimer_mode mode, int clock);
 extern int schedule_hrtimeout(ktime_t *expires, const enum hrtimer_mode mode);
 
-/* Called from the periodic timer tick */
 /* Soft interrupt function to run the hrtimer queues: */
 extern void hrtimer_run_queues(void);
+extern void hrtimer_run_pending(void);
 
 /* Bootup initialization: */
 extern void __init hrtimers_init(void);
--- a/kernel/hrtimer.c
+++ b/kernel/hrtimer.c
@@ -1716,6 +1716,30 @@ static void run_hrtimer_softirq(struct softirq_action *h)
 	hrtimer_rt_run_pending();
 }
 
+/*
+ * Called from timer softirq every jiffy, expire hrtimers:
+ *
+ * For HRT its the fall back code to run the softirq in the timer
+ * softirq context in case the hrtimer initialization failed or has
+ * not been done yet.
+ */
+void hrtimer_run_pending(void)
+{
+	if (hrtimer_hres_active())
+		return;
+
+	/*
+	 * This _is_ ugly: We have to check in the softirq context,
+	 * whether we can switch to highres and / or nohz mode. The
+	 * clocksource switch happens in the timer interrupt with
+	 * xtime_lock held. Notification from there only sets the
+	 * check bit in the tick_oneshot code, otherwise we might
+	 * deadlock vs. xtime_lock.
+	 */
+	if (tick_check_oneshot_change(!hrtimer_is_hres_enabled()))
+		hrtimer_switch_to_hres();
+}
+
 /*
  * Called from hardirq context every jiffy
  */
@@ -1729,13 +1753,6 @@ void hrtimer_run_queues(void)
 	if (hrtimer_hres_active())
 		return;
 
-	/*
-	 * Check whether we can switch to highres mode.
-	 */
-	if (tick_check_oneshot_change(!hrtimer_is_hres_enabled())
-	    && hrtimer_switch_to_hres())
-		return;
-
 	for (index = 0; index < HRTIMER_MAX_CLOCK_BASES; index++) {
 		base = &cpu_base->clock_base[index];
 		if (!timerqueue_getnext(&base->active))
--- a/kernel/timer.c
+++ b/kernel/timer.c
@@ -1464,6 +1464,8 @@ static void run_timer_softirq(struct softirq_action *h)
 {
 	struct tvec_base *base = __this_cpu_read(tvec_bases);
 
+	hrtimer_run_pending();
+
 #if defined(CONFIG_IRQ_WORK) && defined(CONFIG_PREEMPT_RT_FULL)
 	irq_work_run();
 #endif
@@ -1477,52 +1479,8 @@ static void run_timer_softirq(struct softirq_action *h)
  */
 void run_local_timers(void)
 {
-	struct tvec_base *base = __this_cpu_read(tvec_bases);
-
 	hrtimer_run_queues();
-	/*
-	 * We can access this lockless as we are in the timer
-	 * interrupt. If there are no timers queued, nothing to do in
-	 * the timer softirq.
-	 */
-#ifdef CONFIG_PREEMPT_RT_FULL
-
-#ifndef CONFIG_SMP
-	/*
-	 * The spin_do_trylock() later may fail as the lock may be hold before
-	 * the interrupt arrived. The spin-lock debugging code will raise a
-	 * warning if the try_lock fails on UP. Since this is only an
-	 * optimization for the FULL_NO_HZ case (not to run the timer softirq on
-	 * an nohz_full CPU) we don't really care and shedule the softirq.
-	 */
 	raise_softirq(TIMER_SOFTIRQ);
-	return;
-#endif
-
-	/* On RT, irq work runs from softirq */
-	if (irq_work_needs_cpu()) {
-		raise_softirq(TIMER_SOFTIRQ);
-		return;
-	}
-
-	if (!spin_do_trylock(&base->lock)) {
-		raise_softirq(TIMER_SOFTIRQ);
-		return;
-	}
-#endif
-
-	if (!base->active_timers)
-		goto out;
-
-	/* Check whether the next pending timer has expired */
-	if (time_before_eq(base->next_timer, jiffies))
-		raise_softirq(TIMER_SOFTIRQ);
-out:
-#ifdef CONFIG_PREEMPT_RT_FULL
-	rt_spin_unlock_after_trylock_in_irq(&base->lock);
-#endif
-	/* The ; ensures that gcc won't complain in the !RT case */
-	;
 }
 
 #ifdef __ARCH_WANT_SYS_ALARM