Commit bf967be3 authored by Ingo Molnar

Merge branch 'timers/nohz' of...

Merge branch 'timers/nohz' of git://git.kernel.org/pub/scm/linux/kernel/git/frederic/linux-dynticks into timers/nohz

Pull nohz-full enabling patches from Frederic Weisbecker:

  " This handles perf and CPUs that get more than one task, and fixes posix cpu timers
    handling.

    This can finally stop the tick."
Signed-off-by: Ingo Molnar <mingo@kernel.org>
parents a166fcf0 67826eae
...@@ -799,6 +799,12 @@ static inline int __perf_event_disable(void *info) { return -1; } ...@@ -799,6 +799,12 @@ static inline int __perf_event_disable(void *info) { return -1; }
static inline void perf_event_task_tick(void) { } static inline void perf_event_task_tick(void) { }
#endif #endif
/*
 * perf_event_can_stop_tick() - may the tick be stopped as far as perf is
 * concerned?
 *
 * The real implementation is only declared when both CONFIG_PERF_EVENTS
 * and CONFIG_NO_HZ_FULL are enabled; in every other configuration the
 * inline stub below always answers true.
 */
#if defined(CONFIG_PERF_EVENTS) && defined(CONFIG_NO_HZ_FULL)
extern bool perf_event_can_stop_tick(void);
#else
static inline bool perf_event_can_stop_tick(void) { return true; }
#endif
#define perf_output_put(handle, x) perf_output_copy((handle), &(x), sizeof(x)) #define perf_output_put(handle, x) perf_output_copy((handle), &(x), sizeof(x))
/* /*
......
...@@ -1856,6 +1856,12 @@ extern void wake_up_nohz_cpu(int cpu); ...@@ -1856,6 +1856,12 @@ extern void wake_up_nohz_cpu(int cpu);
static inline void wake_up_nohz_cpu(int cpu) { } static inline void wake_up_nohz_cpu(int cpu) { }
#endif #endif
/*
 * sched_can_stop_tick() - may the tick be stopped as far as the scheduler
 * is concerned?
 *
 * The real implementation is only declared under CONFIG_NO_HZ_FULL; without
 * it the inline stub below always answers false.
 */
#ifdef CONFIG_NO_HZ_FULL
extern bool sched_can_stop_tick(void);
#else
static inline bool sched_can_stop_tick(void) { return false; }
#endif
#ifdef CONFIG_SCHED_AUTOGROUP #ifdef CONFIG_SCHED_AUTOGROUP
extern void sched_autogroup_create_attach(struct task_struct *p); extern void sched_autogroup_create_attach(struct task_struct *p);
extern void sched_autogroup_detach(struct task_struct *p); extern void sched_autogroup_detach(struct task_struct *p);
......
...@@ -160,13 +160,17 @@ static inline u64 get_cpu_iowait_time_us(int cpu, u64 *unused) { return -1; } ...@@ -160,13 +160,17 @@ static inline u64 get_cpu_iowait_time_us(int cpu, u64 *unused) { return -1; }
#ifdef CONFIG_NO_HZ_FULL #ifdef CONFIG_NO_HZ_FULL
extern void tick_nohz_init(void); extern void tick_nohz_init(void);
extern int tick_nohz_full_cpu(int cpu); extern int tick_nohz_full_cpu(int cpu);
extern void tick_nohz_full_check(void);
extern void tick_nohz_full_kick(void); extern void tick_nohz_full_kick(void);
extern void tick_nohz_full_kick_all(void); extern void tick_nohz_full_kick_all(void);
extern void tick_nohz_task_switch(struct task_struct *tsk);
#else #else
static inline void tick_nohz_init(void) { } static inline void tick_nohz_init(void) { }
static inline int tick_nohz_full_cpu(int cpu) { return 0; } static inline int tick_nohz_full_cpu(int cpu) { return 0; }
static inline void tick_nohz_full_check(void) { }
static inline void tick_nohz_full_kick(void) { } static inline void tick_nohz_full_kick(void) { }
static inline void tick_nohz_full_kick_all(void) { } static inline void tick_nohz_full_kick_all(void) { }
static inline void tick_nohz_task_switch(struct task_struct *tsk) { }
#endif #endif
......
...@@ -18,6 +18,7 @@ ...@@ -18,6 +18,7 @@
#include <linux/poll.h> #include <linux/poll.h>
#include <linux/slab.h> #include <linux/slab.h>
#include <linux/hash.h> #include <linux/hash.h>
#include <linux/tick.h>
#include <linux/sysfs.h> #include <linux/sysfs.h>
#include <linux/dcache.h> #include <linux/dcache.h>
#include <linux/percpu.h> #include <linux/percpu.h>
...@@ -655,8 +656,12 @@ static void perf_pmu_rotate_start(struct pmu *pmu) ...@@ -655,8 +656,12 @@ static void perf_pmu_rotate_start(struct pmu *pmu)
WARN_ON(!irqs_disabled()); WARN_ON(!irqs_disabled());
if (list_empty(&cpuctx->rotation_list)) if (list_empty(&cpuctx->rotation_list)) {
int was_empty = list_empty(head);
list_add(&cpuctx->rotation_list, head); list_add(&cpuctx->rotation_list, head);
if (was_empty)
tick_nohz_full_kick();
}
} }
static void get_ctx(struct perf_event_context *ctx) static void get_ctx(struct perf_event_context *ctx)
...@@ -2555,6 +2560,16 @@ static void perf_rotate_context(struct perf_cpu_context *cpuctx) ...@@ -2555,6 +2560,16 @@ static void perf_rotate_context(struct perf_cpu_context *cpuctx)
list_del_init(&cpuctx->rotation_list); list_del_init(&cpuctx->rotation_list);
} }
#ifdef CONFIG_NO_HZ_FULL
/*
 * Tell the nohz code whether perf still needs the tick on this CPU.
 *
 * Returns true when this CPU's rotation_list is empty, false otherwise.
 */
bool perf_event_can_stop_tick(void)
{
	return list_empty(&__get_cpu_var(rotation_list));
}
#endif
void perf_event_task_tick(void) void perf_event_task_tick(void)
{ {
struct list_head *head = &__get_cpu_var(rotation_list); struct list_head *head = &__get_cpu_var(rotation_list);
......
...@@ -673,12 +673,12 @@ static void posix_cpu_timer_kick_nohz(void) ...@@ -673,12 +673,12 @@ static void posix_cpu_timer_kick_nohz(void)
bool posix_cpu_timers_can_stop_tick(struct task_struct *tsk) bool posix_cpu_timers_can_stop_tick(struct task_struct *tsk)
{ {
if (!task_cputime_zero(&tsk->cputime_expires)) if (!task_cputime_zero(&tsk->cputime_expires))
return true; return false;
if (tsk->signal->cputimer.running) if (tsk->signal->cputimer.running)
return true;
return false; return false;
return true;
} }
#else #else
static inline void posix_cpu_timer_kick_nohz(void) { } static inline void posix_cpu_timer_kick_nohz(void) { }
......
...@@ -650,6 +650,24 @@ static inline bool got_nohz_idle_kick(void) ...@@ -650,6 +650,24 @@ static inline bool got_nohz_idle_kick(void)
#endif /* CONFIG_NO_HZ_COMMON */ #endif /* CONFIG_NO_HZ_COMMON */
#ifdef CONFIG_NO_HZ_FULL
/*
 * Tell the nohz code whether the scheduler still needs the tick on this CPU.
 *
 * Returns false when the local runqueue holds more than one running task
 * (the tick is then needed for preemption), true otherwise.
 */
bool sched_can_stop_tick(void)
{
	struct rq *this_runqueue = this_rq();

	/* Make sure the rq->nr_running update is visible after the IPI */
	smp_rmb();

	/* Zero or one running task: nobody to preempt in favour of */
	return this_runqueue->nr_running <= 1;
}
#endif /* CONFIG_NO_HZ_FULL */
void sched_avg_update(struct rq *rq) void sched_avg_update(struct rq *rq)
{ {
s64 period = sched_avg_period(); s64 period = sched_avg_period();
...@@ -1380,7 +1398,8 @@ static void sched_ttwu_pending(void) ...@@ -1380,7 +1398,8 @@ static void sched_ttwu_pending(void)
void scheduler_ipi(void) void scheduler_ipi(void)
{ {
if (llist_empty(&this_rq()->wake_list) && !got_nohz_idle_kick()) if (llist_empty(&this_rq()->wake_list) && !got_nohz_idle_kick()
&& !tick_nohz_full_cpu(smp_processor_id()))
return; return;
/* /*
...@@ -1397,6 +1416,7 @@ void scheduler_ipi(void) ...@@ -1397,6 +1416,7 @@ void scheduler_ipi(void)
* somewhat pessimize the simple resched case. * somewhat pessimize the simple resched case.
*/ */
irq_enter(); irq_enter();
tick_nohz_full_check();
sched_ttwu_pending(); sched_ttwu_pending();
/* /*
...@@ -1876,6 +1896,8 @@ static void finish_task_switch(struct rq *rq, struct task_struct *prev) ...@@ -1876,6 +1896,8 @@ static void finish_task_switch(struct rq *rq, struct task_struct *prev)
kprobe_flush_task(prev); kprobe_flush_task(prev);
put_task_struct(prev); put_task_struct(prev);
} }
tick_nohz_task_switch(current);
} }
#ifdef CONFIG_SMP #ifdef CONFIG_SMP
......
...@@ -5,6 +5,7 @@ ...@@ -5,6 +5,7 @@
#include <linux/mutex.h> #include <linux/mutex.h>
#include <linux/spinlock.h> #include <linux/spinlock.h>
#include <linux/stop_machine.h> #include <linux/stop_machine.h>
#include <linux/tick.h>
#include "cpupri.h" #include "cpupri.h"
...@@ -1106,6 +1107,16 @@ static inline u64 steal_ticks(u64 steal) ...@@ -1106,6 +1107,16 @@ static inline u64 steal_ticks(u64 steal)
static inline void inc_nr_running(struct rq *rq) static inline void inc_nr_running(struct rq *rq)
{ {
rq->nr_running++; rq->nr_running++;
#ifdef CONFIG_NO_HZ_FULL
if (rq->nr_running == 2) {
if (tick_nohz_full_cpu(rq->cpu)) {
/* Order rq->nr_running write against the IPI */
smp_wmb();
smp_send_reschedule(rq->cpu);
}
}
#endif
} }
static inline void dec_nr_running(struct rq *rq) static inline void dec_nr_running(struct rq *rq)
......
...@@ -337,6 +337,19 @@ static inline void invoke_softirq(void) ...@@ -337,6 +337,19 @@ static inline void invoke_softirq(void)
} }
} }
/*
 * Tick handling on interrupt exit.
 *
 * Under CONFIG_NO_HZ_COMMON, calls tick_nohz_irq_exit() when the CPU is
 * either idle with no reschedule pending or a full-dynticks CPU, and we
 * are no longer in interrupt context. Compiles to nothing otherwise.
 */
static inline void tick_irq_exit(void)
{
#ifdef CONFIG_NO_HZ_COMMON
	int this_cpu = smp_processor_id();

	/* Make sure that timer wheel updates are propagated */
	if (((idle_cpu(this_cpu) && !need_resched()) ||
	     tick_nohz_full_cpu(this_cpu)) && !in_interrupt())
		tick_nohz_irq_exit();
#endif
}
/* /*
* Exit an interrupt context. Process softirqs if needed and possible: * Exit an interrupt context. Process softirqs if needed and possible:
*/ */
...@@ -348,11 +361,7 @@ void irq_exit(void) ...@@ -348,11 +361,7 @@ void irq_exit(void)
if (!in_interrupt() && local_softirq_pending()) if (!in_interrupt() && local_softirq_pending())
invoke_softirq(); invoke_softirq();
#ifdef CONFIG_NO_HZ_COMMON tick_irq_exit();
/* Make sure that timer wheel updates are propagated */
if (idle_cpu(smp_processor_id()) && !in_interrupt() && !need_resched())
tick_nohz_irq_exit();
#endif
rcu_irq_exit(); rcu_irq_exit();
sched_preempt_enable_no_resched(); sched_preempt_enable_no_resched();
} }
......
...@@ -21,6 +21,8 @@ ...@@ -21,6 +21,8 @@
#include <linux/sched.h> #include <linux/sched.h>
#include <linux/module.h> #include <linux/module.h>
#include <linux/irq_work.h> #include <linux/irq_work.h>
#include <linux/posix-timers.h>
#include <linux/perf_event.h>
#include <asm/irq_regs.h> #include <asm/irq_regs.h>
...@@ -147,16 +149,48 @@ static void tick_sched_handle(struct tick_sched *ts, struct pt_regs *regs) ...@@ -147,16 +149,48 @@ static void tick_sched_handle(struct tick_sched *ts, struct pt_regs *regs)
static cpumask_var_t nohz_full_mask; static cpumask_var_t nohz_full_mask;
bool have_nohz_full_mask; bool have_nohz_full_mask;
/*
 * Decide whether the tick may be stopped on the current full-dynticks CPU.
 *
 * Warns once if called with interrupts enabled. Each subsystem is asked in
 * turn (scheduler, posix cpu timers of the current task, perf events); the
 * first refusal ends the query with false. Returns true only when nobody
 * objects.
 */
static bool can_stop_full_tick(void)
{
	WARN_ON_ONCE(!irqs_disabled());

	if (!sched_can_stop_tick() ||
	    !posix_cpu_timers_can_stop_tick(current) ||
	    !perf_event_can_stop_tick())
		return false;

#ifdef CONFIG_HAVE_UNSTABLE_SCHED_CLOCK
	/*
	 * sched_clock_tick() needs us?
	 *
	 * TODO: kick full dynticks CPUs when
	 * sched_clock_stable is set.
	 */
	if (!sched_clock_stable)
		return false;
#endif

	return true;
}
static void tick_nohz_restart_sched_tick(struct tick_sched *ts, ktime_t now);
/* /*
* Re-evaluate the need for the tick on the current CPU * Re-evaluate the need for the tick on the current CPU
* and restart it if necessary. * and restart it if necessary.
*/ */
static void tick_nohz_full_check(void) void tick_nohz_full_check(void)
{ {
/* struct tick_sched *ts = &__get_cpu_var(tick_cpu_sched);
* STUB for now, will be filled with the full tick stop/restart
* infrastructure patches if (tick_nohz_full_cpu(smp_processor_id())) {
*/ if (ts->tick_stopped && !is_idle_task(current)) {
if (!can_stop_full_tick())
tick_nohz_restart_sched_tick(ts, ktime_get());
}
}
} }
static void nohz_full_kick_work_func(struct irq_work *work) static void nohz_full_kick_work_func(struct irq_work *work)
...@@ -198,6 +232,26 @@ void tick_nohz_full_kick_all(void) ...@@ -198,6 +232,26 @@ void tick_nohz_full_kick_all(void)
preempt_enable(); preempt_enable();
} }
/*
 * Called on task switch to re-evaluate whether the tick is needed.
 * The incoming task may require it because of per task/process
 * properties: perf events, posix cpu timers, ...
 *
 * Only acts on full-dynticks CPUs. With interrupts disabled, if the tick
 * is currently stopped but can no longer stay stopped, a nohz-full kick
 * is issued. @tsk is not used by the body.
 */
void tick_nohz_task_switch(struct task_struct *tsk)
{
	unsigned long irq_flags;

	if (tick_nohz_full_cpu(smp_processor_id())) {
		local_irq_save(irq_flags);

		if (tick_nohz_tick_stopped() && !can_stop_full_tick())
			tick_nohz_full_kick();

		local_irq_restore(irq_flags);
	}
}
int tick_nohz_full_cpu(int cpu) int tick_nohz_full_cpu(int cpu)
{ {
if (!have_nohz_full_mask) if (!have_nohz_full_mask)
...@@ -613,6 +667,24 @@ static ktime_t tick_nohz_stop_sched_tick(struct tick_sched *ts, ...@@ -613,6 +667,24 @@ static ktime_t tick_nohz_stop_sched_tick(struct tick_sched *ts,
return ret; return ret;
} }
/*
 * Try to stop the tick on a full-dynticks CPU running a non-idle task.
 *
 * Does nothing unless CONFIG_NO_HZ_FULL is set. The tick is stopped only
 * when all of the following hold, checked in this order:
 *  - the current CPU is a full-dynticks CPU and current is not the idle task;
 *  - the tick is already stopped, or nohz mode is not NOHZ_MODE_INACTIVE;
 *  - can_stop_full_tick() raises no objection.
 */
static void tick_nohz_full_stop_tick(struct tick_sched *ts)
{
#ifdef CONFIG_NO_HZ_FULL
	int this_cpu = smp_processor_id();

	if (tick_nohz_full_cpu(this_cpu) && !is_idle_task(current) &&
	    (ts->tick_stopped || ts->nohz_mode != NOHZ_MODE_INACTIVE) &&
	    can_stop_full_tick())
		tick_nohz_stop_sched_tick(ts, ktime_get(), this_cpu);
#endif
}
static bool can_stop_idle_tick(int cpu, struct tick_sched *ts) static bool can_stop_idle_tick(int cpu, struct tick_sched *ts)
{ {
/* /*
...@@ -739,12 +811,13 @@ void tick_nohz_irq_exit(void) ...@@ -739,12 +811,13 @@ void tick_nohz_irq_exit(void)
{ {
struct tick_sched *ts = &__get_cpu_var(tick_cpu_sched); struct tick_sched *ts = &__get_cpu_var(tick_cpu_sched);
if (!ts->inidle) if (ts->inidle) {
return;
/* Cancel the timer because CPU already waken up from the C-states*/ /* Cancel the timer because CPU already waken up from the C-states*/
menu_hrtimer_cancel(); menu_hrtimer_cancel();
__tick_nohz_idle_enter(ts); __tick_nohz_idle_enter(ts);
} else {
tick_nohz_full_stop_tick(ts);
}
} }
/** /**
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment