Commit bc6679ae authored by Frederic Weisbecker

irq_work: Make self-IPIs optable

On irq work initialization, let the user choose to define it
as "lazy" or not. "Lazy" means that we don't want to send
an IPI (provided the arch can anyway) when we enqueue this
work but we rather prefer to wait for the next timer tick
to execute our work if possible.

This is going to be a benefit for non-urgent enqueuers
(like printk in the future) that may prefer not to raise
an IPI storm in case of frequent enqueuing on short periods
of time.
Signed-off-by: Frederic Weisbecker <fweisbec@gmail.com>
Acked-by: Steven Rostedt <rostedt@goodmis.org>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Thomas Gleixner <tglx@linutronix.de>
Cc: Ingo Molnar <mingo@kernel.org>
Cc: Andrew Morton <akpm@linux-foundation.org>
Cc: Paul Gortmaker <paul.gortmaker@windriver.com>
parent 8aa2acce
...@@ -3,6 +3,20 @@ ...@@ -3,6 +3,20 @@
#include <linux/llist.h> #include <linux/llist.h>
/*
* An entry can be in one of four states:
*
* free NULL, 0 -> {claimed} : free to be used
* claimed NULL, 3 -> {pending} : claimed to be enqueued
* pending next, 3 -> {busy} : queued, pending callback
* busy NULL, 2 -> {free, claimed} : callback in progress, can be claimed
*/
#define IRQ_WORK_PENDING 1UL
#define IRQ_WORK_BUSY 2UL
#define IRQ_WORK_FLAGS 3UL
#define IRQ_WORK_LAZY 4UL /* Doesn't want IPI, wait for tick */
struct irq_work { struct irq_work {
unsigned long flags; unsigned long flags;
struct llist_node llnode; struct llist_node llnode;
......
...@@ -12,24 +12,15 @@ ...@@ -12,24 +12,15 @@
#include <linux/percpu.h> #include <linux/percpu.h>
#include <linux/hardirq.h> #include <linux/hardirq.h>
#include <linux/irqflags.h> #include <linux/irqflags.h>
#include <linux/sched.h>
#include <linux/tick.h>
#include <linux/cpu.h> #include <linux/cpu.h>
#include <linux/notifier.h> #include <linux/notifier.h>
#include <asm/processor.h> #include <asm/processor.h>
/*
* An entry can be in one of four states:
*
* free NULL, 0 -> {claimed} : free to be used
* claimed NULL, 3 -> {pending} : claimed to be enqueued
* pending next, 3 -> {busy} : queued, pending callback
* busy NULL, 2 -> {free, claimed} : callback in progress, can be claimed
*/
#define IRQ_WORK_PENDING 1UL
#define IRQ_WORK_BUSY 2UL
#define IRQ_WORK_FLAGS 3UL
static DEFINE_PER_CPU(struct llist_head, irq_work_list); static DEFINE_PER_CPU(struct llist_head, irq_work_list);
static DEFINE_PER_CPU(int, irq_work_raised);
/* /*
* Claim the entry so that no one else will poke at it. * Claim the entry so that no one else will poke at it.
...@@ -69,14 +60,19 @@ void __weak arch_irq_work_raise(void) ...@@ -69,14 +60,19 @@ void __weak arch_irq_work_raise(void)
*/ */
static void __irq_work_queue(struct irq_work *work) static void __irq_work_queue(struct irq_work *work)
{ {
bool empty;
preempt_disable(); preempt_disable();
empty = llist_add(&work->llnode, &__get_cpu_var(irq_work_list)); llist_add(&work->llnode, &__get_cpu_var(irq_work_list));
/* The list was empty, raise self-interrupt to start processing. */
if (empty) /*
arch_irq_work_raise(); * If the work is not "lazy" or the tick is stopped, raise the irq
* work interrupt (if supported by the arch), otherwise, just wait
* for the next tick.
*/
if (!(work->flags & IRQ_WORK_LAZY) || tick_nohz_tick_stopped()) {
if (!this_cpu_cmpxchg(irq_work_raised, 0, 1))
arch_irq_work_raise();
}
preempt_enable(); preempt_enable();
} }
...@@ -117,10 +113,19 @@ bool irq_work_needs_cpu(void) ...@@ -117,10 +113,19 @@ bool irq_work_needs_cpu(void)
static void __irq_work_run(void) static void __irq_work_run(void)
{ {
unsigned long flags;
struct irq_work *work; struct irq_work *work;
struct llist_head *this_list; struct llist_head *this_list;
struct llist_node *llnode; struct llist_node *llnode;
/*
* Reset the "raised" state right before we check the list because
* an NMI may enqueue after we find the list empty from the runner.
*/
__this_cpu_write(irq_work_raised, 0);
barrier();
this_list = &__get_cpu_var(irq_work_list); this_list = &__get_cpu_var(irq_work_list);
if (llist_empty(this_list)) if (llist_empty(this_list))
return; return;
...@@ -140,13 +145,15 @@ static void __irq_work_run(void) ...@@ -140,13 +145,15 @@ static void __irq_work_run(void)
* to claim that work don't rely on us to handle their data * to claim that work don't rely on us to handle their data
* while we are in the middle of the func. * while we are in the middle of the func.
*/ */
xchg(&work->flags, IRQ_WORK_BUSY); flags = work->flags & ~IRQ_WORK_PENDING;
xchg(&work->flags, flags);
work->func(work); work->func(work);
/* /*
* Clear the BUSY bit and return to the free state if * Clear the BUSY bit and return to the free state if
* no-one else claimed it meanwhile. * no-one else claimed it meanwhile.
*/ */
(void)cmpxchg(&work->flags, IRQ_WORK_BUSY, 0); (void)cmpxchg(&work->flags, flags, flags & ~IRQ_WORK_BUSY);
} }
} }
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment