/*
 * Copyright (C) 2010 Red Hat, Inc., Peter Zijlstra <pzijlstr@redhat.com>
 *
 * Provides a framework for enqueueing and running callbacks from hardirq
 * context. The enqueueing is NMI-safe.
 */
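
/*
 * Illustrative usage sketch (the names are placeholders; the example
 * assumes the init_irq_work() helper from <linux/irq_work.h>):
 *
 *	static void my_func(struct irq_work *work)
 *	{
 *		... runs later, in hardirq context ...
 *	}
 *
 *	static struct irq_work my_work;
 *
 *	init_irq_work(&my_work, my_func);
 *	irq_work_queue(&my_work);
 *
 * irq_work_queue() is NMI-safe and returns false if the work was already
 * pending.
 */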

#include <linux/bug.h>
#include <linux/kernel.h>
#include <linux/export.h>
#include <linux/irq_work.h>
#include <linux/percpu.h>
#include <linux/hardirq.h>
#include <linux/irqflags.h>
#include <linux/sched.h>
#include <linux/tick.h>
#include <linux/cpu.h>
#include <linux/notifier.h>
#include <asm/processor.h>
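
/*
 * irq_work_list is this CPU's lock-less list of claimed entries waiting to
 * be run.  irq_work_raised records whether arch_irq_work_raise() has been
 * called since the list was last processed, so at most one interrupt is
 * raised per batch of queued work.
 */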
static DEFINE_PER_CPU(struct llist_head, irq_work_list);
static DEFINE_PER_CPU(int, irq_work_raised);

/*
 * Claim the entry so that no one else will poke at it.
 */
static bool irq_work_claim(struct irq_work *work)
{
	unsigned long flags, oflags, nflags;

	/*
	 * Start from our best-case assumption (the entry is not yet
	 * PENDING), but only trust flag values observed through the
	 * cmpxchg() result.
	 */
	flags = work->flags & ~IRQ_WORK_PENDING;
	for (;;) {
		nflags = flags | IRQ_WORK_FLAGS;
		oflags = cmpxchg(&work->flags, flags, nflags);
		if (oflags == flags)
			break;
		if (oflags & IRQ_WORK_PENDING)
			return false;
		flags = oflags;
		cpu_relax();
	}

	return true;
}
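
/*
 * Flags life cycle, as implemented by irq_work_claim() above and
 * __irq_work_run() below: a free entry has neither IRQ_WORK_PENDING nor
 * IRQ_WORK_BUSY set; claiming sets both (IRQ_WORK_FLAGS); the runner
 * clears PENDING right before invoking the callback, so the entry may be
 * re-queued from within it, and clears BUSY afterwards unless someone
 * re-claimed the entry in the meantime.
 */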

void __weak arch_irq_work_raise(void)
{
	/*
	 * Lame architectures will get the timer tick callback
	 */
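	/*
	 * Architectures that can raise a self-interrupt (x86, for example)
	 * override this __weak stub so that queued work runs without having
	 * to wait for the next tick.
	 */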
}

/*
 * Queue the entry and raise the IPI if needed.
 */
static void __irq_work_queue(struct irq_work *work)
{
	preempt_disable();

	llist_add(&work->llnode, &__get_cpu_var(irq_work_list));

	/*
	 * If the work is not "lazy" or the tick is stopped, raise the irq
	 * work interrupt (if supported by the arch), otherwise, just wait
	 * for the next tick.
	 */
	if (!(work->flags & IRQ_WORK_LAZY) || tick_nohz_tick_stopped()) {
		if (!this_cpu_cmpxchg(irq_work_raised, 0, 1))
			arch_irq_work_raise();
	}

	preempt_enable();
}

/*
 * Enqueue the irq_work @work. Returns true on success, false if @work was
 * already enqueued by someone else.
 *
 * Can be re-enqueued while the callback is still in progress.
 */
bool irq_work_queue(struct irq_work *work)
{
	if (!irq_work_claim(work)) {
		/*
		 * Already enqueued, can't do!
		 */
		return false;
	}

	__irq_work_queue(work);
	return true;
}
EXPORT_SYMBOL_GPL(irq_work_queue);

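/*
 * Used by the nohz code: returns true when this CPU still has queued irq
 * work, in which case the tick must be kept running to process it.
 */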
bool irq_work_needs_cpu(void)
{
	struct llist_head *this_list;

	this_list = &__get_cpu_var(irq_work_list);
	if (llist_empty(this_list))
		return false;

	/* All work should have been flushed before going offline */
	WARN_ON_ONCE(cpu_is_offline(smp_processor_id()));

	return true;
}

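/*
 * Run every entry currently queued on this CPU's list. Called from
 * irq_work_run() in interrupt context and from the CPU_DYING notifier
 * below.
 */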
static void __irq_work_run(void)
{
	unsigned long flags;
	struct irq_work *work;
	struct llist_head *this_list;
	struct llist_node *llnode;

	/*
	 * Reset the "raised" state right before we check the list, so that
	 * an NMI which enqueues just after the runner finds the list empty
	 * still raises a fresh interrupt.
	 */
	__this_cpu_write(irq_work_raised, 0);
	barrier();

	this_list = &__get_cpu_var(irq_work_list);
	if (llist_empty(this_list))
		return;

	BUG_ON(!irqs_disabled());

	llnode = llist_del_all(this_list);
	while (llnode != NULL) {
		work = llist_entry(llnode, struct irq_work, llnode);

		llnode = llist_next(llnode);

		/*
		 * Clear the PENDING bit, after this point the @work
		 * can be re-used.
		 * Make it immediately visible so that other CPUs trying
		 * to claim that work don't rely on us to handle their data
		 * while we are in the middle of the func.
		 */
		flags = work->flags & ~IRQ_WORK_PENDING;
		xchg(&work->flags, flags);

		work->func(work);
		/*
		 * Clear the BUSY bit and return to the free state if
		 * no-one else claimed it meanwhile.
		 */
		(void)cmpxchg(&work->flags, flags, flags & ~IRQ_WORK_BUSY);
	}
}

/*
 * Run the irq_work entries on this CPU. Must be run from hardirq context
 * with local IRQs disabled.
 */
void irq_work_run(void)
{
	BUG_ON(!in_irq());
	__irq_work_run();
}
EXPORT_SYMBOL_GPL(irq_work_run);

/*
 * Synchronize against the irq_work @work, ensuring the entry is not
 * currently in use.
 */
void irq_work_sync(struct irq_work *work)
{
	WARN_ON_ONCE(irqs_disabled());

	while (work->flags & IRQ_WORK_BUSY)
		cpu_relax();
}
EXPORT_SYMBOL_GPL(irq_work_sync);
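
/*
 * Note that irq_work_sync() busy-waits and warns if IRQs are disabled, so
 * it must not be called from IRQ context; callers typically use it before
 * freeing or re-initializing the object that embeds the irq_work, so the
 * callback cannot run on stale memory.
 */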

#ifdef CONFIG_HOTPLUG_CPU
static int irq_work_cpu_notify(struct notifier_block *self,
			       unsigned long action, void *hcpu)
{
	long cpu = (long)hcpu;

	switch (action) {
	case CPU_DYING:
		/* Called from stop_machine */
		if (WARN_ON_ONCE(cpu != smp_processor_id()))
			break;
		__irq_work_run();
		break;
	default:
		break;
	}
	return NOTIFY_OK;
}

static struct notifier_block cpu_notify;

static __init int irq_work_init_cpu_notifier(void)
{
	cpu_notify.notifier_call = irq_work_cpu_notify;
	cpu_notify.priority = 0;
	register_cpu_notifier(&cpu_notify);
	return 0;
}
device_initcall(irq_work_init_cpu_notifier);

#endif /* CONFIG_HOTPLUG_CPU */