/*
 * Copyright (C) 2010 Red Hat, Inc., Peter Zijlstra
 *
 * Provides a framework for enqueueing and running callbacks from hardirq
 * context. The enqueueing is NMI-safe.
 */

#include <linux/bug.h>
#include <linux/kernel.h>
#include <linux/export.h>
#include <linux/irq_work.h>
#include <linux/percpu.h>
#include <linux/hardirq.h>
#include <linux/irqflags.h>
#include <linux/sched.h>
#include <linux/tick.h>
#include <linux/cpu.h>
#include <linux/notifier.h>
#include <linux/smp.h>
#include <asm/processor.h>

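/*
 * Per-CPU lists of pending work: raised_list is run from the irq_work
 * interrupt via irq_work_run(), lazy_list from the next timer tick via
 * irq_work_tick().
 */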
static DEFINE_PER_CPU(struct llist_head, raised_list);
static DEFINE_PER_CPU(struct llist_head, lazy_list);

/*
 * Claim the entry so that no one else will poke at it.
 */
static bool irq_work_claim(struct irq_work *work)
{
	unsigned long flags, oflags, nflags;

	/*
	 * Start with our best wish as a premise but only trust any
	 * flag value after cmpxchg() result.
	 */
	flags = work->flags & ~IRQ_WORK_PENDING;
	for (;;) {
		nflags = flags | IRQ_WORK_CLAIMED;
		oflags = cmpxchg(&work->flags, flags, nflags);
		if (oflags == flags)
			break;
		if (oflags & IRQ_WORK_PENDING)
			return false;
		flags = oflags;
		cpu_relax();
	}

	return true;
}

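/*
 * Weak stub: architectures with a self-interrupt override this so the
 * raised list runs promptly instead of waiting for the next tick.
 */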
void __weak arch_irq_work_raise(void)
{
	/*
	 * Lame architectures will get the timer tick callback
	 */
}

/* Enqueue on current CPU, work must already be claimed and preempt disabled */
static void __irq_work_queue_local(struct irq_work *work)
{
	/* If the work is "lazy", handle it from next tick if any */
	if (work->flags & IRQ_WORK_LAZY) {
		if (llist_add(&work->llnode, this_cpu_ptr(&lazy_list)) &&
		    tick_nohz_tick_stopped())
			arch_irq_work_raise();
	} else {
		if (llist_add(&work->llnode, this_cpu_ptr(&raised_list)))
			arch_irq_work_raise();
	}
}

/* Enqueue the irq work @work on the current CPU */
bool irq_work_queue(struct irq_work *work)
{
	/* Only queue if not already pending */
	if (!irq_work_claim(work))
		return false;

	/* Queue the entry and raise the IPI if needed. */
	preempt_disable();
	__irq_work_queue_local(work);
	preempt_enable();

	return true;
}
EXPORT_SYMBOL_GPL(irq_work_queue);

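/*
 * Example usage (a minimal sketch; my_work and my_work_func are
 * illustrative names, not part of this file):
 *
 *	static void my_work_func(struct irq_work *work)
 *	{
 *		pr_info("ran later, from a safe hardirq context\n");
 *	}
 *	static DEFINE_IRQ_WORK(my_work, my_work_func);
 *
 *	From NMI or other restricted context:
 *		irq_work_queue(&my_work);
 */
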
/*
 * Enqueue the irq_work @work on @cpu unless it's already pending
 * somewhere.
 *
 * Can be re-enqueued while the callback is still in progress.
 */
bool irq_work_queue_on(struct irq_work *work, int cpu)
{
#ifndef CONFIG_SMP
	return irq_work_queue(work);

#else /* CONFIG_SMP: */
	/* All work should have been flushed before going offline */
	WARN_ON_ONCE(cpu_is_offline(cpu));

	/* Only queue if not already pending */
	if (!irq_work_claim(work))
		return false;

	preempt_disable();
	if (cpu != smp_processor_id()) {
		/* Arch remote IPI send/receive backends aren't NMI safe */
		WARN_ON_ONCE(in_nmi());
		if (llist_add(&work->llnode, &per_cpu(raised_list, cpu)))
			arch_send_call_function_single_ipi(cpu);
	} else {
		__irq_work_queue_local(work);
	}
	preempt_enable();

	return true;
#endif /* CONFIG_SMP */
}
EXPORT_SYMBOL_GPL(irq_work_queue_on);

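/*
 * Used by the nohz code to decide whether the tick can be stopped:
 * pending work that only the tick would run must keep the tick going.
 */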
bool irq_work_needs_cpu(void)
{
	struct llist_head *raised, *lazy;

	raised = this_cpu_ptr(&raised_list);
	lazy = this_cpu_ptr(&lazy_list);

	if (llist_empty(raised) || arch_irq_work_has_interrupt())
		if (llist_empty(lazy))
			return false;

	/* All work should have been flushed before going offline */
	WARN_ON_ONCE(cpu_is_offline(smp_processor_id()));

	return true;
}

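/*
 * Run every work item on @list, clearing PENDING before and BUSY after
 * each callback, so an item can be re-queued from its own callback.
 */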
static void irq_work_run_list(struct llist_head *list)
{
	struct irq_work *work, *tmp;
	struct llist_node *llnode;
	unsigned long flags;

	BUG_ON(!irqs_disabled());

	if (llist_empty(list))
		return;

	llnode = llist_del_all(list);
	llist_for_each_entry_safe(work, tmp, llnode, llnode) {
		/*
		 * Clear the PENDING bit, after this point the @work
		 * can be re-used.
		 * Make it immediately visible so that other CPUs trying
		 * to claim that work don't rely on us to handle their data
		 * while we are in the middle of the func.
		 */
		flags = work->flags & ~IRQ_WORK_PENDING;
		xchg(&work->flags, flags);

		work->func(work);
		/*
		 * Clear the BUSY bit and return to the free state if
		 * no-one else claimed it meanwhile.
		 */
		(void)cmpxchg(&work->flags, flags, flags & ~IRQ_WORK_BUSY);
	}
}

/*
 * hotplug calls this through:
 *  hotplug_cfd() -> flush_smp_call_function_queue()
 */
void irq_work_run(void)
{
	irq_work_run_list(this_cpu_ptr(&raised_list));
	irq_work_run_list(this_cpu_ptr(&lazy_list));
}
EXPORT_SYMBOL_GPL(irq_work_run);

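/*
 * Called from the timer tick: architectures without a dedicated
 * irq_work interrupt run their raised list here; the lazy list is
 * always run from here.
 */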
void irq_work_tick(void)
{
	struct llist_head *raised = this_cpu_ptr(&raised_list);

	if (!llist_empty(raised) && !arch_irq_work_has_interrupt())
		irq_work_run_list(raised);
	irq_work_run_list(this_cpu_ptr(&lazy_list));
}

/*
 * Synchronize against the irq_work @work, ensuring it is not
 * currently in use.
 */
void irq_work_sync(struct irq_work *work)
{
	lockdep_assert_irqs_enabled();

	while (work->flags & IRQ_WORK_BUSY)
		cpu_relax();
}
EXPORT_SYMBOL_GPL(irq_work_sync);