blob: 9f8092b82a948bc9227779ddd6dc3b03219c60dd [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001/*
2 * linux/kernel/softirq.c
3 *
4 * Copyright (C) 1992 Linus Torvalds
5 *
Pavel Machekb10db7f2008-01-30 13:30:00 +01006 * Distribute under GPLv2.
7 *
8 * Rewritten. Old one was good in 2.2, but in 2.3 it was immoral. --ANK (990903)
David S. Miller54514a72008-09-23 22:15:57 -07009 *
10 * Remote softirq infrastructure is by Jens Axboe.
Linus Torvalds1da177e2005-04-16 15:20:36 -070011 */
12
Paul Gortmaker9984de12011-05-23 14:51:41 -040013#include <linux/export.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070014#include <linux/kernel_stat.h>
15#include <linux/interrupt.h>
16#include <linux/init.h>
17#include <linux/mm.h>
18#include <linux/notifier.h>
19#include <linux/percpu.h>
20#include <linux/cpu.h>
Rafael J. Wysocki83144182007-07-17 04:03:35 -070021#include <linux/freezer.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070022#include <linux/kthread.h>
23#include <linux/rcupdate.h>
Steven Rostedt7e49fcc2009-01-22 19:01:40 -050024#include <linux/ftrace.h>
Andrew Morton78eef012006-03-22 00:08:16 -080025#include <linux/smp.h>
Thomas Gleixner3e339b52012-07-16 10:42:37 +000026#include <linux/smpboot.h>
Thomas Gleixner79bf2bb2007-02-16 01:28:03 -080027#include <linux/tick.h>
Heiko Carstensa0e39ed2009-04-29 13:51:39 +020028
29#define CREATE_TRACE_POINTS
Steven Rostedtad8d75f2009-04-14 19:39:12 -040030#include <trace/events/irq.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070031
Linus Torvalds1da177e2005-04-16 15:20:36 -070032/*
33 - No shared variables, all the data are CPU local.
34 - If a softirq needs serialization, let it serialize itself
35 by its own spinlocks.
36 - Even if softirq is serialized, only local cpu is marked for
37 execution. Hence, we get something sort of weak cpu binding.
38 Though it is still not clear, will it result in better locality
39 or will not.
40
41 Examples:
42 - NET RX softirq. It is multithreaded and does not require
43 any global serialization.
44 - NET TX softirq. It kicks software netdevice queues, hence
45 it is logically serialized per device, but this serialization
46 is invisible to common code.
47 - Tasklets: serialized wrt itself.
48 */
49
#ifndef __ARCH_IRQ_STAT
/* Generic interrupt statistics array; only built when __ARCH_IRQ_STAT is not defined. */
irq_cpustat_t irq_stat[NR_CPUS] ____cacheline_aligned;
EXPORT_SYMBOL(irq_stat);
#endif

/* Softirq handler table, indexed by softirq number; entries are set by open_softirq(). */
static struct softirq_action softirq_vec[NR_SOFTIRQS] __cacheline_aligned_in_smp;

/* Per-CPU task pointer read by wakeup_softirqd(). */
DEFINE_PER_CPU(struct task_struct *, ksoftirqd);

/* Printable softirq names, indexed by softirq number (used in the __do_softirq() diagnostic). */
char *softirq_to_name[NR_SOFTIRQS] = {
	"HI", "TIMER", "NET_TX", "NET_RX", "BLOCK", "BLOCK_IOPOLL",
	"TASKLET", "SCHED", "HRTIMER", "RCU"
};
63
Linus Torvalds1da177e2005-04-16 15:20:36 -070064/*
65 * we cannot loop indefinitely here to avoid userspace starvation,
66 * but we also don't want to introduce a worst case 1/HZ latency
67 * to the pending events, so lets the scheduler to balance
68 * the softirq load for us.
69 */
Thomas Gleixner676cb022009-07-20 23:33:49 +020070static void wakeup_softirqd(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -070071{
72 /* Interrupts are disabled: no need to stop preemption */
Christoph Lameter909ea962010-12-08 16:22:55 +010073 struct task_struct *tsk = __this_cpu_read(ksoftirqd);
Linus Torvalds1da177e2005-04-16 15:20:36 -070074
75 if (tsk && tsk->state != TASK_RUNNING)
76 wake_up_process(tsk);
77}
78
79/*
Venkatesh Pallipadi75e10562010-10-04 17:03:16 -070080 * preempt_count and SOFTIRQ_OFFSET usage:
81 * - preempt_count is changed by SOFTIRQ_OFFSET on entering or leaving
82 * softirq processing.
83 * - preempt_count is changed by SOFTIRQ_DISABLE_OFFSET (= 2 * SOFTIRQ_OFFSET)
84 * on local_bh_disable or local_bh_enable.
85 * This lets us distinguish between whether we are currently processing
86 * softirq and whether we just have bh disabled.
87 */
88
89/*
Ingo Molnarde30a2b2006-07-03 00:24:42 -070090 * This one is for softirq.c-internal use,
91 * where hardirqs are disabled legitimately:
92 */
#ifdef CONFIG_TRACE_IRQFLAGS
/*
 * Raise preempt_count by @cnt and report the transition to the softirq
 * and preempt tracers.
 *
 * @ip:  address handed to trace_softirqs_off() as the disabling call site
 * @cnt: amount added to preempt_count (callers in this file pass
 *       SOFTIRQ_OFFSET or SOFTIRQ_DISABLE_OFFSET)
 */
static void __local_bh_disable(unsigned long ip, unsigned int cnt)
{
	unsigned long flags;

	WARN_ON_ONCE(in_irq());

	raw_local_irq_save(flags);
	/*
	 * The preempt tracer hooks into add_preempt_count and will break
	 * lockdep because it calls back into lockdep after SOFTIRQ_OFFSET
	 * is set and before current->softirq_enabled is cleared.
	 * We must manually increment preempt_count here and manually
	 * call the trace_preempt_off later.
	 */
	preempt_count() += cnt;
	/*
	 * Were softirqs turned off above:
	 */
	if (softirq_count() == cnt)
		trace_softirqs_off(ip);
	raw_local_irq_restore(flags);

	/* The whole preempt_count equals @cnt, i.e. it was zero before the add. */
	if (preempt_count() == cnt)
		trace_preempt_off(CALLER_ADDR0, get_parent_ip(CALLER_ADDR1));
}
#else /* !CONFIG_TRACE_IRQFLAGS */
/* Untraced variant: only adjusts preempt_count by @cnt; @ip is unused. */
static inline void __local_bh_disable(unsigned long ip, unsigned int cnt)
{
	add_preempt_count(cnt);
	barrier();
}
#endif /* CONFIG_TRACE_IRQFLAGS */
Ingo Molnarde30a2b2006-07-03 00:24:42 -0700126
127void local_bh_disable(void)
128{
Davidlohr Buesod2e08472013-04-30 11:46:09 -0700129 __local_bh_disable(_RET_IP_, SOFTIRQ_DISABLE_OFFSET);
Ingo Molnarde30a2b2006-07-03 00:24:42 -0700130}
131
132EXPORT_SYMBOL(local_bh_disable);
133
Venkatesh Pallipadi75e10562010-10-04 17:03:16 -0700134static void __local_bh_enable(unsigned int cnt)
135{
Venkatesh Pallipadi75e10562010-10-04 17:03:16 -0700136 WARN_ON_ONCE(!irqs_disabled());
137
138 if (softirq_count() == cnt)
Davidlohr Buesod2e08472013-04-30 11:46:09 -0700139 trace_softirqs_on(_RET_IP_);
Venkatesh Pallipadi75e10562010-10-04 17:03:16 -0700140 sub_preempt_count(cnt);
141}
142
/*
 * Special-case - softirqs can safely be enabled in
 * cond_resched_softirq(), or by __do_softirq(),
 * without processing still-pending softirqs.
 *
 * Removes one SOFTIRQ_DISABLE_OFFSET level via __local_bh_enable(), which
 * itself warns if interrupts are enabled; this wrapper additionally warns
 * (once) when called from hard interrupt context.
 */
void _local_bh_enable(void)
{
	WARN_ON_ONCE(in_irq());
	__local_bh_enable(SOFTIRQ_DISABLE_OFFSET);
}

EXPORT_SYMBOL(_local_bh_enable);
155
/*
 * Common body of local_bh_enable() and local_bh_enable_ip(): remove one
 * SOFTIRQ_DISABLE_OFFSET level from preempt_count and, if that leaves us
 * outside interrupt context with softirqs pending, run them.
 *
 * @ip: call-site address reported to trace_softirqs_on()
 *
 * Warns (once) if called from hard interrupt context or with interrupts
 * disabled.
 */
static inline void _local_bh_enable_ip(unsigned long ip)
{
	WARN_ON_ONCE(in_irq() || irqs_disabled());
#ifdef CONFIG_TRACE_IRQFLAGS
	local_irq_disable();
#endif
	/*
	 * Are softirqs going to be turned on now:
	 */
	if (softirq_count() == SOFTIRQ_DISABLE_OFFSET)
		trace_softirqs_on(ip);
	/*
	 * Keep preemption disabled until we are done with
	 * softirq processing:
	 */
	sub_preempt_count(SOFTIRQ_DISABLE_OFFSET - 1);

	if (unlikely(!in_interrupt() && local_softirq_pending()))
		do_softirq();

	/* Release the single preempt count that was kept above. */
	dec_preempt_count();
#ifdef CONFIG_TRACE_IRQFLAGS
	local_irq_enable();
#endif
	preempt_check_resched();
}
Johannes Berg0f476b6d2008-06-18 09:29:37 +0200182
183void local_bh_enable(void)
184{
Davidlohr Buesod2e08472013-04-30 11:46:09 -0700185 _local_bh_enable_ip(_RET_IP_);
Johannes Berg0f476b6d2008-06-18 09:29:37 +0200186}
187EXPORT_SYMBOL(local_bh_enable);
188
/*
 * Same as local_bh_enable(), but the call-site address used for tracing
 * is supplied by the caller in @ip.
 */
void local_bh_enable_ip(unsigned long ip)
{
	_local_bh_enable_ip(ip);
}
EXPORT_SYMBOL(local_bh_enable_ip);
194
/*
 * We restart softirq processing for at most MAX_SOFTIRQ_RESTART times,
 * but break the loop if need_resched() is set or after 2 ms.
 * The MAX_SOFTIRQ_TIME provides a nice upper bound in most cases, but in
 * certain cases, such as stop_machine(), jiffies may cease to
 * increment and so we need the MAX_SOFTIRQ_RESTART limit as
 * well to make sure we eventually return from this method.
 *
 * These limits have been established via experimentation.
 * The two things to balance are latency and fairness -
 * we want to handle softirqs as soon as possible, but they
 * should not be able to lock up the box.
 */
#define MAX_SOFTIRQ_TIME  msecs_to_jiffies(2)
#define MAX_SOFTIRQ_RESTART 10
Linus Torvalds1da177e2005-04-16 15:20:36 -0700210
211asmlinkage void __do_softirq(void)
212{
213 struct softirq_action *h;
214 __u32 pending;
Eric Dumazetc10d7362013-01-10 15:26:34 -0800215 unsigned long end = jiffies + MAX_SOFTIRQ_TIME;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700216 int cpu;
Mel Gorman907aed42012-07-31 16:44:07 -0700217 unsigned long old_flags = current->flags;
Ben Greear34376a52013-06-06 14:29:49 -0700218 int max_restart = MAX_SOFTIRQ_RESTART;
Mel Gorman907aed42012-07-31 16:44:07 -0700219
220 /*
221 * Mask out PF_MEMALLOC s current task context is borrowed for the
222 * softirq. A softirq handled such as network RX might set PF_MEMALLOC
223 * again if the socket is related to swap
224 */
225 current->flags &= ~PF_MEMALLOC;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700226
227 pending = local_softirq_pending();
Frederic Weisbecker6a616712012-12-16 20:00:34 +0100228 account_irq_enter_time(current);
Paul Mackerras829035fd2006-07-03 00:25:40 -0700229
Davidlohr Buesod2e08472013-04-30 11:46:09 -0700230 __local_bh_disable(_RET_IP_, SOFTIRQ_OFFSET);
Ingo Molnard820ac42009-03-13 01:30:40 +0100231 lockdep_softirq_enter();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700232
Linus Torvalds1da177e2005-04-16 15:20:36 -0700233 cpu = smp_processor_id();
234restart:
235 /* Reset the pending bitmask before enabling irqs */
Andi Kleen3f744782005-09-12 18:49:24 +0200236 set_softirq_pending(0);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700237
Andrew Mortonc70f5d62005-07-30 10:22:49 -0700238 local_irq_enable();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700239
240 h = softirq_vec;
241
242 do {
243 if (pending & 1) {
Thomas Gleixnerf4bc6bb2010-10-19 15:00:13 +0200244 unsigned int vec_nr = h - softirq_vec;
Thomas Gleixner8e85b4b2008-10-02 10:50:53 +0200245 int prev_count = preempt_count();
246
Thomas Gleixnerf4bc6bb2010-10-19 15:00:13 +0200247 kstat_incr_softirqs_this_cpu(vec_nr);
248
249 trace_softirq_entry(vec_nr);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700250 h->action(h);
Thomas Gleixnerf4bc6bb2010-10-19 15:00:13 +0200251 trace_softirq_exit(vec_nr);
Thomas Gleixner8e85b4b2008-10-02 10:50:53 +0200252 if (unlikely(prev_count != preempt_count())) {
Thomas Gleixnerf4bc6bb2010-10-19 15:00:13 +0200253 printk(KERN_ERR "huh, entered softirq %u %s %p"
Thomas Gleixner8e85b4b2008-10-02 10:50:53 +0200254 "with preempt_count %08x,"
Thomas Gleixnerf4bc6bb2010-10-19 15:00:13 +0200255 " exited with %08x?\n", vec_nr,
256 softirq_to_name[vec_nr], h->action,
257 prev_count, preempt_count());
Thomas Gleixner8e85b4b2008-10-02 10:50:53 +0200258 preempt_count() = prev_count;
259 }
260
Paul E. McKenneyd6714c22009-08-22 13:56:46 -0700261 rcu_bh_qs(cpu);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700262 }
263 h++;
264 pending >>= 1;
265 } while (pending);
266
Andrew Mortonc70f5d62005-07-30 10:22:49 -0700267 local_irq_disable();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700268
269 pending = local_softirq_pending();
Eric Dumazetc10d7362013-01-10 15:26:34 -0800270 if (pending) {
Ben Greear34376a52013-06-06 14:29:49 -0700271 if (time_before(jiffies, end) && !need_resched() &&
272 --max_restart)
Eric Dumazetc10d7362013-01-10 15:26:34 -0800273 goto restart;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700274
Linus Torvalds1da177e2005-04-16 15:20:36 -0700275 wakeup_softirqd();
Eric Dumazetc10d7362013-01-10 15:26:34 -0800276 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700277
Ingo Molnard820ac42009-03-13 01:30:40 +0100278 lockdep_softirq_exit();
Paul Mackerras829035fd2006-07-03 00:25:40 -0700279
Frederic Weisbecker6a616712012-12-16 20:00:34 +0100280 account_irq_exit_time(current);
Venkatesh Pallipadi75e10562010-10-04 17:03:16 -0700281 __local_bh_enable(SOFTIRQ_OFFSET);
Frederic Weisbecker5d60d3e2013-09-24 04:11:35 +0200282 WARN_ON_ONCE(in_interrupt());
Mel Gorman907aed42012-07-31 16:44:07 -0700283 tsk_restore_flags(current, old_flags, PF_MEMALLOC);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700284}
285
Frederic Weisbecker7d65f4a2013-09-05 15:49:45 +0200286
Linus Torvalds1da177e2005-04-16 15:20:36 -0700287
288asmlinkage void do_softirq(void)
289{
290 __u32 pending;
291 unsigned long flags;
292
293 if (in_interrupt())
294 return;
295
296 local_irq_save(flags);
297
298 pending = local_softirq_pending();
299
300 if (pending)
Frederic Weisbecker7d65f4a2013-09-05 15:49:45 +0200301 do_softirq_own_stack();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700302
303 local_irq_restore(flags);
304}
305
Ingo Molnardde4b2b2007-02-16 01:27:45 -0800306/*
307 * Enter an interrupt context.
308 */
309void irq_enter(void)
310{
Venki Pallipadi6378ddb2008-01-30 13:30:04 +0100311 int cpu = smp_processor_id();
Thomas Gleixner719254f2008-10-17 09:59:47 +0200312
Paul E. McKenney64db4cf2008-12-18 21:55:32 +0100313 rcu_irq_enter();
Frederic Weisbecker0a8a2e72012-01-24 18:59:44 +0100314 if (is_idle_task(current) && !in_interrupt()) {
Venkatesh Pallipadid267f872010-10-04 17:03:23 -0700315 /*
316 * Prevent raise_softirq from needlessly waking up ksoftirqd
317 * here, as softirq will be serviced on return from interrupt.
318 */
319 local_bh_disable();
Thomas Gleixner719254f2008-10-17 09:59:47 +0200320 tick_check_idle(cpu);
Venkatesh Pallipadid267f872010-10-04 17:03:23 -0700321 _local_bh_enable();
322 }
323
324 __irq_enter();
Ingo Molnardde4b2b2007-02-16 01:27:45 -0800325}
326
Heiko Carstensb2a00172012-03-05 15:07:25 -0800327static inline void invoke_softirq(void)
328{
Frederic Weisbeckerded79752013-09-24 00:50:25 +0200329 if (!force_irqthreads) {
330 /*
331 * We can safely execute softirq on the current stack if
332 * it is the irq stack, because it should be near empty
333 * at this stage. But we have no way to know if the arch
334 * calls irq_exit() on the irq stack. So call softirq
335 * in its own stack to prevent from any overrun on top
336 * of a potentially deep task stack.
337 */
Frederic Weisbeckerbe6e1012013-09-24 16:39:41 +0200338 do_softirq_own_stack();
Frederic Weisbeckerded79752013-09-24 00:50:25 +0200339 } else {
Thomas Gleixner8d32a302011-02-23 23:52:23 +0000340 wakeup_softirqd();
Frederic Weisbeckerded79752013-09-24 00:50:25 +0200341 }
Thomas Gleixner8d32a302011-02-23 23:52:23 +0000342}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700343
/*
 * Tell the nohz tick code about the interrupt exit.  Compiles to nothing
 * without CONFIG_NO_HZ_COMMON.
 */
static inline void tick_irq_exit(void)
{
#ifdef CONFIG_NO_HZ_COMMON
	int cpu = smp_processor_id();

	/*
	 * Only relevant for an idle CPU with no reschedule pending, or for
	 * a full-dynticks CPU: make sure timer wheel updates are propagated.
	 */
	if (!(idle_cpu(cpu) && !need_resched()) && !tick_nohz_full_cpu(cpu))
		return;

	/* Still nested in interrupt context: leave it to the outer exit. */
	if (in_interrupt())
		return;

	tick_nohz_irq_exit();
#endif
}
356
/*
 * Exit an interrupt context. Process softirqs if needed and possible:
 *
 * The hardirq count is dropped first; pending softirqs are dispatched only
 * when that leaves us outside every interrupt context.
 */
void irq_exit(void)
{
	/*
	 * Unless the arch promises (__ARCH_IRQ_EXIT_IRQS_DISABLED) to call us
	 * with interrupts off, disable them here; otherwise just verify.
	 */
#ifndef __ARCH_IRQ_EXIT_IRQS_DISABLED
	local_irq_disable();
#else
	WARN_ON_ONCE(!irqs_disabled());
#endif

	account_irq_exit_time(current);
	trace_hardirq_exit();
	sub_preempt_count(HARDIRQ_OFFSET);
	if (!in_interrupt() && local_softirq_pending())
		invoke_softirq();

	tick_irq_exit();
	rcu_irq_exit();
}
377
/*
 * Mark softirq @nr pending on this CPU.
 *
 * This function must run with irqs disabled!
 */
inline void raise_softirq_irqoff(unsigned int nr)
{
	__raise_softirq_irqoff(nr);

	/*
	 * In an interrupt or softirq (which also covers softirq-disabled
	 * code) there is nothing more to do: the softirq will actually run
	 * once we return from the irq or softirq.
	 */
	if (in_interrupt())
		return;

	/* Otherwise wake ksoftirqd so the softirq is scheduled soon. */
	wakeup_softirqd();
}
397
/*
 * Mark softirq @nr pending on this CPU; safe to call with interrupts
 * enabled, since the interrupt state is saved and restored around the
 * update.
 */
void raise_softirq(unsigned int nr)
{
	unsigned long irqflags;

	local_irq_save(irqflags);
	raise_softirq_irqoff(nr);
	local_irq_restore(irqflags);
}
406
/*
 * Emit the raise tracepoint for softirq @nr and set its bit in the
 * pending mask.  Never wakes ksoftirqd.
 */
void __raise_softirq_irqoff(unsigned int nr)
{
	const unsigned long pending_bit = 1UL << nr;

	trace_softirq_raise(nr);
	or_softirq_pending(pending_bit);
}
412
Carlos R. Mafra962cf362008-05-15 11:15:37 -0300413void open_softirq(int nr, void (*action)(struct softirq_action *))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700414{
Linus Torvalds1da177e2005-04-16 15:20:36 -0700415 softirq_vec[nr].action = action;
416}
417
/*
 * Tasklets
 */
/*
 * Singly linked tasklet queue: @head is the first queued tasklet, @tail
 * points at the link (either @head or some tasklet's ->next) through which
 * the next tasklet is appended.
 */
struct tasklet_head
{
	struct tasklet_struct *head;
	struct tasklet_struct **tail;
};

/* Per-CPU queues drained by tasklet_action() and tasklet_hi_action(). */
static DEFINE_PER_CPU(struct tasklet_head, tasklet_vec);
static DEFINE_PER_CPU(struct tasklet_head, tasklet_hi_vec);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700429
Harvey Harrison7ad5b3a2008-02-08 04:19:53 -0800430void __tasklet_schedule(struct tasklet_struct *t)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700431{
432 unsigned long flags;
433
434 local_irq_save(flags);
Olof Johansson48f20a92008-03-04 15:23:25 -0800435 t->next = NULL;
Christoph Lameter909ea962010-12-08 16:22:55 +0100436 *__this_cpu_read(tasklet_vec.tail) = t;
437 __this_cpu_write(tasklet_vec.tail, &(t->next));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700438 raise_softirq_irqoff(TASKLET_SOFTIRQ);
439 local_irq_restore(flags);
440}
441
442EXPORT_SYMBOL(__tasklet_schedule);
443
Harvey Harrison7ad5b3a2008-02-08 04:19:53 -0800444void __tasklet_hi_schedule(struct tasklet_struct *t)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700445{
446 unsigned long flags;
447
448 local_irq_save(flags);
Olof Johansson48f20a92008-03-04 15:23:25 -0800449 t->next = NULL;
Christoph Lameter909ea962010-12-08 16:22:55 +0100450 *__this_cpu_read(tasklet_hi_vec.tail) = t;
451 __this_cpu_write(tasklet_hi_vec.tail, &(t->next));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700452 raise_softirq_irqoff(HI_SOFTIRQ);
453 local_irq_restore(flags);
454}
455
456EXPORT_SYMBOL(__tasklet_hi_schedule);
457
Vegard Nossum7c692cb2008-05-21 22:53:13 +0200458void __tasklet_hi_schedule_first(struct tasklet_struct *t)
459{
460 BUG_ON(!irqs_disabled());
461
Christoph Lameter909ea962010-12-08 16:22:55 +0100462 t->next = __this_cpu_read(tasklet_hi_vec.head);
463 __this_cpu_write(tasklet_hi_vec.head, t);
Vegard Nossum7c692cb2008-05-21 22:53:13 +0200464 __raise_softirq_irqoff(HI_SOFTIRQ);
465}
466
467EXPORT_SYMBOL(__tasklet_hi_schedule_first);
468
Linus Torvalds1da177e2005-04-16 15:20:36 -0700469static void tasklet_action(struct softirq_action *a)
470{
471 struct tasklet_struct *list;
472
473 local_irq_disable();
Christoph Lameter909ea962010-12-08 16:22:55 +0100474 list = __this_cpu_read(tasklet_vec.head);
475 __this_cpu_write(tasklet_vec.head, NULL);
476 __this_cpu_write(tasklet_vec.tail, &__get_cpu_var(tasklet_vec).head);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700477 local_irq_enable();
478
479 while (list) {
480 struct tasklet_struct *t = list;
481
482 list = list->next;
483
484 if (tasklet_trylock(t)) {
485 if (!atomic_read(&t->count)) {
486 if (!test_and_clear_bit(TASKLET_STATE_SCHED, &t->state))
487 BUG();
488 t->func(t->data);
489 tasklet_unlock(t);
490 continue;
491 }
492 tasklet_unlock(t);
493 }
494
495 local_irq_disable();
Olof Johansson48f20a92008-03-04 15:23:25 -0800496 t->next = NULL;
Christoph Lameter909ea962010-12-08 16:22:55 +0100497 *__this_cpu_read(tasklet_vec.tail) = t;
498 __this_cpu_write(tasklet_vec.tail, &(t->next));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700499 __raise_softirq_irqoff(TASKLET_SOFTIRQ);
500 local_irq_enable();
501 }
502}
503
504static void tasklet_hi_action(struct softirq_action *a)
505{
506 struct tasklet_struct *list;
507
508 local_irq_disable();
Christoph Lameter909ea962010-12-08 16:22:55 +0100509 list = __this_cpu_read(tasklet_hi_vec.head);
510 __this_cpu_write(tasklet_hi_vec.head, NULL);
511 __this_cpu_write(tasklet_hi_vec.tail, &__get_cpu_var(tasklet_hi_vec).head);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700512 local_irq_enable();
513
514 while (list) {
515 struct tasklet_struct *t = list;
516
517 list = list->next;
518
519 if (tasklet_trylock(t)) {
520 if (!atomic_read(&t->count)) {
521 if (!test_and_clear_bit(TASKLET_STATE_SCHED, &t->state))
522 BUG();
523 t->func(t->data);
524 tasklet_unlock(t);
525 continue;
526 }
527 tasklet_unlock(t);
528 }
529
530 local_irq_disable();
Olof Johansson48f20a92008-03-04 15:23:25 -0800531 t->next = NULL;
Christoph Lameter909ea962010-12-08 16:22:55 +0100532 *__this_cpu_read(tasklet_hi_vec.tail) = t;
533 __this_cpu_write(tasklet_hi_vec.tail, &(t->next));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700534 __raise_softirq_irqoff(HI_SOFTIRQ);
535 local_irq_enable();
536 }
537}
538
539
540void tasklet_init(struct tasklet_struct *t,
541 void (*func)(unsigned long), unsigned long data)
542{
543 t->next = NULL;
544 t->state = 0;
545 atomic_set(&t->count, 0);
546 t->func = func;
547 t->data = data;
548}
549
550EXPORT_SYMBOL(tasklet_init);
551
552void tasklet_kill(struct tasklet_struct *t)
553{
554 if (in_interrupt())
555 printk("Attempt to kill tasklet from interrupt\n");
556
557 while (test_and_set_bit(TASKLET_STATE_SCHED, &t->state)) {
H Hartley Sweeten79d381c2009-04-16 19:30:18 -0400558 do {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700559 yield();
H Hartley Sweeten79d381c2009-04-16 19:30:18 -0400560 } while (test_bit(TASKLET_STATE_SCHED, &t->state));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700561 }
562 tasklet_unlock_wait(t);
563 clear_bit(TASKLET_STATE_SCHED, &t->state);
564}
565
566EXPORT_SYMBOL(tasklet_kill);
567
Peter Zijlstra9ba5f002009-07-22 14:18:35 +0200568/*
569 * tasklet_hrtimer
570 */
571
572/*
Peter Zijlstrab9c30322010-02-03 18:08:52 +0100573 * The trampoline is called when the hrtimer expires. It schedules a tasklet
574 * to run __tasklet_hrtimer_trampoline() which in turn will call the intended
575 * hrtimer callback, but from softirq context.
Peter Zijlstra9ba5f002009-07-22 14:18:35 +0200576 */
577static enum hrtimer_restart __hrtimer_tasklet_trampoline(struct hrtimer *timer)
578{
579 struct tasklet_hrtimer *ttimer =
580 container_of(timer, struct tasklet_hrtimer, timer);
581
Peter Zijlstrab9c30322010-02-03 18:08:52 +0100582 tasklet_hi_schedule(&ttimer->tasklet);
583 return HRTIMER_NORESTART;
Peter Zijlstra9ba5f002009-07-22 14:18:35 +0200584}
585
586/*
587 * Helper function which calls the hrtimer callback from
588 * tasklet/softirq context
589 */
590static void __tasklet_hrtimer_trampoline(unsigned long data)
591{
592 struct tasklet_hrtimer *ttimer = (void *)data;
593 enum hrtimer_restart restart;
594
595 restart = ttimer->function(&ttimer->timer);
596 if (restart != HRTIMER_NORESTART)
597 hrtimer_restart(&ttimer->timer);
598}
599
600/**
601 * tasklet_hrtimer_init - Init a tasklet/hrtimer combo for softirq callbacks
602 * @ttimer: tasklet_hrtimer which is initialized
Lucas De Marchi25985ed2011-03-30 22:57:33 -0300603 * @function: hrtimer callback function which gets called from softirq context
Peter Zijlstra9ba5f002009-07-22 14:18:35 +0200604 * @which_clock: clock id (CLOCK_MONOTONIC/CLOCK_REALTIME)
605 * @mode: hrtimer mode (HRTIMER_MODE_ABS/HRTIMER_MODE_REL)
606 */
607void tasklet_hrtimer_init(struct tasklet_hrtimer *ttimer,
608 enum hrtimer_restart (*function)(struct hrtimer *),
609 clockid_t which_clock, enum hrtimer_mode mode)
610{
611 hrtimer_init(&ttimer->timer, which_clock, mode);
612 ttimer->timer.function = __hrtimer_tasklet_trampoline;
613 tasklet_init(&ttimer->tasklet, __tasklet_hrtimer_trampoline,
614 (unsigned long)ttimer);
615 ttimer->function = function;
616}
617EXPORT_SYMBOL_GPL(tasklet_hrtimer_init);
618
/*
 * Remote softirq bits
 */

/* Per-CPU work lists, one list head per softirq number. */
DEFINE_PER_CPU(struct list_head [NR_SOFTIRQS], softirq_work_list);
EXPORT_PER_CPU_SYMBOL(softirq_work_list);
625
626static void __local_trigger(struct call_single_data *cp, int softirq)
627{
628 struct list_head *head = &__get_cpu_var(softirq_work_list[softirq]);
629
630 list_add_tail(&cp->list, head);
631
632 /* Trigger the softirq only if the list was previously empty. */
633 if (head->next == &cp->list)
634 raise_softirq_irqoff(softirq);
635}
636
#ifdef CONFIG_USE_GENERIC_SMP_HELPERS
/*
 * Cross-CPU callback: queue the received call_single_data on the local
 * work list of the softirq encoded in its ->info field.
 *
 * NOTE(review): the cast below assumes the SMP core hands the
 * call_single_data itself to this callback.  If it passes cp->info
 * instead, @data is not a call_single_data and this lookup is wrong --
 * confirm against kernel/smp.c.
 */
static void remote_softirq_receive(void *data)
{
	struct call_single_data *cp = data;
	unsigned long flags;
	int softirq;

	/* The softirq number travels by value inside the pointer. */
	softirq = (int)(long)cp->info;
	local_irq_save(flags);
	__local_trigger(cp, softirq);
	local_irq_restore(flags);
}

/*
 * Try to hand @cp to @cpu for @softirq.
 *
 * Returns 0 if the cross-CPU call was issued, 1 if @cpu is offline and
 * the caller has to queue the work locally.
 */
static int __try_remote_softirq(struct call_single_data *cp, int cpu, int softirq)
{
	if (cpu_online(cpu)) {
		cp->func = remote_softirq_receive;
		/*
		 * Store the number itself, not its address: the call below
		 * does not wait, so a pointer to our by-value parameter
		 * would dangle by the time the receiver reads it.
		 */
		cp->info = (void *)(long)softirq;
		cp->flags = 0;

		__smp_call_function_single(cpu, cp, 0);
		return 0;
	}
	return 1;
}
#else /* CONFIG_USE_GENERIC_SMP_HELPERS */
/* Without the generic SMP helpers remote delivery is never possible. */
static int __try_remote_softirq(struct call_single_data *cp, int cpu, int softirq)
{
	return 1;
}
#endif
668
/**
 * __send_remote_softirq - try to schedule softirq work on a remote cpu
 * @cp: private SMP call function data area
 * @cpu: the remote cpu
 * @this_cpu: the currently executing cpu
 * @softirq: the softirq for the work
 *
 * Attempt to schedule softirq work on a remote cpu.  If this cannot be
 * done, or if @cpu is the current cpu, the work is queued up on the
 * local cpu instead.
 *
 * Interrupts must be disabled.
 */
void __send_remote_softirq(struct call_single_data *cp, int cpu, int this_cpu, int softirq)
{
	/* Remote hand-off succeeded: nothing left to do locally. */
	if (cpu != this_cpu && !__try_remote_softirq(cp, cpu, softirq))
		return;

	__local_trigger(cp, softirq);
}
EXPORT_SYMBOL(__send_remote_softirq);
687
/**
 * send_remote_softirq - try to schedule softirq work on a remote cpu
 * @cp: private SMP call function data area
 * @cpu: the remote cpu
 * @softirq: the softirq for the work
 *
 * Convenience wrapper around __send_remote_softirq(): interrupts are
 * disabled and the current cpu is determined on behalf of the caller.
 */
void send_remote_softirq(struct call_single_data *cp, int cpu, int softirq)
{
	unsigned long irqflags;

	local_irq_save(irqflags);
	__send_remote_softirq(cp, cpu, smp_processor_id(), softirq);
	local_irq_restore(irqflags);
}
EXPORT_SYMBOL(send_remote_softirq);
708
Paul Gortmaker0db06282013-06-19 14:53:51 -0400709static int remote_softirq_cpu_notify(struct notifier_block *self,
David S. Miller54514a72008-09-23 22:15:57 -0700710 unsigned long action, void *hcpu)
711{
712 /*
713 * If a CPU goes away, splice its entries to the current CPU
714 * and trigger a run of the softirq
715 */
716 if (action == CPU_DEAD || action == CPU_DEAD_FROZEN) {
717 int cpu = (unsigned long) hcpu;
718 int i;
719
720 local_irq_disable();
721 for (i = 0; i < NR_SOFTIRQS; i++) {
722 struct list_head *head = &per_cpu(softirq_work_list[i], cpu);
723 struct list_head *local_head;
724
725 if (list_empty(head))
726 continue;
727
728 local_head = &__get_cpu_var(softirq_work_list[i]);
729 list_splice_init(head, local_head);
730 raise_softirq_irqoff(i);
731 }
732 local_irq_enable();
733 }
734
735 return NOTIFY_OK;
736}
737
/* Hotplug notifier hooking up remote_softirq_cpu_notify(); registered in softirq_init(). */
static struct notifier_block remote_softirq_cpu_notifier = {
	.notifier_call	= remote_softirq_cpu_notify,
};
741
Linus Torvalds1da177e2005-04-16 15:20:36 -0700742void __init softirq_init(void)
743{
Olof Johansson48f20a92008-03-04 15:23:25 -0800744 int cpu;
745
746 for_each_possible_cpu(cpu) {
David S. Miller54514a72008-09-23 22:15:57 -0700747 int i;
748
Olof Johansson48f20a92008-03-04 15:23:25 -0800749 per_cpu(tasklet_vec, cpu).tail =
750 &per_cpu(tasklet_vec, cpu).head;
751 per_cpu(tasklet_hi_vec, cpu).tail =
752 &per_cpu(tasklet_hi_vec, cpu).head;
David S. Miller54514a72008-09-23 22:15:57 -0700753 for (i = 0; i < NR_SOFTIRQS; i++)
754 INIT_LIST_HEAD(&per_cpu(softirq_work_list[i], cpu));
Olof Johansson48f20a92008-03-04 15:23:25 -0800755 }
756
David S. Miller54514a72008-09-23 22:15:57 -0700757 register_hotcpu_notifier(&remote_softirq_cpu_notifier);
758
Carlos R. Mafra962cf362008-05-15 11:15:37 -0300759 open_softirq(TASKLET_SOFTIRQ, tasklet_action);
760 open_softirq(HI_SOFTIRQ, tasklet_hi_action);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700761}
762
/*
 * Returns non-zero when softirqs are pending on the local CPU.
 * @cpu is not used.
 */
static int ksoftirqd_should_run(unsigned int cpu)
{
	return local_softirq_pending();
}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700767
/*
 * One ksoftirqd iteration: with interrupts off, check for pending
 * softirqs and, if there are any, process them, note a context switch to
 * RCU for @cpu and offer to reschedule.
 */
static void run_ksoftirqd(unsigned int cpu)
{
	local_irq_disable();

	if (!local_softirq_pending()) {
		local_irq_enable();
		return;
	}

	__do_softirq();
	rcu_note_context_switch(cpu);
	local_irq_enable();
	cond_resched();
}
780
781#ifdef CONFIG_HOTPLUG_CPU
782/*
783 * tasklet_kill_immediate is called to remove a tasklet which can already be
784 * scheduled for execution on @cpu.
785 *
786 * Unlike tasklet_kill, this function removes the tasklet
787 * _immediately_, even if the tasklet is in TASKLET_STATE_SCHED state.
788 *
789 * When this function is called, @cpu must be in the CPU_DEAD state.
790 */
791void tasklet_kill_immediate(struct tasklet_struct *t, unsigned int cpu)
792{
793 struct tasklet_struct **i;
794
795 BUG_ON(cpu_online(cpu));
796 BUG_ON(test_bit(TASKLET_STATE_RUN, &t->state));
797
798 if (!test_bit(TASKLET_STATE_SCHED, &t->state))
799 return;
800
801 /* CPU is dead, so no lock needed. */
Olof Johansson48f20a92008-03-04 15:23:25 -0800802 for (i = &per_cpu(tasklet_vec, cpu).head; *i; i = &(*i)->next) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700803 if (*i == t) {
804 *i = t->next;
Olof Johansson48f20a92008-03-04 15:23:25 -0800805 /* If this was the tail element, move the tail ptr */
806 if (*i == NULL)
807 per_cpu(tasklet_vec, cpu).tail = i;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700808 return;
809 }
810 }
811 BUG();
812}
813
814static void takeover_tasklets(unsigned int cpu)
815{
Linus Torvalds1da177e2005-04-16 15:20:36 -0700816 /* CPU is dead, so no lock needed. */
817 local_irq_disable();
818
819 /* Find end, append list for that CPU. */
Christian Borntraegere5e41722008-05-01 04:34:23 -0700820 if (&per_cpu(tasklet_vec, cpu).head != per_cpu(tasklet_vec, cpu).tail) {
Christoph Lameter909ea962010-12-08 16:22:55 +0100821 *__this_cpu_read(tasklet_vec.tail) = per_cpu(tasklet_vec, cpu).head;
822 this_cpu_write(tasklet_vec.tail, per_cpu(tasklet_vec, cpu).tail);
Christian Borntraegere5e41722008-05-01 04:34:23 -0700823 per_cpu(tasklet_vec, cpu).head = NULL;
824 per_cpu(tasklet_vec, cpu).tail = &per_cpu(tasklet_vec, cpu).head;
825 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700826 raise_softirq_irqoff(TASKLET_SOFTIRQ);
827
Christian Borntraegere5e41722008-05-01 04:34:23 -0700828 if (&per_cpu(tasklet_hi_vec, cpu).head != per_cpu(tasklet_hi_vec, cpu).tail) {
Christoph Lameter909ea962010-12-08 16:22:55 +0100829 *__this_cpu_read(tasklet_hi_vec.tail) = per_cpu(tasklet_hi_vec, cpu).head;
830 __this_cpu_write(tasklet_hi_vec.tail, per_cpu(tasklet_hi_vec, cpu).tail);
Christian Borntraegere5e41722008-05-01 04:34:23 -0700831 per_cpu(tasklet_hi_vec, cpu).head = NULL;
832 per_cpu(tasklet_hi_vec, cpu).tail = &per_cpu(tasklet_hi_vec, cpu).head;
833 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700834 raise_softirq_irqoff(HI_SOFTIRQ);
835
836 local_irq_enable();
837}
838#endif /* CONFIG_HOTPLUG_CPU */
839
Paul Gortmaker0db06282013-06-19 14:53:51 -0400840static int cpu_callback(struct notifier_block *nfb,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700841 unsigned long action,
842 void *hcpu)
843{
Linus Torvalds1da177e2005-04-16 15:20:36 -0700844 switch (action) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700845#ifdef CONFIG_HOTPLUG_CPU
Linus Torvalds1da177e2005-04-16 15:20:36 -0700846 case CPU_DEAD:
Thomas Gleixner3e339b52012-07-16 10:42:37 +0000847 case CPU_DEAD_FROZEN:
848 takeover_tasklets((unsigned long)hcpu);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700849 break;
850#endif /* CONFIG_HOTPLUG_CPU */
Thomas Gleixner3e339b52012-07-16 10:42:37 +0000851 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700852 return NOTIFY_OK;
853}
854
Paul Gortmaker0db06282013-06-19 14:53:51 -0400855static struct notifier_block cpu_nfb = {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700856 .notifier_call = cpu_callback
857};
858
Thomas Gleixner3e339b52012-07-16 10:42:37 +0000859static struct smp_hotplug_thread softirq_threads = {
860 .store = &ksoftirqd,
861 .thread_should_run = ksoftirqd_should_run,
862 .thread_fn = run_ksoftirqd,
863 .thread_comm = "ksoftirqd/%u",
864};
865
Eduard - Gabriel Munteanu7babe8d2008-07-25 19:45:11 -0700866static __init int spawn_ksoftirqd(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700867{
Linus Torvalds1da177e2005-04-16 15:20:36 -0700868 register_cpu_notifier(&cpu_nfb);
Thomas Gleixner3e339b52012-07-16 10:42:37 +0000869
870 BUG_ON(smpboot_register_percpu_thread(&softirq_threads));
871
Linus Torvalds1da177e2005-04-16 15:20:36 -0700872 return 0;
873}
Eduard - Gabriel Munteanu7babe8d2008-07-25 19:45:11 -0700874early_initcall(spawn_ksoftirqd);
Andrew Morton78eef012006-03-22 00:08:16 -0800875
Yinghai Lu43a25632008-12-28 16:01:13 -0800876/*
877 * [ These __weak aliases are kept in a separate compilation unit, so that
878 * GCC does not inline them incorrectly. ]
879 */
880
881int __init __weak early_irq_init(void)
882{
883 return 0;
884}
885
Yinghai Lu4a046d12009-01-12 17:39:24 -0800886int __init __weak arch_probe_nr_irqs(void)
887{
Thomas Gleixnerb683de22010-09-27 20:55:03 +0200888 return NR_IRQS_LEGACY;
Yinghai Lu4a046d12009-01-12 17:39:24 -0800889}
890
Yinghai Lu43a25632008-12-28 16:01:13 -0800891int __init __weak arch_early_irq_init(void)
892{
893 return 0;
894}