blob: 9e368ef35f9a7e5d706abf35fb85fee2a73a8c45 [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001/*
2 * linux/kernel/softirq.c
3 *
4 * Copyright (C) 1992 Linus Torvalds
5 *
Pavel Machekb10db7f2008-01-30 13:30:00 +01006 * Distribute under GPLv2.
7 *
8 * Rewritten. Old one was good in 2.2, but in 2.3 it was immoral. --ANK (990903)
Linus Torvalds1da177e2005-04-16 15:20:36 -07009 */
10
Paul Gortmaker9984de12011-05-23 14:51:41 -040011#include <linux/export.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070012#include <linux/kernel_stat.h>
13#include <linux/interrupt.h>
14#include <linux/init.h>
15#include <linux/mm.h>
16#include <linux/notifier.h>
17#include <linux/percpu.h>
18#include <linux/cpu.h>
Rafael J. Wysocki83144182007-07-17 04:03:35 -070019#include <linux/freezer.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070020#include <linux/kthread.h>
21#include <linux/rcupdate.h>
Steven Rostedt7e49fcc2009-01-22 19:01:40 -050022#include <linux/ftrace.h>
Andrew Morton78eef012006-03-22 00:08:16 -080023#include <linux/smp.h>
Thomas Gleixner3e339b52012-07-16 10:42:37 +000024#include <linux/smpboot.h>
Thomas Gleixner79bf2bb2007-02-16 01:28:03 -080025#include <linux/tick.h>
Heiko Carstensa0e39ed2009-04-29 13:51:39 +020026
27#define CREATE_TRACE_POINTS
Steven Rostedtad8d75f2009-04-14 19:39:12 -040028#include <trace/events/irq.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070029
Linus Torvalds1da177e2005-04-16 15:20:36 -070030/*
31 - No shared variables, all the data are CPU local.
32 - If a softirq needs serialization, let it serialize itself
33 by its own spinlocks.
34 - Even if softirq is serialized, only local cpu is marked for
35 execution. Hence, we get something sort of weak cpu binding.
36 Though it is still not clear, will it result in better locality
37 or will not.
38
39 Examples:
40 - NET RX softirq. It is multithreaded and does not require
41 any global serialization.
42 - NET TX softirq. It kicks software netdevice queues, hence
43 it is logically serialized per device, but this serialization
44 is invisible to common code.
45 - Tasklets: serialized wrt itself.
46 */
47
48#ifndef __ARCH_IRQ_STAT
49irq_cpustat_t irq_stat[NR_CPUS] ____cacheline_aligned;
50EXPORT_SYMBOL(irq_stat);
51#endif
52
Alexey Dobriyan978b0112008-09-06 20:04:36 +020053static struct softirq_action softirq_vec[NR_SOFTIRQS] __cacheline_aligned_in_smp;
Linus Torvalds1da177e2005-04-16 15:20:36 -070054
Venkatesh Pallipadi4dd53d82010-12-21 17:09:00 -080055DEFINE_PER_CPU(struct task_struct *, ksoftirqd);
Linus Torvalds1da177e2005-04-16 15:20:36 -070056
Jason Baron5d592b42009-03-12 14:33:36 -040057char *softirq_to_name[NR_SOFTIRQS] = {
Li Zefan5dd4de52009-09-17 17:38:32 +080058 "HI", "TIMER", "NET_TX", "NET_RX", "BLOCK", "BLOCK_IOPOLL",
Shaohua Li09223372011-06-14 13:26:25 +080059 "TASKLET", "SCHED", "HRTIMER", "RCU"
Jason Baron5d592b42009-03-12 14:33:36 -040060};
61
Linus Torvalds1da177e2005-04-16 15:20:36 -070062/*
63 * we cannot loop indefinitely here to avoid userspace starvation,
64 * but we also don't want to introduce a worst case 1/HZ latency
65 * to the pending events, so lets the scheduler to balance
66 * the softirq load for us.
67 */
Thomas Gleixner676cb022009-07-20 23:33:49 +020068static void wakeup_softirqd(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -070069{
70 /* Interrupts are disabled: no need to stop preemption */
Christoph Lameter909ea962010-12-08 16:22:55 +010071 struct task_struct *tsk = __this_cpu_read(ksoftirqd);
Linus Torvalds1da177e2005-04-16 15:20:36 -070072
73 if (tsk && tsk->state != TASK_RUNNING)
74 wake_up_process(tsk);
75}
76
77/*
Venkatesh Pallipadi75e10562010-10-04 17:03:16 -070078 * preempt_count and SOFTIRQ_OFFSET usage:
79 * - preempt_count is changed by SOFTIRQ_OFFSET on entering or leaving
80 * softirq processing.
81 * - preempt_count is changed by SOFTIRQ_DISABLE_OFFSET (= 2 * SOFTIRQ_OFFSET)
82 * on local_bh_disable or local_bh_enable.
83 * This lets us distinguish between whether we are currently processing
84 * softirq and whether we just have bh disabled.
85 */
86
/*
 * Out-of-line __local_bh_disable_ip(), built only when
 * CONFIG_TRACE_IRQFLAGS is enabled.
 *
 * @ip:  address passed to trace_softirqs_off() as the disabling site
 * @cnt: amount added to preempt_count
 *
 * Must not be called from hardirq context (warns once if it is).
 */
#ifdef CONFIG_TRACE_IRQFLAGS
void __local_bh_disable_ip(unsigned long ip, unsigned int cnt)
{
	unsigned long irq_state;

	WARN_ON_ONCE(in_irq());

	raw_local_irq_save(irq_state);
	/*
	 * The preempt tracer hooks into preempt_count_add and will break
	 * lockdep because it calls back into lockdep after SOFTIRQ_OFFSET
	 * is set and before current->softirq_enabled is cleared.
	 * We must manually increment preempt_count here and manually
	 * call the trace_preempt_off later.
	 */
	__preempt_count_add(cnt);

	/* Were softirqs turned off by the increment above? */
	if (softirq_count() == (cnt & SOFTIRQ_MASK))
		trace_softirqs_off(ip);
	raw_local_irq_restore(irq_state);

	/* The deferred preempt-off trace, see the comment above. */
	if (preempt_count() == cnt)
		trace_preempt_off(CALLER_ADDR0, get_parent_ip(CALLER_ADDR1));
}
EXPORT_SYMBOL(__local_bh_disable_ip);
#endif /* CONFIG_TRACE_IRQFLAGS */
Ingo Molnarde30a2b2006-07-03 00:24:42 -0700119
Venkatesh Pallipadi75e10562010-10-04 17:03:16 -0700120static void __local_bh_enable(unsigned int cnt)
121{
Venkatesh Pallipadi75e10562010-10-04 17:03:16 -0700122 WARN_ON_ONCE(!irqs_disabled());
123
Peter Zijlstra9ea4c382013-11-19 16:13:38 +0100124 if (softirq_count() == (cnt & SOFTIRQ_MASK))
Davidlohr Buesod2e08472013-04-30 11:46:09 -0700125 trace_softirqs_on(_RET_IP_);
Peter Zijlstrabdb43802013-09-10 12:15:23 +0200126 preempt_count_sub(cnt);
Venkatesh Pallipadi75e10562010-10-04 17:03:16 -0700127}
128
Ingo Molnarde30a2b2006-07-03 00:24:42 -0700129/*
130 * Special-case - softirqs can safely be enabled in
131 * cond_resched_softirq(), or by __do_softirq(),
132 * without processing still-pending softirqs:
133 */
134void _local_bh_enable(void)
135{
Frederic Weisbecker5d60d3e2013-09-24 04:11:35 +0200136 WARN_ON_ONCE(in_irq());
Venkatesh Pallipadi75e10562010-10-04 17:03:16 -0700137 __local_bh_enable(SOFTIRQ_DISABLE_OFFSET);
Ingo Molnarde30a2b2006-07-03 00:24:42 -0700138}
139
140EXPORT_SYMBOL(_local_bh_enable);
141
Peter Zijlstra0bd3a172013-11-19 16:13:38 +0100142void __local_bh_enable_ip(unsigned long ip, unsigned int cnt)
Ingo Molnarde30a2b2006-07-03 00:24:42 -0700143{
Johannes Berg0f476b6d2008-06-18 09:29:37 +0200144 WARN_ON_ONCE(in_irq() || irqs_disabled());
Tim Chen3c829c32006-07-30 03:04:02 -0700145#ifdef CONFIG_TRACE_IRQFLAGS
Johannes Berg0f476b6d2008-06-18 09:29:37 +0200146 local_irq_disable();
Tim Chen3c829c32006-07-30 03:04:02 -0700147#endif
Ingo Molnarde30a2b2006-07-03 00:24:42 -0700148 /*
149 * Are softirqs going to be turned on now:
150 */
Venkatesh Pallipadi75e10562010-10-04 17:03:16 -0700151 if (softirq_count() == SOFTIRQ_DISABLE_OFFSET)
Ingo Molnarde30a2b2006-07-03 00:24:42 -0700152 trace_softirqs_on(ip);
153 /*
154 * Keep preemption disabled until we are done with
155 * softirq processing:
156 */
Peter Zijlstra0bd3a172013-11-19 16:13:38 +0100157 preempt_count_sub(cnt - 1);
Ingo Molnarde30a2b2006-07-03 00:24:42 -0700158
Frederic Weisbecker0bed6982013-09-05 16:14:00 +0200159 if (unlikely(!in_interrupt() && local_softirq_pending())) {
160 /*
161 * Run softirq if any pending. And do it in its own stack
162 * as we may be calling this deep in a task call stack already.
163 */
Ingo Molnarde30a2b2006-07-03 00:24:42 -0700164 do_softirq();
Frederic Weisbecker0bed6982013-09-05 16:14:00 +0200165 }
Ingo Molnarde30a2b2006-07-03 00:24:42 -0700166
Peter Zijlstrabdb43802013-09-10 12:15:23 +0200167 preempt_count_dec();
Tim Chen3c829c32006-07-30 03:04:02 -0700168#ifdef CONFIG_TRACE_IRQFLAGS
Johannes Berg0f476b6d2008-06-18 09:29:37 +0200169 local_irq_enable();
Tim Chen3c829c32006-07-30 03:04:02 -0700170#endif
Ingo Molnarde30a2b2006-07-03 00:24:42 -0700171 preempt_check_resched();
172}
Peter Zijlstra0bd3a172013-11-19 16:13:38 +0100173EXPORT_SYMBOL(__local_bh_enable_ip);
Ingo Molnarde30a2b2006-07-03 00:24:42 -0700174
/*
 * Softirq processing is restarted at most MAX_SOFTIRQ_RESTART times, and
 * the loop is also left when need_resched() is set or once
 * MAX_SOFTIRQ_TIME (2 ms) has elapsed.
 *
 * MAX_SOFTIRQ_TIME is a nice upper bound in most cases, but in certain
 * cases, such as stop_machine(), jiffies may cease to increment, so the
 * MAX_SOFTIRQ_RESTART limit is needed as well to make sure we eventually
 * return from __do_softirq().
 *
 * These limits have been established via experimentation. The two things
 * to balance are latency and fairness: we want to handle softirqs as soon
 * as possible, but they should not be able to lock up the box.
 */
#define MAX_SOFTIRQ_TIME	msecs_to_jiffies(2)
#define MAX_SOFTIRQ_RESTART	10
Linus Torvalds1da177e2005-04-16 15:20:36 -0700190
191asmlinkage void __do_softirq(void)
192{
193 struct softirq_action *h;
194 __u32 pending;
Eric Dumazetc10d7362013-01-10 15:26:34 -0800195 unsigned long end = jiffies + MAX_SOFTIRQ_TIME;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700196 int cpu;
Mel Gorman907aed42012-07-31 16:44:07 -0700197 unsigned long old_flags = current->flags;
Ben Greear34376a52013-06-06 14:29:49 -0700198 int max_restart = MAX_SOFTIRQ_RESTART;
Mel Gorman907aed42012-07-31 16:44:07 -0700199
200 /*
201 * Mask out PF_MEMALLOC s current task context is borrowed for the
202 * softirq. A softirq handled such as network RX might set PF_MEMALLOC
203 * again if the socket is related to swap
204 */
205 current->flags &= ~PF_MEMALLOC;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700206
207 pending = local_softirq_pending();
Frederic Weisbecker6a616712012-12-16 20:00:34 +0100208 account_irq_enter_time(current);
Paul Mackerras829035fd2006-07-03 00:25:40 -0700209
Peter Zijlstra0bd3a172013-11-19 16:13:38 +0100210 __local_bh_disable_ip(_RET_IP_, SOFTIRQ_OFFSET);
Ingo Molnard820ac42009-03-13 01:30:40 +0100211 lockdep_softirq_enter();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700212
Linus Torvalds1da177e2005-04-16 15:20:36 -0700213 cpu = smp_processor_id();
214restart:
215 /* Reset the pending bitmask before enabling irqs */
Andi Kleen3f744782005-09-12 18:49:24 +0200216 set_softirq_pending(0);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700217
Andrew Mortonc70f5d62005-07-30 10:22:49 -0700218 local_irq_enable();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700219
220 h = softirq_vec;
221
222 do {
223 if (pending & 1) {
Thomas Gleixnerf4bc6bb2010-10-19 15:00:13 +0200224 unsigned int vec_nr = h - softirq_vec;
Thomas Gleixner8e85b4b2008-10-02 10:50:53 +0200225 int prev_count = preempt_count();
226
Thomas Gleixnerf4bc6bb2010-10-19 15:00:13 +0200227 kstat_incr_softirqs_this_cpu(vec_nr);
228
229 trace_softirq_entry(vec_nr);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700230 h->action(h);
Thomas Gleixnerf4bc6bb2010-10-19 15:00:13 +0200231 trace_softirq_exit(vec_nr);
Thomas Gleixner8e85b4b2008-10-02 10:50:53 +0200232 if (unlikely(prev_count != preempt_count())) {
Thomas Gleixnerf4bc6bb2010-10-19 15:00:13 +0200233 printk(KERN_ERR "huh, entered softirq %u %s %p"
Thomas Gleixner8e85b4b2008-10-02 10:50:53 +0200234 "with preempt_count %08x,"
Thomas Gleixnerf4bc6bb2010-10-19 15:00:13 +0200235 " exited with %08x?\n", vec_nr,
236 softirq_to_name[vec_nr], h->action,
237 prev_count, preempt_count());
Peter Zijlstra4a2b4b22013-08-14 14:55:24 +0200238 preempt_count_set(prev_count);
Thomas Gleixner8e85b4b2008-10-02 10:50:53 +0200239 }
240
Paul E. McKenneyd6714c22009-08-22 13:56:46 -0700241 rcu_bh_qs(cpu);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700242 }
243 h++;
244 pending >>= 1;
245 } while (pending);
246
Andrew Mortonc70f5d62005-07-30 10:22:49 -0700247 local_irq_disable();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700248
249 pending = local_softirq_pending();
Eric Dumazetc10d7362013-01-10 15:26:34 -0800250 if (pending) {
Ben Greear34376a52013-06-06 14:29:49 -0700251 if (time_before(jiffies, end) && !need_resched() &&
252 --max_restart)
Eric Dumazetc10d7362013-01-10 15:26:34 -0800253 goto restart;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700254
Linus Torvalds1da177e2005-04-16 15:20:36 -0700255 wakeup_softirqd();
Eric Dumazetc10d7362013-01-10 15:26:34 -0800256 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700257
Ingo Molnard820ac42009-03-13 01:30:40 +0100258 lockdep_softirq_exit();
Paul Mackerras829035fd2006-07-03 00:25:40 -0700259
Frederic Weisbecker6a616712012-12-16 20:00:34 +0100260 account_irq_exit_time(current);
Venkatesh Pallipadi75e10562010-10-04 17:03:16 -0700261 __local_bh_enable(SOFTIRQ_OFFSET);
Frederic Weisbecker5d60d3e2013-09-24 04:11:35 +0200262 WARN_ON_ONCE(in_interrupt());
Mel Gorman907aed42012-07-31 16:44:07 -0700263 tsk_restore_flags(current, old_flags, PF_MEMALLOC);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700264}
265
Frederic Weisbecker7d65f4a2013-09-05 15:49:45 +0200266
Linus Torvalds1da177e2005-04-16 15:20:36 -0700267
268asmlinkage void do_softirq(void)
269{
270 __u32 pending;
271 unsigned long flags;
272
273 if (in_interrupt())
274 return;
275
276 local_irq_save(flags);
277
278 pending = local_softirq_pending();
279
280 if (pending)
Frederic Weisbecker7d65f4a2013-09-05 15:49:45 +0200281 do_softirq_own_stack();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700282
283 local_irq_restore(flags);
284}
285
Ingo Molnardde4b2b2007-02-16 01:27:45 -0800286/*
287 * Enter an interrupt context.
288 */
289void irq_enter(void)
290{
Venki Pallipadi6378ddb2008-01-30 13:30:04 +0100291 int cpu = smp_processor_id();
Thomas Gleixner719254f2008-10-17 09:59:47 +0200292
Paul E. McKenney64db4cf2008-12-18 21:55:32 +0100293 rcu_irq_enter();
Frederic Weisbecker0a8a2e72012-01-24 18:59:44 +0100294 if (is_idle_task(current) && !in_interrupt()) {
Venkatesh Pallipadid267f872010-10-04 17:03:23 -0700295 /*
296 * Prevent raise_softirq from needlessly waking up ksoftirqd
297 * here, as softirq will be serviced on return from interrupt.
298 */
299 local_bh_disable();
Thomas Gleixner719254f2008-10-17 09:59:47 +0200300 tick_check_idle(cpu);
Venkatesh Pallipadid267f872010-10-04 17:03:23 -0700301 _local_bh_enable();
302 }
303
304 __irq_enter();
Ingo Molnardde4b2b2007-02-16 01:27:45 -0800305}
306
Heiko Carstensb2a00172012-03-05 15:07:25 -0800307static inline void invoke_softirq(void)
308{
Frederic Weisbeckerded79752013-09-24 00:50:25 +0200309 if (!force_irqthreads) {
Frederic Weisbeckercc1f0272013-09-24 17:17:47 +0200310#ifdef CONFIG_HAVE_IRQ_EXIT_ON_IRQ_STACK
Frederic Weisbeckerded79752013-09-24 00:50:25 +0200311 /*
312 * We can safely execute softirq on the current stack if
313 * it is the irq stack, because it should be near empty
Frederic Weisbeckercc1f0272013-09-24 17:17:47 +0200314 * at this stage.
315 */
316 __do_softirq();
317#else
318 /*
319 * Otherwise, irq_exit() is called on the task stack that can
320 * be potentially deep already. So call softirq in its own stack
321 * to prevent from any overrun.
Frederic Weisbeckerded79752013-09-24 00:50:25 +0200322 */
Frederic Weisbeckerbe6e1012013-09-24 16:39:41 +0200323 do_softirq_own_stack();
Frederic Weisbeckercc1f0272013-09-24 17:17:47 +0200324#endif
Frederic Weisbeckerded79752013-09-24 00:50:25 +0200325 } else {
Thomas Gleixner8d32a302011-02-23 23:52:23 +0000326 wakeup_softirqd();
Frederic Weisbeckerded79752013-09-24 00:50:25 +0200327 }
Thomas Gleixner8d32a302011-02-23 23:52:23 +0000328}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700329
/*
 * Tick handling at interrupt exit. Compiles to nothing unless
 * CONFIG_NO_HZ_COMMON is enabled.
 */
static inline void tick_irq_exit(void)
{
#ifdef CONFIG_NO_HZ_COMMON
	int cpu = smp_processor_id();
	bool wants_tick_update;

	/* Make sure that timer wheel updates are propagated */
	wants_tick_update = (idle_cpu(cpu) && !need_resched()) ||
			    tick_nohz_full_cpu(cpu);

	if (wants_tick_update && !in_interrupt())
		tick_nohz_irq_exit();
#endif
}
342
Linus Torvalds1da177e2005-04-16 15:20:36 -0700343/*
344 * Exit an interrupt context. Process softirqs if needed and possible:
345 */
346void irq_exit(void)
347{
Thomas Gleixner74eed012013-02-20 22:00:48 +0100348#ifndef __ARCH_IRQ_EXIT_IRQS_DISABLED
Frederic Weisbecker4cd5d112013-02-28 20:00:43 +0100349 local_irq_disable();
Thomas Gleixner74eed012013-02-20 22:00:48 +0100350#else
351 WARN_ON_ONCE(!irqs_disabled());
352#endif
353
Frederic Weisbecker6a616712012-12-16 20:00:34 +0100354 account_irq_exit_time(current);
Ingo Molnarde30a2b2006-07-03 00:24:42 -0700355 trace_hardirq_exit();
Peter Zijlstrabdb43802013-09-10 12:15:23 +0200356 preempt_count_sub(HARDIRQ_OFFSET);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700357 if (!in_interrupt() && local_softirq_pending())
358 invoke_softirq();
Thomas Gleixner79bf2bb2007-02-16 01:28:03 -0800359
Frederic Weisbecker67826ea2013-04-20 17:43:13 +0200360 tick_irq_exit();
Frederic Weisbecker416eb332011-10-07 16:31:02 -0700361 rcu_irq_exit();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700362}
363
/*
 * Mark softirq @nr pending on this CPU.
 *
 * This function must run with irqs disabled!
 */
inline void raise_softirq_irqoff(unsigned int nr)
{
	__raise_softirq_irqoff(nr);

	/*
	 * If we're in an interrupt or softirq, we're done
	 * (this also catches softirq-disabled code). We will
	 * actually run the softirq once we return from
	 * the irq or softirq.
	 */
	if (in_interrupt())
		return;

	/* Otherwise wake ksoftirqd to make sure the softirq runs soon. */
	wakeup_softirqd();
}
383
/*
 * Mark softirq @nr pending on this CPU. Wraps raise_softirq_irqoff()
 * in an irq save/restore pair.
 */
void raise_softirq(unsigned int nr)
{
	unsigned long irq_state;

	local_irq_save(irq_state);
	raise_softirq_irqoff(nr);
	local_irq_restore(irq_state);
}
392
/*
 * Set the pending bit for softirq @nr and emit the raise tracepoint.
 * Unlike raise_softirq_irqoff(), this never wakes ksoftirqd.
 */
void __raise_softirq_irqoff(unsigned int nr)
{
	trace_softirq_raise(nr);

	or_softirq_pending(1UL << nr);
}
398
Carlos R. Mafra962cf362008-05-15 11:15:37 -0300399void open_softirq(int nr, void (*action)(struct softirq_action *))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700400{
Linus Torvalds1da177e2005-04-16 15:20:36 -0700401 softirq_vec[nr].action = action;
402}
403
Peter Zijlstra9ba5f002009-07-22 14:18:35 +0200404/*
405 * Tasklets
406 */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700407struct tasklet_head
408{
Olof Johansson48f20a92008-03-04 15:23:25 -0800409 struct tasklet_struct *head;
410 struct tasklet_struct **tail;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700411};
412
Vegard Nossum4620b492008-06-12 23:21:53 +0200413static DEFINE_PER_CPU(struct tasklet_head, tasklet_vec);
414static DEFINE_PER_CPU(struct tasklet_head, tasklet_hi_vec);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700415
Harvey Harrison7ad5b3a2008-02-08 04:19:53 -0800416void __tasklet_schedule(struct tasklet_struct *t)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700417{
418 unsigned long flags;
419
420 local_irq_save(flags);
Olof Johansson48f20a92008-03-04 15:23:25 -0800421 t->next = NULL;
Christoph Lameter909ea962010-12-08 16:22:55 +0100422 *__this_cpu_read(tasklet_vec.tail) = t;
423 __this_cpu_write(tasklet_vec.tail, &(t->next));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700424 raise_softirq_irqoff(TASKLET_SOFTIRQ);
425 local_irq_restore(flags);
426}
427
428EXPORT_SYMBOL(__tasklet_schedule);
429
Harvey Harrison7ad5b3a2008-02-08 04:19:53 -0800430void __tasklet_hi_schedule(struct tasklet_struct *t)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700431{
432 unsigned long flags;
433
434 local_irq_save(flags);
Olof Johansson48f20a92008-03-04 15:23:25 -0800435 t->next = NULL;
Christoph Lameter909ea962010-12-08 16:22:55 +0100436 *__this_cpu_read(tasklet_hi_vec.tail) = t;
437 __this_cpu_write(tasklet_hi_vec.tail, &(t->next));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700438 raise_softirq_irqoff(HI_SOFTIRQ);
439 local_irq_restore(flags);
440}
441
442EXPORT_SYMBOL(__tasklet_hi_schedule);
443
Vegard Nossum7c692cb2008-05-21 22:53:13 +0200444void __tasklet_hi_schedule_first(struct tasklet_struct *t)
445{
446 BUG_ON(!irqs_disabled());
447
Christoph Lameter909ea962010-12-08 16:22:55 +0100448 t->next = __this_cpu_read(tasklet_hi_vec.head);
449 __this_cpu_write(tasklet_hi_vec.head, t);
Vegard Nossum7c692cb2008-05-21 22:53:13 +0200450 __raise_softirq_irqoff(HI_SOFTIRQ);
451}
452
453EXPORT_SYMBOL(__tasklet_hi_schedule_first);
454
Linus Torvalds1da177e2005-04-16 15:20:36 -0700455static void tasklet_action(struct softirq_action *a)
456{
457 struct tasklet_struct *list;
458
459 local_irq_disable();
Christoph Lameter909ea962010-12-08 16:22:55 +0100460 list = __this_cpu_read(tasklet_vec.head);
461 __this_cpu_write(tasklet_vec.head, NULL);
462 __this_cpu_write(tasklet_vec.tail, &__get_cpu_var(tasklet_vec).head);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700463 local_irq_enable();
464
465 while (list) {
466 struct tasklet_struct *t = list;
467
468 list = list->next;
469
470 if (tasklet_trylock(t)) {
471 if (!atomic_read(&t->count)) {
472 if (!test_and_clear_bit(TASKLET_STATE_SCHED, &t->state))
473 BUG();
474 t->func(t->data);
475 tasklet_unlock(t);
476 continue;
477 }
478 tasklet_unlock(t);
479 }
480
481 local_irq_disable();
Olof Johansson48f20a92008-03-04 15:23:25 -0800482 t->next = NULL;
Christoph Lameter909ea962010-12-08 16:22:55 +0100483 *__this_cpu_read(tasklet_vec.tail) = t;
484 __this_cpu_write(tasklet_vec.tail, &(t->next));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700485 __raise_softirq_irqoff(TASKLET_SOFTIRQ);
486 local_irq_enable();
487 }
488}
489
490static void tasklet_hi_action(struct softirq_action *a)
491{
492 struct tasklet_struct *list;
493
494 local_irq_disable();
Christoph Lameter909ea962010-12-08 16:22:55 +0100495 list = __this_cpu_read(tasklet_hi_vec.head);
496 __this_cpu_write(tasklet_hi_vec.head, NULL);
497 __this_cpu_write(tasklet_hi_vec.tail, &__get_cpu_var(tasklet_hi_vec).head);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700498 local_irq_enable();
499
500 while (list) {
501 struct tasklet_struct *t = list;
502
503 list = list->next;
504
505 if (tasklet_trylock(t)) {
506 if (!atomic_read(&t->count)) {
507 if (!test_and_clear_bit(TASKLET_STATE_SCHED, &t->state))
508 BUG();
509 t->func(t->data);
510 tasklet_unlock(t);
511 continue;
512 }
513 tasklet_unlock(t);
514 }
515
516 local_irq_disable();
Olof Johansson48f20a92008-03-04 15:23:25 -0800517 t->next = NULL;
Christoph Lameter909ea962010-12-08 16:22:55 +0100518 *__this_cpu_read(tasklet_hi_vec.tail) = t;
519 __this_cpu_write(tasklet_hi_vec.tail, &(t->next));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700520 __raise_softirq_irqoff(HI_SOFTIRQ);
521 local_irq_enable();
522 }
523}
524
525
526void tasklet_init(struct tasklet_struct *t,
527 void (*func)(unsigned long), unsigned long data)
528{
529 t->next = NULL;
530 t->state = 0;
531 atomic_set(&t->count, 0);
532 t->func = func;
533 t->data = data;
534}
535
536EXPORT_SYMBOL(tasklet_init);
537
538void tasklet_kill(struct tasklet_struct *t)
539{
540 if (in_interrupt())
541 printk("Attempt to kill tasklet from interrupt\n");
542
543 while (test_and_set_bit(TASKLET_STATE_SCHED, &t->state)) {
H Hartley Sweeten79d381c2009-04-16 19:30:18 -0400544 do {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700545 yield();
H Hartley Sweeten79d381c2009-04-16 19:30:18 -0400546 } while (test_bit(TASKLET_STATE_SCHED, &t->state));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700547 }
548 tasklet_unlock_wait(t);
549 clear_bit(TASKLET_STATE_SCHED, &t->state);
550}
551
552EXPORT_SYMBOL(tasklet_kill);
553
Peter Zijlstra9ba5f002009-07-22 14:18:35 +0200554/*
555 * tasklet_hrtimer
556 */
557
558/*
Peter Zijlstrab9c30322010-02-03 18:08:52 +0100559 * The trampoline is called when the hrtimer expires. It schedules a tasklet
560 * to run __tasklet_hrtimer_trampoline() which in turn will call the intended
561 * hrtimer callback, but from softirq context.
Peter Zijlstra9ba5f002009-07-22 14:18:35 +0200562 */
563static enum hrtimer_restart __hrtimer_tasklet_trampoline(struct hrtimer *timer)
564{
565 struct tasklet_hrtimer *ttimer =
566 container_of(timer, struct tasklet_hrtimer, timer);
567
Peter Zijlstrab9c30322010-02-03 18:08:52 +0100568 tasklet_hi_schedule(&ttimer->tasklet);
569 return HRTIMER_NORESTART;
Peter Zijlstra9ba5f002009-07-22 14:18:35 +0200570}
571
572/*
573 * Helper function which calls the hrtimer callback from
574 * tasklet/softirq context
575 */
576static void __tasklet_hrtimer_trampoline(unsigned long data)
577{
578 struct tasklet_hrtimer *ttimer = (void *)data;
579 enum hrtimer_restart restart;
580
581 restart = ttimer->function(&ttimer->timer);
582 if (restart != HRTIMER_NORESTART)
583 hrtimer_restart(&ttimer->timer);
584}
585
586/**
587 * tasklet_hrtimer_init - Init a tasklet/hrtimer combo for softirq callbacks
588 * @ttimer: tasklet_hrtimer which is initialized
Lucas De Marchi25985ed2011-03-30 22:57:33 -0300589 * @function: hrtimer callback function which gets called from softirq context
Peter Zijlstra9ba5f002009-07-22 14:18:35 +0200590 * @which_clock: clock id (CLOCK_MONOTONIC/CLOCK_REALTIME)
591 * @mode: hrtimer mode (HRTIMER_MODE_ABS/HRTIMER_MODE_REL)
592 */
593void tasklet_hrtimer_init(struct tasklet_hrtimer *ttimer,
594 enum hrtimer_restart (*function)(struct hrtimer *),
595 clockid_t which_clock, enum hrtimer_mode mode)
596{
597 hrtimer_init(&ttimer->timer, which_clock, mode);
598 ttimer->timer.function = __hrtimer_tasklet_trampoline;
599 tasklet_init(&ttimer->tasklet, __tasklet_hrtimer_trampoline,
600 (unsigned long)ttimer);
601 ttimer->function = function;
602}
603EXPORT_SYMBOL_GPL(tasklet_hrtimer_init);
604
Linus Torvalds1da177e2005-04-16 15:20:36 -0700605void __init softirq_init(void)
606{
Olof Johansson48f20a92008-03-04 15:23:25 -0800607 int cpu;
608
609 for_each_possible_cpu(cpu) {
610 per_cpu(tasklet_vec, cpu).tail =
611 &per_cpu(tasklet_vec, cpu).head;
612 per_cpu(tasklet_hi_vec, cpu).tail =
613 &per_cpu(tasklet_hi_vec, cpu).head;
614 }
615
Carlos R. Mafra962cf362008-05-15 11:15:37 -0300616 open_softirq(TASKLET_SOFTIRQ, tasklet_action);
617 open_softirq(HI_SOFTIRQ, tasklet_hi_action);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700618}
619
/*
 * thread_should_run callback for ksoftirqd: non-zero when softirqs are
 * pending on the local CPU. @cpu is not used.
 */
static int ksoftirqd_should_run(unsigned int cpu)
{
	return local_softirq_pending();
}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700624
/*
 * thread_fn callback for ksoftirqd: process pending softirqs, if any.
 */
static void run_ksoftirqd(unsigned int cpu)
{
	local_irq_disable();

	if (!local_softirq_pending()) {
		local_irq_enable();
		return;
	}

	/*
	 * We can safely run softirq on inline stack, as we are not deep
	 * in the task stack here.
	 */
	__do_softirq();
	rcu_note_context_switch(cpu);
	local_irq_enable();
	cond_resched();
}
641
642#ifdef CONFIG_HOTPLUG_CPU
643/*
644 * tasklet_kill_immediate is called to remove a tasklet which can already be
645 * scheduled for execution on @cpu.
646 *
647 * Unlike tasklet_kill, this function removes the tasklet
648 * _immediately_, even if the tasklet is in TASKLET_STATE_SCHED state.
649 *
650 * When this function is called, @cpu must be in the CPU_DEAD state.
651 */
652void tasklet_kill_immediate(struct tasklet_struct *t, unsigned int cpu)
653{
654 struct tasklet_struct **i;
655
656 BUG_ON(cpu_online(cpu));
657 BUG_ON(test_bit(TASKLET_STATE_RUN, &t->state));
658
659 if (!test_bit(TASKLET_STATE_SCHED, &t->state))
660 return;
661
662 /* CPU is dead, so no lock needed. */
Olof Johansson48f20a92008-03-04 15:23:25 -0800663 for (i = &per_cpu(tasklet_vec, cpu).head; *i; i = &(*i)->next) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700664 if (*i == t) {
665 *i = t->next;
Olof Johansson48f20a92008-03-04 15:23:25 -0800666 /* If this was the tail element, move the tail ptr */
667 if (*i == NULL)
668 per_cpu(tasklet_vec, cpu).tail = i;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700669 return;
670 }
671 }
672 BUG();
673}
674
675static void takeover_tasklets(unsigned int cpu)
676{
Linus Torvalds1da177e2005-04-16 15:20:36 -0700677 /* CPU is dead, so no lock needed. */
678 local_irq_disable();
679
680 /* Find end, append list for that CPU. */
Christian Borntraegere5e41722008-05-01 04:34:23 -0700681 if (&per_cpu(tasklet_vec, cpu).head != per_cpu(tasklet_vec, cpu).tail) {
Christoph Lameter909ea962010-12-08 16:22:55 +0100682 *__this_cpu_read(tasklet_vec.tail) = per_cpu(tasklet_vec, cpu).head;
683 this_cpu_write(tasklet_vec.tail, per_cpu(tasklet_vec, cpu).tail);
Christian Borntraegere5e41722008-05-01 04:34:23 -0700684 per_cpu(tasklet_vec, cpu).head = NULL;
685 per_cpu(tasklet_vec, cpu).tail = &per_cpu(tasklet_vec, cpu).head;
686 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700687 raise_softirq_irqoff(TASKLET_SOFTIRQ);
688
Christian Borntraegere5e41722008-05-01 04:34:23 -0700689 if (&per_cpu(tasklet_hi_vec, cpu).head != per_cpu(tasklet_hi_vec, cpu).tail) {
Christoph Lameter909ea962010-12-08 16:22:55 +0100690 *__this_cpu_read(tasklet_hi_vec.tail) = per_cpu(tasklet_hi_vec, cpu).head;
691 __this_cpu_write(tasklet_hi_vec.tail, per_cpu(tasklet_hi_vec, cpu).tail);
Christian Borntraegere5e41722008-05-01 04:34:23 -0700692 per_cpu(tasklet_hi_vec, cpu).head = NULL;
693 per_cpu(tasklet_hi_vec, cpu).tail = &per_cpu(tasklet_hi_vec, cpu).head;
694 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700695 raise_softirq_irqoff(HI_SOFTIRQ);
696
697 local_irq_enable();
698}
699#endif /* CONFIG_HOTPLUG_CPU */
700
Paul Gortmaker0db06282013-06-19 14:53:51 -0400701static int cpu_callback(struct notifier_block *nfb,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700702 unsigned long action,
703 void *hcpu)
704{
Linus Torvalds1da177e2005-04-16 15:20:36 -0700705 switch (action) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700706#ifdef CONFIG_HOTPLUG_CPU
Linus Torvalds1da177e2005-04-16 15:20:36 -0700707 case CPU_DEAD:
Thomas Gleixner3e339b52012-07-16 10:42:37 +0000708 case CPU_DEAD_FROZEN:
709 takeover_tasklets((unsigned long)hcpu);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700710 break;
711#endif /* CONFIG_HOTPLUG_CPU */
Thomas Gleixner3e339b52012-07-16 10:42:37 +0000712 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700713 return NOTIFY_OK;
714}
715
Paul Gortmaker0db06282013-06-19 14:53:51 -0400716static struct notifier_block cpu_nfb = {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700717 .notifier_call = cpu_callback
718};
719
Thomas Gleixner3e339b52012-07-16 10:42:37 +0000720static struct smp_hotplug_thread softirq_threads = {
721 .store = &ksoftirqd,
722 .thread_should_run = ksoftirqd_should_run,
723 .thread_fn = run_ksoftirqd,
724 .thread_comm = "ksoftirqd/%u",
725};
726
Eduard - Gabriel Munteanu7babe8d2008-07-25 19:45:11 -0700727static __init int spawn_ksoftirqd(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700728{
Linus Torvalds1da177e2005-04-16 15:20:36 -0700729 register_cpu_notifier(&cpu_nfb);
Thomas Gleixner3e339b52012-07-16 10:42:37 +0000730
731 BUG_ON(smpboot_register_percpu_thread(&softirq_threads));
732
Linus Torvalds1da177e2005-04-16 15:20:36 -0700733 return 0;
734}
Eduard - Gabriel Munteanu7babe8d2008-07-25 19:45:11 -0700735early_initcall(spawn_ksoftirqd);
Andrew Morton78eef012006-03-22 00:08:16 -0800736
Yinghai Lu43a25632008-12-28 16:01:13 -0800737/*
738 * [ These __weak aliases are kept in a separate compilation unit, so that
739 * GCC does not inline them incorrectly. ]
740 */
741
742int __init __weak early_irq_init(void)
743{
744 return 0;
745}
746
Yinghai Lu4a046d12009-01-12 17:39:24 -0800747int __init __weak arch_probe_nr_irqs(void)
748{
Thomas Gleixnerb683de22010-09-27 20:55:03 +0200749 return NR_IRQS_LEGACY;
Yinghai Lu4a046d12009-01-12 17:39:24 -0800750}
751
Yinghai Lu43a25632008-12-28 16:01:13 -0800752int __init __weak arch_early_irq_init(void)
753{
754 return 0;
755}