blob: ba79bbfe380e3ebf027f556c4b31abe8f7906892 [file] [log] [blame]
/*
 *	linux/kernel/softirq.c
 *
 *	Copyright (C) 1992 Linus Torvalds
 *
 *	Distribute under GPLv2.
 *
 *	Rewritten. Old one was good in 2.2, but in 2.3 it was immoral. --ANK (990903)
 */
10
Paul Gortmaker9984de12011-05-23 14:51:41 -040011#include <linux/export.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070012#include <linux/kernel_stat.h>
13#include <linux/interrupt.h>
14#include <linux/init.h>
15#include <linux/mm.h>
16#include <linux/notifier.h>
17#include <linux/percpu.h>
18#include <linux/cpu.h>
Rafael J. Wysocki83144182007-07-17 04:03:35 -070019#include <linux/freezer.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070020#include <linux/kthread.h>
21#include <linux/rcupdate.h>
Steven Rostedt7e49fcc2009-01-22 19:01:40 -050022#include <linux/ftrace.h>
Andrew Morton78eef012006-03-22 00:08:16 -080023#include <linux/smp.h>
Thomas Gleixner3e339b52012-07-16 10:42:37 +000024#include <linux/smpboot.h>
Thomas Gleixner79bf2bb2007-02-16 01:28:03 -080025#include <linux/tick.h>
Heiko Carstensa0e39ed2009-04-29 13:51:39 +020026
27#define CREATE_TRACE_POINTS
Steven Rostedtad8d75f2009-04-14 19:39:12 -040028#include <trace/events/irq.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070029
/*
   - No shared variables, all the data are CPU local.
   - If a softirq needs serialization, let it serialize itself
     by its own spinlocks.
   - Even if softirq is serialized, only local cpu is marked for
     execution. Hence, we get something sort of weak cpu binding.
     It is still not clear, though, whether this results in better
     locality or not.

   Examples:
   - NET RX softirq. It is multithreaded and does not require
     any global serialization.
   - NET TX softirq. It kicks software netdevice queues, hence
     it is logically serialized per device, but this serialization
     is invisible to common code.
   - Tasklets: serialized wrt itself.
 */
47
48#ifndef __ARCH_IRQ_STAT
49irq_cpustat_t irq_stat[NR_CPUS] ____cacheline_aligned;
50EXPORT_SYMBOL(irq_stat);
51#endif
52
Alexey Dobriyan978b0112008-09-06 20:04:36 +020053static struct softirq_action softirq_vec[NR_SOFTIRQS] __cacheline_aligned_in_smp;
Linus Torvalds1da177e2005-04-16 15:20:36 -070054
Venkatesh Pallipadi4dd53d82010-12-21 17:09:00 -080055DEFINE_PER_CPU(struct task_struct *, ksoftirqd);
Linus Torvalds1da177e2005-04-16 15:20:36 -070056
Jason Baron5d592b42009-03-12 14:33:36 -040057char *softirq_to_name[NR_SOFTIRQS] = {
Li Zefan5dd4de52009-09-17 17:38:32 +080058 "HI", "TIMER", "NET_TX", "NET_RX", "BLOCK", "BLOCK_IOPOLL",
Shaohua Li09223372011-06-14 13:26:25 +080059 "TASKLET", "SCHED", "HRTIMER", "RCU"
Jason Baron5d592b42009-03-12 14:33:36 -040060};
61
Linus Torvalds1da177e2005-04-16 15:20:36 -070062/*
63 * we cannot loop indefinitely here to avoid userspace starvation,
64 * but we also don't want to introduce a worst case 1/HZ latency
65 * to the pending events, so lets the scheduler to balance
66 * the softirq load for us.
67 */
Thomas Gleixner676cb022009-07-20 23:33:49 +020068static void wakeup_softirqd(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -070069{
70 /* Interrupts are disabled: no need to stop preemption */
Christoph Lameter909ea962010-12-08 16:22:55 +010071 struct task_struct *tsk = __this_cpu_read(ksoftirqd);
Linus Torvalds1da177e2005-04-16 15:20:36 -070072
73 if (tsk && tsk->state != TASK_RUNNING)
74 wake_up_process(tsk);
75}
76
/*
 * preempt_count and SOFTIRQ_OFFSET usage:
 * - preempt_count is changed by SOFTIRQ_OFFSET on entering or leaving
 *   softirq processing.
 * - preempt_count is changed by SOFTIRQ_DISABLE_OFFSET (= 2 * SOFTIRQ_OFFSET)
 *   on local_bh_disable or local_bh_enable.
 * This lets us distinguish between whether we are currently processing
 * softirq and whether we just have bh disabled.
 */
86
/*
 * This one is for softirq.c-internal use,
 * where hardirqs are disabled legitimately:
 */
#ifdef CONFIG_TRACE_IRQFLAGS
/*
 * Add @cnt to preempt_count and emit the softirqs-off / preempt-off
 * trace events. @ip is the address passed to trace_softirqs_off().
 */
void __local_bh_disable_ip(unsigned long ip, unsigned int cnt)
{
	unsigned long irq_state;

	WARN_ON_ONCE(in_irq());

	raw_local_irq_save(irq_state);
	/*
	 * The preempt tracer hooks into preempt_count_add and will break
	 * lockdep because it calls back into lockdep after SOFTIRQ_OFFSET
	 * is set and before current->softirq_enabled is cleared.
	 * We must manually increment preempt_count here and manually
	 * call the trace_preempt_off later.
	 */
	__preempt_count_add(cnt);

	/* Were softirqs turned off by the increment above? */
	if (softirq_count() == (cnt & SOFTIRQ_MASK))
		trace_softirqs_off(ip);
	raw_local_irq_restore(irq_state);

	/* The deferred preempt-off trace, done after irqs are restored. */
	if (preempt_count() == cnt)
		trace_preempt_off(CALLER_ADDR0, get_parent_ip(CALLER_ADDR1));
}
EXPORT_SYMBOL(__local_bh_disable_ip);
#endif /* CONFIG_TRACE_IRQFLAGS */
Ingo Molnarde30a2b2006-07-03 00:24:42 -0700119
Venkatesh Pallipadi75e10562010-10-04 17:03:16 -0700120static void __local_bh_enable(unsigned int cnt)
121{
Venkatesh Pallipadi75e10562010-10-04 17:03:16 -0700122 WARN_ON_ONCE(!irqs_disabled());
123
Peter Zijlstra9ea4c382013-11-19 16:13:38 +0100124 if (softirq_count() == (cnt & SOFTIRQ_MASK))
Davidlohr Buesod2e08472013-04-30 11:46:09 -0700125 trace_softirqs_on(_RET_IP_);
Peter Zijlstrabdb43802013-09-10 12:15:23 +0200126 preempt_count_sub(cnt);
Venkatesh Pallipadi75e10562010-10-04 17:03:16 -0700127}
128
Ingo Molnarde30a2b2006-07-03 00:24:42 -0700129/*
130 * Special-case - softirqs can safely be enabled in
131 * cond_resched_softirq(), or by __do_softirq(),
132 * without processing still-pending softirqs:
133 */
134void _local_bh_enable(void)
135{
Frederic Weisbecker5d60d3e2013-09-24 04:11:35 +0200136 WARN_ON_ONCE(in_irq());
Venkatesh Pallipadi75e10562010-10-04 17:03:16 -0700137 __local_bh_enable(SOFTIRQ_DISABLE_OFFSET);
Ingo Molnarde30a2b2006-07-03 00:24:42 -0700138}
139
140EXPORT_SYMBOL(_local_bh_enable);
141
Peter Zijlstra0bd3a172013-11-19 16:13:38 +0100142void __local_bh_enable_ip(unsigned long ip, unsigned int cnt)
Ingo Molnarde30a2b2006-07-03 00:24:42 -0700143{
Johannes Berg0f476b6d2008-06-18 09:29:37 +0200144 WARN_ON_ONCE(in_irq() || irqs_disabled());
Tim Chen3c829c32006-07-30 03:04:02 -0700145#ifdef CONFIG_TRACE_IRQFLAGS
Johannes Berg0f476b6d2008-06-18 09:29:37 +0200146 local_irq_disable();
Tim Chen3c829c32006-07-30 03:04:02 -0700147#endif
Ingo Molnarde30a2b2006-07-03 00:24:42 -0700148 /*
149 * Are softirqs going to be turned on now:
150 */
Venkatesh Pallipadi75e10562010-10-04 17:03:16 -0700151 if (softirq_count() == SOFTIRQ_DISABLE_OFFSET)
Ingo Molnarde30a2b2006-07-03 00:24:42 -0700152 trace_softirqs_on(ip);
153 /*
154 * Keep preemption disabled until we are done with
155 * softirq processing:
156 */
Peter Zijlstra0bd3a172013-11-19 16:13:38 +0100157 preempt_count_sub(cnt - 1);
Ingo Molnarde30a2b2006-07-03 00:24:42 -0700158
Frederic Weisbecker0bed6982013-09-05 16:14:00 +0200159 if (unlikely(!in_interrupt() && local_softirq_pending())) {
160 /*
161 * Run softirq if any pending. And do it in its own stack
162 * as we may be calling this deep in a task call stack already.
163 */
Ingo Molnarde30a2b2006-07-03 00:24:42 -0700164 do_softirq();
Frederic Weisbecker0bed6982013-09-05 16:14:00 +0200165 }
Ingo Molnarde30a2b2006-07-03 00:24:42 -0700166
Peter Zijlstrabdb43802013-09-10 12:15:23 +0200167 preempt_count_dec();
Tim Chen3c829c32006-07-30 03:04:02 -0700168#ifdef CONFIG_TRACE_IRQFLAGS
Johannes Berg0f476b6d2008-06-18 09:29:37 +0200169 local_irq_enable();
Tim Chen3c829c32006-07-30 03:04:02 -0700170#endif
Ingo Molnarde30a2b2006-07-03 00:24:42 -0700171 preempt_check_resched();
172}
Peter Zijlstra0bd3a172013-11-19 16:13:38 +0100173EXPORT_SYMBOL(__local_bh_enable_ip);
Ingo Molnarde30a2b2006-07-03 00:24:42 -0700174
/*
 * We restart softirq processing at most MAX_SOFTIRQ_RESTART times,
 * but break the loop if need_resched() is set or after 2 ms.
 * MAX_SOFTIRQ_TIME provides a nice upper bound in most cases, but in
 * certain cases, such as stop_machine(), jiffies may cease to
 * increment, so we need the MAX_SOFTIRQ_RESTART limit as
 * well to make sure we eventually return from this method.
 *
 * These limits have been established via experimentation.
 * The two things to balance are latency and fairness -
 * we want to handle softirqs as soon as possible, but they
 * should not be able to lock up the box.
 */
#define MAX_SOFTIRQ_TIME  msecs_to_jiffies(2)
#define MAX_SOFTIRQ_RESTART 10
Linus Torvalds1da177e2005-04-16 15:20:36 -0700190
Peter Zijlstraf1a83e62013-11-19 16:42:47 +0100191#ifdef CONFIG_TRACE_IRQFLAGS
192/*
Peter Zijlstraf1a83e62013-11-19 16:42:47 +0100193 * When we run softirqs from irq_exit() and thus on the hardirq stack we need
194 * to keep the lockdep irq context tracking as tight as possible in order to
195 * not miss-qualify lock contexts and miss possible deadlocks.
196 */
Peter Zijlstraf1a83e62013-11-19 16:42:47 +0100197
Frederic Weisbecker5c4853b2013-11-20 01:07:34 +0100198static inline bool lockdep_softirq_start(void)
Peter Zijlstraf1a83e62013-11-19 16:42:47 +0100199{
Frederic Weisbecker5c4853b2013-11-20 01:07:34 +0100200 bool in_hardirq = false;
Peter Zijlstraf1a83e62013-11-19 16:42:47 +0100201
Frederic Weisbecker5c4853b2013-11-20 01:07:34 +0100202 if (trace_hardirq_context(current)) {
203 in_hardirq = true;
Peter Zijlstraf1a83e62013-11-19 16:42:47 +0100204 trace_hardirq_exit();
Frederic Weisbecker5c4853b2013-11-20 01:07:34 +0100205 }
206
Peter Zijlstraf1a83e62013-11-19 16:42:47 +0100207 lockdep_softirq_enter();
Frederic Weisbecker5c4853b2013-11-20 01:07:34 +0100208
209 return in_hardirq;
Peter Zijlstraf1a83e62013-11-19 16:42:47 +0100210}
211
Frederic Weisbecker5c4853b2013-11-20 01:07:34 +0100212static inline void lockdep_softirq_end(bool in_hardirq)
Peter Zijlstraf1a83e62013-11-19 16:42:47 +0100213{
214 lockdep_softirq_exit();
Peter Zijlstraf1a83e62013-11-19 16:42:47 +0100215
Frederic Weisbecker5c4853b2013-11-20 01:07:34 +0100216 if (in_hardirq)
217 trace_hardirq_enter();
218}
Peter Zijlstraf1a83e62013-11-19 16:42:47 +0100219#else
Frederic Weisbecker5c4853b2013-11-20 01:07:34 +0100220static inline bool lockdep_softirq_start(void) { return false; }
221static inline void lockdep_softirq_end(bool in_hardirq) { }
Peter Zijlstraf1a83e62013-11-19 16:42:47 +0100222#endif
223
Linus Torvalds1da177e2005-04-16 15:20:36 -0700224asmlinkage void __do_softirq(void)
225{
Eric Dumazetc10d7362013-01-10 15:26:34 -0800226 unsigned long end = jiffies + MAX_SOFTIRQ_TIME;
Mel Gorman907aed42012-07-31 16:44:07 -0700227 unsigned long old_flags = current->flags;
Ben Greear34376a52013-06-06 14:29:49 -0700228 int max_restart = MAX_SOFTIRQ_RESTART;
Peter Zijlstraf1a83e62013-11-19 16:42:47 +0100229 struct softirq_action *h;
Frederic Weisbecker5c4853b2013-11-20 01:07:34 +0100230 bool in_hardirq;
Peter Zijlstraf1a83e62013-11-19 16:42:47 +0100231 __u32 pending;
Joe Perches2e702b92014-01-27 17:07:14 -0800232 int softirq_bit;
Peter Zijlstraf1a83e62013-11-19 16:42:47 +0100233 int cpu;
Mel Gorman907aed42012-07-31 16:44:07 -0700234
235 /*
236 * Mask out PF_MEMALLOC s current task context is borrowed for the
237 * softirq. A softirq handled such as network RX might set PF_MEMALLOC
238 * again if the socket is related to swap
239 */
240 current->flags &= ~PF_MEMALLOC;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700241
242 pending = local_softirq_pending();
Frederic Weisbecker6a616712012-12-16 20:00:34 +0100243 account_irq_enter_time(current);
Paul Mackerras829035fd2006-07-03 00:25:40 -0700244
Peter Zijlstra0bd3a172013-11-19 16:13:38 +0100245 __local_bh_disable_ip(_RET_IP_, SOFTIRQ_OFFSET);
Frederic Weisbecker5c4853b2013-11-20 01:07:34 +0100246 in_hardirq = lockdep_softirq_start();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700247
Linus Torvalds1da177e2005-04-16 15:20:36 -0700248 cpu = smp_processor_id();
249restart:
250 /* Reset the pending bitmask before enabling irqs */
Andi Kleen3f744782005-09-12 18:49:24 +0200251 set_softirq_pending(0);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700252
Andrew Mortonc70f5d62005-07-30 10:22:49 -0700253 local_irq_enable();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700254
255 h = softirq_vec;
256
Joe Perches2e702b92014-01-27 17:07:14 -0800257 while ((softirq_bit = ffs(pending))) {
258 unsigned int vec_nr;
259 int prev_count;
Thomas Gleixner8e85b4b2008-10-02 10:50:53 +0200260
Joe Perches2e702b92014-01-27 17:07:14 -0800261 h += softirq_bit - 1;
Thomas Gleixnerf4bc6bb2010-10-19 15:00:13 +0200262
Joe Perches2e702b92014-01-27 17:07:14 -0800263 vec_nr = h - softirq_vec;
264 prev_count = preempt_count();
Thomas Gleixner8e85b4b2008-10-02 10:50:53 +0200265
Joe Perches2e702b92014-01-27 17:07:14 -0800266 kstat_incr_softirqs_this_cpu(vec_nr);
267
268 trace_softirq_entry(vec_nr);
269 h->action(h);
270 trace_softirq_exit(vec_nr);
271 if (unlikely(prev_count != preempt_count())) {
272 printk(KERN_ERR "huh, entered softirq %u %s %p with preempt_count %08x, exited with %08x?\n",
273 vec_nr, softirq_to_name[vec_nr], h->action,
274 prev_count, preempt_count());
275 preempt_count_set(prev_count);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700276 }
Joe Perches2e702b92014-01-27 17:07:14 -0800277 rcu_bh_qs(cpu);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700278 h++;
Joe Perches2e702b92014-01-27 17:07:14 -0800279 pending >>= softirq_bit;
280 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700281
Andrew Mortonc70f5d62005-07-30 10:22:49 -0700282 local_irq_disable();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700283
284 pending = local_softirq_pending();
Eric Dumazetc10d7362013-01-10 15:26:34 -0800285 if (pending) {
Ben Greear34376a52013-06-06 14:29:49 -0700286 if (time_before(jiffies, end) && !need_resched() &&
287 --max_restart)
Eric Dumazetc10d7362013-01-10 15:26:34 -0800288 goto restart;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700289
Linus Torvalds1da177e2005-04-16 15:20:36 -0700290 wakeup_softirqd();
Eric Dumazetc10d7362013-01-10 15:26:34 -0800291 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700292
Frederic Weisbecker5c4853b2013-11-20 01:07:34 +0100293 lockdep_softirq_end(in_hardirq);
Frederic Weisbecker6a616712012-12-16 20:00:34 +0100294 account_irq_exit_time(current);
Venkatesh Pallipadi75e10562010-10-04 17:03:16 -0700295 __local_bh_enable(SOFTIRQ_OFFSET);
Frederic Weisbecker5d60d3e2013-09-24 04:11:35 +0200296 WARN_ON_ONCE(in_interrupt());
Mel Gorman907aed42012-07-31 16:44:07 -0700297 tsk_restore_flags(current, old_flags, PF_MEMALLOC);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700298}
299
Linus Torvalds1da177e2005-04-16 15:20:36 -0700300asmlinkage void do_softirq(void)
301{
302 __u32 pending;
303 unsigned long flags;
304
305 if (in_interrupt())
306 return;
307
308 local_irq_save(flags);
309
310 pending = local_softirq_pending();
311
312 if (pending)
Frederic Weisbecker7d65f4a2013-09-05 15:49:45 +0200313 do_softirq_own_stack();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700314
315 local_irq_restore(flags);
316}
317
Ingo Molnardde4b2b2007-02-16 01:27:45 -0800318/*
319 * Enter an interrupt context.
320 */
321void irq_enter(void)
322{
Paul E. McKenney64db4cf2008-12-18 21:55:32 +0100323 rcu_irq_enter();
Frederic Weisbecker0a8a2e72012-01-24 18:59:44 +0100324 if (is_idle_task(current) && !in_interrupt()) {
Venkatesh Pallipadid267f872010-10-04 17:03:23 -0700325 /*
326 * Prevent raise_softirq from needlessly waking up ksoftirqd
327 * here, as softirq will be serviced on return from interrupt.
328 */
329 local_bh_disable();
Frederic Weisbeckere8fcaa52013-08-07 22:28:01 +0200330 tick_check_idle();
Venkatesh Pallipadid267f872010-10-04 17:03:23 -0700331 _local_bh_enable();
332 }
333
334 __irq_enter();
Ingo Molnardde4b2b2007-02-16 01:27:45 -0800335}
336
Heiko Carstensb2a00172012-03-05 15:07:25 -0800337static inline void invoke_softirq(void)
338{
Frederic Weisbeckerded79752013-09-24 00:50:25 +0200339 if (!force_irqthreads) {
Frederic Weisbeckercc1f0272013-09-24 17:17:47 +0200340#ifdef CONFIG_HAVE_IRQ_EXIT_ON_IRQ_STACK
Frederic Weisbeckerded79752013-09-24 00:50:25 +0200341 /*
342 * We can safely execute softirq on the current stack if
343 * it is the irq stack, because it should be near empty
Frederic Weisbeckercc1f0272013-09-24 17:17:47 +0200344 * at this stage.
345 */
346 __do_softirq();
347#else
348 /*
349 * Otherwise, irq_exit() is called on the task stack that can
350 * be potentially deep already. So call softirq in its own stack
351 * to prevent from any overrun.
Frederic Weisbeckerded79752013-09-24 00:50:25 +0200352 */
Frederic Weisbeckerbe6e1012013-09-24 16:39:41 +0200353 do_softirq_own_stack();
Frederic Weisbeckercc1f0272013-09-24 17:17:47 +0200354#endif
Frederic Weisbeckerded79752013-09-24 00:50:25 +0200355 } else {
Thomas Gleixner8d32a302011-02-23 23:52:23 +0000356 wakeup_softirqd();
Frederic Weisbeckerded79752013-09-24 00:50:25 +0200357 }
Thomas Gleixner8d32a302011-02-23 23:52:23 +0000358}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700359
/*
 * Notify the nohz code on interrupt exit. Compiles to nothing without
 * CONFIG_NO_HZ_COMMON.
 */
static inline void tick_irq_exit(void)
{
#ifdef CONFIG_NO_HZ_COMMON
	int cpu = smp_processor_id();

	/* Make sure that timer wheel updates are propagated */
	if (((idle_cpu(cpu) && !need_resched()) || tick_nohz_full_cpu(cpu)) &&
	    !in_interrupt())
		tick_nohz_irq_exit();
#endif
}
372
Linus Torvalds1da177e2005-04-16 15:20:36 -0700373/*
374 * Exit an interrupt context. Process softirqs if needed and possible:
375 */
376void irq_exit(void)
377{
Thomas Gleixner74eed012013-02-20 22:00:48 +0100378#ifndef __ARCH_IRQ_EXIT_IRQS_DISABLED
Frederic Weisbecker4cd5d112013-02-28 20:00:43 +0100379 local_irq_disable();
Thomas Gleixner74eed012013-02-20 22:00:48 +0100380#else
381 WARN_ON_ONCE(!irqs_disabled());
382#endif
383
Frederic Weisbecker6a616712012-12-16 20:00:34 +0100384 account_irq_exit_time(current);
Peter Zijlstrabdb43802013-09-10 12:15:23 +0200385 preempt_count_sub(HARDIRQ_OFFSET);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700386 if (!in_interrupt() && local_softirq_pending())
387 invoke_softirq();
Thomas Gleixner79bf2bb2007-02-16 01:28:03 -0800388
Frederic Weisbecker67826ea2013-04-20 17:43:13 +0200389 tick_irq_exit();
Frederic Weisbecker416eb332011-10-07 16:31:02 -0700390 rcu_irq_exit();
Peter Zijlstraf1a83e62013-11-19 16:42:47 +0100391 trace_hardirq_exit(); /* must be last! */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700392}
393
/*
 * Mark softirq @nr pending on this CPU.
 *
 * This function must run with irqs disabled!
 */
inline void raise_softirq_irqoff(unsigned int nr)
{
	__raise_softirq_irqoff(nr);

	/*
	 * If we're in an interrupt or softirq, we're done
	 * (this also catches softirq-disabled code). We will
	 * actually run the softirq once we return from
	 * the irq or softirq.
	 */
	if (in_interrupt())
		return;

	/*
	 * Otherwise we wake up ksoftirqd to make sure we
	 * schedule the softirq soon.
	 */
	wakeup_softirqd();
}
413
/*
 * Mark softirq @nr pending on this CPU. Interrupts are disabled around
 * the call to raise_softirq_irqoff() and restored afterwards.
 */
void raise_softirq(unsigned int nr)
{
	unsigned long irq_state;

	local_irq_save(irq_state);
	raise_softirq_irqoff(nr);
	local_irq_restore(irq_state);
}
422
/*
 * Emit the raise trace event for @nr and set its bit in the pending mask.
 * Does not wake ksoftirqd.
 */
void __raise_softirq_irqoff(unsigned int nr)
{
	trace_softirq_raise(nr);
	or_softirq_pending(1UL << nr);
}
428
Carlos R. Mafra962cf362008-05-15 11:15:37 -0300429void open_softirq(int nr, void (*action)(struct softirq_action *))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700430{
Linus Torvalds1da177e2005-04-16 15:20:36 -0700431 softirq_vec[nr].action = action;
432}
433
Peter Zijlstra9ba5f002009-07-22 14:18:35 +0200434/*
435 * Tasklets
436 */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700437struct tasklet_head
438{
Olof Johansson48f20a92008-03-04 15:23:25 -0800439 struct tasklet_struct *head;
440 struct tasklet_struct **tail;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700441};
442
Vegard Nossum4620b492008-06-12 23:21:53 +0200443static DEFINE_PER_CPU(struct tasklet_head, tasklet_vec);
444static DEFINE_PER_CPU(struct tasklet_head, tasklet_hi_vec);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700445
Harvey Harrison7ad5b3a2008-02-08 04:19:53 -0800446void __tasklet_schedule(struct tasklet_struct *t)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700447{
448 unsigned long flags;
449
450 local_irq_save(flags);
Olof Johansson48f20a92008-03-04 15:23:25 -0800451 t->next = NULL;
Christoph Lameter909ea962010-12-08 16:22:55 +0100452 *__this_cpu_read(tasklet_vec.tail) = t;
453 __this_cpu_write(tasklet_vec.tail, &(t->next));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700454 raise_softirq_irqoff(TASKLET_SOFTIRQ);
455 local_irq_restore(flags);
456}
457
458EXPORT_SYMBOL(__tasklet_schedule);
459
Harvey Harrison7ad5b3a2008-02-08 04:19:53 -0800460void __tasklet_hi_schedule(struct tasklet_struct *t)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700461{
462 unsigned long flags;
463
464 local_irq_save(flags);
Olof Johansson48f20a92008-03-04 15:23:25 -0800465 t->next = NULL;
Christoph Lameter909ea962010-12-08 16:22:55 +0100466 *__this_cpu_read(tasklet_hi_vec.tail) = t;
467 __this_cpu_write(tasklet_hi_vec.tail, &(t->next));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700468 raise_softirq_irqoff(HI_SOFTIRQ);
469 local_irq_restore(flags);
470}
471
472EXPORT_SYMBOL(__tasklet_hi_schedule);
473
Vegard Nossum7c692cb2008-05-21 22:53:13 +0200474void __tasklet_hi_schedule_first(struct tasklet_struct *t)
475{
476 BUG_ON(!irqs_disabled());
477
Christoph Lameter909ea962010-12-08 16:22:55 +0100478 t->next = __this_cpu_read(tasklet_hi_vec.head);
479 __this_cpu_write(tasklet_hi_vec.head, t);
Vegard Nossum7c692cb2008-05-21 22:53:13 +0200480 __raise_softirq_irqoff(HI_SOFTIRQ);
481}
482
483EXPORT_SYMBOL(__tasklet_hi_schedule_first);
484
Linus Torvalds1da177e2005-04-16 15:20:36 -0700485static void tasklet_action(struct softirq_action *a)
486{
487 struct tasklet_struct *list;
488
489 local_irq_disable();
Christoph Lameter909ea962010-12-08 16:22:55 +0100490 list = __this_cpu_read(tasklet_vec.head);
491 __this_cpu_write(tasklet_vec.head, NULL);
492 __this_cpu_write(tasklet_vec.tail, &__get_cpu_var(tasklet_vec).head);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700493 local_irq_enable();
494
495 while (list) {
496 struct tasklet_struct *t = list;
497
498 list = list->next;
499
500 if (tasklet_trylock(t)) {
501 if (!atomic_read(&t->count)) {
502 if (!test_and_clear_bit(TASKLET_STATE_SCHED, &t->state))
503 BUG();
504 t->func(t->data);
505 tasklet_unlock(t);
506 continue;
507 }
508 tasklet_unlock(t);
509 }
510
511 local_irq_disable();
Olof Johansson48f20a92008-03-04 15:23:25 -0800512 t->next = NULL;
Christoph Lameter909ea962010-12-08 16:22:55 +0100513 *__this_cpu_read(tasklet_vec.tail) = t;
514 __this_cpu_write(tasklet_vec.tail, &(t->next));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700515 __raise_softirq_irqoff(TASKLET_SOFTIRQ);
516 local_irq_enable();
517 }
518}
519
520static void tasklet_hi_action(struct softirq_action *a)
521{
522 struct tasklet_struct *list;
523
524 local_irq_disable();
Christoph Lameter909ea962010-12-08 16:22:55 +0100525 list = __this_cpu_read(tasklet_hi_vec.head);
526 __this_cpu_write(tasklet_hi_vec.head, NULL);
527 __this_cpu_write(tasklet_hi_vec.tail, &__get_cpu_var(tasklet_hi_vec).head);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700528 local_irq_enable();
529
530 while (list) {
531 struct tasklet_struct *t = list;
532
533 list = list->next;
534
535 if (tasklet_trylock(t)) {
536 if (!atomic_read(&t->count)) {
537 if (!test_and_clear_bit(TASKLET_STATE_SCHED, &t->state))
538 BUG();
539 t->func(t->data);
540 tasklet_unlock(t);
541 continue;
542 }
543 tasklet_unlock(t);
544 }
545
546 local_irq_disable();
Olof Johansson48f20a92008-03-04 15:23:25 -0800547 t->next = NULL;
Christoph Lameter909ea962010-12-08 16:22:55 +0100548 *__this_cpu_read(tasklet_hi_vec.tail) = t;
549 __this_cpu_write(tasklet_hi_vec.tail, &(t->next));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700550 __raise_softirq_irqoff(HI_SOFTIRQ);
551 local_irq_enable();
552 }
553}
554
555
556void tasklet_init(struct tasklet_struct *t,
557 void (*func)(unsigned long), unsigned long data)
558{
559 t->next = NULL;
560 t->state = 0;
561 atomic_set(&t->count, 0);
562 t->func = func;
563 t->data = data;
564}
565
566EXPORT_SYMBOL(tasklet_init);
567
568void tasklet_kill(struct tasklet_struct *t)
569{
570 if (in_interrupt())
571 printk("Attempt to kill tasklet from interrupt\n");
572
573 while (test_and_set_bit(TASKLET_STATE_SCHED, &t->state)) {
H Hartley Sweeten79d381c2009-04-16 19:30:18 -0400574 do {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700575 yield();
H Hartley Sweeten79d381c2009-04-16 19:30:18 -0400576 } while (test_bit(TASKLET_STATE_SCHED, &t->state));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700577 }
578 tasklet_unlock_wait(t);
579 clear_bit(TASKLET_STATE_SCHED, &t->state);
580}
581
582EXPORT_SYMBOL(tasklet_kill);
583
/*
 * tasklet_hrtimer
 */
587
588/*
Peter Zijlstrab9c30322010-02-03 18:08:52 +0100589 * The trampoline is called when the hrtimer expires. It schedules a tasklet
590 * to run __tasklet_hrtimer_trampoline() which in turn will call the intended
591 * hrtimer callback, but from softirq context.
Peter Zijlstra9ba5f002009-07-22 14:18:35 +0200592 */
593static enum hrtimer_restart __hrtimer_tasklet_trampoline(struct hrtimer *timer)
594{
595 struct tasklet_hrtimer *ttimer =
596 container_of(timer, struct tasklet_hrtimer, timer);
597
Peter Zijlstrab9c30322010-02-03 18:08:52 +0100598 tasklet_hi_schedule(&ttimer->tasklet);
599 return HRTIMER_NORESTART;
Peter Zijlstra9ba5f002009-07-22 14:18:35 +0200600}
601
602/*
603 * Helper function which calls the hrtimer callback from
604 * tasklet/softirq context
605 */
606static void __tasklet_hrtimer_trampoline(unsigned long data)
607{
608 struct tasklet_hrtimer *ttimer = (void *)data;
609 enum hrtimer_restart restart;
610
611 restart = ttimer->function(&ttimer->timer);
612 if (restart != HRTIMER_NORESTART)
613 hrtimer_restart(&ttimer->timer);
614}
615
616/**
617 * tasklet_hrtimer_init - Init a tasklet/hrtimer combo for softirq callbacks
618 * @ttimer: tasklet_hrtimer which is initialized
Lucas De Marchi25985ed2011-03-30 22:57:33 -0300619 * @function: hrtimer callback function which gets called from softirq context
Peter Zijlstra9ba5f002009-07-22 14:18:35 +0200620 * @which_clock: clock id (CLOCK_MONOTONIC/CLOCK_REALTIME)
621 * @mode: hrtimer mode (HRTIMER_MODE_ABS/HRTIMER_MODE_REL)
622 */
623void tasklet_hrtimer_init(struct tasklet_hrtimer *ttimer,
624 enum hrtimer_restart (*function)(struct hrtimer *),
625 clockid_t which_clock, enum hrtimer_mode mode)
626{
627 hrtimer_init(&ttimer->timer, which_clock, mode);
628 ttimer->timer.function = __hrtimer_tasklet_trampoline;
629 tasklet_init(&ttimer->tasklet, __tasklet_hrtimer_trampoline,
630 (unsigned long)ttimer);
631 ttimer->function = function;
632}
633EXPORT_SYMBOL_GPL(tasklet_hrtimer_init);
634
Linus Torvalds1da177e2005-04-16 15:20:36 -0700635void __init softirq_init(void)
636{
Olof Johansson48f20a92008-03-04 15:23:25 -0800637 int cpu;
638
639 for_each_possible_cpu(cpu) {
640 per_cpu(tasklet_vec, cpu).tail =
641 &per_cpu(tasklet_vec, cpu).head;
642 per_cpu(tasklet_hi_vec, cpu).tail =
643 &per_cpu(tasklet_hi_vec, cpu).head;
644 }
645
Carlos R. Mafra962cf362008-05-15 11:15:37 -0300646 open_softirq(TASKLET_SOFTIRQ, tasklet_action);
647 open_softirq(HI_SOFTIRQ, tasklet_hi_action);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700648}
649
/*
 * thread_should_run callback of softirq_threads: non-zero when softirqs
 * are pending on the local CPU. @cpu is not used.
 */
static int ksoftirqd_should_run(unsigned int cpu)
{
	return local_softirq_pending();
}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700654
/*
 * thread_fn callback of softirq_threads: process the softirqs pending on
 * this CPU, if any, then offer to reschedule.
 */
static void run_ksoftirqd(unsigned int cpu)
{
	local_irq_disable();

	if (!local_softirq_pending()) {
		local_irq_enable();
		return;
	}

	/*
	 * We can safely run softirq on inline stack, as we are not deep
	 * in the task stack here.
	 */
	__do_softirq();
	rcu_note_context_switch(cpu);
	local_irq_enable();
	cond_resched();
}
671
672#ifdef CONFIG_HOTPLUG_CPU
673/*
674 * tasklet_kill_immediate is called to remove a tasklet which can already be
675 * scheduled for execution on @cpu.
676 *
677 * Unlike tasklet_kill, this function removes the tasklet
678 * _immediately_, even if the tasklet is in TASKLET_STATE_SCHED state.
679 *
680 * When this function is called, @cpu must be in the CPU_DEAD state.
681 */
682void tasklet_kill_immediate(struct tasklet_struct *t, unsigned int cpu)
683{
684 struct tasklet_struct **i;
685
686 BUG_ON(cpu_online(cpu));
687 BUG_ON(test_bit(TASKLET_STATE_RUN, &t->state));
688
689 if (!test_bit(TASKLET_STATE_SCHED, &t->state))
690 return;
691
692 /* CPU is dead, so no lock needed. */
Olof Johansson48f20a92008-03-04 15:23:25 -0800693 for (i = &per_cpu(tasklet_vec, cpu).head; *i; i = &(*i)->next) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700694 if (*i == t) {
695 *i = t->next;
Olof Johansson48f20a92008-03-04 15:23:25 -0800696 /* If this was the tail element, move the tail ptr */
697 if (*i == NULL)
698 per_cpu(tasklet_vec, cpu).tail = i;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700699 return;
700 }
701 }
702 BUG();
703}
704
705static void takeover_tasklets(unsigned int cpu)
706{
Linus Torvalds1da177e2005-04-16 15:20:36 -0700707 /* CPU is dead, so no lock needed. */
708 local_irq_disable();
709
710 /* Find end, append list for that CPU. */
Christian Borntraegere5e41722008-05-01 04:34:23 -0700711 if (&per_cpu(tasklet_vec, cpu).head != per_cpu(tasklet_vec, cpu).tail) {
Christoph Lameter909ea962010-12-08 16:22:55 +0100712 *__this_cpu_read(tasklet_vec.tail) = per_cpu(tasklet_vec, cpu).head;
713 this_cpu_write(tasklet_vec.tail, per_cpu(tasklet_vec, cpu).tail);
Christian Borntraegere5e41722008-05-01 04:34:23 -0700714 per_cpu(tasklet_vec, cpu).head = NULL;
715 per_cpu(tasklet_vec, cpu).tail = &per_cpu(tasklet_vec, cpu).head;
716 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700717 raise_softirq_irqoff(TASKLET_SOFTIRQ);
718
Christian Borntraegere5e41722008-05-01 04:34:23 -0700719 if (&per_cpu(tasklet_hi_vec, cpu).head != per_cpu(tasklet_hi_vec, cpu).tail) {
Christoph Lameter909ea962010-12-08 16:22:55 +0100720 *__this_cpu_read(tasklet_hi_vec.tail) = per_cpu(tasklet_hi_vec, cpu).head;
721 __this_cpu_write(tasklet_hi_vec.tail, per_cpu(tasklet_hi_vec, cpu).tail);
Christian Borntraegere5e41722008-05-01 04:34:23 -0700722 per_cpu(tasklet_hi_vec, cpu).head = NULL;
723 per_cpu(tasklet_hi_vec, cpu).tail = &per_cpu(tasklet_hi_vec, cpu).head;
724 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700725 raise_softirq_irqoff(HI_SOFTIRQ);
726
727 local_irq_enable();
728}
729#endif /* CONFIG_HOTPLUG_CPU */
730
Paul Gortmaker0db06282013-06-19 14:53:51 -0400731static int cpu_callback(struct notifier_block *nfb,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700732 unsigned long action,
733 void *hcpu)
734{
Linus Torvalds1da177e2005-04-16 15:20:36 -0700735 switch (action) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700736#ifdef CONFIG_HOTPLUG_CPU
Linus Torvalds1da177e2005-04-16 15:20:36 -0700737 case CPU_DEAD:
Thomas Gleixner3e339b52012-07-16 10:42:37 +0000738 case CPU_DEAD_FROZEN:
739 takeover_tasklets((unsigned long)hcpu);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700740 break;
741#endif /* CONFIG_HOTPLUG_CPU */
Thomas Gleixner3e339b52012-07-16 10:42:37 +0000742 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700743 return NOTIFY_OK;
744}
745
Paul Gortmaker0db06282013-06-19 14:53:51 -0400746static struct notifier_block cpu_nfb = {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700747 .notifier_call = cpu_callback
748};
749
Thomas Gleixner3e339b52012-07-16 10:42:37 +0000750static struct smp_hotplug_thread softirq_threads = {
751 .store = &ksoftirqd,
752 .thread_should_run = ksoftirqd_should_run,
753 .thread_fn = run_ksoftirqd,
754 .thread_comm = "ksoftirqd/%u",
755};
756
Eduard - Gabriel Munteanu7babe8d2008-07-25 19:45:11 -0700757static __init int spawn_ksoftirqd(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700758{
Linus Torvalds1da177e2005-04-16 15:20:36 -0700759 register_cpu_notifier(&cpu_nfb);
Thomas Gleixner3e339b52012-07-16 10:42:37 +0000760
761 BUG_ON(smpboot_register_percpu_thread(&softirq_threads));
762
Linus Torvalds1da177e2005-04-16 15:20:36 -0700763 return 0;
764}
Eduard - Gabriel Munteanu7babe8d2008-07-25 19:45:11 -0700765early_initcall(spawn_ksoftirqd);
Andrew Morton78eef012006-03-22 00:08:16 -0800766
Yinghai Lu43a25632008-12-28 16:01:13 -0800767/*
768 * [ These __weak aliases are kept in a separate compilation unit, so that
769 * GCC does not inline them incorrectly. ]
770 */
771
772int __init __weak early_irq_init(void)
773{
774 return 0;
775}
776
Yinghai Lu4a046d12009-01-12 17:39:24 -0800777int __init __weak arch_probe_nr_irqs(void)
778{
Thomas Gleixnerb683de22010-09-27 20:55:03 +0200779 return NR_IRQS_LEGACY;
Yinghai Lu4a046d12009-01-12 17:39:24 -0800780}
781
Yinghai Lu43a25632008-12-28 16:01:13 -0800782int __init __weak arch_early_irq_init(void)
783{
784 return 0;
785}