blob: 7ab9dfd8d0820c4dc2bbbcec9522e61a8be71b6e [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001/*
2 * linux/kernel/softirq.c
3 *
4 * Copyright (C) 1992 Linus Torvalds
5 *
Pavel Machekb10db7f2008-01-30 13:30:00 +01006 * Distribute under GPLv2.
7 *
8 * Rewritten. Old one was good in 2.2, but in 2.3 it was immoral. --ANK (990903)
David S. Miller54514a72008-09-23 22:15:57 -07009 *
10 * Remote softirq infrastructure is by Jens Axboe.
Linus Torvalds1da177e2005-04-16 15:20:36 -070011 */
12
13#include <linux/module.h>
14#include <linux/kernel_stat.h>
15#include <linux/interrupt.h>
16#include <linux/init.h>
17#include <linux/mm.h>
18#include <linux/notifier.h>
19#include <linux/percpu.h>
20#include <linux/cpu.h>
Rafael J. Wysocki83144182007-07-17 04:03:35 -070021#include <linux/freezer.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070022#include <linux/kthread.h>
23#include <linux/rcupdate.h>
Steven Rostedt7e49fcc2009-01-22 19:01:40 -050024#include <linux/ftrace.h>
Andrew Morton78eef012006-03-22 00:08:16 -080025#include <linux/smp.h>
Thomas Gleixner79bf2bb2007-02-16 01:28:03 -080026#include <linux/tick.h>
Steven Rostedtad8d75f2009-04-14 19:39:12 -040027#include <trace/events/irq.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070028
29#include <asm/irq.h>
/*
   - No shared variables, all the data are CPU local.
   - If a softirq needs serialization, let it serialize itself
     by its own spinlocks.
   - Even if a softirq is serialized, only the local cpu is marked for
     execution. Hence, we get a sort of weak cpu binding.
     It is still not clear whether this results in better locality
     or not.

   Examples:
   - NET RX softirq. It is multithreaded and does not require
     any global serialization.
   - NET TX softirq. It kicks software netdevice queues, hence
     it is logically serialized per device, but this serialization
     is invisible to common code.
   - Tasklets: each tasklet is serialized with respect to itself.
 */
47
48#ifndef __ARCH_IRQ_STAT
49irq_cpustat_t irq_stat[NR_CPUS] ____cacheline_aligned;
50EXPORT_SYMBOL(irq_stat);
51#endif
52
Alexey Dobriyan978b0112008-09-06 20:04:36 +020053static struct softirq_action softirq_vec[NR_SOFTIRQS] __cacheline_aligned_in_smp;
Linus Torvalds1da177e2005-04-16 15:20:36 -070054
55static DEFINE_PER_CPU(struct task_struct *, ksoftirqd);
56
Jason Baron5d592b42009-03-12 14:33:36 -040057char *softirq_to_name[NR_SOFTIRQS] = {
Steven Rostedt899039e2009-03-13 00:43:33 -040058 "HI", "TIMER", "NET_TX", "NET_RX", "BLOCK",
59 "TASKLET", "SCHED", "HRTIMER", "RCU"
Jason Baron5d592b42009-03-12 14:33:36 -040060};
61
Linus Torvalds1da177e2005-04-16 15:20:36 -070062/*
63 * we cannot loop indefinitely here to avoid userspace starvation,
64 * but we also don't want to introduce a worst case 1/HZ latency
65 * to the pending events, so lets the scheduler to balance
66 * the softirq load for us.
67 */
Peter Zijlstra7f1e2ca2009-03-13 12:21:27 +010068void wakeup_softirqd(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -070069{
70 /* Interrupts are disabled: no need to stop preemption */
71 struct task_struct *tsk = __get_cpu_var(ksoftirqd);
72
73 if (tsk && tsk->state != TASK_RUNNING)
74 wake_up_process(tsk);
75}
76
77/*
Ingo Molnarde30a2b2006-07-03 00:24:42 -070078 * This one is for softirq.c-internal use,
79 * where hardirqs are disabled legitimately:
80 */
Tim Chen3c829c32006-07-30 03:04:02 -070081#ifdef CONFIG_TRACE_IRQFLAGS
Ingo Molnarde30a2b2006-07-03 00:24:42 -070082static void __local_bh_disable(unsigned long ip)
83{
84 unsigned long flags;
85
86 WARN_ON_ONCE(in_irq());
87
88 raw_local_irq_save(flags);
Steven Rostedt7e49fcc2009-01-22 19:01:40 -050089 /*
90 * The preempt tracer hooks into add_preempt_count and will break
91 * lockdep because it calls back into lockdep after SOFTIRQ_OFFSET
92 * is set and before current->softirq_enabled is cleared.
93 * We must manually increment preempt_count here and manually
94 * call the trace_preempt_off later.
95 */
96 preempt_count() += SOFTIRQ_OFFSET;
Ingo Molnarde30a2b2006-07-03 00:24:42 -070097 /*
98 * Were softirqs turned off above:
99 */
100 if (softirq_count() == SOFTIRQ_OFFSET)
101 trace_softirqs_off(ip);
102 raw_local_irq_restore(flags);
Steven Rostedt7e49fcc2009-01-22 19:01:40 -0500103
104 if (preempt_count() == SOFTIRQ_OFFSET)
105 trace_preempt_off(CALLER_ADDR0, get_parent_ip(CALLER_ADDR1));
Ingo Molnarde30a2b2006-07-03 00:24:42 -0700106}
Tim Chen3c829c32006-07-30 03:04:02 -0700107#else /* !CONFIG_TRACE_IRQFLAGS */
108static inline void __local_bh_disable(unsigned long ip)
109{
110 add_preempt_count(SOFTIRQ_OFFSET);
111 barrier();
112}
113#endif /* CONFIG_TRACE_IRQFLAGS */
Ingo Molnarde30a2b2006-07-03 00:24:42 -0700114
/*
 * Disable softirq processing, recording our caller's address for the
 * softirq tracing done by __local_bh_disable().
 */
void local_bh_disable(void)
{
	unsigned long caller = (unsigned long)__builtin_return_address(0);

	__local_bh_disable(caller);
}
EXPORT_SYMBOL(local_bh_disable);
121
Ingo Molnarde30a2b2006-07-03 00:24:42 -0700122/*
123 * Special-case - softirqs can safely be enabled in
124 * cond_resched_softirq(), or by __do_softirq(),
125 * without processing still-pending softirqs:
126 */
127void _local_bh_enable(void)
128{
129 WARN_ON_ONCE(in_irq());
130 WARN_ON_ONCE(!irqs_disabled());
131
132 if (softirq_count() == SOFTIRQ_OFFSET)
133 trace_softirqs_on((unsigned long)__builtin_return_address(0));
134 sub_preempt_count(SOFTIRQ_OFFSET);
135}
136
137EXPORT_SYMBOL(_local_bh_enable);
138
Johannes Berg0f476b6d2008-06-18 09:29:37 +0200139static inline void _local_bh_enable_ip(unsigned long ip)
Ingo Molnarde30a2b2006-07-03 00:24:42 -0700140{
Johannes Berg0f476b6d2008-06-18 09:29:37 +0200141 WARN_ON_ONCE(in_irq() || irqs_disabled());
Tim Chen3c829c32006-07-30 03:04:02 -0700142#ifdef CONFIG_TRACE_IRQFLAGS
Johannes Berg0f476b6d2008-06-18 09:29:37 +0200143 local_irq_disable();
Tim Chen3c829c32006-07-30 03:04:02 -0700144#endif
Ingo Molnarde30a2b2006-07-03 00:24:42 -0700145 /*
146 * Are softirqs going to be turned on now:
147 */
148 if (softirq_count() == SOFTIRQ_OFFSET)
149 trace_softirqs_on(ip);
150 /*
151 * Keep preemption disabled until we are done with
152 * softirq processing:
153 */
154 sub_preempt_count(SOFTIRQ_OFFSET - 1);
155
156 if (unlikely(!in_interrupt() && local_softirq_pending()))
157 do_softirq();
158
159 dec_preempt_count();
Tim Chen3c829c32006-07-30 03:04:02 -0700160#ifdef CONFIG_TRACE_IRQFLAGS
Johannes Berg0f476b6d2008-06-18 09:29:37 +0200161 local_irq_enable();
Tim Chen3c829c32006-07-30 03:04:02 -0700162#endif
Ingo Molnarde30a2b2006-07-03 00:24:42 -0700163 preempt_check_resched();
164}
Johannes Berg0f476b6d2008-06-18 09:29:37 +0200165
/*
 * Re-enable softirqs, using our caller's address for tracing.
 */
void local_bh_enable(void)
{
	unsigned long caller = (unsigned long)__builtin_return_address(0);

	_local_bh_enable_ip(caller);
}
EXPORT_SYMBOL(local_bh_enable);
171
/*
 * Same as local_bh_enable(), but the traced address @ip is supplied
 * by the caller.
 */
void local_bh_enable_ip(unsigned long ip)
{
	_local_bh_enable_ip(ip);
}
EXPORT_SYMBOL(local_bh_enable_ip);
177
178/*
Linus Torvalds1da177e2005-04-16 15:20:36 -0700179 * We restart softirq processing MAX_SOFTIRQ_RESTART times,
180 * and we fall back to softirqd after that.
181 *
182 * This number has been established via experimentation.
183 * The two things to balance is latency against fairness -
184 * we want to handle softirqs as soon as possible, but they
185 * should not be able to lock up the box.
186 */
187#define MAX_SOFTIRQ_RESTART 10
188
189asmlinkage void __do_softirq(void)
190{
191 struct softirq_action *h;
192 __u32 pending;
193 int max_restart = MAX_SOFTIRQ_RESTART;
194 int cpu;
195
196 pending = local_softirq_pending();
Paul Mackerras829035fd2006-07-03 00:25:40 -0700197 account_system_vtime(current);
198
Ingo Molnarde30a2b2006-07-03 00:24:42 -0700199 __local_bh_disable((unsigned long)__builtin_return_address(0));
Ingo Molnard820ac42009-03-13 01:30:40 +0100200 lockdep_softirq_enter();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700201
Linus Torvalds1da177e2005-04-16 15:20:36 -0700202 cpu = smp_processor_id();
203restart:
204 /* Reset the pending bitmask before enabling irqs */
Andi Kleen3f744782005-09-12 18:49:24 +0200205 set_softirq_pending(0);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700206
Andrew Mortonc70f5d62005-07-30 10:22:49 -0700207 local_irq_enable();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700208
209 h = softirq_vec;
210
211 do {
212 if (pending & 1) {
Thomas Gleixner8e85b4b2008-10-02 10:50:53 +0200213 int prev_count = preempt_count();
214
Jason Baron39842322009-03-12 14:36:03 -0400215 trace_softirq_entry(h, softirq_vec);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700216 h->action(h);
Jason Baron39842322009-03-12 14:36:03 -0400217 trace_softirq_exit(h, softirq_vec);
Thomas Gleixner8e85b4b2008-10-02 10:50:53 +0200218 if (unlikely(prev_count != preempt_count())) {
Jason Baron5d592b42009-03-12 14:33:36 -0400219 printk(KERN_ERR "huh, entered softirq %td %s %p"
Thomas Gleixner8e85b4b2008-10-02 10:50:53 +0200220 "with preempt_count %08x,"
221 " exited with %08x?\n", h - softirq_vec,
Jason Baron5d592b42009-03-12 14:33:36 -0400222 softirq_to_name[h - softirq_vec],
Thomas Gleixner8e85b4b2008-10-02 10:50:53 +0200223 h->action, prev_count, preempt_count());
224 preempt_count() = prev_count;
225 }
226
Linus Torvalds1da177e2005-04-16 15:20:36 -0700227 rcu_bh_qsctr_inc(cpu);
228 }
229 h++;
230 pending >>= 1;
231 } while (pending);
232
Andrew Mortonc70f5d62005-07-30 10:22:49 -0700233 local_irq_disable();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700234
235 pending = local_softirq_pending();
236 if (pending && --max_restart)
237 goto restart;
238
239 if (pending)
240 wakeup_softirqd();
241
Ingo Molnard820ac42009-03-13 01:30:40 +0100242 lockdep_softirq_exit();
Paul Mackerras829035fd2006-07-03 00:25:40 -0700243
244 account_system_vtime(current);
Ingo Molnarde30a2b2006-07-03 00:24:42 -0700245 _local_bh_enable();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700246}
247
248#ifndef __ARCH_HAS_DO_SOFTIRQ
249
250asmlinkage void do_softirq(void)
251{
252 __u32 pending;
253 unsigned long flags;
254
255 if (in_interrupt())
256 return;
257
258 local_irq_save(flags);
259
260 pending = local_softirq_pending();
261
262 if (pending)
263 __do_softirq();
264
265 local_irq_restore(flags);
266}
267
Linus Torvalds1da177e2005-04-16 15:20:36 -0700268#endif
269
/*
 * Enter an interrupt context.
 *
 * If the CPU was idle and we were not already in interrupt context,
 * tick_check_idle() is called once the context has been entered.
 */
void irq_enter(void)
{
	int cpu = smp_processor_id();
	int from_idle;

	rcu_irq_enter();

	/* Sample before __irq_enter(): it changes what in_interrupt() says. */
	from_idle = idle_cpu(cpu) && !in_interrupt();

	__irq_enter();
	if (from_idle)
		tick_check_idle(cpu);
}
284
Linus Torvalds1da177e2005-04-16 15:20:36 -0700285#ifdef __ARCH_IRQ_EXIT_IRQS_DISABLED
286# define invoke_softirq() __do_softirq()
287#else
288# define invoke_softirq() do_softirq()
289#endif
290
291/*
292 * Exit an interrupt context. Process softirqs if needed and possible:
293 */
294void irq_exit(void)
295{
296 account_system_vtime(current);
Ingo Molnarde30a2b2006-07-03 00:24:42 -0700297 trace_hardirq_exit();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700298 sub_preempt_count(IRQ_EXIT_OFFSET);
299 if (!in_interrupt() && local_softirq_pending())
300 invoke_softirq();
Thomas Gleixner79bf2bb2007-02-16 01:28:03 -0800301
302#ifdef CONFIG_NO_HZ
303 /* Make sure that timer wheel updates are propagated */
Steven Rostedt2232c2d2008-02-29 18:46:50 +0100304 rcu_irq_exit();
Paul E. McKenney64db4cf2008-12-18 21:55:32 +0100305 if (idle_cpu(smp_processor_id()) && !in_interrupt() && !need_resched())
306 tick_nohz_stop_sched_tick(0);
Thomas Gleixner79bf2bb2007-02-16 01:28:03 -0800307#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700308 preempt_enable_no_resched();
309}
310
/*
 * Mark softirq @nr pending on this CPU.
 *
 * This function must run with irqs disabled!
 */
inline void raise_softirq_irqoff(unsigned int nr)
{
	__raise_softirq_irqoff(nr);

	/*
	 * If we're in an interrupt or softirq, we're done
	 * (this also catches softirq-disabled code). We will
	 * actually run the softirq once we return from
	 * the irq or softirq.
	 */
	if (in_interrupt())
		return;

	/*
	 * Otherwise we wake up ksoftirqd to make sure we
	 * schedule the softirq soon.
	 */
	wakeup_softirqd();
}
330
/*
 * Mark softirq @nr pending; usable with interrupts in any state since
 * the irq state is saved and restored around raise_softirq_irqoff().
 */
void raise_softirq(unsigned int nr)
{
	unsigned long irq_state;

	local_irq_save(irq_state);
	raise_softirq_irqoff(nr);
	local_irq_restore(irq_state);
}
339
Carlos R. Mafra962cf362008-05-15 11:15:37 -0300340void open_softirq(int nr, void (*action)(struct softirq_action *))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700341{
Linus Torvalds1da177e2005-04-16 15:20:36 -0700342 softirq_vec[nr].action = action;
343}
344
Linus Torvalds1da177e2005-04-16 15:20:36 -0700345/* Tasklets */
346struct tasklet_head
347{
Olof Johansson48f20a92008-03-04 15:23:25 -0800348 struct tasklet_struct *head;
349 struct tasklet_struct **tail;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700350};
351
Vegard Nossum4620b492008-06-12 23:21:53 +0200352static DEFINE_PER_CPU(struct tasklet_head, tasklet_vec);
353static DEFINE_PER_CPU(struct tasklet_head, tasklet_hi_vec);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700354
Harvey Harrison7ad5b3a2008-02-08 04:19:53 -0800355void __tasklet_schedule(struct tasklet_struct *t)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700356{
357 unsigned long flags;
358
359 local_irq_save(flags);
Olof Johansson48f20a92008-03-04 15:23:25 -0800360 t->next = NULL;
361 *__get_cpu_var(tasklet_vec).tail = t;
362 __get_cpu_var(tasklet_vec).tail = &(t->next);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700363 raise_softirq_irqoff(TASKLET_SOFTIRQ);
364 local_irq_restore(flags);
365}
366
367EXPORT_SYMBOL(__tasklet_schedule);
368
Harvey Harrison7ad5b3a2008-02-08 04:19:53 -0800369void __tasklet_hi_schedule(struct tasklet_struct *t)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700370{
371 unsigned long flags;
372
373 local_irq_save(flags);
Olof Johansson48f20a92008-03-04 15:23:25 -0800374 t->next = NULL;
375 *__get_cpu_var(tasklet_hi_vec).tail = t;
376 __get_cpu_var(tasklet_hi_vec).tail = &(t->next);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700377 raise_softirq_irqoff(HI_SOFTIRQ);
378 local_irq_restore(flags);
379}
380
381EXPORT_SYMBOL(__tasklet_hi_schedule);
382
383static void tasklet_action(struct softirq_action *a)
384{
385 struct tasklet_struct *list;
386
387 local_irq_disable();
Olof Johansson48f20a92008-03-04 15:23:25 -0800388 list = __get_cpu_var(tasklet_vec).head;
389 __get_cpu_var(tasklet_vec).head = NULL;
390 __get_cpu_var(tasklet_vec).tail = &__get_cpu_var(tasklet_vec).head;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700391 local_irq_enable();
392
393 while (list) {
394 struct tasklet_struct *t = list;
395
396 list = list->next;
397
398 if (tasklet_trylock(t)) {
399 if (!atomic_read(&t->count)) {
400 if (!test_and_clear_bit(TASKLET_STATE_SCHED, &t->state))
401 BUG();
402 t->func(t->data);
403 tasklet_unlock(t);
404 continue;
405 }
406 tasklet_unlock(t);
407 }
408
409 local_irq_disable();
Olof Johansson48f20a92008-03-04 15:23:25 -0800410 t->next = NULL;
411 *__get_cpu_var(tasklet_vec).tail = t;
412 __get_cpu_var(tasklet_vec).tail = &(t->next);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700413 __raise_softirq_irqoff(TASKLET_SOFTIRQ);
414 local_irq_enable();
415 }
416}
417
418static void tasklet_hi_action(struct softirq_action *a)
419{
420 struct tasklet_struct *list;
421
422 local_irq_disable();
Olof Johansson48f20a92008-03-04 15:23:25 -0800423 list = __get_cpu_var(tasklet_hi_vec).head;
424 __get_cpu_var(tasklet_hi_vec).head = NULL;
425 __get_cpu_var(tasklet_hi_vec).tail = &__get_cpu_var(tasklet_hi_vec).head;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700426 local_irq_enable();
427
428 while (list) {
429 struct tasklet_struct *t = list;
430
431 list = list->next;
432
433 if (tasklet_trylock(t)) {
434 if (!atomic_read(&t->count)) {
435 if (!test_and_clear_bit(TASKLET_STATE_SCHED, &t->state))
436 BUG();
437 t->func(t->data);
438 tasklet_unlock(t);
439 continue;
440 }
441 tasklet_unlock(t);
442 }
443
444 local_irq_disable();
Olof Johansson48f20a92008-03-04 15:23:25 -0800445 t->next = NULL;
446 *__get_cpu_var(tasklet_hi_vec).tail = t;
447 __get_cpu_var(tasklet_hi_vec).tail = &(t->next);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700448 __raise_softirq_irqoff(HI_SOFTIRQ);
449 local_irq_enable();
450 }
451}
452
453
454void tasklet_init(struct tasklet_struct *t,
455 void (*func)(unsigned long), unsigned long data)
456{
457 t->next = NULL;
458 t->state = 0;
459 atomic_set(&t->count, 0);
460 t->func = func;
461 t->data = data;
462}
463
464EXPORT_SYMBOL(tasklet_init);
465
466void tasklet_kill(struct tasklet_struct *t)
467{
468 if (in_interrupt())
469 printk("Attempt to kill tasklet from interrupt\n");
470
471 while (test_and_set_bit(TASKLET_STATE_SCHED, &t->state)) {
472 do
473 yield();
474 while (test_bit(TASKLET_STATE_SCHED, &t->state));
475 }
476 tasklet_unlock_wait(t);
477 clear_bit(TASKLET_STATE_SCHED, &t->state);
478}
479
480EXPORT_SYMBOL(tasklet_kill);
481
David S. Miller54514a72008-09-23 22:15:57 -0700482DEFINE_PER_CPU(struct list_head [NR_SOFTIRQS], softirq_work_list);
483EXPORT_PER_CPU_SYMBOL(softirq_work_list);
484
485static void __local_trigger(struct call_single_data *cp, int softirq)
486{
487 struct list_head *head = &__get_cpu_var(softirq_work_list[softirq]);
488
489 list_add_tail(&cp->list, head);
490
491 /* Trigger the softirq only if the list was previously empty. */
492 if (head->next == &cp->list)
493 raise_softirq_irqoff(softirq);
494}
495
#ifdef CONFIG_USE_GENERIC_SMP_HELPERS
/*
 * Callback installed by __try_remote_softirq(): queue the work on the
 * CPU this runs on, for the softirq number stored in cp->priv.
 */
static void remote_softirq_receive(void *data)
{
	struct call_single_data *cp = data;
	int softirq = cp->priv;
	unsigned long irq_state;

	local_irq_save(irq_state);
	__local_trigger(cp, softirq);
	local_irq_restore(irq_state);
}

/*
 * Try to hand @cp to @cpu.  Returns 0 when the call was issued and 1
 * when @cpu is not online (the caller then queues the work locally).
 */
static int __try_remote_softirq(struct call_single_data *cp, int cpu, int softirq)
{
	if (!cpu_online(cpu))
		return 1;

	cp->func = remote_softirq_receive;
	cp->info = cp;
	cp->flags = 0;
	cp->priv = softirq;

	__smp_call_function_single(cpu, cp, 0);
	return 0;
}
#else /* CONFIG_USE_GENERIC_SMP_HELPERS */
/* No remote delivery available: always report failure. */
static int __try_remote_softirq(struct call_single_data *cp, int cpu, int softirq)
{
	return 1;
}
#endif
529
/**
 * __send_remote_softirq - try to schedule softirq work on a remote cpu
 * @cp: private SMP call function data area
 * @cpu: the remote cpu
 * @this_cpu: the currently executing cpu
 * @softirq: the softirq for the work
 *
 * Attempt to schedule softirq work on a remote cpu.  If this cannot be
 * done, the work is instead queued up on the local cpu.
 *
 * Interrupts must be disabled.
 */
void __send_remote_softirq(struct call_single_data *cp, int cpu, int this_cpu, int softirq)
{
	/* A successful remote hand-off leaves nothing to do here. */
	if (cpu != this_cpu && !__try_remote_softirq(cp, cpu, softirq))
		return;

	__local_trigger(cp, softirq);
}
EXPORT_SYMBOL(__send_remote_softirq);
548
/**
 * send_remote_softirq - try to schedule softirq work on a remote cpu
 * @cp: private SMP call function data area
 * @cpu: the remote cpu
 * @softirq: the softirq for the work
 *
 * Like __send_remote_softirq except that disabling interrupts and
 * computing the current cpu is done for the caller.
 */
void send_remote_softirq(struct call_single_data *cp, int cpu, int softirq)
{
	unsigned long irq_state;

	local_irq_save(irq_state);
	__send_remote_softirq(cp, cpu, smp_processor_id(), softirq);
	local_irq_restore(irq_state);
}
EXPORT_SYMBOL(send_remote_softirq);
569
570static int __cpuinit remote_softirq_cpu_notify(struct notifier_block *self,
571 unsigned long action, void *hcpu)
572{
573 /*
574 * If a CPU goes away, splice its entries to the current CPU
575 * and trigger a run of the softirq
576 */
577 if (action == CPU_DEAD || action == CPU_DEAD_FROZEN) {
578 int cpu = (unsigned long) hcpu;
579 int i;
580
581 local_irq_disable();
582 for (i = 0; i < NR_SOFTIRQS; i++) {
583 struct list_head *head = &per_cpu(softirq_work_list[i], cpu);
584 struct list_head *local_head;
585
586 if (list_empty(head))
587 continue;
588
589 local_head = &__get_cpu_var(softirq_work_list[i]);
590 list_splice_init(head, local_head);
591 raise_softirq_irqoff(i);
592 }
593 local_irq_enable();
594 }
595
596 return NOTIFY_OK;
597}
598
599static struct notifier_block __cpuinitdata remote_softirq_cpu_notifier = {
600 .notifier_call = remote_softirq_cpu_notify,
601};
602
Linus Torvalds1da177e2005-04-16 15:20:36 -0700603void __init softirq_init(void)
604{
Olof Johansson48f20a92008-03-04 15:23:25 -0800605 int cpu;
606
607 for_each_possible_cpu(cpu) {
David S. Miller54514a72008-09-23 22:15:57 -0700608 int i;
609
Olof Johansson48f20a92008-03-04 15:23:25 -0800610 per_cpu(tasklet_vec, cpu).tail =
611 &per_cpu(tasklet_vec, cpu).head;
612 per_cpu(tasklet_hi_vec, cpu).tail =
613 &per_cpu(tasklet_hi_vec, cpu).head;
David S. Miller54514a72008-09-23 22:15:57 -0700614 for (i = 0; i < NR_SOFTIRQS; i++)
615 INIT_LIST_HEAD(&per_cpu(softirq_work_list[i], cpu));
Olof Johansson48f20a92008-03-04 15:23:25 -0800616 }
617
David S. Miller54514a72008-09-23 22:15:57 -0700618 register_hotcpu_notifier(&remote_softirq_cpu_notifier);
619
Carlos R. Mafra962cf362008-05-15 11:15:37 -0300620 open_softirq(TASKLET_SOFTIRQ, tasklet_action);
621 open_softirq(HI_SOFTIRQ, tasklet_hi_action);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700622}
623
624static int ksoftirqd(void * __bind_cpu)
625{
Linus Torvalds1da177e2005-04-16 15:20:36 -0700626 set_current_state(TASK_INTERRUPTIBLE);
627
628 while (!kthread_should_stop()) {
629 preempt_disable();
630 if (!local_softirq_pending()) {
631 preempt_enable_no_resched();
632 schedule();
633 preempt_disable();
634 }
635
636 __set_current_state(TASK_RUNNING);
637
638 while (local_softirq_pending()) {
639 /* Preempt disable stops cpu going offline.
640 If already offline, we'll be on wrong CPU:
641 don't process */
642 if (cpu_is_offline((long)__bind_cpu))
643 goto wait_to_die;
644 do_softirq();
645 preempt_enable_no_resched();
646 cond_resched();
647 preempt_disable();
Eric Dumazet64ca5ab2009-03-04 12:11:56 -0800648 rcu_qsctr_inc((long)__bind_cpu);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700649 }
650 preempt_enable();
651 set_current_state(TASK_INTERRUPTIBLE);
652 }
653 __set_current_state(TASK_RUNNING);
654 return 0;
655
656wait_to_die:
657 preempt_enable();
658 /* Wait for kthread_stop */
659 set_current_state(TASK_INTERRUPTIBLE);
660 while (!kthread_should_stop()) {
661 schedule();
662 set_current_state(TASK_INTERRUPTIBLE);
663 }
664 __set_current_state(TASK_RUNNING);
665 return 0;
666}
667
668#ifdef CONFIG_HOTPLUG_CPU
669/*
670 * tasklet_kill_immediate is called to remove a tasklet which can already be
671 * scheduled for execution on @cpu.
672 *
673 * Unlike tasklet_kill, this function removes the tasklet
674 * _immediately_, even if the tasklet is in TASKLET_STATE_SCHED state.
675 *
676 * When this function is called, @cpu must be in the CPU_DEAD state.
677 */
678void tasklet_kill_immediate(struct tasklet_struct *t, unsigned int cpu)
679{
680 struct tasklet_struct **i;
681
682 BUG_ON(cpu_online(cpu));
683 BUG_ON(test_bit(TASKLET_STATE_RUN, &t->state));
684
685 if (!test_bit(TASKLET_STATE_SCHED, &t->state))
686 return;
687
688 /* CPU is dead, so no lock needed. */
Olof Johansson48f20a92008-03-04 15:23:25 -0800689 for (i = &per_cpu(tasklet_vec, cpu).head; *i; i = &(*i)->next) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700690 if (*i == t) {
691 *i = t->next;
Olof Johansson48f20a92008-03-04 15:23:25 -0800692 /* If this was the tail element, move the tail ptr */
693 if (*i == NULL)
694 per_cpu(tasklet_vec, cpu).tail = i;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700695 return;
696 }
697 }
698 BUG();
699}
700
701static void takeover_tasklets(unsigned int cpu)
702{
Linus Torvalds1da177e2005-04-16 15:20:36 -0700703 /* CPU is dead, so no lock needed. */
704 local_irq_disable();
705
706 /* Find end, append list for that CPU. */
Christian Borntraegere5e41722008-05-01 04:34:23 -0700707 if (&per_cpu(tasklet_vec, cpu).head != per_cpu(tasklet_vec, cpu).tail) {
708 *(__get_cpu_var(tasklet_vec).tail) = per_cpu(tasklet_vec, cpu).head;
709 __get_cpu_var(tasklet_vec).tail = per_cpu(tasklet_vec, cpu).tail;
710 per_cpu(tasklet_vec, cpu).head = NULL;
711 per_cpu(tasklet_vec, cpu).tail = &per_cpu(tasklet_vec, cpu).head;
712 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700713 raise_softirq_irqoff(TASKLET_SOFTIRQ);
714
Christian Borntraegere5e41722008-05-01 04:34:23 -0700715 if (&per_cpu(tasklet_hi_vec, cpu).head != per_cpu(tasklet_hi_vec, cpu).tail) {
716 *__get_cpu_var(tasklet_hi_vec).tail = per_cpu(tasklet_hi_vec, cpu).head;
717 __get_cpu_var(tasklet_hi_vec).tail = per_cpu(tasklet_hi_vec, cpu).tail;
718 per_cpu(tasklet_hi_vec, cpu).head = NULL;
719 per_cpu(tasklet_hi_vec, cpu).tail = &per_cpu(tasklet_hi_vec, cpu).head;
720 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700721 raise_softirq_irqoff(HI_SOFTIRQ);
722
723 local_irq_enable();
724}
725#endif /* CONFIG_HOTPLUG_CPU */
726
Chandra Seetharaman8c78f302006-07-30 03:03:35 -0700727static int __cpuinit cpu_callback(struct notifier_block *nfb,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700728 unsigned long action,
729 void *hcpu)
730{
731 int hotcpu = (unsigned long)hcpu;
732 struct task_struct *p;
733
734 switch (action) {
735 case CPU_UP_PREPARE:
Rafael J. Wysocki8bb78442007-05-09 02:35:10 -0700736 case CPU_UP_PREPARE_FROZEN:
Linus Torvalds1da177e2005-04-16 15:20:36 -0700737 p = kthread_create(ksoftirqd, hcpu, "ksoftirqd/%d", hotcpu);
738 if (IS_ERR(p)) {
739 printk("ksoftirqd for %i failed\n", hotcpu);
740 return NOTIFY_BAD;
741 }
742 kthread_bind(p, hotcpu);
743 per_cpu(ksoftirqd, hotcpu) = p;
744 break;
745 case CPU_ONLINE:
Rafael J. Wysocki8bb78442007-05-09 02:35:10 -0700746 case CPU_ONLINE_FROZEN:
Linus Torvalds1da177e2005-04-16 15:20:36 -0700747 wake_up_process(per_cpu(ksoftirqd, hotcpu));
748 break;
749#ifdef CONFIG_HOTPLUG_CPU
750 case CPU_UP_CANCELED:
Rafael J. Wysocki8bb78442007-05-09 02:35:10 -0700751 case CPU_UP_CANCELED_FROZEN:
Heiko Carstensfc75cdf2006-06-25 05:49:10 -0700752 if (!per_cpu(ksoftirqd, hotcpu))
753 break;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700754 /* Unbind so it can run. Fall thru. */
Heiko Carstensa4c4af72005-11-07 00:58:38 -0800755 kthread_bind(per_cpu(ksoftirqd, hotcpu),
Rusty Russellf1fc0572009-01-01 10:12:23 +1030756 cpumask_any(cpu_online_mask));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700757 case CPU_DEAD:
Satoru Takeuchi1c6b4aa2007-07-15 23:39:48 -0700758 case CPU_DEAD_FROZEN: {
759 struct sched_param param = { .sched_priority = MAX_RT_PRIO-1 };
760
Linus Torvalds1da177e2005-04-16 15:20:36 -0700761 p = per_cpu(ksoftirqd, hotcpu);
762 per_cpu(ksoftirqd, hotcpu) = NULL;
Rusty Russell961ccdd2008-06-23 13:55:38 +1000763 sched_setscheduler_nocheck(p, SCHED_FIFO, &param);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700764 kthread_stop(p);
765 takeover_tasklets(hotcpu);
766 break;
Satoru Takeuchi1c6b4aa2007-07-15 23:39:48 -0700767 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700768#endif /* CONFIG_HOTPLUG_CPU */
769 }
770 return NOTIFY_OK;
771}
772
Chandra Seetharaman8c78f302006-07-30 03:03:35 -0700773static struct notifier_block __cpuinitdata cpu_nfb = {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700774 .notifier_call = cpu_callback
775};
776
Eduard - Gabriel Munteanu7babe8d2008-07-25 19:45:11 -0700777static __init int spawn_ksoftirqd(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700778{
779 void *cpu = (void *)(long)smp_processor_id();
Akinobu Mita07dccf32006-09-29 02:00:22 -0700780 int err = cpu_callback(&cpu_nfb, CPU_UP_PREPARE, cpu);
781
782 BUG_ON(err == NOTIFY_BAD);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700783 cpu_callback(&cpu_nfb, CPU_ONLINE, cpu);
784 register_cpu_notifier(&cpu_nfb);
785 return 0;
786}
Eduard - Gabriel Munteanu7babe8d2008-07-25 19:45:11 -0700787early_initcall(spawn_ksoftirqd);
Andrew Morton78eef012006-03-22 00:08:16 -0800788
#ifdef CONFIG_SMP
/*
 * Call a function on all processors
 *
 * @func: function to run; it is passed @info
 * @info: opaque argument for @func
 * @wait: forwarded unchanged to smp_call_function()
 *
 * The other CPUs are reached through smp_call_function(); the local
 * call is made directly with interrupts disabled.  The caller's
 * interrupt state is saved and restored around the local call rather
 * than being unconditionally enabled afterwards.
 *
 * Returns the result of smp_call_function().
 */
int on_each_cpu(void (*func) (void *info), void *info, int wait)
{
	unsigned long flags;
	int ret;

	preempt_disable();
	ret = smp_call_function(func, info, wait);
	local_irq_save(flags);
	func(info);
	local_irq_restore(flags);
	preempt_enable();
	return ret;
}
EXPORT_SYMBOL(on_each_cpu);
#endif
Yinghai Lu43a25632008-12-28 16:01:13 -0800807
808/*
809 * [ These __weak aliases are kept in a separate compilation unit, so that
810 * GCC does not inline them incorrectly. ]
811 */
812
813int __init __weak early_irq_init(void)
814{
815 return 0;
816}
817
Yinghai Lu4a046d12009-01-12 17:39:24 -0800818int __init __weak arch_probe_nr_irqs(void)
819{
820 return 0;
821}
822
Yinghai Lu43a25632008-12-28 16:01:13 -0800823int __init __weak arch_early_irq_init(void)
824{
825 return 0;
826}
827
828int __weak arch_init_chip_data(struct irq_desc *desc, int cpu)
829{
830 return 0;
831}