blob: 80d323e6f61a352a2a25a7e8df82d337df995464 [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001/*
2 * linux/kernel/softirq.c
3 *
4 * Copyright (C) 1992 Linus Torvalds
5 *
Pavel Machekb10db7f2008-01-30 13:30:00 +01006 * Distribute under GPLv2.
7 *
8 * Rewritten. Old one was good in 2.2, but in 2.3 it was immoral. --ANK (990903)
David S. Miller54514a72008-09-23 22:15:57 -07009 *
10 * Remote softirq infrastructure is by Jens Axboe.
Linus Torvalds1da177e2005-04-16 15:20:36 -070011 */
12
13#include <linux/module.h>
14#include <linux/kernel_stat.h>
15#include <linux/interrupt.h>
16#include <linux/init.h>
17#include <linux/mm.h>
18#include <linux/notifier.h>
19#include <linux/percpu.h>
20#include <linux/cpu.h>
Rafael J. Wysocki83144182007-07-17 04:03:35 -070021#include <linux/freezer.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070022#include <linux/kthread.h>
23#include <linux/rcupdate.h>
Andrew Morton78eef012006-03-22 00:08:16 -080024#include <linux/smp.h>
Thomas Gleixner79bf2bb2007-02-16 01:28:03 -080025#include <linux/tick.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070026
27#include <asm/irq.h>
28/*
29 - No shared variables, all the data are CPU local.
30 - If a softirq needs serialization, let it serialize itself
31 by its own spinlocks.
32 - Even if softirq is serialized, only local cpu is marked for
33 execution. Hence, we get something sort of weak cpu binding.
34 Though it is still not clear, will it result in better locality
35 or will not.
36
37 Examples:
38 - NET RX softirq. It is multithreaded and does not require
39 any global serialization.
40 - NET TX softirq. It kicks software netdevice queues, hence
41 it is logically serialized per device, but this serialization
42 is invisible to common code.
43 - Tasklets: serialized wrt itself.
44 */
45
46#ifndef __ARCH_IRQ_STAT
47irq_cpustat_t irq_stat[NR_CPUS] ____cacheline_aligned;
48EXPORT_SYMBOL(irq_stat);
49#endif
50
Alexey Dobriyan978b0112008-09-06 20:04:36 +020051static struct softirq_action softirq_vec[NR_SOFTIRQS] __cacheline_aligned_in_smp;
Linus Torvalds1da177e2005-04-16 15:20:36 -070052
53static DEFINE_PER_CPU(struct task_struct *, ksoftirqd);
54
55/*
56 * we cannot loop indefinitely here to avoid userspace starvation,
57 * but we also don't want to introduce a worst case 1/HZ latency
58 * to the pending events, so lets the scheduler to balance
59 * the softirq load for us.
60 */
61static inline void wakeup_softirqd(void)
62{
63 /* Interrupts are disabled: no need to stop preemption */
64 struct task_struct *tsk = __get_cpu_var(ksoftirqd);
65
66 if (tsk && tsk->state != TASK_RUNNING)
67 wake_up_process(tsk);
68}
69
70/*
Ingo Molnarde30a2b2006-07-03 00:24:42 -070071 * This one is for softirq.c-internal use,
72 * where hardirqs are disabled legitimately:
73 */
Tim Chen3c829c32006-07-30 03:04:02 -070074#ifdef CONFIG_TRACE_IRQFLAGS
Ingo Molnarde30a2b2006-07-03 00:24:42 -070075static void __local_bh_disable(unsigned long ip)
76{
77 unsigned long flags;
78
79 WARN_ON_ONCE(in_irq());
80
81 raw_local_irq_save(flags);
82 add_preempt_count(SOFTIRQ_OFFSET);
83 /*
84 * Were softirqs turned off above:
85 */
86 if (softirq_count() == SOFTIRQ_OFFSET)
87 trace_softirqs_off(ip);
88 raw_local_irq_restore(flags);
89}
Tim Chen3c829c32006-07-30 03:04:02 -070090#else /* !CONFIG_TRACE_IRQFLAGS */
91static inline void __local_bh_disable(unsigned long ip)
92{
93 add_preempt_count(SOFTIRQ_OFFSET);
94 barrier();
95}
96#endif /* CONFIG_TRACE_IRQFLAGS */
Ingo Molnarde30a2b2006-07-03 00:24:42 -070097
98void local_bh_disable(void)
99{
100 __local_bh_disable((unsigned long)__builtin_return_address(0));
101}
102
103EXPORT_SYMBOL(local_bh_disable);
104
105void __local_bh_enable(void)
106{
107 WARN_ON_ONCE(in_irq());
108
109 /*
110 * softirqs should never be enabled by __local_bh_enable(),
111 * it always nests inside local_bh_enable() sections:
112 */
113 WARN_ON_ONCE(softirq_count() == SOFTIRQ_OFFSET);
114
115 sub_preempt_count(SOFTIRQ_OFFSET);
116}
117EXPORT_SYMBOL_GPL(__local_bh_enable);
118
119/*
120 * Special-case - softirqs can safely be enabled in
121 * cond_resched_softirq(), or by __do_softirq(),
122 * without processing still-pending softirqs:
123 */
124void _local_bh_enable(void)
125{
126 WARN_ON_ONCE(in_irq());
127 WARN_ON_ONCE(!irqs_disabled());
128
129 if (softirq_count() == SOFTIRQ_OFFSET)
130 trace_softirqs_on((unsigned long)__builtin_return_address(0));
131 sub_preempt_count(SOFTIRQ_OFFSET);
132}
133
134EXPORT_SYMBOL(_local_bh_enable);
135
Johannes Berg0f476b6d2008-06-18 09:29:37 +0200136static inline void _local_bh_enable_ip(unsigned long ip)
Ingo Molnarde30a2b2006-07-03 00:24:42 -0700137{
Johannes Berg0f476b6d2008-06-18 09:29:37 +0200138 WARN_ON_ONCE(in_irq() || irqs_disabled());
Tim Chen3c829c32006-07-30 03:04:02 -0700139#ifdef CONFIG_TRACE_IRQFLAGS
Johannes Berg0f476b6d2008-06-18 09:29:37 +0200140 local_irq_disable();
Tim Chen3c829c32006-07-30 03:04:02 -0700141#endif
Ingo Molnarde30a2b2006-07-03 00:24:42 -0700142 /*
143 * Are softirqs going to be turned on now:
144 */
145 if (softirq_count() == SOFTIRQ_OFFSET)
146 trace_softirqs_on(ip);
147 /*
148 * Keep preemption disabled until we are done with
149 * softirq processing:
150 */
151 sub_preempt_count(SOFTIRQ_OFFSET - 1);
152
153 if (unlikely(!in_interrupt() && local_softirq_pending()))
154 do_softirq();
155
156 dec_preempt_count();
Tim Chen3c829c32006-07-30 03:04:02 -0700157#ifdef CONFIG_TRACE_IRQFLAGS
Johannes Berg0f476b6d2008-06-18 09:29:37 +0200158 local_irq_enable();
Tim Chen3c829c32006-07-30 03:04:02 -0700159#endif
Ingo Molnarde30a2b2006-07-03 00:24:42 -0700160 preempt_check_resched();
161}
Johannes Berg0f476b6d2008-06-18 09:29:37 +0200162
163void local_bh_enable(void)
164{
165 _local_bh_enable_ip((unsigned long)__builtin_return_address(0));
166}
167EXPORT_SYMBOL(local_bh_enable);
168
169void local_bh_enable_ip(unsigned long ip)
170{
171 _local_bh_enable_ip(ip);
172}
Ingo Molnarde30a2b2006-07-03 00:24:42 -0700173EXPORT_SYMBOL(local_bh_enable_ip);
174
175/*
Linus Torvalds1da177e2005-04-16 15:20:36 -0700176 * We restart softirq processing MAX_SOFTIRQ_RESTART times,
177 * and we fall back to softirqd after that.
178 *
179 * This number has been established via experimentation.
180 * The two things to balance is latency against fairness -
181 * we want to handle softirqs as soon as possible, but they
182 * should not be able to lock up the box.
183 */
184#define MAX_SOFTIRQ_RESTART 10
185
186asmlinkage void __do_softirq(void)
187{
188 struct softirq_action *h;
189 __u32 pending;
190 int max_restart = MAX_SOFTIRQ_RESTART;
191 int cpu;
192
193 pending = local_softirq_pending();
Paul Mackerras829035fd2006-07-03 00:25:40 -0700194 account_system_vtime(current);
195
Ingo Molnarde30a2b2006-07-03 00:24:42 -0700196 __local_bh_disable((unsigned long)__builtin_return_address(0));
197 trace_softirq_enter();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700198
Linus Torvalds1da177e2005-04-16 15:20:36 -0700199 cpu = smp_processor_id();
200restart:
201 /* Reset the pending bitmask before enabling irqs */
Andi Kleen3f744782005-09-12 18:49:24 +0200202 set_softirq_pending(0);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700203
Andrew Mortonc70f5d62005-07-30 10:22:49 -0700204 local_irq_enable();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700205
206 h = softirq_vec;
207
208 do {
209 if (pending & 1) {
Thomas Gleixner8e85b4b2008-10-02 10:50:53 +0200210 int prev_count = preempt_count();
211
Linus Torvalds1da177e2005-04-16 15:20:36 -0700212 h->action(h);
Thomas Gleixner8e85b4b2008-10-02 10:50:53 +0200213
214 if (unlikely(prev_count != preempt_count())) {
Linus Torvalds1c95e1b2008-10-16 15:32:46 -0700215 printk(KERN_ERR "huh, entered softirq %td %p"
Thomas Gleixner8e85b4b2008-10-02 10:50:53 +0200216 "with preempt_count %08x,"
217 " exited with %08x?\n", h - softirq_vec,
218 h->action, prev_count, preempt_count());
219 preempt_count() = prev_count;
220 }
221
Linus Torvalds1da177e2005-04-16 15:20:36 -0700222 rcu_bh_qsctr_inc(cpu);
223 }
224 h++;
225 pending >>= 1;
226 } while (pending);
227
Andrew Mortonc70f5d62005-07-30 10:22:49 -0700228 local_irq_disable();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700229
230 pending = local_softirq_pending();
231 if (pending && --max_restart)
232 goto restart;
233
234 if (pending)
235 wakeup_softirqd();
236
Ingo Molnarde30a2b2006-07-03 00:24:42 -0700237 trace_softirq_exit();
Paul Mackerras829035fd2006-07-03 00:25:40 -0700238
239 account_system_vtime(current);
Ingo Molnarde30a2b2006-07-03 00:24:42 -0700240 _local_bh_enable();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700241}
242
243#ifndef __ARCH_HAS_DO_SOFTIRQ
244
245asmlinkage void do_softirq(void)
246{
247 __u32 pending;
248 unsigned long flags;
249
250 if (in_interrupt())
251 return;
252
253 local_irq_save(flags);
254
255 pending = local_softirq_pending();
256
257 if (pending)
258 __do_softirq();
259
260 local_irq_restore(flags);
261}
262
Linus Torvalds1da177e2005-04-16 15:20:36 -0700263#endif
264
Ingo Molnardde4b2b2007-02-16 01:27:45 -0800265/*
266 * Enter an interrupt context.
267 */
268void irq_enter(void)
269{
Venki Pallipadi6378ddb2008-01-30 13:30:04 +0100270 int cpu = smp_processor_id();
Thomas Gleixner719254f2008-10-17 09:59:47 +0200271
Paul E. McKenney64db4cf2008-12-18 21:55:32 +0100272 rcu_irq_enter();
Thomas Gleixneree5f80a2008-11-07 11:06:00 +0100273 if (idle_cpu(cpu) && !in_interrupt()) {
274 __irq_enter();
Thomas Gleixner719254f2008-10-17 09:59:47 +0200275 tick_check_idle(cpu);
Thomas Gleixneree5f80a2008-11-07 11:06:00 +0100276 } else
277 __irq_enter();
Ingo Molnardde4b2b2007-02-16 01:27:45 -0800278}
279
Linus Torvalds1da177e2005-04-16 15:20:36 -0700280#ifdef __ARCH_IRQ_EXIT_IRQS_DISABLED
281# define invoke_softirq() __do_softirq()
282#else
283# define invoke_softirq() do_softirq()
284#endif
285
286/*
287 * Exit an interrupt context. Process softirqs if needed and possible:
288 */
289void irq_exit(void)
290{
291 account_system_vtime(current);
Ingo Molnarde30a2b2006-07-03 00:24:42 -0700292 trace_hardirq_exit();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700293 sub_preempt_count(IRQ_EXIT_OFFSET);
294 if (!in_interrupt() && local_softirq_pending())
295 invoke_softirq();
Thomas Gleixner79bf2bb2007-02-16 01:28:03 -0800296
297#ifdef CONFIG_NO_HZ
298 /* Make sure that timer wheel updates are propagated */
Steven Rostedt2232c2d2008-02-29 18:46:50 +0100299 rcu_irq_exit();
Paul E. McKenney64db4cf2008-12-18 21:55:32 +0100300 if (idle_cpu(smp_processor_id()) && !in_interrupt() && !need_resched())
301 tick_nohz_stop_sched_tick(0);
Thomas Gleixner79bf2bb2007-02-16 01:28:03 -0800302#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700303 preempt_enable_no_resched();
304}
305
306/*
307 * This function must run with irqs disabled!
308 */
Harvey Harrison7ad5b3a2008-02-08 04:19:53 -0800309inline void raise_softirq_irqoff(unsigned int nr)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700310{
311 __raise_softirq_irqoff(nr);
312
313 /*
314 * If we're in an interrupt or softirq, we're done
315 * (this also catches softirq-disabled code). We will
316 * actually run the softirq once we return from
317 * the irq or softirq.
318 *
319 * Otherwise we wake up ksoftirqd to make sure we
320 * schedule the softirq soon.
321 */
322 if (!in_interrupt())
323 wakeup_softirqd();
324}
325
Harvey Harrison7ad5b3a2008-02-08 04:19:53 -0800326void raise_softirq(unsigned int nr)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700327{
328 unsigned long flags;
329
330 local_irq_save(flags);
331 raise_softirq_irqoff(nr);
332 local_irq_restore(flags);
333}
334
Carlos R. Mafra962cf362008-05-15 11:15:37 -0300335void open_softirq(int nr, void (*action)(struct softirq_action *))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700336{
Linus Torvalds1da177e2005-04-16 15:20:36 -0700337 softirq_vec[nr].action = action;
338}
339
Linus Torvalds1da177e2005-04-16 15:20:36 -0700340/* Tasklets */
341struct tasklet_head
342{
Olof Johansson48f20a92008-03-04 15:23:25 -0800343 struct tasklet_struct *head;
344 struct tasklet_struct **tail;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700345};
346
Vegard Nossum4620b492008-06-12 23:21:53 +0200347static DEFINE_PER_CPU(struct tasklet_head, tasklet_vec);
348static DEFINE_PER_CPU(struct tasklet_head, tasklet_hi_vec);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700349
Harvey Harrison7ad5b3a2008-02-08 04:19:53 -0800350void __tasklet_schedule(struct tasklet_struct *t)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700351{
352 unsigned long flags;
353
354 local_irq_save(flags);
Olof Johansson48f20a92008-03-04 15:23:25 -0800355 t->next = NULL;
356 *__get_cpu_var(tasklet_vec).tail = t;
357 __get_cpu_var(tasklet_vec).tail = &(t->next);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700358 raise_softirq_irqoff(TASKLET_SOFTIRQ);
359 local_irq_restore(flags);
360}
361
362EXPORT_SYMBOL(__tasklet_schedule);
363
Harvey Harrison7ad5b3a2008-02-08 04:19:53 -0800364void __tasklet_hi_schedule(struct tasklet_struct *t)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700365{
366 unsigned long flags;
367
368 local_irq_save(flags);
Olof Johansson48f20a92008-03-04 15:23:25 -0800369 t->next = NULL;
370 *__get_cpu_var(tasklet_hi_vec).tail = t;
371 __get_cpu_var(tasklet_hi_vec).tail = &(t->next);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700372 raise_softirq_irqoff(HI_SOFTIRQ);
373 local_irq_restore(flags);
374}
375
376EXPORT_SYMBOL(__tasklet_hi_schedule);
377
378static void tasklet_action(struct softirq_action *a)
379{
380 struct tasklet_struct *list;
381
382 local_irq_disable();
Olof Johansson48f20a92008-03-04 15:23:25 -0800383 list = __get_cpu_var(tasklet_vec).head;
384 __get_cpu_var(tasklet_vec).head = NULL;
385 __get_cpu_var(tasklet_vec).tail = &__get_cpu_var(tasklet_vec).head;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700386 local_irq_enable();
387
388 while (list) {
389 struct tasklet_struct *t = list;
390
391 list = list->next;
392
393 if (tasklet_trylock(t)) {
394 if (!atomic_read(&t->count)) {
395 if (!test_and_clear_bit(TASKLET_STATE_SCHED, &t->state))
396 BUG();
397 t->func(t->data);
398 tasklet_unlock(t);
399 continue;
400 }
401 tasklet_unlock(t);
402 }
403
404 local_irq_disable();
Olof Johansson48f20a92008-03-04 15:23:25 -0800405 t->next = NULL;
406 *__get_cpu_var(tasklet_vec).tail = t;
407 __get_cpu_var(tasklet_vec).tail = &(t->next);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700408 __raise_softirq_irqoff(TASKLET_SOFTIRQ);
409 local_irq_enable();
410 }
411}
412
413static void tasklet_hi_action(struct softirq_action *a)
414{
415 struct tasklet_struct *list;
416
417 local_irq_disable();
Olof Johansson48f20a92008-03-04 15:23:25 -0800418 list = __get_cpu_var(tasklet_hi_vec).head;
419 __get_cpu_var(tasklet_hi_vec).head = NULL;
420 __get_cpu_var(tasklet_hi_vec).tail = &__get_cpu_var(tasklet_hi_vec).head;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700421 local_irq_enable();
422
423 while (list) {
424 struct tasklet_struct *t = list;
425
426 list = list->next;
427
428 if (tasklet_trylock(t)) {
429 if (!atomic_read(&t->count)) {
430 if (!test_and_clear_bit(TASKLET_STATE_SCHED, &t->state))
431 BUG();
432 t->func(t->data);
433 tasklet_unlock(t);
434 continue;
435 }
436 tasklet_unlock(t);
437 }
438
439 local_irq_disable();
Olof Johansson48f20a92008-03-04 15:23:25 -0800440 t->next = NULL;
441 *__get_cpu_var(tasklet_hi_vec).tail = t;
442 __get_cpu_var(tasklet_hi_vec).tail = &(t->next);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700443 __raise_softirq_irqoff(HI_SOFTIRQ);
444 local_irq_enable();
445 }
446}
447
448
449void tasklet_init(struct tasklet_struct *t,
450 void (*func)(unsigned long), unsigned long data)
451{
452 t->next = NULL;
453 t->state = 0;
454 atomic_set(&t->count, 0);
455 t->func = func;
456 t->data = data;
457}
458
459EXPORT_SYMBOL(tasklet_init);
460
461void tasklet_kill(struct tasklet_struct *t)
462{
463 if (in_interrupt())
464 printk("Attempt to kill tasklet from interrupt\n");
465
466 while (test_and_set_bit(TASKLET_STATE_SCHED, &t->state)) {
467 do
468 yield();
469 while (test_bit(TASKLET_STATE_SCHED, &t->state));
470 }
471 tasklet_unlock_wait(t);
472 clear_bit(TASKLET_STATE_SCHED, &t->state);
473}
474
475EXPORT_SYMBOL(tasklet_kill);
476
David S. Miller54514a72008-09-23 22:15:57 -0700477DEFINE_PER_CPU(struct list_head [NR_SOFTIRQS], softirq_work_list);
478EXPORT_PER_CPU_SYMBOL(softirq_work_list);
479
480static void __local_trigger(struct call_single_data *cp, int softirq)
481{
482 struct list_head *head = &__get_cpu_var(softirq_work_list[softirq]);
483
484 list_add_tail(&cp->list, head);
485
486 /* Trigger the softirq only if the list was previously empty. */
487 if (head->next == &cp->list)
488 raise_softirq_irqoff(softirq);
489}
490
491#ifdef CONFIG_USE_GENERIC_SMP_HELPERS
492static void remote_softirq_receive(void *data)
493{
494 struct call_single_data *cp = data;
495 unsigned long flags;
496 int softirq;
497
498 softirq = cp->priv;
499
500 local_irq_save(flags);
501 __local_trigger(cp, softirq);
502 local_irq_restore(flags);
503}
504
505static int __try_remote_softirq(struct call_single_data *cp, int cpu, int softirq)
506{
507 if (cpu_online(cpu)) {
508 cp->func = remote_softirq_receive;
509 cp->info = cp;
510 cp->flags = 0;
511 cp->priv = softirq;
512
513 __smp_call_function_single(cpu, cp);
514 return 0;
515 }
516 return 1;
517}
518#else /* CONFIG_USE_GENERIC_SMP_HELPERS */
519static int __try_remote_softirq(struct call_single_data *cp, int cpu, int softirq)
520{
521 return 1;
522}
523#endif
524
525/**
526 * __send_remote_softirq - try to schedule softirq work on a remote cpu
527 * @cp: private SMP call function data area
528 * @cpu: the remote cpu
529 * @this_cpu: the currently executing cpu
530 * @softirq: the softirq for the work
531 *
532 * Attempt to schedule softirq work on a remote cpu. If this cannot be
533 * done, the work is instead queued up on the local cpu.
534 *
535 * Interrupts must be disabled.
536 */
537void __send_remote_softirq(struct call_single_data *cp, int cpu, int this_cpu, int softirq)
538{
539 if (cpu == this_cpu || __try_remote_softirq(cp, cpu, softirq))
540 __local_trigger(cp, softirq);
541}
542EXPORT_SYMBOL(__send_remote_softirq);
543
544/**
545 * send_remote_softirq - try to schedule softirq work on a remote cpu
546 * @cp: private SMP call function data area
547 * @cpu: the remote cpu
548 * @softirq: the softirq for the work
549 *
550 * Like __send_remote_softirq except that disabling interrupts and
551 * computing the current cpu is done for the caller.
552 */
553void send_remote_softirq(struct call_single_data *cp, int cpu, int softirq)
554{
555 unsigned long flags;
556 int this_cpu;
557
558 local_irq_save(flags);
559 this_cpu = smp_processor_id();
560 __send_remote_softirq(cp, cpu, this_cpu, softirq);
561 local_irq_restore(flags);
562}
563EXPORT_SYMBOL(send_remote_softirq);
564
565static int __cpuinit remote_softirq_cpu_notify(struct notifier_block *self,
566 unsigned long action, void *hcpu)
567{
568 /*
569 * If a CPU goes away, splice its entries to the current CPU
570 * and trigger a run of the softirq
571 */
572 if (action == CPU_DEAD || action == CPU_DEAD_FROZEN) {
573 int cpu = (unsigned long) hcpu;
574 int i;
575
576 local_irq_disable();
577 for (i = 0; i < NR_SOFTIRQS; i++) {
578 struct list_head *head = &per_cpu(softirq_work_list[i], cpu);
579 struct list_head *local_head;
580
581 if (list_empty(head))
582 continue;
583
584 local_head = &__get_cpu_var(softirq_work_list[i]);
585 list_splice_init(head, local_head);
586 raise_softirq_irqoff(i);
587 }
588 local_irq_enable();
589 }
590
591 return NOTIFY_OK;
592}
593
594static struct notifier_block __cpuinitdata remote_softirq_cpu_notifier = {
595 .notifier_call = remote_softirq_cpu_notify,
596};
597
Linus Torvalds1da177e2005-04-16 15:20:36 -0700598void __init softirq_init(void)
599{
Olof Johansson48f20a92008-03-04 15:23:25 -0800600 int cpu;
601
602 for_each_possible_cpu(cpu) {
David S. Miller54514a72008-09-23 22:15:57 -0700603 int i;
604
Olof Johansson48f20a92008-03-04 15:23:25 -0800605 per_cpu(tasklet_vec, cpu).tail =
606 &per_cpu(tasklet_vec, cpu).head;
607 per_cpu(tasklet_hi_vec, cpu).tail =
608 &per_cpu(tasklet_hi_vec, cpu).head;
David S. Miller54514a72008-09-23 22:15:57 -0700609 for (i = 0; i < NR_SOFTIRQS; i++)
610 INIT_LIST_HEAD(&per_cpu(softirq_work_list[i], cpu));
Olof Johansson48f20a92008-03-04 15:23:25 -0800611 }
612
David S. Miller54514a72008-09-23 22:15:57 -0700613 register_hotcpu_notifier(&remote_softirq_cpu_notifier);
614
Carlos R. Mafra962cf362008-05-15 11:15:37 -0300615 open_softirq(TASKLET_SOFTIRQ, tasklet_action);
616 open_softirq(HI_SOFTIRQ, tasklet_hi_action);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700617}
618
619static int ksoftirqd(void * __bind_cpu)
620{
Linus Torvalds1da177e2005-04-16 15:20:36 -0700621 set_current_state(TASK_INTERRUPTIBLE);
622
623 while (!kthread_should_stop()) {
624 preempt_disable();
625 if (!local_softirq_pending()) {
626 preempt_enable_no_resched();
627 schedule();
628 preempt_disable();
629 }
630
631 __set_current_state(TASK_RUNNING);
632
633 while (local_softirq_pending()) {
634 /* Preempt disable stops cpu going offline.
635 If already offline, we'll be on wrong CPU:
636 don't process */
637 if (cpu_is_offline((long)__bind_cpu))
638 goto wait_to_die;
639 do_softirq();
640 preempt_enable_no_resched();
641 cond_resched();
642 preempt_disable();
643 }
644 preempt_enable();
645 set_current_state(TASK_INTERRUPTIBLE);
646 }
647 __set_current_state(TASK_RUNNING);
648 return 0;
649
650wait_to_die:
651 preempt_enable();
652 /* Wait for kthread_stop */
653 set_current_state(TASK_INTERRUPTIBLE);
654 while (!kthread_should_stop()) {
655 schedule();
656 set_current_state(TASK_INTERRUPTIBLE);
657 }
658 __set_current_state(TASK_RUNNING);
659 return 0;
660}
661
662#ifdef CONFIG_HOTPLUG_CPU
663/*
664 * tasklet_kill_immediate is called to remove a tasklet which can already be
665 * scheduled for execution on @cpu.
666 *
667 * Unlike tasklet_kill, this function removes the tasklet
668 * _immediately_, even if the tasklet is in TASKLET_STATE_SCHED state.
669 *
670 * When this function is called, @cpu must be in the CPU_DEAD state.
671 */
672void tasklet_kill_immediate(struct tasklet_struct *t, unsigned int cpu)
673{
674 struct tasklet_struct **i;
675
676 BUG_ON(cpu_online(cpu));
677 BUG_ON(test_bit(TASKLET_STATE_RUN, &t->state));
678
679 if (!test_bit(TASKLET_STATE_SCHED, &t->state))
680 return;
681
682 /* CPU is dead, so no lock needed. */
Olof Johansson48f20a92008-03-04 15:23:25 -0800683 for (i = &per_cpu(tasklet_vec, cpu).head; *i; i = &(*i)->next) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700684 if (*i == t) {
685 *i = t->next;
Olof Johansson48f20a92008-03-04 15:23:25 -0800686 /* If this was the tail element, move the tail ptr */
687 if (*i == NULL)
688 per_cpu(tasklet_vec, cpu).tail = i;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700689 return;
690 }
691 }
692 BUG();
693}
694
695static void takeover_tasklets(unsigned int cpu)
696{
Linus Torvalds1da177e2005-04-16 15:20:36 -0700697 /* CPU is dead, so no lock needed. */
698 local_irq_disable();
699
700 /* Find end, append list for that CPU. */
Christian Borntraegere5e41722008-05-01 04:34:23 -0700701 if (&per_cpu(tasklet_vec, cpu).head != per_cpu(tasklet_vec, cpu).tail) {
702 *(__get_cpu_var(tasklet_vec).tail) = per_cpu(tasklet_vec, cpu).head;
703 __get_cpu_var(tasklet_vec).tail = per_cpu(tasklet_vec, cpu).tail;
704 per_cpu(tasklet_vec, cpu).head = NULL;
705 per_cpu(tasklet_vec, cpu).tail = &per_cpu(tasklet_vec, cpu).head;
706 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700707 raise_softirq_irqoff(TASKLET_SOFTIRQ);
708
Christian Borntraegere5e41722008-05-01 04:34:23 -0700709 if (&per_cpu(tasklet_hi_vec, cpu).head != per_cpu(tasklet_hi_vec, cpu).tail) {
710 *__get_cpu_var(tasklet_hi_vec).tail = per_cpu(tasklet_hi_vec, cpu).head;
711 __get_cpu_var(tasklet_hi_vec).tail = per_cpu(tasklet_hi_vec, cpu).tail;
712 per_cpu(tasklet_hi_vec, cpu).head = NULL;
713 per_cpu(tasklet_hi_vec, cpu).tail = &per_cpu(tasklet_hi_vec, cpu).head;
714 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700715 raise_softirq_irqoff(HI_SOFTIRQ);
716
717 local_irq_enable();
718}
719#endif /* CONFIG_HOTPLUG_CPU */
720
Chandra Seetharaman8c78f302006-07-30 03:03:35 -0700721static int __cpuinit cpu_callback(struct notifier_block *nfb,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700722 unsigned long action,
723 void *hcpu)
724{
725 int hotcpu = (unsigned long)hcpu;
726 struct task_struct *p;
727
728 switch (action) {
729 case CPU_UP_PREPARE:
Rafael J. Wysocki8bb78442007-05-09 02:35:10 -0700730 case CPU_UP_PREPARE_FROZEN:
Linus Torvalds1da177e2005-04-16 15:20:36 -0700731 p = kthread_create(ksoftirqd, hcpu, "ksoftirqd/%d", hotcpu);
732 if (IS_ERR(p)) {
733 printk("ksoftirqd for %i failed\n", hotcpu);
734 return NOTIFY_BAD;
735 }
736 kthread_bind(p, hotcpu);
737 per_cpu(ksoftirqd, hotcpu) = p;
738 break;
739 case CPU_ONLINE:
Rafael J. Wysocki8bb78442007-05-09 02:35:10 -0700740 case CPU_ONLINE_FROZEN:
Linus Torvalds1da177e2005-04-16 15:20:36 -0700741 wake_up_process(per_cpu(ksoftirqd, hotcpu));
742 break;
743#ifdef CONFIG_HOTPLUG_CPU
744 case CPU_UP_CANCELED:
Rafael J. Wysocki8bb78442007-05-09 02:35:10 -0700745 case CPU_UP_CANCELED_FROZEN:
Heiko Carstensfc75cdf2006-06-25 05:49:10 -0700746 if (!per_cpu(ksoftirqd, hotcpu))
747 break;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700748 /* Unbind so it can run. Fall thru. */
Heiko Carstensa4c4af72005-11-07 00:58:38 -0800749 kthread_bind(per_cpu(ksoftirqd, hotcpu),
750 any_online_cpu(cpu_online_map));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700751 case CPU_DEAD:
Satoru Takeuchi1c6b4aa2007-07-15 23:39:48 -0700752 case CPU_DEAD_FROZEN: {
753 struct sched_param param = { .sched_priority = MAX_RT_PRIO-1 };
754
Linus Torvalds1da177e2005-04-16 15:20:36 -0700755 p = per_cpu(ksoftirqd, hotcpu);
756 per_cpu(ksoftirqd, hotcpu) = NULL;
Rusty Russell961ccdd2008-06-23 13:55:38 +1000757 sched_setscheduler_nocheck(p, SCHED_FIFO, &param);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700758 kthread_stop(p);
759 takeover_tasklets(hotcpu);
760 break;
Satoru Takeuchi1c6b4aa2007-07-15 23:39:48 -0700761 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700762#endif /* CONFIG_HOTPLUG_CPU */
763 }
764 return NOTIFY_OK;
765}
766
Chandra Seetharaman8c78f302006-07-30 03:03:35 -0700767static struct notifier_block __cpuinitdata cpu_nfb = {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700768 .notifier_call = cpu_callback
769};
770
Eduard - Gabriel Munteanu7babe8d2008-07-25 19:45:11 -0700771static __init int spawn_ksoftirqd(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700772{
773 void *cpu = (void *)(long)smp_processor_id();
Akinobu Mita07dccf32006-09-29 02:00:22 -0700774 int err = cpu_callback(&cpu_nfb, CPU_UP_PREPARE, cpu);
775
776 BUG_ON(err == NOTIFY_BAD);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700777 cpu_callback(&cpu_nfb, CPU_ONLINE, cpu);
778 register_cpu_notifier(&cpu_nfb);
779 return 0;
780}
Eduard - Gabriel Munteanu7babe8d2008-07-25 19:45:11 -0700781early_initcall(spawn_ksoftirqd);
Andrew Morton78eef012006-03-22 00:08:16 -0800782
783#ifdef CONFIG_SMP
784/*
785 * Call a function on all processors
786 */
Jens Axboe15c8b6c2008-05-09 09:39:44 +0200787int on_each_cpu(void (*func) (void *info), void *info, int wait)
Andrew Morton78eef012006-03-22 00:08:16 -0800788{
789 int ret = 0;
790
791 preempt_disable();
Jens Axboe8691e5a2008-06-06 11:18:06 +0200792 ret = smp_call_function(func, info, wait);
Andrew Morton78eef012006-03-22 00:08:16 -0800793 local_irq_disable();
794 func(info);
795 local_irq_enable();
796 preempt_enable();
797 return ret;
798}
799EXPORT_SYMBOL(on_each_cpu);
800#endif