Merge branch 'x86/apic' into irq/numa
[linux-2.6] / kernel / softirq.c
1 /*
2  *      linux/kernel/softirq.c
3  *
4  *      Copyright (C) 1992 Linus Torvalds
5  *
6  *      Distribute under GPLv2.
7  *
8  *      Rewritten. Old one was good in 2.2, but in 2.3 it was immoral. --ANK (990903)
9  *
10  *      Remote softirq infrastructure is by Jens Axboe.
11  */
12
13 #include <linux/module.h>
14 #include <linux/kernel_stat.h>
15 #include <linux/interrupt.h>
16 #include <linux/init.h>
17 #include <linux/mm.h>
18 #include <linux/notifier.h>
19 #include <linux/percpu.h>
20 #include <linux/cpu.h>
21 #include <linux/freezer.h>
22 #include <linux/kthread.h>
23 #include <linux/rcupdate.h>
24 #include <linux/ftrace.h>
25 #include <linux/smp.h>
26 #include <linux/tick.h>
27 #include <trace/irq.h>
28
29 #include <asm/irq.h>
30 /*
31    - No shared variables, all the data are CPU local.
32    - If a softirq needs serialization, let it serialize itself
33      by its own spinlocks.
34    - Even if softirq is serialized, only local cpu is marked for
35      execution. Hence, we get something sort of weak cpu binding.
36      It is still not clear whether this results in better locality
37      or not.
38
39    Examples:
40    - NET RX softirq. It is multithreaded and does not require
41      any global serialization.
42    - NET TX softirq. It kicks software netdevice queues, hence
43      it is logically serialized per device, but this serialization
44      is invisible to common code.
45    - Tasklets: serialized wrt itself.
46  */
47
48 #ifndef __ARCH_IRQ_STAT
49 irq_cpustat_t irq_stat[NR_CPUS] ____cacheline_aligned;
50 EXPORT_SYMBOL(irq_stat);
51 #endif
52
53 static struct softirq_action softirq_vec[NR_SOFTIRQS] __cacheline_aligned_in_smp;
54
55 static DEFINE_PER_CPU(struct task_struct *, ksoftirqd);
56
57 char *softirq_to_name[NR_SOFTIRQS] = {
58         "HI", "TIMER", "NET_TX", "NET_RX", "BLOCK",
59         "TASKLET", "SCHED", "HRTIMER",  "RCU"
60 };
61
62 /*
63  * we cannot loop indefinitely here to avoid userspace starvation,
64  * but we also don't want to introduce a worst case 1/HZ latency
65  * to the pending events, so lets the scheduler to balance
66  * the softirq load for us.
67  */
68 void wakeup_softirqd(void)
69 {
70         /* Interrupts are disabled: no need to stop preemption */
71         struct task_struct *tsk = __get_cpu_var(ksoftirqd);
72
73         if (tsk && tsk->state != TASK_RUNNING)
74                 wake_up_process(tsk);
75 }
76
77 /*
78  * This one is for softirq.c-internal use,
79  * where hardirqs are disabled legitimately:
80  */
81 #ifdef CONFIG_TRACE_IRQFLAGS
82 static void __local_bh_disable(unsigned long ip)
83 {
84         unsigned long flags;
85
86         WARN_ON_ONCE(in_irq());
87
88         raw_local_irq_save(flags);
89         /*
90          * The preempt tracer hooks into add_preempt_count and will break
91          * lockdep because it calls back into lockdep after SOFTIRQ_OFFSET
92          * is set and before current->softirq_enabled is cleared.
93          * We must manually increment preempt_count here and manually
94          * call the trace_preempt_off later.
95          */
96         preempt_count() += SOFTIRQ_OFFSET;
97         /*
98          * Were softirqs turned off above:
99          */
100         if (softirq_count() == SOFTIRQ_OFFSET)
101                 trace_softirqs_off(ip);
102         raw_local_irq_restore(flags);
103
104         if (preempt_count() == SOFTIRQ_OFFSET)
105                 trace_preempt_off(CALLER_ADDR0, get_parent_ip(CALLER_ADDR1));
106 }
107 #else /* !CONFIG_TRACE_IRQFLAGS */
108 static inline void __local_bh_disable(unsigned long ip)
109 {
110         add_preempt_count(SOFTIRQ_OFFSET);
111         barrier();
112 }
113 #endif /* CONFIG_TRACE_IRQFLAGS */
114
/*
 * Disable softirq processing for the current context, recording the
 * caller's return address for the tracer.
 */
void local_bh_disable(void)
{
	unsigned long caller = (unsigned long)__builtin_return_address(0);

	__local_bh_disable(caller);
}

EXPORT_SYMBOL(local_bh_disable);
121
122 /*
123  * Special-case - softirqs can safely be enabled in
124  * cond_resched_softirq(), or by __do_softirq(),
125  * without processing still-pending softirqs:
126  */
127 void _local_bh_enable(void)
128 {
129         WARN_ON_ONCE(in_irq());
130         WARN_ON_ONCE(!irqs_disabled());
131
132         if (softirq_count() == SOFTIRQ_OFFSET)
133                 trace_softirqs_on((unsigned long)__builtin_return_address(0));
134         sub_preempt_count(SOFTIRQ_OFFSET);
135 }
136
137 EXPORT_SYMBOL(_local_bh_enable);
138
139 static inline void _local_bh_enable_ip(unsigned long ip)
140 {
141         WARN_ON_ONCE(in_irq() || irqs_disabled());
142 #ifdef CONFIG_TRACE_IRQFLAGS
143         local_irq_disable();
144 #endif
145         /*
146          * Are softirqs going to be turned on now:
147          */
148         if (softirq_count() == SOFTIRQ_OFFSET)
149                 trace_softirqs_on(ip);
150         /*
151          * Keep preemption disabled until we are done with
152          * softirq processing:
153          */
154         sub_preempt_count(SOFTIRQ_OFFSET - 1);
155
156         if (unlikely(!in_interrupt() && local_softirq_pending()))
157                 do_softirq();
158
159         dec_preempt_count();
160 #ifdef CONFIG_TRACE_IRQFLAGS
161         local_irq_enable();
162 #endif
163         preempt_check_resched();
164 }
165
/*
 * Re-enable softirq processing, using this function's return address
 * as the caller address for tracing.
 */
void local_bh_enable(void)
{
	unsigned long caller = (unsigned long)__builtin_return_address(0);

	_local_bh_enable_ip(caller);
}
EXPORT_SYMBOL(local_bh_enable);

/*
 * Same as local_bh_enable(), but the caller address used for tracing
 * is supplied explicitly in @ip.
 */
void local_bh_enable_ip(unsigned long ip)
{
	_local_bh_enable_ip(ip);
}
EXPORT_SYMBOL(local_bh_enable_ip);
177
178 /*
179  * We restart softirq processing MAX_SOFTIRQ_RESTART times,
180  * and we fall back to softirqd after that.
181  *
182  * This number has been established via experimentation.
183  * The two things to balance is latency against fairness -
184  * we want to handle softirqs as soon as possible, but they
185  * should not be able to lock up the box.
186  */
187 #define MAX_SOFTIRQ_RESTART 10
188
189 DEFINE_TRACE(softirq_entry);
190 DEFINE_TRACE(softirq_exit);
191
192 asmlinkage void __do_softirq(void)
193 {
194         struct softirq_action *h;
195         __u32 pending;
196         int max_restart = MAX_SOFTIRQ_RESTART;
197         int cpu;
198
199         pending = local_softirq_pending();
200         account_system_vtime(current);
201
202         __local_bh_disable((unsigned long)__builtin_return_address(0));
203         lockdep_softirq_enter();
204
205         cpu = smp_processor_id();
206 restart:
207         /* Reset the pending bitmask before enabling irqs */
208         set_softirq_pending(0);
209
210         local_irq_enable();
211
212         h = softirq_vec;
213
214         do {
215                 if (pending & 1) {
216                         int prev_count = preempt_count();
217
218                         trace_softirq_entry(h, softirq_vec);
219                         h->action(h);
220                         trace_softirq_exit(h, softirq_vec);
221                         if (unlikely(prev_count != preempt_count())) {
222                                 printk(KERN_ERR "huh, entered softirq %td %s %p"
223                                        "with preempt_count %08x,"
224                                        " exited with %08x?\n", h - softirq_vec,
225                                        softirq_to_name[h - softirq_vec],
226                                        h->action, prev_count, preempt_count());
227                                 preempt_count() = prev_count;
228                         }
229
230                         rcu_bh_qsctr_inc(cpu);
231                 }
232                 h++;
233                 pending >>= 1;
234         } while (pending);
235
236         local_irq_disable();
237
238         pending = local_softirq_pending();
239         if (pending && --max_restart)
240                 goto restart;
241
242         if (pending)
243                 wakeup_softirqd();
244
245         lockdep_softirq_exit();
246
247         account_system_vtime(current);
248         _local_bh_enable();
249 }
250
251 #ifndef __ARCH_HAS_DO_SOFTIRQ
252
253 asmlinkage void do_softirq(void)
254 {
255         __u32 pending;
256         unsigned long flags;
257
258         if (in_interrupt())
259                 return;
260
261         local_irq_save(flags);
262
263         pending = local_softirq_pending();
264
265         if (pending)
266                 __do_softirq();
267
268         local_irq_restore(flags);
269 }
270
271 #endif
272
/*
 * Enter an interrupt context.
 *
 * When the interrupt arrives on an idle cpu that is not already in
 * interrupt context, tick_check_idle() is called as well, after
 * __irq_enter().
 */
void irq_enter(void)
{
	int cpu = smp_processor_id();
	int woke_idle_cpu;

	rcu_irq_enter();

	/* Must be sampled before __irq_enter() changes the context */
	woke_idle_cpu = idle_cpu(cpu) && !in_interrupt();

	__irq_enter();
	if (woke_idle_cpu)
		tick_check_idle(cpu);
}
287
288 #ifdef __ARCH_IRQ_EXIT_IRQS_DISABLED
289 # define invoke_softirq()       __do_softirq()
290 #else
291 # define invoke_softirq()       do_softirq()
292 #endif
293
294 /*
295  * Exit an interrupt context. Process softirqs if needed and possible:
296  */
297 void irq_exit(void)
298 {
299         account_system_vtime(current);
300         trace_hardirq_exit();
301         sub_preempt_count(IRQ_EXIT_OFFSET);
302         if (!in_interrupt() && local_softirq_pending())
303                 invoke_softirq();
304
305 #ifdef CONFIG_NO_HZ
306         /* Make sure that timer wheel updates are propagated */
307         rcu_irq_exit();
308         if (idle_cpu(smp_processor_id()) && !in_interrupt() && !need_resched())
309                 tick_nohz_stop_sched_tick(0);
310 #endif
311         preempt_enable_no_resched();
312 }
313
/*
 * Mark softirq @nr as pending on this cpu.
 *
 * This function must run with irqs disabled!
 */
inline void raise_softirq_irqoff(unsigned int nr)
{
	__raise_softirq_irqoff(nr);

	/*
	 * If we're in an interrupt or softirq, we're done
	 * (this also catches softirq-disabled code). The softirq
	 * will actually run once we return from the irq or softirq.
	 */
	if (in_interrupt())
		return;

	/*
	 * Otherwise wake up ksoftirqd to make sure the softirq
	 * gets scheduled soon.
	 */
	wakeup_softirqd();
}
333
/*
 * Mark softirq @nr as pending; usable with interrupts in either state,
 * since they are disabled here and the previous state is restored.
 */
void raise_softirq(unsigned int nr)
{
	unsigned long irqflags;

	local_irq_save(irqflags);
	raise_softirq_irqoff(nr);
	local_irq_restore(irqflags);
}
342
343 void open_softirq(int nr, void (*action)(struct softirq_action *))
344 {
345         softirq_vec[nr].action = action;
346 }
347
348 /* Tasklets */
349 struct tasklet_head
350 {
351         struct tasklet_struct *head;
352         struct tasklet_struct **tail;
353 };
354
355 static DEFINE_PER_CPU(struct tasklet_head, tasklet_vec);
356 static DEFINE_PER_CPU(struct tasklet_head, tasklet_hi_vec);
357
358 void __tasklet_schedule(struct tasklet_struct *t)
359 {
360         unsigned long flags;
361
362         local_irq_save(flags);
363         t->next = NULL;
364         *__get_cpu_var(tasklet_vec).tail = t;
365         __get_cpu_var(tasklet_vec).tail = &(t->next);
366         raise_softirq_irqoff(TASKLET_SOFTIRQ);
367         local_irq_restore(flags);
368 }
369
370 EXPORT_SYMBOL(__tasklet_schedule);
371
372 void __tasklet_hi_schedule(struct tasklet_struct *t)
373 {
374         unsigned long flags;
375
376         local_irq_save(flags);
377         t->next = NULL;
378         *__get_cpu_var(tasklet_hi_vec).tail = t;
379         __get_cpu_var(tasklet_hi_vec).tail = &(t->next);
380         raise_softirq_irqoff(HI_SOFTIRQ);
381         local_irq_restore(flags);
382 }
383
384 EXPORT_SYMBOL(__tasklet_hi_schedule);
385
386 static void tasklet_action(struct softirq_action *a)
387 {
388         struct tasklet_struct *list;
389
390         local_irq_disable();
391         list = __get_cpu_var(tasklet_vec).head;
392         __get_cpu_var(tasklet_vec).head = NULL;
393         __get_cpu_var(tasklet_vec).tail = &__get_cpu_var(tasklet_vec).head;
394         local_irq_enable();
395
396         while (list) {
397                 struct tasklet_struct *t = list;
398
399                 list = list->next;
400
401                 if (tasklet_trylock(t)) {
402                         if (!atomic_read(&t->count)) {
403                                 if (!test_and_clear_bit(TASKLET_STATE_SCHED, &t->state))
404                                         BUG();
405                                 t->func(t->data);
406                                 tasklet_unlock(t);
407                                 continue;
408                         }
409                         tasklet_unlock(t);
410                 }
411
412                 local_irq_disable();
413                 t->next = NULL;
414                 *__get_cpu_var(tasklet_vec).tail = t;
415                 __get_cpu_var(tasklet_vec).tail = &(t->next);
416                 __raise_softirq_irqoff(TASKLET_SOFTIRQ);
417                 local_irq_enable();
418         }
419 }
420
421 static void tasklet_hi_action(struct softirq_action *a)
422 {
423         struct tasklet_struct *list;
424
425         local_irq_disable();
426         list = __get_cpu_var(tasklet_hi_vec).head;
427         __get_cpu_var(tasklet_hi_vec).head = NULL;
428         __get_cpu_var(tasklet_hi_vec).tail = &__get_cpu_var(tasklet_hi_vec).head;
429         local_irq_enable();
430
431         while (list) {
432                 struct tasklet_struct *t = list;
433
434                 list = list->next;
435
436                 if (tasklet_trylock(t)) {
437                         if (!atomic_read(&t->count)) {
438                                 if (!test_and_clear_bit(TASKLET_STATE_SCHED, &t->state))
439                                         BUG();
440                                 t->func(t->data);
441                                 tasklet_unlock(t);
442                                 continue;
443                         }
444                         tasklet_unlock(t);
445                 }
446
447                 local_irq_disable();
448                 t->next = NULL;
449                 *__get_cpu_var(tasklet_hi_vec).tail = t;
450                 __get_cpu_var(tasklet_hi_vec).tail = &(t->next);
451                 __raise_softirq_irqoff(HI_SOFTIRQ);
452                 local_irq_enable();
453         }
454 }
455
456
457 void tasklet_init(struct tasklet_struct *t,
458                   void (*func)(unsigned long), unsigned long data)
459 {
460         t->next = NULL;
461         t->state = 0;
462         atomic_set(&t->count, 0);
463         t->func = func;
464         t->data = data;
465 }
466
467 EXPORT_SYMBOL(tasklet_init);
468
469 void tasklet_kill(struct tasklet_struct *t)
470 {
471         if (in_interrupt())
472                 printk("Attempt to kill tasklet from interrupt\n");
473
474         while (test_and_set_bit(TASKLET_STATE_SCHED, &t->state)) {
475                 do {
476                         yield();
477                 } while (test_bit(TASKLET_STATE_SCHED, &t->state));
478         }
479         tasklet_unlock_wait(t);
480         clear_bit(TASKLET_STATE_SCHED, &t->state);
481 }
482
483 EXPORT_SYMBOL(tasklet_kill);
484
485 DEFINE_PER_CPU(struct list_head [NR_SOFTIRQS], softirq_work_list);
486 EXPORT_PER_CPU_SYMBOL(softirq_work_list);
487
488 static void __local_trigger(struct call_single_data *cp, int softirq)
489 {
490         struct list_head *head = &__get_cpu_var(softirq_work_list[softirq]);
491
492         list_add_tail(&cp->list, head);
493
494         /* Trigger the softirq only if the list was previously empty.  */
495         if (head->next == &cp->list)
496                 raise_softirq_irqoff(softirq);
497 }
498
#ifdef CONFIG_USE_GENERIC_SMP_HELPERS
/*
 * Cross-cpu callback installed by __try_remote_softirq(): queue the
 * call data on the receiving cpu's work list for the softirq number
 * stored in ->priv.
 */
static void remote_softirq_receive(void *data)
{
	struct call_single_data *cp = data;
	int softirq = cp->priv;
	unsigned long irqflags;

	local_irq_save(irqflags);
	__local_trigger(cp, softirq);
	local_irq_restore(irqflags);
}

/*
 * Try to hand @cp to @cpu for @softirq.
 * Returns 0 when the request was sent, 1 when @cpu is not online.
 */
static int __try_remote_softirq(struct call_single_data *cp, int cpu, int softirq)
{
	if (!cpu_online(cpu))
		return 1;

	cp->func = remote_softirq_receive;
	cp->info = cp;
	cp->flags = 0;
	cp->priv = softirq;

	__smp_call_function_single(cpu, cp, 0);
	return 0;
}
#else /* CONFIG_USE_GENERIC_SMP_HELPERS */
/* Without the generic SMP helpers remote delivery always fails (1). */
static int __try_remote_softirq(struct call_single_data *cp, int cpu, int softirq)
{
	return 1;
}
#endif
532
/**
 * __send_remote_softirq - try to schedule softirq work on a remote cpu
 * @cp: private SMP call function data area
 * @cpu: the remote cpu
 * @this_cpu: the currently executing cpu
 * @softirq: the softirq for the work
 *
 * Attempt to schedule softirq work on a remote cpu.  If @cpu is the
 * current cpu, or the remote attempt fails, the work is queued on the
 * local cpu instead.
 *
 * Interrupts must be disabled.
 */
void __send_remote_softirq(struct call_single_data *cp, int cpu, int this_cpu, int softirq)
{
	/* Successfully handed to another cpu: nothing left to do here */
	if (cpu != this_cpu && !__try_remote_softirq(cp, cpu, softirq))
		return;

	__local_trigger(cp, softirq);
}
EXPORT_SYMBOL(__send_remote_softirq);
551
/**
 * send_remote_softirq - try to schedule softirq work on a remote cpu
 * @cp: private SMP call function data area
 * @cpu: the remote cpu
 * @softirq: the softirq for the work
 *
 * Like __send_remote_softirq except that interrupts are disabled and
 * the current cpu is determined on behalf of the caller.
 */
void send_remote_softirq(struct call_single_data *cp, int cpu, int softirq)
{
	unsigned long irqflags;

	local_irq_save(irqflags);
	__send_remote_softirq(cp, cpu, smp_processor_id(), softirq);
	local_irq_restore(irqflags);
}
EXPORT_SYMBOL(send_remote_softirq);
572
573 static int __cpuinit remote_softirq_cpu_notify(struct notifier_block *self,
574                                                unsigned long action, void *hcpu)
575 {
576         /*
577          * If a CPU goes away, splice its entries to the current CPU
578          * and trigger a run of the softirq
579          */
580         if (action == CPU_DEAD || action == CPU_DEAD_FROZEN) {
581                 int cpu = (unsigned long) hcpu;
582                 int i;
583
584                 local_irq_disable();
585                 for (i = 0; i < NR_SOFTIRQS; i++) {
586                         struct list_head *head = &per_cpu(softirq_work_list[i], cpu);
587                         struct list_head *local_head;
588
589                         if (list_empty(head))
590                                 continue;
591
592                         local_head = &__get_cpu_var(softirq_work_list[i]);
593                         list_splice_init(head, local_head);
594                         raise_softirq_irqoff(i);
595                 }
596                 local_irq_enable();
597         }
598
599         return NOTIFY_OK;
600 }
601
602 static struct notifier_block __cpuinitdata remote_softirq_cpu_notifier = {
603         .notifier_call  = remote_softirq_cpu_notify,
604 };
605
606 void __init softirq_init(void)
607 {
608         int cpu;
609
610         for_each_possible_cpu(cpu) {
611                 int i;
612
613                 per_cpu(tasklet_vec, cpu).tail =
614                         &per_cpu(tasklet_vec, cpu).head;
615                 per_cpu(tasklet_hi_vec, cpu).tail =
616                         &per_cpu(tasklet_hi_vec, cpu).head;
617                 for (i = 0; i < NR_SOFTIRQS; i++)
618                         INIT_LIST_HEAD(&per_cpu(softirq_work_list[i], cpu));
619         }
620
621         register_hotcpu_notifier(&remote_softirq_cpu_notifier);
622
623         open_softirq(TASKLET_SOFTIRQ, tasklet_action);
624         open_softirq(HI_SOFTIRQ, tasklet_hi_action);
625 }
626
627 static int ksoftirqd(void * __bind_cpu)
628 {
629         set_current_state(TASK_INTERRUPTIBLE);
630
631         while (!kthread_should_stop()) {
632                 preempt_disable();
633                 if (!local_softirq_pending()) {
634                         preempt_enable_no_resched();
635                         schedule();
636                         preempt_disable();
637                 }
638
639                 __set_current_state(TASK_RUNNING);
640
641                 while (local_softirq_pending()) {
642                         /* Preempt disable stops cpu going offline.
643                            If already offline, we'll be on wrong CPU:
644                            don't process */
645                         if (cpu_is_offline((long)__bind_cpu))
646                                 goto wait_to_die;
647                         do_softirq();
648                         preempt_enable_no_resched();
649                         cond_resched();
650                         preempt_disable();
651                         rcu_qsctr_inc((long)__bind_cpu);
652                 }
653                 preempt_enable();
654                 set_current_state(TASK_INTERRUPTIBLE);
655         }
656         __set_current_state(TASK_RUNNING);
657         return 0;
658
659 wait_to_die:
660         preempt_enable();
661         /* Wait for kthread_stop */
662         set_current_state(TASK_INTERRUPTIBLE);
663         while (!kthread_should_stop()) {
664                 schedule();
665                 set_current_state(TASK_INTERRUPTIBLE);
666         }
667         __set_current_state(TASK_RUNNING);
668         return 0;
669 }
670
671 #ifdef CONFIG_HOTPLUG_CPU
672 /*
673  * tasklet_kill_immediate is called to remove a tasklet which can already be
674  * scheduled for execution on @cpu.
675  *
676  * Unlike tasklet_kill, this function removes the tasklet
677  * _immediately_, even if the tasklet is in TASKLET_STATE_SCHED state.
678  *
679  * When this function is called, @cpu must be in the CPU_DEAD state.
680  */
681 void tasklet_kill_immediate(struct tasklet_struct *t, unsigned int cpu)
682 {
683         struct tasklet_struct **i;
684
685         BUG_ON(cpu_online(cpu));
686         BUG_ON(test_bit(TASKLET_STATE_RUN, &t->state));
687
688         if (!test_bit(TASKLET_STATE_SCHED, &t->state))
689                 return;
690
691         /* CPU is dead, so no lock needed. */
692         for (i = &per_cpu(tasklet_vec, cpu).head; *i; i = &(*i)->next) {
693                 if (*i == t) {
694                         *i = t->next;
695                         /* If this was the tail element, move the tail ptr */
696                         if (*i == NULL)
697                                 per_cpu(tasklet_vec, cpu).tail = i;
698                         return;
699                 }
700         }
701         BUG();
702 }
703
704 static void takeover_tasklets(unsigned int cpu)
705 {
706         /* CPU is dead, so no lock needed. */
707         local_irq_disable();
708
709         /* Find end, append list for that CPU. */
710         if (&per_cpu(tasklet_vec, cpu).head != per_cpu(tasklet_vec, cpu).tail) {
711                 *(__get_cpu_var(tasklet_vec).tail) = per_cpu(tasklet_vec, cpu).head;
712                 __get_cpu_var(tasklet_vec).tail = per_cpu(tasklet_vec, cpu).tail;
713                 per_cpu(tasklet_vec, cpu).head = NULL;
714                 per_cpu(tasklet_vec, cpu).tail = &per_cpu(tasklet_vec, cpu).head;
715         }
716         raise_softirq_irqoff(TASKLET_SOFTIRQ);
717
718         if (&per_cpu(tasklet_hi_vec, cpu).head != per_cpu(tasklet_hi_vec, cpu).tail) {
719                 *__get_cpu_var(tasklet_hi_vec).tail = per_cpu(tasklet_hi_vec, cpu).head;
720                 __get_cpu_var(tasklet_hi_vec).tail = per_cpu(tasklet_hi_vec, cpu).tail;
721                 per_cpu(tasklet_hi_vec, cpu).head = NULL;
722                 per_cpu(tasklet_hi_vec, cpu).tail = &per_cpu(tasklet_hi_vec, cpu).head;
723         }
724         raise_softirq_irqoff(HI_SOFTIRQ);
725
726         local_irq_enable();
727 }
728 #endif /* CONFIG_HOTPLUG_CPU */
729
730 static int __cpuinit cpu_callback(struct notifier_block *nfb,
731                                   unsigned long action,
732                                   void *hcpu)
733 {
734         int hotcpu = (unsigned long)hcpu;
735         struct task_struct *p;
736
737         switch (action) {
738         case CPU_UP_PREPARE:
739         case CPU_UP_PREPARE_FROZEN:
740                 p = kthread_create(ksoftirqd, hcpu, "ksoftirqd/%d", hotcpu);
741                 if (IS_ERR(p)) {
742                         printk("ksoftirqd for %i failed\n", hotcpu);
743                         return NOTIFY_BAD;
744                 }
745                 kthread_bind(p, hotcpu);
746                 per_cpu(ksoftirqd, hotcpu) = p;
747                 break;
748         case CPU_ONLINE:
749         case CPU_ONLINE_FROZEN:
750                 wake_up_process(per_cpu(ksoftirqd, hotcpu));
751                 break;
752 #ifdef CONFIG_HOTPLUG_CPU
753         case CPU_UP_CANCELED:
754         case CPU_UP_CANCELED_FROZEN:
755                 if (!per_cpu(ksoftirqd, hotcpu))
756                         break;
757                 /* Unbind so it can run.  Fall thru. */
758                 kthread_bind(per_cpu(ksoftirqd, hotcpu),
759                              cpumask_any(cpu_online_mask));
760         case CPU_DEAD:
761         case CPU_DEAD_FROZEN: {
762                 struct sched_param param = { .sched_priority = MAX_RT_PRIO-1 };
763
764                 p = per_cpu(ksoftirqd, hotcpu);
765                 per_cpu(ksoftirqd, hotcpu) = NULL;
766                 sched_setscheduler_nocheck(p, SCHED_FIFO, &param);
767                 kthread_stop(p);
768                 takeover_tasklets(hotcpu);
769                 break;
770         }
771 #endif /* CONFIG_HOTPLUG_CPU */
772         }
773         return NOTIFY_OK;
774 }
775
776 static struct notifier_block __cpuinitdata cpu_nfb = {
777         .notifier_call = cpu_callback
778 };
779
780 static __init int spawn_ksoftirqd(void)
781 {
782         void *cpu = (void *)(long)smp_processor_id();
783         int err = cpu_callback(&cpu_nfb, CPU_UP_PREPARE, cpu);
784
785         BUG_ON(err == NOTIFY_BAD);
786         cpu_callback(&cpu_nfb, CPU_ONLINE, cpu);
787         register_cpu_notifier(&cpu_nfb);
788         return 0;
789 }
790 early_initcall(spawn_ksoftirqd);
791
792 #ifdef CONFIG_SMP
/*
 * Call a function on all processors.
 *
 * @func is first dispatched through smp_call_function() and then run
 * on the local cpu with interrupts disabled.  Interrupts are enabled
 * unconditionally afterwards.  Returns smp_call_function()'s result.
 */
int on_each_cpu(void (*func) (void *info), void *info, int wait)
{
	int status;

	preempt_disable();

	status = smp_call_function(func, info, wait);

	/* Local invocation, with irqs off */
	local_irq_disable();
	func(info);
	local_irq_enable();

	preempt_enable();
	return status;
}
EXPORT_SYMBOL(on_each_cpu);
809 #endif
810
811 /*
812  * [ These __weak aliases are kept in a separate compilation unit, so that
813  *   GCC does not inline them incorrectly. ]
814  */
815
816 int __init __weak early_irq_init(void)
817 {
818         return 0;
819 }
820
821 int __init __weak arch_probe_nr_irqs(void)
822 {
823         return 0;
824 }
825
826 int __init __weak arch_early_irq_init(void)
827 {
828         return 0;
829 }
830
831 int __weak arch_init_chip_data(struct irq_desc *desc, int node)
832 {
833         return 0;
834 }