/*
 *	linux/kernel/softirq.c
 *
 *	Copyright (C) 1992 Linus Torvalds
 *
 * Rewritten. Old one was good in 2.2, but in 2.3 it was immoral. --ANK (990903)
 */
#include <linux/module.h>
#include <linux/kernel_stat.h>
#include <linux/interrupt.h>
#include <linux/init.h>
#include <linux/mm.h>
#include <linux/notifier.h>
#include <linux/percpu.h>
#include <linux/cpu.h>
#include <linux/kthread.h>
#include <linux/rcupdate.h>
#include <linux/smp.h>

#include <asm/irq.h>
/*
   - No shared variables, all the data are CPU local.
   - If a softirq needs serialization, let it serialize itself
     by its own spinlocks.
   - Even if softirq is serialized, only local cpu is marked for
     execution. Hence, we get something sort of weak cpu binding.
     Though it is still not clear whether this results in better
     locality or not.

   Examples:
   - NET RX softirq. It is multithreaded and does not require
     any global serialization.
   - NET TX softirq. It kicks software netdevice queues, hence
     it is logically serialized per device, but this serialization
     is invisible to common code.
   - Tasklets: serialized wrt itself.
 */
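/*
 * Illustrative sketch (not part of this file): the "all data are CPU
 * local" rule above usually means a softirq handler keeps its state in
 * per-CPU variables and only touches the local CPU's copy, so no global
 * lock is needed.  The names below (example_work_count,
 * example_softirq_action) are hypothetical, not kernel APIs:
 *
 *	static DEFINE_PER_CPU(unsigned long, example_work_count);
 *
 *	static void example_softirq_action(struct softirq_action *h)
 *	{
 *		// Runs with the softirq count raised on this CPU only,
 *		// so plain per-CPU accesses are safe here.
 *		__get_cpu_var(example_work_count)++;
 *	}
 *
 * If two CPUs must ever share state, the handler serializes itself with
 * its own spinlock, exactly as the comment above says.
 */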
#ifndef __ARCH_IRQ_STAT
irq_cpustat_t irq_stat[NR_CPUS] ____cacheline_aligned;
EXPORT_SYMBOL(irq_stat);
#endif

static struct softirq_action softirq_vec[32] __cacheline_aligned_in_smp;

static DEFINE_PER_CPU(struct task_struct *, ksoftirqd);
/*
 * we cannot loop indefinitely here to avoid userspace starvation,
 * but we also don't want to introduce a worst case 1/HZ latency
 * to the pending events, so let the scheduler balance
 * the softirq load for us.
 */
static inline void wakeup_softirqd(void)
{
	/* Interrupts are disabled: no need to stop preemption */
	struct task_struct *tsk = __get_cpu_var(ksoftirqd);

	if (tsk && tsk->state != TASK_RUNNING)
		wake_up_process(tsk);
}
static inline int softirqd_is_waken(void)
{
	struct task_struct *tsk = __get_cpu_var(ksoftirqd);

	return tsk && tsk->state == TASK_RUNNING;
}
/*
 * This one is for softirq.c-internal use,
 * where hardirqs are disabled legitimately:
 */
#ifdef CONFIG_TRACE_IRQFLAGS
static void __local_bh_disable(unsigned long ip)
{
	unsigned long flags;

	WARN_ON_ONCE(in_irq());

	raw_local_irq_save(flags);
	add_preempt_count(SOFTIRQ_OFFSET);
	/*
	 * Were softirqs turned off above:
	 */
	if (softirq_count() == SOFTIRQ_OFFSET)
		trace_softirqs_off(ip);
	raw_local_irq_restore(flags);
}
#else /* !CONFIG_TRACE_IRQFLAGS */
static inline void __local_bh_disable(unsigned long ip)
{
	add_preempt_count(SOFTIRQ_OFFSET);
}
#endif /* CONFIG_TRACE_IRQFLAGS */
void local_bh_disable(void)
{
	__local_bh_disable((unsigned long)__builtin_return_address(0));
}

EXPORT_SYMBOL(local_bh_disable);
void __local_bh_enable(void)
{
	WARN_ON_ONCE(in_irq());

	/*
	 * softirqs should never be enabled by __local_bh_enable(),
	 * it always nests inside local_bh_enable() sections:
	 */
	WARN_ON_ONCE(softirq_count() == SOFTIRQ_OFFSET);

	sub_preempt_count(SOFTIRQ_OFFSET);
}
EXPORT_SYMBOL_GPL(__local_bh_enable);
/*
 * Special-case - softirqs can safely be enabled in
 * cond_resched_softirq(), or by __do_softirq(),
 * without processing still-pending softirqs:
 */
void _local_bh_enable(void)
{
	WARN_ON_ONCE(in_irq());
	WARN_ON_ONCE(!irqs_disabled());

	if (softirq_count() == SOFTIRQ_OFFSET)
		trace_softirqs_on((unsigned long)__builtin_return_address(0));
	sub_preempt_count(SOFTIRQ_OFFSET);
}

EXPORT_SYMBOL(_local_bh_enable);
void local_bh_enable(void)
{
#ifdef CONFIG_TRACE_IRQFLAGS
	unsigned long flags;

	WARN_ON_ONCE(in_irq());
#endif
	WARN_ON_ONCE(irqs_disabled());

#ifdef CONFIG_TRACE_IRQFLAGS
	local_irq_save(flags);
#endif
	/*
	 * Are softirqs going to be turned on now:
	 */
	if (softirq_count() == SOFTIRQ_OFFSET)
		trace_softirqs_on((unsigned long)__builtin_return_address(0));
	/*
	 * Keep preemption disabled until we are done with
	 * softirq processing:
	 */
	sub_preempt_count(SOFTIRQ_OFFSET - 1);

	if (unlikely(!in_interrupt() && local_softirq_pending()))
		do_softirq();

	dec_preempt_count();
#ifdef CONFIG_TRACE_IRQFLAGS
	local_irq_restore(flags);
#endif
	preempt_check_resched();
}
EXPORT_SYMBOL(local_bh_enable);
void local_bh_enable_ip(unsigned long ip)
{
#ifdef CONFIG_TRACE_IRQFLAGS
	unsigned long flags;

	WARN_ON_ONCE(in_irq());

	local_irq_save(flags);
#endif
	/*
	 * Are softirqs going to be turned on now:
	 */
	if (softirq_count() == SOFTIRQ_OFFSET)
		trace_softirqs_on(ip);
	/*
	 * Keep preemption disabled until we are done with
	 * softirq processing:
	 */
	sub_preempt_count(SOFTIRQ_OFFSET - 1);

	if (unlikely(!in_interrupt() && local_softirq_pending()))
		do_softirq();

	dec_preempt_count();
#ifdef CONFIG_TRACE_IRQFLAGS
	local_irq_restore(flags);
#endif
	preempt_check_resched();
}
EXPORT_SYMBOL(local_bh_enable_ip);
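/*
 * Illustrative sketch (not part of this file): process-context code that
 * shares data with softirq/tasklet context typically brackets the access
 * with the local_bh_disable()/local_bh_enable() pair defined above, so a
 * softirq cannot run on this CPU in between.  example_list and
 * example_lock are hypothetical names:
 *
 *	static LIST_HEAD(example_list);
 *	static DEFINE_SPINLOCK(example_lock);
 *
 *	static void example_add(struct list_head *new)
 *	{
 *		local_bh_disable();		// keep softirqs off this CPU
 *		spin_lock(&example_lock);	// serialize against other CPUs
 *		list_add_tail(new, &example_list);
 *		spin_unlock(&example_lock);
 *		local_bh_enable();		// may run pending softirqs now
 *	}
 *
 * This is essentially what spin_lock_bh()/spin_unlock_bh() on
 * example_lock would do.
 */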
/*
 * We restart softirq processing MAX_SOFTIRQ_RESTART times,
 * and we fall back to softirqd after that.
 *
 * This number has been established via experimentation.
 * The two things to balance are latency and fairness -
 * we want to handle softirqs as soon as possible, but they
 * should not be able to lock up the box.
 */
#define MAX_SOFTIRQ_RESTART 10
static asmlinkage void __do_softirq2(void)
{
	struct softirq_action *h;
	__u32 pending;
	int max_restart = MAX_SOFTIRQ_RESTART;
	int cpu;

	pending = local_softirq_pending();
	account_system_vtime(current);

	__local_bh_disable((unsigned long)__builtin_return_address(0));
	trace_softirq_enter();

	cpu = smp_processor_id();
restart:
	/* Reset the pending bitmask before enabling irqs */
	set_softirq_pending(0);

	local_irq_enable();

	h = softirq_vec;

	do {
		if (pending & 1) {
			h->action(h);
			rcu_bh_qsctr_inc(cpu);
		}
		h++;
		pending >>= 1;
	} while (pending);

	local_irq_disable();

	pending = local_softirq_pending();
	if (pending && --max_restart)
		goto restart;

	if (pending)
		wakeup_softirqd();

	trace_softirq_exit();

	account_system_vtime(current);
	_local_bh_enable();
}
asmlinkage void __do_softirq(void)
{
	if (!softirqd_is_waken())
		__do_softirq2();
}
#ifndef __ARCH_HAS_DO_SOFTIRQ

asmlinkage void do_softirq(void)
{
	__u32 pending;
	unsigned long flags;

	if (in_interrupt())
		return;

	local_irq_save(flags);

	pending = local_softirq_pending();

	if (pending)
		__do_softirq();

	local_irq_restore(flags);
}

EXPORT_SYMBOL(do_softirq);

#endif
#ifdef __ARCH_IRQ_EXIT_IRQS_DISABLED
# define invoke_softirq()	__do_softirq()
#else
# define invoke_softirq()	do_softirq()
#endif
/*
 * Exit an interrupt context. Process softirqs if needed and possible:
 */
void irq_exit(void)
{
	account_system_vtime(current);
	trace_hardirq_exit();
	sub_preempt_count(IRQ_EXIT_OFFSET);
	if (!in_interrupt() && local_softirq_pending())
		invoke_softirq();
	preempt_enable_no_resched();
}
/*
 * This function must run with irqs disabled!
 */
inline fastcall void raise_softirq_irqoff(unsigned int nr)
{
	__raise_softirq_irqoff(nr);

	/*
	 * If we're in an interrupt or softirq, we're done
	 * (this also catches softirq-disabled code). We will
	 * actually run the softirq once we return from
	 * the irq or softirq.
	 *
	 * Otherwise we wake up ksoftirqd to make sure we
	 * schedule the softirq soon.
	 */
	if (!in_interrupt())
		wakeup_softirqd();
}

EXPORT_SYMBOL(raise_softirq_irqoff);
void fastcall raise_softirq(unsigned int nr)
{
	unsigned long flags;

	local_irq_save(flags);
	raise_softirq_irqoff(nr);
	local_irq_restore(flags);
}
void open_softirq(int nr, void (*action)(struct softirq_action *), void *data)
{
	softirq_vec[nr].data = data;
	softirq_vec[nr].action = action;
}
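/*
 * Illustrative sketch (not part of this file): a subsystem registers its
 * handler once at init time with open_softirq() and later marks work
 * pending with raise_softirq().  The index must be one of the fixed
 * softirq numbers enumerated in <linux/interrupt.h>; EXAMPLE_SOFTIRQ and
 * example_action are hypothetical stand-ins:
 *
 *	static void example_action(struct softirq_action *h)
 *	{
 *		// drain this CPU's queue of pending work here
 *	}
 *
 *	static int __init example_init(void)
 *	{
 *		open_softirq(EXAMPLE_SOFTIRQ, example_action, NULL);
 *		return 0;
 *	}
 *
 *	// later, typically from an interrupt handler:
 *	//	raise_softirq(EXAMPLE_SOFTIRQ);
 */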
/* Tasklets */
struct tasklet_head
{
	struct tasklet_struct *list;
};

/* Some compilers disobey section attribute on statics when not
   initialized -- RR */
static DEFINE_PER_CPU(struct tasklet_head, tasklet_vec) = { NULL };
static DEFINE_PER_CPU(struct tasklet_head, tasklet_hi_vec) = { NULL };
void fastcall __tasklet_schedule(struct tasklet_struct *t)
{
	unsigned long flags;

	local_irq_save(flags);
	t->next = __get_cpu_var(tasklet_vec).list;
	__get_cpu_var(tasklet_vec).list = t;
	raise_softirq_irqoff(TASKLET_SOFTIRQ);
	local_irq_restore(flags);
}

EXPORT_SYMBOL(__tasklet_schedule);
void fastcall __tasklet_hi_schedule(struct tasklet_struct *t)
{
	unsigned long flags;

	local_irq_save(flags);
	t->next = __get_cpu_var(tasklet_hi_vec).list;
	__get_cpu_var(tasklet_hi_vec).list = t;
	raise_softirq_irqoff(HI_SOFTIRQ);
	local_irq_restore(flags);
}

EXPORT_SYMBOL(__tasklet_hi_schedule);
static void tasklet_action(struct softirq_action *a)
{
	struct tasklet_struct *list;

	local_irq_disable();
	list = __get_cpu_var(tasklet_vec).list;
	__get_cpu_var(tasklet_vec).list = NULL;
	local_irq_enable();

	while (list) {
		struct tasklet_struct *t = list;

		list = list->next;

		if (tasklet_trylock(t)) {
			if (!atomic_read(&t->count)) {
				if (!test_and_clear_bit(TASKLET_STATE_SCHED, &t->state))
					BUG();
				t->func(t->data);
				tasklet_unlock(t);
				continue;
			}
			tasklet_unlock(t);
		}

		local_irq_disable();
		t->next = __get_cpu_var(tasklet_vec).list;
		__get_cpu_var(tasklet_vec).list = t;
		__raise_softirq_irqoff(TASKLET_SOFTIRQ);
		local_irq_enable();
	}
}
static void tasklet_hi_action(struct softirq_action *a)
{
	struct tasklet_struct *list;

	local_irq_disable();
	list = __get_cpu_var(tasklet_hi_vec).list;
	__get_cpu_var(tasklet_hi_vec).list = NULL;
	local_irq_enable();

	while (list) {
		struct tasklet_struct *t = list;

		list = list->next;

		if (tasklet_trylock(t)) {
			if (!atomic_read(&t->count)) {
				if (!test_and_clear_bit(TASKLET_STATE_SCHED, &t->state))
					BUG();
				t->func(t->data);
				tasklet_unlock(t);
				continue;
			}
			tasklet_unlock(t);
		}

		local_irq_disable();
		t->next = __get_cpu_var(tasklet_hi_vec).list;
		__get_cpu_var(tasklet_hi_vec).list = t;
		__raise_softirq_irqoff(HI_SOFTIRQ);
		local_irq_enable();
	}
}
void tasklet_init(struct tasklet_struct *t,
		  void (*func)(unsigned long), unsigned long data)
{
	t->next = NULL;
	t->state = 0;
	atomic_set(&t->count, 0);
	t->func = func;
	t->data = data;
}

EXPORT_SYMBOL(tasklet_init);
void tasklet_kill(struct tasklet_struct *t)
{
	if (in_interrupt())
		printk("Attempt to kill tasklet from interrupt\n");

	while (test_and_set_bit(TASKLET_STATE_SCHED, &t->state)) {
		do
			yield();
		while (test_bit(TASKLET_STATE_SCHED, &t->state));
	}
	tasklet_unlock_wait(t);
	clear_bit(TASKLET_STATE_SCHED, &t->state);
}

EXPORT_SYMBOL(tasklet_kill);
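/*
 * Illustrative sketch (not part of this file): a typical driver life
 * cycle for the tasklet API implemented above.  The interrupt handler
 * only schedules the tasklet; the deferred work runs later in softirq
 * context; tasklet_kill() is called on teardown from process context so
 * no run is left in flight.  example_dev and example_work are
 * hypothetical names:
 *
 *	struct example_dev {
 *		struct tasklet_struct work;
 *	};
 *
 *	static void example_work(unsigned long data)
 *	{
 *		struct example_dev *dev = (struct example_dev *)data;
 *		// bottom-half processing for dev goes here
 *	}
 *
 *	// at probe time:
 *	//	tasklet_init(&dev->work, example_work, (unsigned long)dev);
 *	// from the interrupt handler:
 *	//	tasklet_schedule(&dev->work);
 *	// at remove time:
 *	//	tasklet_kill(&dev->work);
 */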
void __init softirq_init(void)
{
	open_softirq(TASKLET_SOFTIRQ, tasklet_action, NULL);
	open_softirq(HI_SOFTIRQ, tasklet_hi_action, NULL);
}
static int ksoftirqd(void * __bind_cpu)
{
	unsigned long flags;

	set_user_nice(current, 19);
	current->flags |= PF_NOFREEZE;

	set_current_state(TASK_INTERRUPTIBLE);

	while (!kthread_should_stop()) {
		preempt_disable();
		if (!local_softirq_pending()) {
			preempt_enable_no_resched();
			schedule();
			preempt_disable();
		}

		__set_current_state(TASK_RUNNING);

		while (local_softirq_pending()) {
			/* Preempt disable stops cpu going offline.
			   If already offline, we'll be on wrong CPU:
			   don't process */
			if (cpu_is_offline((long)__bind_cpu))
				goto wait_to_die;

			local_irq_save(flags);
			__do_softirq2();
			local_irq_restore(flags);

			preempt_enable_no_resched();
			cond_resched();
			preempt_disable();
		}
		preempt_enable();
		set_current_state(TASK_INTERRUPTIBLE);
	}
	__set_current_state(TASK_RUNNING);
	return 0;

wait_to_die:
	preempt_enable();
	/* Wait for kthread_stop */
	set_current_state(TASK_INTERRUPTIBLE);
	while (!kthread_should_stop()) {
		schedule();
		set_current_state(TASK_INTERRUPTIBLE);
	}
	__set_current_state(TASK_RUNNING);
	return 0;
}
#ifdef CONFIG_HOTPLUG_CPU
/*
 * tasklet_kill_immediate is called to remove a tasklet which can already be
 * scheduled for execution on @cpu.
 *
 * Unlike tasklet_kill, this function removes the tasklet
 * _immediately_, even if the tasklet is in TASKLET_STATE_SCHED state.
 *
 * When this function is called, @cpu must be in the CPU_DEAD state.
 */
void tasklet_kill_immediate(struct tasklet_struct *t, unsigned int cpu)
{
	struct tasklet_struct **i;

	BUG_ON(cpu_online(cpu));
	BUG_ON(test_bit(TASKLET_STATE_RUN, &t->state));

	if (!test_bit(TASKLET_STATE_SCHED, &t->state))
		return;

	/* CPU is dead, so no lock needed. */
	for (i = &per_cpu(tasklet_vec, cpu).list; *i; i = &(*i)->next) {
		if (*i == t) {
			*i = t->next;
			return;
		}
	}
	BUG();
}
static void takeover_tasklets(unsigned int cpu)
{
	struct tasklet_struct **i;

	/* CPU is dead, so no lock needed. */
	local_irq_disable();

	/* Find end, append list for that CPU. */
	for (i = &__get_cpu_var(tasklet_vec).list; *i; i = &(*i)->next);
	*i = per_cpu(tasklet_vec, cpu).list;
	per_cpu(tasklet_vec, cpu).list = NULL;
	raise_softirq_irqoff(TASKLET_SOFTIRQ);

	for (i = &__get_cpu_var(tasklet_hi_vec).list; *i; i = &(*i)->next);
	*i = per_cpu(tasklet_hi_vec, cpu).list;
	per_cpu(tasklet_hi_vec, cpu).list = NULL;
	raise_softirq_irqoff(HI_SOFTIRQ);

	local_irq_enable();
}
#endif /* CONFIG_HOTPLUG_CPU */
static int __cpuinit cpu_callback(struct notifier_block *nfb,
				  unsigned long action,
				  void *hcpu)
{
	int hotcpu = (unsigned long)hcpu;
	struct task_struct *p;

	switch (action) {
	case CPU_UP_PREPARE:
		BUG_ON(per_cpu(tasklet_vec, hotcpu).list);
		BUG_ON(per_cpu(tasklet_hi_vec, hotcpu).list);
		p = kthread_create(ksoftirqd, hcpu, "ksoftirqd/%d", hotcpu);
		if (IS_ERR(p)) {
			printk("ksoftirqd for %i failed\n", hotcpu);
			return NOTIFY_BAD;
		}
		kthread_bind(p, hotcpu);
		per_cpu(ksoftirqd, hotcpu) = p;
		break;
	case CPU_ONLINE:
		wake_up_process(per_cpu(ksoftirqd, hotcpu));
		break;
#ifdef CONFIG_HOTPLUG_CPU
	case CPU_UP_CANCELED:
		if (!per_cpu(ksoftirqd, hotcpu))
			break;
		/* Unbind so it can run.  Fall thru. */
		kthread_bind(per_cpu(ksoftirqd, hotcpu),
			     any_online_cpu(cpu_online_map));
	case CPU_DEAD:
		p = per_cpu(ksoftirqd, hotcpu);
		per_cpu(ksoftirqd, hotcpu) = NULL;
		kthread_stop(p);
		takeover_tasklets(hotcpu);
		break;
#endif /* CONFIG_HOTPLUG_CPU */
	}
	return NOTIFY_OK;
}
static struct notifier_block __cpuinitdata cpu_nfb = {
	.notifier_call = cpu_callback
};

__init int spawn_ksoftirqd(void)
{
	void *cpu = (void *)(long)smp_processor_id();
	int err = cpu_callback(&cpu_nfb, CPU_UP_PREPARE, cpu);

	BUG_ON(err == NOTIFY_BAD);
	cpu_callback(&cpu_nfb, CPU_ONLINE, cpu);
	register_cpu_notifier(&cpu_nfb);
	return 0;
}
#ifdef CONFIG_SMP
/*
 * Call a function on all processors
 */
int on_each_cpu(void (*func) (void *info), void *info, int retry, int wait)
{
	int ret = 0;

	preempt_disable();
	ret = smp_call_function(func, info, retry, wait);
	local_irq_disable();
	func(info);
	local_irq_enable();
	preempt_enable();
	return ret;
}
EXPORT_SYMBOL(on_each_cpu);
#endif
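/*
 * Illustrative sketch (not part of this file): on_each_cpu() above runs
 * the callback on every online CPU (remotely via smp_call_function(),
 * directly on the local CPU with interrupts off) and, with wait != 0,
 * returns only after all callbacks have finished.  example_stat and
 * example_reset_stats are hypothetical names:
 *
 *	static DEFINE_PER_CPU(unsigned long, example_stat);
 *
 *	static void example_reset_stats(void *info)
 *	{
 *		// clear this CPU's copy of the per-CPU counter
 *		__get_cpu_var(example_stat) = 0;
 *	}
 *
 *	// from process context:
 *	//	on_each_cpu(example_reset_stats, NULL, 0, 1);
 */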