/*
 * Functions related to interrupt-poll handling in the block layer. This
 * is similar to NAPI for network devices.
 */
#include <linux/kernel.h>
#include <linux/module.h>
#include <linux/init.h>
#include <linux/blkdev.h>
#include <linux/interrupt.h>
#include <linux/cpu.h>
#include <linux/blk-iopoll.h>
#include <linux/delay.h>
17 static unsigned int blk_iopoll_budget __read_mostly
= 256;
19 static DEFINE_PER_CPU(struct list_head
, blk_cpu_iopoll
);
22 * blk_iopoll_sched - Schedule a run of the iopoll handler
23 * @iop: The parent iopoll structure
26 * Add this blk_iopoll structure to the pending poll list and trigger the
27 * raise of the blk iopoll softirq. The driver must already have gotten a
28 * successful return from blk_iopoll_sched_prep() before calling this.
30 void blk_iopoll_sched(struct blk_iopoll
*iop
)
34 local_irq_save(flags
);
35 list_add_tail(&iop
->list
, this_cpu_ptr(&blk_cpu_iopoll
));
36 __raise_softirq_irqoff(BLOCK_IOPOLL_SOFTIRQ
);
37 local_irq_restore(flags
);
39 EXPORT_SYMBOL(blk_iopoll_sched
);
42 * __blk_iopoll_complete - Mark this @iop as un-polled again
43 * @iop: The parent iopoll structure
46 * See blk_iopoll_complete(). This function must be called with interrupts
49 void __blk_iopoll_complete(struct blk_iopoll
*iop
)
52 smp_mb__before_atomic();
53 clear_bit_unlock(IOPOLL_F_SCHED
, &iop
->state
);
55 EXPORT_SYMBOL(__blk_iopoll_complete
);
/**
 * blk_iopoll_complete - Mark this @iop as un-polled again
 * @iop:      The parent iopoll structure
 *
 * Description:
 *     If a driver consumes less than the assigned budget in its run of the
 *     iopoll handler, it'll end the polled mode by calling this function. The
 *     iopoll handler will not be invoked again before blk_iopoll_sched_prep()
 *     is called.
 **/
void blk_iopoll_complete(struct blk_iopoll *iop)
{
	unsigned long flags;

	/* __blk_iopoll_complete() requires interrupts to be disabled. */
	local_irq_save(flags);
	__blk_iopoll_complete(iop);
	local_irq_restore(flags);
}
EXPORT_SYMBOL(blk_iopoll_complete);
77 static void blk_iopoll_softirq(struct softirq_action
*h
)
79 struct list_head
*list
= this_cpu_ptr(&blk_cpu_iopoll
);
80 int rearm
= 0, budget
= blk_iopoll_budget
;
81 unsigned long start_time
= jiffies
;
85 while (!list_empty(list
)) {
86 struct blk_iopoll
*iop
;
90 * If softirq window is exhausted then punt.
92 if (budget
<= 0 || time_after(jiffies
, start_time
)) {
99 /* Even though interrupts have been re-enabled, this
100 * access is safe because interrupts can only add new
101 * entries to the tail of this list, and only ->poll()
102 * calls can remove this head entry from the list.
104 iop
= list_entry(list
->next
, struct blk_iopoll
, list
);
106 weight
= iop
->weight
;
108 if (test_bit(IOPOLL_F_SCHED
, &iop
->state
))
109 work
= iop
->poll(iop
, weight
);
116 * Drivers must not modify the iopoll state, if they
117 * consume their assigned weight (or more, some drivers can't
118 * easily just stop processing, they have to complete an
119 * entire mask of commands).In such cases this code
120 * still "owns" the iopoll instance and therefore can
121 * move the instance around on the list at-will.
123 if (work
>= weight
) {
124 if (blk_iopoll_disable_pending(iop
))
125 __blk_iopoll_complete(iop
);
127 list_move_tail(&iop
->list
, list
);
132 __raise_softirq_irqoff(BLOCK_IOPOLL_SOFTIRQ
);
138 * blk_iopoll_disable - Disable iopoll on this @iop
139 * @iop: The parent iopoll structure
142 * Disable io polling and wait for any pending callbacks to have completed.
144 void blk_iopoll_disable(struct blk_iopoll
*iop
)
146 set_bit(IOPOLL_F_DISABLE
, &iop
->state
);
147 while (test_and_set_bit(IOPOLL_F_SCHED
, &iop
->state
))
149 clear_bit(IOPOLL_F_DISABLE
, &iop
->state
);
151 EXPORT_SYMBOL(blk_iopoll_disable
);
154 * blk_iopoll_enable - Enable iopoll on this @iop
155 * @iop: The parent iopoll structure
158 * Enable iopoll on this @iop. Note that the handler run will not be
159 * scheduled, it will only mark it as active.
161 void blk_iopoll_enable(struct blk_iopoll
*iop
)
163 BUG_ON(!test_bit(IOPOLL_F_SCHED
, &iop
->state
));
164 smp_mb__before_atomic();
165 clear_bit_unlock(IOPOLL_F_SCHED
, &iop
->state
);
167 EXPORT_SYMBOL(blk_iopoll_enable
);
170 * blk_iopoll_init - Initialize this @iop
171 * @iop: The parent iopoll structure
172 * @weight: The default weight (or command completion budget)
173 * @poll_fn: The handler to invoke
176 * Initialize this blk_iopoll structure. Before being actively used, the
177 * driver must call blk_iopoll_enable().
179 void blk_iopoll_init(struct blk_iopoll
*iop
, int weight
, blk_iopoll_fn
*poll_fn
)
181 memset(iop
, 0, sizeof(*iop
));
182 INIT_LIST_HEAD(&iop
->list
);
183 iop
->weight
= weight
;
185 set_bit(IOPOLL_F_SCHED
, &iop
->state
);
187 EXPORT_SYMBOL(blk_iopoll_init
);
189 static int blk_iopoll_cpu_notify(struct notifier_block
*self
,
190 unsigned long action
, void *hcpu
)
193 * If a CPU goes away, splice its entries to the current CPU
194 * and trigger a run of the softirq
196 if (action
== CPU_DEAD
|| action
== CPU_DEAD_FROZEN
) {
197 int cpu
= (unsigned long) hcpu
;
200 list_splice_init(&per_cpu(blk_cpu_iopoll
, cpu
),
201 this_cpu_ptr(&blk_cpu_iopoll
));
202 __raise_softirq_irqoff(BLOCK_IOPOLL_SOFTIRQ
);
209 static struct notifier_block blk_iopoll_cpu_notifier
= {
210 .notifier_call
= blk_iopoll_cpu_notify
,
213 static __init
int blk_iopoll_setup(void)
217 for_each_possible_cpu(i
)
218 INIT_LIST_HEAD(&per_cpu(blk_cpu_iopoll
, i
));
220 open_softirq(BLOCK_IOPOLL_SOFTIRQ
, blk_iopoll_softirq
);
221 register_hotcpu_notifier(&blk_iopoll_cpu_notifier
);
224 subsys_initcall(blk_iopoll_setup
);