2 * Functions related to tagged command queuing
4 #include <linux/kernel.h>
5 #include <linux/module.h>
7 #include <linux/blkdev.h>
8 #include <linux/slab.h>
13 * blk_queue_find_tag - find a request by its tag and queue
14 * @q: The request queue for the device
15 * @tag: The tag of the request
18 * Should be used when a device returns a tag and you want to match
21 * no locks need be held.
23 struct request
*blk_queue_find_tag(struct request_queue
*q
, int tag
)
25 return blk_map_queue_find_tag(q
->queue_tags
, tag
);
27 EXPORT_SYMBOL(blk_queue_find_tag
);
30 * blk_free_tags - release a given set of tag maintenance info
31 * @bqt: the tag map to free
33 * Drop the reference count on @bqt and frees it when the last reference
36 void blk_free_tags(struct blk_queue_tag
*bqt
)
38 if (atomic_dec_and_test(&bqt
->refcnt
)) {
39 BUG_ON(find_first_bit(bqt
->tag_map
, bqt
->max_depth
) <
42 kfree(bqt
->tag_index
);
43 bqt
->tag_index
= NULL
;
51 EXPORT_SYMBOL(blk_free_tags
);
54 * __blk_queue_free_tags - release tag maintenance info
55 * @q: the request queue for the device
58 * blk_cleanup_queue() will take care of calling this function, if tagging
59 * has been used. So there's no need to call this directly.
61 void __blk_queue_free_tags(struct request_queue
*q
)
63 struct blk_queue_tag
*bqt
= q
->queue_tags
;
71 queue_flag_clear_unlocked(QUEUE_FLAG_QUEUED
, q
);
75 * blk_queue_free_tags - release tag maintenance info
76 * @q: the request queue for the device
79 * This is used to disable tagged queuing to a device, yet leave
82 void blk_queue_free_tags(struct request_queue
*q
)
84 queue_flag_clear_unlocked(QUEUE_FLAG_QUEUED
, q
);
86 EXPORT_SYMBOL(blk_queue_free_tags
);
89 init_tag_map(struct request_queue
*q
, struct blk_queue_tag
*tags
, int depth
)
91 struct request
**tag_index
;
92 unsigned long *tag_map
;
95 if (q
&& depth
> q
->nr_requests
* 2) {
96 depth
= q
->nr_requests
* 2;
97 printk(KERN_ERR
"%s: adjusted depth to %d\n",
101 tag_index
= kzalloc(depth
* sizeof(struct request
*), GFP_ATOMIC
);
105 nr_ulongs
= ALIGN(depth
, BITS_PER_LONG
) / BITS_PER_LONG
;
106 tag_map
= kzalloc(nr_ulongs
* sizeof(unsigned long), GFP_ATOMIC
);
110 tags
->real_max_depth
= depth
;
111 tags
->max_depth
= depth
;
112 tags
->tag_index
= tag_index
;
113 tags
->tag_map
= tag_map
;
121 static struct blk_queue_tag
*__blk_queue_init_tags(struct request_queue
*q
,
122 int depth
, int alloc_policy
)
124 struct blk_queue_tag
*tags
;
126 tags
= kmalloc(sizeof(struct blk_queue_tag
), GFP_ATOMIC
);
130 if (init_tag_map(q
, tags
, depth
))
133 atomic_set(&tags
->refcnt
, 1);
134 tags
->alloc_policy
= alloc_policy
;
143 * blk_init_tags - initialize the tag info for an external tag map
144 * @depth: the maximum queue depth supported
145 * @alloc_policy: tag allocation policy
147 struct blk_queue_tag
*blk_init_tags(int depth
, int alloc_policy
)
149 return __blk_queue_init_tags(NULL
, depth
, alloc_policy
);
151 EXPORT_SYMBOL(blk_init_tags
);
154 * blk_queue_init_tags - initialize the queue tag info
155 * @q: the request queue for the device
156 * @depth: the maximum queue depth supported
157 * @tags: the tag to use
158 * @alloc_policy: tag allocation policy
160 * Queue lock must be held here if the function is called to resize an
163 int blk_queue_init_tags(struct request_queue
*q
, int depth
,
164 struct blk_queue_tag
*tags
, int alloc_policy
)
168 BUG_ON(tags
&& q
->queue_tags
&& tags
!= q
->queue_tags
);
170 if (!tags
&& !q
->queue_tags
) {
171 tags
= __blk_queue_init_tags(q
, depth
, alloc_policy
);
176 } else if (q
->queue_tags
) {
177 rc
= blk_queue_resize_tags(q
, depth
);
180 queue_flag_set(QUEUE_FLAG_QUEUED
, q
);
183 atomic_inc(&tags
->refcnt
);
186 * assign it, all done
188 q
->queue_tags
= tags
;
189 queue_flag_set_unlocked(QUEUE_FLAG_QUEUED
, q
);
190 INIT_LIST_HEAD(&q
->tag_busy_list
);
193 EXPORT_SYMBOL(blk_queue_init_tags
);
196 * blk_queue_resize_tags - change the queueing depth
197 * @q: the request queue for the device
198 * @new_depth: the new max command queueing depth
201 * Must be called with the queue lock held.
203 int blk_queue_resize_tags(struct request_queue
*q
, int new_depth
)
205 struct blk_queue_tag
*bqt
= q
->queue_tags
;
206 struct request
**tag_index
;
207 unsigned long *tag_map
;
208 int max_depth
, nr_ulongs
;
214 * if we already have large enough real_max_depth. just
215 * adjust max_depth. *NOTE* as requests with tag value
216 * between new_depth and real_max_depth can be in-flight, tag
217 * map can not be shrunk blindly here.
219 if (new_depth
<= bqt
->real_max_depth
) {
220 bqt
->max_depth
= new_depth
;
225 * Currently cannot replace a shared tag map with a new
226 * one, so error out if this is the case
228 if (atomic_read(&bqt
->refcnt
) != 1)
232 * save the old state info, so we can copy it back
234 tag_index
= bqt
->tag_index
;
235 tag_map
= bqt
->tag_map
;
236 max_depth
= bqt
->real_max_depth
;
238 if (init_tag_map(q
, bqt
, new_depth
))
241 memcpy(bqt
->tag_index
, tag_index
, max_depth
* sizeof(struct request
*));
242 nr_ulongs
= ALIGN(max_depth
, BITS_PER_LONG
) / BITS_PER_LONG
;
243 memcpy(bqt
->tag_map
, tag_map
, nr_ulongs
* sizeof(unsigned long));
249 EXPORT_SYMBOL(blk_queue_resize_tags
);
252 * blk_queue_end_tag - end tag operations for a request
253 * @q: the request queue for the device
254 * @rq: the request that has completed
257 * Typically called when end_that_request_first() returns %0, meaning
258 * all transfers have been done for a request. It's important to call
259 * this function before end_that_request_last(), as that will put the
260 * request back on the free list thus corrupting the internal tag list.
263 * queue lock must be held.
265 void blk_queue_end_tag(struct request_queue
*q
, struct request
*rq
)
267 struct blk_queue_tag
*bqt
= q
->queue_tags
;
268 unsigned tag
= rq
->tag
; /* negative tags invalid */
270 BUG_ON(tag
>= bqt
->real_max_depth
);
272 list_del_init(&rq
->queuelist
);
273 rq
->cmd_flags
&= ~REQ_QUEUED
;
276 if (unlikely(bqt
->tag_index
[tag
] == NULL
))
277 printk(KERN_ERR
"%s: tag %d is missing\n",
280 bqt
->tag_index
[tag
] = NULL
;
282 if (unlikely(!test_bit(tag
, bqt
->tag_map
))) {
283 printk(KERN_ERR
"%s: attempt to clear non-busy tag (%d)\n",
288 * The tag_map bit acts as a lock for tag_index[bit], so we need
289 * unlock memory barrier semantics.
291 clear_bit_unlock(tag
, bqt
->tag_map
);
293 EXPORT_SYMBOL(blk_queue_end_tag
);
296 * blk_queue_start_tag - find a free tag and assign it
297 * @q: the request queue for the device
298 * @rq: the block request that needs tagging
301 * This can either be used as a stand-alone helper, or possibly be
302 * assigned as the queue &prep_rq_fn (in which case &struct request
303 * automagically gets a tag assigned). Note that this function
304 * assumes that any type of request can be queued! if this is not
305 * true for your device, you must check the request type before
306 * calling this function. The request will also be removed from
307 * the request queue, so it's the drivers responsibility to readd
308 * it if it should need to be restarted for some reason.
311 * queue lock must be held.
313 int blk_queue_start_tag(struct request_queue
*q
, struct request
*rq
)
315 struct blk_queue_tag
*bqt
= q
->queue_tags
;
319 if (unlikely((rq
->cmd_flags
& REQ_QUEUED
))) {
321 "%s: request %p for device [%s] already tagged %d",
323 rq
->rq_disk
? rq
->rq_disk
->disk_name
: "?", rq
->tag
);
328 * Protect against shared tag maps, as we may not have exclusive
329 * access to the tag map.
331 * We reserve a few tags just for sync IO, since we don't want
332 * to starve sync IO on behalf of flooding async IO.
334 max_depth
= bqt
->max_depth
;
335 if (!rq_is_sync(rq
) && max_depth
> 1) {
346 if (q
->in_flight
[BLK_RW_ASYNC
] > max_depth
)
351 if (bqt
->alloc_policy
== BLK_TAG_ALLOC_FIFO
) {
352 tag
= find_first_zero_bit(bqt
->tag_map
, max_depth
);
353 if (tag
>= max_depth
)
356 int start
= bqt
->next_tag
;
357 int size
= min_t(int, bqt
->max_depth
, max_depth
+ start
);
358 tag
= find_next_zero_bit(bqt
->tag_map
, size
, start
);
359 if (tag
>= size
&& start
+ size
> bqt
->max_depth
) {
360 size
= start
+ size
- bqt
->max_depth
;
361 tag
= find_first_zero_bit(bqt
->tag_map
, size
);
367 } while (test_and_set_bit_lock(tag
, bqt
->tag_map
));
369 * We need lock ordering semantics given by test_and_set_bit_lock.
370 * See blk_queue_end_tag for details.
373 bqt
->next_tag
= (tag
+ 1) % bqt
->max_depth
;
374 rq
->cmd_flags
|= REQ_QUEUED
;
376 bqt
->tag_index
[tag
] = rq
;
377 blk_start_request(rq
);
378 list_add(&rq
->queuelist
, &q
->tag_busy_list
);
381 EXPORT_SYMBOL(blk_queue_start_tag
);
384 * blk_queue_invalidate_tags - invalidate all pending tags
385 * @q: the request queue for the device
388 * Hardware conditions may dictate a need to stop all pending requests.
389 * In this case, we will safely clear the block side of the tag queue and
390 * readd all requests to the request queue in the right order.
393 * queue lock must be held.
395 void blk_queue_invalidate_tags(struct request_queue
*q
)
397 struct list_head
*tmp
, *n
;
399 list_for_each_safe(tmp
, n
, &q
->tag_busy_list
)
400 blk_requeue_request(q
, list_entry_rq(tmp
));
402 EXPORT_SYMBOL(blk_queue_invalidate_tags
);