blob: 3f33d86722688a4f50ac0064488540d1960447fb [file] [log] [blame]
Jens Axboe8324aa92008-01-29 14:51:59 +01001/*
2 * Functions related to tagged command queuing
3 */
4#include <linux/kernel.h>
5#include <linux/module.h>
6#include <linux/bio.h>
7#include <linux/blkdev.h>
Tejun Heo5a0e3ad2010-03-24 17:04:11 +09008#include <linux/slab.h>
Jens Axboe8324aa92008-01-29 14:51:59 +01009
Adrian Bunk278caf02008-03-04 11:23:44 +010010#include "blk.h"
11
Jens Axboe8324aa92008-01-29 14:51:59 +010012/**
13 * blk_queue_find_tag - find a request by its tag and queue
14 * @q: The request queue for the device
15 * @tag: The tag of the request
16 *
17 * Notes:
18 * Should be used when a device returns a tag and you want to match
19 * it with a request.
20 *
21 * no locks need be held.
22 **/
23struct request *blk_queue_find_tag(struct request_queue *q, int tag)
24{
25 return blk_map_queue_find_tag(q->queue_tags, tag);
26}
Jens Axboe8324aa92008-01-29 14:51:59 +010027EXPORT_SYMBOL(blk_queue_find_tag);
28
29/**
30 * __blk_free_tags - release a given set of tag maintenance info
31 * @bqt: the tag map to free
32 *
Randy Dunlap710027a2008-08-19 20:13:11 +020033 * Tries to free the specified @bqt. Returns true if it was
Jens Axboe8324aa92008-01-29 14:51:59 +010034 * actually freed and false if there are still references using it
35 */
36static int __blk_free_tags(struct blk_queue_tag *bqt)
37{
38 int retval;
39
40 retval = atomic_dec_and_test(&bqt->refcnt);
41 if (retval) {
Matthew Wilcox0e3eb452008-08-26 09:02:28 +020042 BUG_ON(find_first_bit(bqt->tag_map, bqt->max_depth) <
43 bqt->max_depth);
Jens Axboe8324aa92008-01-29 14:51:59 +010044
45 kfree(bqt->tag_index);
46 bqt->tag_index = NULL;
47
48 kfree(bqt->tag_map);
49 bqt->tag_map = NULL;
50
51 kfree(bqt);
52 }
53
54 return retval;
55}
56
57/**
58 * __blk_queue_free_tags - release tag maintenance info
59 * @q: the request queue for the device
60 *
61 * Notes:
62 * blk_cleanup_queue() will take care of calling this function, if tagging
63 * has been used. So there's no need to call this directly.
64 **/
65void __blk_queue_free_tags(struct request_queue *q)
66{
67 struct blk_queue_tag *bqt = q->queue_tags;
68
69 if (!bqt)
70 return;
71
72 __blk_free_tags(bqt);
73
74 q->queue_tags = NULL;
Jens Axboeaa94b532008-05-07 09:27:43 +020075 queue_flag_clear_unlocked(QUEUE_FLAG_QUEUED, q);
Jens Axboe8324aa92008-01-29 14:51:59 +010076}
77
78/**
79 * blk_free_tags - release a given set of tag maintenance info
80 * @bqt: the tag map to free
81 *
Randy Dunlap710027a2008-08-19 20:13:11 +020082 * For externally managed @bqt frees the map. Callers of this
Jens Axboe8324aa92008-01-29 14:51:59 +010083 * function must guarantee to have released all the queues that
84 * might have been using this tag map.
85 */
86void blk_free_tags(struct blk_queue_tag *bqt)
87{
88 if (unlikely(!__blk_free_tags(bqt)))
89 BUG();
90}
91EXPORT_SYMBOL(blk_free_tags);
92
93/**
94 * blk_queue_free_tags - release tag maintenance info
95 * @q: the request queue for the device
96 *
97 * Notes:
Randy Dunlap710027a2008-08-19 20:13:11 +020098 * This is used to disable tagged queuing to a device, yet leave
Jens Axboe8324aa92008-01-29 14:51:59 +010099 * queue in function.
100 **/
101void blk_queue_free_tags(struct request_queue *q)
102{
Jens Axboeaa94b532008-05-07 09:27:43 +0200103 queue_flag_clear_unlocked(QUEUE_FLAG_QUEUED, q);
Jens Axboe8324aa92008-01-29 14:51:59 +0100104}
Jens Axboe8324aa92008-01-29 14:51:59 +0100105EXPORT_SYMBOL(blk_queue_free_tags);
106
107static int
108init_tag_map(struct request_queue *q, struct blk_queue_tag *tags, int depth)
109{
110 struct request **tag_index;
111 unsigned long *tag_map;
112 int nr_ulongs;
113
114 if (q && depth > q->nr_requests * 2) {
115 depth = q->nr_requests * 2;
116 printk(KERN_ERR "%s: adjusted depth to %d\n",
Harvey Harrison24c03d42008-05-01 04:35:17 -0700117 __func__, depth);
Jens Axboe8324aa92008-01-29 14:51:59 +0100118 }
119
120 tag_index = kzalloc(depth * sizeof(struct request *), GFP_ATOMIC);
121 if (!tag_index)
122 goto fail;
123
124 nr_ulongs = ALIGN(depth, BITS_PER_LONG) / BITS_PER_LONG;
125 tag_map = kzalloc(nr_ulongs * sizeof(unsigned long), GFP_ATOMIC);
126 if (!tag_map)
127 goto fail;
128
129 tags->real_max_depth = depth;
130 tags->max_depth = depth;
131 tags->tag_index = tag_index;
132 tags->tag_map = tag_map;
133
134 return 0;
135fail:
136 kfree(tag_index);
137 return -ENOMEM;
138}
139
140static struct blk_queue_tag *__blk_queue_init_tags(struct request_queue *q,
141 int depth)
142{
143 struct blk_queue_tag *tags;
144
145 tags = kmalloc(sizeof(struct blk_queue_tag), GFP_ATOMIC);
146 if (!tags)
147 goto fail;
148
149 if (init_tag_map(q, tags, depth))
150 goto fail;
151
Jens Axboe8324aa92008-01-29 14:51:59 +0100152 atomic_set(&tags->refcnt, 1);
153 return tags;
154fail:
155 kfree(tags);
156 return NULL;
157}
158
159/**
160 * blk_init_tags - initialize the tag info for an external tag map
161 * @depth: the maximum queue depth supported
Jens Axboe8324aa92008-01-29 14:51:59 +0100162 **/
163struct blk_queue_tag *blk_init_tags(int depth)
164{
165 return __blk_queue_init_tags(NULL, depth);
166}
167EXPORT_SYMBOL(blk_init_tags);
168
169/**
170 * blk_queue_init_tags - initialize the queue tag info
171 * @q: the request queue for the device
172 * @depth: the maximum queue depth supported
173 * @tags: the tag to use
Jens Axboeaa94b532008-05-07 09:27:43 +0200174 *
175 * Queue lock must be held here if the function is called to resize an
176 * existing map.
Jens Axboe8324aa92008-01-29 14:51:59 +0100177 **/
178int blk_queue_init_tags(struct request_queue *q, int depth,
179 struct blk_queue_tag *tags)
180{
181 int rc;
182
183 BUG_ON(tags && q->queue_tags && tags != q->queue_tags);
184
185 if (!tags && !q->queue_tags) {
186 tags = __blk_queue_init_tags(q, depth);
187
188 if (!tags)
Peter Senna Tschudind41570b2012-09-12 17:06:40 +0200189 return -ENOMEM;
190
Jens Axboe8324aa92008-01-29 14:51:59 +0100191 } else if (q->queue_tags) {
Jens Axboe6728cb02008-01-31 13:03:55 +0100192 rc = blk_queue_resize_tags(q, depth);
193 if (rc)
Jens Axboe8324aa92008-01-29 14:51:59 +0100194 return rc;
Nick Piggin75ad23b2008-04-29 14:48:33 +0200195 queue_flag_set(QUEUE_FLAG_QUEUED, q);
Jens Axboe8324aa92008-01-29 14:51:59 +0100196 return 0;
197 } else
198 atomic_inc(&tags->refcnt);
199
200 /*
201 * assign it, all done
202 */
203 q->queue_tags = tags;
Jens Axboeaa94b532008-05-07 09:27:43 +0200204 queue_flag_set_unlocked(QUEUE_FLAG_QUEUED, q);
Jens Axboe8324aa92008-01-29 14:51:59 +0100205 INIT_LIST_HEAD(&q->tag_busy_list);
206 return 0;
Jens Axboe8324aa92008-01-29 14:51:59 +0100207}
Jens Axboe8324aa92008-01-29 14:51:59 +0100208EXPORT_SYMBOL(blk_queue_init_tags);
209
210/**
211 * blk_queue_resize_tags - change the queueing depth
212 * @q: the request queue for the device
213 * @new_depth: the new max command queueing depth
214 *
215 * Notes:
216 * Must be called with the queue lock held.
217 **/
218int blk_queue_resize_tags(struct request_queue *q, int new_depth)
219{
220 struct blk_queue_tag *bqt = q->queue_tags;
221 struct request **tag_index;
222 unsigned long *tag_map;
223 int max_depth, nr_ulongs;
224
225 if (!bqt)
226 return -ENXIO;
227
228 /*
229 * if we already have large enough real_max_depth. just
230 * adjust max_depth. *NOTE* as requests with tag value
231 * between new_depth and real_max_depth can be in-flight, tag
232 * map can not be shrunk blindly here.
233 */
234 if (new_depth <= bqt->real_max_depth) {
235 bqt->max_depth = new_depth;
236 return 0;
237 }
238
239 /*
240 * Currently cannot replace a shared tag map with a new
241 * one, so error out if this is the case
242 */
243 if (atomic_read(&bqt->refcnt) != 1)
244 return -EBUSY;
245
246 /*
247 * save the old state info, so we can copy it back
248 */
249 tag_index = bqt->tag_index;
250 tag_map = bqt->tag_map;
251 max_depth = bqt->real_max_depth;
252
253 if (init_tag_map(q, bqt, new_depth))
254 return -ENOMEM;
255
256 memcpy(bqt->tag_index, tag_index, max_depth * sizeof(struct request *));
257 nr_ulongs = ALIGN(max_depth, BITS_PER_LONG) / BITS_PER_LONG;
258 memcpy(bqt->tag_map, tag_map, nr_ulongs * sizeof(unsigned long));
259
260 kfree(tag_index);
261 kfree(tag_map);
262 return 0;
263}
Jens Axboe8324aa92008-01-29 14:51:59 +0100264EXPORT_SYMBOL(blk_queue_resize_tags);
265
266/**
267 * blk_queue_end_tag - end tag operations for a request
268 * @q: the request queue for the device
269 * @rq: the request that has completed
270 *
271 * Description:
Randy Dunlap710027a2008-08-19 20:13:11 +0200272 * Typically called when end_that_request_first() returns %0, meaning
Jens Axboe8324aa92008-01-29 14:51:59 +0100273 * all transfers have been done for a request. It's important to call
274 * this function before end_that_request_last(), as that will put the
275 * request back on the free list thus corrupting the internal tag list.
276 *
277 * Notes:
278 * queue lock must be held.
279 **/
280void blk_queue_end_tag(struct request_queue *q, struct request *rq)
281{
282 struct blk_queue_tag *bqt = q->queue_tags;
Dan Williamsf2b20d42011-12-29 09:16:28 +0100283 unsigned tag = rq->tag; /* negative tags invalid */
Jens Axboe8324aa92008-01-29 14:51:59 +0100284
Dan Williamsf2b20d42011-12-29 09:16:28 +0100285 BUG_ON(tag >= bqt->real_max_depth);
Jens Axboe8324aa92008-01-29 14:51:59 +0100286
287 list_del_init(&rq->queuelist);
288 rq->cmd_flags &= ~REQ_QUEUED;
289 rq->tag = -1;
290
291 if (unlikely(bqt->tag_index[tag] == NULL))
292 printk(KERN_ERR "%s: tag %d is missing\n",
Harvey Harrison24c03d42008-05-01 04:35:17 -0700293 __func__, tag);
Jens Axboe8324aa92008-01-29 14:51:59 +0100294
295 bqt->tag_index[tag] = NULL;
296
297 if (unlikely(!test_bit(tag, bqt->tag_map))) {
298 printk(KERN_ERR "%s: attempt to clear non-busy tag (%d)\n",
Harvey Harrison24c03d42008-05-01 04:35:17 -0700299 __func__, tag);
Jens Axboe8324aa92008-01-29 14:51:59 +0100300 return;
301 }
302 /*
303 * The tag_map bit acts as a lock for tag_index[bit], so we need
304 * unlock memory barrier semantics.
305 */
306 clear_bit_unlock(tag, bqt->tag_map);
Jens Axboe8324aa92008-01-29 14:51:59 +0100307}
Jens Axboe8324aa92008-01-29 14:51:59 +0100308EXPORT_SYMBOL(blk_queue_end_tag);
309
310/**
311 * blk_queue_start_tag - find a free tag and assign it
312 * @q: the request queue for the device
313 * @rq: the block request that needs tagging
314 *
315 * Description:
316 * This can either be used as a stand-alone helper, or possibly be
317 * assigned as the queue &prep_rq_fn (in which case &struct request
318 * automagically gets a tag assigned). Note that this function
319 * assumes that any type of request can be queued! if this is not
320 * true for your device, you must check the request type before
321 * calling this function. The request will also be removed from
322 * the request queue, so it's the drivers responsibility to readd
323 * it if it should need to be restarted for some reason.
324 *
325 * Notes:
326 * queue lock must be held.
327 **/
328int blk_queue_start_tag(struct request_queue *q, struct request *rq)
329{
330 struct blk_queue_tag *bqt = q->queue_tags;
Jens Axboe0a7ae2f2009-05-20 08:54:31 +0200331 unsigned max_depth;
Jens Axboe8324aa92008-01-29 14:51:59 +0100332 int tag;
333
334 if (unlikely((rq->cmd_flags & REQ_QUEUED))) {
Jens Axboe6728cb02008-01-31 13:03:55 +0100335 printk(KERN_ERR
Jens Axboe8324aa92008-01-29 14:51:59 +0100336 "%s: request %p for device [%s] already tagged %d",
Harvey Harrison24c03d42008-05-01 04:35:17 -0700337 __func__, rq,
Jens Axboe8324aa92008-01-29 14:51:59 +0100338 rq->rq_disk ? rq->rq_disk->disk_name : "?", rq->tag);
339 BUG();
340 }
341
342 /*
343 * Protect against shared tag maps, as we may not have exclusive
344 * access to the tag map.
Jens Axboee3ba9ae2008-09-25 11:42:41 +0200345 *
346 * We reserve a few tags just for sync IO, since we don't want
347 * to starve sync IO on behalf of flooding async IO.
Jens Axboe8324aa92008-01-29 14:51:59 +0100348 */
Jens Axboee3ba9ae2008-09-25 11:42:41 +0200349 max_depth = bqt->max_depth;
Jens Axboe0a7ae2f2009-05-20 08:54:31 +0200350 if (!rq_is_sync(rq) && max_depth > 1) {
Jan Karaa6b3f762013-06-28 21:32:27 +0200351 switch (max_depth) {
352 case 2:
Jens Axboe0a7ae2f2009-05-20 08:54:31 +0200353 max_depth = 1;
Jan Karaa6b3f762013-06-28 21:32:27 +0200354 break;
355 case 3:
356 max_depth = 2;
357 break;
358 default:
359 max_depth -= 2;
360 }
Jens Axboe1b59dd52009-10-06 20:19:02 +0200361 if (q->in_flight[BLK_RW_ASYNC] > max_depth)
Jens Axboe0a7ae2f2009-05-20 08:54:31 +0200362 return 1;
363 }
Jens Axboee3ba9ae2008-09-25 11:42:41 +0200364
Jens Axboe8324aa92008-01-29 14:51:59 +0100365 do {
Jens Axboe0a7ae2f2009-05-20 08:54:31 +0200366 tag = find_first_zero_bit(bqt->tag_map, max_depth);
Jens Axboee3ba9ae2008-09-25 11:42:41 +0200367 if (tag >= max_depth)
Jens Axboe8324aa92008-01-29 14:51:59 +0100368 return 1;
369
370 } while (test_and_set_bit_lock(tag, bqt->tag_map));
371 /*
372 * We need lock ordering semantics given by test_and_set_bit_lock.
373 * See blk_queue_end_tag for details.
374 */
375
376 rq->cmd_flags |= REQ_QUEUED;
377 rq->tag = tag;
378 bqt->tag_index[tag] = rq;
Tejun Heo9934c8c2009-05-08 11:54:16 +0900379 blk_start_request(rq);
Jens Axboe8324aa92008-01-29 14:51:59 +0100380 list_add(&rq->queuelist, &q->tag_busy_list);
Jens Axboe8324aa92008-01-29 14:51:59 +0100381 return 0;
382}
Jens Axboe8324aa92008-01-29 14:51:59 +0100383EXPORT_SYMBOL(blk_queue_start_tag);
384
385/**
386 * blk_queue_invalidate_tags - invalidate all pending tags
387 * @q: the request queue for the device
388 *
389 * Description:
390 * Hardware conditions may dictate a need to stop all pending requests.
391 * In this case, we will safely clear the block side of the tag queue and
392 * readd all requests to the request queue in the right order.
393 *
394 * Notes:
395 * queue lock must be held.
396 **/
397void blk_queue_invalidate_tags(struct request_queue *q)
398{
399 struct list_head *tmp, *n;
400
401 list_for_each_safe(tmp, n, &q->tag_busy_list)
402 blk_requeue_request(q, list_entry_rq(tmp));
403}
Jens Axboe8324aa92008-01-29 14:51:59 +0100404EXPORT_SYMBOL(blk_queue_invalidate_tags);