// SPDX-License-Identifier: GPL-2.0
/*
 * Functions related to tagged command queuing
 */
#include <linux/kernel.h>
#include <linux/module.h>
#include <linux/bio.h>
#include <linux/blkdev.h>
#include <linux/slab.h>

#include "blk.h"

/**
 * blk_queue_find_tag - find a request by its tag and queue
 * @q:	 The request queue for the device
 * @tag: The tag of the request
 *
 * Notes:
 *    Should be used when a device returns a tag and you want to match
 *    it with a request.
 *
 *    no locks need be held.
 **/
struct request *blk_queue_find_tag(struct request_queue *q, int tag)
{
	return blk_map_queue_find_tag(q->queue_tags, tag);
}
EXPORT_SYMBOL(blk_queue_find_tag);
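
/*
 * Example (illustrative sketch only, not taken from a real driver): a
 * completion handler that maps a tag reported by the hardware back to
 * the request it was issued for.  "my_dev" and "my_hw_read_tag()" are
 * hypothetical names.
 *
 *	static void my_dev_complete_one(struct my_dev *dev,
 *					struct request_queue *q)
 *	{
 *		int tag = my_hw_read_tag(dev);	// tag echoed by hardware
 *		struct request *rq = blk_queue_find_tag(q, tag);
 *
 *		if (!rq)
 *			return;			// stale or unknown tag
 *		// complete rq via the driver's normal completion path
 *	}
 */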

/**
 * blk_free_tags - release a given set of tag maintenance info
 * @bqt:	the tag map to free
 *
 * Drop the reference count on @bqt and free it when the last reference
 * is dropped.
 */
void blk_free_tags(struct blk_queue_tag *bqt)
{
	if (atomic_dec_and_test(&bqt->refcnt)) {
		BUG_ON(find_first_bit(bqt->tag_map, bqt->max_depth) <
							bqt->max_depth);

		kfree(bqt->tag_index);
		bqt->tag_index = NULL;

		kfree(bqt->tag_map);
		bqt->tag_map = NULL;

		kfree(bqt);
	}
}
EXPORT_SYMBOL(blk_free_tags);

/**
 * __blk_queue_free_tags - release tag maintenance info
 * @q:  the request queue for the device
 *
 *  Notes:
 *    blk_cleanup_queue() will take care of calling this function, if tagging
 *    has been used. So there's no need to call this directly.
 **/
void __blk_queue_free_tags(struct request_queue *q)
{
	struct blk_queue_tag *bqt = q->queue_tags;

	if (!bqt)
		return;

	blk_free_tags(bqt);

	q->queue_tags = NULL;
	queue_flag_clear_unlocked(QUEUE_FLAG_QUEUED, q);
}

/**
 * blk_queue_free_tags - release tag maintenance info
 * @q:  the request queue for the device
 *
 *  Notes:
 *	This is used to disable tagged queuing on a device, yet leave the
 *	queue operational.
 **/
void blk_queue_free_tags(struct request_queue *q)
{
	queue_flag_clear_unlocked(QUEUE_FLAG_QUEUED, q);
}
EXPORT_SYMBOL(blk_queue_free_tags);
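
/*
 * Example (sketch): a driver that notices the device no longer supports
 * command queuing can turn tagging off while keeping the queue usable:
 *
 *	blk_queue_free_tags(q);
 */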

static int
init_tag_map(struct request_queue *q, struct blk_queue_tag *tags, int depth)
{
	struct request **tag_index;
	unsigned long *tag_map;
	int nr_ulongs;

	if (q && depth > q->nr_requests * 2) {
		depth = q->nr_requests * 2;
		printk(KERN_ERR "%s: adjusted depth to %d\n",
		       __func__, depth);
	}

	tag_index = kcalloc(depth, sizeof(struct request *), GFP_ATOMIC);
	if (!tag_index)
		goto fail;

	nr_ulongs = ALIGN(depth, BITS_PER_LONG) / BITS_PER_LONG;
	tag_map = kcalloc(nr_ulongs, sizeof(unsigned long), GFP_ATOMIC);
	if (!tag_map)
		goto fail;

	tags->real_max_depth = depth;
	tags->max_depth = depth;
	tags->tag_index = tag_index;
	tags->tag_map = tag_map;

	return 0;
fail:
	kfree(tag_index);
	return -ENOMEM;
}

static struct blk_queue_tag *__blk_queue_init_tags(struct request_queue *q,
						int depth, int alloc_policy)
{
	struct blk_queue_tag *tags;

	tags = kmalloc(sizeof(struct blk_queue_tag), GFP_ATOMIC);
	if (!tags)
		goto fail;

	if (init_tag_map(q, tags, depth))
		goto fail;

	atomic_set(&tags->refcnt, 1);
	tags->alloc_policy = alloc_policy;
	tags->next_tag = 0;
	return tags;
fail:
	kfree(tags);
	return NULL;
}

/**
 * blk_init_tags - initialize the tag info for an external tag map
 * @depth:	the maximum queue depth supported
 * @alloc_policy: tag allocation policy
 **/
struct blk_queue_tag *blk_init_tags(int depth, int alloc_policy)
{
	return __blk_queue_init_tags(NULL, depth, alloc_policy);
}
EXPORT_SYMBOL(blk_init_tags);
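
/*
 * Example (hedged sketch; "my_host" and the depth of 64 are made up):
 * hardware with a single tag space shared by several request queues can
 * allocate the map once here and pass it to blk_queue_init_tags() for
 * every queue.  Each queue then takes its own reference, and
 * blk_free_tags() drops the reference obtained below.
 *
 *	my_host->shared_tags = blk_init_tags(64, BLK_TAG_ALLOC_FIFO);
 *	if (!my_host->shared_tags)
 *		return -ENOMEM;
 *
 *	// for each request queue q belonging to the host:
 *	err = blk_queue_init_tags(q, 64, my_host->shared_tags,
 *				  BLK_TAG_ALLOC_FIFO);
 *
 *	// at teardown, after the queues themselves are gone:
 *	blk_free_tags(my_host->shared_tags);
 */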

/**
 * blk_queue_init_tags - initialize the queue tag info
 * @q:  the request queue for the device
 * @depth:  the maximum queue depth supported
 * @tags: the tag to use
 * @alloc_policy: tag allocation policy
 *
 * Queue lock must be held here if the function is called to resize an
 * existing map.
 **/
int blk_queue_init_tags(struct request_queue *q, int depth,
			struct blk_queue_tag *tags, int alloc_policy)
{
	int rc;

	BUG_ON(tags && q->queue_tags && tags != q->queue_tags);

	if (!tags && !q->queue_tags) {
		tags = __blk_queue_init_tags(q, depth, alloc_policy);

		if (!tags)
			return -ENOMEM;

	} else if (q->queue_tags) {
		rc = blk_queue_resize_tags(q, depth);
		if (rc)
			return rc;
		queue_flag_set(QUEUE_FLAG_QUEUED, q);
		return 0;
	} else
		atomic_inc(&tags->refcnt);

	/*
	 * assign it, all done
	 */
	q->queue_tags = tags;
	queue_flag_set_unlocked(QUEUE_FLAG_QUEUED, q);
	return 0;
}
EXPORT_SYMBOL(blk_queue_init_tags);
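
/*
 * Example (sketch only; the depth of 32 is arbitrary): a driver that
 * wants a private, per-queue tag map passes a NULL @tags pointer and
 * lets the block layer allocate one:
 *
 *	err = blk_queue_init_tags(q, 32, NULL, BLK_TAG_ALLOC_RR);
 *	if (err)
 *		return err;	// tagged queuing stays disabled
 */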

/**
 * blk_queue_resize_tags - change the queueing depth
 * @q:  the request queue for the device
 * @new_depth: the new max command queueing depth
 *
 *  Notes:
 *    Must be called with the queue lock held.
 **/
int blk_queue_resize_tags(struct request_queue *q, int new_depth)
{
	struct blk_queue_tag *bqt = q->queue_tags;
	struct request **tag_index;
	unsigned long *tag_map;
	int max_depth, nr_ulongs;

	if (!bqt)
		return -ENXIO;

	/*
	 * If we already have a large enough real_max_depth, just adjust
	 * max_depth.  *NOTE* as requests with tag values between
	 * new_depth and real_max_depth can be in-flight, the tag map
	 * can not be shrunk blindly here.
	 */
	if (new_depth <= bqt->real_max_depth) {
		bqt->max_depth = new_depth;
		return 0;
	}

	/*
	 * Currently cannot replace a shared tag map with a new
	 * one, so error out if this is the case
	 */
	if (atomic_read(&bqt->refcnt) != 1)
		return -EBUSY;

	/*
	 * save the old state info, so we can copy it back
	 */
	tag_index = bqt->tag_index;
	tag_map = bqt->tag_map;
	max_depth = bqt->real_max_depth;

	if (init_tag_map(q, bqt, new_depth))
		return -ENOMEM;

	memcpy(bqt->tag_index, tag_index, max_depth * sizeof(struct request *));
	nr_ulongs = ALIGN(max_depth, BITS_PER_LONG) / BITS_PER_LONG;
	memcpy(bqt->tag_map, tag_map, nr_ulongs * sizeof(unsigned long));

	kfree(tag_index);
	kfree(tag_map);
	return 0;
}
EXPORT_SYMBOL(blk_queue_resize_tags);
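
/*
 * Example (illustrative only): growing the depth once the device
 * reports that it supports a deeper queue.  As noted above, the queue
 * lock must be held across the call.
 *
 *	spin_lock_irq(q->queue_lock);
 *	err = blk_queue_resize_tags(q, new_depth);
 *	spin_unlock_irq(q->queue_lock);
 */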

/**
 * blk_queue_end_tag - end tag operations for a request
 * @q:  the request queue for the device
 * @rq: the request that has completed
 *
 *  Description:
 *    Typically called when end_that_request_first() returns %0, meaning
 *    all transfers have been done for a request. It's important to call
 *    this function before end_that_request_last(), as that will put the
 *    request back on the free list thus corrupting the internal tag list.
 **/
void blk_queue_end_tag(struct request_queue *q, struct request *rq)
{
	struct blk_queue_tag *bqt = q->queue_tags;
	unsigned tag = rq->tag; /* negative tags invalid */

	lockdep_assert_held(q->queue_lock);

	BUG_ON(tag >= bqt->real_max_depth);

	list_del_init(&rq->queuelist);
	rq->rq_flags &= ~RQF_QUEUED;
	rq->tag = -1;
	rq->internal_tag = -1;

	if (unlikely(bqt->tag_index[tag] == NULL))
		printk(KERN_ERR "%s: tag %d is missing\n",
		       __func__, tag);

	bqt->tag_index[tag] = NULL;

	if (unlikely(!test_bit(tag, bqt->tag_map))) {
		printk(KERN_ERR "%s: attempt to clear non-busy tag (%d)\n",
		       __func__, tag);
		return;
	}
	/*
	 * The tag_map bit acts as a lock for tag_index[bit], so we need
	 * unlock memory barrier semantics.
	 */
	clear_bit_unlock(tag, bqt->tag_map);
}
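
/*
 * Example (hedged sketch; the completion helper a driver uses varies):
 * one plausible ordering in a completion path, releasing the tag before
 * the request itself is completed so the tag map never points at a
 * freed request.
 *
 *	spin_lock_irqsave(q->queue_lock, flags);
 *	blk_queue_end_tag(q, rq);
 *	__blk_end_request_all(rq, BLK_STS_OK);
 *	spin_unlock_irqrestore(q->queue_lock, flags);
 */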

/**
 * blk_queue_start_tag - find a free tag and assign it
 * @q:  the request queue for the device
 * @rq:  the block request that needs tagging
 *
 *  Description:
 *    This can either be used as a stand-alone helper, or possibly be
 *    assigned as the queue &prep_rq_fn (in which case &struct request
 *    automagically gets a tag assigned). Note that this function
 *    assumes that any type of request can be queued! If this is not
 *    true for your device, you must check the request type before
 *    calling this function.  The request will also be removed from
 *    the request queue, so it's the driver's responsibility to re-add
 *    it if it should need to be restarted for some reason.
 **/
int blk_queue_start_tag(struct request_queue *q, struct request *rq)
{
	struct blk_queue_tag *bqt = q->queue_tags;
	unsigned max_depth;
	int tag;

	lockdep_assert_held(q->queue_lock);

	if (unlikely((rq->rq_flags & RQF_QUEUED))) {
		printk(KERN_ERR
		       "%s: request %p for device [%s] already tagged %d",
		       __func__, rq,
		       rq->rq_disk ? rq->rq_disk->disk_name : "?", rq->tag);
		BUG();
	}

	/*
	 * Protect against shared tag maps, as we may not have exclusive
	 * access to the tag map.
	 *
	 * We reserve a few tags just for sync IO, since we don't want
	 * to starve sync IO on behalf of flooding async IO.
	 */
	max_depth = bqt->max_depth;
	if (!rq_is_sync(rq) && max_depth > 1) {
		switch (max_depth) {
		case 2:
			max_depth = 1;
			break;
		case 3:
			max_depth = 2;
			break;
		default:
			max_depth -= 2;
		}
		if (q->in_flight[BLK_RW_ASYNC] > max_depth)
			return 1;
	}

	do {
		if (bqt->alloc_policy == BLK_TAG_ALLOC_FIFO) {
			tag = find_first_zero_bit(bqt->tag_map, max_depth);
			if (tag >= max_depth)
				return 1;
		} else {
			int start = bqt->next_tag;
			int size = min_t(int, bqt->max_depth, max_depth + start);
			tag = find_next_zero_bit(bqt->tag_map, size, start);
			if (tag >= size && start + size > bqt->max_depth) {
				size = start + size - bqt->max_depth;
				tag = find_first_zero_bit(bqt->tag_map, size);
			}
			if (tag >= size)
				return 1;
		}

	} while (test_and_set_bit_lock(tag, bqt->tag_map));
	/*
	 * We need lock ordering semantics given by test_and_set_bit_lock.
	 * See blk_queue_end_tag for details.
	 */

	bqt->next_tag = (tag + 1) % bqt->max_depth;
	rq->rq_flags |= RQF_QUEUED;
	rq->tag = tag;
	bqt->tag_index[tag] = rq;
	blk_start_request(rq);
	return 0;
}
EXPORT_SYMBOL(blk_queue_start_tag);
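
/*
 * Example (hypothetical sketch): a legacy request_fn that tags requests
 * before issuing them.  "my_dev_issue()" is a made-up hook; a non-zero
 * return from blk_queue_start_tag() means no tag was available and the
 * request was left on the queue.
 *
 *	static void my_request_fn(struct request_queue *q)
 *	{
 *		struct request *rq;
 *
 *		while ((rq = blk_peek_request(q)) != NULL) {
 *			if (blk_queue_start_tag(q, rq))
 *				break;	// out of tags, retry later
 *			// rq is now tagged and dequeued (the call above
 *			// invoked blk_start_request()), so hand it off
 *			my_dev_issue(q, rq);
 *		}
 *	}
 */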