blk.h 9.8 KB
Newer Older
1 2 3
#ifndef BLK_INTERNAL_H
#define BLK_INTERNAL_H

4
#include <linux/idr.h>
5 6
#include <linux/blk-mq.h>
#include "blk-mq.h"
7

J
Jens Axboe 已提交
8 9 10 11 12 13
/*
 * Amount of time in which a process may batch requests: HZ/50 timer ticks
 * (presumably 20 ms, assuming HZ is the kernel's ticks-per-second constant).
 */
#define BLK_BATCH_TIME	(HZ/50UL)

/* Number of requests a "batching" process may submit */
#define BLK_BATCH_REQ	32

14 15 16
/*
 * Max future timer expiry for timeouts: 5 * HZ ticks
 * (presumably 5 seconds -- confirm HZ is ticks per second).
 */
#define BLK_MAX_TIMEOUT		(5 * HZ)

17 18 19 20
#ifdef CONFIG_DEBUG_FS
extern struct dentry *blk_debugfs_root;
#endif

21 22 23 24 25 26 27 28
struct blk_flush_queue {
	unsigned int		flush_queue_delayed:1;
	unsigned int		flush_pending_idx:1;
	unsigned int		flush_running_idx:1;
	unsigned long		flush_pending_since;
	struct list_head	flush_queue[2];
	struct list_head	flush_data_in_flight;
	struct request		*flush_rq;
29 30 31 32 33 34

	/*
	 * flush_rq shares tag with this rq, both can't be active
	 * at the same time
	 */
	struct request		*orig_rq;
35 36 37
	spinlock_t		mq_flush_lock;
};

38
extern struct kmem_cache *blk_requestq_cachep;
39
extern struct kmem_cache *request_cachep;
40
extern struct kobj_type blk_queue_ktype;
41
extern struct ida blk_queue_ida;
42

43
static inline struct blk_flush_queue *blk_get_flush_queue(
44
		struct request_queue *q, struct blk_mq_ctx *ctx)
45
{
C
Christoph Hellwig 已提交
46 47 48
	if (q->mq_ops)
		return blk_mq_map_queue(q, ctx->cpu)->fq;
	return q->fq;
49 50
}

T
Tejun Heo 已提交
51 52 53 54 55
/* Take a reference on @q by way of its embedded kobject. */
static inline void __blk_get_queue(struct request_queue *q)
{
	/* The pointer kobject_get() hands back is not needed here */
	(void)kobject_get(&q->kobj);
}

56 57 58
struct blk_flush_queue *blk_alloc_flush_queue(struct request_queue *q,
		int node, int cmd_size);
void blk_free_flush_queue(struct blk_flush_queue *q);
59

60 61 62
int blk_init_rl(struct request_list *rl, struct request_queue *q,
		gfp_t gfp_mask);
void blk_exit_rl(struct request_list *rl);
J
Jens Axboe 已提交
63 64 65
void init_request_from_bio(struct request *req, struct bio *bio);
void blk_rq_bio_prep(struct request_queue *q, struct request *rq,
			struct bio *bio);
66 67
void blk_queue_bypass_start(struct request_queue *q);
void blk_queue_bypass_end(struct request_queue *q);
68
void blk_dequeue_request(struct request *rq);
69
void __blk_queue_free_tags(struct request_queue *q);
70 71
bool __blk_end_bidi_request(struct request *rq, int error,
			    unsigned int nr_bytes, unsigned int bidi_bytes);
72 73 74 75 76 77 78 79 80 81 82 83
void blk_freeze_queue(struct request_queue *q);

/*
 * Take an additional q_usage_counter reference without any frozen-queue
 * check.
 *
 * Running in generic_make_request() context guarantees that a live
 * reference against q_usage_counter has already been established, so
 * further references taken under that same context need not check
 * whether the queue has been frozen (marked dead).
 */
static inline void blk_queue_enter_live(struct request_queue *q)
{
	percpu_ref_get(&q->q_usage_counter);
}
84

85 86 87 88 89 90 91
/*
 * blk_flush_integrity() is only declared (for a definition elsewhere) when
 * CONFIG_BLK_DEV_INTEGRITY is enabled; otherwise it is an empty inline stub.
 */
#ifdef CONFIG_BLK_DEV_INTEGRITY
void blk_flush_integrity(void);
#else /* !CONFIG_BLK_DEV_INTEGRITY */
static inline void blk_flush_integrity(void) { }
#endif /* CONFIG_BLK_DEV_INTEGRITY */
92

93
void blk_timeout_work(struct work_struct *work);
94
unsigned long blk_rq_timeout(unsigned long timeout);
95
void blk_add_timer(struct request *req);
J
Jens Axboe 已提交
96 97
void blk_delete_timer(struct request *);

98 99 100 101 102

bool bio_attempt_front_merge(struct request_queue *q, struct request *req,
			     struct bio *bio);
bool bio_attempt_back_merge(struct request_queue *q, struct request *req,
			    struct bio *bio);
103 104
bool bio_attempt_discard_merge(struct request_queue *q, struct request *req,
		struct bio *bio);
105
bool blk_attempt_plug_merge(struct request_queue *q, struct bio *bio,
			    unsigned int *request_count,
			    struct request **same_queue_rq);
108
unsigned int blk_plug_queued_count(struct request_queue *q);
109 110 111 112 113

void blk_account_io_start(struct request *req, bool new_io);
void blk_account_io_completion(struct request *req, unsigned int bytes);
void blk_account_io_done(struct request *req);

J
Jens Axboe 已提交
114 115 116 117 118
/*
 * Internal atomic flags for request handling.
 *
 * REQ_ATOM_COMPLETE is used as a bit number within rq->atomic_flags (see
 * blk_mark_rq_complete()); the other enumerators are presumably bit
 * numbers in the same word.
 */
enum rq_atomic_flags {
	REQ_ATOM_COMPLETE = 0,
	REQ_ATOM_STARTED,
	REQ_ATOM_POLL_SLEPT,
};

/*
 * EH timer and IO completion will both attempt to 'grab' the request; make
 * sure that only one of them succeeds.
 *
 * Atomically sets REQ_ATOM_COMPLETE in rq->atomic_flags and returns the
 * bit's previous value, so a zero return means this caller won the race.
 */
static inline int blk_mark_rq_complete(struct request *rq)
{
	int was_complete;

	was_complete = test_and_set_bit(REQ_ATOM_COMPLETE, &rq->atomic_flags);
	return was_complete;
}

/* Clear REQ_ATOM_COMPLETE in rq->atomic_flags again. */
static inline void blk_clear_rq_complete(struct request *rq)
{
	unsigned long *flags = &rq->atomic_flags;

	clear_bit(REQ_ATOM_COMPLETE, flags);
}
J
Jens Axboe 已提交
136

137 138 139
/*
 * Internal elevator interface
 */
140
/* Non-zero when @rq has RQF_HASHED set in its rq_flags */
#define ELV_ON_HASH(rq) ((rq)->rq_flags & RQF_HASHED)
141

142
void blk_insert_flush(struct request *rq);
T
Tejun Heo 已提交
143

144 145 146
static inline struct request *__elv_next_request(struct request_queue *q)
{
	struct request *rq;
147
	struct blk_flush_queue *fq = blk_get_flush_queue(q, NULL);
148 149

	while (1) {
150
		if (!list_empty(&q->queue_head)) {
151
			rq = list_entry_rq(q->queue_head.next);
152
			return rq;
153 154
		}

155 156 157 158 159 160 161 162 163 164 165 166 167 168 169
		/*
		 * Flush request is running and flush request isn't queueable
		 * in the drive, we can hold the queue till flush request is
		 * finished. Even we don't do this, driver can't dispatch next
		 * requests and will requeue them. And this can improve
		 * throughput too. For example, we have request flush1, write1,
		 * flush 2. flush1 is dispatched, then queue is hold, write1
		 * isn't inserted to queue. After flush1 is finished, flush2
		 * will be dispatched. Since disk cache is already clean,
		 * flush2 will be finished very soon, so looks like flush2 is
		 * folded to flush1.
		 * Since the queue is hold, a flag is set to indicate the queue
		 * should be restarted later. Please see flush_end_io() for
		 * details.
		 */
170
		if (fq->flush_pending_idx != fq->flush_running_idx &&
171
				!queue_flush_queueable(q)) {
172
			fq->flush_queue_delayed = 1;
173 174
			return NULL;
		}
175
		if (unlikely(blk_queue_bypass(q)) ||
176
		    !q->elevator->type->ops.sq.elevator_dispatch_fn(q, 0))
177 178 179 180 181 182 183 184
			return NULL;
	}
}

static inline void elv_activate_rq(struct request_queue *q, struct request *rq)
{
	struct elevator_queue *e = q->elevator;

185 186
	if (e->type->ops.sq.elevator_activate_req_fn)
		e->type->ops.sq.elevator_activate_req_fn(q, rq);
187 188 189 190 191 192
}

static inline void elv_deactivate_rq(struct request_queue *q, struct request *rq)
{
	struct elevator_queue *e = q->elevator;

193 194
	if (e->type->ops.sq.elevator_deactivate_req_fn)
		e->type->ops.sq.elevator_deactivate_req_fn(q, rq);
195 196
}

197 198 199 200 201 202 203 204 205 206 207 208
#ifdef CONFIG_FAIL_IO_TIMEOUT
int blk_should_fake_timeout(struct request_queue *q);
ssize_t part_timeout_show(struct device *dev, struct device_attribute *attr,
			  char *buf);
ssize_t part_timeout_store(struct device *dev, struct device_attribute *attr,
			   const char *buf, size_t count);
#else /* !CONFIG_FAIL_IO_TIMEOUT */
/* With CONFIG_FAIL_IO_TIMEOUT disabled this always reports 0 */
static inline int
blk_should_fake_timeout(struct request_queue *q)
{
	return 0;
}
#endif /* CONFIG_FAIL_IO_TIMEOUT */

209 210 211 212
int ll_back_merge_fn(struct request_queue *q, struct request *req,
		     struct bio *bio);
int ll_front_merge_fn(struct request_queue *q, struct request *req, 
		      struct bio *bio);
213 214
struct request *attempt_back_merge(struct request_queue *q, struct request *rq);
struct request *attempt_front_merge(struct request_queue *q, struct request *rq);
215 216
int blk_attempt_req_merge(struct request_queue *q, struct request *rq,
				struct request *next);
217
void blk_recalc_rq_segments(struct request *rq);
218
void blk_rq_set_mixed_merge(struct request *rq);
219
bool blk_rq_merge_ok(struct request *rq, struct bio *bio);
220
enum elv_merge blk_try_merge(struct request *rq, struct bio *bio);
221

222 223
void blk_queue_congestion_threshold(struct request_queue *q);

224 225
int blk_dev_init(void);

226

227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244
/*
 * Return the threshold (number of used requests) at which the queue is
 * considered to be congested.  It includes a little hysteresis to keep
 * the context switch rate down.
 */
static inline int queue_congestion_on_threshold(struct request_queue *q)
{
	int on_threshold = q->nr_congestion_on;

	return on_threshold;
}

/*
 * Return the threshold at which a queue is considered to be uncongested
 * again (q->nr_congestion_off).
 */
static inline int queue_congestion_off_threshold(struct request_queue *q)
{
	int off_threshold = q->nr_congestion_off;

	return off_threshold;
}

245 246
extern int blk_update_nr_requests(struct request_queue *, unsigned int);

247 248 249 250 251
/*
 * Contribute to IO statistics IFF:
 *
 *	a) it's attached to a gendisk, and
 *	b) the queue had IO stats enabled when this request was started, and
252
 *	c) it's a file system request
253
 */
254
static inline int blk_do_io_stat(struct request *rq)
255
{
256
	return rq->rq_disk &&
257
	       (rq->rq_flags & RQF_IO_STAT) &&
258
		!blk_rq_is_passthrough(rq);
259 260
}

261 262 263 264 265 266 267
/*
 * Flag @req with REQ_NOMERGE and, if @q currently caches it as its
 * last_merge request, drop that cached pointer.
 */
static inline void req_set_nomerge(struct request_queue *q, struct request *req)
{
	req->cmd_flags |= REQ_NOMERGE;

	if (q->last_merge == req) {
		q->last_merge = NULL;
	}
}

268 269 270 271
/*
 * Internal io_context interface
 */
void get_io_context(struct io_context *ioc);
272
struct io_cq *ioc_lookup_icq(struct io_context *ioc, struct request_queue *q);
273 274
struct io_cq *ioc_create_icq(struct io_context *ioc, struct request_queue *q,
			     gfp_t gfp_mask);
275
void ioc_clear_queue(struct request_queue *q);
276

277
int create_task_io_context(struct task_struct *task, gfp_t gfp_mask, int node);
278

J
Jens Axboe 已提交
279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294
/**
 * rq_ioc - determine io_context for request allocation
 * @bio: request being allocated is for this bio (can be %NULL)
 *
 * Determine io_context to use for request allocation for @bio.  May return
 * %NULL if %current->io_context doesn't exist.
 */
static inline struct io_context *rq_ioc(struct bio *bio)
{
#ifdef CONFIG_BLK_CGROUP
	if (bio && bio->bi_ioc)
		return bio->bi_ioc;
#endif
	return current->io_context;
}

295 296 297 298 299
/**
 * create_io_context - try to create task->io_context
 * @gfp_mask: allocation mask
 * @node: allocation node
 *
300 301 302
 * If %current->io_context is %NULL, allocate a new io_context and install
 * it.  Returns the current %current->io_context which may be %NULL if
 * allocation failed.
303 304
 *
 * Note that this function can't be called with IRQ disabled because
305
 * task_lock which protects %current->io_context is IRQ-unsafe.
306
 */
307
static inline struct io_context *create_io_context(gfp_t gfp_mask, int node)
308 309
{
	WARN_ON_ONCE(irqs_disabled());
310 311 312
	if (unlikely(!current->io_context))
		create_task_io_context(current, gfp_mask, node);
	return current->io_context;
313 314 315 316 317
}

/*
 * Internal throttling interface
 */
#ifdef CONFIG_BLK_DEV_THROTTLING
extern void blk_throtl_drain(struct request_queue *q);
extern int blk_throtl_init(struct request_queue *q);
extern void blk_throtl_exit(struct request_queue *q);
#else /* CONFIG_BLK_DEV_THROTTLING */
/* Throttling compiled out: empty stubs, with init reporting 0 */
static inline void blk_throtl_drain(struct request_queue *q) { }
static inline int blk_throtl_init(struct request_queue *q) { return 0; }
static inline void blk_throtl_exit(struct request_queue *q) { }
#endif /* CONFIG_BLK_DEV_THROTTLING */

#endif /* BLK_INTERNAL_H */