#ifndef _LINUX_BLKDEV_H
#define _LINUX_BLKDEV_H

#include <linux/sched.h>

#ifdef CONFIG_BLOCK

#include <linux/major.h>
#include <linux/genhd.h>
#include <linux/list.h>
#include <linux/llist.h>
#include <linux/timer.h>
#include <linux/workqueue.h>
#include <linux/pagemap.h>
#include <linux/backing-dev.h>
#include <linux/wait.h>
#include <linux/mempool.h>
#include <linux/bio.h>
#include <linux/stringify.h>
#include <linux/gfp.h>
#include <linux/bsg.h>
#include <linux/smp.h>
#include <linux/rcupdate.h>

#include <asm/scatterlist.h>

struct module;
struct scsi_ioctl_command;

struct request_queue;
struct elevator_queue;
struct request_pm_state;
struct blk_trace;
struct request;
struct sg_io_hdr;
struct bsg_job;
struct blkcg_gq;

#define BLKDEV_MIN_RQ	4
#define BLKDEV_MAX_RQ	128	/* Default maximum */

/*
 * Maximum number of blkcg policies allowed to be registered concurrently.
 * Defined here to simplify include dependency.
 */
#define BLKCG_MAX_POLS	2

struct request;
typedef void (rq_end_io_fn)(struct request *, int);

#define BLK_RL_SYNCFULL		(1U << 0)
#define BLK_RL_ASYNCFULL	(1U << 1)

struct request_list {
	struct request_queue	*q;	/* the queue this rl belongs to */
#ifdef CONFIG_BLK_CGROUP
	struct blkcg_gq		*blkg;	/* blkg this request pool belongs to */
#endif
	/*
	 * count[], starved[], and wait[] are indexed by
	 * BLK_RW_SYNC/BLK_RW_ASYNC
	 */
	int			count[2];
	int			starved[2];
	mempool_t		*rq_pool;
	wait_queue_head_t	wait[2];
	unsigned int		flags;
};

/*
 * request command types
 */
enum rq_cmd_type_bits {
	REQ_TYPE_FS		= 1,	/* fs request */
	REQ_TYPE_BLOCK_PC,		/* scsi command */
	REQ_TYPE_SENSE,			/* sense request */
	REQ_TYPE_PM_SUSPEND,		/* suspend request */
	REQ_TYPE_PM_RESUME,		/* resume request */
	REQ_TYPE_PM_SHUTDOWN,		/* shutdown request */
	REQ_TYPE_SPECIAL,		/* driver defined type */
	/*
	 * for ATA/ATAPI devices. this really doesn't belong here, ide should
	 * use REQ_TYPE_SPECIAL and use rq->cmd[0] with the range of driver
	 * private REQ_LB opcodes to differentiate what type of request this is
	 */
	REQ_TYPE_ATA_TASKFILE,
	REQ_TYPE_ATA_PC,
};

#define BLK_MAX_CDB	16

/*
 * try to put the fields that are referenced together in the same cacheline.
 * if you modify this structure, be sure to check block/blk-core.c:blk_rq_init()
 * as well!
 */
struct request {
	union {
		struct list_head queuelist;
		struct llist_node ll_list;
	};
	union {
		struct call_single_data csd;
		struct work_struct mq_flush_data;
	};

	struct request_queue *q;
	struct blk_mq_ctx *mq_ctx;

	u64 cmd_flags;
	enum rq_cmd_type_bits cmd_type;
	unsigned long atomic_flags;

	int cpu;

	/* the following two fields are internal, NEVER access directly */
	unsigned int __data_len;	/* total data len */
	sector_t __sector;		/* sector cursor */

	struct bio *bio;
	struct bio *biotail;

	struct hlist_node hash;	/* merge hash */
	/*
	 * The rb_node is only used inside the io scheduler, requests
	 * are pruned when moved to the dispatch queue. So let the
	 * completion_data share space with the rb_node.
	 */
	union {
		struct rb_node rb_node;	/* sort/lookup */
		void *completion_data;
	};

	/*
	 * Three pointers are available for the IO schedulers, if they need
	 * more they have to dynamically allocate it.  Flush requests are
	 * never put on the IO scheduler. So let the flush fields share
	 * space with the elevator data.
	 */
	union {
		struct {
			struct io_cq		*icq;
			void			*priv[2];
		} elv;

		struct {
			unsigned int		seq;
			struct list_head	list;
			rq_end_io_fn		*saved_end_io;
		} flush;
	};

	struct gendisk *rq_disk;
	struct hd_struct *part;
	unsigned long start_time;
#ifdef CONFIG_BLK_CGROUP
	struct request_list *rl;		/* rl this rq is alloced from */
	unsigned long long start_time_ns;
	unsigned long long io_start_time_ns;	/* when passed to hardware */
#endif
	/* Number of scatter-gather DMA addr+len pairs after
	 * physical address coalescing is performed.
	 */
	unsigned short nr_phys_segments;
#if defined(CONFIG_BLK_DEV_INTEGRITY)
	unsigned short nr_integrity_segments;
#endif

	unsigned short ioprio;

	void *special;		/* opaque pointer available for LLD use */
	char *buffer;		/* kaddr of the current segment if available */

	int tag;
	int errors;

	/*
	 * when request is used as a packet command carrier
	 */
	unsigned char __cmd[BLK_MAX_CDB];
	unsigned char *cmd;
	unsigned short cmd_len;

	unsigned int extra_len;	/* length of alignment and padding */
	unsigned int sense_len;
	unsigned int resid_len;	/* residual count */
	void *sense;

	unsigned long deadline;
	struct list_head timeout_list;
	unsigned int timeout;
	int retries;

	/*
	 * completion callback.
	 */
	rq_end_io_fn *end_io;
	void *end_io_data;

	/* for bidi */
	struct request *next_rq;
};

static inline unsigned short req_get_ioprio(struct request *req)
{
	return req->ioprio;
}

/*
 * State information carried for REQ_TYPE_PM_SUSPEND and REQ_TYPE_PM_RESUME
 * requests.  Some step values could eventually be made generic.
 */
struct request_pm_state
{
	/* PM state machine step value, currently driver specific */
	int	pm_step;
	/* requested PM state value (S1, S2, S3, S4, ...) */
	u32	pm_state;
	void	*data;		/* for driver use */
};

#include <linux/elevator.h>

struct blk_queue_ctx;

typedef void (request_fn_proc) (struct request_queue *q);
typedef void (make_request_fn) (struct request_queue *q, struct bio *bio);
typedef int (prep_rq_fn) (struct request_queue *, struct request *);
typedef void (unprep_rq_fn) (struct request_queue *, struct request *);

struct bio_vec;
struct bvec_merge_data {
	struct block_device *bi_bdev;
	sector_t bi_sector;
	unsigned bi_size;
	unsigned long bi_rw;
};
typedef int (merge_bvec_fn) (struct request_queue *, struct bvec_merge_data *,
			     struct bio_vec *);
typedef void (softirq_done_fn)(struct request *);
typedef int (dma_drain_needed_fn)(struct request *);
typedef int (lld_busy_fn) (struct request_queue *q);
typedef int (bsg_job_fn) (struct bsg_job *);

enum blk_eh_timer_return {
	BLK_EH_NOT_HANDLED,
	BLK_EH_HANDLED,
	BLK_EH_RESET_TIMER,
};

typedef enum blk_eh_timer_return (rq_timed_out_fn)(struct request *);

enum blk_queue_state {
	Queue_down,
	Queue_up,
};

struct blk_queue_tag {
	struct request **tag_index;	/* map of busy tags */
	unsigned long *tag_map;		/* bit map of free/busy tags */
	int busy;			/* current depth */
	int max_depth;			/* what we will send to device */
	int real_max_depth;		/* what the array can hold */
	atomic_t refcnt;		/* map can be shared */
};

#define BLK_SCSI_MAX_CMDS	(256)
#define BLK_SCSI_CMD_PER_LONG	(BLK_SCSI_MAX_CMDS / (sizeof(long) * 8))

struct queue_limits {
	unsigned long		bounce_pfn;
	unsigned long		seg_boundary_mask;

	unsigned int		max_hw_sectors;
	unsigned int		max_sectors;
	unsigned int		max_segment_size;
	unsigned int		physical_block_size;
	unsigned int		alignment_offset;
	unsigned int		io_min;
	unsigned int		io_opt;
	unsigned int		max_discard_sectors;
	unsigned int		max_write_same_sectors;
	unsigned int		discard_granularity;
	unsigned int		discard_alignment;

	unsigned short		logical_block_size;
	unsigned short		max_segments;
	unsigned short		max_integrity_segments;

	unsigned char		misaligned;
	unsigned char		discard_misaligned;
	unsigned char		cluster;
	unsigned char		discard_zeroes_data;
};

struct request_queue {
	/*
	 * Together with queue_head for cacheline sharing
	 */
	struct list_head	queue_head;
	struct request		*last_merge;
	struct elevator_queue	*elevator;
	int			nr_rqs[2];	/* # allocated [a]sync rqs */
	int			nr_rqs_elvpriv;	/* # allocated rqs w/ elvpriv */

	/*
	 * If blkcg is not used, @q->root_rl serves all requests.  If blkcg
	 * is used, root blkg allocates from @q->root_rl and all other
	 * blkgs from their own blkg->rl.  Which one to use should be
	 * determined using bio_request_list().
	 */
	struct request_list	root_rl;

	request_fn_proc		*request_fn;
	make_request_fn		*make_request_fn;
	prep_rq_fn		*prep_rq_fn;
	unprep_rq_fn		*unprep_rq_fn;
	merge_bvec_fn		*merge_bvec_fn;
	softirq_done_fn		*softirq_done_fn;
	rq_timed_out_fn		*rq_timed_out_fn;
	dma_drain_needed_fn	*dma_drain_needed;
	lld_busy_fn		*lld_busy_fn;

	struct blk_mq_ops	*mq_ops;

	unsigned int		*mq_map;

	/* sw queues */
	struct blk_mq_ctx	*queue_ctx;
	unsigned int		nr_queues;

	/* hw dispatch queues */
	struct blk_mq_hw_ctx	**queue_hw_ctx;
	unsigned int		nr_hw_queues;

	/*
	 * Dispatch queue sorting
	 */
	sector_t		end_sector;
	struct request		*boundary_rq;

	/*
	 * Delayed queue handling
	 */
	struct delayed_work	delay_work;

	struct backing_dev_info	backing_dev_info;

	/*
	 * The queue owner gets to use this for whatever they like.
	 * ll_rw_blk doesn't touch it.
	 */
	void			*queuedata;

	/*
	 * various queue flags, see QUEUE_* below
	 */
	unsigned long		queue_flags;

	/*
	 * ida allocated id for this queue.  Used to index queues from
	 * ioctx.
	 */
	int			id;

	/*
	 * queue needs bounce pages for pages above this limit
	 */
	gfp_t			bounce_gfp;

	/*
	 * protects queue structures from reentrancy. ->__queue_lock should
	 * _never_ be used directly, it is queue private. always use
	 * ->queue_lock.
	 */
	spinlock_t		__queue_lock;
	spinlock_t		*queue_lock;

	/*
	 * queue kobject
	 */
	struct kobject		kobj;

	/*
	 * mq queue kobject
	 */
	struct kobject		mq_kobj;

#ifdef CONFIG_PM_RUNTIME
	struct device		*dev;
	int			rpm_status;
	unsigned int		nr_pending;
#endif

	/*
	 * queue settings
	 */
	unsigned long		nr_requests;	/* Max # of requests */
	unsigned int		nr_congestion_on;
	unsigned int		nr_congestion_off;
	unsigned int		nr_batching;

	unsigned int		dma_drain_size;
	void			*dma_drain_buffer;
	unsigned int		dma_pad_mask;
	unsigned int		dma_alignment;

	struct blk_queue_tag	*queue_tags;
	struct list_head	tag_busy_list;

	unsigned int		nr_sorted;
	unsigned int		in_flight[2];
	/*
	 * Number of active block driver functions for which blk_drain_queue()
	 * must wait. Must be incremented around functions that unlock the
	 * queue_lock internally, e.g. scsi_request_fn().
	 */
	unsigned int		request_fn_active;

	unsigned int		rq_timeout;
	struct timer_list	timeout;
	struct list_head	timeout_list;

	struct list_head	icq_list;
#ifdef CONFIG_BLK_CGROUP
	DECLARE_BITMAP		(blkcg_pols, BLKCG_MAX_POLS);
	struct blkcg_gq		*root_blkg;
	struct list_head	blkg_list;
#endif

	struct queue_limits	limits;

	/*
	 * sg stuff
	 */
	unsigned int		sg_timeout;
	unsigned int		sg_reserved_size;
	int			node;
#ifdef CONFIG_BLK_DEV_IO_TRACE
	struct blk_trace	*blk_trace;
#endif
	/*
	 * for flush operations
	 */
	unsigned int		flush_flags;
	unsigned int		flush_not_queueable:1;
	unsigned int		flush_queue_delayed:1;
	unsigned int		flush_pending_idx:1;
	unsigned int		flush_running_idx:1;
	unsigned long		flush_pending_since;
	struct list_head	flush_queue[2];
	struct list_head	flush_data_in_flight;
	union {
		struct request	flush_rq;
		struct {
			spinlock_t mq_flush_lock;
			struct work_struct mq_flush_work;
		};
	};

	struct mutex		sysfs_lock;

	int			bypass_depth;

#if defined(CONFIG_BLK_DEV_BSG)
	bsg_job_fn		*bsg_job_fn;
	int			bsg_job_size;
	struct bsg_class_device bsg_dev;
#endif

#ifdef CONFIG_BLK_DEV_THROTTLING
	/* Throttle data */
	struct throtl_data	*td;
#endif
	struct rcu_head		rcu_head;
	wait_queue_head_t	mq_freeze_wq;
	struct percpu_counter	mq_usage_counter;
	struct list_head	all_q_node;
};

#define QUEUE_FLAG_QUEUED	1	/* uses generic tag queueing */
#define QUEUE_FLAG_STOPPED	2	/* queue is stopped */
#define QUEUE_FLAG_SYNCFULL	3	/* read queue has been filled */
#define QUEUE_FLAG_ASYNCFULL	4	/* write queue has been filled */
#define QUEUE_FLAG_DYING	5	/* queue being torn down */
#define QUEUE_FLAG_BYPASS	6	/* act as dumb FIFO queue */
#define QUEUE_FLAG_BIDI		7	/* queue supports bidi requests */
#define QUEUE_FLAG_NOMERGES	8	/* disable merge attempts */
#define QUEUE_FLAG_SAME_COMP	9	/* complete on same CPU-group */
#define QUEUE_FLAG_FAIL_IO	10	/* fake timeout */
#define QUEUE_FLAG_STACKABLE	11	/* supports request stacking */
#define QUEUE_FLAG_NONROT	12	/* non-rotational device (SSD) */
#define QUEUE_FLAG_VIRT		QUEUE_FLAG_NONROT /* paravirt device */
#define QUEUE_FLAG_IO_STAT	13	/* do IO stats */
#define QUEUE_FLAG_DISCARD	14	/* supports DISCARD */
#define QUEUE_FLAG_NOXMERGES	15	/* No extended merges */
#define QUEUE_FLAG_ADD_RANDOM	16	/* Contributes to random pool */
#define QUEUE_FLAG_SECDISCARD	17	/* supports SECDISCARD */
#define QUEUE_FLAG_SAME_FORCE	18	/* force complete on same CPU */
#define QUEUE_FLAG_DEAD		19	/* queue tear-down finished */
#define QUEUE_FLAG_INIT_DONE	20	/* queue is initialized */

#define QUEUE_FLAG_DEFAULT	((1 << QUEUE_FLAG_IO_STAT) |		\
				 (1 << QUEUE_FLAG_STACKABLE)	|	\
				 (1 << QUEUE_FLAG_SAME_COMP)	|	\
				 (1 << QUEUE_FLAG_ADD_RANDOM))

#define QUEUE_FLAG_MQ_DEFAULT	((1 << QUEUE_FLAG_IO_STAT) |		\
				 (1 << QUEUE_FLAG_SAME_COMP))

static inline void queue_lockdep_assert_held(struct request_queue *q)
{
	if (q->queue_lock)
		lockdep_assert_held(q->queue_lock);
}

static inline void queue_flag_set_unlocked(unsigned int flag,
					   struct request_queue *q)
{
	__set_bit(flag, &q->queue_flags);
}

static inline int queue_flag_test_and_clear(unsigned int flag,
					    struct request_queue *q)
{
	queue_lockdep_assert_held(q);

	if (test_bit(flag, &q->queue_flags)) {
		__clear_bit(flag, &q->queue_flags);
		return 1;
	}

	return 0;
}

static inline int queue_flag_test_and_set(unsigned int flag,
					  struct request_queue *q)
{
	queue_lockdep_assert_held(q);

	if (!test_bit(flag, &q->queue_flags)) {
		__set_bit(flag, &q->queue_flags);
		return 0;
	}

	return 1;
}

static inline void queue_flag_set(unsigned int flag, struct request_queue *q)
{
	queue_lockdep_assert_held(q);
	__set_bit(flag, &q->queue_flags);
}

static inline void queue_flag_clear_unlocked(unsigned int flag,
					     struct request_queue *q)
{
	__clear_bit(flag, &q->queue_flags);
}

static inline int queue_in_flight(struct request_queue *q)
{
	return q->in_flight[0] + q->in_flight[1];
}

static inline void queue_flag_clear(unsigned int flag, struct request_queue *q)
{
	queue_lockdep_assert_held(q);
	__clear_bit(flag, &q->queue_flags);
}

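/*
 * Usage sketch (not part of this header): a driver typically sets per-queue
 * feature flags right after allocating its queue, before any I/O can reach
 * it, so the unlocked variants are sufficient there.  "q" is assumed to be
 * the freshly allocated queue.
 *
 *	queue_flag_set_unlocked(QUEUE_FLAG_NONROT, q);
 *	queue_flag_clear_unlocked(QUEUE_FLAG_ADD_RANDOM, q);
 *
 * Once the queue is live, flags must be changed under q->queue_lock so the
 * lockdep assertion in queue_flag_set()/queue_flag_clear() holds.
 */
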
#define blk_queue_tagged(q)	test_bit(QUEUE_FLAG_QUEUED, &(q)->queue_flags)
#define blk_queue_stopped(q)	test_bit(QUEUE_FLAG_STOPPED, &(q)->queue_flags)
#define blk_queue_dying(q)	test_bit(QUEUE_FLAG_DYING, &(q)->queue_flags)
#define blk_queue_dead(q)	test_bit(QUEUE_FLAG_DEAD, &(q)->queue_flags)
#define blk_queue_bypass(q)	test_bit(QUEUE_FLAG_BYPASS, &(q)->queue_flags)
#define blk_queue_init_done(q)	test_bit(QUEUE_FLAG_INIT_DONE, &(q)->queue_flags)
#define blk_queue_nomerges(q)	test_bit(QUEUE_FLAG_NOMERGES, &(q)->queue_flags)
#define blk_queue_noxmerges(q)	\
	test_bit(QUEUE_FLAG_NOXMERGES, &(q)->queue_flags)
#define blk_queue_nonrot(q)	test_bit(QUEUE_FLAG_NONROT, &(q)->queue_flags)
#define blk_queue_io_stat(q)	test_bit(QUEUE_FLAG_IO_STAT, &(q)->queue_flags)
#define blk_queue_add_random(q)	test_bit(QUEUE_FLAG_ADD_RANDOM, &(q)->queue_flags)
#define blk_queue_stackable(q)	\
	test_bit(QUEUE_FLAG_STACKABLE, &(q)->queue_flags)
#define blk_queue_discard(q)	test_bit(QUEUE_FLAG_DISCARD, &(q)->queue_flags)
#define blk_queue_secdiscard(q)	(blk_queue_discard(q) && \
	test_bit(QUEUE_FLAG_SECDISCARD, &(q)->queue_flags))

#define blk_noretry_request(rq) \
	((rq)->cmd_flags & (REQ_FAILFAST_DEV|REQ_FAILFAST_TRANSPORT| \
			     REQ_FAILFAST_DRIVER))

#define blk_account_rq(rq) \
	(((rq)->cmd_flags & REQ_STARTED) && \
	 ((rq)->cmd_type == REQ_TYPE_FS))

#define blk_pm_request(rq) \
	((rq)->cmd_type == REQ_TYPE_PM_SUSPEND || \
	 (rq)->cmd_type == REQ_TYPE_PM_RESUME)

#define blk_rq_cpu_valid(rq)	((rq)->cpu != -1)
#define blk_bidi_rq(rq)		((rq)->next_rq != NULL)
/* rq->queuelist of dequeued request must be list_empty() */
#define blk_queued_rq(rq)	(!list_empty(&(rq)->queuelist))

#define list_entry_rq(ptr)	list_entry((ptr), struct request, queuelist)

#define rq_data_dir(rq)		(((rq)->cmd_flags & 1) != 0)

static inline unsigned int blk_queue_cluster(struct request_queue *q)
{
	return q->limits.cluster;
}

/*
 * We regard a request as sync if it is either a read or a sync write.
 */
static inline bool rw_is_sync(unsigned int rw_flags)
{
	return !(rw_flags & REQ_WRITE) || (rw_flags & REQ_SYNC);
}

static inline bool rq_is_sync(struct request *rq)
{
	return rw_is_sync(rq->cmd_flags);
}

static inline bool blk_rl_full(struct request_list *rl, bool sync)
{
	unsigned int flag = sync ? BLK_RL_SYNCFULL : BLK_RL_ASYNCFULL;

	return rl->flags & flag;
}

static inline void blk_set_rl_full(struct request_list *rl, bool sync)
{
	unsigned int flag = sync ? BLK_RL_SYNCFULL : BLK_RL_ASYNCFULL;

	rl->flags |= flag;
}

static inline void blk_clear_rl_full(struct request_list *rl, bool sync)
{
	unsigned int flag = sync ? BLK_RL_SYNCFULL : BLK_RL_ASYNCFULL;

	rl->flags &= ~flag;
}

static inline bool rq_mergeable(struct request *rq)
{
	if (rq->cmd_type != REQ_TYPE_FS)
		return false;

	if (rq->cmd_flags & REQ_NOMERGE_FLAGS)
		return false;

	return true;
}

static inline bool blk_check_merge_flags(unsigned int flags1,
					 unsigned int flags2)
{
	if ((flags1 & REQ_DISCARD) != (flags2 & REQ_DISCARD))
		return false;

	if ((flags1 & REQ_SECURE) != (flags2 & REQ_SECURE))
		return false;

	if ((flags1 & REQ_WRITE_SAME) != (flags2 & REQ_WRITE_SAME))
		return false;

	return true;
}

static inline bool blk_write_same_mergeable(struct bio *a, struct bio *b)
{
	if (bio_data(a) == bio_data(b))
		return true;

	return false;
}

/*
 * q->prep_rq_fn return values
 */
#define BLKPREP_OK		0	/* serve it */
#define BLKPREP_KILL		1	/* fatal error, kill */
#define BLKPREP_DEFER		2	/* leave on queue */

extern unsigned long blk_max_low_pfn, blk_max_pfn;

/*
 * standard bounce addresses:
 *
 * BLK_BOUNCE_HIGH	: bounce all highmem pages
 * BLK_BOUNCE_ANY	: don't bounce anything
 * BLK_BOUNCE_ISA	: bounce pages above ISA DMA boundary
 */

#if BITS_PER_LONG == 32
#define BLK_BOUNCE_HIGH		((u64)blk_max_low_pfn << PAGE_SHIFT)
#else
#define BLK_BOUNCE_HIGH		-1ULL
#endif
#define BLK_BOUNCE_ANY		(-1ULL)
#define BLK_BOUNCE_ISA		(DMA_BIT_MASK(24))

/*
 * default timeout for SG_IO if none specified
 */
#define BLK_DEFAULT_SG_TIMEOUT	(60 * HZ)
#define BLK_MIN_SG_TIMEOUT	(7 * HZ)

#ifdef CONFIG_BOUNCE
extern int init_emergency_isa_pool(void);
extern void blk_queue_bounce(struct request_queue *q, struct bio **bio);
#else
static inline int init_emergency_isa_pool(void)
{
	return 0;
}
static inline void blk_queue_bounce(struct request_queue *q, struct bio **bio)
{
}
#endif /* CONFIG_BOUNCE */

struct rq_map_data {
	struct page **pages;
	int page_order;
	int nr_entries;
	unsigned long offset;
	int null_mapped;
	int from_user;
};

struct req_iterator {
	struct bvec_iter iter;
	struct bio *bio;
};

/* This should not be used directly - use rq_for_each_segment */
#define for_each_bio(_bio)		\
	for (; _bio; _bio = _bio->bi_next)
#define __rq_for_each_bio(_bio, rq)	\
	if ((rq->bio))			\
		for (_bio = (rq)->bio; _bio; _bio = _bio->bi_next)

#define rq_for_each_segment(bvl, _rq, _iter)			\
	__rq_for_each_bio(_iter.bio, _rq)			\
		bio_for_each_segment(bvl, _iter.bio, _iter.iter)

#define rq_iter_last(bvec, _iter)				\
		(_iter.bio->bi_next == NULL &&			\
		 bio_iter_last(bvec, _iter.iter))

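/*
 * Usage sketch (not part of this header): walk every bio_vec of every bio
 * in a request and add up the data length.  With the immutable biovec
 * iterators (struct bvec_iter) the loop variable is a struct bio_vec by
 * value, not a pointer.  "rq" is assumed to be a request owned by the
 * caller.
 *
 *	struct req_iterator iter;
 *	struct bio_vec bvec;
 *	unsigned int bytes = 0;
 *
 *	rq_for_each_segment(bvec, rq, iter)
 *		bytes += bvec.bv_len;
 */
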
#ifndef ARCH_IMPLEMENTS_FLUSH_DCACHE_PAGE
# error	"You should define ARCH_IMPLEMENTS_FLUSH_DCACHE_PAGE for your platform"
#endif
#if ARCH_IMPLEMENTS_FLUSH_DCACHE_PAGE
extern void rq_flush_dcache_pages(struct request *rq);
#else
static inline void rq_flush_dcache_pages(struct request *rq)
{
}
#endif

extern int blk_register_queue(struct gendisk *disk);
extern void blk_unregister_queue(struct gendisk *disk);
extern void generic_make_request(struct bio *bio);
extern void blk_rq_init(struct request_queue *q, struct request *rq);
extern void blk_put_request(struct request *);
extern void __blk_put_request(struct request_queue *, struct request *);
extern struct request *blk_get_request(struct request_queue *, int, gfp_t);
extern struct request *blk_make_request(struct request_queue *, struct bio *,
					gfp_t);
extern void blk_requeue_request(struct request_queue *, struct request *);
extern void blk_add_request_payload(struct request *rq, struct page *page,
				    unsigned int len);
extern int blk_rq_check_limits(struct request_queue *q, struct request *rq);
extern int blk_lld_busy(struct request_queue *q);
extern int blk_rq_prep_clone(struct request *rq, struct request *rq_src,
			     struct bio_set *bs, gfp_t gfp_mask,
			     int (*bio_ctr)(struct bio *, struct bio *, void *),
			     void *data);
extern void blk_rq_unprep_clone(struct request *rq);
extern int blk_insert_cloned_request(struct request_queue *q,
				     struct request *rq);
extern void blk_delay_queue(struct request_queue *, unsigned long);
extern void blk_recount_segments(struct request_queue *, struct bio *);
extern int scsi_verify_blk_ioctl(struct block_device *, unsigned int);
extern int scsi_cmd_blk_ioctl(struct block_device *, fmode_t,
			      unsigned int, void __user *);
extern int scsi_cmd_ioctl(struct request_queue *, struct gendisk *, fmode_t,
			  unsigned int, void __user *);
extern int sg_scsi_ioctl(struct request_queue *, struct gendisk *, fmode_t,
			 struct scsi_ioctl_command __user *);

extern void blk_queue_bio(struct request_queue *q, struct bio *bio);

/*
 * A queue has just exited congestion.  Note this in the global counter of
 * congested queues, and wake up anyone who was waiting for requests to be
 * put back.
 */
static inline void blk_clear_queue_congested(struct request_queue *q, int sync)
{
	clear_bdi_congested(&q->backing_dev_info, sync);
}

/*
 * A queue has just entered congestion.  Flag that in the queue's VM-visible
 * state flags and increment the global counter of congested queues.
 */
static inline void blk_set_queue_congested(struct request_queue *q, int sync)
{
	set_bdi_congested(&q->backing_dev_info, sync);
}

extern void blk_start_queue(struct request_queue *q);
extern void blk_stop_queue(struct request_queue *q);
extern void blk_sync_queue(struct request_queue *q);
extern void __blk_stop_queue(struct request_queue *q);
extern void __blk_run_queue(struct request_queue *q);
extern void blk_run_queue(struct request_queue *);
extern void blk_run_queue_async(struct request_queue *q);
extern int blk_rq_map_user(struct request_queue *, struct request *,
			   struct rq_map_data *, void __user *, unsigned long,
			   gfp_t);
extern int blk_rq_unmap_user(struct bio *);
extern int blk_rq_map_kern(struct request_queue *, struct request *, void *, unsigned int, gfp_t);
extern int blk_rq_map_user_iov(struct request_queue *, struct request *,
			       struct rq_map_data *, struct sg_iovec *, int,
			       unsigned int, gfp_t);
extern int blk_execute_rq(struct request_queue *, struct gendisk *,
			  struct request *, int);
extern void blk_execute_rq_nowait(struct request_queue *, struct gendisk *,
				  struct request *, int, rq_end_io_fn *);

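/*
 * Usage sketch (not part of this header): synchronously issue a SCSI CDB
 * through the block layer.  Error handling is trimmed, and "cdb"/"cdb_len"
 * are assumed to be a caller-supplied command buffer no larger than
 * BLK_MAX_CDB.
 *
 *	struct request *rq;
 *
 *	rq = blk_get_request(q, READ, GFP_KERNEL);
 *	rq->cmd_type = REQ_TYPE_BLOCK_PC;
 *	memcpy(rq->cmd, cdb, cdb_len);
 *	rq->cmd_len = cdb_len;
 *	rq->timeout = BLK_DEFAULT_SG_TIMEOUT;
 *
 *	blk_execute_rq(q, NULL, rq, 0);
 *	blk_put_request(rq);
 */
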
static inline struct request_queue *bdev_get_queue(struct block_device *bdev)
{
	return bdev->bd_disk->queue;
}

/*
 * blk_rq_pos()			: the current sector
 * blk_rq_bytes()		: bytes left in the entire request
 * blk_rq_cur_bytes()		: bytes left in the current segment
 * blk_rq_err_bytes()		: bytes left till the next error boundary
 * blk_rq_sectors()		: sectors left in the entire request
 * blk_rq_cur_sectors()		: sectors left in the current segment
 */
static inline sector_t blk_rq_pos(const struct request *rq)
{
	return rq->__sector;
}

static inline unsigned int blk_rq_bytes(const struct request *rq)
{
	return rq->__data_len;
}

static inline int blk_rq_cur_bytes(const struct request *rq)
{
	return rq->bio ? bio_cur_bytes(rq->bio) : 0;
}

extern unsigned int blk_rq_err_bytes(const struct request *rq);

static inline unsigned int blk_rq_sectors(const struct request *rq)
{
	return blk_rq_bytes(rq) >> 9;
}

static inline unsigned int blk_rq_cur_sectors(const struct request *rq)
{
	return blk_rq_cur_bytes(rq) >> 9;
}

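/*
 * Usage sketch (not part of this header): a driver translating a request
 * into a hardware command reads the sector cursor and the remaining length
 * through these accessors instead of touching __sector/__data_len directly.
 * "my_hw_submit" is a hypothetical helper.
 *
 *	sector_t lba = blk_rq_pos(rq);
 *	unsigned int nr = blk_rq_sectors(rq);	(512-byte sectors)
 *
 *	my_hw_submit(lba, nr);
 */
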
static inline unsigned int blk_queue_get_max_sectors(struct request_queue *q,
						     unsigned int cmd_flags)
{
	if (unlikely(cmd_flags & REQ_DISCARD))
		return min(q->limits.max_discard_sectors, UINT_MAX >> 9);

	if (unlikely(cmd_flags & REQ_WRITE_SAME))
		return q->limits.max_write_same_sectors;

	return q->limits.max_sectors;
}

static inline unsigned int blk_rq_get_max_sectors(struct request *rq)
{
	struct request_queue *q = rq->q;

	if (unlikely(rq->cmd_type == REQ_TYPE_BLOCK_PC))
		return q->limits.max_hw_sectors;

	return blk_queue_get_max_sectors(q, rq->cmd_flags);
}

static inline unsigned int blk_rq_count_bios(struct request *rq)
{
	unsigned int nr_bios = 0;
	struct bio *bio;

	__rq_for_each_bio(bio, rq)
		nr_bios++;

	return nr_bios;
}

/*
 * Request issue related functions.
 */
extern struct request *blk_peek_request(struct request_queue *q);
extern void blk_start_request(struct request *rq);
extern struct request *blk_fetch_request(struct request_queue *q);

/*
 * Request completion related functions.
 *
 * blk_update_request() completes the given number of bytes and updates
 * the request without completing it.
 *
 * blk_end_request() and friends.  __blk_end_request() must be called
 * with the request queue spinlock acquired.
 *
 * Several drivers define their own end_request and call
 * blk_end_request() for parts of the original function.
 * This prevents code duplication in drivers.
 */
extern bool blk_update_request(struct request *rq, int error,
			       unsigned int nr_bytes);
extern bool blk_end_request(struct request *rq, int error,
			    unsigned int nr_bytes);
extern void blk_end_request_all(struct request *rq, int error);
extern bool blk_end_request_cur(struct request *rq, int error);
extern bool blk_end_request_err(struct request *rq, int error);
extern bool __blk_end_request(struct request *rq, int error,
			      unsigned int nr_bytes);
extern void __blk_end_request_all(struct request *rq, int error);
extern bool __blk_end_request_cur(struct request *rq, int error);
extern bool __blk_end_request_err(struct request *rq, int error);

extern void blk_complete_request(struct request *);
extern void __blk_complete_request(struct request *);
extern void blk_abort_request(struct request *);
extern void blk_unprep_request(struct request *);

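/*
 * Usage sketch (not part of this header): the classic request_fn loop of a
 * simple non-mq driver.  request_fn is entered with q->queue_lock held, so
 * requests are pulled with blk_fetch_request() and finished with the
 * __blk_end_* variants, which expect that lock to be held.
 * "do_one_request" is a hypothetical helper returning 0 or a negative errno.
 *
 *	static void my_request_fn(struct request_queue *q)
 *	{
 *		struct request *rq;
 *
 *		while ((rq = blk_fetch_request(q)) != NULL) {
 *			int err = do_one_request(rq);
 *
 *			__blk_end_request_all(rq, err);
 *		}
 *	}
 */
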
/*
 * Access functions for manipulating queue properties
 */
extern struct request_queue *blk_init_queue_node(request_fn_proc *rfn,
					spinlock_t *lock, int node_id);
extern struct request_queue *blk_init_queue(request_fn_proc *, spinlock_t *);
extern struct request_queue *blk_init_allocated_queue(struct request_queue *,
						      request_fn_proc *, spinlock_t *);
extern void blk_cleanup_queue(struct request_queue *);
extern void blk_queue_make_request(struct request_queue *, make_request_fn *);
extern void blk_queue_bounce_limit(struct request_queue *, u64);
extern void blk_limits_max_hw_sectors(struct queue_limits *, unsigned int);
extern void blk_queue_max_hw_sectors(struct request_queue *, unsigned int);
extern void blk_queue_max_segments(struct request_queue *, unsigned short);
extern void blk_queue_max_segment_size(struct request_queue *, unsigned int);
extern void blk_queue_max_discard_sectors(struct request_queue *q,
		unsigned int max_discard_sectors);
extern void blk_queue_max_write_same_sectors(struct request_queue *q,
		unsigned int max_write_same_sectors);
extern void blk_queue_logical_block_size(struct request_queue *, unsigned short);
extern void blk_queue_physical_block_size(struct request_queue *, unsigned int);
extern void blk_queue_alignment_offset(struct request_queue *q,
				       unsigned int alignment);
extern void blk_limits_io_min(struct queue_limits *limits, unsigned int min);
extern void blk_queue_io_min(struct request_queue *q, unsigned int min);
extern void blk_limits_io_opt(struct queue_limits *limits, unsigned int opt);
extern void blk_queue_io_opt(struct request_queue *q, unsigned int opt);
extern void blk_set_default_limits(struct queue_limits *lim);
extern void blk_set_stacking_limits(struct queue_limits *lim);
extern int blk_stack_limits(struct queue_limits *t, struct queue_limits *b,
			    sector_t offset);
extern int bdev_stack_limits(struct queue_limits *t, struct block_device *bdev,
			     sector_t offset);
extern void disk_stack_limits(struct gendisk *disk, struct block_device *bdev,
			      sector_t offset);
extern void blk_queue_stack_limits(struct request_queue *t, struct request_queue *b);
extern void blk_queue_dma_pad(struct request_queue *, unsigned int);
extern void blk_queue_update_dma_pad(struct request_queue *, unsigned int);
extern int blk_queue_dma_drain(struct request_queue *q,
			       dma_drain_needed_fn *dma_drain_needed,
			       void *buf, unsigned int size);
extern void blk_queue_lld_busy(struct request_queue *q, lld_busy_fn *fn);
extern void blk_queue_segment_boundary(struct request_queue *, unsigned long);
extern void blk_queue_prep_rq(struct request_queue *, prep_rq_fn *pfn);
extern void blk_queue_unprep_rq(struct request_queue *, unprep_rq_fn *ufn);
extern void blk_queue_merge_bvec(struct request_queue *, merge_bvec_fn *);
extern void blk_queue_dma_alignment(struct request_queue *, int);
extern void blk_queue_update_dma_alignment(struct request_queue *, int);
extern void blk_queue_softirq_done(struct request_queue *, softirq_done_fn *);
extern void blk_queue_rq_timed_out(struct request_queue *, rq_timed_out_fn *);
extern void blk_queue_rq_timeout(struct request_queue *, unsigned int);
extern void blk_queue_flush(struct request_queue *q, unsigned int flush);
extern void blk_queue_flush_queueable(struct request_queue *q, bool queueable);
extern struct backing_dev_info *blk_get_backing_dev_info(struct block_device *bdev);

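/*
 * Usage sketch (not part of this header): a single-queue driver usually
 * creates its queue and publishes its limits from probe.  The numbers are
 * illustrative only; "my_request_fn" and "my_lock" are hypothetical.
 *
 *	struct request_queue *q;
 *
 *	q = blk_init_queue(my_request_fn, &my_lock);
 *	if (!q)
 *		return -ENOMEM;
 *
 *	blk_queue_logical_block_size(q, 512);
 *	blk_queue_physical_block_size(q, 4096);
 *	blk_queue_max_hw_sectors(q, 1024);
 *	blk_queue_flush(q, REQ_FLUSH | REQ_FUA);
 */
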
extern int blk_rq_map_sg(struct request_queue *, struct request *, struct scatterlist *);
extern int blk_bio_map_sg(struct request_queue *q, struct bio *bio,
			  struct scatterlist *sglist);
extern void blk_dump_rq_flags(struct request *, char *);
extern long nr_blockdev_pages(void);

bool __must_check blk_get_queue(struct request_queue *);
struct request_queue *blk_alloc_queue(gfp_t);
struct request_queue *blk_alloc_queue_node(gfp_t, int);
extern void blk_put_queue(struct request_queue *);

/*
 * block layer runtime pm functions
 */
#ifdef CONFIG_PM_RUNTIME
extern void blk_pm_runtime_init(struct request_queue *q, struct device *dev);
extern int blk_pre_runtime_suspend(struct request_queue *q);
extern void blk_post_runtime_suspend(struct request_queue *q, int err);
extern void blk_pre_runtime_resume(struct request_queue *q);
extern void blk_post_runtime_resume(struct request_queue *q, int err);
#else
static inline void blk_pm_runtime_init(struct request_queue *q,
	struct device *dev) {}
static inline int blk_pre_runtime_suspend(struct request_queue *q)
{
	return -ENOSYS;
}
static inline void blk_post_runtime_suspend(struct request_queue *q, int err) {}
static inline void blk_pre_runtime_resume(struct request_queue *q) {}
static inline void blk_post_runtime_resume(struct request_queue *q, int err) {}
#endif

/*
 * blk_plug permits building a queue of related requests by holding the I/O
 * fragments for a short period.  This allows merging of sequential requests
 * into a single larger request.  As the requests are moved from a per-task
 * list to the device's request_queue in a batch, this results in improved
 * scalability as contention on the request_queue lock is reduced.
 *
 * It is ok not to disable preemption when adding the request to the plug list
 * or when attempting a merge, because blk_schedule_flush_plug() will only
 * flush the plug list when the task sleeps by itself.  For details, please
 * see schedule() where blk_schedule_flush_plug() is called.
 */
struct blk_plug {
	unsigned long magic;		/* detect uninitialized use-cases */
	struct list_head list;		/* requests */
	struct list_head mq_list;	/* blk-mq requests */
	struct list_head cb_list;	/* md requires an unplug callback */
};
#define BLK_MAX_REQUEST_COUNT 16

struct blk_plug_cb;
typedef void (*blk_plug_cb_fn)(struct blk_plug_cb *, bool);
struct blk_plug_cb {
	struct list_head list;
	blk_plug_cb_fn callback;
	void *data;
};
extern struct blk_plug_cb *blk_check_plugged(blk_plug_cb_fn unplug,
					     void *data, int size);
extern void blk_start_plug(struct blk_plug *);
extern void blk_finish_plug(struct blk_plug *);
extern void blk_flush_plug_list(struct blk_plug *, bool);

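/*
 * Usage sketch (not part of this header): a submitter batches a burst of
 * bios under one plug; the queued requests reach the driver when the plug
 * is finished (or earlier, if the task sleeps).  "bios" and "nr" are
 * assumed to be a caller-prepared array of fully initialized bios.
 *
 *	struct blk_plug plug;
 *	int i;
 *
 *	blk_start_plug(&plug);
 *	for (i = 0; i < nr; i++)
 *		submit_bio(bios[i]->bi_rw, bios[i]);
 *	blk_finish_plug(&plug);
 */
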
static inline void blk_flush_plug(struct task_struct *tsk)
{
	struct blk_plug *plug = tsk->plug;

	if (plug)
		blk_flush_plug_list(plug, false);
}

static inline void blk_schedule_flush_plug(struct task_struct *tsk)
{
	struct blk_plug *plug = tsk->plug;

	if (plug)
		blk_flush_plug_list(plug, true);
}

static inline bool blk_needs_flush_plug(struct task_struct *tsk)
{
	struct blk_plug *plug = tsk->plug;

	return plug &&
		(!list_empty(&plug->list) ||
		 !list_empty(&plug->mq_list) ||
		 !list_empty(&plug->cb_list));
}

/*
 * tag stuff
 */
#define blk_rq_tagged(rq)		((rq)->cmd_flags & REQ_QUEUED)
extern int blk_queue_start_tag(struct request_queue *, struct request *);
extern struct request *blk_queue_find_tag(struct request_queue *, int);
extern void blk_queue_end_tag(struct request_queue *, struct request *);
extern int blk_queue_init_tags(struct request_queue *, int, struct blk_queue_tag *);
extern void blk_queue_free_tags(struct request_queue *);
extern int blk_queue_resize_tags(struct request_queue *, int);
extern void blk_queue_invalidate_tags(struct request_queue *);
extern struct blk_queue_tag *blk_init_tags(int);
extern void blk_free_tags(struct blk_queue_tag *);

static inline struct request *blk_map_queue_find_tag(struct blk_queue_tag *bqt,
						     int tag)
{
	if (unlikely(bqt == NULL || tag >= bqt->real_max_depth))
		return NULL;
	return bqt->tag_index[tag];
}

#define BLKDEV_DISCARD_SECURE	0x01	/* secure discard */

extern int blkdev_issue_flush(struct block_device *, gfp_t, sector_t *);
extern int blkdev_issue_discard(struct block_device *bdev, sector_t sector,
		sector_t nr_sects, gfp_t gfp_mask, unsigned long flags);
extern int blkdev_issue_write_same(struct block_device *bdev, sector_t sector,
		sector_t nr_sects, gfp_t gfp_mask, struct page *page);
extern int blkdev_issue_zeroout(struct block_device *bdev, sector_t sector,
		sector_t nr_sects, gfp_t gfp_mask);
static inline int sb_issue_discard(struct super_block *sb, sector_t block,
		sector_t nr_blocks, gfp_t gfp_mask, unsigned long flags)
{
	return blkdev_issue_discard(sb->s_bdev, block << (sb->s_blocksize_bits - 9),
				    nr_blocks << (sb->s_blocksize_bits - 9),
				    gfp_mask, flags);
}
static inline int sb_issue_zeroout(struct super_block *sb, sector_t block,
		sector_t nr_blocks, gfp_t gfp_mask)
{
	return blkdev_issue_zeroout(sb->s_bdev,
				    block << (sb->s_blocksize_bits - 9),
				    nr_blocks << (sb->s_blocksize_bits - 9),
				    gfp_mask);
}

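/*
 * Usage sketch (not part of this header): discarding freed space.  The sb_*
 * wrappers convert filesystem blocks to 512-byte sectors; the blkdev_*
 * functions already take 512-byte sector units.
 *
 *	(from a filesystem, for blocks [start, start + count) on sb)
 *	err = sb_issue_discard(sb, start, count, GFP_NOFS, 0);
 *
 *	(on a raw block device, requesting a secure discard)
 *	err = blkdev_issue_discard(bdev, sector, nr_sects, GFP_KERNEL,
 *				   BLKDEV_DISCARD_SECURE);
 */
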
extern int blk_verify_command(unsigned char *cmd, fmode_t has_write_perm);

enum blk_default_limits {
	BLK_MAX_SEGMENTS	= 128,
	BLK_SAFE_MAX_SECTORS	= 255,
	BLK_DEF_MAX_SECTORS	= 1024,
	BLK_MAX_SEGMENT_SIZE	= 65536,
	BLK_SEG_BOUNDARY_MASK	= 0xFFFFFFFFUL,
};

#define blkdev_entry_to_request(entry) list_entry((entry), struct request, queuelist)

static inline unsigned long queue_bounce_pfn(struct request_queue *q)
{
	return q->limits.bounce_pfn;
}

static inline unsigned long queue_segment_boundary(struct request_queue *q)
{
	return q->limits.seg_boundary_mask;
}

static inline unsigned int queue_max_sectors(struct request_queue *q)
{
	return q->limits.max_sectors;
}

static inline unsigned int queue_max_hw_sectors(struct request_queue *q)
{
	return q->limits.max_hw_sectors;
}

static inline unsigned short queue_max_segments(struct request_queue *q)
{
	return q->limits.max_segments;
}

static inline unsigned int queue_max_segment_size(struct request_queue *q)
{
	return q->limits.max_segment_size;
}

static inline unsigned short queue_logical_block_size(struct request_queue *q)
{
	int retval = 512;

	if (q && q->limits.logical_block_size)
		retval = q->limits.logical_block_size;

	return retval;
}

static inline unsigned short bdev_logical_block_size(struct block_device *bdev)
{
	return queue_logical_block_size(bdev_get_queue(bdev));
}

static inline unsigned int queue_physical_block_size(struct request_queue *q)
{
	return q->limits.physical_block_size;
}

static inline unsigned int bdev_physical_block_size(struct block_device *bdev)
{
	return queue_physical_block_size(bdev_get_queue(bdev));
}

static inline unsigned int queue_io_min(struct request_queue *q)
{
	return q->limits.io_min;
}

static inline int bdev_io_min(struct block_device *bdev)
{
	return queue_io_min(bdev_get_queue(bdev));
}

static inline unsigned int queue_io_opt(struct request_queue *q)
{
	return q->limits.io_opt;
}

static inline int bdev_io_opt(struct block_device *bdev)
{
	return queue_io_opt(bdev_get_queue(bdev));
}

static inline int queue_alignment_offset(struct request_queue *q)
{
	if (q->limits.misaligned)
		return -1;

	return q->limits.alignment_offset;
}

static inline int queue_limit_alignment_offset(struct queue_limits *lim, sector_t sector)
{
	unsigned int granularity = max(lim->physical_block_size, lim->io_min);
	unsigned int alignment = (sector << 9) & (granularity - 1);

	return (granularity + lim->alignment_offset - alignment)
		& (granularity - 1);
}

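/*
 * Worked example (illustrative numbers only): with physical_block_size =
 * 4096, io_min = 0 and alignment_offset = 0, granularity is 4096 bytes.
 * For sector = 7 the byte offset is 3584, so alignment = 3584 and the
 * function returns (4096 + 0 - 3584) & 4095 = 512; for a granularity-
 * aligned start such as sector 8 it returns 0.
 */
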
static inline int bdev_alignment_offset(struct block_device *bdev)
{
	struct request_queue *q = bdev_get_queue(bdev);

	if (q->limits.misaligned)
		return -1;

	if (bdev != bdev->bd_contains)
		return bdev->bd_part->alignment_offset;

	return q->limits.alignment_offset;
}

static inline int queue_discard_alignment(struct request_queue *q)
{
	if (q->limits.discard_misaligned)
		return -1;

	return q->limits.discard_alignment;
}

static inline int queue_limit_discard_alignment(struct queue_limits *lim, sector_t sector)
{
	unsigned int alignment, granularity, offset;

	if (!lim->max_discard_sectors)
		return 0;

	/* Why are these in bytes, not sectors? */
	alignment = lim->discard_alignment >> 9;
	granularity = lim->discard_granularity >> 9;
	if (!granularity)
		return 0;

	/* Offset of the partition start in 'granularity' sectors */
	offset = sector_div(sector, granularity);

	/* And why do we do this modulus *again* in blkdev_issue_discard()? */
	offset = (granularity + alignment - offset) % granularity;

	/* Turn it back into bytes, gaah */
	return offset << 9;
}

static inline int bdev_discard_alignment(struct block_device *bdev)
{
	struct request_queue *q = bdev_get_queue(bdev);

	if (bdev != bdev->bd_contains)
		return bdev->bd_part->discard_alignment;

	return q->limits.discard_alignment;
}

static inline unsigned int queue_discard_zeroes_data(struct request_queue *q)
{
	if (q->limits.max_discard_sectors && q->limits.discard_zeroes_data == 1)
		return 1;

	return 0;
}

static inline unsigned int bdev_discard_zeroes_data(struct block_device *bdev)
{
	return queue_discard_zeroes_data(bdev_get_queue(bdev));
}

static inline unsigned int bdev_write_same(struct block_device *bdev)
{
	struct request_queue *q = bdev_get_queue(bdev);

	if (q)
		return q->limits.max_write_same_sectors;

	return 0;
}

static inline int queue_dma_alignment(struct request_queue *q)
{
	return q ? q->dma_alignment : 511;
}

static inline int blk_rq_aligned(struct request_queue *q, unsigned long addr,
				 unsigned int len)
{
	unsigned int alignment = queue_dma_alignment(q) | q->dma_pad_mask;
	return !(addr & alignment) && !(len & alignment);
}

/* assumes size > 256 */
static inline unsigned int blksize_bits(unsigned int size)
{
	unsigned int bits = 8;
	do {
		bits++;
		size >>= 1;
	} while (size > 256);
	return bits;
}

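/*
 * Example: blksize_bits(512) == 9, blksize_bits(1024) == 10 and
 * blksize_bits(4096) == 12, i.e. the log2 of the (power-of-two) block size.
 */
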
static inline unsigned int block_size(struct block_device *bdev)
{
	return bdev->bd_block_size;
}

static inline bool queue_flush_queueable(struct request_queue *q)
{
	return !q->flush_not_queueable;
}

typedef struct {struct page *v;} Sector;

unsigned char *read_dev_sector(struct block_device *, sector_t, Sector *);

static inline void put_dev_sector(Sector p)
{
	page_cache_release(p.v);
}

struct work_struct;
int kblockd_schedule_work(struct request_queue *q, struct work_struct *work);
int kblockd_schedule_delayed_work(struct request_queue *q, struct delayed_work *dwork, unsigned long delay);

#ifdef CONFIG_BLK_CGROUP
/*
 * This should not be using sched_clock(). A real patch is in progress
 * to fix this up, until that is in place we need to disable preemption
 * around sched_clock() in this function and set_io_start_time_ns().
 */
static inline void set_start_time_ns(struct request *req)
{
	preempt_disable();
	req->start_time_ns = sched_clock();
	preempt_enable();
}

static inline void set_io_start_time_ns(struct request *req)
{
	preempt_disable();
	req->io_start_time_ns = sched_clock();
	preempt_enable();
}

static inline uint64_t rq_start_time_ns(struct request *req)
{
	return req->start_time_ns;
}

static inline uint64_t rq_io_start_time_ns(struct request *req)
{
	return req->io_start_time_ns;
}
#else
static inline void set_start_time_ns(struct request *req) {}
static inline void set_io_start_time_ns(struct request *req) {}
static inline uint64_t rq_start_time_ns(struct request *req)
{
	return 0;
}
static inline uint64_t rq_io_start_time_ns(struct request *req)
{
	return 0;
}
#endif

#define MODULE_ALIAS_BLOCKDEV(major,minor) \
	MODULE_ALIAS("block-major-" __stringify(major) "-" __stringify(minor))
#define MODULE_ALIAS_BLOCKDEV_MAJOR(major) \
	MODULE_ALIAS("block-major-" __stringify(major) "-*")

#if defined(CONFIG_BLK_DEV_INTEGRITY)

#define INTEGRITY_FLAG_READ	2	/* verify data integrity on read */
#define INTEGRITY_FLAG_WRITE	4	/* generate data integrity on write */

struct blk_integrity_exchg {
	void			*prot_buf;
	void			*data_buf;
	sector_t		sector;
	unsigned int		data_size;
	unsigned short		sector_size;
	const char		*disk_name;
};

typedef void (integrity_gen_fn) (struct blk_integrity_exchg *);
typedef int (integrity_vrfy_fn) (struct blk_integrity_exchg *);
typedef void (integrity_set_tag_fn) (void *, void *, unsigned int);
typedef void (integrity_get_tag_fn) (void *, void *, unsigned int);

struct blk_integrity {
	integrity_gen_fn	*generate_fn;
	integrity_vrfy_fn	*verify_fn;
	integrity_set_tag_fn	*set_tag_fn;
	integrity_get_tag_fn	*get_tag_fn;

	unsigned short		flags;
	unsigned short		tuple_size;
	unsigned short		sector_size;
	unsigned short		tag_size;

	const char		*name;

	struct kobject		kobj;
};

extern bool blk_integrity_is_initialized(struct gendisk *);
extern int blk_integrity_register(struct gendisk *, struct blk_integrity *);
extern void blk_integrity_unregister(struct gendisk *);
extern int blk_integrity_compare(struct gendisk *, struct gendisk *);
extern int blk_rq_map_integrity_sg(struct request_queue *, struct bio *,
				   struct scatterlist *);
extern int blk_rq_count_integrity_sg(struct request_queue *, struct bio *);
extern int blk_integrity_merge_rq(struct request_queue *, struct request *,
				  struct request *);
extern int blk_integrity_merge_bio(struct request_queue *, struct request *,
				   struct bio *);

static inline
struct blk_integrity *bdev_get_integrity(struct block_device *bdev)
{
	return bdev->bd_disk->integrity;
}

static inline struct blk_integrity *blk_get_integrity(struct gendisk *disk)
{
	return disk->integrity;
}

static inline int blk_integrity_rq(struct request *rq)
{
	if (rq->bio == NULL)
		return 0;

	return bio_integrity(rq->bio);
}

static inline void blk_queue_max_integrity_segments(struct request_queue *q,
						    unsigned int segs)
{
	q->limits.max_integrity_segments = segs;
}

static inline unsigned short
queue_max_integrity_segments(struct request_queue *q)
{
	return q->limits.max_integrity_segments;
}

#else /* CONFIG_BLK_DEV_INTEGRITY */

struct bio;
struct block_device;
struct gendisk;
struct blk_integrity;

static inline int blk_integrity_rq(struct request *rq)
{
	return 0;
}
static inline int blk_rq_count_integrity_sg(struct request_queue *q,
					    struct bio *b)
{
	return 0;
}
static inline int blk_rq_map_integrity_sg(struct request_queue *q,
					  struct bio *b,
					  struct scatterlist *s)
{
	return 0;
}
static inline struct blk_integrity *bdev_get_integrity(struct block_device *b)
{
	return NULL;
}
static inline struct blk_integrity *blk_get_integrity(struct gendisk *disk)
{
	return NULL;
}
static inline int blk_integrity_compare(struct gendisk *a, struct gendisk *b)
{
	return 0;
}
static inline int blk_integrity_register(struct gendisk *d,
					 struct blk_integrity *b)
{
	return 0;
}
static inline void blk_integrity_unregister(struct gendisk *d)
{
}
static inline void blk_queue_max_integrity_segments(struct request_queue *q,
						    unsigned int segs)
{
}
static inline unsigned short queue_max_integrity_segments(struct request_queue *q)
{
	return 0;
}
static inline int blk_integrity_merge_rq(struct request_queue *rq,
					 struct request *r1,
					 struct request *r2)
{
	return 0;
}
static inline int blk_integrity_merge_bio(struct request_queue *rq,
					  struct request *r,
					  struct bio *b)
{
	return 0;
}
static inline bool blk_integrity_is_initialized(struct gendisk *g)
{
	return 0;
}

#endif /* CONFIG_BLK_DEV_INTEGRITY */

struct block_device_operations {
	int (*open) (struct block_device *, fmode_t);
	void (*release) (struct gendisk *, fmode_t);
	int (*ioctl) (struct block_device *, fmode_t, unsigned, unsigned long);
	int (*compat_ioctl) (struct block_device *, fmode_t, unsigned, unsigned long);
	int (*direct_access) (struct block_device *, sector_t,
						void **, unsigned long *);
	unsigned int (*check_events) (struct gendisk *disk,
				      unsigned int clearing);
	/* ->media_changed() is DEPRECATED, use ->check_events() instead */
	int (*media_changed) (struct gendisk *);
	void (*unlock_native_capacity) (struct gendisk *);
	int (*revalidate_disk) (struct gendisk *);
	int (*getgeo)(struct block_device *, struct hd_geometry *);
	/* this callback is with swap_lock and sometimes page table lock held */
	void (*swap_slot_free_notify) (struct block_device *, unsigned long);
	struct module *owner;
};

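/*
 * Usage sketch (not part of this header): a minimal driver fills in only the
 * callbacks it needs and leaves the rest NULL.  "my_open", "my_release" and
 * "my_getgeo" are hypothetical driver functions.
 *
 *	static const struct block_device_operations my_fops = {
 *		.owner		= THIS_MODULE,
 *		.open		= my_open,
 *		.release	= my_release,
 *		.getgeo		= my_getgeo,
 *	};
 *
 *	(later, in probe)
 *	disk->fops = &my_fops;
 */
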
extern int __blkdev_driver_ioctl(struct block_device *, fmode_t, unsigned int,
				 unsigned long);
#else /* CONFIG_BLOCK */
/*
 * stubs for when the block layer is configured out
 */
#define buffer_heads_over_limit 0

static inline long nr_blockdev_pages(void)
{
	return 0;
}

struct blk_plug {
};

static inline void blk_start_plug(struct blk_plug *plug)
{
}

static inline void blk_finish_plug(struct blk_plug *plug)
{
}

static inline void blk_flush_plug(struct task_struct *task)
{
}

static inline void blk_schedule_flush_plug(struct task_struct *task)
{
}

static inline bool blk_needs_flush_plug(struct task_struct *tsk)
{
	return false;
}

#endif /* CONFIG_BLOCK */

#endif