fs: move the buffer_heads_over_limit stub to buffer_head.h
[linux-2.6-block.git] / include / linux / blkdev.h
/* SPDX-License-Identifier: GPL-2.0 */
#ifndef _LINUX_BLKDEV_H
#define _LINUX_BLKDEV_H

#include <linux/sched.h>
#include <linux/sched/clock.h>

#ifdef CONFIG_BLOCK

#include <linux/major.h>
#include <linux/genhd.h>
#include <linux/list.h>
#include <linux/llist.h>
#include <linux/timer.h>
#include <linux/workqueue.h>
#include <linux/pagemap.h>
#include <linux/backing-dev-defs.h>
#include <linux/wait.h>
#include <linux/mempool.h>
#include <linux/pfn.h>
#include <linux/bio.h>
#include <linux/stringify.h>
#include <linux/gfp.h>
#include <linux/bsg.h>
#include <linux/smp.h>
#include <linux/rcupdate.h>
#include <linux/percpu-refcount.h>
#include <linux/scatterlist.h>
#include <linux/blkzoned.h>

struct module;
struct scsi_ioctl_command;

struct request_queue;
struct elevator_queue;
struct blk_trace;
struct request;
struct sg_io_hdr;
struct bsg_job;
struct blkcg_gq;
struct blk_flush_queue;
struct pr_ops;
struct rq_qos;
struct blk_queue_stats;
struct blk_stat_callback;
struct blk_keyslot_manager;

#define BLKDEV_MIN_RQ	4
#define BLKDEV_MAX_RQ	128	/* Default maximum */

/* Must be consistent with blk_mq_poll_stats_bkt() */
#define BLK_MQ_POLL_STATS_BKTS 16

/* Doing classic polling */
#define BLK_MQ_POLL_CLASSIC -1

/*
 * Maximum number of blkcg policies allowed to be registered concurrently.
 * Defined here to simplify include dependency.
 */
#define BLKCG_MAX_POLS		5

typedef void (rq_end_io_fn)(struct request *, blk_status_t);

/* request flags */
typedef __u32 __bitwise req_flags_t;

/* elevator knows about this request */
#define RQF_SORTED		((__force req_flags_t)(1 << 0))
/* drive already may have started this one */
#define RQF_STARTED		((__force req_flags_t)(1 << 1))
/* may not be passed by ioscheduler */
#define RQF_SOFTBARRIER		((__force req_flags_t)(1 << 3))
/* request for flush sequence */
#define RQF_FLUSH_SEQ		((__force req_flags_t)(1 << 4))
/* merge of different types, fail separately */
#define RQF_MIXED_MERGE		((__force req_flags_t)(1 << 5))
/* track inflight for MQ */
#define RQF_MQ_INFLIGHT		((__force req_flags_t)(1 << 6))
/* don't call prep for this one */
#define RQF_DONTPREP		((__force req_flags_t)(1 << 7))
/* set for "ide_preempt" requests and also for requests for which the SCSI
   "quiesce" state must be ignored. */
#define RQF_PREEMPT		((__force req_flags_t)(1 << 8))
/* vaguely specified driver internal error. Ignored by the block layer */
#define RQF_FAILED		((__force req_flags_t)(1 << 10))
/* don't warn about errors */
#define RQF_QUIET		((__force req_flags_t)(1 << 11))
/* elevator private data attached */
#define RQF_ELVPRIV		((__force req_flags_t)(1 << 12))
/* account into disk and partition IO statistics */
#define RQF_IO_STAT		((__force req_flags_t)(1 << 13))
/* request came from our alloc pool */
#define RQF_ALLOCED		((__force req_flags_t)(1 << 14))
/* runtime pm request */
#define RQF_PM			((__force req_flags_t)(1 << 15))
/* on IO scheduler merge hash */
#define RQF_HASHED		((__force req_flags_t)(1 << 16))
/* track IO completion time */
#define RQF_STATS		((__force req_flags_t)(1 << 17))
/* Look at ->special_vec for the actual data payload instead of the
   bio chain. */
#define RQF_SPECIAL_PAYLOAD	((__force req_flags_t)(1 << 18))
/* The per-zone write lock is held for this request */
#define RQF_ZONE_WRITE_LOCKED	((__force req_flags_t)(1 << 19))
/* already slept for hybrid poll */
#define RQF_MQ_POLL_SLEPT	((__force req_flags_t)(1 << 20))
/* ->timeout has been called, don't expire again */
#define RQF_TIMED_OUT		((__force req_flags_t)(1 << 21))

/* flags that prevent us from merging requests: */
#define RQF_NOMERGE_FLAGS \
	(RQF_STARTED | RQF_SOFTBARRIER | RQF_FLUSH_SEQ | RQF_SPECIAL_PAYLOAD)

/*
 * Request state for blk-mq.
 */
enum mq_rq_state {
	MQ_RQ_IDLE		= 0,
	MQ_RQ_IN_FLIGHT		= 1,
	MQ_RQ_COMPLETE		= 2,
};

/*
 * Try to put the fields that are referenced together in the same cacheline.
 *
 * If you modify this structure, make sure to update blk_rq_init() and
 * especially blk_mq_rq_ctx_init() to take care of the added fields.
 */
struct request {
	struct request_queue *q;
	struct blk_mq_ctx *mq_ctx;
	struct blk_mq_hw_ctx *mq_hctx;

	unsigned int cmd_flags;		/* op and common flags */
	req_flags_t rq_flags;

	int tag;
	int internal_tag;

	/* the following two fields are internal, NEVER access directly */
	unsigned int __data_len;	/* total data len */
	sector_t __sector;		/* sector cursor */

	struct bio *bio;
	struct bio *biotail;

	struct list_head queuelist;

	/*
	 * The hash is used inside the scheduler, and killed once the
	 * request reaches the dispatch list. The ipi_list is only used
	 * to queue the request for softirq completion, which is long
	 * after the request has been unhashed (and even removed from
	 * the dispatch list).
	 */
	union {
		struct hlist_node hash;	/* merge hash */
		struct list_head ipi_list;
	};

	/*
	 * The rb_node is only used inside the io scheduler, requests
	 * are pruned when moved to the dispatch queue. So let the
	 * completion_data share space with the rb_node.
	 */
	union {
		struct rb_node rb_node;	/* sort/lookup */
		struct bio_vec special_vec;
		void *completion_data;
		int error_count; /* for legacy drivers, don't use */
	};

	/*
	 * Three pointers are available for the IO schedulers, if they need
	 * more they have to dynamically allocate it.  Flush requests are
	 * never put on the IO scheduler. So let the flush fields share
	 * space with the elevator data.
	 */
	union {
		struct {
			struct io_cq		*icq;
			void			*priv[2];
		} elv;

		struct {
			unsigned int		seq;
			struct list_head	list;
			rq_end_io_fn		*saved_end_io;
		} flush;
	};

	struct gendisk *rq_disk;
	struct hd_struct *part;
#ifdef CONFIG_BLK_RQ_ALLOC_TIME
	/* Time that the first bio started allocating this request. */
	u64 alloc_time_ns;
#endif
	/* Time that this request was allocated for this IO. */
	u64 start_time_ns;
	/* Time that I/O was submitted to the device. */
	u64 io_start_time_ns;

#ifdef CONFIG_BLK_WBT
	unsigned short wbt_flags;
#endif
	/*
	 * rq sectors used for blk stats. It has the same value as
	 * blk_rq_sectors(rq), except that it is never zeroed by
	 * completion.
	 */
	unsigned short stats_sectors;

	/*
	 * Number of scatter-gather DMA addr+len pairs after
	 * physical address coalescing is performed.
	 */
	unsigned short nr_phys_segments;

#if defined(CONFIG_BLK_DEV_INTEGRITY)
	unsigned short nr_integrity_segments;
#endif

#ifdef CONFIG_BLK_INLINE_ENCRYPTION
	struct bio_crypt_ctx *crypt_ctx;
	struct blk_ksm_keyslot *crypt_keyslot;
#endif

	unsigned short write_hint;
	unsigned short ioprio;

	enum mq_rq_state state;
	refcount_t ref;

	unsigned int timeout;
	unsigned long deadline;

	union {
		struct __call_single_data csd;
		u64 fifo_time;
	};

	/*
	 * completion callback.
	 */
	rq_end_io_fn *end_io;
	void *end_io_data;
};

static inline bool blk_op_is_scsi(unsigned int op)
{
	return op == REQ_OP_SCSI_IN || op == REQ_OP_SCSI_OUT;
}

static inline bool blk_op_is_private(unsigned int op)
{
	return op == REQ_OP_DRV_IN || op == REQ_OP_DRV_OUT;
}

static inline bool blk_rq_is_scsi(struct request *rq)
{
	return blk_op_is_scsi(req_op(rq));
}

static inline bool blk_rq_is_private(struct request *rq)
{
	return blk_op_is_private(req_op(rq));
}

static inline bool blk_rq_is_passthrough(struct request *rq)
{
	return blk_rq_is_scsi(rq) || blk_rq_is_private(rq);
}

static inline bool bio_is_passthrough(struct bio *bio)
{
	unsigned op = bio_op(bio);

	return blk_op_is_scsi(op) || blk_op_is_private(op);
}

static inline unsigned short req_get_ioprio(struct request *req)
{
	return req->ioprio;
}

#include <linux/elevator.h>

struct blk_queue_ctx;

typedef blk_qc_t (make_request_fn) (struct request_queue *q, struct bio *bio);

struct bio_vec;

enum blk_eh_timer_return {
	BLK_EH_DONE,		/* driver has completed the command */
	BLK_EH_RESET_TIMER,	/* reset timer and try again */
};

enum blk_queue_state {
	Queue_down,
	Queue_up,
};

#define BLK_TAG_ALLOC_FIFO 0	/* allocate starting from 0 */
#define BLK_TAG_ALLOC_RR 1	/* allocate starting from last allocated tag */

#define BLK_SCSI_MAX_CMDS	(256)
#define BLK_SCSI_CMD_PER_LONG	(BLK_SCSI_MAX_CMDS / (sizeof(long) * 8))

/*
 * Zoned block device models (zoned limit).
 */
enum blk_zoned_model {
	BLK_ZONED_NONE,	/* Regular block device */
	BLK_ZONED_HA,	/* Host-aware zoned block device */
	BLK_ZONED_HM,	/* Host-managed zoned block device */
};

struct queue_limits {
	unsigned long		bounce_pfn;
	unsigned long		seg_boundary_mask;
	unsigned long		virt_boundary_mask;

	unsigned int		max_hw_sectors;
	unsigned int		max_dev_sectors;
	unsigned int		chunk_sectors;
	unsigned int		max_sectors;
	unsigned int		max_segment_size;
	unsigned int		physical_block_size;
	unsigned int		logical_block_size;
	unsigned int		alignment_offset;
	unsigned int		io_min;
	unsigned int		io_opt;
	unsigned int		max_discard_sectors;
	unsigned int		max_hw_discard_sectors;
	unsigned int		max_write_same_sectors;
	unsigned int		max_write_zeroes_sectors;
	unsigned int		max_zone_append_sectors;
	unsigned int		discard_granularity;
	unsigned int		discard_alignment;

	unsigned short		max_segments;
	unsigned short		max_integrity_segments;
	unsigned short		max_discard_segments;

	unsigned char		misaligned;
	unsigned char		discard_misaligned;
	unsigned char		raid_partial_stripes_expensive;
	enum blk_zoned_model	zoned;
};

typedef int (*report_zones_cb)(struct blk_zone *zone, unsigned int idx,
			       void *data);

#ifdef CONFIG_BLK_DEV_ZONED

#define BLK_ALL_ZONES  ((unsigned int)-1)
int blkdev_report_zones(struct block_device *bdev, sector_t sector,
			unsigned int nr_zones, report_zones_cb cb, void *data);
unsigned int blkdev_nr_zones(struct gendisk *disk);
extern int blkdev_zone_mgmt(struct block_device *bdev, enum req_opf op,
			    sector_t sectors, sector_t nr_sectors,
			    gfp_t gfp_mask);
int blk_revalidate_disk_zones(struct gendisk *disk,
			      void (*update_driver_data)(struct gendisk *disk));

extern int blkdev_report_zones_ioctl(struct block_device *bdev, fmode_t mode,
				     unsigned int cmd, unsigned long arg);
extern int blkdev_zone_mgmt_ioctl(struct block_device *bdev, fmode_t mode,
				  unsigned int cmd, unsigned long arg);

#else /* CONFIG_BLK_DEV_ZONED */

static inline unsigned int blkdev_nr_zones(struct gendisk *disk)
{
	return 0;
}

static inline int blkdev_report_zones_ioctl(struct block_device *bdev,
					    fmode_t mode, unsigned int cmd,
					    unsigned long arg)
{
	return -ENOTTY;
}

static inline int blkdev_zone_mgmt_ioctl(struct block_device *bdev,
					 fmode_t mode, unsigned int cmd,
					 unsigned long arg)
{
	return -ENOTTY;
}

#endif /* CONFIG_BLK_DEV_ZONED */

struct request_queue {
	struct request		*last_merge;
	struct elevator_queue	*elevator;

	struct blk_queue_stats	*stats;
	struct rq_qos		*rq_qos;

	make_request_fn		*make_request_fn;

	const struct blk_mq_ops	*mq_ops;

	/* sw queues */
	struct blk_mq_ctx __percpu	*queue_ctx;

	unsigned int		queue_depth;

	/* hw dispatch queues */
	struct blk_mq_hw_ctx	**queue_hw_ctx;
	unsigned int		nr_hw_queues;

	struct backing_dev_info	*backing_dev_info;

	/*
	 * The queue owner gets to use this for whatever they like.
	 * ll_rw_blk doesn't touch it.
	 */
	void			*queuedata;

	/*
	 * various queue flags, see QUEUE_* below
	 */
	unsigned long		queue_flags;
	/*
	 * Number of contexts that have called blk_set_pm_only(). If this
	 * counter is above zero then only RQF_PM and RQF_PREEMPT requests are
	 * processed.
	 */
	atomic_t		pm_only;

	/*
	 * ida allocated id for this queue.  Used to index queues from
	 * ioctx.
	 */
	int			id;

	/*
	 * queue needs bounce pages for pages above this limit
	 */
	gfp_t			bounce_gfp;

	spinlock_t		queue_lock;

	/*
	 * queue kobject
	 */
	struct kobject		kobj;

	/*
	 * mq queue kobject
	 */
	struct kobject		*mq_kobj;

#ifdef CONFIG_BLK_DEV_INTEGRITY
	struct blk_integrity	integrity;
#endif /* CONFIG_BLK_DEV_INTEGRITY */

#ifdef CONFIG_PM
	struct device		*dev;
	int			rpm_status;
	unsigned int		nr_pending;
#endif

	/*
	 * queue settings
	 */
	unsigned long		nr_requests;	/* Max # of requests */

	unsigned int		dma_pad_mask;
	unsigned int		dma_alignment;

#ifdef CONFIG_BLK_INLINE_ENCRYPTION
	/* Inline crypto capabilities */
	struct blk_keyslot_manager *ksm;
#endif

	unsigned int		rq_timeout;
	int			poll_nsec;

	struct blk_stat_callback	*poll_cb;
	struct blk_rq_stat	poll_stat[BLK_MQ_POLL_STATS_BKTS];

	struct timer_list	timeout;
	struct work_struct	timeout_work;

	struct list_head	icq_list;
#ifdef CONFIG_BLK_CGROUP
	DECLARE_BITMAP		(blkcg_pols, BLKCG_MAX_POLS);
	struct blkcg_gq		*root_blkg;
	struct list_head	blkg_list;
#endif

	struct queue_limits	limits;

	unsigned int		required_elevator_features;

#ifdef CONFIG_BLK_DEV_ZONED
	/*
	 * Zoned block device information for request dispatch control.
	 * nr_zones is the total number of zones of the device. This is always
	 * 0 for regular block devices. conv_zones_bitmap is a bitmap of nr_zones
	 * bits which indicates if a zone is conventional (bit set) or
	 * sequential (bit clear). seq_zones_wlock is a bitmap of nr_zones
	 * bits which indicates if a zone is write locked, that is, if a write
	 * request targeting the zone was dispatched. All three fields are
	 * initialized by the low level device driver (e.g. scsi/sd.c).
	 * Stacking drivers (device mappers) may or may not initialize
	 * these fields.
	 *
	 * Reads of this information must be protected with blk_queue_enter() /
	 * blk_queue_exit(). Modifying this information is only allowed while
	 * no requests are being processed. See also blk_mq_freeze_queue() and
	 * blk_mq_unfreeze_queue().
	 */
	unsigned int		nr_zones;
	unsigned long		*conv_zones_bitmap;
	unsigned long		*seq_zones_wlock;
#endif /* CONFIG_BLK_DEV_ZONED */

	/*
	 * sg stuff
	 */
	unsigned int		sg_timeout;
	unsigned int		sg_reserved_size;
	int			node;
	struct mutex		debugfs_mutex;
#ifdef CONFIG_BLK_DEV_IO_TRACE
	struct blk_trace __rcu	*blk_trace;
#endif
	/*
	 * for flush operations
	 */
	struct blk_flush_queue	*fq;

	struct list_head	requeue_list;
	spinlock_t		requeue_lock;
	struct delayed_work	requeue_work;

	struct mutex		sysfs_lock;
	struct mutex		sysfs_dir_lock;

	/*
	 * for reusing dead hctx instance in case of updating
	 * nr_hw_queues
	 */
	struct list_head	unused_hctx_list;
	spinlock_t		unused_hctx_lock;

	int			mq_freeze_depth;

#if defined(CONFIG_BLK_DEV_BSG)
	struct bsg_class_device bsg_dev;
#endif

#ifdef CONFIG_BLK_DEV_THROTTLING
	/* Throttle data */
	struct throtl_data *td;
#endif
	struct rcu_head		rcu_head;
	wait_queue_head_t	mq_freeze_wq;
	/*
	 * Protect concurrent access to q_usage_counter by
	 * percpu_ref_kill() and percpu_ref_reinit().
	 */
	struct mutex		mq_freeze_lock;
	struct percpu_ref	q_usage_counter;

	struct blk_mq_tag_set	*tag_set;
	struct list_head	tag_set_list;
	struct bio_set		bio_split;

	struct dentry		*debugfs_dir;

#ifdef CONFIG_BLK_DEBUG_FS
	struct dentry		*sched_debugfs_dir;
	struct dentry		*rqos_debugfs_dir;
#endif

	bool			mq_sysfs_init_done;

	size_t			cmd_size;

#define BLK_MAX_WRITE_HINTS	5
	u64			write_hints[BLK_MAX_WRITE_HINTS];
};

#define QUEUE_FLAG_STOPPED	0	/* queue is stopped */
#define QUEUE_FLAG_DYING	1	/* queue being torn down */
#define QUEUE_FLAG_NOMERGES	3	/* disable merge attempts */
#define QUEUE_FLAG_SAME_COMP	4	/* complete on same CPU-group */
#define QUEUE_FLAG_FAIL_IO	5	/* fake timeout */
#define QUEUE_FLAG_NONROT	6	/* non-rotational device (SSD) */
#define QUEUE_FLAG_VIRT		QUEUE_FLAG_NONROT /* paravirt device */
#define QUEUE_FLAG_IO_STAT	7	/* do disk/partitions IO accounting */
#define QUEUE_FLAG_DISCARD	8	/* supports DISCARD */
#define QUEUE_FLAG_NOXMERGES	9	/* No extended merges */
#define QUEUE_FLAG_ADD_RANDOM	10	/* Contributes to random pool */
#define QUEUE_FLAG_SECERASE	11	/* supports secure erase */
#define QUEUE_FLAG_SAME_FORCE	12	/* force complete on same CPU */
#define QUEUE_FLAG_DEAD		13	/* queue tear-down finished */
#define QUEUE_FLAG_INIT_DONE	14	/* queue is initialized */
#define QUEUE_FLAG_POLL		16	/* IO polling enabled if set */
#define QUEUE_FLAG_WC		17	/* Write back caching */
#define QUEUE_FLAG_FUA		18	/* device supports FUA writes */
#define QUEUE_FLAG_DAX		19	/* device supports DAX */
#define QUEUE_FLAG_STATS	20	/* track IO start and completion times */
#define QUEUE_FLAG_POLL_STATS	21	/* collecting stats for hybrid polling */
#define QUEUE_FLAG_REGISTERED	22	/* queue has been registered to a disk */
#define QUEUE_FLAG_SCSI_PASSTHROUGH 23	/* queue supports SCSI commands */
#define QUEUE_FLAG_QUIESCED	24	/* queue has been quiesced */
#define QUEUE_FLAG_PCI_P2PDMA	25	/* device supports PCI p2p requests */
#define QUEUE_FLAG_ZONE_RESETALL 26	/* supports Zone Reset All */
#define QUEUE_FLAG_RQ_ALLOC_TIME 27	/* record rq->alloc_time_ns */

#define QUEUE_FLAG_MQ_DEFAULT	((1 << QUEUE_FLAG_IO_STAT) |		\
				 (1 << QUEUE_FLAG_SAME_COMP))

void blk_queue_flag_set(unsigned int flag, struct request_queue *q);
void blk_queue_flag_clear(unsigned int flag, struct request_queue *q);
bool blk_queue_flag_test_and_set(unsigned int flag, struct request_queue *q);

#define blk_queue_stopped(q)	test_bit(QUEUE_FLAG_STOPPED, &(q)->queue_flags)
#define blk_queue_dying(q)	test_bit(QUEUE_FLAG_DYING, &(q)->queue_flags)
#define blk_queue_dead(q)	test_bit(QUEUE_FLAG_DEAD, &(q)->queue_flags)
#define blk_queue_init_done(q)	test_bit(QUEUE_FLAG_INIT_DONE, &(q)->queue_flags)
#define blk_queue_nomerges(q)	test_bit(QUEUE_FLAG_NOMERGES, &(q)->queue_flags)
#define blk_queue_noxmerges(q)	\
	test_bit(QUEUE_FLAG_NOXMERGES, &(q)->queue_flags)
#define blk_queue_nonrot(q)	test_bit(QUEUE_FLAG_NONROT, &(q)->queue_flags)
#define blk_queue_io_stat(q)	test_bit(QUEUE_FLAG_IO_STAT, &(q)->queue_flags)
#define blk_queue_add_random(q)	test_bit(QUEUE_FLAG_ADD_RANDOM, &(q)->queue_flags)
#define blk_queue_discard(q)	test_bit(QUEUE_FLAG_DISCARD, &(q)->queue_flags)
#define blk_queue_zone_resetall(q)	\
	test_bit(QUEUE_FLAG_ZONE_RESETALL, &(q)->queue_flags)
#define blk_queue_secure_erase(q) \
	(test_bit(QUEUE_FLAG_SECERASE, &(q)->queue_flags))
#define blk_queue_dax(q)	test_bit(QUEUE_FLAG_DAX, &(q)->queue_flags)
#define blk_queue_scsi_passthrough(q)	\
	test_bit(QUEUE_FLAG_SCSI_PASSTHROUGH, &(q)->queue_flags)
#define blk_queue_pci_p2pdma(q)	\
	test_bit(QUEUE_FLAG_PCI_P2PDMA, &(q)->queue_flags)
#ifdef CONFIG_BLK_RQ_ALLOC_TIME
#define blk_queue_rq_alloc_time(q)	\
	test_bit(QUEUE_FLAG_RQ_ALLOC_TIME, &(q)->queue_flags)
#else
#define blk_queue_rq_alloc_time(q)	false
#endif

#define blk_noretry_request(rq) \
	((rq)->cmd_flags & (REQ_FAILFAST_DEV|REQ_FAILFAST_TRANSPORT| \
			     REQ_FAILFAST_DRIVER))
#define blk_queue_quiesced(q)	test_bit(QUEUE_FLAG_QUIESCED, &(q)->queue_flags)
#define blk_queue_pm_only(q)	atomic_read(&(q)->pm_only)
#define blk_queue_fua(q)	test_bit(QUEUE_FLAG_FUA, &(q)->queue_flags)
#define blk_queue_registered(q)	test_bit(QUEUE_FLAG_REGISTERED, &(q)->queue_flags)

extern void blk_set_pm_only(struct request_queue *q);
extern void blk_clear_pm_only(struct request_queue *q);

static inline bool blk_account_rq(struct request *rq)
{
	return (rq->rq_flags & RQF_STARTED) && !blk_rq_is_passthrough(rq);
}

#define list_entry_rq(ptr)	list_entry((ptr), struct request, queuelist)

#define rq_data_dir(rq)		(op_is_write(req_op(rq)) ? WRITE : READ)

#define rq_dma_dir(rq) \
	(op_is_write(req_op(rq)) ? DMA_TO_DEVICE : DMA_FROM_DEVICE)

#define dma_map_bvec(dev, bv, dir, attrs) \
	dma_map_page_attrs(dev, (bv)->bv_page, (bv)->bv_offset, (bv)->bv_len, \
	(dir), (attrs))

static inline bool queue_is_mq(struct request_queue *q)
{
	return q->mq_ops;
}

static inline enum blk_zoned_model
blk_queue_zoned_model(struct request_queue *q)
{
	return q->limits.zoned;
}

static inline bool blk_queue_is_zoned(struct request_queue *q)
{
	switch (blk_queue_zoned_model(q)) {
	case BLK_ZONED_HA:
	case BLK_ZONED_HM:
		return true;
	default:
		return false;
	}
}

static inline sector_t blk_queue_zone_sectors(struct request_queue *q)
{
	return blk_queue_is_zoned(q) ? q->limits.chunk_sectors : 0;
}

#ifdef CONFIG_BLK_DEV_ZONED
static inline unsigned int blk_queue_nr_zones(struct request_queue *q)
{
	return blk_queue_is_zoned(q) ? q->nr_zones : 0;
}

static inline unsigned int blk_queue_zone_no(struct request_queue *q,
					     sector_t sector)
{
	if (!blk_queue_is_zoned(q))
		return 0;
	return sector >> ilog2(q->limits.chunk_sectors);
}
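
/*
 * Worked example (illustrative only): on a host-managed drive with
 * 256 MiB zones, chunk_sectors is 524288, ilog2() of that is 19, and
 * blk_queue_zone_no(q, 1572864) == 1572864 >> 19 == 3.
 */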

static inline bool blk_queue_zone_is_seq(struct request_queue *q,
					 sector_t sector)
{
	if (!blk_queue_is_zoned(q))
		return false;
	if (!q->conv_zones_bitmap)
		return true;
	return !test_bit(blk_queue_zone_no(q, sector), q->conv_zones_bitmap);
}
#else /* CONFIG_BLK_DEV_ZONED */
static inline unsigned int blk_queue_nr_zones(struct request_queue *q)
{
	return 0;
}
static inline bool blk_queue_zone_is_seq(struct request_queue *q,
					 sector_t sector)
{
	return false;
}
static inline unsigned int blk_queue_zone_no(struct request_queue *q,
					     sector_t sector)
{
	return 0;
}
#endif /* CONFIG_BLK_DEV_ZONED */

static inline bool rq_is_sync(struct request *rq)
{
	return op_is_sync(rq->cmd_flags);
}

static inline bool rq_mergeable(struct request *rq)
{
	if (blk_rq_is_passthrough(rq))
		return false;

	if (req_op(rq) == REQ_OP_FLUSH)
		return false;

	if (req_op(rq) == REQ_OP_WRITE_ZEROES)
		return false;

	if (req_op(rq) == REQ_OP_ZONE_APPEND)
		return false;

	if (rq->cmd_flags & REQ_NOMERGE_FLAGS)
		return false;
	if (rq->rq_flags & RQF_NOMERGE_FLAGS)
		return false;

	return true;
}

static inline bool blk_write_same_mergeable(struct bio *a, struct bio *b)
{
	if (bio_page(a) == bio_page(b) &&
	    bio_offset(a) == bio_offset(b))
		return true;

	return false;
}

static inline unsigned int blk_queue_depth(struct request_queue *q)
{
	if (q->queue_depth)
		return q->queue_depth;

	return q->nr_requests;
}

extern unsigned long blk_max_low_pfn, blk_max_pfn;

/*
 * standard bounce addresses:
 *
 * BLK_BOUNCE_HIGH	: bounce all highmem pages
 * BLK_BOUNCE_ANY	: don't bounce anything
 * BLK_BOUNCE_ISA	: bounce pages above ISA DMA boundary
 */

#if BITS_PER_LONG == 32
#define BLK_BOUNCE_HIGH		((u64)blk_max_low_pfn << PAGE_SHIFT)
#else
#define BLK_BOUNCE_HIGH		-1ULL
#endif
#define BLK_BOUNCE_ANY		(-1ULL)
#define BLK_BOUNCE_ISA		(DMA_BIT_MASK(24))

/*
 * default timeout for SG_IO if none specified
 */
#define BLK_DEFAULT_SG_TIMEOUT	(60 * HZ)
#define BLK_MIN_SG_TIMEOUT	(7 * HZ)

struct rq_map_data {
	struct page **pages;
	int page_order;
	int nr_entries;
	unsigned long offset;
	int null_mapped;
	int from_user;
};

struct req_iterator {
	struct bvec_iter iter;
	struct bio *bio;
};

/* This should not be used directly - use rq_for_each_segment */
#define for_each_bio(_bio)		\
	for (; _bio; _bio = _bio->bi_next)
#define __rq_for_each_bio(_bio, rq)	\
	if ((rq->bio))			\
		for (_bio = (rq)->bio; _bio; _bio = _bio->bi_next)

#define rq_for_each_segment(bvl, _rq, _iter)			\
	__rq_for_each_bio(_iter.bio, _rq)			\
		bio_for_each_segment(bvl, _iter.bio, _iter.iter)

#define rq_for_each_bvec(bvl, _rq, _iter)			\
	__rq_for_each_bio(_iter.bio, _rq)			\
		bio_for_each_bvec(bvl, _iter.bio, _iter.iter)

#define rq_iter_last(bvec, _iter)				\
		(_iter.bio->bi_next == NULL &&			\
		 bio_iter_last(bvec, _iter.iter))
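
/*
 * Illustrative driver-side sketch (hypothetical code, not part of this
 * header): walking every segment of a request, e.g. to total up the
 * data length in a simple memory-backed driver.
 *
 *	struct req_iterator iter;
 *	struct bio_vec bvec;
 *	unsigned int bytes = 0;
 *
 *	rq_for_each_segment(bvec, rq, iter)
 *		bytes += bvec.bv_len;
 */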

#ifndef ARCH_IMPLEMENTS_FLUSH_DCACHE_PAGE
# error	"You should define ARCH_IMPLEMENTS_FLUSH_DCACHE_PAGE for your platform"
#endif
#if ARCH_IMPLEMENTS_FLUSH_DCACHE_PAGE
extern void rq_flush_dcache_pages(struct request *rq);
#else
static inline void rq_flush_dcache_pages(struct request *rq)
{
}
#endif

extern int blk_register_queue(struct gendisk *disk);
extern void blk_unregister_queue(struct gendisk *disk);
extern blk_qc_t generic_make_request(struct bio *bio);
extern blk_qc_t direct_make_request(struct bio *bio);
extern void blk_rq_init(struct request_queue *q, struct request *rq);
extern void blk_put_request(struct request *);
extern struct request *blk_get_request(struct request_queue *, unsigned int op,
				       blk_mq_req_flags_t flags);
extern int blk_lld_busy(struct request_queue *q);
extern int blk_rq_prep_clone(struct request *rq, struct request *rq_src,
			     struct bio_set *bs, gfp_t gfp_mask,
			     int (*bio_ctr)(struct bio *, struct bio *, void *),
			     void *data);
extern void blk_rq_unprep_clone(struct request *rq);
extern blk_status_t blk_insert_cloned_request(struct request_queue *q,
					      struct request *rq);
extern int blk_rq_append_bio(struct request *rq, struct bio **bio);
extern void blk_queue_split(struct request_queue *, struct bio **);
extern int scsi_verify_blk_ioctl(struct block_device *, unsigned int);
extern int scsi_cmd_blk_ioctl(struct block_device *, fmode_t,
			      unsigned int, void __user *);
extern int scsi_cmd_ioctl(struct request_queue *, struct gendisk *, fmode_t,
			  unsigned int, void __user *);
extern int sg_scsi_ioctl(struct request_queue *, struct gendisk *, fmode_t,
			 struct scsi_ioctl_command __user *);
extern int get_sg_io_hdr(struct sg_io_hdr *hdr, const void __user *argp);
extern int put_sg_io_hdr(const struct sg_io_hdr *hdr, void __user *argp);

extern int blk_queue_enter(struct request_queue *q, blk_mq_req_flags_t flags);
extern void blk_queue_exit(struct request_queue *q);
extern void blk_sync_queue(struct request_queue *q);
extern int blk_rq_map_user(struct request_queue *, struct request *,
			   struct rq_map_data *, void __user *, unsigned long,
			   gfp_t);
extern int blk_rq_unmap_user(struct bio *);
extern int blk_rq_map_kern(struct request_queue *, struct request *, void *, unsigned int, gfp_t);
extern int blk_rq_map_user_iov(struct request_queue *, struct request *,
			       struct rq_map_data *, const struct iov_iter *,
			       gfp_t);
extern void blk_execute_rq(struct request_queue *, struct gendisk *,
			   struct request *, int);
extern void blk_execute_rq_nowait(struct request_queue *, struct gendisk *,
				  struct request *, int, rq_end_io_fn *);

/* Helper to convert REQ_OP_XXX to its string format XXX */
extern const char *blk_op_str(unsigned int op);

int blk_status_to_errno(blk_status_t status);
blk_status_t errno_to_blk_status(int errno);

int blk_poll(struct request_queue *q, blk_qc_t cookie, bool spin);

static inline struct request_queue *bdev_get_queue(struct block_device *bdev)
{
	return bdev->bd_disk->queue;	/* this is never NULL */
}

/*
 * The basic unit of block I/O is a sector. It is used in a number of contexts
 * in Linux (blk, bio, genhd). The size of one sector is 512 = 2**9
 * bytes. Variables of type sector_t represent an offset or size that is a
 * multiple of 512 bytes. Hence these two constants.
 */
#ifndef SECTOR_SHIFT
#define SECTOR_SHIFT 9
#endif
#ifndef SECTOR_SIZE
#define SECTOR_SIZE (1 << SECTOR_SHIFT)
#endif
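
/*
 * For example, a 4 KiB I/O spans 4096 >> SECTOR_SHIFT == 8 sectors,
 * and a sector count converts back with nr_sects << SECTOR_SHIFT.
 */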

/*
 * blk_rq_pos()			: the current sector
 * blk_rq_bytes()		: bytes left in the entire request
 * blk_rq_cur_bytes()		: bytes left in the current segment
 * blk_rq_err_bytes()		: bytes left till the next error boundary
 * blk_rq_sectors()		: sectors left in the entire request
 * blk_rq_cur_sectors()		: sectors left in the current segment
 * blk_rq_stats_sectors()	: sectors of the entire request used for stats
 */
static inline sector_t blk_rq_pos(const struct request *rq)
{
	return rq->__sector;
}

static inline unsigned int blk_rq_bytes(const struct request *rq)
{
	return rq->__data_len;
}

static inline int blk_rq_cur_bytes(const struct request *rq)
{
	return rq->bio ? bio_cur_bytes(rq->bio) : 0;
}

extern unsigned int blk_rq_err_bytes(const struct request *rq);

static inline unsigned int blk_rq_sectors(const struct request *rq)
{
	return blk_rq_bytes(rq) >> SECTOR_SHIFT;
}

static inline unsigned int blk_rq_cur_sectors(const struct request *rq)
{
	return blk_rq_cur_bytes(rq) >> SECTOR_SHIFT;
}

static inline unsigned int blk_rq_stats_sectors(const struct request *rq)
{
	return rq->stats_sectors;
}
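
/*
 * Illustrative sketch (hypothetical driver code, field names assumed):
 * a driver translating a request into a device command would typically
 * combine the accessors above like so:
 *
 *	cmd->lba   = blk_rq_pos(rq);		// starting sector
 *	cmd->nsect = blk_rq_sectors(rq);	// sectors remaining
 *	cmd->write = rq_data_dir(rq) == WRITE;
 */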

#ifdef CONFIG_BLK_DEV_ZONED

/* Helper to convert BLK_ZONE_COND_XXX to its string format XXX */
const char *blk_zone_cond_str(enum blk_zone_cond zone_cond);

static inline unsigned int blk_rq_zone_no(struct request *rq)
{
	return blk_queue_zone_no(rq->q, blk_rq_pos(rq));
}

static inline unsigned int blk_rq_zone_is_seq(struct request *rq)
{
	return blk_queue_zone_is_seq(rq->q, blk_rq_pos(rq));
}
#endif /* CONFIG_BLK_DEV_ZONED */

/*
 * Some commands like WRITE SAME have a payload or data transfer size which
 * is different from the size of the request.  Any driver that supports such
 * commands using the RQF_SPECIAL_PAYLOAD flag needs to use this helper to
 * calculate the data transfer size.
 */
static inline unsigned int blk_rq_payload_bytes(struct request *rq)
{
	if (rq->rq_flags & RQF_SPECIAL_PAYLOAD)
		return rq->special_vec.bv_len;
	return blk_rq_bytes(rq);
}

/*
 * Return the first full biovec in the request.  The caller needs to check that
 * there are any bvecs before calling this helper.
 */
static inline struct bio_vec req_bvec(struct request *rq)
{
	if (rq->rq_flags & RQF_SPECIAL_PAYLOAD)
		return rq->special_vec;
	return mp_bvec_iter_bvec(rq->bio->bi_io_vec, rq->bio->bi_iter);
}

static inline unsigned int blk_queue_get_max_sectors(struct request_queue *q,
						     int op)
{
	if (unlikely(op == REQ_OP_DISCARD || op == REQ_OP_SECURE_ERASE))
		return min(q->limits.max_discard_sectors,
			   UINT_MAX >> SECTOR_SHIFT);

	if (unlikely(op == REQ_OP_WRITE_SAME))
		return q->limits.max_write_same_sectors;

	if (unlikely(op == REQ_OP_WRITE_ZEROES))
		return q->limits.max_write_zeroes_sectors;

	return q->limits.max_sectors;
}

/*
 * Return maximum size of a request at given offset. Only valid for
 * file system requests.
 */
static inline unsigned int blk_max_size_offset(struct request_queue *q,
					       sector_t offset)
{
	if (!q->limits.chunk_sectors)
		return q->limits.max_sectors;

	return min(q->limits.max_sectors, (unsigned int)(q->limits.chunk_sectors -
			(offset & (q->limits.chunk_sectors - 1))));
}
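
/*
 * Worked example (illustrative): with chunk_sectors = 128 and
 * max_sectors = 256, an I/O at offset 100 within a chunk can extend at
 * most 128 - (100 & 127) = 28 sectors to the chunk boundary, so the
 * helper returns min(256, 28) = 28.
 */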

static inline unsigned int blk_rq_get_max_sectors(struct request *rq,
						  sector_t offset)
{
	struct request_queue *q = rq->q;

	if (blk_rq_is_passthrough(rq))
		return q->limits.max_hw_sectors;

	if (!q->limits.chunk_sectors ||
	    req_op(rq) == REQ_OP_DISCARD ||
	    req_op(rq) == REQ_OP_SECURE_ERASE)
		return blk_queue_get_max_sectors(q, req_op(rq));

	return min(blk_max_size_offset(q, offset),
			blk_queue_get_max_sectors(q, req_op(rq)));
}

static inline unsigned int blk_rq_count_bios(struct request *rq)
{
	unsigned int nr_bios = 0;
	struct bio *bio;

	__rq_for_each_bio(bio, rq)
		nr_bios++;

	return nr_bios;
}

void blk_steal_bios(struct bio_list *list, struct request *rq);

/*
 * Request completion related functions.
 *
 * blk_update_request() completes given number of bytes and updates
 * the request without completing it.
 */
extern bool blk_update_request(struct request *rq, blk_status_t error,
			       unsigned int nr_bytes);

extern void blk_abort_request(struct request *);

/*
 * Access functions for manipulating queue properties
 */
extern void blk_cleanup_queue(struct request_queue *);
extern void blk_queue_bounce_limit(struct request_queue *, u64);
extern void blk_queue_max_hw_sectors(struct request_queue *, unsigned int);
extern void blk_queue_chunk_sectors(struct request_queue *, unsigned int);
extern void blk_queue_max_segments(struct request_queue *, unsigned short);
extern void blk_queue_max_discard_segments(struct request_queue *,
		unsigned short);
extern void blk_queue_max_segment_size(struct request_queue *, unsigned int);
extern void blk_queue_max_discard_sectors(struct request_queue *q,
		unsigned int max_discard_sectors);
extern void blk_queue_max_write_same_sectors(struct request_queue *q,
		unsigned int max_write_same_sectors);
extern void blk_queue_max_write_zeroes_sectors(struct request_queue *q,
		unsigned int max_write_same_sectors);
extern void blk_queue_logical_block_size(struct request_queue *, unsigned int);
extern void blk_queue_max_zone_append_sectors(struct request_queue *q,
		unsigned int max_zone_append_sectors);
extern void blk_queue_physical_block_size(struct request_queue *, unsigned int);
extern void blk_queue_alignment_offset(struct request_queue *q,
				       unsigned int alignment);
extern void blk_limits_io_min(struct queue_limits *limits, unsigned int min);
extern void blk_queue_io_min(struct request_queue *q, unsigned int min);
extern void blk_limits_io_opt(struct queue_limits *limits, unsigned int opt);
extern void blk_queue_io_opt(struct request_queue *q, unsigned int opt);
extern void blk_set_queue_depth(struct request_queue *q, unsigned int depth);
extern void blk_set_default_limits(struct queue_limits *lim);
extern void blk_set_stacking_limits(struct queue_limits *lim);
extern int blk_stack_limits(struct queue_limits *t, struct queue_limits *b,
			    sector_t offset);
extern int bdev_stack_limits(struct queue_limits *t, struct block_device *bdev,
			     sector_t offset);
extern void disk_stack_limits(struct gendisk *disk, struct block_device *bdev,
			      sector_t offset);
extern void blk_queue_stack_limits(struct request_queue *t, struct request_queue *b);
extern void blk_queue_update_dma_pad(struct request_queue *, unsigned int);
extern void blk_queue_segment_boundary(struct request_queue *, unsigned long);
extern void blk_queue_virt_boundary(struct request_queue *, unsigned long);
extern void blk_queue_dma_alignment(struct request_queue *, int);
extern void blk_queue_update_dma_alignment(struct request_queue *, int);
extern void blk_queue_rq_timeout(struct request_queue *, unsigned int);
extern void blk_queue_write_cache(struct request_queue *q, bool enabled, bool fua);
extern void blk_queue_required_elevator_features(struct request_queue *q,
						 unsigned int features);
extern bool blk_queue_can_use_dma_map_merging(struct request_queue *q,
					      struct device *dev);

/*
 * Number of physical segments as sent to the device.
 *
 * Normally this is the number of discontiguous data segments sent by the
 * submitter.  But for a data-less command like discard we might have no
 * actual data segments submitted, but the driver might have to add its
 * own special payload.  In that case we still return 1 here so that this
 * special payload will be mapped.
 */
static inline unsigned short blk_rq_nr_phys_segments(struct request *rq)
{
	if (rq->rq_flags & RQF_SPECIAL_PAYLOAD)
		return 1;
	return rq->nr_phys_segments;
}

/*
 * Number of discard segments (or ranges) the driver needs to fill in.
 * Each discard bio merged into a request is counted as one segment.
 */
static inline unsigned short blk_rq_nr_discard_segments(struct request *rq)
{
	return max_t(unsigned short, rq->nr_phys_segments, 1);
}

int __blk_rq_map_sg(struct request_queue *q, struct request *rq,
		struct scatterlist *sglist, struct scatterlist **last_sg);
static inline int blk_rq_map_sg(struct request_queue *q, struct request *rq,
		struct scatterlist *sglist)
{
	struct scatterlist *last_sg = NULL;

	return __blk_rq_map_sg(q, rq, sglist, &last_sg);
}
extern void blk_dump_rq_flags(struct request *, char *);
extern long nr_blockdev_pages(void);

bool __must_check blk_get_queue(struct request_queue *);
struct request_queue *blk_alloc_queue(make_request_fn make_request, int node_id);
extern void blk_put_queue(struct request_queue *);
extern void blk_set_queue_dying(struct request_queue *);

/*
 * blk_plug permits building a queue of related requests by holding the I/O
 * fragments for a short period. This allows merging of sequential requests
 * into a single larger request. As the requests are moved from a per-task
 * list to the device's request_queue in a batch, this results in improved
 * scalability as the lock contention for the request_queue lock is reduced.
 *
 * It is ok not to disable preemption when adding the request to the plug list
 * or when attempting a merge, because blk_schedule_flush_list() will only flush
 * the plug list when the task sleeps by itself. For details, please see
 * schedule() where blk_schedule_flush_plug() is called.
 */
struct blk_plug {
	struct list_head mq_list; /* blk-mq requests */
	struct list_head cb_list; /* md requires an unplug callback */
	unsigned short rq_count;
	bool multiple_queues;
};
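
/*
 * Typical submitter-side usage (illustrative sketch): batch a series of
 * bios under one plug so that they can be merged and dispatched
 * together when the plug is finished.
 *
 *	struct blk_plug plug;
 *
 *	blk_start_plug(&plug);
 *	// submit several sequential bios, e.g. via submit_bio()
 *	blk_finish_plug(&plug);
 */
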
#define BLK_MAX_REQUEST_COUNT 16
#define BLK_PLUG_FLUSH_SIZE (128 * 1024)

struct blk_plug_cb;
typedef void (*blk_plug_cb_fn)(struct blk_plug_cb *, bool);
struct blk_plug_cb {
	struct list_head list;
	blk_plug_cb_fn callback;
	void *data;
};
extern struct blk_plug_cb *blk_check_plugged(blk_plug_cb_fn unplug,
					     void *data, int size);
extern void blk_start_plug(struct blk_plug *);
extern void blk_finish_plug(struct blk_plug *);
extern void blk_flush_plug_list(struct blk_plug *, bool);

static inline void blk_flush_plug(struct task_struct *tsk)
{
	struct blk_plug *plug = tsk->plug;

	if (plug)
		blk_flush_plug_list(plug, false);
}

static inline void blk_schedule_flush_plug(struct task_struct *tsk)
{
	struct blk_plug *plug = tsk->plug;

	if (plug)
		blk_flush_plug_list(plug, true);
}

static inline bool blk_needs_flush_plug(struct task_struct *tsk)
{
	struct blk_plug *plug = tsk->plug;

	return plug &&
		 (!list_empty(&plug->mq_list) ||
		 !list_empty(&plug->cb_list));
}

extern void blk_io_schedule(void);

int blkdev_issue_flush(struct block_device *, gfp_t);
extern int blkdev_issue_write_same(struct block_device *bdev, sector_t sector,
		sector_t nr_sects, gfp_t gfp_mask, struct page *page);

#define BLKDEV_DISCARD_SECURE	(1 << 0)	/* issue a secure erase */

extern int blkdev_issue_discard(struct block_device *bdev, sector_t sector,
		sector_t nr_sects, gfp_t gfp_mask, unsigned long flags);
extern int __blkdev_issue_discard(struct block_device *bdev, sector_t sector,
		sector_t nr_sects, gfp_t gfp_mask, int flags,
		struct bio **biop);

#define BLKDEV_ZERO_NOUNMAP	(1 << 0)  /* do not free blocks */
#define BLKDEV_ZERO_NOFALLBACK	(1 << 1)  /* don't write explicit zeroes */

extern int __blkdev_issue_zeroout(struct block_device *bdev, sector_t sector,
		sector_t nr_sects, gfp_t gfp_mask, struct bio **biop,
		unsigned flags);
extern int blkdev_issue_zeroout(struct block_device *bdev, sector_t sector,
		sector_t nr_sects, gfp_t gfp_mask, unsigned flags);

static inline int sb_issue_discard(struct super_block *sb, sector_t block,
		sector_t nr_blocks, gfp_t gfp_mask, unsigned long flags)
{
	return blkdev_issue_discard(sb->s_bdev,
				    block << (sb->s_blocksize_bits -
					      SECTOR_SHIFT),
				    nr_blocks << (sb->s_blocksize_bits -
						  SECTOR_SHIFT),
				    gfp_mask, flags);
}
static inline int sb_issue_zeroout(struct super_block *sb, sector_t block,
		sector_t nr_blocks, gfp_t gfp_mask)
{
	return blkdev_issue_zeroout(sb->s_bdev,
				    block << (sb->s_blocksize_bits -
					      SECTOR_SHIFT),
				    nr_blocks << (sb->s_blocksize_bits -
						  SECTOR_SHIFT),
				    gfp_mask, 0);
}

extern int blk_verify_command(unsigned char *cmd, fmode_t mode);

enum blk_default_limits {
	BLK_MAX_SEGMENTS	= 128,
	BLK_SAFE_MAX_SECTORS	= 255,
	BLK_DEF_MAX_SECTORS	= 2560,
	BLK_MAX_SEGMENT_SIZE	= 65536,
	BLK_SEG_BOUNDARY_MASK	= 0xFFFFFFFFUL,
};

static inline unsigned long queue_segment_boundary(const struct request_queue *q)
{
	return q->limits.seg_boundary_mask;
}

static inline unsigned long queue_virt_boundary(const struct request_queue *q)
{
	return q->limits.virt_boundary_mask;
}

static inline unsigned int queue_max_sectors(const struct request_queue *q)
{
	return q->limits.max_sectors;
}

static inline unsigned int queue_max_hw_sectors(const struct request_queue *q)
{
	return q->limits.max_hw_sectors;
}

static inline unsigned short queue_max_segments(const struct request_queue *q)
{
	return q->limits.max_segments;
}

static inline unsigned short queue_max_discard_segments(const struct request_queue *q)
{
	return q->limits.max_discard_segments;
}

static inline unsigned int queue_max_segment_size(const struct request_queue *q)
{
	return q->limits.max_segment_size;
}

static inline unsigned int queue_max_zone_append_sectors(const struct request_queue *q)
{
	return q->limits.max_zone_append_sectors;
}

static inline unsigned queue_logical_block_size(const struct request_queue *q)
{
	int retval = 512;

	if (q && q->limits.logical_block_size)
		retval = q->limits.logical_block_size;

	return retval;
}

static inline unsigned int bdev_logical_block_size(struct block_device *bdev)
{
	return queue_logical_block_size(bdev_get_queue(bdev));
}

static inline unsigned int queue_physical_block_size(const struct request_queue *q)
{
	return q->limits.physical_block_size;
}

static inline unsigned int bdev_physical_block_size(struct block_device *bdev)
{
	return queue_physical_block_size(bdev_get_queue(bdev));
}

static inline unsigned int queue_io_min(const struct request_queue *q)
{
	return q->limits.io_min;
}

static inline int bdev_io_min(struct block_device *bdev)
{
	return queue_io_min(bdev_get_queue(bdev));
}

static inline unsigned int queue_io_opt(const struct request_queue *q)
{
	return q->limits.io_opt;
}

static inline int bdev_io_opt(struct block_device *bdev)
{
	return queue_io_opt(bdev_get_queue(bdev));
}

static inline int queue_alignment_offset(const struct request_queue *q)
{
	if (q->limits.misaligned)
		return -1;

	return q->limits.alignment_offset;
}

static inline int queue_limit_alignment_offset(struct queue_limits *lim, sector_t sector)
{
	unsigned int granularity = max(lim->physical_block_size, lim->io_min);
	unsigned int alignment = sector_div(sector, granularity >> SECTOR_SHIFT)
		<< SECTOR_SHIFT;

	return (granularity + lim->alignment_offset - alignment) % granularity;
}
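
/*
 * Worked example (illustrative): with physical_block_size = io_min =
 * 4096 (granularity 4096 bytes, or 8 sectors) and alignment_offset = 0,
 * a partition starting at sector 7 gives alignment = (7 % 8) << 9 =
 * 3584, so the helper returns (4096 + 0 - 3584) % 4096 = 512 bytes.
 */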

static inline int bdev_alignment_offset(struct block_device *bdev)
{
	struct request_queue *q = bdev_get_queue(bdev);

	if (q->limits.misaligned)
		return -1;

	if (bdev != bdev->bd_contains)
		return bdev->bd_part->alignment_offset;

	return q->limits.alignment_offset;
}

static inline int queue_discard_alignment(const struct request_queue *q)
{
	if (q->limits.discard_misaligned)
		return -1;

	return q->limits.discard_alignment;
}

static inline int queue_limit_discard_alignment(struct queue_limits *lim, sector_t sector)
{
	unsigned int alignment, granularity, offset;

	if (!lim->max_discard_sectors)
		return 0;

	/* Why are these in bytes, not sectors? */
	alignment = lim->discard_alignment >> SECTOR_SHIFT;
	granularity = lim->discard_granularity >> SECTOR_SHIFT;
	if (!granularity)
		return 0;

	/* Offset of the partition start in 'granularity' sectors */
	offset = sector_div(sector, granularity);

	/* And why do we do this modulus *again* in blkdev_issue_discard()? */
	offset = (granularity + alignment - offset) % granularity;

	/* Turn it back into bytes, gaah */
	return offset << SECTOR_SHIFT;
}
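
/*
 * Worked example (illustrative): with discard_granularity = 1 MiB
 * (2048 sectors after the shift) and discard_alignment = 0, a partition
 * starting at sector 3072 sits 1024 sectors into a granule, so
 * offset = (2048 + 0 - 1024) % 2048 = 1024 sectors, returned as
 * 1024 << 9 = 512 KiB.
 */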

static inline int bdev_discard_alignment(struct block_device *bdev)
{
	struct request_queue *q = bdev_get_queue(bdev);

	if (bdev != bdev->bd_contains)
		return bdev->bd_part->discard_alignment;

	return q->limits.discard_alignment;
}

static inline unsigned int bdev_write_same(struct block_device *bdev)
{
	struct request_queue *q = bdev_get_queue(bdev);

	if (q)
		return q->limits.max_write_same_sectors;

	return 0;
}

static inline unsigned int bdev_write_zeroes_sectors(struct block_device *bdev)
{
	struct request_queue *q = bdev_get_queue(bdev);

	if (q)
		return q->limits.max_write_zeroes_sectors;

	return 0;
}

static inline enum blk_zoned_model bdev_zoned_model(struct block_device *bdev)
{
	struct request_queue *q = bdev_get_queue(bdev);

	if (q)
		return blk_queue_zoned_model(q);

	return BLK_ZONED_NONE;
}

static inline bool bdev_is_zoned(struct block_device *bdev)
{
	struct request_queue *q = bdev_get_queue(bdev);

	if (q)
		return blk_queue_is_zoned(q);

	return false;
}

static inline sector_t bdev_zone_sectors(struct block_device *bdev)
{
	struct request_queue *q = bdev_get_queue(bdev);

	if (q)
		return blk_queue_zone_sectors(q);
	return 0;
}

static inline int queue_dma_alignment(const struct request_queue *q)
{
	return q ? q->dma_alignment : 511;
}

static inline int blk_rq_aligned(struct request_queue *q, unsigned long addr,
				 unsigned int len)
{
	unsigned int alignment = queue_dma_alignment(q) | q->dma_pad_mask;
	return !(addr & alignment) && !(len & alignment);
}
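
/*
 * Example of the mask check above (illustrative, assuming no pad mask):
 * with the default dma_alignment of 511, both addr and len must be
 * 512-byte aligned; blk_rq_aligned(q, 0x1000, 1024) passes, while an
 * addr of 0x1001 or a len of 1000 would fail.
 */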

/* assumes size > 256 */
static inline unsigned int blksize_bits(unsigned int size)
{
	unsigned int bits = 8;
	do {
		bits++;
		size >>= 1;
	} while (size > 256);
	return bits;
}
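
/*
 * For instance, blksize_bits(512) == 9, blksize_bits(1024) == 10 and
 * blksize_bits(4096) == 12: the loop computes log2 of the block size
 * by repeated halving.
 */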
1513
2befb9e3 1514static inline unsigned int block_size(struct block_device *bdev)
1da177e4
LT
1515{
1516 return bdev->bd_block_size;
1517}
1518
59c3d45e 1519int kblockd_schedule_work(struct work_struct *work);
818cd1cb 1520int kblockd_mod_delayed_work_on(int cpu, struct delayed_work *dwork, unsigned long delay);
1da177e4 1521
1da177e4
LT
1522#define MODULE_ALIAS_BLOCKDEV(major,minor) \
1523 MODULE_ALIAS("block-major-" __stringify(major) "-" __stringify(minor))
1524#define MODULE_ALIAS_BLOCKDEV_MAJOR(major) \
1525 MODULE_ALIAS("block-major-" __stringify(major) "-*")
1526
7ba1ba12
MP
1527#if defined(CONFIG_BLK_DEV_INTEGRITY)
1528

enum blk_integrity_flags {
	BLK_INTEGRITY_VERIFY		= 1 << 0,
	BLK_INTEGRITY_GENERATE		= 1 << 1,
	BLK_INTEGRITY_DEVICE_CAPABLE	= 1 << 2,
	BLK_INTEGRITY_IP_CHECKSUM	= 1 << 3,
};

struct blk_integrity_iter {
	void			*prot_buf;
	void			*data_buf;
	sector_t		seed;
	unsigned int		data_size;
	unsigned short		interval;
	const char		*disk_name;
};

typedef blk_status_t (integrity_processing_fn) (struct blk_integrity_iter *);
typedef void (integrity_prepare_fn) (struct request *);
typedef void (integrity_complete_fn) (struct request *, unsigned int);

struct blk_integrity_profile {
	integrity_processing_fn		*generate_fn;
	integrity_processing_fn		*verify_fn;
	integrity_prepare_fn		*prepare_fn;
	integrity_complete_fn		*complete_fn;
	const char			*name;
};

extern void blk_integrity_register(struct gendisk *, struct blk_integrity *);
extern void blk_integrity_unregister(struct gendisk *);
extern int blk_integrity_compare(struct gendisk *, struct gendisk *);
extern int blk_rq_map_integrity_sg(struct request_queue *, struct bio *,
				   struct scatterlist *);
extern int blk_rq_count_integrity_sg(struct request_queue *, struct bio *);
extern bool blk_integrity_merge_rq(struct request_queue *, struct request *,
				   struct request *);
extern bool blk_integrity_merge_bio(struct request_queue *, struct request *,
				    struct bio *);
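
/*
 * Editor's example (sketch): a driver exposing 8 bytes of protection
 * information per 4096-byte interval might register itself roughly like
 * this (the "example_*" names are hypothetical):
 *
 *	static const struct blk_integrity_profile example_profile = {
 *		.name		= "EXAMPLE-PI",
 *		.generate_fn	= example_generate,
 *		.verify_fn	= example_verify,
 *	};
 *
 *	struct blk_integrity bi = {
 *		.profile	= &example_profile,
 *		.tuple_size	= 8,
 *		.interval_exp	= 12,	(ilog2 of the 4096-byte interval)
 *		.flags		= BLK_INTEGRITY_VERIFY | BLK_INTEGRITY_GENERATE,
 *	};
 *	blk_integrity_register(disk, &bi);
 */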

static inline struct blk_integrity *blk_get_integrity(struct gendisk *disk)
{
	struct blk_integrity *bi = &disk->queue->integrity;

	if (!bi->profile)
		return NULL;

	return bi;
}

static inline
struct blk_integrity *bdev_get_integrity(struct block_device *bdev)
{
	return blk_get_integrity(bdev->bd_disk);
}

static inline bool
blk_integrity_queue_supports_integrity(struct request_queue *q)
{
	return q->integrity.profile;
}

static inline bool blk_integrity_rq(struct request *rq)
{
	return rq->cmd_flags & REQ_INTEGRITY;
}

static inline void blk_queue_max_integrity_segments(struct request_queue *q,
						    unsigned int segs)
{
	q->limits.max_integrity_segments = segs;
}

static inline unsigned short
queue_max_integrity_segments(const struct request_queue *q)
{
	return q->limits.max_integrity_segments;
}

/**
 * bio_integrity_intervals - Return number of integrity intervals for a bio
 * @bi:		blk_integrity profile for device
 * @sectors:	Size of the bio in 512-byte sectors
 *
 * Description: The block layer calculates everything in 512 byte
 * sectors but integrity metadata is done in terms of the data integrity
 * interval size of the storage device.  Convert the block layer sectors
 * to the appropriate number of integrity intervals.
 */
static inline unsigned int bio_integrity_intervals(struct blk_integrity *bi,
						   unsigned int sectors)
{
	return sectors >> (bi->interval_exp - 9);
}

static inline unsigned int bio_integrity_bytes(struct blk_integrity *bi,
					       unsigned int sectors)
{
	return bio_integrity_intervals(bi, sectors) * bi->tuple_size;
}
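
/*
 * Editor's example: with a 4096-byte integrity interval (interval_exp ==
 * 12) and an 8-byte tuple, a 32-sector (16 KiB) bio covers
 * 32 >> (12 - 9) == 4 intervals, so bio_integrity_bytes() reports
 * 4 * 8 == 32 bytes of metadata.
 */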

/*
 * Return the first bvec that contains integrity data.  Only drivers that are
 * limited to a single integrity segment should use this helper.
 */
static inline struct bio_vec *rq_integrity_vec(struct request *rq)
{
	if (WARN_ON_ONCE(queue_max_integrity_segments(rq->q) > 1))
		return NULL;
	return rq->bio->bi_integrity->bip_vec;
}

#else /* CONFIG_BLK_DEV_INTEGRITY */

struct bio;
struct block_device;
struct gendisk;
struct blk_integrity;

static inline int blk_integrity_rq(struct request *rq)
{
	return 0;
}
static inline int blk_rq_count_integrity_sg(struct request_queue *q,
					    struct bio *b)
{
	return 0;
}
static inline int blk_rq_map_integrity_sg(struct request_queue *q,
					  struct bio *b,
					  struct scatterlist *s)
{
	return 0;
}
static inline struct blk_integrity *bdev_get_integrity(struct block_device *b)
{
	return NULL;
}
static inline struct blk_integrity *blk_get_integrity(struct gendisk *disk)
{
	return NULL;
}
static inline bool
blk_integrity_queue_supports_integrity(struct request_queue *q)
{
	return false;
}
static inline int blk_integrity_compare(struct gendisk *a, struct gendisk *b)
{
	return 0;
}
static inline void blk_integrity_register(struct gendisk *d,
					  struct blk_integrity *b)
{
}
static inline void blk_integrity_unregister(struct gendisk *d)
{
}
static inline void blk_queue_max_integrity_segments(struct request_queue *q,
						    unsigned int segs)
{
}
static inline unsigned short queue_max_integrity_segments(const struct request_queue *q)
{
	return 0;
}
static inline bool blk_integrity_merge_rq(struct request_queue *rq,
					  struct request *r1,
					  struct request *r2)
{
	return true;
}
static inline bool blk_integrity_merge_bio(struct request_queue *rq,
					   struct request *r,
					   struct bio *b)
{
	return true;
}

static inline unsigned int bio_integrity_intervals(struct blk_integrity *bi,
						   unsigned int sectors)
{
	return 0;
}

static inline unsigned int bio_integrity_bytes(struct blk_integrity *bi,
					       unsigned int sectors)
{
	return 0;
}

static inline struct bio_vec *rq_integrity_vec(struct request *rq)
{
	return NULL;
}

#endif /* CONFIG_BLK_DEV_INTEGRITY */

#ifdef CONFIG_BLK_INLINE_ENCRYPTION

bool blk_ksm_register(struct blk_keyslot_manager *ksm, struct request_queue *q);

void blk_ksm_unregister(struct request_queue *q);

#else /* CONFIG_BLK_INLINE_ENCRYPTION */

static inline bool blk_ksm_register(struct blk_keyslot_manager *ksm,
				    struct request_queue *q)
{
	return true;
}

static inline void blk_ksm_unregister(struct request_queue *q) { }

#endif /* CONFIG_BLK_INLINE_ENCRYPTION */
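
/*
 * Editor's example (sketch): an inline-encryption-capable driver would
 * hand its keyslot manager to the block layer during queue setup, e.g.
 *
 *	if (!blk_ksm_register(&dev->ksm, q))
 *		pr_warn("failed to register crypto capabilities\n");
 *
 * where "dev->ksm" is a hypothetical driver-private blk_keyslot_manager.
 * The !CONFIG_BLK_INLINE_ENCRYPTION stubs above let such code compile
 * away cleanly when the feature is disabled.
 */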

struct block_device_operations {
	int (*open) (struct block_device *, fmode_t);
	void (*release) (struct gendisk *, fmode_t);
	int (*rw_page)(struct block_device *, sector_t, struct page *, unsigned int);
	int (*ioctl) (struct block_device *, fmode_t, unsigned, unsigned long);
	int (*compat_ioctl) (struct block_device *, fmode_t, unsigned, unsigned long);
	unsigned int (*check_events) (struct gendisk *disk,
				      unsigned int clearing);
	/* ->media_changed() is DEPRECATED, use ->check_events() instead */
	int (*media_changed) (struct gendisk *);
	void (*unlock_native_capacity) (struct gendisk *);
	int (*revalidate_disk) (struct gendisk *);
	int (*getgeo)(struct block_device *, struct hd_geometry *);
	/* this callback is with swap_lock and sometimes page table lock held */
	void (*swap_slot_free_notify) (struct block_device *, unsigned long);
	int (*report_zones)(struct gendisk *, sector_t sector,
			unsigned int nr_zones, report_zones_cb cb, void *data);
	char *(*devnode)(struct gendisk *disk, umode_t *mode);
	struct module *owner;
	const struct pr_ops *pr_ops;
};
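
/*
 * Editor's example (sketch): most drivers implement only a handful of
 * these hooks; the "example_*" callbacks below are hypothetical.
 *
 *	static const struct block_device_operations example_fops = {
 *		.owner		= THIS_MODULE,
 *		.open		= example_open,
 *		.release	= example_release,
 *		.getgeo		= example_getgeo,
 *	};
 */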

#ifdef CONFIG_COMPAT
extern int blkdev_compat_ptr_ioctl(struct block_device *, fmode_t,
				   unsigned int, unsigned long);
#else
#define blkdev_compat_ptr_ioctl NULL
#endif

extern int __blkdev_driver_ioctl(struct block_device *, fmode_t, unsigned int,
				 unsigned long);
extern int bdev_read_page(struct block_device *, sector_t, struct page *);
extern int bdev_write_page(struct block_device *, sector_t, struct page *,
			   struct writeback_control *);

#ifdef CONFIG_BLK_DEV_ZONED
bool blk_req_needs_zone_write_lock(struct request *rq);
bool blk_req_zone_write_trylock(struct request *rq);
void __blk_req_zone_write_lock(struct request *rq);
void __blk_req_zone_write_unlock(struct request *rq);

static inline void blk_req_zone_write_lock(struct request *rq)
{
	if (blk_req_needs_zone_write_lock(rq))
		__blk_req_zone_write_lock(rq);
}

static inline void blk_req_zone_write_unlock(struct request *rq)
{
	if (rq->rq_flags & RQF_ZONE_WRITE_LOCKED)
		__blk_req_zone_write_unlock(rq);
}

static inline bool blk_req_zone_is_write_locked(struct request *rq)
{
	return rq->q->seq_zones_wlock &&
	       test_bit(blk_rq_zone_no(rq), rq->q->seq_zones_wlock);
}

static inline bool blk_req_can_dispatch_to_zone(struct request *rq)
{
	if (!blk_req_needs_zone_write_lock(rq))
		return true;
	return !blk_req_zone_is_write_locked(rq);
}
#else
static inline bool blk_req_needs_zone_write_lock(struct request *rq)
{
	return false;
}

static inline void blk_req_zone_write_lock(struct request *rq)
{
}

static inline void blk_req_zone_write_unlock(struct request *rq)
{
}

static inline bool blk_req_zone_is_write_locked(struct request *rq)
{
	return false;
}

static inline bool blk_req_can_dispatch_to_zone(struct request *rq)
{
	return true;
}
#endif /* CONFIG_BLK_DEV_ZONED */
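
/*
 * Editor's example (sketch): a dispatch path (e.g. a hypothetical
 * ->queue_rq() implementation) serializes writes per zone with the
 * helpers above:
 *
 *	if (!blk_req_can_dispatch_to_zone(rq))
 *		return BLK_STS_RESOURCE;	(zone busy, retry later)
 *	blk_req_zone_write_lock(rq);
 *	... issue rq; call blk_req_zone_write_unlock(rq) on completion ...
 */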

#else /* CONFIG_BLOCK */

struct block_device;

/*
 * stubs for when the block layer is configured out
 */

static inline long nr_blockdev_pages(void)
{
	return 0;
}

struct blk_plug {
};

static inline void blk_start_plug(struct blk_plug *plug)
{
}

static inline void blk_finish_plug(struct blk_plug *plug)
{
}

static inline void blk_flush_plug(struct task_struct *task)
{
}

static inline void blk_schedule_flush_plug(struct task_struct *task)
{
}

static inline bool blk_needs_flush_plug(struct task_struct *tsk)
{
	return false;
}

static inline int blkdev_issue_flush(struct block_device *bdev, gfp_t gfp_mask)
{
	return 0;
}

#endif /* CONFIG_BLOCK */

static inline void blk_wake_io_task(struct task_struct *waiter)
{
	/*
	 * If we're polling, the task itself is doing the completions.  In
	 * that case we don't need to signal a wakeup; it's enough to just
	 * mark us as RUNNING.
	 */
	if (waiter == current)
		__set_current_state(TASK_RUNNING);
	else
		wake_up_process(waiter);
}

#ifdef CONFIG_BLOCK
unsigned long disk_start_io_acct(struct gendisk *disk, unsigned int sectors,
				 unsigned int op);
void disk_end_io_acct(struct gendisk *disk, unsigned int op,
		      unsigned long start_time);

/**
 * bio_start_io_acct - start I/O accounting for bio based drivers
 * @bio:	bio to start accounting for
 *
 * Returns the start time that should be passed back to bio_end_io_acct().
 */
static inline unsigned long bio_start_io_acct(struct bio *bio)
{
	return disk_start_io_acct(bio->bi_disk, bio_sectors(bio), bio_op(bio));
}

/**
 * bio_end_io_acct - end I/O accounting for bio based drivers
 * @bio:	bio to end accounting for
 * @start_time:	start time returned by bio_start_io_acct()
 */
static inline void bio_end_io_acct(struct bio *bio, unsigned long start_time)
{
	disk_end_io_acct(bio->bi_disk, bio_op(bio), start_time);
}
#endif /* CONFIG_BLOCK */
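
/*
 * Editor's example (sketch): a bio-based driver brackets each bio with the
 * accounting helpers above:
 *
 *	unsigned long start = bio_start_io_acct(bio);
 *	... process the bio ...
 *	bio_end_io_acct(bio, start);
 */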

int bdev_read_only(struct block_device *bdev);
int set_blocksize(struct block_device *bdev, int size);

const char *bdevname(struct block_device *bdev, char *buffer);
struct block_device *lookup_bdev(const char *);

void blkdev_show(struct seq_file *seqf, off_t offset);

#define BDEVNAME_SIZE	32	/* Largest string for a blockdev identifier */
#define BDEVT_SIZE	10	/* Largest string for MAJ:MIN for blkdev */
#ifdef CONFIG_BLOCK
#define BLKDEV_MAJOR_MAX	512
#else
#define BLKDEV_MAJOR_MAX	0
#endif

int blkdev_get(struct block_device *bdev, fmode_t mode, void *holder);
struct block_device *blkdev_get_by_path(const char *path, fmode_t mode,
		void *holder);
struct block_device *blkdev_get_by_dev(dev_t dev, fmode_t mode, void *holder);
struct block_device *bd_start_claiming(struct block_device *bdev, void *holder);
void bd_abort_claiming(struct block_device *bdev, struct block_device *whole,
		void *holder);
void blkdev_put(struct block_device *bdev, fmode_t mode);
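
/*
 * Editor's example (sketch): the usual open-by-path pattern.  The path and
 * holder below are illustrative; the mode passed to blkdev_put() must match
 * the one used to open the device:
 *
 *	struct block_device *bdev;
 *
 *	bdev = blkdev_get_by_path("/dev/example", FMODE_READ | FMODE_EXCL,
 *				  holder);
 *	if (IS_ERR(bdev))
 *		return PTR_ERR(bdev);
 *	...
 *	blkdev_put(bdev, FMODE_READ | FMODE_EXCL);
 */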

struct block_device *bdget(dev_t);
struct block_device *bdgrab(struct block_device *bdev);
void bdput(struct block_device *);

#ifdef CONFIG_BLOCK
void invalidate_bdev(struct block_device *bdev);
int sync_blockdev(struct block_device *bdev);
#else
static inline void invalidate_bdev(struct block_device *bdev)
{
}
static inline int sync_blockdev(struct block_device *bdev)
{
	return 0;
}
#endif
int fsync_bdev(struct block_device *bdev);

struct super_block *freeze_bdev(struct block_device *bdev);
int thaw_bdev(struct block_device *bdev, struct super_block *sb);

#endif /* _LINUX_BLKDEV_H */