blk-mq: Relocate hctx_may_queue()
[linux-block.git] / include / linux / blkdev.h
CommitLineData
b2441318 1/* SPDX-License-Identifier: GPL-2.0 */
1da177e4
LT
2#ifndef _LINUX_BLKDEV_H
3#define _LINUX_BLKDEV_H
4
85fd0bc9 5#include <linux/sched.h>
e6017571 6#include <linux/sched/clock.h>
1da177e4
LT
7#include <linux/major.h>
8#include <linux/genhd.h>
9#include <linux/list.h>
320ae51f 10#include <linux/llist.h>
1da177e4
LT
11#include <linux/timer.h>
12#include <linux/workqueue.h>
13#include <linux/pagemap.h>
66114cad 14#include <linux/backing-dev-defs.h>
1da177e4
LT
15#include <linux/wait.h>
16#include <linux/mempool.h>
34c0fd54 17#include <linux/pfn.h>
1da177e4 18#include <linux/bio.h>
1da177e4 19#include <linux/stringify.h>
3e6053d7 20#include <linux/gfp.h>
d351af01 21#include <linux/bsg.h>
c7c22e4d 22#include <linux/smp.h>
548bc8e1 23#include <linux/rcupdate.h>
add703fd 24#include <linux/percpu-refcount.h>
84be456f 25#include <linux/scatterlist.h>
6a0cb1bc 26#include <linux/blkzoned.h>
db04e18d 27#include <linux/pm.h>
1da177e4 28
de477254 29struct module;
21b2f0c8
CH
30struct scsi_ioctl_command;
31
1da177e4 32struct request_queue;
1da177e4 33struct elevator_queue;
2056a782 34struct blk_trace;
3d6392cf
JA
35struct request;
36struct sg_io_hdr;
aa387cc8 37struct bsg_job;
3c798398 38struct blkcg_gq;
7c94e1c1 39struct blk_flush_queue;
bbd3e064 40struct pr_ops;
a7905043 41struct rq_qos;
34dbad5d
OS
42struct blk_queue_stats;
43struct blk_stat_callback;
1b262839 44struct blk_keyslot_manager;
1da177e4
LT
45
46#define BLKDEV_MIN_RQ 4
47#define BLKDEV_MAX_RQ 128 /* Default maximum */
48
096392e0 49/* Must be consistent with blk_mq_poll_stats_bkt() */
0206319f
SB
50#define BLK_MQ_POLL_STATS_BKTS 16
51
29ece8b4
YY
52/* Doing classic polling */
53#define BLK_MQ_POLL_CLASSIC -1
54
8bd435b3
TH
55/*
56 * Maximum number of blkcg policies allowed to be registered concurrently.
57 * Defined here to simplify include dependency.
58 */
01c5f85a 59#define BLKCG_MAX_POLS 5
8bd435b3 60
2a842aca 61typedef void (rq_end_io_fn)(struct request *, blk_status_t);
1da177e4 62
e8064021
CH
63/*
64 * request flags */
65typedef __u32 __bitwise req_flags_t;
66
67/* elevator knows about this request */
68#define RQF_SORTED ((__force req_flags_t)(1 << 0))
69/* drive already may have started this one */
70#define RQF_STARTED ((__force req_flags_t)(1 << 1))
e8064021
CH
71/* may not be passed by ioscheduler */
72#define RQF_SOFTBARRIER ((__force req_flags_t)(1 << 3))
73/* request for flush sequence */
74#define RQF_FLUSH_SEQ ((__force req_flags_t)(1 << 4))
75/* merge of different types, fail separately */
76#define RQF_MIXED_MERGE ((__force req_flags_t)(1 << 5))
77/* track inflight for MQ */
78#define RQF_MQ_INFLIGHT ((__force req_flags_t)(1 << 6))
79/* don't call prep for this one */
80#define RQF_DONTPREP ((__force req_flags_t)(1 << 7))
81/* set for "ide_preempt" requests and also for requests for which the SCSI
82 "quiesce" state must be ignored. */
83#define RQF_PREEMPT ((__force req_flags_t)(1 << 8))
e8064021
CH
84/* vaguely specified driver internal error. Ignored by the block layer */
85#define RQF_FAILED ((__force req_flags_t)(1 << 10))
86/* don't warn about errors */
87#define RQF_QUIET ((__force req_flags_t)(1 << 11))
88/* elevator private data attached */
89#define RQF_ELVPRIV ((__force req_flags_t)(1 << 12))
4822e902 90/* account into disk and partition IO statistics */
e8064021
CH
91#define RQF_IO_STAT ((__force req_flags_t)(1 << 13))
92/* request came from our alloc pool */
93#define RQF_ALLOCED ((__force req_flags_t)(1 << 14))
94/* runtime pm request */
95#define RQF_PM ((__force req_flags_t)(1 << 15))
96/* on IO scheduler merge hash */
97#define RQF_HASHED ((__force req_flags_t)(1 << 16))
4822e902 98/* track IO completion time */
cf43e6be 99#define RQF_STATS ((__force req_flags_t)(1 << 17))
f9d03f96
CH
100/* Look at ->special_vec for the actual data payload instead of the
101 bio chain. */
102#define RQF_SPECIAL_PAYLOAD ((__force req_flags_t)(1 << 18))
6cc77e9c
CH
103/* The per-zone write lock is held for this request */
104#define RQF_ZONE_WRITE_LOCKED ((__force req_flags_t)(1 << 19))
76a86f9d 105/* already slept for hybrid poll */
12f5b931 106#define RQF_MQ_POLL_SLEPT ((__force req_flags_t)(1 << 20))
da661267
CH
107/* ->timeout has been called, don't expire again */
108#define RQF_TIMED_OUT ((__force req_flags_t)(1 << 21))
e8064021
CH
109
110/* flags that prevent us from merging requests: */
111#define RQF_NOMERGE_FLAGS \
f9d03f96 112 (RQF_STARTED | RQF_SOFTBARRIER | RQF_FLUSH_SEQ | RQF_SPECIAL_PAYLOAD)
e8064021 113
12f5b931
KB
114/*
115 * Request state for blk-mq.
116 */
117enum mq_rq_state {
118 MQ_RQ_IDLE = 0,
119 MQ_RQ_IN_FLIGHT = 1,
120 MQ_RQ_COMPLETE = 2,
121};
122
1da177e4 123/*
af76e555
CH
124 * Try to put the fields that are referenced together in the same cacheline.
125 *
126 * If you modify this structure, make sure to update blk_rq_init() and
127 * especially blk_mq_rq_ctx_init() to take care of the added fields.
1da177e4
LT
128 */
129struct request {
165125e1 130 struct request_queue *q;
320ae51f 131 struct blk_mq_ctx *mq_ctx;
ea4f995e 132 struct blk_mq_hw_ctx *mq_hctx;
e6a1c874 133
ef295ecf 134 unsigned int cmd_flags; /* op and common flags */
e8064021 135 req_flags_t rq_flags;
d486f1f2 136
2f578aaf 137 int tag;
d486f1f2
JA
138 int internal_tag;
139
a2dec7b3 140 /* the following two fields are internal, NEVER access directly */
a2dec7b3 141 unsigned int __data_len; /* total data len */
181fdde3 142 sector_t __sector; /* sector cursor */
1da177e4
LT
143
144 struct bio *bio;
145 struct bio *biotail;
146
7c3fb70f
JA
147 struct list_head queuelist;
148
360f92c2
JA
149 /*
150 * The hash is used inside the scheduler, and killed once the
151 * request reaches the dispatch list. The ipi_list is only used
152 * to queue the request for softirq completion, which is long
153 * after the request has been unhashed (and even removed from
154 * the dispatch list).
155 */
156 union {
157 struct hlist_node hash; /* merge hash */
158 struct list_head ipi_list;
159 };
160
e6a1c874
JA
161 /*
162 * The rb_node is only used inside the io scheduler, requests
163 * are pruned when moved to the dispatch queue. So let the
c186794d 164 * completion_data share space with the rb_node.
e6a1c874
JA
165 */
166 union {
167 struct rb_node rb_node; /* sort/lookup */
f9d03f96 168 struct bio_vec special_vec;
c186794d 169 void *completion_data;
e26738e0 170 int error_count; /* for legacy drivers, don't use */
e6a1c874 171 };
9817064b 172
ff7d145f 173 /*
7f1dc8a2 174 * Three pointers are available for the IO schedulers, if they need
c186794d
MS
175 * more they have to dynamically allocate it. Flush requests are
176 * never put on the IO scheduler. So let the flush fields share
a612fddf 177 * space with the elevator data.
ff7d145f 178 */
c186794d 179 union {
a612fddf
TH
180 struct {
181 struct io_cq *icq;
182 void *priv[2];
183 } elv;
184
c186794d
MS
185 struct {
186 unsigned int seq;
187 struct list_head list;
4853abaa 188 rq_end_io_fn *saved_end_io;
c186794d
MS
189 } flush;
190 };
ff7d145f 191
8f34ee75 192 struct gendisk *rq_disk;
09e099d4 193 struct hd_struct *part;
6f816b4b
TH
194#ifdef CONFIG_BLK_RQ_ALLOC_TIME
195 /* Time that the first bio started allocating this request. */
196 u64 alloc_time_ns;
197#endif
198 /* Time that this request was allocated for this IO. */
522a7775 199 u64 start_time_ns;
544ccc8d
OS
200 /* Time that I/O was submitted to the device. */
201 u64 io_start_time_ns;
202
203#ifdef CONFIG_BLK_WBT
204 unsigned short wbt_flags;
205#endif
3d244306
HT
206 /*
207 * rq sectors used for blk stats. It has the same value
208 * with blk_rq_sectors(rq), except that it never be zeroed
209 * by completion.
210 */
211 unsigned short stats_sectors;
544ccc8d
OS
212
213 /*
214 * Number of scatter-gather DMA addr+len pairs after
1da177e4
LT
215 * physical address coalescing is performed.
216 */
217 unsigned short nr_phys_segments;
7c3fb70f 218
13f05c8d
MP
219#if defined(CONFIG_BLK_DEV_INTEGRITY)
220 unsigned short nr_integrity_segments;
221#endif
1da177e4 222
a892c8d5
ST
223#ifdef CONFIG_BLK_INLINE_ENCRYPTION
224 struct bio_crypt_ctx *crypt_ctx;
225 struct blk_ksm_keyslot *crypt_keyslot;
226#endif
227
7c3fb70f 228 unsigned short write_hint;
8f34ee75
JA
229 unsigned short ioprio;
230
12f5b931
KB
231 enum mq_rq_state state;
232 refcount_t ref;
1d9bd516 233
0b7576d8 234 unsigned int timeout;
079076b3 235 unsigned long deadline;
cb6934f8 236
7c3fb70f 237 union {
0a4b6e2f 238 struct __call_single_data csd;
7c3fb70f
JA
239 u64 fifo_time;
240 };
241
1da177e4 242 /*
c00895ab 243 * completion callback.
1da177e4
LT
244 */
245 rq_end_io_fn *end_io;
246 void *end_io_data;
247};
248
14cb0dc6
ML
249static inline bool blk_op_is_scsi(unsigned int op)
250{
251 return op == REQ_OP_SCSI_IN || op == REQ_OP_SCSI_OUT;
252}
253
254static inline bool blk_op_is_private(unsigned int op)
255{
256 return op == REQ_OP_DRV_IN || op == REQ_OP_DRV_OUT;
257}
258
aebf526b
CH
259static inline bool blk_rq_is_scsi(struct request *rq)
260{
14cb0dc6 261 return blk_op_is_scsi(req_op(rq));
aebf526b
CH
262}
263
264static inline bool blk_rq_is_private(struct request *rq)
265{
14cb0dc6 266 return blk_op_is_private(req_op(rq));
aebf526b
CH
267}
268
57292b58
CH
269static inline bool blk_rq_is_passthrough(struct request *rq)
270{
aebf526b 271 return blk_rq_is_scsi(rq) || blk_rq_is_private(rq);
57292b58
CH
272}
273
14cb0dc6
ML
274static inline bool bio_is_passthrough(struct bio *bio)
275{
276 unsigned op = bio_op(bio);
277
278 return blk_op_is_scsi(op) || blk_op_is_private(op);
279}
280
766ca442
FLVC
281static inline unsigned short req_get_ioprio(struct request *req)
282{
283 return req->ioprio;
284}
285
1da177e4
LT
286#include <linux/elevator.h>
287
320ae51f
JA
288struct blk_queue_ctx;
289
1da177e4 290struct bio_vec;
1da177e4 291
242f9dcb 292enum blk_eh_timer_return {
88b0cfad
CH
293 BLK_EH_DONE, /* drivers has completed the command */
294 BLK_EH_RESET_TIMER, /* reset timer and try again */
242f9dcb
JA
295};
296
1da177e4
LT
297enum blk_queue_state {
298 Queue_down,
299 Queue_up,
300};
301
ee1b6f7a
SL
302#define BLK_TAG_ALLOC_FIFO 0 /* allocate starting from 0 */
303#define BLK_TAG_ALLOC_RR 1 /* allocate starting from last allocated tag */
1da177e4 304
abf54393
FT
305#define BLK_SCSI_MAX_CMDS (256)
306#define BLK_SCSI_CMD_PER_LONG (BLK_SCSI_MAX_CMDS / (sizeof(long) * 8))
307
797476b8
DLM
308/*
309 * Zoned block device models (zoned limit).
3093a479
CH
310 *
311 * Note: This needs to be ordered from the least to the most severe
312 * restrictions for the inheritance in blk_stack_limits() to work.
797476b8
DLM
313 */
314enum blk_zoned_model {
3093a479
CH
315 BLK_ZONED_NONE = 0, /* Regular block device */
316 BLK_ZONED_HA, /* Host-aware zoned block device */
317 BLK_ZONED_HM, /* Host-managed zoned block device */
797476b8
DLM
318};
319
025146e1
MP
320struct queue_limits {
321 unsigned long bounce_pfn;
322 unsigned long seg_boundary_mask;
03100aad 323 unsigned long virt_boundary_mask;
025146e1
MP
324
325 unsigned int max_hw_sectors;
ca369d51 326 unsigned int max_dev_sectors;
762380ad 327 unsigned int chunk_sectors;
025146e1
MP
328 unsigned int max_sectors;
329 unsigned int max_segment_size;
c72758f3 330 unsigned int physical_block_size;
ad6bf88a 331 unsigned int logical_block_size;
c72758f3
MP
332 unsigned int alignment_offset;
333 unsigned int io_min;
334 unsigned int io_opt;
67efc925 335 unsigned int max_discard_sectors;
0034af03 336 unsigned int max_hw_discard_sectors;
4363ac7c 337 unsigned int max_write_same_sectors;
a6f0788e 338 unsigned int max_write_zeroes_sectors;
0512a75b 339 unsigned int max_zone_append_sectors;
86b37281
MP
340 unsigned int discard_granularity;
341 unsigned int discard_alignment;
025146e1 342
8a78362c 343 unsigned short max_segments;
13f05c8d 344 unsigned short max_integrity_segments;
1e739730 345 unsigned short max_discard_segments;
025146e1 346
c72758f3 347 unsigned char misaligned;
86b37281 348 unsigned char discard_misaligned;
c78afc62 349 unsigned char raid_partial_stripes_expensive;
797476b8 350 enum blk_zoned_model zoned;
025146e1
MP
351};
352
d4100351
CH
353typedef int (*report_zones_cb)(struct blk_zone *zone, unsigned int idx,
354 void *data);
355
6a0cb1bc
HR
356#ifdef CONFIG_BLK_DEV_ZONED
357
d4100351
CH
358#define BLK_ALL_ZONES ((unsigned int)-1)
359int blkdev_report_zones(struct block_device *bdev, sector_t sector,
360 unsigned int nr_zones, report_zones_cb cb, void *data);
9b38bb4b 361unsigned int blkdev_nr_zones(struct gendisk *disk);
6c1b1da5
AJ
362extern int blkdev_zone_mgmt(struct block_device *bdev, enum req_opf op,
363 sector_t sectors, sector_t nr_sectors,
364 gfp_t gfp_mask);
e732671a
DLM
365int blk_revalidate_disk_zones(struct gendisk *disk,
366 void (*update_driver_data)(struct gendisk *disk));
6a0cb1bc 367
3ed05a98
ST
368extern int blkdev_report_zones_ioctl(struct block_device *bdev, fmode_t mode,
369 unsigned int cmd, unsigned long arg);
e876df1f
AJ
370extern int blkdev_zone_mgmt_ioctl(struct block_device *bdev, fmode_t mode,
371 unsigned int cmd, unsigned long arg);
3ed05a98
ST
372
373#else /* CONFIG_BLK_DEV_ZONED */
374
9b38bb4b 375static inline unsigned int blkdev_nr_zones(struct gendisk *disk)
a91e1380
DLM
376{
377 return 0;
378}
bf505456 379
3ed05a98
ST
380static inline int blkdev_report_zones_ioctl(struct block_device *bdev,
381 fmode_t mode, unsigned int cmd,
382 unsigned long arg)
383{
384 return -ENOTTY;
385}
386
e876df1f
AJ
387static inline int blkdev_zone_mgmt_ioctl(struct block_device *bdev,
388 fmode_t mode, unsigned int cmd,
389 unsigned long arg)
3ed05a98
ST
390{
391 return -ENOTTY;
392}
393
6a0cb1bc
HR
394#endif /* CONFIG_BLK_DEV_ZONED */
395
d7b76301 396struct request_queue {
1da177e4 397 struct request *last_merge;
b374d18a 398 struct elevator_queue *elevator;
1da177e4 399
34dbad5d 400 struct blk_queue_stats *stats;
a7905043 401 struct rq_qos *rq_qos;
87760e5e 402
f8a5b122 403 const struct blk_mq_ops *mq_ops;
320ae51f 404
320ae51f 405 /* sw queues */
e6cdb092 406 struct blk_mq_ctx __percpu *queue_ctx;
320ae51f 407
d278d4a8
JA
408 unsigned int queue_depth;
409
320ae51f
JA
410 /* hw dispatch queues */
411 struct blk_mq_hw_ctx **queue_hw_ctx;
412 unsigned int nr_hw_queues;
413
dc3b17cc 414 struct backing_dev_info *backing_dev_info;
1da177e4
LT
415
416 /*
417 * The queue owner gets to use this for whatever they like.
418 * ll_rw_blk doesn't touch it.
419 */
420 void *queuedata;
421
1da177e4 422 /*
d7b76301 423 * various queue flags, see QUEUE_* below
1da177e4 424 */
d7b76301 425 unsigned long queue_flags;
cd84a62e
BVA
426 /*
427 * Number of contexts that have called blk_set_pm_only(). If this
428 * counter is above zero then only RQF_PM and RQF_PREEMPT requests are
429 * processed.
430 */
431 atomic_t pm_only;
1da177e4 432
a73f730d
TH
433 /*
434 * ida allocated id for this queue. Used to index queues from
435 * ioctx.
436 */
437 int id;
438
1da177e4 439 /*
d7b76301 440 * queue needs bounce pages for pages above this limit
1da177e4 441 */
d7b76301 442 gfp_t bounce_gfp;
1da177e4 443
0d945c1f 444 spinlock_t queue_lock;
1da177e4
LT
445
446 /*
447 * queue kobject
448 */
449 struct kobject kobj;
450
320ae51f
JA
451 /*
452 * mq queue kobject
453 */
1db4909e 454 struct kobject *mq_kobj;
320ae51f 455
ac6fc48c
DW
456#ifdef CONFIG_BLK_DEV_INTEGRITY
457 struct blk_integrity integrity;
458#endif /* CONFIG_BLK_DEV_INTEGRITY */
459
47fafbc7 460#ifdef CONFIG_PM
6c954667 461 struct device *dev;
db04e18d 462 enum rpm_status rpm_status;
6c954667
LM
463 unsigned int nr_pending;
464#endif
465
1da177e4
LT
466 /*
467 * queue settings
468 */
469 unsigned long nr_requests; /* Max # of requests */
1da177e4 470
e3790c7d 471 unsigned int dma_pad_mask;
1da177e4
LT
472 unsigned int dma_alignment;
473
1b262839
ST
474#ifdef CONFIG_BLK_INLINE_ENCRYPTION
475 /* Inline crypto capabilities */
476 struct blk_keyslot_manager *ksm;
477#endif
478
242f9dcb 479 unsigned int rq_timeout;
64f1c21e 480 int poll_nsec;
34dbad5d
OS
481
482 struct blk_stat_callback *poll_cb;
0206319f 483 struct blk_rq_stat poll_stat[BLK_MQ_POLL_STATS_BKTS];
34dbad5d 484
242f9dcb 485 struct timer_list timeout;
287922eb 486 struct work_struct timeout_work;
242f9dcb 487
a612fddf 488 struct list_head icq_list;
4eef3049 489#ifdef CONFIG_BLK_CGROUP
a2b1693b 490 DECLARE_BITMAP (blkcg_pols, BLKCG_MAX_POLS);
3c798398 491 struct blkcg_gq *root_blkg;
03aa264a 492 struct list_head blkg_list;
4eef3049 493#endif
a612fddf 494
025146e1
MP
495 struct queue_limits limits;
496
68c43f13
DLM
497 unsigned int required_elevator_features;
498
6a5ac984 499#ifdef CONFIG_BLK_DEV_ZONED
6cc77e9c
CH
500 /*
501 * Zoned block device information for request dispatch control.
502 * nr_zones is the total number of zones of the device. This is always
f216fdd7
CH
503 * 0 for regular block devices. conv_zones_bitmap is a bitmap of nr_zones
504 * bits which indicates if a zone is conventional (bit set) or
505 * sequential (bit clear). seq_zones_wlock is a bitmap of nr_zones
6cc77e9c
CH
506 * bits which indicates if a zone is write locked, that is, if a write
507 * request targeting the zone was dispatched. All three fields are
508 * initialized by the low level device driver (e.g. scsi/sd.c).
509 * Stacking drivers (device mappers) may or may not initialize
510 * these fields.
ccce20fc
BVA
511 *
512 * Reads of this information must be protected with blk_queue_enter() /
513 * blk_queue_exit(). Modifying this information is only allowed while
514 * no requests are being processed. See also blk_mq_freeze_queue() and
515 * blk_mq_unfreeze_queue().
6cc77e9c
CH
516 */
517 unsigned int nr_zones;
f216fdd7 518 unsigned long *conv_zones_bitmap;
6cc77e9c 519 unsigned long *seq_zones_wlock;
e15864f8 520 unsigned int max_open_zones;
659bf827 521 unsigned int max_active_zones;
6a5ac984 522#endif /* CONFIG_BLK_DEV_ZONED */
6cc77e9c 523
1da177e4
LT
524 /*
525 * sg stuff
526 */
527 unsigned int sg_timeout;
528 unsigned int sg_reserved_size;
1946089a 529 int node;
85e0cbbb 530 struct mutex debugfs_mutex;
6c5c9341 531#ifdef CONFIG_BLK_DEV_IO_TRACE
c780e86d 532 struct blk_trace __rcu *blk_trace;
6c5c9341 533#endif
1da177e4 534 /*
4913efe4 535 * for flush operations
1da177e4 536 */
7c94e1c1 537 struct blk_flush_queue *fq;
483f4afc 538
6fca6a61
CH
539 struct list_head requeue_list;
540 spinlock_t requeue_lock;
2849450a 541 struct delayed_work requeue_work;
6fca6a61 542
483f4afc 543 struct mutex sysfs_lock;
cecf5d87 544 struct mutex sysfs_dir_lock;
d351af01 545
2f8f1336
ML
546 /*
547 * for reusing dead hctx instance in case of updating
548 * nr_hw_queues
549 */
550 struct list_head unused_hctx_list;
551 spinlock_t unused_hctx_lock;
552
7996a8b5 553 int mq_freeze_depth;
d732580b 554
d351af01
FT
555#if defined(CONFIG_BLK_DEV_BSG)
556 struct bsg_class_device bsg_dev;
557#endif
e43473b7
VG
558
559#ifdef CONFIG_BLK_DEV_THROTTLING
560 /* Throttle data */
561 struct throtl_data *td;
562#endif
548bc8e1 563 struct rcu_head rcu_head;
320ae51f 564 wait_queue_head_t mq_freeze_wq;
7996a8b5
BL
565 /*
566 * Protect concurrent access to q_usage_counter by
567 * percpu_ref_kill() and percpu_ref_reinit().
568 */
569 struct mutex mq_freeze_lock;
3ef28e83 570 struct percpu_ref q_usage_counter;
0d2602ca
JA
571
572 struct blk_mq_tag_set *tag_set;
573 struct list_head tag_set_list;
338aa96d 574 struct bio_set bio_split;
4593fdbe 575
07e4fead 576 struct dentry *debugfs_dir;
85e0cbbb
LC
577
578#ifdef CONFIG_BLK_DEBUG_FS
d332ce09 579 struct dentry *sched_debugfs_dir;
cc56694f 580 struct dentry *rqos_debugfs_dir;
07e4fead
OS
581#endif
582
4593fdbe 583 bool mq_sysfs_init_done;
6d247d7f
CH
584
585 size_t cmd_size;
dc9edc44 586
f793dfd3
JA
587#define BLK_MAX_WRITE_HINTS 5
588 u64 write_hints[BLK_MAX_WRITE_HINTS];
1da177e4
LT
589};
590
bfe373f6 591/* Keep blk_queue_flag_name[] in sync with the definitions below */
eca7abf3
JA
592#define QUEUE_FLAG_STOPPED 0 /* queue is stopped */
593#define QUEUE_FLAG_DYING 1 /* queue being torn down */
eca7abf3
JA
594#define QUEUE_FLAG_NOMERGES 3 /* disable merge attempts */
595#define QUEUE_FLAG_SAME_COMP 4 /* complete on same CPU-group */
596#define QUEUE_FLAG_FAIL_IO 5 /* fake timeout */
597#define QUEUE_FLAG_NONROT 6 /* non-rotational device (SSD) */
598#define QUEUE_FLAG_VIRT QUEUE_FLAG_NONROT /* paravirt device */
599#define QUEUE_FLAG_IO_STAT 7 /* do disk/partitions IO accounting */
600#define QUEUE_FLAG_DISCARD 8 /* supports DISCARD */
601#define QUEUE_FLAG_NOXMERGES 9 /* No extended merges */
602#define QUEUE_FLAG_ADD_RANDOM 10 /* Contributes to random pool */
603#define QUEUE_FLAG_SECERASE 11 /* supports secure erase */
604#define QUEUE_FLAG_SAME_FORCE 12 /* force complete on same CPU */
605#define QUEUE_FLAG_DEAD 13 /* queue tear-down finished */
606#define QUEUE_FLAG_INIT_DONE 14 /* queue is initialized */
eca7abf3
JA
607#define QUEUE_FLAG_POLL 16 /* IO polling enabled if set */
608#define QUEUE_FLAG_WC 17 /* Write back caching */
609#define QUEUE_FLAG_FUA 18 /* device supports FUA writes */
610#define QUEUE_FLAG_DAX 19 /* device supports DAX */
611#define QUEUE_FLAG_STATS 20 /* track IO start and completion times */
612#define QUEUE_FLAG_POLL_STATS 21 /* collecting stats for hybrid polling */
613#define QUEUE_FLAG_REGISTERED 22 /* queue has been registered to a disk */
614#define QUEUE_FLAG_SCSI_PASSTHROUGH 23 /* queue supports SCSI commands */
615#define QUEUE_FLAG_QUIESCED 24 /* queue has been quiesced */
616#define QUEUE_FLAG_PCI_P2PDMA 25 /* device supports PCI p2p requests */
e84e8f06 617#define QUEUE_FLAG_ZONE_RESETALL 26 /* supports Zone Reset All */
6f816b4b 618#define QUEUE_FLAG_RQ_ALLOC_TIME 27 /* record rq->alloc_time_ns */
797e7dbb 619
94eddfbe 620#define QUEUE_FLAG_MQ_DEFAULT ((1 << QUEUE_FLAG_IO_STAT) | \
6e0de611 621 (1 << QUEUE_FLAG_SAME_COMP))
94eddfbe 622
8814ce8a
BVA
623void blk_queue_flag_set(unsigned int flag, struct request_queue *q);
624void blk_queue_flag_clear(unsigned int flag, struct request_queue *q);
625bool blk_queue_flag_test_and_set(unsigned int flag, struct request_queue *q);
8814ce8a 626
1da177e4 627#define blk_queue_stopped(q) test_bit(QUEUE_FLAG_STOPPED, &(q)->queue_flags)
3f3299d5 628#define blk_queue_dying(q) test_bit(QUEUE_FLAG_DYING, &(q)->queue_flags)
c246e80d 629#define blk_queue_dead(q) test_bit(QUEUE_FLAG_DEAD, &(q)->queue_flags)
320ae51f 630#define blk_queue_init_done(q) test_bit(QUEUE_FLAG_INIT_DONE, &(q)->queue_flags)
ac9fafa1 631#define blk_queue_nomerges(q) test_bit(QUEUE_FLAG_NOMERGES, &(q)->queue_flags)
488991e2
AB
632#define blk_queue_noxmerges(q) \
633 test_bit(QUEUE_FLAG_NOXMERGES, &(q)->queue_flags)
a68bbddb 634#define blk_queue_nonrot(q) test_bit(QUEUE_FLAG_NONROT, &(q)->queue_flags)
bc58ba94 635#define blk_queue_io_stat(q) test_bit(QUEUE_FLAG_IO_STAT, &(q)->queue_flags)
e2e1a148 636#define blk_queue_add_random(q) test_bit(QUEUE_FLAG_ADD_RANDOM, &(q)->queue_flags)
c15227de 637#define blk_queue_discard(q) test_bit(QUEUE_FLAG_DISCARD, &(q)->queue_flags)
e84e8f06
CK
638#define blk_queue_zone_resetall(q) \
639 test_bit(QUEUE_FLAG_ZONE_RESETALL, &(q)->queue_flags)
288dab8a
CH
640#define blk_queue_secure_erase(q) \
641 (test_bit(QUEUE_FLAG_SECERASE, &(q)->queue_flags))
163d4baa 642#define blk_queue_dax(q) test_bit(QUEUE_FLAG_DAX, &(q)->queue_flags)
9efc160f
BVA
643#define blk_queue_scsi_passthrough(q) \
644 test_bit(QUEUE_FLAG_SCSI_PASSTHROUGH, &(q)->queue_flags)
49d92c0d
LG
645#define blk_queue_pci_p2pdma(q) \
646 test_bit(QUEUE_FLAG_PCI_P2PDMA, &(q)->queue_flags)
6f816b4b
TH
647#ifdef CONFIG_BLK_RQ_ALLOC_TIME
648#define blk_queue_rq_alloc_time(q) \
649 test_bit(QUEUE_FLAG_RQ_ALLOC_TIME, &(q)->queue_flags)
650#else
651#define blk_queue_rq_alloc_time(q) false
652#endif
1da177e4 653
33659ebb
CH
654#define blk_noretry_request(rq) \
655 ((rq)->cmd_flags & (REQ_FAILFAST_DEV|REQ_FAILFAST_TRANSPORT| \
656 REQ_FAILFAST_DRIVER))
f4560ffe 657#define blk_queue_quiesced(q) test_bit(QUEUE_FLAG_QUIESCED, &(q)->queue_flags)
cd84a62e 658#define blk_queue_pm_only(q) atomic_read(&(q)->pm_only)
0ce91444 659#define blk_queue_fua(q) test_bit(QUEUE_FLAG_FUA, &(q)->queue_flags)
58c898ba 660#define blk_queue_registered(q) test_bit(QUEUE_FLAG_REGISTERED, &(q)->queue_flags)
c9254f2d 661
cd84a62e
BVA
662extern void blk_set_pm_only(struct request_queue *q);
663extern void blk_clear_pm_only(struct request_queue *q);
33659ebb 664
57292b58
CH
665static inline bool blk_account_rq(struct request *rq)
666{
667 return (rq->rq_flags & RQF_STARTED) && !blk_rq_is_passthrough(rq);
668}
33659ebb 669
1da177e4
LT
670#define list_entry_rq(ptr) list_entry((ptr), struct request, queuelist)
671
4e1b2d52 672#define rq_data_dir(rq) (op_is_write(req_op(rq)) ? WRITE : READ)
1da177e4 673
9d9de535
CH
674#define rq_dma_dir(rq) \
675 (op_is_write(req_op(rq)) ? DMA_TO_DEVICE : DMA_FROM_DEVICE)
676
3ab3a031
CH
677#define dma_map_bvec(dev, bv, dir, attrs) \
678 dma_map_page_attrs(dev, (bv)->bv_page, (bv)->bv_offset, (bv)->bv_len, \
679 (dir), (attrs))
680
344e9ffc 681static inline bool queue_is_mq(struct request_queue *q)
49fd524f 682{
a1ce35fa 683 return q->mq_ops;
49fd524f
JA
684}
685
797476b8
DLM
686static inline enum blk_zoned_model
687blk_queue_zoned_model(struct request_queue *q)
688{
689 return q->limits.zoned;
690}
691
692static inline bool blk_queue_is_zoned(struct request_queue *q)
693{
694 switch (blk_queue_zoned_model(q)) {
695 case BLK_ZONED_HA:
696 case BLK_ZONED_HM:
697 return true;
698 default:
699 return false;
700 }
701}
702
113ab72e 703static inline sector_t blk_queue_zone_sectors(struct request_queue *q)
6a0cb1bc
HR
704{
705 return blk_queue_is_zoned(q) ? q->limits.chunk_sectors : 0;
706}
707
6a5ac984 708#ifdef CONFIG_BLK_DEV_ZONED
965b652e
DLM
709static inline unsigned int blk_queue_nr_zones(struct request_queue *q)
710{
711 return blk_queue_is_zoned(q) ? q->nr_zones : 0;
712}
713
6cc77e9c
CH
714static inline unsigned int blk_queue_zone_no(struct request_queue *q,
715 sector_t sector)
716{
717 if (!blk_queue_is_zoned(q))
718 return 0;
719 return sector >> ilog2(q->limits.chunk_sectors);
720}
721
722static inline bool blk_queue_zone_is_seq(struct request_queue *q,
723 sector_t sector)
724{
f216fdd7 725 if (!blk_queue_is_zoned(q))
6cc77e9c 726 return false;
f216fdd7
CH
727 if (!q->conv_zones_bitmap)
728 return true;
729 return !test_bit(blk_queue_zone_no(q, sector), q->conv_zones_bitmap);
6cc77e9c 730}
e15864f8
NC
731
732static inline void blk_queue_max_open_zones(struct request_queue *q,
733 unsigned int max_open_zones)
734{
735 q->max_open_zones = max_open_zones;
736}
737
738static inline unsigned int queue_max_open_zones(const struct request_queue *q)
739{
740 return q->max_open_zones;
741}
659bf827
NC
742
743static inline void blk_queue_max_active_zones(struct request_queue *q,
744 unsigned int max_active_zones)
745{
746 q->max_active_zones = max_active_zones;
747}
748
749static inline unsigned int queue_max_active_zones(const struct request_queue *q)
750{
751 return q->max_active_zones;
752}
965b652e
DLM
753#else /* CONFIG_BLK_DEV_ZONED */
754static inline unsigned int blk_queue_nr_zones(struct request_queue *q)
755{
756 return 0;
757}
02992df8
JT
758static inline bool blk_queue_zone_is_seq(struct request_queue *q,
759 sector_t sector)
760{
761 return false;
762}
763static inline unsigned int blk_queue_zone_no(struct request_queue *q,
764 sector_t sector)
765{
766 return 0;
767}
e15864f8
NC
768static inline unsigned int queue_max_open_zones(const struct request_queue *q)
769{
770 return 0;
771}
659bf827
NC
772static inline unsigned int queue_max_active_zones(const struct request_queue *q)
773{
774 return 0;
775}
6a5ac984 776#endif /* CONFIG_BLK_DEV_ZONED */
6cc77e9c 777
1faa16d2
JA
778static inline bool rq_is_sync(struct request *rq)
779{
ef295ecf 780 return op_is_sync(rq->cmd_flags);
1faa16d2
JA
781}
782
e2a60da7
MP
783static inline bool rq_mergeable(struct request *rq)
784{
57292b58 785 if (blk_rq_is_passthrough(rq))
e2a60da7 786 return false;
1da177e4 787
3a5e02ce
MC
788 if (req_op(rq) == REQ_OP_FLUSH)
789 return false;
790
a6f0788e
CK
791 if (req_op(rq) == REQ_OP_WRITE_ZEROES)
792 return false;
793
0512a75b
KB
794 if (req_op(rq) == REQ_OP_ZONE_APPEND)
795 return false;
796
e2a60da7 797 if (rq->cmd_flags & REQ_NOMERGE_FLAGS)
e8064021
CH
798 return false;
799 if (rq->rq_flags & RQF_NOMERGE_FLAGS)
e2a60da7
MP
800 return false;
801
802 return true;
803}
1da177e4 804
4363ac7c
MP
805static inline bool blk_write_same_mergeable(struct bio *a, struct bio *b)
806{
efbeccdb
CH
807 if (bio_page(a) == bio_page(b) &&
808 bio_offset(a) == bio_offset(b))
4363ac7c
MP
809 return true;
810
811 return false;
812}
813
d278d4a8
JA
814static inline unsigned int blk_queue_depth(struct request_queue *q)
815{
816 if (q->queue_depth)
817 return q->queue_depth;
818
819 return q->nr_requests;
820}
821
1da177e4
LT
822extern unsigned long blk_max_low_pfn, blk_max_pfn;
823
824/*
825 * standard bounce addresses:
826 *
827 * BLK_BOUNCE_HIGH : bounce all highmem pages
828 * BLK_BOUNCE_ANY : don't bounce anything
829 * BLK_BOUNCE_ISA : bounce pages above ISA DMA boundary
830 */
2472892a
AK
831
832#if BITS_PER_LONG == 32
1da177e4 833#define BLK_BOUNCE_HIGH ((u64)blk_max_low_pfn << PAGE_SHIFT)
2472892a
AK
834#else
835#define BLK_BOUNCE_HIGH -1ULL
836#endif
837#define BLK_BOUNCE_ANY (-1ULL)
bfe17231 838#define BLK_BOUNCE_ISA (DMA_BIT_MASK(24))
1da177e4 839
3d6392cf
JA
840/*
841 * default timeout for SG_IO if none specified
842 */
843#define BLK_DEFAULT_SG_TIMEOUT (60 * HZ)
f2f1fa78 844#define BLK_MIN_SG_TIMEOUT (7 * HZ)
3d6392cf 845
152e283f
FT
846struct rq_map_data {
847 struct page **pages;
848 int page_order;
849 int nr_entries;
56c451f4 850 unsigned long offset;
97ae77a1 851 int null_mapped;
ecb554a8 852 int from_user;
152e283f
FT
853};
854
5705f702 855struct req_iterator {
7988613b 856 struct bvec_iter iter;
5705f702
N
857 struct bio *bio;
858};
859
860/* This should not be used directly - use rq_for_each_segment */
1e428079
JA
861#define for_each_bio(_bio) \
862 for (; _bio; _bio = _bio->bi_next)
5705f702 863#define __rq_for_each_bio(_bio, rq) \
1da177e4
LT
864 if ((rq->bio)) \
865 for (_bio = (rq)->bio; _bio; _bio = _bio->bi_next)
866
5705f702
N
867#define rq_for_each_segment(bvl, _rq, _iter) \
868 __rq_for_each_bio(_iter.bio, _rq) \
7988613b 869 bio_for_each_segment(bvl, _iter.bio, _iter.iter)
5705f702 870
d18d9174
ML
871#define rq_for_each_bvec(bvl, _rq, _iter) \
872 __rq_for_each_bio(_iter.bio, _rq) \
873 bio_for_each_bvec(bvl, _iter.bio, _iter.iter)
874
4550dd6c 875#define rq_iter_last(bvec, _iter) \
7988613b 876 (_iter.bio->bi_next == NULL && \
4550dd6c 877 bio_iter_last(bvec, _iter.iter))
5705f702 878
2d4dc890
IL
879#ifndef ARCH_IMPLEMENTS_FLUSH_DCACHE_PAGE
880# error "You should define ARCH_IMPLEMENTS_FLUSH_DCACHE_PAGE for your platform"
881#endif
882#if ARCH_IMPLEMENTS_FLUSH_DCACHE_PAGE
883extern void rq_flush_dcache_pages(struct request *rq);
884#else
885static inline void rq_flush_dcache_pages(struct request *rq)
886{
887}
888#endif
889
1da177e4
LT
890extern int blk_register_queue(struct gendisk *disk);
891extern void blk_unregister_queue(struct gendisk *disk);
ed00aabd 892blk_qc_t submit_bio_noacct(struct bio *bio);
2a4aa30c 893extern void blk_rq_init(struct request_queue *q, struct request *rq);
1da177e4 894extern void blk_put_request(struct request *);
cd6ce148 895extern struct request *blk_get_request(struct request_queue *, unsigned int op,
ff005a06 896 blk_mq_req_flags_t flags);
ef9e3fac 897extern int blk_lld_busy(struct request_queue *q);
78d8e58a
MS
898extern int blk_rq_prep_clone(struct request *rq, struct request *rq_src,
899 struct bio_set *bs, gfp_t gfp_mask,
900 int (*bio_ctr)(struct bio *, struct bio *, void *),
901 void *data);
902extern void blk_rq_unprep_clone(struct request *rq);
2a842aca 903extern blk_status_t blk_insert_cloned_request(struct request_queue *q,
82124d60 904 struct request *rq);
0abc2a10 905extern int blk_rq_append_bio(struct request *rq, struct bio **bio);
f695ca38 906extern void blk_queue_split(struct bio **);
0bfc96cb 907extern int scsi_verify_blk_ioctl(struct block_device *, unsigned int);
577ebb37
PB
908extern int scsi_cmd_blk_ioctl(struct block_device *, fmode_t,
909 unsigned int, void __user *);
74f3c8af
AV
910extern int scsi_cmd_ioctl(struct request_queue *, struct gendisk *, fmode_t,
911 unsigned int, void __user *);
e915e872
AV
912extern int sg_scsi_ioctl(struct request_queue *, struct gendisk *, fmode_t,
913 struct scsi_ioctl_command __user *);
98aaaec4
AB
914extern int get_sg_io_hdr(struct sg_io_hdr *hdr, const void __user *argp);
915extern int put_sg_io_hdr(const struct sg_io_hdr *hdr, void __user *argp);
3fcfab16 916
9a95e4ef 917extern int blk_queue_enter(struct request_queue *q, blk_mq_req_flags_t flags);
2e6edc95 918extern void blk_queue_exit(struct request_queue *q);
1da177e4 919extern void blk_sync_queue(struct request_queue *q);
a3bce90e 920extern int blk_rq_map_user(struct request_queue *, struct request *,
152e283f
FT
921 struct rq_map_data *, void __user *, unsigned long,
922 gfp_t);
8e5cfc45 923extern int blk_rq_unmap_user(struct bio *);
165125e1
JA
924extern int blk_rq_map_kern(struct request_queue *, struct request *, void *, unsigned int, gfp_t);
925extern int blk_rq_map_user_iov(struct request_queue *, struct request *,
26e49cfc
KO
926 struct rq_map_data *, const struct iov_iter *,
927 gfp_t);
b7819b92 928extern void blk_execute_rq(struct request_queue *, struct gendisk *,
994ca9a1 929 struct request *, int);
165125e1 930extern void blk_execute_rq_nowait(struct request_queue *, struct gendisk *,
15fc858a 931 struct request *, int, rq_end_io_fn *);
6e39b69e 932
e47bc4ed
CK
933/* Helper to convert REQ_OP_XXX to its string format XXX */
934extern const char *blk_op_str(unsigned int op);
935
2a842aca
CH
936int blk_status_to_errno(blk_status_t status);
937blk_status_t errno_to_blk_status(int errno);
938
0a1b8b87 939int blk_poll(struct request_queue *q, blk_qc_t cookie, bool spin);
05229bee 940
165125e1 941static inline struct request_queue *bdev_get_queue(struct block_device *bdev)
1da177e4 942{
ff9ea323 943 return bdev->bd_disk->queue; /* this is never NULL */
1da177e4
LT
944}
945
233bde21
BVA
946/*
947 * The basic unit of block I/O is a sector. It is used in a number of contexts
948 * in Linux (blk, bio, genhd). The size of one sector is 512 = 2**9
949 * bytes. Variables of type sector_t represent an offset or size that is a
950 * multiple of 512 bytes. Hence these two constants.
951 */
952#ifndef SECTOR_SHIFT
953#define SECTOR_SHIFT 9
954#endif
955#ifndef SECTOR_SIZE
956#define SECTOR_SIZE (1 << SECTOR_SHIFT)
957#endif
958
5efccd17 959/*
80a761fd
TH
960 * blk_rq_pos() : the current sector
961 * blk_rq_bytes() : bytes left in the entire request
962 * blk_rq_cur_bytes() : bytes left in the current segment
963 * blk_rq_err_bytes() : bytes left till the next error boundary
964 * blk_rq_sectors() : sectors left in the entire request
965 * blk_rq_cur_sectors() : sectors left in the current segment
3d244306 966 * blk_rq_stats_sectors() : sectors of the entire request used for stats
5efccd17 967 */
5b93629b
TH
968static inline sector_t blk_rq_pos(const struct request *rq)
969{
a2dec7b3 970 return rq->__sector;
2e46e8b2
TH
971}
972
973static inline unsigned int blk_rq_bytes(const struct request *rq)
974{
a2dec7b3 975 return rq->__data_len;
5b93629b
TH
976}
977
2e46e8b2
TH
978static inline int blk_rq_cur_bytes(const struct request *rq)
979{
980 return rq->bio ? bio_cur_bytes(rq->bio) : 0;
981}
5efccd17 982
80a761fd
TH
983extern unsigned int blk_rq_err_bytes(const struct request *rq);
984
5b93629b
TH
985static inline unsigned int blk_rq_sectors(const struct request *rq)
986{
233bde21 987 return blk_rq_bytes(rq) >> SECTOR_SHIFT;
5b93629b
TH
988}
989
990static inline unsigned int blk_rq_cur_sectors(const struct request *rq)
991{
233bde21 992 return blk_rq_cur_bytes(rq) >> SECTOR_SHIFT;
5b93629b
TH
993}
994
3d244306
HT
995static inline unsigned int blk_rq_stats_sectors(const struct request *rq)
996{
997 return rq->stats_sectors;
998}
999
6a5ac984 1000#ifdef CONFIG_BLK_DEV_ZONED
02694e86
CK
1001
1002/* Helper to convert BLK_ZONE_ZONE_XXX to its string format XXX */
1003const char *blk_zone_cond_str(enum blk_zone_cond zone_cond);
1004
6cc77e9c
CH
1005static inline unsigned int blk_rq_zone_no(struct request *rq)
1006{
1007 return blk_queue_zone_no(rq->q, blk_rq_pos(rq));
1008}
1009
1010static inline unsigned int blk_rq_zone_is_seq(struct request *rq)
1011{
1012 return blk_queue_zone_is_seq(rq->q, blk_rq_pos(rq));
1013}
6a5ac984 1014#endif /* CONFIG_BLK_DEV_ZONED */
6cc77e9c 1015
2e3258ec
CH
1016/*
1017 * Some commands like WRITE SAME have a payload or data transfer size which
1018 * is different from the size of the request. Any driver that supports such
1019 * commands using the RQF_SPECIAL_PAYLOAD flag needs to use this helper to
1020 * calculate the data transfer size.
1021 */
1022static inline unsigned int blk_rq_payload_bytes(struct request *rq)
1023{
1024 if (rq->rq_flags & RQF_SPECIAL_PAYLOAD)
1025 return rq->special_vec.bv_len;
1026 return blk_rq_bytes(rq);
1027}
1028
3aef3cae
CH
1029/*
1030 * Return the first full biovec in the request. The caller needs to check that
1031 * there are any bvecs before calling this helper.
1032 */
1033static inline struct bio_vec req_bvec(struct request *rq)
1034{
1035 if (rq->rq_flags & RQF_SPECIAL_PAYLOAD)
1036 return rq->special_vec;
1037 return mp_bvec_iter_bvec(rq->bio->bi_io_vec, rq->bio->bi_iter);
1038}
1039
f31dc1cd 1040static inline unsigned int blk_queue_get_max_sectors(struct request_queue *q,
8fe0d473 1041 int op)
f31dc1cd 1042{
7afafc8a 1043 if (unlikely(op == REQ_OP_DISCARD || op == REQ_OP_SECURE_ERASE))
233bde21
BVA
1044 return min(q->limits.max_discard_sectors,
1045 UINT_MAX >> SECTOR_SHIFT);
f31dc1cd 1046
8fe0d473 1047 if (unlikely(op == REQ_OP_WRITE_SAME))
4363ac7c
MP
1048 return q->limits.max_write_same_sectors;
1049
a6f0788e
CK
1050 if (unlikely(op == REQ_OP_WRITE_ZEROES))
1051 return q->limits.max_write_zeroes_sectors;
1052
f31dc1cd
MP
1053 return q->limits.max_sectors;
1054}
1055
762380ad
JA
1056/*
1057 * Return maximum size of a request at given offset. Only valid for
1058 * file system requests.
1059 */
1060static inline unsigned int blk_max_size_offset(struct request_queue *q,
1061 sector_t offset)
1062{
1063 if (!q->limits.chunk_sectors)
736ed4de 1064 return q->limits.max_sectors;
762380ad 1065
15bfd21f
KB
1066 return min(q->limits.max_sectors, (unsigned int)(q->limits.chunk_sectors -
1067 (offset & (q->limits.chunk_sectors - 1))));
762380ad
JA
1068}
1069
17007f39
DLM
1070static inline unsigned int blk_rq_get_max_sectors(struct request *rq,
1071 sector_t offset)
f31dc1cd
MP
1072{
1073 struct request_queue *q = rq->q;
1074
57292b58 1075 if (blk_rq_is_passthrough(rq))
f31dc1cd
MP
1076 return q->limits.max_hw_sectors;
1077
7afafc8a
AH
1078 if (!q->limits.chunk_sectors ||
1079 req_op(rq) == REQ_OP_DISCARD ||
1080 req_op(rq) == REQ_OP_SECURE_ERASE)
8fe0d473 1081 return blk_queue_get_max_sectors(q, req_op(rq));
762380ad 1082
17007f39 1083 return min(blk_max_size_offset(q, offset),
8fe0d473 1084 blk_queue_get_max_sectors(q, req_op(rq)));
f31dc1cd
MP
1085}
1086
75afb352
JN
1087static inline unsigned int blk_rq_count_bios(struct request *rq)
1088{
1089 unsigned int nr_bios = 0;
1090 struct bio *bio;
1091
1092 __rq_for_each_bio(bio, rq)
1093 nr_bios++;
1094
1095 return nr_bios;
1096}
1097
ef71de8b
CH
1098void blk_steal_bios(struct bio_list *list, struct request *rq);
1099
1da177e4 1100/*
2e60e022
TH
1101 * Request completion related functions.
1102 *
1103 * blk_update_request() completes given number of bytes and updates
1104 * the request without completing it.
1da177e4 1105 */
2a842aca 1106extern bool blk_update_request(struct request *rq, blk_status_t error,
2e60e022 1107 unsigned int nr_bytes);
2e60e022 1108
242f9dcb 1109extern void blk_abort_request(struct request *);
ff856bad 1110
1da177e4
LT
1111/*
1112 * Access functions for manipulating queue properties
1113 */
165125e1 1114extern void blk_cleanup_queue(struct request_queue *);
165125e1 1115extern void blk_queue_bounce_limit(struct request_queue *, u64);
086fa5ff 1116extern void blk_queue_max_hw_sectors(struct request_queue *, unsigned int);
762380ad 1117extern void blk_queue_chunk_sectors(struct request_queue *, unsigned int);
8a78362c 1118extern void blk_queue_max_segments(struct request_queue *, unsigned short);
1e739730
CH
1119extern void blk_queue_max_discard_segments(struct request_queue *,
1120 unsigned short);
165125e1 1121extern void blk_queue_max_segment_size(struct request_queue *, unsigned int);
67efc925
CH
1122extern void blk_queue_max_discard_sectors(struct request_queue *q,
1123 unsigned int max_discard_sectors);
4363ac7c
MP
1124extern void blk_queue_max_write_same_sectors(struct request_queue *q,
1125 unsigned int max_write_same_sectors);
a6f0788e
CK
1126extern void blk_queue_max_write_zeroes_sectors(struct request_queue *q,
1127 unsigned int max_write_same_sectors);
ad6bf88a 1128extern void blk_queue_logical_block_size(struct request_queue *, unsigned int);
0512a75b
KB
1129extern void blk_queue_max_zone_append_sectors(struct request_queue *q,
1130 unsigned int max_zone_append_sectors);
892b6f90 1131extern void blk_queue_physical_block_size(struct request_queue *, unsigned int);
c72758f3
MP
1132extern void blk_queue_alignment_offset(struct request_queue *q,
1133 unsigned int alignment);
7c958e32 1134extern void blk_limits_io_min(struct queue_limits *limits, unsigned int min);
c72758f3 1135extern void blk_queue_io_min(struct request_queue *q, unsigned int min);
3c5820c7 1136extern void blk_limits_io_opt(struct queue_limits *limits, unsigned int opt);
c72758f3 1137extern void blk_queue_io_opt(struct request_queue *q, unsigned int opt);
d278d4a8 1138extern void blk_set_queue_depth(struct request_queue *q, unsigned int depth);
e475bba2 1139extern void blk_set_default_limits(struct queue_limits *lim);
b1bd055d 1140extern void blk_set_stacking_limits(struct queue_limits *lim);
c72758f3
MP
1141extern int blk_stack_limits(struct queue_limits *t, struct queue_limits *b,
1142 sector_t offset);
1143extern void disk_stack_limits(struct gendisk *disk, struct block_device *bdev,
1144 sector_t offset);
27f8221a 1145extern void blk_queue_update_dma_pad(struct request_queue *, unsigned int);
165125e1 1146extern void blk_queue_segment_boundary(struct request_queue *, unsigned long);
03100aad 1147extern void blk_queue_virt_boundary(struct request_queue *, unsigned long);
165125e1 1148extern void blk_queue_dma_alignment(struct request_queue *, int);
11c3e689 1149extern void blk_queue_update_dma_alignment(struct request_queue *, int);
242f9dcb 1150extern void blk_queue_rq_timeout(struct request_queue *, unsigned int);
93e9d8e8 1151extern void blk_queue_write_cache(struct request_queue *q, bool enabled, bool fua);
68c43f13
DLM
1152extern void blk_queue_required_elevator_features(struct request_queue *q,
1153 unsigned int features);
45147fb5
YS
1154extern bool blk_queue_can_use_dma_map_merging(struct request_queue *q,
1155 struct device *dev);
1da177e4 1156
1e739730
CH
1157/*
1158 * Number of physical segments as sent to the device.
1159 *
1160 * Normally this is the number of discontiguous data segments sent by the
1161 * submitter. But for data-less command like discard we might have no
1162 * actual data segments submitted, but the driver might have to add it's
1163 * own special payload. In that case we still return 1 here so that this
1164 * special payload will be mapped.
1165 */
f9d03f96
CH
1166static inline unsigned short blk_rq_nr_phys_segments(struct request *rq)
1167{
1168 if (rq->rq_flags & RQF_SPECIAL_PAYLOAD)
1169 return 1;
1170 return rq->nr_phys_segments;
1171}
1172
1e739730
CH
1173/*
1174 * Number of discard segments (or ranges) the driver needs to fill in.
1175 * Each discard bio merged into a request is counted as one segment.
1176 */
1177static inline unsigned short blk_rq_nr_discard_segments(struct request *rq)
1178{
1179 return max_t(unsigned short, rq->nr_phys_segments, 1);
1180}
1181
89de1504
CH
1182int __blk_rq_map_sg(struct request_queue *q, struct request *rq,
1183 struct scatterlist *sglist, struct scatterlist **last_sg);
1184static inline int blk_rq_map_sg(struct request_queue *q, struct request *rq,
1185 struct scatterlist *sglist)
1186{
1187 struct scatterlist *last_sg = NULL;
1188
1189 return __blk_rq_map_sg(q, rq, sglist, &last_sg);
1190}
1da177e4 1191extern void blk_dump_rq_flags(struct request *, char *);
1da177e4 1192
09ac46c4 1193bool __must_check blk_get_queue(struct request_queue *);
c62b37d9 1194struct request_queue *blk_alloc_queue(int node_id);
165125e1 1195extern void blk_put_queue(struct request_queue *);
3f21c265 1196extern void blk_set_queue_dying(struct request_queue *);
1da177e4 1197
1a4dcfa8 1198#ifdef CONFIG_BLOCK
316cc67d 1199/*
75df7136
SJ
1200 * blk_plug permits building a queue of related requests by holding the I/O
1201 * fragments for a short period. This allows merging of sequential requests
1202 * into single larger request. As the requests are moved from a per-task list to
1203 * the device's request_queue in a batch, this results in improved scalability
1204 * as the lock contention for request_queue lock is reduced.
1205 *
1206 * It is ok not to disable preemption when adding the request to the plug list
1207 * or when attempting a merge, because blk_schedule_flush_list() will only flush
1208 * the plug list when the task sleeps by itself. For details, please see
1209 * schedule() where blk_schedule_flush_plug() is called.
316cc67d 1210 */
73c10101 1211struct blk_plug {
320ae51f 1212 struct list_head mq_list; /* blk-mq requests */
75df7136 1213 struct list_head cb_list; /* md requires an unplug callback */
5f0ed774 1214 unsigned short rq_count;
ce5b009c 1215 bool multiple_queues;
5a473e83 1216 bool nowait;
73c10101 1217};
55c022bb 1218#define BLK_MAX_REQUEST_COUNT 16
50d24c34 1219#define BLK_PLUG_FLUSH_SIZE (128 * 1024)
55c022bb 1220
9cbb1750 1221struct blk_plug_cb;
74018dc3 1222typedef void (*blk_plug_cb_fn)(struct blk_plug_cb *, bool);
048c9374
N
1223struct blk_plug_cb {
1224 struct list_head list;
9cbb1750
N
1225 blk_plug_cb_fn callback;
1226 void *data;
048c9374 1227};
9cbb1750
N
1228extern struct blk_plug_cb *blk_check_plugged(blk_plug_cb_fn unplug,
1229 void *data, int size);
73c10101
JA
1230extern void blk_start_plug(struct blk_plug *);
1231extern void blk_finish_plug(struct blk_plug *);
f6603783 1232extern void blk_flush_plug_list(struct blk_plug *, bool);
73c10101
JA
1233
1234static inline void blk_flush_plug(struct task_struct *tsk)
1235{
1236 struct blk_plug *plug = tsk->plug;
1237
a237c1c5
JA
1238 if (plug)
1239 blk_flush_plug_list(plug, false);
1240}
1241
1242static inline void blk_schedule_flush_plug(struct task_struct *tsk)
1243{
1244 struct blk_plug *plug = tsk->plug;
1245
88b996cd 1246 if (plug)
f6603783 1247 blk_flush_plug_list(plug, true);
73c10101
JA
1248}
1249
1250static inline bool blk_needs_flush_plug(struct task_struct *tsk)
1251{
1252 struct blk_plug *plug = tsk->plug;
1253
320ae51f 1254 return plug &&
a1ce35fa 1255 (!list_empty(&plug->mq_list) ||
320ae51f 1256 !list_empty(&plug->cb_list));
73c10101
JA
1257}
1258
1a4dcfa8
CH
1259int blkdev_issue_flush(struct block_device *, gfp_t);
1260long nr_blockdev_pages(void);
1261#else /* CONFIG_BLOCK */
1262struct blk_plug {
1263};
1264
1265static inline void blk_start_plug(struct blk_plug *plug)
1266{
1267}
1268
1269static inline void blk_finish_plug(struct blk_plug *plug)
1270{
1271}
1272
1273static inline void blk_flush_plug(struct task_struct *task)
1274{
1275}
1276
1277static inline void blk_schedule_flush_plug(struct task_struct *task)
1278{
1279}
1280
1281
1282static inline bool blk_needs_flush_plug(struct task_struct *tsk)
1283{
1284 return false;
1285}
1286
1287static inline int blkdev_issue_flush(struct block_device *bdev, gfp_t gfp_mask)
1288{
1289 return 0;
1290}
1291
1292static inline long nr_blockdev_pages(void)
1293{
1294 return 0;
1295}
1296#endif /* CONFIG_BLOCK */
1297
71ac860a
ML
1298extern void blk_io_schedule(void);
1299
ee472d83
CH
1300extern int blkdev_issue_write_same(struct block_device *bdev, sector_t sector,
1301 sector_t nr_sects, gfp_t gfp_mask, struct page *page);
e950fdf7
CH
1302
1303#define BLKDEV_DISCARD_SECURE (1 << 0) /* issue a secure erase */
dd3932ed 1304
fbd9b09a
DM
1305extern int blkdev_issue_discard(struct block_device *bdev, sector_t sector,
1306 sector_t nr_sects, gfp_t gfp_mask, unsigned long flags);
38f25255 1307extern int __blkdev_issue_discard(struct block_device *bdev, sector_t sector,
288dab8a 1308 sector_t nr_sects, gfp_t gfp_mask, int flags,
469e3216 1309 struct bio **biop);
ee472d83
CH
1310
1311#define BLKDEV_ZERO_NOUNMAP (1 << 0) /* do not free blocks */
cb365b96 1312#define BLKDEV_ZERO_NOFALLBACK (1 << 1) /* don't write explicit zeroes */
ee472d83 1313
e73c23ff
CK
1314extern int __blkdev_issue_zeroout(struct block_device *bdev, sector_t sector,
1315 sector_t nr_sects, gfp_t gfp_mask, struct bio **biop,
ee472d83 1316 unsigned flags);
3f14d792 1317extern int blkdev_issue_zeroout(struct block_device *bdev, sector_t sector,
ee472d83
CH
1318 sector_t nr_sects, gfp_t gfp_mask, unsigned flags);
1319
2cf6d26a
CH
1320static inline int sb_issue_discard(struct super_block *sb, sector_t block,
1321 sector_t nr_blocks, gfp_t gfp_mask, unsigned long flags)
fb2dce86 1322{
233bde21
BVA
1323 return blkdev_issue_discard(sb->s_bdev,
1324 block << (sb->s_blocksize_bits -
1325 SECTOR_SHIFT),
1326 nr_blocks << (sb->s_blocksize_bits -
1327 SECTOR_SHIFT),
2cf6d26a 1328 gfp_mask, flags);
fb2dce86 1329}
e6fa0be6 1330static inline int sb_issue_zeroout(struct super_block *sb, sector_t block,
a107e5a3 1331 sector_t nr_blocks, gfp_t gfp_mask)
e6fa0be6
LC
1332{
1333 return blkdev_issue_zeroout(sb->s_bdev,
233bde21
BVA
1334 block << (sb->s_blocksize_bits -
1335 SECTOR_SHIFT),
1336 nr_blocks << (sb->s_blocksize_bits -
1337 SECTOR_SHIFT),
ee472d83 1338 gfp_mask, 0);
e6fa0be6 1339}
1da177e4 1340
f00c4d80 1341extern int blk_verify_command(unsigned char *cmd, fmode_t mode);
0b07de85 1342
eb28d31b
MP
1343enum blk_default_limits {
1344 BLK_MAX_SEGMENTS = 128,
1345 BLK_SAFE_MAX_SECTORS = 255,
d2be537c 1346 BLK_DEF_MAX_SECTORS = 2560,
eb28d31b
MP
1347 BLK_MAX_SEGMENT_SIZE = 65536,
1348 BLK_SEG_BOUNDARY_MASK = 0xFFFFFFFFUL,
1349};
0e435ac2 1350
af2c68fe 1351static inline unsigned long queue_segment_boundary(const struct request_queue *q)
ae03bf63 1352{
025146e1 1353 return q->limits.seg_boundary_mask;
ae03bf63
MP
1354}
1355
af2c68fe 1356static inline unsigned long queue_virt_boundary(const struct request_queue *q)
03100aad
KB
1357{
1358 return q->limits.virt_boundary_mask;
1359}
1360
af2c68fe 1361static inline unsigned int queue_max_sectors(const struct request_queue *q)
ae03bf63 1362{
025146e1 1363 return q->limits.max_sectors;
ae03bf63
MP
1364}
1365
af2c68fe 1366static inline unsigned int queue_max_hw_sectors(const struct request_queue *q)
ae03bf63 1367{
025146e1 1368 return q->limits.max_hw_sectors;
ae03bf63
MP
1369}
1370
af2c68fe 1371static inline unsigned short queue_max_segments(const struct request_queue *q)
ae03bf63 1372{
8a78362c 1373 return q->limits.max_segments;
ae03bf63
MP
1374}
1375
af2c68fe 1376static inline unsigned short queue_max_discard_segments(const struct request_queue *q)
1e739730
CH
1377{
1378 return q->limits.max_discard_segments;
1379}
1380
af2c68fe 1381static inline unsigned int queue_max_segment_size(const struct request_queue *q)
ae03bf63 1382{
025146e1 1383 return q->limits.max_segment_size;
ae03bf63
MP
1384}
1385
0512a75b
KB
1386static inline unsigned int queue_max_zone_append_sectors(const struct request_queue *q)
1387{
1388 return q->limits.max_zone_append_sectors;
1389}
1390
ad6bf88a 1391static inline unsigned queue_logical_block_size(const struct request_queue *q)
1da177e4
LT
1392{
1393 int retval = 512;
1394
025146e1
MP
1395 if (q && q->limits.logical_block_size)
1396 retval = q->limits.logical_block_size;
1da177e4
LT
1397
1398 return retval;
1399}
1400
ad6bf88a 1401static inline unsigned int bdev_logical_block_size(struct block_device *bdev)
1da177e4 1402{
e1defc4f 1403 return queue_logical_block_size(bdev_get_queue(bdev));
1da177e4
LT
1404}
1405
af2c68fe 1406static inline unsigned int queue_physical_block_size(const struct request_queue *q)
c72758f3
MP
1407{
1408 return q->limits.physical_block_size;
1409}
1410
892b6f90 1411static inline unsigned int bdev_physical_block_size(struct block_device *bdev)
ac481c20
MP
1412{
1413 return queue_physical_block_size(bdev_get_queue(bdev));
1414}
1415
af2c68fe 1416static inline unsigned int queue_io_min(const struct request_queue *q)
c72758f3
MP
1417{
1418 return q->limits.io_min;
1419}
1420
ac481c20
MP
1421static inline int bdev_io_min(struct block_device *bdev)
1422{
1423 return queue_io_min(bdev_get_queue(bdev));
1424}
1425
af2c68fe 1426static inline unsigned int queue_io_opt(const struct request_queue *q)
c72758f3
MP
1427{
1428 return q->limits.io_opt;
1429}
1430
ac481c20
MP
1431static inline int bdev_io_opt(struct block_device *bdev)
1432{
1433 return queue_io_opt(bdev_get_queue(bdev));
1434}
1435
af2c68fe 1436static inline int queue_alignment_offset(const struct request_queue *q)
c72758f3 1437{
ac481c20 1438 if (q->limits.misaligned)
c72758f3
MP
1439 return -1;
1440
ac481c20 1441 return q->limits.alignment_offset;
c72758f3
MP
1442}
1443
e03a72e1 1444static inline int queue_limit_alignment_offset(struct queue_limits *lim, sector_t sector)
81744ee4
MP
1445{
1446 unsigned int granularity = max(lim->physical_block_size, lim->io_min);
233bde21
BVA
1447 unsigned int alignment = sector_div(sector, granularity >> SECTOR_SHIFT)
1448 << SECTOR_SHIFT;
81744ee4 1449
b8839b8c 1450 return (granularity + lim->alignment_offset - alignment) % granularity;
c72758f3
MP
1451}
1452
ac481c20
MP
1453static inline int bdev_alignment_offset(struct block_device *bdev)
1454{
1455 struct request_queue *q = bdev_get_queue(bdev);
1456
1457 if (q->limits.misaligned)
1458 return -1;
ac481c20 1459 if (bdev != bdev->bd_contains)
7b8917f5
CH
1460 return queue_limit_alignment_offset(&q->limits,
1461 bdev->bd_part->start_sect);
ac481c20
MP
1462 return q->limits.alignment_offset;
1463}
1464
af2c68fe 1465static inline int queue_discard_alignment(const struct request_queue *q)
86b37281
MP
1466{
1467 if (q->limits.discard_misaligned)
1468 return -1;
1469
1470 return q->limits.discard_alignment;
1471}
1472
e03a72e1 1473static inline int queue_limit_discard_alignment(struct queue_limits *lim, sector_t sector)
86b37281 1474{
59771079 1475 unsigned int alignment, granularity, offset;
dd3d145d 1476
a934a00a
MP
1477 if (!lim->max_discard_sectors)
1478 return 0;
1479
59771079 1480 /* Why are these in bytes, not sectors? */
233bde21
BVA
1481 alignment = lim->discard_alignment >> SECTOR_SHIFT;
1482 granularity = lim->discard_granularity >> SECTOR_SHIFT;
59771079
LT
1483 if (!granularity)
1484 return 0;
1485
1486 /* Offset of the partition start in 'granularity' sectors */
1487 offset = sector_div(sector, granularity);
1488
1489 /* And why do we do this modulus *again* in blkdev_issue_discard()? */
1490 offset = (granularity + alignment - offset) % granularity;
1491
1492 /* Turn it back into bytes, gaah */
233bde21 1493 return offset << SECTOR_SHIFT;
86b37281
MP
1494}
1495
c6e66634
PB
1496static inline int bdev_discard_alignment(struct block_device *bdev)
1497{
1498 struct request_queue *q = bdev_get_queue(bdev);
1499
1500 if (bdev != bdev->bd_contains)
7cf34d97
CH
1501 return queue_limit_discard_alignment(&q->limits,
1502 bdev->bd_part->start_sect);
c6e66634
PB
1503 return q->limits.discard_alignment;
1504}
1505
4363ac7c
MP
1506static inline unsigned int bdev_write_same(struct block_device *bdev)
1507{
1508 struct request_queue *q = bdev_get_queue(bdev);
1509
1510 if (q)
1511 return q->limits.max_write_same_sectors;
1512
1513 return 0;
1514}
1515
a6f0788e
CK
1516static inline unsigned int bdev_write_zeroes_sectors(struct block_device *bdev)
1517{
1518 struct request_queue *q = bdev_get_queue(bdev);
1519
1520 if (q)
1521 return q->limits.max_write_zeroes_sectors;
1522
1523 return 0;
1524}
1525
797476b8
DLM
1526static inline enum blk_zoned_model bdev_zoned_model(struct block_device *bdev)
1527{
1528 struct request_queue *q = bdev_get_queue(bdev);
1529
1530 if (q)
1531 return blk_queue_zoned_model(q);
1532
1533 return BLK_ZONED_NONE;
1534}
1535
1536static inline bool bdev_is_zoned(struct block_device *bdev)
1537{
1538 struct request_queue *q = bdev_get_queue(bdev);
1539
1540 if (q)
1541 return blk_queue_is_zoned(q);
1542
1543 return false;
1544}
1545
113ab72e 1546static inline sector_t bdev_zone_sectors(struct block_device *bdev)
6a0cb1bc
HR
1547{
1548 struct request_queue *q = bdev_get_queue(bdev);
1549
1550 if (q)
f99e8648 1551 return blk_queue_zone_sectors(q);
6cc77e9c
CH
1552 return 0;
1553}
6a0cb1bc 1554
e15864f8
NC
1555static inline unsigned int bdev_max_open_zones(struct block_device *bdev)
1556{
1557 struct request_queue *q = bdev_get_queue(bdev);
1558
1559 if (q)
1560 return queue_max_open_zones(q);
1561 return 0;
1562}
1563
659bf827
NC
1564static inline unsigned int bdev_max_active_zones(struct block_device *bdev)
1565{
1566 struct request_queue *q = bdev_get_queue(bdev);
1567
1568 if (q)
1569 return queue_max_active_zones(q);
1570 return 0;
1571}
1572
af2c68fe 1573static inline int queue_dma_alignment(const struct request_queue *q)
1da177e4 1574{
482eb689 1575 return q ? q->dma_alignment : 511;
1da177e4
LT
1576}
1577
14417799 1578static inline int blk_rq_aligned(struct request_queue *q, unsigned long addr,
87904074
FT
1579 unsigned int len)
1580{
1581 unsigned int alignment = queue_dma_alignment(q) | q->dma_pad_mask;
14417799 1582 return !(addr & alignment) && !(len & alignment);
87904074
FT
1583}
1584
1da177e4
LT
1585/* assumes size > 256 */
1586static inline unsigned int blksize_bits(unsigned int size)
1587{
1588 unsigned int bits = 8;
1589 do {
1590 bits++;
1591 size >>= 1;
1592 } while (size > 256);
1593 return bits;
1594}
1595
2befb9e3 1596static inline unsigned int block_size(struct block_device *bdev)
1da177e4 1597{
6b7b181b 1598 return 1 << bdev->bd_inode->i_blkbits;
1da177e4
LT
1599}
1600
59c3d45e 1601int kblockd_schedule_work(struct work_struct *work);
818cd1cb 1602int kblockd_mod_delayed_work_on(int cpu, struct delayed_work *dwork, unsigned long delay);
1da177e4 1603
1da177e4
LT
1604#define MODULE_ALIAS_BLOCKDEV(major,minor) \
1605 MODULE_ALIAS("block-major-" __stringify(major) "-" __stringify(minor))
1606#define MODULE_ALIAS_BLOCKDEV_MAJOR(major) \
1607 MODULE_ALIAS("block-major-" __stringify(major) "-*")
1608
7ba1ba12
MP
1609#if defined(CONFIG_BLK_DEV_INTEGRITY)
1610
8288f496
MP
1611enum blk_integrity_flags {
1612 BLK_INTEGRITY_VERIFY = 1 << 0,
1613 BLK_INTEGRITY_GENERATE = 1 << 1,
3aec2f41 1614 BLK_INTEGRITY_DEVICE_CAPABLE = 1 << 2,
aae7df50 1615 BLK_INTEGRITY_IP_CHECKSUM = 1 << 3,
8288f496 1616};
7ba1ba12 1617
18593088 1618struct blk_integrity_iter {
7ba1ba12
MP
1619 void *prot_buf;
1620 void *data_buf;
3be91c4a 1621 sector_t seed;
7ba1ba12 1622 unsigned int data_size;
3be91c4a 1623 unsigned short interval;
7ba1ba12
MP
1624 const char *disk_name;
1625};
1626
4e4cbee9 1627typedef blk_status_t (integrity_processing_fn) (struct blk_integrity_iter *);
54d4e6ab
MG
1628typedef void (integrity_prepare_fn) (struct request *);
1629typedef void (integrity_complete_fn) (struct request *, unsigned int);
7ba1ba12 1630
0f8087ec
MP
1631struct blk_integrity_profile {
1632 integrity_processing_fn *generate_fn;
1633 integrity_processing_fn *verify_fn;
54d4e6ab
MG
1634 integrity_prepare_fn *prepare_fn;
1635 integrity_complete_fn *complete_fn;
0f8087ec
MP
1636 const char *name;
1637};
7ba1ba12 1638
25520d55 1639extern void blk_integrity_register(struct gendisk *, struct blk_integrity *);
7ba1ba12 1640extern void blk_integrity_unregister(struct gendisk *);
ad7fce93 1641extern int blk_integrity_compare(struct gendisk *, struct gendisk *);
13f05c8d
MP
1642extern int blk_rq_map_integrity_sg(struct request_queue *, struct bio *,
1643 struct scatterlist *);
1644extern int blk_rq_count_integrity_sg(struct request_queue *, struct bio *);
4eaf99be
MP
1645extern bool blk_integrity_merge_rq(struct request_queue *, struct request *,
1646 struct request *);
1647extern bool blk_integrity_merge_bio(struct request_queue *, struct request *,
1648 struct bio *);
7ba1ba12 1649
25520d55 1650static inline struct blk_integrity *blk_get_integrity(struct gendisk *disk)
b04accc4 1651{
ac6fc48c 1652 struct blk_integrity *bi = &disk->queue->integrity;
25520d55
MP
1653
1654 if (!bi->profile)
1655 return NULL;
1656
1657 return bi;
b04accc4
JA
1658}
1659
25520d55
MP
1660static inline
1661struct blk_integrity *bdev_get_integrity(struct block_device *bdev)
b02739b0 1662{
25520d55 1663 return blk_get_integrity(bdev->bd_disk);
b02739b0
MP
1664}
1665
d145dc23
ST
1666static inline bool
1667blk_integrity_queue_supports_integrity(struct request_queue *q)
1668{
1669 return q->integrity.profile;
1670}
1671
180b2f95 1672static inline bool blk_integrity_rq(struct request *rq)
7ba1ba12 1673{
180b2f95 1674 return rq->cmd_flags & REQ_INTEGRITY;
7ba1ba12
MP
1675}
1676
13f05c8d
MP
1677static inline void blk_queue_max_integrity_segments(struct request_queue *q,
1678 unsigned int segs)
1679{
1680 q->limits.max_integrity_segments = segs;
1681}
1682
1683static inline unsigned short
af2c68fe 1684queue_max_integrity_segments(const struct request_queue *q)
13f05c8d
MP
1685{
1686 return q->limits.max_integrity_segments;
1687}
1688
359f6427
GE
1689/**
1690 * bio_integrity_intervals - Return number of integrity intervals for a bio
1691 * @bi: blk_integrity profile for device
1692 * @sectors: Size of the bio in 512-byte sectors
1693 *
1694 * Description: The block layer calculates everything in 512 byte
1695 * sectors but integrity metadata is done in terms of the data integrity
1696 * interval size of the storage device. Convert the block layer sectors
1697 * to the appropriate number of integrity intervals.
1698 */
1699static inline unsigned int bio_integrity_intervals(struct blk_integrity *bi,
1700 unsigned int sectors)
1701{
1702 return sectors >> (bi->interval_exp - 9);
1703}
1704
1705static inline unsigned int bio_integrity_bytes(struct blk_integrity *bi,
1706 unsigned int sectors)
1707{
1708 return bio_integrity_intervals(bi, sectors) * bi->tuple_size;
1709}
1710
2a876f5e
CH
1711/*
1712 * Return the first bvec that contains integrity data. Only drivers that are
1713 * limited to a single integrity segment should use this helper.
1714 */
1715static inline struct bio_vec *rq_integrity_vec(struct request *rq)
1716{
1717 if (WARN_ON_ONCE(queue_max_integrity_segments(rq->q) > 1))
1718 return NULL;
1719 return rq->bio->bi_integrity->bip_vec;
1720}
1721
7ba1ba12
MP
1722#else /* CONFIG_BLK_DEV_INTEGRITY */
1723
fd83240a
SR
1724struct bio;
1725struct block_device;
1726struct gendisk;
1727struct blk_integrity;
1728
1729static inline int blk_integrity_rq(struct request *rq)
1730{
1731 return 0;
1732}
1733static inline int blk_rq_count_integrity_sg(struct request_queue *q,
1734 struct bio *b)
1735{
1736 return 0;
1737}
1738static inline int blk_rq_map_integrity_sg(struct request_queue *q,
1739 struct bio *b,
1740 struct scatterlist *s)
1741{
1742 return 0;
1743}
1744static inline struct blk_integrity *bdev_get_integrity(struct block_device *b)
1745{
61a04e5b 1746 return NULL;
fd83240a
SR
1747}
1748static inline struct blk_integrity *blk_get_integrity(struct gendisk *disk)
1749{
1750 return NULL;
1751}
d145dc23
ST
1752static inline bool
1753blk_integrity_queue_supports_integrity(struct request_queue *q)
1754{
1755 return false;
1756}
fd83240a
SR
1757static inline int blk_integrity_compare(struct gendisk *a, struct gendisk *b)
1758{
1759 return 0;
1760}
25520d55 1761static inline void blk_integrity_register(struct gendisk *d,
fd83240a
SR
1762 struct blk_integrity *b)
1763{
fd83240a
SR
1764}
1765static inline void blk_integrity_unregister(struct gendisk *d)
1766{
1767}
1768static inline void blk_queue_max_integrity_segments(struct request_queue *q,
1769 unsigned int segs)
1770{
1771}
af2c68fe 1772static inline unsigned short queue_max_integrity_segments(const struct request_queue *q)
fd83240a
SR
1773{
1774 return 0;
1775}
4eaf99be
MP
1776static inline bool blk_integrity_merge_rq(struct request_queue *rq,
1777 struct request *r1,
1778 struct request *r2)
fd83240a 1779{
cb1a5ab6 1780 return true;
fd83240a 1781}
4eaf99be
MP
1782static inline bool blk_integrity_merge_bio(struct request_queue *rq,
1783 struct request *r,
1784 struct bio *b)
fd83240a 1785{
cb1a5ab6 1786 return true;
fd83240a 1787}
25520d55 1788
359f6427
GE
1789static inline unsigned int bio_integrity_intervals(struct blk_integrity *bi,
1790 unsigned int sectors)
1791{
1792 return 0;
1793}
1794
1795static inline unsigned int bio_integrity_bytes(struct blk_integrity *bi,
1796 unsigned int sectors)
1797{
1798 return 0;
1799}
1800
2a876f5e
CH
1801static inline struct bio_vec *rq_integrity_vec(struct request *rq)
1802{
1803 return NULL;
1804}
1805
7ba1ba12
MP
1806#endif /* CONFIG_BLK_DEV_INTEGRITY */
1807
d145dc23
ST
1808#ifdef CONFIG_BLK_INLINE_ENCRYPTION
1809
1810bool blk_ksm_register(struct blk_keyslot_manager *ksm, struct request_queue *q);
1811
1812void blk_ksm_unregister(struct request_queue *q);
1813
1814#else /* CONFIG_BLK_INLINE_ENCRYPTION */
1815
1816static inline bool blk_ksm_register(struct blk_keyslot_manager *ksm,
1817 struct request_queue *q)
1818{
1819 return true;
1820}
1821
1822static inline void blk_ksm_unregister(struct request_queue *q) { }
1823
1824#endif /* CONFIG_BLK_INLINE_ENCRYPTION */
1825
1826
08f85851 1827struct block_device_operations {
c62b37d9 1828 blk_qc_t (*submit_bio) (struct bio *bio);
d4430d62 1829 int (*open) (struct block_device *, fmode_t);
db2a144b 1830 void (*release) (struct gendisk *, fmode_t);
3f289dcb 1831 int (*rw_page)(struct block_device *, sector_t, struct page *, unsigned int);
d4430d62
AV
1832 int (*ioctl) (struct block_device *, fmode_t, unsigned, unsigned long);
1833 int (*compat_ioctl) (struct block_device *, fmode_t, unsigned, unsigned long);
77ea887e
TH
1834 unsigned int (*check_events) (struct gendisk *disk,
1835 unsigned int clearing);
c3e33e04 1836 void (*unlock_native_capacity) (struct gendisk *);
08f85851
AV
1837 int (*revalidate_disk) (struct gendisk *);
1838 int (*getgeo)(struct block_device *, struct hd_geometry *);
b3a27d05
NG
1839 /* this callback is with swap_lock and sometimes page table lock held */
1840 void (*swap_slot_free_notify) (struct block_device *, unsigned long);
e76239a3 1841 int (*report_zones)(struct gendisk *, sector_t sector,
d4100351 1842 unsigned int nr_zones, report_zones_cb cb, void *data);
348e114b 1843 char *(*devnode)(struct gendisk *disk, umode_t *mode);
08f85851 1844 struct module *owner;
bbd3e064 1845 const struct pr_ops *pr_ops;
08f85851
AV
1846};
1847
ee6a129d
AB
1848#ifdef CONFIG_COMPAT
1849extern int blkdev_compat_ptr_ioctl(struct block_device *, fmode_t,
1850 unsigned int, unsigned long);
1851#else
1852#define blkdev_compat_ptr_ioctl NULL
1853#endif
1854
633a08b8
AV
1855extern int __blkdev_driver_ioctl(struct block_device *, fmode_t, unsigned int,
1856 unsigned long);
47a191fd
MW
1857extern int bdev_read_page(struct block_device *, sector_t, struct page *);
1858extern int bdev_write_page(struct block_device *, sector_t, struct page *,
1859 struct writeback_control *);
6cc77e9c
CH
1860
1861#ifdef CONFIG_BLK_DEV_ZONED
1862bool blk_req_needs_zone_write_lock(struct request *rq);
1392d370 1863bool blk_req_zone_write_trylock(struct request *rq);
6cc77e9c
CH
1864void __blk_req_zone_write_lock(struct request *rq);
1865void __blk_req_zone_write_unlock(struct request *rq);
1866
1867static inline void blk_req_zone_write_lock(struct request *rq)
1868{
1869 if (blk_req_needs_zone_write_lock(rq))
1870 __blk_req_zone_write_lock(rq);
1871}
1872
1873static inline void blk_req_zone_write_unlock(struct request *rq)
1874{
1875 if (rq->rq_flags & RQF_ZONE_WRITE_LOCKED)
1876 __blk_req_zone_write_unlock(rq);
1877}
1878
1879static inline bool blk_req_zone_is_write_locked(struct request *rq)
1880{
1881 return rq->q->seq_zones_wlock &&
1882 test_bit(blk_rq_zone_no(rq), rq->q->seq_zones_wlock);
1883}
1884
1885static inline bool blk_req_can_dispatch_to_zone(struct request *rq)
1886{
1887 if (!blk_req_needs_zone_write_lock(rq))
1888 return true;
1889 return !blk_req_zone_is_write_locked(rq);
1890}
1891#else
1892static inline bool blk_req_needs_zone_write_lock(struct request *rq)
1893{
1894 return false;
1895}
1896
1897static inline void blk_req_zone_write_lock(struct request *rq)
1898{
1899}
1900
1901static inline void blk_req_zone_write_unlock(struct request *rq)
1902{
1903}
1904static inline bool blk_req_zone_is_write_locked(struct request *rq)
1905{
1906 return false;
1907}
1908
1909static inline bool blk_req_can_dispatch_to_zone(struct request *rq)
1910{
1911 return true;
1912}
1913#endif /* CONFIG_BLK_DEV_ZONED */
1914
0619317f
JA
1915static inline void blk_wake_io_task(struct task_struct *waiter)
1916{
1917 /*
1918 * If we're polling, the task itself is doing the completions. For
1919 * that case, we don't need to signal a wakeup, it's enough to just
1920 * mark us as RUNNING.
1921 */
1922 if (waiter == current)
1923 __set_current_state(TASK_RUNNING);
1924 else
1925 wake_up_process(waiter);
1926}
1927
956d510e
CH
1928unsigned long disk_start_io_acct(struct gendisk *disk, unsigned int sectors,
1929 unsigned int op);
1930void disk_end_io_acct(struct gendisk *disk, unsigned int op,
1931 unsigned long start_time);
1932
956d510e
CH
1933/**
1934 * bio_start_io_acct - start I/O accounting for bio based drivers
1935 * @bio: bio to start account for
1936 *
1937 * Returns the start time that should be passed back to bio_end_io_acct().
1938 */
1939static inline unsigned long bio_start_io_acct(struct bio *bio)
1940{
1941 return disk_start_io_acct(bio->bi_disk, bio_sectors(bio), bio_op(bio));
1942}
1943
1944/**
1945 * bio_end_io_acct - end I/O accounting for bio based drivers
1946 * @bio: bio to end account for
1947 * @start: start time returned by bio_start_io_acct()
1948 */
1949static inline void bio_end_io_acct(struct bio *bio, unsigned long start_time)
1950{
1951 return disk_end_io_acct(bio->bi_disk, bio_op(bio), start_time);
1952}
956d510e 1953
3f1266f1
CH
1954int bdev_read_only(struct block_device *bdev);
1955int set_blocksize(struct block_device *bdev, int size);
1956
1957const char *bdevname(struct block_device *bdev, char *buffer);
1958struct block_device *lookup_bdev(const char *);
1959
1960void blkdev_show(struct seq_file *seqf, off_t offset);
1961
1962#define BDEVNAME_SIZE 32 /* Largest string for a blockdev identifier */
1963#define BDEVT_SIZE 10 /* Largest string for MAJ:MIN for blkdev */
1964#ifdef CONFIG_BLOCK
1965#define BLKDEV_MAJOR_MAX 512
1966#else
1967#define BLKDEV_MAJOR_MAX 0
1968#endif
1969
1970int blkdev_get(struct block_device *bdev, fmode_t mode, void *holder);
1971struct block_device *blkdev_get_by_path(const char *path, fmode_t mode,
1972 void *holder);
1973struct block_device *blkdev_get_by_dev(dev_t dev, fmode_t mode, void *holder);
ecbe6bc0
CH
1974int bd_prepare_to_claim(struct block_device *bdev, struct block_device *whole,
1975 void *holder);
3f1266f1
CH
1976void bd_abort_claiming(struct block_device *bdev, struct block_device *whole,
1977 void *holder);
1978void blkdev_put(struct block_device *bdev, fmode_t mode);
1979
621c1f42 1980struct block_device *I_BDEV(struct inode *inode);
3f1266f1
CH
1981struct block_device *bdget(dev_t);
1982struct block_device *bdgrab(struct block_device *bdev);
1983void bdput(struct block_device *);
1984
1985#ifdef CONFIG_BLOCK
1986void invalidate_bdev(struct block_device *bdev);
1987int sync_blockdev(struct block_device *bdev);
1988#else
1989static inline void invalidate_bdev(struct block_device *bdev)
1990{
1991}
1992static inline int sync_blockdev(struct block_device *bdev)
1993{
1994 return 0;
1995}
1da177e4 1996#endif
3f1266f1
CH
1997int fsync_bdev(struct block_device *bdev);
1998
1999struct super_block *freeze_bdev(struct block_device *bdev);
2000int thaw_bdev(struct block_device *bdev, struct super_block *sb);
2001
2002#endif /* _LINUX_BLKDEV_H */