t/zbd: add close_zone helper function
[fio.git] / t / zbd / test-zbd-support
... / ...
CommitLineData
1#!/bin/bash
2#
3# Copyright (C) 2018 Western Digital Corporation or its affiliates.
4#
5# This file is released under the GPL.
6
# Print the command-line synopsis followed by one line per supported option.
usage() {
    local opt_line
    local -a opt_lines=(
        "\t-d Run fio with valgrind using DRD tool"
        "\t-e Run fio with valgrind using helgrind tool"
        "\t-v Run fio with valgrind --read-var-info option"
        "\t-l Test with libzbc ioengine"
        "\t-r Reset all zones before test start"
        "\t-w Reset all zones before executing each write test case"
        "\t-o <max_open_zones> Run fio with max_open_zones limit"
        "\t-t <test #> Run only a single test case with specified number"
        "\t-q Quit the test run after any failed test"
        "\t-z Run fio with debug=zbd option"
        "\t-u Use io_uring ioengine in place of libaio"
    )

    echo "Usage: $(basename "$0") [OPTIONS] <test target device file>"
    echo "Options:"
    # echo -e turns the leading "\t" of every entry into a real tab.
    for opt_line in "${opt_lines[@]}"; do
        echo -e "${opt_line}"
    done
}
22
# Print the larger of the two integers $1 and $2 ($2 when they are equal).
max() {
    local larger="$2"

    if [ "$1" -gt "$2" ]; then
        larger="$1"
    fi
    echo "$larger"
}
30
# Print the smaller of the two integers $1 and $2 ($2 when they are equal).
min() {
    local smaller="$2"

    if [ "$1" -lt "$2" ]; then
        smaller="$1"
    fi
    echo "$smaller"
}
38
# Print (without a trailing newline) the fio --ioengine option for the
# requested engine $1. A non-empty $use_libzbc always selects libzbc; a
# non-empty $force_io_uring replaces libaio (and only libaio) with io_uring.
ioengine() {
    local engine="$1"

    if [ -n "$use_libzbc" ]; then
        engine="libzbc"
    elif [ "$1" = "libaio" ] && [ -n "$force_io_uring" ]; then
        engine="io_uring"
    fi
    echo -n "--ioengine=${engine}"
}
48
# Select I/O scheduler $2 for block device $1 (a name under /sys/block).
# The scheduler name is translated between the legacy spelling
# (noop, deadline) and the blk-mq spelling (none, mq-deadline) depending on
# whether /sys/block/$1/mq exists. Returns 1 if the device has no sysfs entry.
set_io_scheduler() {
    local dev=$1 sched=$2
    local sysfs_dir="/sys/block/$dev"

    if [ ! -e "$sysfs_dir" ]; then
        return 1
    fi

    if [ -e "$sysfs_dir/mq" ]; then
        if [ "$sched" = "noop" ]; then
            sched=none
        elif [ "$sched" = "deadline" ]; then
            sched=mq-deadline
        fi
    else
        if [ "$sched" = "none" ]; then
            sched=noop
        elif [ "$sched" = "mq-deadline" ]; then
            sched=deadline
        fi
    fi

    echo "$sched" >"$sysfs_dir/queue/scheduler"
}
67
# Succeed if the byte count that fio_read extracts from the log of the
# current test equals $1. The comparison is also appended to that log.
check_read() {
    local test_log="${logfile}.${test_number}"
    local actual

    actual=$(fio_read <"$test_log")
    echo "read: $actual <> $1" >>"$test_log"
    [ "$actual" = "$1" ]
}
75
# Succeed if the byte count that fio_written extracts from the log of the
# current test equals $1. The comparison is also appended to that log.
check_written() {
    local test_log="${logfile}.${test_number}"
    local actual

    actual=$(fio_written <"$test_log")
    echo "written: $actual <> $1" >>"$test_log"
    [ "$actual" = "$1" ]
}
83
# Compare the reset count from the log file with reset count $2 using operator
# $1 (=, -eq, -ge, -gt, -le, -lt). The comparison is also appended to the log
# of the current test. Returns the status of the comparison.
check_reset_count() {
    local reset_count

    reset_count=$(fio_reset_count <"${logfile}.${test_number}")
    echo "reset_count: test $reset_count $1 $2" >> "${logfile}.${test_number}"
    # The operator and operands are passed to [ as separate words; no eval is
    # needed, so the arguments can never be re-parsed as shell code.
    [ "$reset_count" "$1" "$2" ]
}
93
# Scan the log of test number $1 for failed assertions and crashes. A test
# may otherwise pass even though such an event happened, so it must be failed
# explicitly. Succeeds when the log does not exist or contains neither
# "Assertion " nor "Aborted ".
check_log() {
    local test_log="${logfile}.${1}"

    if [ ! -f "$test_log" ]; then
        return 0
    fi
    ! grep -q -e "Assertion " -e "Aborted " "$test_log"
}
100
# Whether or not $1 (/dev/...) is a SCSI device. When $1 is omitted the global
# $dev is used, which keeps argument-less calls working.
# Returns 0 if a matching /sys/class/scsi_device/*/device/block/<name> entry
# exists, 1 otherwise.
is_scsi_device() {
    local d f

    d=$(basename "${1:-$dev}")
    # An empty name would make the glob below match the bare "block/"
    # directory of any SCSI device.
    [ -n "$d" ] || return 1
    for f in /sys/class/scsi_device/*/device/block/"$d"; do
        [ -e "$f" ] && return 0
    done
    return 1
}
111
# Print the entries of the global array job_var_opts that do not contain the
# string $1. Kept entries are separated by a single space (no trailing
# newline), so a caller that word-splits the output gets one word per option.
job_var_opts_exclude() {
    local o
    local ex_key="${1}"
    local sep=""

    for o in "${job_var_opts[@]}"; do
        # The quoted right-hand side makes =~ a literal substring match.
        if [[ ${o} =~ "${ex_key}" ]]; then
            continue
        fi
        # Without a separator two or more kept options would be fused into
        # one word.
        printf '%s%s' "${sep}" "${o}"
        sep=" "
    done
}
123
# Succeed if any of the arguments contains the string "--max_open_zones".
has_max_open_zones() {
    # Inspect every argument, including the last one: looping only while
    # more than one argument remains would never look at the final argument.
    while (($# > 0)); do
        if [[ ${1} =~ "--max_open_zones" ]]; then
            return 0
        fi
        shift
    done
    return 1
}
133
# Run the fio binary found at ../../fio relative to this script with the
# global options, a fixed set of common options and the caller's arguments.
# The resulting command line is appended to the log of the current test, and
# fio is started through the (possibly empty) dynamic_analyzer command prefix.
run_fio() {
    local fio_bin
    local -a fio_args

    fio_bin=$(dirname "$0")/../../fio

    fio_args=(${global_var_opts[@]})
    fio_args+=("--max-jobs=16" "--aux-path=/tmp" "--allow_file_create=0")
    fio_args+=("--significant_figures=10" "$@")
    # When the max_open_zones option was given to this test script, pass it
    # on to fio unless the test case already specifies it itself.
    if [[ -n ${max_open_zones_opt} ]]; then
        if ! has_max_open_zones "${fio_args[@]}"; then
            fio_args+=("--max_open_zones=${max_open_zones_opt}")
        fi
    fi
    {
        echo
        echo "fio ${fio_args[*]}"
        echo
    } >>"${logfile}.${test_number}"

    "${dynamic_analyzer[@]}" "$fio_bin" "${fio_args[@]}"
}
151
# Run a single fio job against $dev with direct, threaded I/O and a freshly
# drawn 32-bit random seed. All arguments are passed through to fio.
run_one_fio_job() {
    local seed=$(((RANDOM << 16) | RANDOM))
    local -a base_opts=(--name="$dev" --filename="$dev")

    run_fio "${base_opts[@]}" "$@" --randseed="$seed" --thread=1 --direct=1
}
159
# Run two fio jobs in one invocation: a sequential "write_job" that writes $2
# bytes starting at offset $1, followed by a job named after $dev that waits
# for the write job and is configured by the remaining arguments.
write_and_run_one_fio_job() {
    local seed
    local wr_offset="${1}" wr_size="${2}"
    local -a wr_job

    shift 2
    seed=$(((RANDOM << 16) | RANDOM))
    wr_job=(--name="write_job" --rw=write "$(ioengine "psync")")
    wr_job+=(--bs="${min_seq_write_size}" --zonemode=zbd)
    wr_job+=(--zonesize="${zone_size}" --thread=1 --direct=1)
    wr_job+=(--offset="${wr_offset}" --size="${wr_size}")
    wr_job+=("${job_var_opts[@]}")
    run_fio --filename="$dev" --randseed="$seed" "${wr_job[@]}" \
        --name="$dev" --wait_for="write_job" "$@" --thread=1 --direct=1
}
176
# Run fio on the first four sequential zones of the disk. The zone size is
# passed explicitly only when $is_zbd is empty. Extra arguments are appended
# to the fio job options.
run_fio_on_seq() {
    local -a seq_opts=(
        "--offset=$((first_sequential_zone_sector * 512))"
        "--size=$((4 * zone_size))"
        "--zonemode=zbd"
    )

    [ -n "$is_zbd" ] || seq_opts+=("--zonesize=${zone_size}")
    run_one_fio_job "${seq_opts[@]}" "$@"
}
188
# Prepare for a write test by resetting zones. When the reset_before_write or
# max_open_zones option is specified, all zones of the test target are reset
# so that zones outside the range under test hold no open zones. The write
# test can then open zones up to the max_open_zones limit given as option or
# obtained from sysfs. Returns non-zero when no reset was requested or the
# target is not a zoned block device.
prep_write() {
    if [[ -z "${reset_before_write}" && -z "${max_open_zones_opt}" ]]; then
        return 1
    fi
    [[ -n "${is_zbd}" ]] || return 1
    reset_zone "${dev}" -1
}
198
# Status returned by a test case whose requirements are not met.
SKIP_TESTCASE=255
200
# Succeed if $dev is a SCSI device; otherwise set SKIP_REASON and return 1.
require_scsi_dev() {
    is_scsi_device "$dev" && return 0

    SKIP_REASON="$dev is not a SCSI device"
    return 1
}
208
# Succeed if the area in front of the first sequential zone holds at least $1
# bytes; otherwise set SKIP_REASON and return 1.
require_conv_zone_bytes() {
    local req_bytes=${1}

    ((req_bytes > first_sequential_zone_sector * 512)) || return 0

    SKIP_REASON="$dev does not have enough conventional zones"
    return 1
}
218
# Succeed if $is_zbd is non-empty; otherwise set SKIP_REASON and return 1.
require_zbd() {
    [[ -z ${is_zbd} ]] || return 0

    SKIP_REASON="$dev is not a zoned block device"
    return 1
}
226
# Succeed if $is_zbd is empty; otherwise set SKIP_REASON and return 1.
require_regular_block_dev() {
    [[ -n ${is_zbd} ]] || return 0

    SKIP_REASON="$dev is not a regular block device"
    return 1
}
234
# Succeed if $realdev is a block special file; otherwise set SKIP_REASON
# (which names $dev) and return 1.
require_block_dev() {
    if [[ ! -b "$realdev" ]]; then
        SKIP_REASON="$dev is not a block device"
        return 1
    fi
    return 0
}
242
# Succeed if the space from the first sequential zone to the end of the disk
# holds at least $1 zones of zone_size bytes; otherwise set SKIP_REASON and
# return 1.
require_seq_zones() {
    local req_seq_zones=${1}
    local seq_bytes=$((disk_size - first_sequential_zone_sector * 512))

    ((req_seq_zones > seq_bytes / zone_size)) || return 0

    SKIP_REASON="$dev does not have $req_seq_zones sequential zones"
    return 1
}
253
# Succeed if the area in front of the first sequential zone holds at least $1
# zones of zone_size bytes; otherwise set SKIP_REASON and return 1.
require_conv_zones() {
    local req_c_zones=${1}
    local conv_bytes=$((first_sequential_zone_sector * 512))

    ((req_c_zones > conv_bytes / zone_size)) || return 0

    SKIP_REASON="$dev does not have $req_c_zones conventional zones"
    return 1
}
264
# Succeed if the global max_open_zones is 0 or at least $1; otherwise set
# SKIP_REASON and return 1.
require_max_open_zones() {
    local required=${1}

    ((max_open_zones != 0 && max_open_zones < required)) || return 0

    SKIP_REASON="max_open_zones of $dev is smaller than $required"
    return 1
}
274
# Check whether buffered writes are refused for block devices. For a zoned
# device fio must print the "direct I/O is mandatory" message; for any other
# device that message must be absent. A fio exit status other than 0 or 1 is
# returned as-is.
test1() {
    local -a stage_rc

    require_block_dev || return $SKIP_TESTCASE
    run_fio --name=job1 --filename="$dev" --rw=write --direct=0 --bs=4K \
        "$(ioengine "psync")" --size="${zone_size}" --thread=1 \
        --zonemode=zbd --zonesize="${zone_size}" 2>&1 |
        tee -a "${logfile}.${test_number}" |
        grep -q 'Using direct I/O is mandatory for writing to ZBD drives'
    # Snapshot the pipeline statuses: index 0 is fio, index 2 is grep.
    stage_rc=("${PIPESTATUS[@]}")

    if [ "${stage_rc[0]}" != 0 ] && [ "${stage_rc[0]}" != 1 ]; then
        return "${stage_rc[0]}"
    fi
    if [ -n "$is_zbd" ]; then
        [ "${stage_rc[2]}" = 0 ]
    else
        [ "${stage_rc[2]}" != 0 ]
    fi
}
294
# Block size exceeds zone size. fio must fail and report
# "buflen exceeds zone size".
test2() {
    local bs off opts=() rc

    bs=$((2 * zone_size))
    off=$(((first_sequential_zone_sector + 2 * sectors_per_zone) * 512))
    opts=(
        "$(ioengine "psync")"
        "--name=job1" "--filename=$dev" "--rw=write" "--direct=1"
        "--zonemode=zbd" "--offset=$off" "--bs=$bs" "--size=$bs"
    )
    [ -n "$is_zbd" ] || opts+=("--zonesize=${zone_size}")

    # A successful fio run means the oversized block was accepted.
    if run_fio "${opts[@]}" >> "${logfile}.${test_number}" 2>&1; then
        return 1
    fi
    grep -q 'buflen exceeds zone size' "${logfile}.${test_number}"
}
310
# Run fio against an empty zone. This causes fio to report "No I/O performed".
# The test passes when fio succeeds and its log contains no "READ:" line.
test3() {
    # size is declared local so that it does not leak into the global scope;
    # the unused rc local has been dropped.
    local off size opts=()

    require_seq_zones 129 || return $SKIP_TESTCASE
    off=$((first_sequential_zone_sector * 512 + 128 * zone_size))
    size=$((zone_size))
    [ -n "$is_zbd" ] && reset_zone "$dev" $((off / 512))
    opts+=("--name=$dev" "--filename=$dev" "--offset=$off" "--bs=4K")
    opts+=("--size=$size" "--zonemode=zbd")
    opts+=("$(ioengine "psync")" "--rw=read" "--direct=1" "--thread=1")
    if [ -z "$is_zbd" ]; then
        opts+=("--zonesize=${zone_size}")
    fi
    run_fio "${opts[@]}" >> "${logfile}.${test_number}" 2>&1 || return $?
    ! grep -q 'READ:' "${logfile}.${test_number}"
}
328
# Run fio with --read_beyond_wp=1 against an empty zone. The whole zone must
# be reported as read.
test4() {
    # size is declared local so that it does not leak into the global scope.
    local off size opts=()

    require_seq_zones 130 || return $SKIP_TESTCASE
    off=$((first_sequential_zone_sector * 512 + 129 * zone_size))
    size=$((zone_size))
    [ -n "$is_zbd" ] && reset_zone "$dev" $((off / 512))
    opts+=("--name=$dev" "--filename=$dev" "--offset=$off")
    opts+=(--bs="$(min $((min_seq_write_size * 256)) "$size")")
    opts+=("--size=$size" "--thread=1" "--read_beyond_wp=1")
    opts+=("$(ioengine "psync")" "--rw=read" "--direct=1" "--disable_lat=1")
    opts+=("--zonemode=zbd" "--zonesize=${zone_size}")
    run_fio "${opts[@]}" >> "${logfile}.${test_number}" 2>&1 || return $?
    check_read "$size"
}
345
# Sequential write to sequential zones, followed by verification. The amounts
# written and read must both equal the capacity of the four zones.
test5() {
    local size off capacity bs
    local lower_bs

    prep_write
    off=$((first_sequential_zone_sector * 512))
    capacity=$(total_zone_capacity 4 $off $dev)
    size=$((4 * zone_size))
    lower_bs=$(max $((zone_size / 64)) "$min_seq_write_size")
    bs=$(min "$lower_bs" "$zone_cap_bs")
    run_fio_on_seq "$(ioengine "psync")" --iodepth=1 --rw=write \
        --bs="$bs" --do_verify=1 --verify=md5 \
        >>"${logfile}.${test_number}" 2>&1 ||
        return $?
    check_written $capacity || return $?
    check_read $capacity
}
361
# Sequential read from sequential zones. The first four sequential zones are
# written first and then read back; the amount read must equal their capacity.
test6() {
    local size off capacity bs
    local lower_bs
    local -a read_job

    prep_write
    off=$((first_sequential_zone_sector * 512))
    capacity=$(total_zone_capacity 4 $off $dev)
    size=$((4 * zone_size))
    lower_bs=$(max $((zone_size / 64)) "$min_seq_write_size")
    bs=$(min "$lower_bs" "$zone_cap_bs")
    read_job=(--offset="${off}" --size="${size}" --zonemode=zbd)
    read_job+=(--zonesize="${zone_size}" "$(ioengine "psync")")
    read_job+=(--iodepth=1 --rw=read --bs="$bs")
    write_and_run_one_fio_job \
        $((first_sequential_zone_sector * 512)) "${size}" \
        "${read_job[@]}" >>"${logfile}.${test_number}" 2>&1 ||
        return $?
    check_read $capacity
}
379
# Random write to sequential zones, libaio, queue depth 1. One zone worth of
# data is written and verified.
test7() {
    local size=$((zone_size))
    local off capacity
    local -a job

    prep_write
    off=$((first_sequential_zone_sector * 512))
    capacity=$(total_zone_capacity 1 $off $dev)
    job=("$(ioengine "libaio")" --iodepth=1 --rw=randwrite)
    job+=(--bs="$(min 16384 "${zone_size}")")
    job+=(--do_verify=1 --verify=md5 --size="$size")
    run_fio_on_seq "${job[@]}" >>"${logfile}.${test_number}" 2>&1 ||
        return $?
    check_written $capacity || return $?
    check_read $capacity
}
395
# Random write to sequential zones, libaio, queue depth 64. Four zones are
# written and verified.
test8() {
    local size off capacity
    local -a job

    prep_write
    size=$((4 * zone_size))
    off=$((first_sequential_zone_sector * 512))
    capacity=$(total_zone_capacity 4 $off $dev)
    job=("$(ioengine "libaio")" --iodepth=64 --rw=randwrite)
    job+=(--bs="$(min 16384 "${zone_size}")")
    job+=(--do_verify=1 --verify=md5)
    run_fio_on_seq "${job[@]}" >>"${logfile}.${test_number}" 2>&1 ||
        return $?
    check_written $capacity || return $?
    check_read $capacity
}
411
# Random write to sequential zones, sg, queue depth 1. Skipped unless $dev is
# a SCSI device.
test9() {
    local size
    local -a job

    if ! require_scsi_dev; then
        return $SKIP_TESTCASE
    fi

    prep_write
    size=$((4 * zone_size))
    job=(--ioengine=sg --iodepth=1 --rw=randwrite --bs=16K)
    job+=(--do_verify=1 --verify=md5)
    run_fio_on_seq "${job[@]}" >>"${logfile}.${test_number}" 2>&1 ||
        return $?
    check_written $size || return $?
    check_read $size
}
427
# Random write to sequential zones, sg, queue depth 64. Skipped unless $dev
# is a SCSI device.
test10() {
    local size
    local -a job

    if ! require_scsi_dev; then
        return $SKIP_TESTCASE
    fi

    prep_write
    size=$((4 * zone_size))
    job=(--ioengine=sg --iodepth=64 --rw=randwrite --bs=16K)
    job+=(--do_verify=1 --verify=md5)
    run_fio_on_seq "${job[@]}" >>"${logfile}.${test_number}" 2>&1 ||
        return $?
    check_written $size || return $?
    check_read $size
}
443
# Random write to sequential zones, libaio, queue depth 64, random block size
# between 4K and 64K.
test11() {
    local size off capacity
    local -a job

    prep_write
    size=$((4 * zone_size))
    off=$((first_sequential_zone_sector * 512))
    capacity=$(total_zone_capacity 4 $off $dev)
    job=("$(ioengine "libaio")" --iodepth=64 --rw=randwrite)
    job+=(--bsrange=4K-64K --do_verify=1 --verify=md5 --debug=zbd)
    run_fio_on_seq "${job[@]}" >>"${logfile}.${test_number}" 2>&1 ||
        return $?
    check_written $capacity || return $?
    check_read $capacity
}
458
# Random write to sequential zones, libaio, queue depth 64, max 1 open zone.
# All zones are reset first when the target is a zoned block device.
test12() {
    local size off capacity
    local -a job

    if [ -n "$is_zbd" ]; then
        reset_zone "$dev" -1
    fi

    size=$((8 * zone_size))
    off=$((first_sequential_zone_sector * 512))
    capacity=$(total_zone_capacity 8 $off $dev)
    job=("$(ioengine "libaio")" --iodepth=64 --rw=randwrite --bs=16K)
    job+=(--max_open_zones=1 --size=$size --do_verify=1 --verify=md5)
    job+=(--debug=zbd)
    run_fio_on_seq "${job[@]}" >>"${logfile}.${test_number}" 2>&1 ||
        return $?
    check_written $capacity || return $?
    check_read $capacity
}
474
# Random write to sequential zones, libaio, queue depth 64, max 4 open zones.
# Skipped when the device cannot keep four zones open.
test13() {
    local size off capacity
    local -a job

    if ! require_max_open_zones 4; then
        return $SKIP_TESTCASE
    fi

    if [ -n "$is_zbd" ]; then
        reset_zone "$dev" -1
    fi

    size=$((8 * zone_size))
    off=$((first_sequential_zone_sector * 512))
    capacity=$(total_zone_capacity 8 $off $dev)
    job=("$(ioengine "libaio")" --iodepth=64 --rw=randwrite --bs=16K)
    job+=(--max_open_zones=4 --size=$size --do_verify=1 --verify=md5)
    job+=(--debug=zbd)
    run_fio_on_seq "${job[@]}" >>"${logfile}.${test_number}" 2>&1 ||
        return $?
    check_written $capacity || return $?
    check_read $capacity
}
493
# Random write to conventional zones. 16 MiB are written at the offset
# reported for the first online zone and verified. Skipped when the device
# has less than 16 MiB in front of its first sequential zone.
test14() {
    local off size
    # result is local so that it does not leak into the global scope.
    local -a result

    if ! result=($(first_online_zone "$dev")); then
        echo "Failed to determine first online zone"
        exit 1
    fi
    off=${result[0]}
    prep_write
    size=$((16 * 2**20)) # 16 MiB
    require_conv_zone_bytes "${size}" || return $SKIP_TESTCASE

    run_one_fio_job "$(ioengine "libaio")" --iodepth=64 --rw=randwrite \
        --bs=16K --zonemode=zbd --zonesize="${zone_size}" --do_verify=1 \
        --verify=md5 --offset="$off" --size="$size" \
        >>"${logfile}.${test_number}" 2>&1 || return $?
    check_written $((size)) || return $?
    check_read $((size)) || return $?
}
514
# Sequential read on a mix of empty and full zones. The first four sequential
# zones are reset, the last two of them are written, and all four are read.
# Both the written and the read amount must equal the capacity of the two
# written zones.
test15() {
    local i off size bs
    local w_off w_size w_capacity
    local -a read_job

    if [ -n "$is_zbd" ]; then
        for ((i = 0; i < 4; i++)); do
            reset_zone "$dev" \
                $((first_sequential_zone_sector + i * sectors_per_zone))
        done
    fi
    prep_write
    w_off=$(((first_sequential_zone_sector + 2 * sectors_per_zone) * 512))
    w_size=$((2 * zone_size))
    w_capacity=$(total_zone_capacity 2 $w_off $dev)
    off=$((first_sequential_zone_sector * 512))
    size=$((4 * zone_size))
    bs=$(min $((zone_size / 16)) "$zone_cap_bs")
    read_job=("$(ioengine "psync")" --rw=read --bs="$bs")
    read_job+=(--zonemode=zbd --zonesize="${zone_size}" --offset=$off)
    read_job+=(--size=$((size)))
    write_and_run_one_fio_job "${w_off}" "${w_size}" "${read_job[@]}" \
        >>"${logfile}.${test_number}" 2>&1 ||
        return $?
    check_written $((w_capacity)) || return $?
    check_read $((w_capacity))
}
540
# Random read on a mix of empty and full zones. The first four sequential
# zones are reset, the last two of them are written, and random reads are
# issued over all four.
test16() {
    local off size
    local i w_off w_size w_capacity
    local -a read_job

    if [ -n "$is_zbd" ]; then
        for ((i = 0; i < 4; i++)); do
            reset_zone "$dev" \
                $((first_sequential_zone_sector + i * sectors_per_zone))
        done
    fi
    prep_write
    w_off=$(((first_sequential_zone_sector + 2 * sectors_per_zone) * 512))
    w_size=$((2 * zone_size))
    w_capacity=$(total_zone_capacity 2 $w_off $dev)
    off=$((first_sequential_zone_sector * 512))
    size=$((4 * zone_size))
    read_job=("$(ioengine "libaio")" --iodepth=64 --rw=randread --bs=16K)
    read_job+=(--zonemode=zbd --zonesize="${zone_size}" --offset=$off)
    read_job+=(--size=$size)
    write_and_run_one_fio_job "${w_off}" "${w_size}" "${read_job[@]}" \
        >>"${logfile}.${test_number}" 2>&1 ||
        return $?
    check_written $w_capacity || return $?
    check_read $size
}
564
# Random reads and writes in the last zone. The zone used is the last zone of
# the disk, or the last online zone when that one starts earlier. With
# --loops=2 the sum of the bytes read and written must be twice the job size.
test17() {
    local io off last read size written expected

    off=$(((disk_size / zone_size - 1) * zone_size))
    size=$((disk_size - off))
    if ! last=($(last_online_zone "$dev")); then
        echo "Failed to determine last online zone"
        exit 1
    fi
    if [[ "$((last * 512))" -lt "$off" ]]; then
        off=$((last * 512))
        size=$zone_size
    fi
    if [ -n "$is_zbd" ]; then
        reset_zone "$dev" $((off / 512)) || return $?
    fi
    prep_write
    run_one_fio_job "$(ioengine "libaio")" --iodepth=8 --rw=randrw --bs=4K \
        --zonemode=zbd --zonesize="${zone_size}" \
        --offset="$off" --loops=2 --norandommap=1 \
        --size="$size" \
        >>"${logfile}.${test_number}" 2>&1 || return $?
    written=$(fio_written <"${logfile}.${test_number}")
    read=$(fio_read <"${logfile}.${test_number}")
    io=$((written + read))
    expected=$((size * 2))
    # Log the value that is actually compared against (twice the job size).
    echo "Total number of bytes read and written: $io <> $expected" \
        >>"${logfile}.${test_number}"
    [ "$io" = "$expected" ]
}
595
# Out-of-range zone reset threshold and frequency parameters.
# A negative --zone_reset_threshold must be rejected as out of range.
test18() {
    local expected_msg='value out of range'

    run_fio_on_seq --zone_reset_threshold=-1 2>&1 |
        tee -a "${logfile}.${test_number}" |
        grep -q "$expected_msg"
}
602
# A --zone_reset_threshold of 2 must be rejected as out of range.
test19() {
    local expected_msg='value out of range'

    run_fio_on_seq --zone_reset_threshold=2 2>&1 |
        tee -a "${logfile}.${test_number}" |
        grep -q "$expected_msg"
}
608
# A list of values for --zone_reset_threshold must be rejected.
test20() {
    local expected_msg='the list exceeding max length'

    run_fio_on_seq --zone_reset_threshold=.4:.6 2>&1 |
        tee -a "${logfile}.${test_number}" |
        grep -q "$expected_msg"
}
614
# A negative --zone_reset_frequency must be rejected as out of range.
test21() {
    local expected_msg='value out of range'

    run_fio_on_seq --zone_reset_frequency=-1 2>&1 |
        tee -a "${logfile}.${test_number}" |
        grep -q "$expected_msg"
}
620
# A --zone_reset_frequency of 2 must be rejected as out of range.
test22() {
    local expected_msg='value out of range'

    run_fio_on_seq --zone_reset_frequency=2 2>&1 |
        tee -a "${logfile}.${test_number}" |
        grep -q "$expected_msg"
}
626
# A list of values for --zone_reset_frequency must be rejected.
test23() {
    local expected_msg='the list exceeding max length'

    run_fio_on_seq --zone_reset_frequency=.4:.6 2>&1 |
        tee -a "${logfile}.${test_number}" |
        grep -q "$expected_msg"
}
632
# Write the first sequential zone nine times in a row with zone reset
# frequency and threshold options set. The amount written must be nine times
# the zone capacity and the reset count must be 8, 9 or 10.
test24() {
    local bs loops=9 size=$((zone_size))
    local off capacity
    local accepted rc

    prep_write
    off=$((first_sequential_zone_sector * 512))
    capacity=$(total_zone_capacity 1 $off $dev)

    bs=$(min $((256*1024)) "$zone_size")
    run_fio_on_seq "$(ioengine "psync")" --rw=write --bs="$bs" \
        --size=$size --loops=$loops \
        --zone_reset_frequency=.01 --zone_reset_threshold=.90 \
        >> "${logfile}.${test_number}" 2>&1 ||
        return $?
    check_written $((capacity * loops)) || return $?

    # Stop at the first accepted count; otherwise report the last status.
    for accepted in 8 9 10; do
        check_reset_count -eq $accepted
        rc=$?
        if [ "$rc" -eq 0 ]; then
            break
        fi
    done
    return "$rc"
}
651
# Multiple non-overlapping sequential write jobs for the same drive. Sixteen
# jobs each write one of the first sixteen sequential zones.
test25() {
    local i opts=()

    for ((i=0;i<16;i++)); do
        [ -n "$is_zbd" ] &&
            reset_zone "$dev" $((first_sequential_zone_sector + i*sectors_per_zone))
    done
    prep_write
    for ((i=0;i<16;i++)); do
        opts+=("--name=job$i" "--filename=$dev" "--thread=1" "--direct=1")
        opts+=("--offset=$((first_sequential_zone_sector*512 + zone_size*i))")
        opts+=("--size=$zone_size" "$(ioengine "psync")" "--rw=write" "--bs=16K")
        opts+=("--zonemode=zbd" "--zonesize=${zone_size}" "--group_reporting=1")
        # Quoted so that every array element stays exactly one fio argument.
        opts+=("${job_var_opts[@]}")
    done
    run_fio "${opts[@]}" >> "${logfile}.${test_number}" 2>&1 || return $?
}
670
# Write the first sequential zone four times with verification enabled, using
# fio I/O pattern $1 (--rw value). The amount written must be four times the
# zone capacity.
write_to_first_seq_zone() {
    local loops=4 r
    local off capacity
    local -a job

    prep_write
    off=$((first_sequential_zone_sector * 512))
    capacity=$(total_zone_capacity 1 $off $dev)

    r=$(((RANDOM << 16) | RANDOM))
    job=(--name="$dev" --filename="$dev" "$(ioengine "psync")" --rw="$1")
    job+=(--thread=1 --do_verify=1 --verify=md5 --direct=1 --bs=4K)
    job+=(--offset=$off)
    job+=(--size=$zone_size --loops=$loops --randseed="$r")
    job+=(--zonemode=zbd --zonesize="${zone_size}" --group_reporting=1)
    job+=(--gtod_reduce=1)
    run_fio "${job[@]}" >> "${logfile}.${test_number}" 2>&1 || return $?
    check_written $((loops * capacity))
}
688
# Overwrite the first sequential zone four times sequentially.
test26() {
    local rw_mode="write"

    write_to_first_seq_zone "$rw_mode"
}
693
# Overwrite the first sequential zone four times using random writes.
test27() {
    local rw_mode="randwrite"

    write_to_first_seq_zone "$rw_mode"
}
698
# Multiple overlapping random write jobs for the same drive. Sixteen jobs all
# write the 65th sequential zone; each job writes one zone capacity, and the
# zone must have been reset once per job, or once less.
test28() {
    # capacity is declared local so that it does not leak into the global
    # scope.
    local i jobs=16 off opts capacity

    require_seq_zones 65 || return $SKIP_TESTCASE
    off=$((first_sequential_zone_sector * 512 + 64 * zone_size))
    [ -n "$is_zbd" ] && reset_zone "$dev" $((off / 512))
    prep_write
    opts=("--debug=zbd")
    capacity=$(total_zone_capacity 1 "$off" "$dev")
    for ((i=0;i<jobs;i++)); do
        opts+=("--name=job$i" "--filename=$dev" "--offset=$off" "--bs=16K")
        opts+=("--size=$zone_size" "--io_size=$capacity" "$(ioengine "psync")" "--rw=randwrite")
        opts+=("--thread=1" "--direct=1" "--zonemode=zbd")
        opts+=("--zonesize=${zone_size}" "--group_reporting=1")
        # Quoted so that every array element stays exactly one fio argument.
        opts+=("${job_var_opts[@]}")
    done
    run_fio "${opts[@]}" >> "${logfile}.${test_number}" 2>&1 || return $?
    check_written $((jobs * capacity)) || return $?
    check_reset_count -eq "$jobs" ||
        check_reset_count -eq $((jobs - 1)) ||
        return $?
}
722
# Multiple overlapping random write jobs for the same drive and with a limited
# number of open zones. Sixteen jobs share a range of sixteen zones with
# --max_open_zones=4, and each job writes one zone size worth of data.
test29() {
    # size is declared local so that it does not leak into the global scope.
    local i jobs=16 off size opts=()

    require_seq_zones 80 || return $SKIP_TESTCASE
    off=$((first_sequential_zone_sector * 512 + 64 * zone_size))
    size=$((16*zone_size))

    [ -n "$is_zbd" ] && reset_zone "$dev" -1

    opts=("--debug=zbd")
    for ((i=0;i<jobs;i++)); do
        opts+=("--name=job$i" "--filename=$dev" "--offset=$off" "--bs=16K")
        opts+=("--size=$size" "--io_size=$zone_size" "--thread=1")
        opts+=("$(ioengine "psync")" "--rw=randwrite" "--direct=1")
        opts+=("--max_open_zones=4" "--group_reporting=1")
        opts+=("--zonemode=zbd" "--zonesize=${zone_size}")
        # max_open_zones is already specified. The helper's output is split
        # into words on purpose: one word per remaining option.
        opts+=($(job_var_opts_exclude "--max_open_zones"))
    done
    run_fio "${opts[@]}" >> "${logfile}.${test_number}" 2>&1 || return $?
    check_written $((jobs * zone_size)) || return $?
}
747
# Random reads and writes across the entire disk for 30s, starting at the
# first sequential zone. The status of the fio run is the test result.
test30() {
    local off
    local -a job

    prep_write
    off=$((first_sequential_zone_sector * 512))
    job=("$(ioengine "libaio")" --iodepth=8 --rw=randrw)
    job+=(--bs="$(max $((zone_size / 128)) "$min_seq_write_size")")
    job+=(--zonemode=zbd --zonesize="${zone_size}" --offset=$off)
    job+=(--loops=2 --time_based --runtime=30s --norandommap=1)
    run_one_fio_job "${job[@]}" >>"${logfile}.${test_number}" 2>&1
}
760
# Random reads across all sequential zones for 30s. This is not only a fio
# test but also allows to verify the performance of a drive.
test31() {
    local bs inc nz off opts size

    [ -n "$is_zbd" ] && reset_zone "$dev" -1

    # As preparation, write 128 KB to sequential write required zones. Limit
    # write target zones up to max_open_zones to keep test time reasonable.
    # To distribute the write target zones evenly, skip certain zones for every
    # write. Utilize zonemode strided for such write patterns.
    bs=$((128 * 1024))
    nz=$((max_open_zones))
    if [[ $nz -eq 0 ]]; then
        nz=128
    fi
    off=$((first_sequential_zone_sector * 512))
    size=$((disk_size - off))
    inc=$(((size / nz / zone_size) * zone_size))
    opts=("--name=$dev" "--filename=$dev" "--rw=write" "--bs=${bs}")
    opts+=("--offset=$off" "--size=$((inc * nz))" "--io_size=$((bs * nz))")
    opts+=("--zonemode=strided" "--zonesize=${bs}" "--zonerange=${inc}")
    opts+=("--direct=1")
    # [*] joins the array into the single word that is logged.
    echo "fio ${opts[*]}" >> "${logfile}.${test_number}"
    # The preparation write bypasses run_fio and its status is not checked.
    "$(dirname "$0")/../../fio" "${opts[@]}" >> "${logfile}.${test_number}" 2>&1

    # Next, run the test.
    opts=("--name=$dev" "--filename=$dev" "--offset=$off" "--size=$size")
    opts+=("--bs=$bs" "$(ioengine "psync")" "--rw=randread" "--direct=1")
    opts+=("--thread=1" "--time_based" "--runtime=30" "--zonemode=zbd")
    opts+=("--zonesize=${zone_size}")
    # Quoted so that every array element stays exactly one fio argument.
    opts+=("${job_var_opts[@]}")
    run_fio "${opts[@]}" >> "${logfile}.${test_number}" 2>&1 || return $?
}
795
# Random writes across all sequential zones for 30s. This is not only a fio
# test but also allows to verify the performance of a drive. Skipped unless
# the target is a zoned block device.
test32() {
    local off opts=() size

    if ! require_zbd; then
        return $SKIP_TESTCASE
    fi

    if [ -n "$is_zbd" ]; then
        reset_zone "$dev" -1
    fi

    off=$((first_sequential_zone_sector * 512))
    size=$((disk_size - off))
    opts=(
        "--name=$dev" "--filename=$dev" "--offset=$off" "--size=$size"
        "--bs=128K" "$(ioengine "psync")" "--rw=randwrite" "--direct=1"
        "--thread=1" "--time_based" "--runtime=30"
        "--max_open_zones=$max_open_zones" "--zonemode=zbd"
        "--zonesize=${zone_size}"
    )
    run_fio "${opts[@]}" >> "${logfile}.${test_number}" 2>&1 || return $?
}
814
# Write to sequential zones with a block size that is not a divisor of the
# zone size (three quarters of the zone capacity). The amount written must be
# the I/O size rounded down to a multiple of the block size.
test33() {
    local bs io_size size
    local off capacity=0
    local -a job

    if [ -n "$is_zbd" ]; then
        reset_zone "$dev" -1
    fi

    off=$((first_sequential_zone_sector * 512))
    capacity=$(total_zone_capacity 1 $off $dev)
    size=$((2 * zone_size))
    io_size=$((5 * capacity))
    bs=$((3 * capacity / 4))
    job=("$(ioengine "psync")" --iodepth=1 --rw=write)
    job+=(--size=$size --io_size=$io_size --bs=$bs)
    run_fio_on_seq "${job[@]}" >> "${logfile}.${test_number}" 2>&1 ||
        return $?
    check_written $((io_size / bs * bs))
}
833
# Test repeated async write job with verify using two unaligned block sizes:
# 7 * 4096 bytes, and 4096 bytes less than the smaller of the zone capacity
# and 4 MiB. Skipped unless the target is a zoned block device.
test34() {
    local bs off zone_capacity
    local -a block_sizes

    require_zbd || return $SKIP_TESTCASE
    prep_write

    off=$((first_sequential_zone_sector * 512))
    zone_capacity=$(total_zone_capacity 1 "$off" "$dev")
    block_sizes=($((4096 * 7)) $(($(min "${zone_capacity}" 4194304) - 4096)))

    # Arrays are expanded quoted so that each element stays one word.
    for bs in "${block_sizes[@]}"; do
        run_fio --name=job --filename="${dev}" --rw=randwrite \
            --bs="${bs}" --offset="${off}" \
            --size=$((4 * zone_size)) --iodepth=256 \
            "$(ioengine "libaio")" --time_based=1 --runtime=15s \
            --zonemode=zbd --direct=1 --zonesize="${zone_size}" \
            --verify=crc32c --do_verify=1 "${job_var_opts[@]}" \
            >> "${logfile}.${test_number}" 2>&1 || return $?
    done
}
856
# Test 1/4 for the I/O boundary rounding code: $size < $zone_size.
# The range starts one sector into the first sequential zone and ends one
# sector before its end; fio must fail with "io_size must be at least one
# zone".
test35() {
    local bs off io_size size
    local -a job

    prep_write
    off=$(((first_sequential_zone_sector + 1) * 512))
    size=$((zone_size - 2 * 512))
    bs=$((zone_size / 4))
    job=(--offset=$off --size=$size "$(ioengine "psync")")
    job+=(--iodepth=1 --rw=write --do_verify=1 --verify=md5)
    job+=(--bs=$bs --zonemode=zbd --zonesize="${zone_size}")
    if run_one_fio_job "${job[@]}" >> "${logfile}.${test_number}" 2>&1; then
        return 1
    fi
    grep -q 'io_size must be at least one zone' "${logfile}.${test_number}"
}
871
# Test 2/4 for the I/O boundary rounding code: $size < $zone_size.
# The range starts at the first sequential zone and is one sector short of a
# full zone; fio must fail with "io_size must be at least one zone".
test36() {
    local bs off io_size size
    local -a job

    prep_write
    off=$(((first_sequential_zone_sector) * 512))
    size=$((zone_size - 512))
    bs=$((zone_size / 4))
    job=(--offset=$off --size=$size "$(ioengine "psync")")
    job+=(--iodepth=1 --rw=write --do_verify=1 --verify=md5)
    job+=(--bs=$bs --zonemode=zbd --zonesize="${zone_size}")
    if run_one_fio_job "${job[@]}" >> "${logfile}.${test_number}" 2>&1; then
        return 1
    fi
    grep -q 'io_size must be at least one zone' "${logfile}.${test_number}"
}
886
# Test 3/4 for the I/O boundary rounding code: $size > $zone_size.
# The range starts one sector before the first sequential zone (or at 0 when
# that zone is the first one) and is two sectors longer than a zone. The
# amount written must equal the capacity of one zone. The status of the fio
# run itself is not checked.
test37() {
    local bs off size capacity
    local -a job

    prep_write
    capacity=$(total_zone_capacity 1 $((first_sequential_zone_sector*512)) $dev)
    off=0
    if [ "$first_sequential_zone_sector" != 0 ]; then
        off=$(((first_sequential_zone_sector - 1) * 512))
    fi
    size=$((zone_size + 2 * 512))
    bs=$(min $((zone_size / 4)) "$zone_cap_bs")
    job=(--offset=$off --size=$size "$(ioengine "psync")")
    job+=(--iodepth=1 --rw=write --do_verify=1 --verify=md5)
    job+=(--bs=$bs --zonemode=zbd --zonesize="${zone_size}")
    run_one_fio_job "${job[@]}" >> "${logfile}.${test_number}" 2>&1
    check_written $capacity
}
906
# Test 4/4 for the I/O boundary rounding code: $offset > $disk_size - $zone_size
# A single minimum-sized block at the very end of the disk is requested; fio
# must fail with "io_size must be at least one zone".
test38() {
    local bs off size
    local -a job

    prep_write
    size=$((min_seq_write_size))
    off=$((disk_size - min_seq_write_size))
    bs=$((min_seq_write_size))
    job=(--offset=$off --size=$size "$(ioengine "psync")")
    job+=(--iodepth=1 --rw=write --do_verify=1 --verify=md5)
    job+=(--bs=$bs --zonemode=zbd --zonesize="${zone_size}")
    if run_one_fio_job "${job[@]}" >> "${logfile}.${test_number}" 2>&1; then
        return 1
    fi
    grep -q 'io_size must be at least one zone' "${logfile}.${test_number}"
}
921
# Read one block from a block device. The block has the minimum sequential
# write size and is read at the offset reported for the first online zone.
# Extra arguments are passed to fio. The fio output goes to stdout and is
# also appended to the log of the current test.
read_one_block() {
    local off
    local bs
    # result is local so that it does not leak into the global scope.
    local -a result

    if ! result=($(first_online_zone "$dev")); then
        echo "Failed to determine first online zone"
        exit 1
    fi
    off=${result[0]}
    bs=$((min_seq_write_size))
    run_one_fio_job --rw=read "$(ioengine "psync")" --offset="$off" --bs="$bs" \
        --size="$bs" "$@" 2>&1 |
        tee -a "${logfile}.${test_number}"
}
937
# Check whether fio accepts --zonemode=none for zoned block devices. One block
# of the minimum sequential write size must be read.
test39() {
    if ! require_zbd; then
        return $SKIP_TESTCASE
    fi
    read_one_block --zonemode=none >/dev/null || return $?
    check_read $((min_seq_write_size))
}
944
# Check whether fio accepts --zonemode=strided for zoned block devices.
# Without --zonesize fio must complain; with --zonesize one block must be
# read.
test40() {
    local bs
    local expected_msg

    bs=$((min_seq_write_size))
    if ! require_zbd; then
        return $SKIP_TESTCASE
    fi
    expected_msg='fio: --zonesize must be specified when using --zonemode=strided'
    read_one_block --zonemode=strided |
        grep -q "$expected_msg" ||
        return $?
    read_one_block --zonemode=strided --zonesize=$bs >/dev/null || return $?
    check_read $bs
}
957
# Check whether fio checks the zone size for zoned block devices. A --zonesize
# of twice the zone size must be reported as a mismatch.
test41() {
    local expected_msg='job parameter zonesize.*does not match disk zone size'

    if ! require_zbd; then
        return $SKIP_TESTCASE
    fi
    read_one_block --zonemode=zbd --zonesize=$((2 * zone_size)) |
        grep -q "$expected_msg"
}
964
# Check whether fio handles --zonesize=0 correctly for regular block devices:
# it must report that the zone size is mandatory.
test42() {
    local expected_msg='Specifying the zone size is mandatory for regular file/block device with --zonemode=zbd'

    if ! require_regular_block_dev; then
        return $SKIP_TESTCASE
    fi
    read_one_block --zonemode=zbd --zonesize=0 |
        grep -q "$expected_msg"
}
971
# Check whether fio handles --zonesize=1 correctly for regular block devices:
# it must report that the zone size is too small.
test43() {
    local expected_msg='zone size must be at least 512 bytes for --zonemode=zbd'

    if ! require_regular_block_dev; then
        return $SKIP_TESTCASE
    fi
    read_one_block --zonemode=zbd --zonesize=1 |
        grep -q "$expected_msg"
}
978
# Check whether fio handles --zonemode=none --zonesize=1 correctly: fio must
# report that the two options are not compatible.
test44() {
    local want_msg='fio: --zonemode=none and --zonesize are not compatible'

    read_one_block --zonemode=none --zonesize=1 | grep -q "$want_msg"
}
984
# Random write of one zone to the first sequential zone of a zoned device,
# without passing --zonemode from this test. The test passes only if the job
# output contains fio's hint to consider --zonemode=zbd after a failed first
# I/O. The job output is also appended to the log file of the test.
test45() {
    local bs

    require_zbd || return $SKIP_TESTCASE
    prep_write
    bs=$((min_seq_write_size))
    run_one_fio_job "$(ioengine "psync")" --iodepth=1 --rw=randwrite \
        --bs="$bs" \
        --offset=$((first_sequential_zone_sector * 512)) \
        --size="$zone_size" --do_verify=1 --verify=md5 2>&1 |
        tee -a "${logfile}.${test_number}" |
        grep -q "fio: first I/O failed. If .* is a zoned block device, consider --zonemode=zbd"
}
997
# Random write to sequential zones, libaio, 8 jobs, queue depth 64 per job.
# The expected amount of written data is 8 times four zone sizes.
test46() {
    local size

    prep_write
    size=$((4 * zone_size))
    run_fio_on_seq "$(ioengine "libaio")" \
        --iodepth=64 \
        --rw=randwrite \
        --bs=4K \
        --group_reporting=1 \
        --numjobs=8 \
        >> "${logfile}.${test_number}" 2>&1 || return
    check_written $((size * 8))
}
1009
# Check whether fio handles --zonemode=zbd --zoneskip=1 correctly: the job
# must fail and the log must contain the zoneskip error message.
test47() {
    local bs

    prep_write
    bs=$((min_seq_write_size))
    if run_fio_on_seq "$(ioengine "psync")" --rw=write --bs=$bs --zoneskip=1 \
        >> "${logfile}.${test_number}" 2>&1; then
        # fio unexpectedly accepted the option.
        return 1
    fi
    grep -q 'zoneskip 1 is not a multiple of the device zone size' "${logfile}.${test_number}"
}
1020
# Multiple overlapping random write jobs for the same drive and with a
# limited number of open zones. This is similar to test29, but uses libaio
# to stress test zone locking.
#
# 16 time based jobs share the same 16 zone range, which starts 64 zones
# after the first sequential zone, with --max_open_zones=4. fio is started
# directly (under timeout) rather than through the run_fio helper. Returns
# the exit status of that command.
test48() {
    # size and fio are local so that they do not leak into other tests.
    local i jobs=16 off size fio opts=()

    require_zbd || return $SKIP_TESTCASE
    require_seq_zones 80 || return $SKIP_TESTCASE

    off=$((first_sequential_zone_sector * 512 + 64 * zone_size))
    size=$((16*zone_size))

    [ -n "$is_zbd" ] && reset_zone "$dev" -1

    opts=("--aux-path=/tmp" "--allow_file_create=0" "--significant_figures=10")
    opts+=("--debug=zbd")
    opts+=("$(ioengine "libaio")" "--rw=randwrite" "--direct=1")
    opts+=("--time_based" "--runtime=30")
    opts+=("--zonemode=zbd" "--zonesize=${zone_size}")
    opts+=("--max_open_zones=4")
    for ((i=0;i<jobs;i++)); do
        opts+=("--name=job$i" "--filename=$dev" "--offset=$off" "--bs=16K")
        opts+=("--io_size=$zone_size" "--iodepth=256" "--thread=1")
        opts+=("--size=$size" "--group_reporting=1")
        # max_open_zones is already specified. The helper output is split
        # into words on purpose: one array element per option.
        opts+=($(job_var_opts_exclude "--max_open_zones"))
    done

    fio=$(dirname "$0")/../../fio

    # Record the command line in the log of the test.
    { echo; echo "fio ${opts[*]}"; echo; } >>"${logfile}.${test_number}"

    # Kill fio if it has not finished after 180 seconds.
    timeout -v -s KILL 180s \
        "${dynamic_analyzer[@]}" "$fio" "${opts[@]}" \
        >> "${logfile}.${test_number}" 2>&1 || return $?
}
1057
# Check if fio handles --zonecapacity on a normal block device correctly.
#
# Writes two zones with verification, using a zone capacity of 3/4 of the
# zone size, and expects twice the zone capacity to be written and read.
test49() {
    # Keep the helper variables out of the global scope.
    local size capacity

    require_regular_block_dev || return $SKIP_TESTCASE

    size=$((2 * zone_size))
    capacity=$((zone_size * 3 / 4))

    run_one_fio_job "$(ioengine "psync")" --rw=write \
        --zonemode=zbd --zonesize="${zone_size}" \
        --zonecapacity="${capacity}" \
        --verify=md5 --size="${size}" >>"${logfile}.${test_number}" 2>&1 ||
        return $?
    check_written $((capacity * 2)) || return $?
    check_read $((capacity * 2)) || return $?
}
1074
# Verify that conv zones are not locked and only seq zones are locked during
# random read on conv-seq mixed zones.
#
# The 16 zone I/O range starts 8 zones before the first sequential zone.
# Returns the exit status of the fio run.
test50() {
    local off

    require_zbd || return $SKIP_TESTCASE
    require_conv_zones 8 || return $SKIP_TESTCASE
    require_seq_zones 8 || return $SKIP_TESTCASE

    reset_zone "${dev}" -1

    off=$((first_sequential_zone_sector * 512 - 8 * zone_size))
    # job_var_opts is expanded quoted so that every option stays one word.
    run_fio --name=job --filename="${dev}" --offset="${off}" --bs=64K \
        --size=$((16 * zone_size)) "$(ioengine "libaio")" --rw=randread \
        --time_based --runtime=3 --zonemode=zbd --zonesize="${zone_size}" \
        --direct=1 --group_reporting=1 "${job_var_opts[@]}" \
        >> "${logfile}.${test_number}" 2>&1 || return $?
}
1093
# Verify that conv zones are neither locked nor opened during random write on
# conv-seq mixed zones. Zone lock and zone open shall happen only on seq zones.
#
# 16 time based jobs with block sizes of 16K, 32K, ..., 256K write to a
# 16 zone range that starts 8 zones before the first sequential zone, with
# --max_open_zones=2. Returns the exit status of the fio run.
test51() {
    # The loop counter is local so that it does not leak into other tests.
    local i off jobs=16
    local -a opts

    require_zbd || return $SKIP_TESTCASE
    require_conv_zones 8 || return $SKIP_TESTCASE
    require_seq_zones 8 || return $SKIP_TESTCASE

    reset_zone "$dev" -1

    off=$((first_sequential_zone_sector * 512 - 8 * zone_size))
    opts+=("--size=$((16 * zone_size))" "$(ioengine "libaio")")
    opts+=("--zonemode=zbd" "--direct=1" "--zonesize=${zone_size}")
    opts+=("--max_open_zones=2" "--offset=$off")
    opts+=("--thread=1" "--group_reporting=1")
    opts+=("--time_based" "--runtime=30" "--rw=randwrite")
    for ((i=0;i<jobs;i++)); do
        opts+=("--name=job${i}" "--filename=$dev")
        opts+=("--bs=$(((i+1)*16))K")
        # max_open_zones is already specified. The helper output is split
        # into words on purpose: one array element per option.
        opts+=($(job_var_opts_exclude "--max_open_zones"))
    done
    run_fio "${opts[@]}" >> "${logfile}.${test_number}" 2>&1 || return $?
}
1119
# Verify that zone_reset_threshold only accounts written bytes in seq
# zones, and written data bytes of conv zones are not counted.
#
# Passes if the expected amount of data was written and no zone reset was
# counted.
test52() {
    local off io_size

    require_zbd || return $SKIP_TESTCASE
    require_conv_zones 8 || return $SKIP_TESTCASE
    require_seq_zones 8 || return $SKIP_TESTCASE

    reset_zone "${dev}" -1

    # Total I/O size is 1/8 = 0.125 of the I/O range of conv + seq zones.
    # Set zone_reset_threshold as 0.1. The threshold size is less than
    # 0.125, so a reset count of zero is expected.
    # On the other hand, half of the I/O range is covered by conv zones.
    # If fio counted the conv zones for zone_reset_threshold, the ratio
    # would be more than 0.5 and would trigger zone resets.

    off=$((first_sequential_zone_sector * 512 - 8 * zone_size))
    io_size=$((zone_size * 16 / 8))
    # job_var_opts is expanded quoted so that every option stays one word.
    run_fio --name=job --filename="$dev" --rw=randwrite \
        --bs=$((zone_size/16)) \
        --size=$((zone_size * 16)) --softrandommap=1 \
        --io_size=$((io_size)) "$(ioengine "psync")" --offset="$off" \
        --zonemode=zbd --direct=1 --zonesize="${zone_size}" \
        --zone_reset_threshold=.1 --zone_reset_frequency=1.0 \
        "${job_var_opts[@]}" --debug=zbd \
        >> "${logfile}.${test_number}" 2>&1 || return $?

    check_written "${io_size}" || return $?
    check_reset_count -eq 0 || return $?
}
1151
# Check both reads and writes are executed by random I/O to conventional zones.
#
# Runs a randrw job on the 4 zones in front of the first sequential zone.
# Passes if the sum of read and written bytes equals the total capacity of
# these zones and neither of the two byte counts is zero.
test53() {
    local off capacity io read_b=0 written_b=0

    require_zbd || return $SKIP_TESTCASE
    require_conv_zones 4 || return $SKIP_TESTCASE

    off=$((first_sequential_zone_sector * 512 - 4 * zone_size))
    capacity=$(total_zone_capacity 4 "$off" "$dev")
    # job_var_opts is expanded quoted so that every option stays one word.
    run_fio --name=job --filename="${dev}" --rw=randrw --bs=64K \
        --size=$((4 * zone_size)) "$(ioengine "psync")" --offset="${off}" \
        --zonemode=zbd --direct=1 --zonesize="${zone_size}" \
        "${job_var_opts[@]}" \
        >> "${logfile}.${test_number}" 2>&1 || return $?

    written_b=$(fio_written <"${logfile}.${test_number}")
    read_b=$(fio_read <"${logfile}.${test_number}")
    io=$((written_b + read_b))
    echo "Number of bytes read: $read_b" >>"${logfile}.${test_number}"
    echo "Number of bytes written: $written_b" >>"${logfile}.${test_number}"
    echo "Total number of bytes read and written: $io <> $capacity" \
        >>"${logfile}.${test_number}"
    if ((io==capacity && written_b != 0 && read_b != 0)); then
        return 0
    fi
    return 1
}
1179
# Test read/write mix with verify.
#
# Runs a 30 second randrw job with crc32c verification on the first 8
# sequential zones. Returns the exit status of the fio run.
test54() {
    require_zbd || return $SKIP_TESTCASE
    require_seq_zones 8 || return $SKIP_TESTCASE

    # job_var_opts is expanded quoted so that every option stays one word.
    run_fio --name=job --filename="${dev}" "$(ioengine "libaio")" \
        --time_based=1 --runtime=30s --continue_on_error=0 \
        --offset=$((first_sequential_zone_sector * 512)) \
        --size=$((8*zone_size)) --direct=1 --iodepth=1 \
        --rw=randrw:2 --rwmixwrite=25 --bsrange=4k-"${zone_size}" \
        --zonemode=zbd --zonesize="${zone_size}" \
        --verify=crc32c --do_verify=1 --verify_backlog=2 \
        --alloc-size=65536 --random_generator=tausworthe64 \
        "${job_var_opts[@]}" --debug=zbd \
        >> "${logfile}.${test_number}" 2>&1 || return $?
}
1196
# Test 'z' suffix parsing only.
#
# Runs two sequential write jobs in zbd zone mode whose offset, offset
# increment, size and I/O size are all given in units of zones. Returns the
# exit status of the fio run.
test55() {
    local bs
    bs=$((min_seq_write_size))

    require_zbd || return $SKIP_TESTCASE
    # offset=1z + offset_increment=10z + size=2z
    require_seq_zones 13 || return $SKIP_TESTCASE

    # job_var_opts is expanded quoted so that every option stays one word.
    run_fio --name=j \
        --filename="${dev}" \
        --direct=1 \
        "$(ioengine "psync")" \
        --zonemode=zbd \
        --zonesize="${zone_size}" \
        --rw=write \
        --bs="${bs}" \
        --numjobs=2 \
        --offset_increment=10z \
        --offset=1z \
        --size=2z \
        --io_size=3z \
        "${job_var_opts[@]}" --debug=zbd \
        >> "${logfile}.${test_number}" 2>&1 || return $?
}
1222
# Test 'z' suffix parsing only.
#
# Runs a sequential write job in strided zone mode on a regular block device
# with the size and the zone skip given in units of zones. Returns the exit
# status of the fio run.
test56() {
    local bs
    bs=$((min_seq_write_size))

    require_regular_block_dev || return $SKIP_TESTCASE
    require_seq_zones 10 || return $SKIP_TESTCASE

    # job_var_opts is expanded quoted so that every option stays one word.
    run_fio --name=j \
        --filename="${dev}" \
        --direct=1 \
        "$(ioengine "psync")" \
        --zonemode=strided \
        --zonesize="${zone_size}" \
        --rw=write \
        --bs="${bs}" \
        --size=10z \
        --zoneskip=2z \
        "${job_var_opts[@]}" --debug=zbd \
        >> "${logfile}.${test_number}" 2>&1 || return $?
}
1244
# Test that repeated async write job does not cause zone reset during writes
# in-flight, when the block size is not a divisor of the zone size.
#
# Uses a block size of 7 * 4096 bytes on the first 4 sequential zones for
# 30 seconds. Returns the exit status of the fio run.
test57() {
    local bs off

    require_zbd || return $SKIP_TESTCASE

    bs=$((4096 * 7))
    off=$((first_sequential_zone_sector * 512))

    # job_var_opts is expanded quoted so that every option stays one word.
    run_fio --name=job --filename="${dev}" --rw=randwrite --bs="${bs}" \
        --offset="${off}" --size=$((4 * zone_size)) --iodepth=256 \
        "$(ioengine "libaio")" --time_based=1 --runtime=30s \
        --zonemode=zbd --direct=1 --zonesize="${zone_size}" \
        "${job_var_opts[@]}" \
        >> "${logfile}.${test_number}" 2>&1 || return $?
}
1262
# Random writes and random trims to sequential write required zones for 30s.
#
# A "precondition" job first writes 16 zones sequentially. A random write job
# and a random trim job, which both wait for it, then run on 128 zones.
# Returns the exit status of the fio run.
test58() {
    local off size bs
    local -a opts

    if ! require_seq_zones 128; then
        return $SKIP_TESTCASE
    fi

    size=$((zone_size * 128))
    bs="$(max $((zone_size / 128)) "$min_seq_write_size")"
    prep_write
    off=$((first_sequential_zone_sector * 512))

    # Options shared by all jobs.
    opts=("--zonemode=zbd" "--direct=1" "--zonesize=${zone_size}" "--thread=1")
    opts+=("--filename=${dev}" "--norandommap=1")

    # Sequential write job that fills the first 16 zones.
    opts+=("--name=precondition" "--rw=write" "$(ioengine "psync")")
    opts+=("--offset=${off}" "--size=$((zone_size * 16))" "--bs=${bs}")
    opts+=("${job_var_opts[@]}")

    # Random write job.
    opts+=("--name=wjob" "--wait_for=precondition" "--rw=randwrite")
    opts+=("$(ioengine "libaio")" "--iodepth=8")
    opts+=("--offset=${off}" "--size=${size}" "--bs=${bs}")
    opts+=("--time_based" "--runtime=30s" "--flow=128" "${job_var_opts[@]}")

    # Random trim job that trims whole zones.
    opts+=("--name=trimjob" "--wait_for=precondition" "--rw=randtrim")
    opts+=("$(ioengine "psync")")
    opts+=("--offset=${off}" "--size=${size}" "--bs=${zone_size}")
    opts+=("--time_based" "--runtime=30s" "--flow=1" "${job_var_opts[@]}")

    run_fio "${opts[@]}" >>"${logfile}.${test_number}" 2>&1
}
1288
# Test zone_reset_threshold with verify.
#
# Runs one verified job per workload (write, randwrite, rw, randrw) and
# stops at the first failing job, returning its exit status.
test59() {
    local off bs loops=2 size=$((zone_size)) w
    local -a workloads=(write randwrite rw randrw)

    prep_write
    off=$((first_sequential_zone_sector * 512))
    bs=$(min $((256*1024)) "$zone_size")

    for w in "${workloads[@]}"; do
        run_fio_on_seq "$(ioengine "psync")" \
            --rw=${w} \
            --bs="$bs" \
            --size=$size \
            --loops=$loops \
            --do_verify=1 \
            --verify=md5 \
            --zone_reset_frequency=.9 \
            --zone_reset_threshold=.1 \
            >> "${logfile}.${test_number}" 2>&1 || return
    done
}
1306
# Test fio errors out experimental_verify option with zonemode=zbd: the job
# must fail and the log must mention the unsupported option.
test60() {
    if run_fio_on_seq "$(ioengine "psync")" --rw=write --size=$zone_size \
        --do_verify=1 --verify=md5 --experimental_verify=1 \
        >> "${logfile}.${test_number}" 2>&1; then
        # fio unexpectedly accepted the option.
        return 1
    fi
    grep -q 'not support experimental verify' "${logfile}.${test_number}"
}
1314
# Test fio errors out zone_reset_threshold option for multiple jobs with
# different write ranges: the job must fail and the log must mention the
# different write ranges.
test61() {
    if run_fio_on_seq "$(ioengine "psync")" --rw=write --size="$zone_size" \
        --numjobs=2 --offset_increment="$zone_size" \
        --zone_reset_threshold=0.1 --zone_reset_frequency=1 \
        --exitall_on_error=1 \
        >> "${logfile}.${test_number}" 2>&1; then
        # fio unexpectedly accepted the option combination.
        return 1
    fi
    grep -q 'different write ranges' "${logfile}.${test_number}"
}
1325
# Test zone_reset_threshold option works for multiple jobs with same write
# range.
test62() {
    local bs loops=2 size=$((zone_size))

    if [[ -n "$is_zbd" ]]; then
        reset_zone "$dev" -1
    fi

    # Two jobs write to single zone twice. Reset zone happens at next write
    # after half of the zone gets filled. So 2 * 2 * 2 - 1 = 7 times zone
    # resets are expected.
    bs=$(min $((256*1024)) $((zone_size / 4)))
    run_fio_on_seq "$(ioengine "psync")" \
        --rw=write \
        --bs="$bs" \
        --size=$size \
        --loops=$loops \
        --numjobs=2 \
        --zone_reset_frequency=1 \
        --zone_reset_threshold=.5 \
        --group_reporting=1 \
        >> "${logfile}.${test_number}" 2>&1 || return
    check_written $((size * loops * 2)) || return
    check_reset_count -eq 7
}
1345
# Test zone_reset_threshold option works for a read job and a write job with
# different IO range.
test63() {
    local bs loops=2 size=$((zone_size)) off1 off2
    local -a opts

    if [[ -n "$is_zbd" ]]; then
        reset_zone "$dev" -1
    fi

    off1=$((first_sequential_zone_sector * 512))
    off2=$((off1 + zone_size))
    bs=$(min $((256*1024)) $((zone_size / 4)))

    # One job writes to single zone twice. Reset zone happens at next write
    # after half of the zone gets filled. So 2 * 2 - 1 = 3 times zone resets
    # are expected.
    opts=("$(ioengine "psync")" "--bs=$bs" "--size=$size" "--loops=$loops")
    opts+=("--filename=$dev" "--group_reporting=1")
    opts+=("--zonemode=zbd" "--zonesize=$zone_size" "--direct=1")
    opts+=("--zone_reset_frequency=1" "--zone_reset_threshold=.5")
    # The read job uses the first zone, the write job the zone after it.
    opts+=("--name=r" "--rw=read" "--offset=$off1" "${job_var_opts[@]}")
    opts+=("--name=w" "--rw=write" "--offset=$off2" "${job_var_opts[@]}")
    run_fio "${opts[@]}" >> "${logfile}.${test_number}" 2>&1 || return
    check_written $((size * loops)) || return
    check_reset_count -eq 3
}
1370
# Test write zone accounting handles almost full zones correctly. Prepare an
# almost full, but not full zone. Write to the zone with verify using larger
# block size. Then confirm fio does not report write zone accounting failure.
test64() {
    local bs cap

    [ -n "$is_zbd" ] && reset_zone "$dev" -1

    # First job: fill the zone except for its last block of zone_size / 8.
    bs=$((zone_size / 8))
    cap=$(total_zone_capacity 1 $((first_sequential_zone_sector*512)) "$dev")
    run_fio_on_seq "$(ioengine "psync")" --rw=write --bs="$bs" \
        --size=$((zone_size)) \
        --io_size=$((cap - bs)) \
        >> "${logfile}.${test_number}" 2>&1 || return $?

    # Second job: write with verify using half a zone as block size.
    bs=$((zone_size / 2))
    run_fio_on_seq "$(ioengine "psync")" --rw=write --bs="$bs" \
        --size=$((zone_size)) --do_verify=1 --verify=md5 \
        >> "${logfile}.${test_number}" 2>&1 || return $?
}
1391
# Test open zone accounting handles trim workload correctly. Prepare open zones
# as many as max_open_zones=4. Trim one of the 4 zones. Then write to another
# zone and check the write amount is expected size.
test65() {
    local off capacity
    local -a opts

    if [[ -n "$is_zbd" ]]; then
        reset_zone "$dev" -1
    fi

    off=$((first_sequential_zone_sector * 512))
    capacity=$(total_zone_capacity 1 $off "$dev")

    # Options shared by all jobs.
    opts=("--zonemode=zbd" "--direct=1" "--zonesize=$zone_size" "--thread=1")
    opts+=("--filename=$dev" "--group_reporting=1" "--max_open_zones=4")
    opts+=("$(ioengine "psync")")

    # Random writes of one zone size in total, spread over 4 zones.
    opts+=("--name=prep_open_zones" "--rw=randwrite" "--offset=$off")
    opts+=("--size=$((zone_size * 4))" "--bs=4096" "--io_size=$zone_size")

    # Trim the first of these zones.
    opts+=("--name=trimjob" "--wait_for=prep_open_zones" "--rw=trim")
    opts+=("--bs=$zone_size" "--offset=$off" "--size=$zone_size")

    # Write to the zone that follows the 4 zones.
    opts+=("--name=write" "--wait_for=trimjob" "--rw=write" "--bs=4096")
    opts+=("--offset=$((off + zone_size * 4))" "--size=$zone_size")

    # The fio exit status is not checked; only the written amount is.
    run_fio "${opts[@]}" >> "${logfile}.${test_number}" 2>&1

    check_written $((zone_size + capacity))
}
1415
# Restart the shell's elapsed time counter.
SECONDS=0

# Test numbers selected with -t and the valgrind command prefix; both are
# empty by default.
tests=()
dynamic_analyzer=()

# Settings changed by command line options; empty means "not set".
reset_all_zones=""
reset_before_write=""
use_libzbc=""
zbd_debug=""
max_open_zones_opt=""
quit_on_err=""
force_io_uring=""
1426
# Parse the leading command line options. Every case arm handles what is
# specific to its option; the option word itself is shifted away after the
# case statement. Options that take a value shift that value themselves.
while [[ "$1" == -* ]]; do
    case "$1" in
    -d)
        dynamic_analyzer=(valgrind "--read-var-info=yes" "--tool=drd"
                          "--show-confl-seg=no")
        ;;
    -e)
        dynamic_analyzer=(valgrind "--read-var-info=yes" "--tool=helgrind")
        ;;
    -l)
        use_libzbc=1
        ;;
    -r)
        reset_all_zones=1
        ;;
    -w)
        reset_before_write=1
        ;;
    -t)
        tests+=("$2")
        shift
        ;;
    -o)
        max_open_zones_opt="${2}"
        shift
        ;;
    -v)
        dynamic_analyzer=(valgrind "--read-var-info=yes")
        ;;
    -q)
        quit_on_err=1
        ;;
    -z)
        zbd_debug=1
        ;;
    -u)
        force_io_uring=1
        ;;
    --)
        # End of options: drop the marker and stop parsing.
        shift
        break
        ;;
    *)
        usage
        exit 1
        ;;
    esac
    shift
done
1448
# Exactly one argument, the test target device file, must be left.
if (( $# != 1 )); then
    usage
    exit 1
fi

# The libzbc and io_uring I/O engines cannot be requested together.
if [[ -n "$use_libzbc" && -n "$force_io_uring" ]]; then
    echo "Please specify only one of -l and -u options"
    exit 1
fi
1458
# Load the helper functions that live next to this script.
# shellcheck source=functions
source "$(dirname "$0")/functions" || exit $?

# Extra fio options that depend on the script options.
global_var_opts=()
job_var_opts=()
if [ -n "$zbd_debug" ]; then
    global_var_opts+=("--debug=zbd")
fi

# Resolve the test target and determine its geometry: disk_size,
# min_seq_write_size, first_sequential_zone_sector, sectors_per_zone,
# zone_size and max_open_zones. is_zbd is only set for zoned devices.
dev=$1
realdev=$(readlink -f "$dev")
basename=$(basename "$realdev")

if [[ -b "$realdev" ]]; then
    # stat prints the device numbers in hexadecimal.
    major=$((0x$(stat -L -c '%t' "$realdev"))) || exit $?
    minor=$((0x$(stat -L -c '%T' "$realdev"))) || exit $?
    # The sysfs size attribute is multiplied by 512 to get bytes.
    disk_size=$(($(<"/sys/dev/block/$major:$minor/size")*512))

    # When the target is a partition device, get basename of its
    # holder device to access sysfs path of the holder device
    if [[ -r "/sys/dev/block/$major:$minor/partition" ]]; then
        realsysfs=$(readlink "/sys/dev/block/$major:$minor")
        basename=$(basename "${realsysfs%/*}")
    fi
    min_seq_write_size=$(min_seq_write_size "$basename")
    case "$(<"/sys/class/block/$basename/queue/zoned")" in
    host-managed|host-aware)
        is_zbd=true
        if ! check_blkzone "${dev}"; then
            exit 1
        fi
        if ! result=($(first_sequential_zone "$dev")); then
            echo "Failed to determine first sequential zone"
            exit 1
        fi
        first_sequential_zone_sector=${result[0]}
        sectors_per_zone=${result[1]}
        zone_size=$((sectors_per_zone * 512))
        if ! max_open_zones=$(max_open_zones "$dev"); then
            echo "Failed to determine maximum number of open zones"
            exit 1
        fi
        set_io_scheduler "$basename" deadline || exit $?
        if [ -n "$reset_all_zones" ]; then
            reset_zone "$dev" -1
        fi
        ;;
    *)
        # Regular block device: use emulated zone parameters.
        # NOTE(review): this keeps only the bits of (disk_size / 2) that
        # are below min_seq_write_size; confirm that this mask is
        # intended before changing it, the tests depend on the result.
        first_sequential_zone_sector=$(((disk_size / 2) &
                                        (min_seq_write_size - 1)))
        zone_size=$(max 65536 "$min_seq_write_size")
        sectors_per_zone=$((zone_size / 512))
        max_open_zones=128
        set_io_scheduler "$basename" none || exit $?
        ;;
    esac
elif [[ -c "$realdev" ]]; then
    # For an SG node, we must have libzbc option specified
    if [[ ! -n "$use_libzbc" ]]; then
        echo "Character device files can only be used with -l (libzbc) option"
        exit 1
    fi

    # Test the exit status of the helper directly instead of running its
    # output as a command.
    if ! is_zbc "$dev"; then
        echo "Device is not a ZBC disk"
        exit 1
    fi
    is_zbd=true

    if ! disk_size=($(( $(zbc_disk_sectors "$dev") * 512))); then
        echo "Failed to determine disk size"
        exit 1
    fi
    if ! min_seq_write_size=($(zbc_physical_block_size "$dev")); then
        echo "Failed to determine physical block size"
        exit 1
    fi
    if ! result=($(first_sequential_zone "$dev")); then
        echo "Failed to determine first sequential zone"
        exit 1
    fi
    first_sequential_zone_sector=${result[0]}
    sectors_per_zone=${result[1]}
    zone_size=$((sectors_per_zone * 512))
    if ! max_open_zones=$(max_open_zones "$dev"); then
        echo "Failed to determine maximum number of open zones"
        exit 1
    fi
    if [ -n "$reset_all_zones" ]; then
        reset_zone "$dev" -1
    fi
else
    # Without a device none of the geometry variables would be set.
    echo "$dev is neither a block device nor a character device"
    exit 1
fi
1550
# A limit given with -o replaces the detected max_open_zones value and is
# handed to fio as well.
if [[ -n "${max_open_zones_opt}" ]]; then
    # Override max_open_zones with the script option value
    max_open_zones="${max_open_zones_opt}"
    global_var_opts+=("--ignore_zone_limits=1")
    job_var_opts+=("--max_open_zones=${max_open_zones_opt}")
fi

# Report the detected layout; the zone size is shown in MB (bytes >> 20).
printf 'First sequential zone starts at sector %s; zone size: %s MB\n' \
    "$first_sequential_zone_sector" "$((zone_size >> 20))"

zone_cap_bs=$(zone_cap_bs "$dev" "$zone_size")
1562
# Print the numbers of all defined shell functions named test<number>, one
# per line, in ascending numeric order. The pattern is anchored so that
# other functions whose name merely contains "test" are not picked up.
list_test_numbers() {
    declare -F |
        sed -n 's/^declare -f test\([0-9][0-9]*\)$/\1/p' |
        sort -n
}

# Run all test cases unless test numbers were selected with -t.
if [ "${#tests[@]}" = 0 ]; then
    readarray -t tests < <(list_test_numbers)
fi
1567
# Each test case logs to "${logfile}.<test number>".
logfile=$0.log

# Result counters.
passed=0
skipped=0
failed=0

# Colour escape sequences for the result of a test; only used when stdout
# is a terminal.
if [ -t 1 ]; then
    red="\e[1;31m"
    green="\e[1;32m"
    cyan="\e[1;36m"
    end="\e[m"
else
    red=""
    green=""
    # Reset cyan too, so that a value inherited from the environment
    # cannot end up in the output.
    cyan=""
    end=""
fi
# Exit status of the script: becomes 1 once a test case has failed.
rc=0

# Remember an interrupt instead of terminating right away.
intr=0
trap 'intr=1' SIGINT
ret=0
1588
# Run the selected test cases one after the other. A test passes when its
# function returns 0 and check_log succeeds, is skipped when the function
# returns SKIP_TESTCASE, and fails otherwise. The status is printed and
# appended to the log file of the test.
for test_number in "${tests[@]}"; do
    rm -f "${logfile}.${test_number}"
    unset SKIP_REASON
    printf 'Running test %02d ... ' "$test_number"
    # Call the test function directly; no eval is needed for that.
    "test${test_number}"
    ret=$?
    if ((!ret)) && check_log "$test_number"; then
        status="PASS"
        cc_status="${green}${status}${end}"
        ((passed++))
    elif ((ret==SKIP_TESTCASE)); then
        status="SKIP"
        echo "${SKIP_REASON}" >> "${logfile}.${test_number}"
        cc_status="${cyan}${status}${end} ${SKIP_REASON}"
        ((skipped++))
    else
        status="FAIL"
        cc_status="${red}${status}${end}"
        ((failed++))
        rc=1
    fi
    echo -e "$cc_status"
    echo "$status" >> "${logfile}.${test_number}"
    # Stop after an interrupt, or after a failure when -q was given.
    if ((intr != 0)); then
        exit 1
    fi
    if [[ -n "$quit_on_err" ]] && ((rc != 0)); then
        exit 1
    fi
done
1615
# Print the summary; skipped and failed counts are only shown when they are
# not zero. The script exits with rc.
echo "$passed tests passed"
if ((skipped > 0)); then
    echo " $skipped tests skipped"
fi
if ((failed > 0)); then
    echo " $failed tests failed"
fi
# SECONDS is formatted as a time of day in UTC, i.e. as elapsed H:M:S.
echo "Run time: $(TZ=UTC0 printf "%(%H:%M:%S)T\n" $(( SECONDS )) )"
exit $rc