t/zbd: Combine write and read fio commands for test case #16
[fio.git] / t / zbd / test-zbd-support
CommitLineData
191d1d1a
BVA
#!/bin/bash
#
# Copyright (C) 2018 Western Digital Corporation or its affiliates.
#
# This file is released under the GPL.
6
7usage() {
6dcb098d 8 echo "Usage: $(basename "$0") [-d] [-e] [-l] [-r] [-v] [-t <test>] [-z] <SMR drive device node>"
191d1d1a
BVA
9}
10
# Print the larger of the two integers $1 and $2.
max() {
    if [ "$1" -gt "$2" ]; then
        echo "$1"
    else
        echo "$2"
    fi
}
18
# Print the smaller of the two integers $1 and $2.
min() {
    if [ "$1" -lt "$2" ]; then
        echo "$1"
    else
        echo "$2"
    fi
}
26
6dcb098d
DF
# Print the fio --ioengine option to use (no trailing newline).
# $1 is the engine a test asks for; it is overridden by libzbc whenever
# $use_libzbc is non-empty.
ioengine() {
    if [ -n "$use_libzbc" ]; then
        printf '%s' "--ioengine=libzbc"
    else
        printf '%s' "--ioengine=$1"
    fi
}
34
191d1d1a
BVA
# Select I/O scheduler $2 for block device $1 (a name under /sys/block).
# The scheduler name is translated between its legacy and multiqueue
# spelling depending on whether /sys/block/$1/mq exists.
# Returns non-zero if the device has no sysfs entry or the write fails.
set_io_scheduler() {
    local dev=$1 sched=$2

    [ -e "/sys/block/$dev" ] || return $?
    if [ -e "/sys/block/$dev/mq" ]; then
        # Multiqueue device: map legacy names to their mq equivalents.
        case "$sched" in
            noop)     sched=none;;
            deadline) sched=mq-deadline;;
        esac
    else
        # Legacy device: map mq names back to the legacy ones.
        case "$sched" in
            none)        sched=noop;;
            mq-deadline) sched=deadline;;
        esac
    fi

    echo "$sched" >"/sys/block/$dev/queue/scheduler"
}
53
# Succeed if the number of bytes read, as extracted by fio_read from the log
# of the current test, equals $1. The comparison is appended to that log.
check_read() {
    local actual

    actual=$(fio_read <"${logfile}.${test_number}")
    echo "read: $actual <> $1" >> "${logfile}.${test_number}"
    [[ "$actual" == "$1" ]]
}
61
# Succeed if the number of bytes written, as extracted by fio_written from
# the log of the current test, equals $1. The comparison is appended to that
# log.
check_written() {
    local actual

    actual=$(fio_written <"${logfile}.${test_number}")
    echo "written: $actual <> $1" >> "${logfile}.${test_number}"
    [[ "$actual" == "$1" ]]
}
69
# Compare the reset count from the log file with reset count $2 using operator
# $1 (=, -ge, -gt, -le, -lt). The comparison is appended to the log of the
# current test. Returns the result of the comparison.
check_reset_count() {
    local reset_count

    reset_count=$(fio_reset_count <"${logfile}.${test_number}")
    echo "reset_count: test $reset_count $1 $2" >> "${logfile}.${test_number}"
    # The operator can be passed to [ directly; no eval is needed.
    [ "$reset_count" "$1" "$2" ]
}
79
# Whether or not $1 (/dev/...) is a SCSI device.
# Returns 0 if a SCSI device in sysfs exposes a block device with the same
# base name as $1, 1 otherwise.
is_scsi_device() {
    local d f

    # Use the argument, not the global $dev, as the header comment promises.
    d=$(basename "$1")
    for f in /sys/class/scsi_device/*/device/block/"$d"; do
        [ -e "$f" ] && return 0
    done
    return 1
}
90
# Run the fio binary at ../../fio relative to this script with a set of
# common options, followed by the caller's arguments and $var_opts. The full
# command line is appended to the log of the current test first. When
# $dynamic_analyzer is non-empty, fio runs under that command prefix.
# Returns the exit status of fio (or of the analyzer wrapping it).
run_fio() {
    local fio opts

    fio=$(dirname "$0")/../../fio

    opts=("--max-jobs=16" "--aux-path=/tmp" "--allow_file_create=0" \
          "--significant_figures=10" "$@")
    # Quoted so that each extra option stays a single word.
    opts+=("${var_opts[@]}")
    { echo; echo "fio ${opts[*]}"; echo; } >>"${logfile}.${test_number}"

    "${dynamic_analyzer[@]}" "$fio" "${opts[@]}"
}
103
# Run a single fio job against $dev with direct I/O, one thread and a random
# seed built from two $RANDOM draws. Extra fio options are taken from "$@".
run_one_fio_job() {
    local seed=$(( (RANDOM << 16) | RANDOM ))
    local -a job

    job=(--name="$dev" --filename="$dev" "$@" --randseed="$seed"
         --thread=1 --direct=1)
    run_fio "${job[@]}"
}
111
8f601b44
SK
# Run one fio invocation holding two jobs on $dev:
#   1. "write_job": a sequential psync write of $2 bytes starting at byte
#      offset $1, using the logical block size as block size;
#   2. a job named after $dev that waits for write_job and is configured by
#      the remaining arguments.
write_and_run_one_fio_job() {
    local seed
    local wr_start="${1}"
    local wr_len="${2}"
    local -a writer follower

    shift 2
    seed=$(((RANDOM << 16) | RANDOM))
    writer=(--filename="$dev" --randseed="$seed" --name="write_job" --rw=write
            "$(ioengine "psync")" --bs="${logical_block_size}"
            --zonemode=zbd --zonesize="${zone_size}" --thread=1 --direct=1
            --offset="${wr_start}" --size="${wr_len}")
    follower=(--name="$dev" --wait_for="write_job" "$@" --thread=1 --direct=1)
    run_fio "${writer[@]}" "${follower[@]}"
}
125
191d1d1a
BVA
# Run fio on the first four sequential zones of the disk.
# The zone size is passed explicitly only when $is_zbd is empty; the caller's
# options come last.
run_fio_on_seq() {
    local -a seq_args

    seq_args=("--offset=$((first_sequential_zone_sector * 512))"
              "--size=$((4 * zone_size))" "--zonemode=zbd")
    [ -n "$is_zbd" ] || seq_args+=("--zonesize=${zone_size}")
    run_one_fio_job "${seq_args[@]}" "$@"
}
137
# Check whether buffered writes are refused.
test1() {
    local -a stage_rc

    run_fio --name=job1 --filename="$dev" --rw=write --direct=0 --bs=4K \
        "$(ioengine "psync")" --size="${zone_size}" --thread=1 \
        --zonemode=zbd --zonesize="${zone_size}" 2>&1 |
        tee -a "${logfile}.${test_number}" |
        grep -q 'Using direct I/O is mandatory for writing to ZBD drives'
    # Snapshot the per-stage statuses before another command overwrites them.
    stage_rc=("${PIPESTATUS[@]}")

    # fio may exit with 0 or 1 here; any other status goes to the caller.
    if [ "${stage_rc[0]}" != 0 ] && [ "${stage_rc[0]}" != 1 ]; then
        return "${stage_rc[0]}"
    fi
    # With $is_zbd set the message must appear; otherwise it must not.
    if [ -n "$is_zbd" ]; then
        [ "${stage_rc[2]}" = 0 ]
    else
        [ "${stage_rc[2]}" != 0 ]
    fi
}
156
# Block size exceeds zone size.
# Passes when fio exits successfully and the log has no 'WRITE:' line.
test2() {
    local blk start
    local -a args

    start=$(((first_sequential_zone_sector + 2 * sectors_per_zone) * 512))
    blk=$((2 * zone_size))
    args=("$(ioengine "psync")"
          "--name=job1" "--filename=$dev" "--rw=write" "--direct=1"
          "--zonemode=zbd" "--offset=$start" "--bs=$blk" "--size=$blk")
    [ -n "$is_zbd" ] || args+=("--zonesize=${zone_size}")
    run_fio "${args[@]}" >> "${logfile}.${test_number}" 2>&1 || return $?
    ! grep -q 'WRITE:' "${logfile}.${test_number}"
}
172
# Run fio against an empty zone. This causes fio to report "No I/O performed".
# Passes when fio exits successfully and the log has no 'READ:' line.
test3() {
    # size is local so that it no longer leaks into the global scope.
    local off size opts=()

    off=$((first_sequential_zone_sector * 512 + 128 * zone_size))
    size=$((zone_size))
    [ -n "$is_zbd" ] && reset_zone "$dev" $((off / 512))
    opts+=("--name=$dev" "--filename=$dev" "--offset=$off" "--bs=4K")
    opts+=("--size=$size" "--zonemode=zbd")
    opts+=("$(ioengine "psync")" "--rw=read" "--direct=1" "--thread=1")
    if [ -z "$is_zbd" ]; then
        opts+=("--zonesize=${zone_size}")
    fi
    run_fio "${opts[@]}" >> "${logfile}.${test_number}" 2>&1 || return $?
    ! grep -q 'READ:' "${logfile}.${test_number}"
}
189
# Run fio with --read_beyond_wp=1 against an empty zone.
# Passes when exactly one zone worth of data is reported as read.
test4() {
    # size is local so that it no longer leaks into the global scope.
    local off size opts=()

    off=$((first_sequential_zone_sector * 512 + 129 * zone_size))
    size=$((zone_size))
    [ -n "$is_zbd" ] && reset_zone "$dev" $((off / 512))
    opts+=("--name=$dev" "--filename=$dev" "--offset=$off" "--bs=$size")
    opts+=("--size=$size" "--thread=1" "--read_beyond_wp=1")
    opts+=("$(ioengine "psync")" "--rw=read" "--direct=1" "--disable_lat=1")
    opts+=("--zonemode=zbd" "--zonesize=${zone_size}")
    run_fio "${opts[@]}" >> "${logfile}.${test_number}" 2>&1 || return $?
    check_read "$size" || return $?
}
204
# Sequential write to sequential zones.
# Four zones are written and verified; both byte counts must match.
test5() {
    local total blk

    total=$((4 * zone_size))
    blk=$(max $((zone_size / 64)) "$logical_block_size")
    run_fio_on_seq "$(ioengine "psync")" --iodepth=1 --rw=write \
        --bs="$blk" --do_verify=1 --verify=md5 \
        >>"${logfile}.${test_number}" 2>&1 || return $?
    check_written "$total" || return $?
    check_read "$total"
}
217
# Sequential read from sequential zones.
# The first four sequential zones are written by the preparatory write job
# and then read back by the job under test.
test6() {
    local start total blk

    start=$((first_sequential_zone_sector * 512))
    total=$((4 * zone_size))
    blk=$(max $((zone_size / 64)) "$logical_block_size")
    write_and_run_one_fio_job "$start" "${total}" \
        --offset="$start" \
        --size="${total}" --zonemode=zbd --zonesize="${zone_size}" \
        "$(ioengine "psync")" --iodepth=1 --rw=read --bs="$blk" \
        >>"${logfile}.${test_number}" 2>&1 || return $?
    check_read "$total"
}
232
# Random write to sequential zones, libaio, queue depth 1.
# One zone worth of data is written and verified.
test7() {
    local total blk

    total=$((zone_size))
    blk=$(min 16384 "${zone_size}")
    run_fio_on_seq "$(ioengine "libaio")" --iodepth=1 --rw=randwrite \
        --bs="$blk" --do_verify=1 --verify=md5 --size="$total" \
        >>"${logfile}.${test_number}" 2>&1 || return $?
    check_written "$total" || return $?
    check_read "$total"
}
244
# Random write to sequential zones, libaio, queue depth 64.
# Four zones are written and verified.
test8() {
    local total blk

    total=$((4 * zone_size))
    blk=$(min 16384 "${zone_size}")
    run_fio_on_seq "$(ioengine "libaio")" --iodepth=64 --rw=randwrite \
        --bs="$blk" --do_verify=1 --verify=md5 \
        >>"${logfile}.${test_number}" 2>&1 || return $?
    check_written "$total" || return $?
    check_read "$total"
}
257
# Random write to sequential zones, sg, queue depth 1.
# Counts as passed (after logging a note) when $dev is not a SCSI device.
test9() {
    local total

    if is_scsi_device "$dev"; then
        total=$((4 * zone_size))
    else
        echo "$dev is not a SCSI device" >>"${logfile}.${test_number}"
        return 0
    fi

    run_fio_on_seq --ioengine=sg \
        --iodepth=1 --rw=randwrite --bs=16K \
        --do_verify=1 --verify=md5 \
        >>"${logfile}.${test_number}" 2>&1 || return $?
    check_written "$total" || return $?
    check_read "$total"
}
275
# Random write to sequential zones, sg, queue depth 64.
# Counts as passed (after logging a note) when $dev is not a SCSI device.
test10() {
    local total

    if is_scsi_device "$dev"; then
        total=$((4 * zone_size))
    else
        echo "$dev is not a SCSI device" >>"${logfile}.${test_number}"
        return 0
    fi

    run_fio_on_seq --ioengine=sg \
        --iodepth=64 --rw=randwrite --bs=16K \
        --do_verify=1 --verify=md5 \
        >>"${logfile}.${test_number}" 2>&1 || return $?
    check_written "$total" || return $?
    check_read "$total"
}
293
# Random write to sequential zones, libaio, queue depth 64, random block size.
test11() {
    local total=$((4 * zone_size))
    local -a args

    args=("$(ioengine "libaio")" --iodepth=64 --rw=randwrite
          --bsrange=4K-64K --do_verify=1 --verify=md5 --debug=zbd)
    run_fio_on_seq "${args[@]}" >>"${logfile}.${test_number}" 2>&1 || return $?
    check_written "$total" || return $?
    check_read "$total"
}
305
# Random write to sequential zones, libaio, queue depth 64, max 1 open zone.
test12() {
    local total=$((8 * zone_size))
    local -a args

    args=("$(ioengine "libaio")" --iodepth=64 --rw=randwrite --bs=16K
          --max_open_zones=1 --size="$total" --do_verify=1 --verify=md5
          --debug=zbd)
    run_fio_on_seq "${args[@]}" >>"${logfile}.${test_number}" 2>&1 || return $?
    check_written "$total" || return $?
    check_read "$total"
}
317
# Random write to sequential zones, libaio, queue depth 64, max 4 open zones.
test13() {
    local total=$((8 * zone_size))
    local -a args

    args=("$(ioengine "libaio")" --iodepth=64 --rw=randwrite --bs=16K
          --max_open_zones=4 --size="$total" --do_verify=1 --verify=md5
          --debug=zbd)
    run_fio_on_seq "${args[@]}" >>"${logfile}.${test_number}" 2>&1 || return $?
    check_written "$total" || return $?
    check_read "$total"
}
330
# Random write to conventional zones.
# Skipped (counted as passed) when fewer than 16 MiB precede the first
# sequential zone.
test14() {
    local size

    size=$((16 * 2**20)) # 16 MiB
    if [ "$size" -gt $((first_sequential_zone_sector * 512)) ]; then
        # The area in front of the first sequential zone is too small.
        echo "$dev does not have enough conventional zones" \
            >>"${logfile}.${test_number}"
        return 0
    fi
    run_one_fio_job "$(ioengine "libaio")" --iodepth=64 --rw=randwrite --bs=16K \
        --zonemode=zbd --zonesize="${zone_size}" --do_verify=1 \
        --verify=md5 --size="$size" \
        >>"${logfile}.${test_number}" 2>&1 || return $?
    check_written "$size" || return $?
    check_read "$size" || return $?
}
348
# Sequential read on a mix of empty and full zones.
# With $is_zbd set, the first four sequential zones are reset. The last two
# of them are then written, and a sequential read over all four must return
# half of the range.
test15() {
    local zone rd_off rd_size wr_off wr_size

    for zone in 0 1 2 3; do
        [ -n "$is_zbd" ] &&
            reset_zone "$dev" \
                $((first_sequential_zone_sector + zone * sectors_per_zone))
    done
    wr_off=$(((first_sequential_zone_sector + 2 * sectors_per_zone) * 512))
    wr_size=$((2 * zone_size))
    rd_off=$((first_sequential_zone_sector * 512))
    rd_size=$((4 * zone_size))
    write_and_run_one_fio_job "${wr_off}" "${wr_size}" \
        "$(ioengine "psync")" --rw=read --bs=$((zone_size / 16)) \
        --zonemode=zbd --zonesize="${zone_size}" --offset="$rd_off" \
        --size="$rd_size" >>"${logfile}.${test_number}" 2>&1 ||
        return $?
    check_written "$wr_size" || return $?
    check_read $((rd_size / 2))
}
371
# Random read on a mix of empty and full zones.
# With $is_zbd set, the first four sequential zones are reset. The last two
# of them are then written, and a random read job sized to all four zones
# must report that full size as read.
test16() {
    local zone rd_off rd_size wr_off wr_size

    for zone in 0 1 2 3; do
        [ -n "$is_zbd" ] &&
            reset_zone "$dev" \
                $((first_sequential_zone_sector + zone * sectors_per_zone))
    done
    wr_off=$(((first_sequential_zone_sector + 2 * sectors_per_zone) * 512))
    wr_size=$((2 * zone_size))
    rd_off=$((first_sequential_zone_sector * 512))
    rd_size=$((4 * zone_size))
    write_and_run_one_fio_job "${wr_off}" "${wr_size}" \
        "$(ioengine "libaio")" --iodepth=64 --rw=randread --bs=16K \
        --zonemode=zbd --zonesize="${zone_size}" --offset="$rd_off" \
        --size="$rd_size" >>"${logfile}.${test_number}" 2>&1 || return $?
    check_written "$wr_size" || return $?
    check_read "$rd_size"
}
393
# Random reads and writes in the last zone.
# The last zone is first filled so that reads from it succeed. The randrw
# job then runs two loops over it, so bytes read plus bytes written must
# equal twice the size of the range.
test17() {
    local expected io off read size written

    off=$(((disk_size / zone_size - 1) * zone_size))
    size=$((disk_size - off))
    expected=$((size * 2))
    # Overwrite the last zone to avoid that reading from that zone fails.
    if [ -n "$is_zbd" ]; then
        reset_zone "$dev" $((off / 512)) || return $?
    fi
    run_one_fio_job "$(ioengine "psync")" --rw=write --offset="$off" \
        --zonemode=zbd --zonesize="${zone_size}" \
        --bs="$zone_size" --size="$zone_size" \
        >>"${logfile}.${test_number}" 2>&1 || return $?
    check_written "$zone_size" || return $?
    run_one_fio_job "$(ioengine "libaio")" --iodepth=8 --rw=randrw --bs=4K \
        --zonemode=zbd --zonesize="${zone_size}" \
        --offset="$off" --loops=2 --norandommap=1 \
        >>"${logfile}.${test_number}" 2>&1 || return $?
    written=$(fio_written <"${logfile}.${test_number}")
    read=$(fio_read <"${logfile}.${test_number}")
    io=$((written + read))
    # Log the value that is actually compared against (two loops).
    echo "Total number of bytes read and written: $io <> $expected" \
        >>"${logfile}.${test_number}"
    [ "$io" = "$expected" ]
}
420
# Out-of-range zone reset threshold and frequency parameters.
# test18: a negative --zone_reset_threshold must be rejected.
test18() {
    run_fio_on_seq --zone_reset_threshold=-1 2>&1 |
        tee -a "${logfile}.${test_number}" |
        grep -q 'value out of range'
}
427
# A --zone_reset_threshold of 2 must be rejected as out of range.
test19() {
    run_fio_on_seq --zone_reset_threshold=2 2>&1 |
        tee -a "${logfile}.${test_number}" |
        grep -q 'value out of range'
}
433
# A list value for --zone_reset_threshold must be rejected.
test20() {
    run_fio_on_seq --zone_reset_threshold=.4:.6 2>&1 |
        tee -a "${logfile}.${test_number}" |
        grep -q 'the list exceeding max length'
}
439
# A negative --zone_reset_frequency must be rejected as out of range.
test21() {
    run_fio_on_seq --zone_reset_frequency=-1 2>&1 |
        tee -a "${logfile}.${test_number}" |
        grep -q 'value out of range'
}
445
# A --zone_reset_frequency of 2 must be rejected as out of range.
test22() {
    run_fio_on_seq --zone_reset_frequency=2 2>&1 |
        tee -a "${logfile}.${test_number}" |
        grep -q 'value out of range'
}
451
# A list value for --zone_reset_frequency must be rejected.
test23() {
    run_fio_on_seq --zone_reset_frequency=.4:.6 2>&1 |
        tee -a "${logfile}.${test_number}" |
        grep -q 'the list exceeding max length'
}
457
# Write one zone nine times with zone reset frequency/threshold options set
# and check both the amount written and the number of zone resets (8 to 10).
test24() {
    local blk passes=9 span

    span=$((zone_size))
    blk=$(min $((256*1024)) "$zone_size")
    run_fio_on_seq "$(ioengine "psync")" --rw=write --bs="$blk" \
        --size="$span" --loops="$passes" \
        --zone_reset_frequency=.01 --zone_reset_threshold=.90 \
        >> "${logfile}.${test_number}" 2>&1 || return $?
    check_written $((span * passes)) || return $?
    check_reset_count -eq 8 ||
        check_reset_count -eq 9 ||
        check_reset_count -eq 10
}
471
# Multiple non-overlapping sequential write jobs for the same drive.
# Sixteen jobs each write one of the first sixteen sequential zones.
test25() {
    local i opts=()

    for ((i=0;i<16;i++)); do
        [ -n "$is_zbd" ] &&
            reset_zone "$dev" $((first_sequential_zone_sector + i*sectors_per_zone))
    done
    for ((i=0;i<16;i++)); do
        opts+=("--name=job$i" "--filename=$dev" "--thread=1" "--direct=1")
        opts+=("--offset=$((first_sequential_zone_sector*512 + zone_size*i))")
        opts+=("--size=$zone_size" "$(ioengine "psync")" "--rw=write" "--bs=16K")
        opts+=("--zonemode=zbd" "--zonesize=${zone_size}" "--group_reporting=1")
        # Quoted so that each extra option stays a single word.
        opts+=("${var_opts[@]}")
    done
    run_fio "${opts[@]}" >> "${logfile}.${test_number}" 2>&1 || return $?
}
489
# Write the first sequential zone four times with data verification, using
# fio access pattern $1 (e.g. write or randwrite), and check that four zones
# worth of data were written.
write_to_first_seq_zone() {
    local passes=4 seed
    local -a args

    seed=$(((RANDOM << 16) | RANDOM))
    args=(--name="$dev" --filename="$dev" "$(ioengine "psync")" --rw="$1"
          --thread=1 --do_verify=1 --verify=md5 --direct=1 --bs=4K
          --offset=$((first_sequential_zone_sector * 512))
          "--size=$zone_size" --loops="$passes" --randseed="$seed"
          --zonemode=zbd --zonesize="${zone_size}" --group_reporting=1
          --gtod_reduce=1)
    run_fio "${args[@]}" >> "${logfile}.${test_number}" 2>&1 || return $?
    check_written $((passes * zone_size))
}
502
# Overwrite the first sequential zone four times sequentially.
test26() {
    local pattern=write

    write_to_first_seq_zone "$pattern"
}
507
# Overwrite the first sequential zone four times using random writes.
test27() {
    local pattern=randwrite

    write_to_first_seq_zone "$pattern"
}
512
# Multiple overlapping random write jobs for the same drive.
# All jobs target the same zone; the zone reset count must be either the
# number of jobs or one less.
test28() {
    local i jobs=16 off opts

    off=$((first_sequential_zone_sector * 512 + 64 * zone_size))
    [ -n "$is_zbd" ] && reset_zone "$dev" $((off / 512))
    opts=("--debug=zbd")
    for ((i=0;i<jobs;i++)); do
        opts+=("--name=job$i" "--filename=$dev" "--offset=$off" "--bs=16K")
        opts+=("--size=$zone_size" "$(ioengine "psync")" "--rw=randwrite")
        opts+=("--thread=1" "--direct=1" "--zonemode=zbd")
        opts+=("--zonesize=${zone_size}" "--group_reporting=1")
        # Quoted so that each extra option stays a single word.
        opts+=("${var_opts[@]}")
    done
    run_fio "${opts[@]}" >> "${logfile}.${test_number}" 2>&1 || return $?
    check_written $((jobs * zone_size)) || return $?
    check_reset_count -eq "$jobs" ||
        check_reset_count -eq $((jobs - 1)) ||
        return $?
}
533
# Multiple overlapping random write jobs for the same drive and with a limited
# number of open zones.
test29() {
    # size is local so that it no longer leaks into the global scope.
    local i jobs=16 off size opts=()

    off=$((first_sequential_zone_sector * 512 + 64 * zone_size))
    size=$((16*zone_size))
    [ -n "$is_zbd" ] && reset_zone "$dev" $((off / 512))
    opts=("--debug=zbd")
    for ((i=0;i<jobs;i++)); do
        opts+=("--name=job$i" "--filename=$dev" "--offset=$off" "--bs=16K")
        opts+=("--size=$size" "--io_size=$zone_size" "--thread=1")
        opts+=("$(ioengine "psync")" "--rw=randwrite" "--direct=1")
        opts+=("--max_open_zones=4" "--group_reporting=1")
        opts+=("--zonemode=zbd" "--zonesize=${zone_size}")
        # Quoted so that each extra option stays a single word.
        opts+=("${var_opts[@]}")
    done
    run_fio "${opts[@]}" >> "${logfile}.${test_number}" 2>&1 || return $?
    check_written $((jobs * zone_size)) || return $?
}
554
# Random reads and writes across the entire disk for 30s.
# The result is the exit status of fio.
test30() {
    local start blk
    local -a args

    start=$((first_sequential_zone_sector * 512))
    blk=$(max $((zone_size / 128)) "$logical_block_size")
    args=("$(ioengine "libaio")" --iodepth=8 --rw=randrw --bs="$blk"
          --zonemode=zbd --zonesize="${zone_size}" --offset="$start"
          --loops=2 --time_based --runtime=30s --norandommap=1)
    run_one_fio_job "${args[@]}" >>"${logfile}.${test_number}" 2>&1
}
566
# Random reads across all sequential zones for 30s. This is not only a fio
# test but also allows to verify the performance of a drive.
test31() {
    local bs inc nz off opts size

    # Start with writing 128 KB to 128 sequential zones.
    bs=128K
    nz=128
    # shellcheck disable=SC2017
    inc=$(((disk_size - (first_sequential_zone_sector * 512)) / (nz * zone_size) * zone_size))
    # With fewer than $nz sequential zones the stride rounds down to 0 and the
    # loop below would never advance; fall back to visiting every zone.
    if [ "$inc" -le 0 ]; then
        inc=$zone_size
    fi
    opts=()
    for ((off = first_sequential_zone_sector * 512; off < disk_size;
          off += inc)); do
        opts+=("--name=$dev" "--filename=$dev" "--offset=$off" "--io_size=$bs")
        opts+=("--bs=$bs" "--size=$zone_size" "$(ioengine "libaio")")
        opts+=("--rw=write" "--direct=1" "--thread=1" "--stats=0")
        opts+=("--zonemode=zbd" "--zonesize=${zone_size}")
        # Quoted so that each extra option stays a single word.
        opts+=("${var_opts[@]}")
    done
    # The preparation step calls fio directly; its exit status is not checked.
    "$(dirname "$0")/../../fio" "${opts[@]}" >> "${logfile}.${test_number}" 2>&1
    # Next, run the test.
    off=$((first_sequential_zone_sector * 512))
    size=$((disk_size - off))
    opts=("--name=$dev" "--filename=$dev" "--offset=$off" "--size=$size")
    opts+=("--bs=$bs" "$(ioengine "psync")" "--rw=randread" "--direct=1")
    opts+=("--thread=1" "--time_based" "--runtime=30" "--zonemode=zbd")
    opts+=("--zonesize=${zone_size}")
    run_fio "${opts[@]}" >> "${logfile}.${test_number}" 2>&1 || return $?
}
597
# Random writes across all sequential zones. This is not only a fio test but
# also allows to verify the performance of a drive.
test32() {
    local start span
    local -a args

    start=$((first_sequential_zone_sector * 512))
    span=$((disk_size - start))
    args=("--name=$dev" "--filename=$dev" "--offset=$start" "--size=$span"
          "--bs=128K" "$(ioengine "psync")" "--rw=randwrite" "--direct=1"
          "--thread=1" "--time_based" "--runtime=30"
          "--max_open_zones=$max_open_zones" "--zonemode=zbd"
          "--zonesize=${zone_size}")
    run_fio "${args[@]}" >> "${logfile}.${test_number}" 2>&1
}
612
# Write to sequential zones with a block size that is not a divisor of the
# zone size.
# The expected amount written is io_size rounded up to a multiple of the
# block size.
test33() {
    local blk span total

    span=$((2 * zone_size))
    total=$((5 * zone_size))
    blk=$((3 * zone_size / 4))
    run_fio_on_seq "$(ioengine "psync")" --iodepth=1 --rw=write \
        --size="$span" --io_size="$total" --bs="$blk" \
        >> "${logfile}.${test_number}" 2>&1 || return $?
    check_written $(((total + blk - 1) / blk * blk))
}
626
# Write to sequential zones with a block size that is not a divisor of the
# zone size and with data verification enabled.
# fio is expected to fail with a 'not a divisor of' message.
test34() {
    local span=$((2 * zone_size))

    if run_fio_on_seq "$(ioengine "psync")" --iodepth=1 --rw=write \
        --size="$span" --do_verify=1 --verify=md5 \
        --bs=$((3 * zone_size / 4)) \
        >> "${logfile}.${test_number}" 2>&1; then
        return 1
    fi
    grep -q 'not a divisor of' "${logfile}.${test_number}"
}
638
# Test 1/4 for the I/O boundary rounding code: $size < $zone_size.
# The range starts one sector into the first sequential zone and ends one
# sector before its end; fio is expected to fail.
test35() {
    local blk start span

    start=$(((first_sequential_zone_sector + 1) * 512))
    span=$((zone_size - 2 * 512))
    blk=$((zone_size / 4))
    if run_one_fio_job --offset="$start" --size="$span" "$(ioengine "psync")" \
        --iodepth=1 --rw=write --do_verify=1 --verify=md5 \
        --bs="$blk" --zonemode=zbd --zonesize="${zone_size}" \
        >> "${logfile}.${test_number}" 2>&1; then
        return 1
    fi
    grep -q 'io_size must be at least one zone' "${logfile}.${test_number}"
}
652
# Test 2/4 for the I/O boundary rounding code: $size < $zone_size.
# The range starts at the first sequential zone and ends one sector before
# its end; fio is expected to fail.
test36() {
    local blk start span

    start=$(((first_sequential_zone_sector) * 512))
    span=$((zone_size - 512))
    blk=$((zone_size / 4))
    if run_one_fio_job --offset="$start" --size="$span" "$(ioengine "psync")" \
        --iodepth=1 --rw=write --do_verify=1 --verify=md5 \
        --bs="$blk" --zonemode=zbd --zonesize="${zone_size}" \
        >> "${logfile}.${test_number}" 2>&1; then
        return 1
    fi
    grep -q 'io_size must be at least one zone' "${logfile}.${test_number}"
}
666
# Test 3/4 for the I/O boundary rounding code: $size > $zone_size.
# The range starts one sector before the first sequential zone (or at 0) and
# is two sectors longer than a zone; exactly one zone must be written. The
# exit status of fio itself is not checked.
test37() {
    local blk start span

    start=0
    if [ "$first_sequential_zone_sector" != 0 ]; then
        start=$(((first_sequential_zone_sector - 1) * 512))
    fi
    span=$((zone_size + 2 * 512))
    blk=$((zone_size / 4))
    run_one_fio_job --offset="$start" --size="$span" "$(ioengine "psync")" \
        --iodepth=1 --rw=write --do_verify=1 --verify=md5 \
        --bs="$blk" --zonemode=zbd --zonesize="${zone_size}" \
        >> "${logfile}.${test_number}" 2>&1
    check_written $((zone_size))
}
684
# Test 4/4 for the I/O boundary rounding code: $offset > $disk_size - $zone_size
# A single logical block at the very end of the disk is targeted; fio is
# expected to fail.
test38() {
    local blk start span

    span=$((logical_block_size))
    start=$((disk_size - logical_block_size))
    blk=$((logical_block_size))
    if run_one_fio_job --offset="$start" --size="$span" "$(ioengine "psync")" \
        --iodepth=1 --rw=write --do_verify=1 --verify=md5 \
        --bs="$blk" --zonemode=zbd --zonesize="${zone_size}" \
        >> "${logfile}.${test_number}" 2>&1; then
        return 1
    fi
    grep -q 'io_size must be at least one zone' "${logfile}.${test_number}"
}
698
# Read one block from a block device.
# Extra fio options come from "$@". fio's combined output goes to stdout and
# is also appended to the log of the current test.
read_one_block() {
    local blk=$((logical_block_size))

    run_one_fio_job --rw=read "$(ioengine "psync")" --bs="$blk" --size="$blk" \
        "$@" 2>&1 |
        tee -a "${logfile}.${test_number}"
}
707
# Check whether fio accepts --zonemode=none for zoned block devices.
# Trivially passes when $is_zbd is empty.
test39() {
    if [ -z "$is_zbd" ]; then
        return 0
    fi
    read_one_block --zonemode=none >/dev/null || return $?
    check_read $((logical_block_size))
}
714
# Check whether fio accepts --zonemode=strided for zoned block devices.
# Without --zonesize fio must complain; with it, one block must be read.
# Trivially passes when $is_zbd is empty.
test40() {
    local blk

    blk=$((logical_block_size))
    if [ -z "$is_zbd" ]; then
        return 0
    fi
    read_one_block --zonemode=strided |
        grep -q 'fio: --zonesize must be specified when using --zonemode=strided' ||
        return $?
    read_one_block --zonemode=strided --zonesize="$blk" >/dev/null || return $?
    check_read "$blk"
}
727
# Check whether fio checks the zone size for zoned block devices.
# Trivially passes when $is_zbd is empty.
test41() {
    if [ -z "$is_zbd" ]; then
        return 0
    fi
    read_one_block --zonemode=zbd --zonesize=$((2 * zone_size)) |
        grep -q 'job parameter zonesize.*does not match disk zone size'
}
734
# Check whether fio handles --zonesize=0 correctly for regular block devices.
# Trivially passes when $is_zbd is set.
test42() {
    if [ -n "$is_zbd" ]; then
        return 0
    fi
    read_one_block --zonemode=zbd --zonesize=0 |
        grep -q 'Specifying the zone size is mandatory for regular block devices with --zonemode=zbd'
}
741
# Check whether fio handles --zonesize=1 correctly for regular block devices.
# Trivially passes when $is_zbd is set.
test43() {
    if [ -n "$is_zbd" ]; then
        return 0
    fi
    read_one_block --zonemode=zbd --zonesize=1 |
        grep -q 'zone size must be at least 512 bytes for --zonemode=zbd'
}
748
# Check whether fio handles --zonemode=none --zonesize=1 correctly.
# fio must report that the two options are incompatible.
test44() {
    local expected='fio: --zonemode=none and --zonesize are not compatible'

    read_one_block --zonemode=none --zonesize=1 | grep -q "$expected"
}
754
# Random write without --zonemode=zbd to the first sequential zone: fio must
# print its hint to consider --zonemode=zbd. Trivially passes when $is_zbd is
# empty.
test45() {
    local blk

    if [ -z "$is_zbd" ]; then
        return 0
    fi
    blk=$((logical_block_size))
    run_one_fio_job "$(ioengine "psync")" --iodepth=1 --rw=randwrite \
        --bs="$blk" \
        --offset=$((first_sequential_zone_sector * 512)) \
        --size="$zone_size" --do_verify=1 --verify=md5 2>&1 |
        tee -a "${logfile}.${test_number}" |
        grep -q "fio: first I/O failed. If .* is a zoned block device, consider --zonemode=zbd"
}
766
bc596cbc
DLM
# Random write to sequential zones, libaio, 8 jobs, queue depth 64 per job
# Every job writes four zones, so eight times that amount must be written.
test46() {
    local per_job=$((4 * zone_size))
    local -a args

    args=("$(ioengine "libaio")" --iodepth=64 --rw=randwrite --bs=4K
          --group_reporting=1 --numjobs=8)
    run_fio_on_seq "${args[@]}" >> "${logfile}.${test_number}" 2>&1 || return $?
    check_written $((per_job * 8))
}
777
4d37720a
DLM
# Check whether fio handles --zonemode=zbd --zoneskip=1 correctly.
# fio is expected to fail with a message about the zoneskip value. Trivially
# passes when $is_zbd is empty.
test47() {
    local blk

    if [ -z "$is_zbd" ]; then
        return 0
    fi
    blk=$((logical_block_size))
    if run_one_fio_job "$(ioengine "psync")" --rw=write --bs="$blk" \
        --zonemode=zbd --zoneskip=1 \
        >> "${logfile}.${test_number}" 2>&1; then
        return 1
    fi
    grep -q 'zoneskip 1 is not a multiple of the device zone size' "${logfile}.${test_number}"
}
789
3bd2078b
NA
# Multiple overlapping random write jobs for the same drive and with a
# limited number of open zones. This is similar to test29, but uses libaio
# to stress test zone locking.
# fio is invoked directly (not through run_fio) under a 45 s timeout that
# kills it with SIGKILL, so a hang is reported as a failure.
test48() {
    # fio is local so that it no longer leaks into the global scope. The
    # former "size" assignment was never used and has been dropped.
    local i jobs=16 off opts=() fio

    off=$((first_sequential_zone_sector * 512 + 64 * zone_size))
    [ -n "$is_zbd" ] && reset_zone "$dev" $((off / 512))
    opts=("--aux-path=/tmp" "--allow_file_create=0" "--significant_figures=10")
    opts+=("--debug=zbd")
    opts+=("$(ioengine "libaio")" "--rw=randwrite" "--direct=1")
    opts+=("--time_based" "--runtime=30")
    opts+=("--zonemode=zbd" "--zonesize=${zone_size}")
    opts+=("--max_open_zones=4")
    for ((i=0;i<jobs;i++)); do
        opts+=("--name=job$i" "--filename=$dev" "--offset=$off" "--bs=16K")
        opts+=("--io_size=$zone_size" "--iodepth=256" "--thread=1")
        opts+=("--group_reporting=1")
    done

    fio=$(dirname "$0")/../../fio

    { echo; echo "fio ${opts[*]}"; echo; } >>"${logfile}.${test_number}"

    timeout -v -s KILL 45s \
        "${dynamic_analyzer[@]}" "$fio" "${opts[@]}" \
        >> "${logfile}.${test_number}" 2>&1 || return $?
}
819
191d1d1a
BVA
# Defaults for the settings controlled by command-line options.
tests=()
dynamic_analyzer=()
reset_all_zones=
use_libzbc=
zbd_debug=

# Consume leading options (arguments that start with '-').
while [ "${1#-}" != "$1" ]; do
    case "$1" in
        -d) dynamic_analyzer=(valgrind "--read-var-info=yes" "--tool=drd"
                              "--show-confl-seg=no");
            shift;;
        -e) dynamic_analyzer=(valgrind "--read-var-info=yes" "--tool=helgrind");
            shift;;
        -l) use_libzbc=1; shift;;
        -r) reset_all_zones=1; shift;;
        -t) # -t needs a test number after it.
            if [ $# -lt 2 ]; then
                usage
                exit 1
            fi
            tests+=("$2"); shift; shift;;
        -v) dynamic_analyzer=(valgrind "--read-var-info=yes");
            shift;;
        -z) zbd_debug=1; shift;;
        --) shift; break;;
        # Without this arm an unknown option is never shifted away and the
        # loop spins forever.
        *) usage; exit 1;;
    esac
done

# Exactly one positional argument (the device node) must remain.
if [ $# != 1 ]; then
    usage
    exit 1
fi
847
# Load the helper functions that live next to this script.
# shellcheck source=functions
source "$(dirname "$0")/functions" || exit $?

# Options appended to every fio invocation made through run_fio.
var_opts=()
if [ -n "$zbd_debug" ]; then
    var_opts+=("--debug=zbd")
fi
dev=$1
realdev=$(readlink -f "$dev")
basename=$(basename "$realdev")

# Work out the device geometry: disk_size and zone_size (bytes),
# logical_block_size, first_sequential_zone_sector and sectors_per_zone
# (512-byte sectors), max_open_zones, and is_zbd.
if [[ -b "$realdev" ]]; then
    major=$((0x$(stat -L -c '%t' "$realdev"))) || exit $?
    minor=$((0x$(stat -L -c '%T' "$realdev"))) || exit $?
    disk_size=$(($(<"/sys/dev/block/$major:$minor/size")*512))

    # When the target is a partition device, get basename of its
    # holder device to access sysfs path of the holder device
    if [[ -r "/sys/dev/block/$major:$minor/partition" ]]; then
        realsysfs=$(readlink "/sys/dev/block/$major:$minor")
        basename=$(basename "${realsysfs%/*}")
    fi
    logical_block_size=$(<"/sys/block/$basename/queue/logical_block_size")
    case "$(<"/sys/class/block/$basename/queue/zoned")" in
        host-managed|host-aware)
            is_zbd=true
            if ! result=($(first_sequential_zone "$dev")); then
                echo "Failed to determine first sequential zone"
                exit 1
            fi
            first_sequential_zone_sector=${result[0]}
            sectors_per_zone=${result[1]}
            zone_size=$((sectors_per_zone * 512))
            if ! max_open_zones=$(max_open_zones "$dev"); then
                echo "Failed to determine maximum number of open zones"
                exit 1
            fi
            set_io_scheduler "$basename" deadline || exit $?
            if [ -n "$reset_all_zones" ]; then
                reset_zone "$dev" -1
            fi
            ;;
        *)
            # Not a zoned device: emulate zones of at least 64 KiB.
            # NOTE(review): this masks a byte count with (block size - 1) and
            # stores the result as a sector number; for an aligned disk size
            # that is 0. Confirm whether "& ~(...)" and a division by 512
            # were intended. Behaviour is left unchanged here.
            first_sequential_zone_sector=$(((disk_size / 2) &
                                            (logical_block_size - 1)))
            zone_size=$(max 65536 "$logical_block_size")
            sectors_per_zone=$((zone_size / 512))
            max_open_zones=128
            set_io_scheduler "$basename" none || exit $?
            ;;
    esac
elif [[ -c "$realdev" ]]; then
    # For an SG node, we must have libzbc option specified
    if [[ -z "$use_libzbc" ]]; then
        echo "Character device files can only be used with -l (libzbc) option"
        exit 1
    fi

    # Test the predicate's exit status directly instead of executing
    # whatever it might print.
    if ! is_zbc "$dev"; then
        echo "Device is not a ZBC disk"
        exit 1
    fi
    is_zbd=true

    # A plain scalar is enough here; the value is a single number.
    if ! disk_size=$(( $(zbc_disk_sectors "$dev") * 512 )); then
        echo "Failed to determine disk size"
        exit 1
    fi
    if ! logical_block_size=($(zbc_logical_block_size "$dev")); then
        echo "Failed to determine logical block size"
        exit 1
    fi
    if ! result=($(first_sequential_zone "$dev")); then
        echo "Failed to determine first sequential zone"
        exit 1
    fi
    first_sequential_zone_sector=${result[0]}
    sectors_per_zone=${result[1]}
    zone_size=$((sectors_per_zone * 512))
    if ! max_open_zones=$(max_open_zones "$dev"); then
        echo "Failed to determine maximum number of open zones"
        exit 1
    fi
    if [ -n "$reset_all_zones" ]; then
        reset_zone "$dev" -1
    fi
else
    # Without this branch the geometry variables stay unset and every test
    # runs with empty values.
    echo "$dev is neither a block device nor a character device"
    exit 1
fi
935
echo -n "First sequential zone starts at sector $first_sequential_zone_sector;"
echo " zone size: $((zone_size >> 20)) MB"

# Without -t, run every function named test<N>, in numeric order. Only names
# that are exactly "test" followed by digits are accepted, so helpers that
# merely contain "test" in their name are not picked up.
if [ "${#tests[@]}" = 0 ]; then
    readarray -t tests < <(declare -F |
        sed -n 's/^declare -f[a-z]* test\([0-9][0-9]*\)$/\1/p' |
        sort -n)
fi
943
# Per-test logs are written to <script>.log.<test number>.
logfile=$0.log

passed=0
failed=0
# Colour the PASS/FAIL status only when stdout is a terminal.
if [ -t 1 ]; then
    red="\e[1;31m"
    green="\e[1;32m"
    end="\e[m"
else
    red=""
    green=""
    end=""
fi
rc=0

# On SIGINT, let the running test return and stop after recording its result.
intr=0
trap 'intr=1' SIGINT

for test_number in "${tests[@]}"; do
    rm -f "${logfile}.${test_number}"
    echo -n "Running test $(printf "%02d" "$test_number") ... "
    # Call the test function by name; no eval is needed for that.
    if "test$test_number"; then
        status="PASS"
        cc_status="${green}${status}${end}"
        ((passed++))
    else
        status="FAIL"
        cc_status="${red}${status}${end}"
        ((failed++))
        rc=1
    fi
    echo -e "$cc_status"
    echo "$status" >> "${logfile}.${test_number}"
    [ "$intr" -ne 0 ] && exit 1
done

echo "$passed tests passed"
if [ "$failed" -gt 0 ]; then
    echo " and $failed tests failed"
fi
exit $rc