t/zbd: Add write_and_run_one_fio_job() helper function
[fio.git] / t / zbd / test-zbd-support
CommitLineData
191d1d1a
BVA
1#!/bin/bash
2#
3# Copyright (C) 2018 Western Digital Corporation or its affiliates.
4#
5# This file is released under the GPL.
6
7usage() {
6dcb098d 8 echo "Usage: $(basename "$0") [-d] [-e] [-l] [-r] [-v] [-t <test>] [-z] <SMR drive device node>"
191d1d1a
BVA
9}
10
# Print the larger of the two integers $1 and $2.
max() {
    if [ "$1" -gt "$2" ]; then
        echo "$1"
    else
        echo "$2"
    fi
}
18
# Print the smaller of the two integers $1 and $2.
min() {
    if [ "$1" -lt "$2" ]; then
        echo "$1"
    else
        echo "$2"
    fi
}
26
6dcb098d
DF
# Print the fio --ioengine option to use (without a trailing newline).
# When $use_libzbc is non-empty the libzbc engine is always selected;
# otherwise the engine named by $1 is used.
ioengine() {
    if [ -n "$use_libzbc" ]; then
        echo -n "--ioengine=libzbc"
    else
        echo -n "--ioengine=$1"
    fi
}
34
191d1d1a
BVA
# Select I/O scheduler $2 for block device $1 (a name under /sys/block).
# The scheduler name is translated between its legacy and multiqueue
# spelling depending on whether /sys/block/$1/mq exists.
# Returns non-zero if the device has no sysfs entry or the write fails.
set_io_scheduler() {
    local dev=$1 sched=$2

    [ -e "/sys/block/$dev" ] || return $?
    if [ -e "/sys/block/$dev/mq" ]; then
        # Multiqueue block layer: use the blk-mq scheduler names.
        case "$sched" in
            noop)     sched=none ;;
            deadline) sched=mq-deadline ;;
        esac
    else
        # Legacy block layer: use the single-queue scheduler names.
        case "$sched" in
            none)        sched=noop ;;
            mq-deadline) sched=deadline ;;
        esac
    fi

    echo "$sched" >"/sys/block/$dev/queue/scheduler"
}
53
# Succeed if the number of bytes read, as extracted from the current test's
# log file by fio_read (defined outside this file section), equals $1.
# The comparison is also appended to the log file.
check_read() {
    local read

    read=$(fio_read <"${logfile}.${test_number}")
    echo "read: $read <> $1" >> "${logfile}.${test_number}"
    [ "$read" = "$1" ]
}
61
# Succeed if the number of bytes written, as extracted from the current
# test's log file by fio_written (defined outside this file section),
# equals $1. The comparison is also appended to the log file.
check_written() {
    local written

    written=$(fio_written <"${logfile}.${test_number}")
    echo "written: $written <> $1" >> "${logfile}.${test_number}"
    [ "$written" = "$1" ]
}
69
# Compare the reset count from the log file with reset count $2 using operator
# $1 (=, -ge, -gt, -le, -lt). The comparison is also appended to the log file.
check_reset_count() {
    local reset_count

    reset_count=$(fio_reset_count <"${logfile}.${test_number}")
    echo "reset_count: test $reset_count $1 $2" >> "${logfile}.${test_number}"
    # The operator is an ordinary word, so no eval is needed to apply it.
    [ "$reset_count" "$1" "$2" ]
}
79
# Whether or not $1 (/dev/...) is a SCSI device.
# Succeeds if the device's basename appears as a block device below
# /sys/class/scsi_device/*/device/block/.
is_scsi_device() {
    local d f

    # Use the argument rather than the global $dev so the function does
    # what its description says.
    d=$(basename "$1")
    for f in /sys/class/scsi_device/*/device/block/"$d"; do
        # An unmatched glob stays literal, hence the existence check.
        [ -e "$f" ] && return 0
    done
    return 1
}
90
# Run the fio binary located two directories above this script with a fixed
# set of global options, followed by the caller's arguments and the options
# in the global array var_opts. The resulting command line is appended to the
# current test's log file first. If dynamic_analyzer is non-empty, fio is run
# under that command. Returns fio's (or the analyzer's) exit status.
run_fio() {
    local fio opts

    fio=$(dirname "$0")/../../fio

    opts=("--max-jobs=16" "--aux-path=/tmp" "--allow_file_create=0" \
          "--significant_figures=10" "$@")
    # Quoted so that each element stays a single word.
    opts+=("${var_opts[@]}")
    { echo; echo "fio ${opts[*]}"; echo; } >>"${logfile}.${test_number}"

    "${dynamic_analyzer[@]}" "$fio" "${opts[@]}"
}
103
# Run a single fio job against $dev with the caller's options plus a random
# 32-bit-wide seed, --thread=1 and --direct=1.
run_one_fio_job() {
    local r

    # Two 15-bit $RANDOM values combined into one seed.
    r=$(((RANDOM << 16) | RANDOM))
    run_fio --name="$dev" --filename="$dev" "$@" --randseed="$r" \
        --thread=1 --direct=1
}
111
8f601b44
SK
# Run two fio jobs against $dev in one invocation: first a sequential write
# job ("write_job") covering $2 bytes starting at byte offset $1, then a
# second job built from the remaining arguments that waits for the write job
# to finish (--wait_for).
write_and_run_one_fio_job() {
    local r
    local write_offset="${1}"
    local write_size="${2}"

    shift 2
    r=$(((RANDOM << 16) | RANDOM))
    run_fio --filename="$dev" --randseed="$r" --name="write_job" --rw=write \
        "$(ioengine "psync")" --bs="${logical_block_size}" \
        --zonemode=zbd --zonesize="${zone_size}" --thread=1 --direct=1 \
        --offset="${write_offset}" --size="${write_size}" \
        --name="$dev" --wait_for="write_job" "$@" --thread=1 --direct=1
}
125
191d1d1a
BVA
# Run fio on the first four sequential zones of the disk.
# The zone size is only passed explicitly when $is_zbd is empty. Caller
# arguments come last, so they can override --offset and --size.
run_fio_on_seq() {
    local opts=()

    opts+=("--offset=$((first_sequential_zone_sector * 512))")
    opts+=("--size=$((4 * zone_size))" "--zonemode=zbd")
    if [ -z "$is_zbd" ]; then
        opts+=("--zonesize=${zone_size}")
    fi
    run_one_fio_job "${opts[@]}" "$@"
}
137
# Check whether buffered writes are refused.
# For a zoned device fio must print the "direct I/O is mandatory" message;
# for a regular device it must not. fio exit codes other than 0 and 1 are
# returned as a failure.
test1() {
    run_fio --name=job1 --filename="$dev" --rw=write --direct=0 --bs=4K \
        "$(ioengine "psync")" --size="${zone_size}" --thread=1 \
        --zonemode=zbd --zonesize="${zone_size}" 2>&1 |
        tee -a "${logfile}.${test_number}" |
        grep -q 'Using direct I/O is mandatory for writing to ZBD drives'
    # Must directly follow the pipeline: PIPESTATUS is reset by any command.
    local fio_rc=${PIPESTATUS[0]} grep_rc=${PIPESTATUS[2]}
    case "$fio_rc" in
        0|1) ;;
        *) return "$fio_rc" ;;
    esac
    if [ -n "$is_zbd" ]; then
        [ "$grep_rc" = 0 ]
    else
        [ "$grep_rc" != 0 ]
    fi
}
156
# Block size exceeds zone size.
# fio must exit successfully without reporting any write statistics.
test2() {
    local bs off opts=()

    off=$(((first_sequential_zone_sector + 2 * sectors_per_zone) * 512))
    bs=$((2 * zone_size))
    opts+=("$(ioengine "psync")")
    opts+=("--name=job1" "--filename=$dev" "--rw=write" "--direct=1")
    opts+=("--zonemode=zbd" "--offset=$off" "--bs=$bs" "--size=$bs")
    if [ -z "$is_zbd" ]; then
        opts+=("--zonesize=${zone_size}")
    fi
    run_fio "${opts[@]}" >> "${logfile}.${test_number}" 2>&1 || return $?
    ! grep -q 'WRITE:' "${logfile}.${test_number}"
}
172
# Run fio against an empty zone. This causes fio to report "No I/O performed".
# Passes when fio succeeds and the log contains no read statistics.
test3() {
    local off opts=() size

    off=$((first_sequential_zone_sector * 512 + 128 * zone_size))
    size=$((zone_size))
    [ -n "$is_zbd" ] && reset_zone "$dev" $((off / 512))
    opts+=("--name=$dev" "--filename=$dev" "--offset=$off" "--bs=4K")
    opts+=("--size=$size" "--zonemode=zbd")
    opts+=("$(ioengine "psync")" "--rw=read" "--direct=1" "--thread=1")
    if [ -z "$is_zbd" ]; then
        opts+=("--zonesize=${zone_size}")
    fi
    run_fio "${opts[@]}" >> "${logfile}.${test_number}" 2>&1 || return $?
    ! grep -q 'READ:' "${logfile}.${test_number}"
}
189
# Run fio with --read_beyond_wp=1 against an empty zone.
# One full zone must be reported as read.
test4() {
    local off opts=() size

    off=$((first_sequential_zone_sector * 512 + 129 * zone_size))
    size=$((zone_size))
    [ -n "$is_zbd" ] && reset_zone "$dev" $((off / 512))
    opts+=("--name=$dev" "--filename=$dev" "--offset=$off" "--bs=$size")
    opts+=("--size=$size" "--thread=1" "--read_beyond_wp=1")
    opts+=("$(ioengine "psync")" "--rw=read" "--direct=1" "--disable_lat=1")
    opts+=("--zonemode=zbd" "--zonesize=${zone_size}")
    run_fio "${opts[@]}" >> "${logfile}.${test_number}" 2>&1 || return $?
    check_read $size || return $?
}
204
# Sequential write to sequential zones.
# Four zones are written and verified, so both the written and the read
# byte counts must equal four zone sizes.
test5() {
    local size

    size=$((4 * zone_size))
    run_fio_on_seq "$(ioengine "psync")" --iodepth=1 --rw=write \
        --bs="$(max $((zone_size / 64)) "$logical_block_size")" \
        --do_verify=1 --verify=md5 \
        >>"${logfile}.${test_number}" 2>&1 || return $?
    check_written $size || return $?
    check_read $size || return $?
}
217
# Sequential read from sequential zones. Must be run after test5.
test6() {
    local size

    size=$((4 * zone_size))
    run_fio_on_seq "$(ioengine "psync")" --iodepth=1 --rw=read \
        --bs="$(max $((zone_size / 64)) "$logical_block_size")" \
        >>"${logfile}.${test_number}" 2>&1 || return $?
    check_read $size || return $?
}
228
# Random write to sequential zones, libaio, queue depth 1.
# Only one zone's worth of data is written and verified.
test7() {
    local size=$((zone_size))

    run_fio_on_seq "$(ioengine "libaio")" --iodepth=1 --rw=randwrite \
        --bs="$(min 16384 "${zone_size}")" \
        --do_verify=1 --verify=md5 --size="$size" \
        >>"${logfile}.${test_number}" 2>&1 || return $?
    check_written $size || return $?
    check_read $size || return $?
}
240
# Random write to sequential zones, libaio, queue depth 64.
test8() {
    local size

    size=$((4 * zone_size))
    run_fio_on_seq "$(ioengine "libaio")" --iodepth=64 --rw=randwrite \
        --bs="$(min 16384 "${zone_size}")" \
        --do_verify=1 --verify=md5 \
        >>"${logfile}.${test_number}" 2>&1 || return $?
    check_written $size || return $?
    check_read $size || return $?
}
253
# Random write to sequential zones, sg, queue depth 1.
# Passes without running fio when $dev is not a SCSI device.
test9() {
    local size

    if ! is_scsi_device "$dev"; then
        echo "$dev is not a SCSI device" >>"${logfile}.${test_number}"
        return 0
    fi

    size=$((4 * zone_size))
    run_fio_on_seq --ioengine=sg \
        --iodepth=1 --rw=randwrite --bs=16K \
        --do_verify=1 --verify=md5 \
        >>"${logfile}.${test_number}" 2>&1 || return $?
    check_written $size || return $?
    check_read $size || return $?
}
271
# Random write to sequential zones, sg, queue depth 64.
# Passes without running fio when $dev is not a SCSI device.
test10() {
    local size

    if ! is_scsi_device "$dev"; then
        echo "$dev is not a SCSI device" >>"${logfile}.${test_number}"
        return 0
    fi

    size=$((4 * zone_size))
    run_fio_on_seq --ioengine=sg \
        --iodepth=64 --rw=randwrite --bs=16K \
        --do_verify=1 --verify=md5 \
        >>"${logfile}.${test_number}" 2>&1 || return $?
    check_written $size || return $?
    check_read $size || return $?
}
289
# Random write to sequential zones, libaio, queue depth 64, random block size.
test11() {
    local size

    size=$((4 * zone_size))
    run_fio_on_seq "$(ioengine "libaio")" --iodepth=64 --rw=randwrite \
        --bsrange=4K-64K --do_verify=1 --verify=md5 \
        --debug=zbd >>"${logfile}.${test_number}" 2>&1 || return $?
    check_written $size || return $?
    check_read $size || return $?
}
301
# Random write to sequential zones, libaio, queue depth 64, max 1 open zone.
# The --size given here follows the one added by run_fio_on_seq on the
# command line.
test12() {
    local size

    size=$((8 * zone_size))
    run_fio_on_seq "$(ioengine "libaio")" --iodepth=64 --rw=randwrite --bs=16K \
        --max_open_zones=1 --size=$size --do_verify=1 --verify=md5 \
        --debug=zbd >>"${logfile}.${test_number}" 2>&1 || return $?
    check_written $size || return $?
    check_read $size || return $?
}
313
# Random write to sequential zones, libaio, queue depth 64, max 4 open zones.
test13() {
    local size

    size=$((8 * zone_size))
    run_fio_on_seq "$(ioengine "libaio")" --iodepth=64 --rw=randwrite --bs=16K \
        --max_open_zones=4 --size=$size --do_verify=1 --verify=md5 \
        --debug=zbd \
        >>"${logfile}.${test_number}" 2>&1 || return $?
    check_written $size || return $?
    check_read $size || return $?
}
326
# Random write to conventional zones.
# The job starts at offset 0 and needs 16 MiB in front of the first
# sequential zone; if that area is smaller the test passes without running.
test14() {
    local size

    size=$((16 * 2**20)) # 16 MiB
    if [ $size -gt $((first_sequential_zone_sector * 512)) ]; then
        echo "$dev does not have enough conventional zones" \
            >>"${logfile}.${test_number}"
        return 0
    fi
    run_one_fio_job "$(ioengine "libaio")" --iodepth=64 --rw=randwrite --bs=16K \
        --zonemode=zbd --zonesize="${zone_size}" --do_verify=1 \
        --verify=md5 --size=$size \
        >>"${logfile}.${test_number}" 2>&1 || return $?
    check_written $((size)) || return $?
    check_read $((size)) || return $?
}
344
# Sequential read on a mix of empty and full zones.
# The first four sequential zones are reset (zoned devices only), zones 3
# and 4 are written, then all four are read. On a zoned device only the two
# written zones are expected to be read.
test15() {
    local i off size

    for ((i=0;i<4;i++)); do
        [ -n "$is_zbd" ] &&
            reset_zone "$dev" $((first_sequential_zone_sector + i*sectors_per_zone))
    done
    off=$(((first_sequential_zone_sector + 2 * sectors_per_zone) * 512))
    size=$((2 * zone_size))
    run_one_fio_job "$(ioengine "psync")" --rw=write --bs=$((zone_size / 16)) \
        --zonemode=zbd --zonesize="${zone_size}" --offset=$off \
        --size=$size >>"${logfile}.${test_number}" 2>&1 ||
        return $?
    check_written $size || return $?
    off=$((first_sequential_zone_sector * 512))
    size=$((4 * zone_size))
    run_one_fio_job "$(ioengine "psync")" --rw=read --bs=$((zone_size / 16)) \
        --zonemode=zbd --zonesize="${zone_size}" --offset=$off \
        --size=$((size)) >>"${logfile}.${test_number}" 2>&1 ||
        return $?
    if [ -n "$is_zbd" ]; then
        check_read $((size / 2))
    else
        check_read $size
    fi
}
373
# Random read on a mix of empty and full zones. Must be run after test15.
test16() {
    local off size

    off=$((first_sequential_zone_sector * 512))
    size=$((4 * zone_size))
    run_one_fio_job "$(ioengine "libaio")" --iodepth=64 --rw=randread --bs=16K \
        --zonemode=zbd --zonesize="${zone_size}" --offset=$off \
        --size=$size >>"${logfile}.${test_number}" 2>&1 || return $?
    check_read $size || return $?
}
385
# Random reads and writes in the last zone.
# The zone is first filled sequentially, then a two-loop random read/write
# job runs on it; bytes read plus bytes written must equal twice the size of
# the range from the start of the last zone to the end of the disk.
test17() {
    local io off read size written

    off=$(((disk_size / zone_size - 1) * zone_size))
    size=$((disk_size - off))
    # Overwrite the last zone to avoid that reading from that zone fails.
    if [ -n "$is_zbd" ]; then
        reset_zone "$dev" $((off / 512)) || return $?
    fi
    run_one_fio_job "$(ioengine "psync")" --rw=write --offset="$off" \
        --zonemode=zbd --zonesize="${zone_size}" \
        --bs="$zone_size" --size="$zone_size" \
        >>"${logfile}.${test_number}" 2>&1 || return $?
    check_written "$zone_size" || return $?
    run_one_fio_job "$(ioengine "libaio")" --iodepth=8 --rw=randrw --bs=4K \
        --zonemode=zbd --zonesize="${zone_size}" \
        --offset=$off --loops=2 --norandommap=1 \
        >>"${logfile}.${test_number}" 2>&1 || return $?
    written=$(fio_written <"${logfile}.${test_number}")
    read=$(fio_read <"${logfile}.${test_number}")
    io=$((written + read))
    # Log the value that is actually compared against.
    echo "Total number of bytes read and written: $io <> $((size * 2))" \
        >>"${logfile}.${test_number}"
    [ $io = $((size * 2)) ]
}
412
# Out-of-range zone reset threshold and frequency parameters.
# A negative --zone_reset_threshold must be rejected as out of range.
test18() {
    run_fio_on_seq --zone_reset_threshold=-1 |&
        tee -a "${logfile}.${test_number}" |
        grep -q 'value out of range' || return $?
}
419
# A --zone_reset_threshold of 2 must be rejected as out of range.
test19() {
    run_fio_on_seq --zone_reset_threshold=2 |&
        tee -a "${logfile}.${test_number}" |
        grep -q 'value out of range' || return $?
}
425
# A list value for --zone_reset_threshold must be rejected.
test20() {
    run_fio_on_seq --zone_reset_threshold=.4:.6 |&
        tee -a "${logfile}.${test_number}" |
        grep -q 'the list exceeding max length' || return $?
}
431
# A negative --zone_reset_frequency must be rejected as out of range.
test21() {
    run_fio_on_seq --zone_reset_frequency=-1 |&
        tee -a "${logfile}.${test_number}" |
        grep -q 'value out of range' || return $?
}
437
# A --zone_reset_frequency of 2 must be rejected as out of range.
test22() {
    run_fio_on_seq --zone_reset_frequency=2 |&
        tee -a "${logfile}.${test_number}" |
        grep -q 'value out of range' || return $?
}
443
# A list value for --zone_reset_frequency must be rejected.
test23() {
    run_fio_on_seq --zone_reset_frequency=.4:.6 |&
        tee -a "${logfile}.${test_number}" |
        grep -q 'the list exceeding max length' || return $?
}
449
# Write one zone nine times with --zone_reset_frequency and
# --zone_reset_threshold set. All loops must be written in full and the
# number of zone resets reported in the log must be 8, 9 or 10.
test24() {
    local bs loops=9 size=$((zone_size))

    bs=$(min $((256*1024)) "$zone_size")
    run_fio_on_seq "$(ioengine "psync")" --rw=write --bs="$bs" \
        --size=$size --loops=$loops \
        --zone_reset_frequency=.01 --zone_reset_threshold=.90 \
        >> "${logfile}.${test_number}" 2>&1 || return $?
    check_written $((size * loops)) || return $?
    check_reset_count -eq 8 ||
        check_reset_count -eq 9 ||
        check_reset_count -eq 10 || return $?
}
463
# Multiple non-overlapping sequential write jobs for the same drive.
# Sixteen jobs each write one of the first sixteen sequential zones.
test25() {
    local i opts=()

    for ((i=0;i<16;i++)); do
        [ -n "$is_zbd" ] &&
            reset_zone "$dev" $((first_sequential_zone_sector + i*sectors_per_zone))
    done
    for ((i=0;i<16;i++)); do
        opts+=("--name=job$i" "--filename=$dev" "--thread=1" "--direct=1")
        opts+=("--offset=$((first_sequential_zone_sector*512 + zone_size*i))")
        opts+=("--size=$zone_size" "$(ioengine "psync")" "--rw=write" "--bs=16K")
        opts+=("--zonemode=zbd" "--zonesize=${zone_size}" "--group_reporting=1")
        opts+=("${var_opts[@]}")
    done
    run_fio "${opts[@]}" >> "${logfile}.${test_number}" 2>&1 || return $?
}
481
# Write the first sequential zone four times with verification enabled,
# using fio I/O pattern $1 (passed to --rw). Succeeds when fio succeeds and
# four zone sizes are reported as written.
write_to_first_seq_zone() {
    local loops=4 r

    r=$(((RANDOM << 16) | RANDOM))
    run_fio --name="$dev" --filename="$dev" "$(ioengine "psync")" --rw="$1" \
        --thread=1 --do_verify=1 --verify=md5 --direct=1 --bs=4K \
        --offset=$((first_sequential_zone_sector * 512)) \
        "--size=$zone_size" --loops=$loops --randseed="$r" \
        --zonemode=zbd --zonesize="${zone_size}" --group_reporting=1 \
        --gtod_reduce=1 >> "${logfile}.${test_number}" 2>&1 || return $?
    check_written $((loops * zone_size)) || return $?
}
494
# Overwrite the first sequential zone four times sequentially.
test26() {
    write_to_first_seq_zone write
}
499
# Overwrite the first sequential zone four times using random writes.
test27() {
    write_to_first_seq_zone randwrite
}
504
# Multiple overlapping random write jobs for the same drive.
# All jobs target the same zone; every job must write a full zone and the
# number of zone resets must be equal to, or one less than, the job count.
test28() {
    local i jobs=16 off opts

    off=$((first_sequential_zone_sector * 512 + 64 * zone_size))
    [ -n "$is_zbd" ] && reset_zone "$dev" $((off / 512))
    opts=("--debug=zbd")
    for ((i=0;i<jobs;i++)); do
        opts+=("--name=job$i" "--filename=$dev" "--offset=$off" "--bs=16K")
        opts+=("--size=$zone_size" "$(ioengine "psync")" "--rw=randwrite")
        opts+=("--thread=1" "--direct=1" "--zonemode=zbd")
        opts+=("--zonesize=${zone_size}" "--group_reporting=1")
        opts+=("${var_opts[@]}")
    done
    run_fio "${opts[@]}" >> "${logfile}.${test_number}" 2>&1 || return $?
    check_written $((jobs * zone_size)) || return $?
    check_reset_count -eq $jobs ||
        check_reset_count -eq $((jobs - 1)) ||
        return $?
}
525
# Multiple overlapping random write jobs for the same drive and with a limited
# number of open zones.
# Each job covers sixteen zones but writes only one zone's worth of data.
test29() {
    local i jobs=16 off opts=() size

    off=$((first_sequential_zone_sector * 512 + 64 * zone_size))
    size=$((16*zone_size))
    [ -n "$is_zbd" ] && reset_zone "$dev" $((off / 512))
    opts=("--debug=zbd")
    for ((i=0;i<jobs;i++)); do
        opts+=("--name=job$i" "--filename=$dev" "--offset=$off" "--bs=16K")
        opts+=("--size=$size" "--io_size=$zone_size" "--thread=1")
        opts+=("$(ioengine "psync")" "--rw=randwrite" "--direct=1")
        opts+=("--max_open_zones=4" "--group_reporting=1")
        opts+=("--zonemode=zbd" "--zonesize=${zone_size}")
        opts+=("${var_opts[@]}")
    done
    run_fio "${opts[@]}" >> "${logfile}.${test_number}" 2>&1 || return $?
    check_written $((jobs * zone_size)) || return $?
}
546
# Random reads and writes across the entire disk for 30s.
# The job starts at the first sequential zone; the result is fio's exit
# status.
test30() {
    local off

    off=$((first_sequential_zone_sector * 512))
    run_one_fio_job "$(ioengine "libaio")" --iodepth=8 --rw=randrw \
        --bs="$(max $((zone_size / 128)) "$logical_block_size")" \
        --zonemode=zbd --zonesize="${zone_size}" --offset=$off \
        --loops=2 --time_based --runtime=30s --norandommap=1 \
        >>"${logfile}.${test_number}" 2>&1
}
558
# Random reads across all sequential zones for 30s. This is not only a fio
# test but also allows to verify the performance of a drive.
test31() {
    local bs inc nz off opts size

    # Start with writing 128 KB to 128 sequential zones.
    bs=128K
    nz=128
    # Distance between written zones, rounded down to a whole number of zones.
    # shellcheck disable=SC2017
    inc=$(((disk_size - (first_sequential_zone_sector * 512)) / (nz * zone_size)
           * zone_size))
    opts=()
    for ((off = first_sequential_zone_sector * 512; off < disk_size;
          off += inc)); do
        opts+=("--name=$dev" "--filename=$dev" "--offset=$off" "--io_size=$bs")
        opts+=("--bs=$bs" "--size=$zone_size" "$(ioengine "libaio")")
        opts+=("--rw=write" "--direct=1" "--thread=1" "--stats=0")
        opts+=("--zonemode=zbd" "--zonesize=${zone_size}")
        opts+=("${var_opts[@]}")
    done
    # The preparation step invokes fio directly (not through run_fio) and
    # its exit status is not checked.
    "$(dirname "$0")/../../fio" "${opts[@]}" >> "${logfile}.${test_number}" 2>&1
    # Next, run the test.
    off=$((first_sequential_zone_sector * 512))
    size=$((disk_size - off))
    opts=("--name=$dev" "--filename=$dev" "--offset=$off" "--size=$size")
    opts+=("--bs=$bs" "$(ioengine "psync")" "--rw=randread" "--direct=1")
    opts+=("--thread=1" "--time_based" "--runtime=30" "--zonemode=zbd")
    opts+=("--zonesize=${zone_size}")
    run_fio "${opts[@]}" >> "${logfile}.${test_number}" 2>&1 || return $?
}
589
# Random writes across all sequential zones. This is not only a fio test but
# also allows to verify the performance of a drive.
test32() {
    local off opts=() size

    off=$((first_sequential_zone_sector * 512))
    size=$((disk_size - off))
    opts+=("--name=$dev" "--filename=$dev" "--offset=$off" "--size=$size")
    opts+=("--bs=128K" "$(ioengine "psync")" "--rw=randwrite" "--direct=1")
    opts+=("--thread=1" "--time_based" "--runtime=30")
    opts+=("--max_open_zones=$max_open_zones" "--zonemode=zbd")
    opts+=("--zonesize=${zone_size}")
    run_fio "${opts[@]}" >> "${logfile}.${test_number}" 2>&1 || return $?
}
604
# Write to sequential zones with a block size that is not a divisor of the
# zone size.
# The expected byte count is io_size rounded up to a multiple of the block
# size.
test33() {
    local bs io_size size

    size=$((2 * zone_size))
    io_size=$((5 * zone_size))
    bs=$((3 * zone_size / 4))
    run_fio_on_seq "$(ioengine "psync")" --iodepth=1 --rw=write \
        --size=$size --io_size=$io_size --bs=$bs \
        >> "${logfile}.${test_number}" 2>&1 || return $?
    check_written $(((io_size + bs - 1) / bs * bs)) || return $?
}
618
# Write to sequential zones with a block size that is not a divisor of the
# zone size and with data verification enabled.
# fio is expected to fail and to log a "not a divisor of" message.
test34() {
    local size

    size=$((2 * zone_size))
    run_fio_on_seq "$(ioengine "psync")" --iodepth=1 --rw=write --size=$size \
        --do_verify=1 --verify=md5 --bs=$((3 * zone_size / 4)) \
        >> "${logfile}.${test_number}" 2>&1 && return 1
    grep -q 'not a divisor of' "${logfile}.${test_number}"
}
630
# Test 1/4 for the I/O boundary rounding code: $size < $zone_size.
# The range starts one sector into the first sequential zone and ends one
# sector before its end; fio is expected to fail with an io_size error.
test35() {
    local bs off size

    off=$(((first_sequential_zone_sector + 1) * 512))
    size=$((zone_size - 2 * 512))
    bs=$((zone_size / 4))
    run_one_fio_job --offset=$off --size=$size "$(ioengine "psync")" \
        --iodepth=1 --rw=write --do_verify=1 --verify=md5 \
        --bs=$bs --zonemode=zbd --zonesize="${zone_size}" \
        >> "${logfile}.${test_number}" 2>&1 && return 1
    grep -q 'io_size must be at least one zone' "${logfile}.${test_number}"
}
644
# Test 2/4 for the I/O boundary rounding code: $size < $zone_size.
# The range starts at the first sequential zone and ends one sector before
# its end; fio is expected to fail with an io_size error.
test36() {
    local bs off size

    off=$(((first_sequential_zone_sector) * 512))
    size=$((zone_size - 512))
    bs=$((zone_size / 4))
    run_one_fio_job --offset=$off --size=$size "$(ioengine "psync")" \
        --iodepth=1 --rw=write --do_verify=1 --verify=md5 \
        --bs=$bs --zonemode=zbd --zonesize="${zone_size}" \
        >> "${logfile}.${test_number}" 2>&1 && return 1
    grep -q 'io_size must be at least one zone' "${logfile}.${test_number}"
}
658
# Test 3/4 for the I/O boundary rounding code: $size > $zone_size.
# The range starts one sector before the first sequential zone (or at 0 when
# that zone is the first one) and is one zone plus two sectors long. Exactly
# one zone must be reported as written; fio's exit status is not checked.
test37() {
    local bs off size

    if [ "$first_sequential_zone_sector" = 0 ]; then
        off=0
    else
        off=$(((first_sequential_zone_sector - 1) * 512))
    fi
    size=$((zone_size + 2 * 512))
    bs=$((zone_size / 4))
    run_one_fio_job --offset=$off --size=$size "$(ioengine "psync")" \
        --iodepth=1 --rw=write --do_verify=1 --verify=md5 \
        --bs=$bs --zonemode=zbd --zonesize="${zone_size}" \
        >> "${logfile}.${test_number}" 2>&1
    check_written $((zone_size)) || return $?
}
676
# Test 4/4 for the I/O boundary rounding code: $offset > $disk_size - $zone_size
# The range is the last logical block of the disk; fio is expected to fail
# with an io_size error.
test38() {
    local bs off size

    size=$((logical_block_size))
    off=$((disk_size - logical_block_size))
    bs=$((logical_block_size))
    run_one_fio_job --offset=$off --size=$size "$(ioengine "psync")" \
        --iodepth=1 --rw=write --do_verify=1 --verify=md5 \
        --bs=$bs --zonemode=zbd --zonesize="${zone_size}" \
        >> "${logfile}.${test_number}" 2>&1 && return 1
    grep -q 'io_size must be at least one zone' "${logfile}.${test_number}"
}
690
# Read one block from a block device.
# Extra fio options are taken from the arguments. fio's combined output is
# written to stdout and appended to the log file; because of the pipeline the
# return status is that of tee, not of fio.
read_one_block() {
    local bs

    bs=$((logical_block_size))
    run_one_fio_job --rw=read "$(ioengine "psync")" --bs=$bs --size=$bs "$@" 2>&1 |
        tee -a "${logfile}.${test_number}"
}
699
# Check whether fio accepts --zonemode=none for zoned block devices.
# Passes trivially for non-zoned devices.
test39() {
    [ -n "$is_zbd" ] || return 0
    read_one_block --zonemode=none >/dev/null || return $?
    check_read $((logical_block_size)) || return $?
}
706
# Check whether fio accepts --zonemode=strided for zoned block devices.
# Without --zonesize fio must print an error; with a zone size of one
# logical block exactly one block must be read. Passes trivially for
# non-zoned devices.
test40() {
    local bs

    bs=$((logical_block_size))
    [ -n "$is_zbd" ] || return 0
    read_one_block --zonemode=strided |
        grep -q 'fio: --zonesize must be specified when using --zonemode=strided' ||
        return $?
    read_one_block --zonemode=strided --zonesize=$bs >/dev/null || return $?
    check_read $bs || return $?
}
719
# Check whether fio checks the zone size for zoned block devices.
# Passes trivially for non-zoned devices.
test41() {
    [ -n "$is_zbd" ] || return 0
    read_one_block --zonemode=zbd --zonesize=$((2 * zone_size)) |
        grep -q 'job parameter zonesize.*does not match disk zone size'
}
726
# Check whether fio handles --zonesize=0 correctly for regular block devices.
# Passes trivially for zoned devices.
test42() {
    [ -n "$is_zbd" ] && return 0
    read_one_block --zonemode=zbd --zonesize=0 |
        grep -q 'Specifying the zone size is mandatory for regular block devices with --zonemode=zbd'
}
733
# Check whether fio handles --zonesize=1 correctly for regular block devices.
# Passes trivially for zoned devices.
test43() {
    [ -n "$is_zbd" ] && return 0
    read_one_block --zonemode=zbd --zonesize=1 |
        grep -q 'zone size must be at least 512 bytes for --zonemode=zbd'
}
740
# Check whether fio handles --zonemode=none --zonesize=1 correctly.
# fio must report that the two options are not compatible.
test44() {
    read_one_block --zonemode=none --zonesize=1 |
        grep -q 'fio: --zonemode=none and --zonesize are not compatible'
}
746
# Random write to the first sequential zone of a zoned device without
# --zonemode=zbd. fio must print the hint suggesting --zonemode=zbd.
# Passes trivially for non-zoned devices.
test45() {
    local bs

    [ -z "$is_zbd" ] && return 0
    bs=$((logical_block_size))
    run_one_fio_job "$(ioengine "psync")" --iodepth=1 --rw=randwrite --bs=$bs \
        --offset=$((first_sequential_zone_sector * 512)) \
        --size="$zone_size" --do_verify=1 --verify=md5 2>&1 |
        tee -a "${logfile}.${test_number}" |
        grep -q "fio: first I/O failed. If .* is a zoned block device, consider --zonemode=zbd"
}
758
bc596cbc
DLM
# Random write to sequential zones, libaio, 8 jobs, queue depth 64 per job
# Each of the eight jobs must write four zones' worth of data.
test46() {
    local size

    size=$((4 * zone_size))
    run_fio_on_seq "$(ioengine "libaio")" --iodepth=64 --rw=randwrite --bs=4K \
        --group_reporting=1 --numjobs=8 \
        >> "${logfile}.${test_number}" 2>&1 || return $?
    check_written $((size * 8)) || return $?
}
769
4d37720a
DLM
# Check whether fio handles --zonemode=zbd --zoneskip=1 correctly.
# fio is expected to fail and to log that zoneskip is not a multiple of the
# zone size. Passes trivially for non-zoned devices.
test47() {
    local bs

    [ -z "$is_zbd" ] && return 0
    bs=$((logical_block_size))
    run_one_fio_job "$(ioengine "psync")" --rw=write --bs=$bs \
        --zonemode=zbd --zoneskip=1 \
        >> "${logfile}.${test_number}" 2>&1 && return 1
    grep -q 'zoneskip 1 is not a multiple of the device zone size' "${logfile}.${test_number}"
}
781
3bd2078b
NA
# Multiple overlapping random write jobs for the same drive and with a
# limited number of open zones. This is similar to test29, but uses libaio
# to stress test zone locking.
# fio is invoked directly under `timeout` so that a hang is turned into a
# failure after 45 seconds.
test48() {
    local i jobs=16 off opts=() size fio

    off=$((first_sequential_zone_sector * 512 + 64 * zone_size))
    size=$((16*zone_size))
    [ -n "$is_zbd" ] && reset_zone "$dev" $((off / 512))
    opts=("--aux-path=/tmp" "--allow_file_create=0" "--significant_figures=10")
    opts+=("--debug=zbd")
    opts+=("$(ioengine "libaio")" "--rw=randwrite" "--direct=1")
    opts+=("--time_based" "--runtime=30")
    opts+=("--zonemode=zbd" "--zonesize=${zone_size}")
    opts+=("--max_open_zones=4")
    for ((i=0;i<jobs;i++)); do
        opts+=("--name=job$i" "--filename=$dev" "--offset=$off" "--bs=16K")
        opts+=("--io_size=$zone_size" "--iodepth=256" "--thread=1")
        opts+=("--group_reporting=1")
    done

    fio=$(dirname "$0")/../../fio

    { echo; echo "fio ${opts[*]}"; echo; } >>"${logfile}.${test_number}"

    timeout -v -s KILL 45s \
        "${dynamic_analyzer[@]}" "$fio" "${opts[@]}" \
        >> "${logfile}.${test_number}" 2>&1 || return $?
}
811
191d1d1a
BVA
# Command-line state:
#   tests            - test numbers selected with -t (empty: run all)
#   dynamic_analyzer - command prefix used to run fio (-d, -e, -v: valgrind)
#   reset_all_zones  - non-empty when -r was given
#   use_libzbc       - non-empty when -l was given
#   zbd_debug        - non-empty when -z was given
tests=()
dynamic_analyzer=()
reset_all_zones=
use_libzbc=
zbd_debug=

# Consume leading arguments that start with '-'.
while [ "${1#-}" != "$1" ]; do
    case "$1" in
        -d) dynamic_analyzer=(valgrind "--read-var-info=yes" "--tool=drd"
                              "--show-confl-seg=no")
            shift;;
        -e) dynamic_analyzer=(valgrind "--read-var-info=yes" "--tool=helgrind")
            shift;;
        -l) use_libzbc=1; shift;;
        -r) reset_all_zones=1; shift;;
        -t) if [ $# -lt 2 ]; then
                usage
                exit 1
            fi
            tests+=("$2"); shift; shift;;
        -v) dynamic_analyzer=(valgrind "--read-var-info=yes")
            shift;;
        -z) zbd_debug=1; shift;;
        --) shift; break;;
        # Without this arm an unknown option is never shifted away and the
        # loop would spin forever.
        *)  usage
            exit 1;;
    esac
done

# Exactly one positional argument (the device node) must remain.
if [ $# != 1 ]; then
    usage
    exit 1
fi
839
# Load the helper functions used below (first_sequential_zone,
# max_open_zones, reset_zone, is_zbc, zbc_* ...).
# shellcheck source=functions
source "$(dirname "$0")/functions" || exit $?

# Extra fio options appended to every job by run_fio and the multi-job tests.
var_opts=()
if [ -n "$zbd_debug" ]; then
    var_opts+=("--debug=zbd")
fi
dev=$1
realdev=$(readlink -f "$dev")
basename=$(basename "$realdev")

# Start from a known state so an inherited environment variable cannot make
# a regular device look zoned.
is_zbd=

if [[ -b "$realdev" ]]; then
    # stat prints the device numbers in hexadecimal.
    major=$((0x$(stat -L -c '%t' "$realdev"))) || exit $?
    minor=$((0x$(stat -L -c '%T' "$realdev"))) || exit $?
    disk_size=$(($(<"/sys/dev/block/$major:$minor/size")*512))

    # When the target is a partition device, get basename of its
    # holder device to access sysfs path of the holder device
    if [[ -r "/sys/dev/block/$major:$minor/partition" ]]; then
        realsysfs=$(readlink "/sys/dev/block/$major:$minor")
        basename=$(basename "${realsysfs%/*}")
    fi
    logical_block_size=$(<"/sys/block/$basename/queue/logical_block_size")
    case "$(<"/sys/class/block/$basename/queue/zoned")" in
        host-managed|host-aware)
            is_zbd=true
            # Word splitting is intended: the helper prints two fields.
            # shellcheck disable=SC2207
            if ! result=($(first_sequential_zone "$dev")); then
                echo "Failed to determine first sequential zone"
                exit 1
            fi
            first_sequential_zone_sector=${result[0]}
            sectors_per_zone=${result[1]}
            zone_size=$((sectors_per_zone * 512))
            if ! max_open_zones=$(max_open_zones "$dev"); then
                echo "Failed to determine maximum number of open zones"
                exit 1
            fi
            set_io_scheduler "$basename" deadline || exit $?
            if [ -n "$reset_all_zones" ]; then
                reset_zone "$dev" -1
            fi
            ;;
        *)
            # Regular block device: emulate a zone layout.
            # NOTE(review): masking with (logical_block_size - 1) keeps only
            # the low bits of disk_size / 2 - confirm this is the intended
            # start of the emulated sequential area.
            first_sequential_zone_sector=$(((disk_size / 2) &
                                            (logical_block_size - 1)))
            zone_size=$(max 65536 "$logical_block_size")
            sectors_per_zone=$((zone_size / 512))
            max_open_zones=128
            set_io_scheduler "$basename" none || exit $?
            ;;
    esac
elif [[ -c "$realdev" ]]; then
    # For an SG node, we must have libzbc option specified
    if [[ -z "$use_libzbc" ]]; then
        echo "Character device files can only be used with -l (libzbc) option"
        exit 1
    fi

    # Test the helper's exit status directly instead of executing its output.
    if ! is_zbc "$dev"; then
        echo "Device is not a ZBC disk"
        exit 1
    fi
    is_zbd=true

    # Capture the sector count on its own so that a failing or empty helper
    # result is detected before it is used in arithmetic.
    if ! disk_sectors=$(zbc_disk_sectors "$dev") || [ -z "$disk_sectors" ]; then
        echo "Failed to determine disk size"
        exit 1
    fi
    disk_size=$((disk_sectors * 512))
    if ! logical_block_size=$(zbc_logical_block_size "$dev"); then
        echo "Failed to determine logical block size"
        exit 1
    fi
    # shellcheck disable=SC2207
    if ! result=($(first_sequential_zone "$dev")); then
        echo "Failed to determine first sequential zone"
        exit 1
    fi
    first_sequential_zone_sector=${result[0]}
    sectors_per_zone=${result[1]}
    zone_size=$((sectors_per_zone * 512))
    if ! max_open_zones=$(max_open_zones "$dev"); then
        echo "Failed to determine maximum number of open zones"
        exit 1
    fi
    if [ -n "$reset_all_zones" ]; then
        reset_zone "$dev" -1
    fi
else
    # Nothing below can work without a device geometry.
    echo "$dev is neither a block device nor a character device"
    exit 1
fi

echo -n "First sequential zone starts at sector $first_sequential_zone_sector;"
echo " zone size: $((zone_size >> 20)) MB"
191d1d1a
BVA
930
# Without -t, run every function named test<number>, in numeric order.
if [ "${#tests[@]}" = 0 ]; then
    # Anchored so that only names of the exact form test<digits> are picked
    # up from the `declare -F` listing.
    readarray -t tests < <(declare -F |
        sed -n 's/^declare -f test\([0-9][0-9]*\)$/\1/p' | sort -n)
fi

# Each test gets its own log file: <script path>.log.<test number>
logfile=$0.log

passed=0
failed=0
# Colorize the verdict only when stdout is a terminal.
if [ -t 1 ]; then
    red="\e[1;31m"
    green="\e[1;32m"
    end="\e[m"
else
    red=""
    green=""
    end=""
fi
rc=0

# Let the running test finish on Ctrl-C, then stop after recording it.
intr=0
trap 'intr=1' SIGINT

for test_number in "${tests[@]}"; do
    rm -f "${logfile}.${test_number}"
    echo -n "Running test $(printf "%02d" "$test_number") ... "
    # Call the test function by name; no eval is needed for that.
    if "test$test_number"; then
        status="PASS"
        cc_status="${green}${status}${end}"
        ((passed++))
    else
        status="FAIL"
        cc_status="${red}${status}${end}"
        ((failed++))
        rc=1
    fi
    echo -e "$cc_status"
    echo "$status" >> "${logfile}.${test_number}"
    [ $intr -ne 0 ] && exit 1
done

echo "$passed tests passed"
if [ $failed -gt 0 ]; then
    echo " and $failed tests failed"
fi
exit $rc