Commit | Line | Data |
---|---|---|
ebac4655 JA |
1 | #ifndef FIO_H |
2 | #define FIO_H | |
3 | ||
4 | #include <sched.h> | |
5 | #include <limits.h> | |
6 | #include <pthread.h> | |
7 | #include <sys/time.h> | |
8 | #include <sys/resource.h> | |
3c39a379 JA |
9 | #include <errno.h> |
10 | #include <stdlib.h> | |
11 | #include <stdio.h> | |
6d6f031f | 12 | #include <unistd.h> |
34cfcdaf | 13 | #include <string.h> |
cd14cc10 | 14 | #include <inttypes.h> |
7101d9c2 | 15 | #include <assert.h> |
ebac4655 | 16 | |
ecc314ba BC |
17 | struct thread_data; |
18 | ||
317b95d0 | 19 | #include "compiler/compiler.h" |
01743ee1 | 20 | #include "flist.h" |
e2887563 | 21 | #include "fifo.h" |
4b87898e | 22 | #include "rbtree.h" |
317b95d0 JA |
23 | #include "arch/arch.h" |
24 | #include "os/os.h" | |
07739b57 | 25 | #include "mutex.h" |
a3d741fa JA |
26 | #include "log.h" |
27 | #include "debug.h" | |
d6aed795 JA |
28 | #include "file.h" |
29 | #include "io_ddir.h" | |
dcefb588 | 30 | #include "ioengine.h" |
5995a6a4 | 31 | #include "iolog.h" |
c5c8bd5c | 32 | #include "helpers.h" |
07b3232d | 33 | #include "options.h" |
7eb36574 | 34 | #include "profile.h" |
c223da83 | 35 | #include "time.h" |
bf2e821a | 36 | #include "lib/getopt.h" |
2615cc4b | 37 | #include "lib/rand.h" |
ebac4655 | 38 | |
609342ff DL |
39 | #ifdef FIO_HAVE_GUASI |
40 | #include <guasi.h> | |
41 | #endif | |
42 | ||
417f0068 JA |
43 | #ifdef FIO_HAVE_SOLARISAIO |
44 | #include <sys/asynch.h> | |
45 | #endif | |
46 | ||
ebac4655 | 47 | struct group_run_stats { |
9104f874 JA |
48 | unsigned long long max_run[2], min_run[2]; |
49 | unsigned long long max_bw[2], min_bw[2]; | |
e9b2a3fa | 50 | unsigned long long io_kb[2]; |
9104f874 | 51 | unsigned long long agg[2]; |
90fef2d1 | 52 | unsigned int kb_base; |
ebac4655 JA |
53 | }; |
54 | ||
e9c047a0 JA |
55 | /* |
56 | * What type of allocation to use for io buffers | |
57 | */ | |
58 | enum fio_memtype { | |
59 | MEM_MALLOC = 0, /* ordinary malloc */ | |
60 | MEM_SHM, /* use shared memory segments */ | |
74b025b0 | 61 | MEM_SHMHUGE, /* use shared memory segments with huge pages */ |
e9c047a0 | 62 | MEM_MMAP, /* use anonymous mmap */ |
d0bdaf49 | 63 | MEM_MMAPHUGE, /* memory mapped huge file */ |
e9c047a0 JA |
64 | }; |
65 | ||
38dad62d JA |
66 | /* |
67 | * offset generator types | |
68 | */ | |
69 | enum { | |
70 | RW_SEQ_SEQ = 0, | |
71 | RW_SEQ_IDENT, | |
72 | }; | |
73 | ||
b2560f3c JA |
74 | /* |
75 | * How many depth levels to log | |
76 | */ | |
bb067558 | 77 | #define FIO_IO_U_MAP_NR 7 |
a9a18a3f JA |
78 | #define FIO_IO_U_LAT_U_NR 10 |
79 | #define FIO_IO_U_LAT_M_NR 12 | |
b2560f3c | 80 | |
83349190 YH |
81 | /* |
82 | * Aggregate clat samples to report percentile(s) of them. | |
83 | * | |
84 | * EXECUTIVE SUMMARY | |
85 | * | |
86 | * FIO_IO_U_PLAT_BITS determines the maximum statistical error on the | |
87 | * value of resulting percentiles. The error will be approximately | |
88 | * 1/2^(FIO_IO_U_PLAT_BITS+1) of the value. | |
89 | * | |
90 | * FIO_IO_U_PLAT_GROUP_NR and FIO_IO_U_PLAT_BITS determine the maximum | |
91 | * range being tracked for latency samples. The maximum value tracked | |
92 | * accurately will be 2^(GROUP_NR + PLAT_BITS -1) microseconds. | |
93 | * | |
94 | * FIO_IO_U_PLAT_GROUP_NR and FIO_IO_U_PLAT_BITS determine the memory | |
95 | * requirement of storing those aggregate counts. The memory used will | |
96 | * be (FIO_IO_U_PLAT_GROUP_NR * 2^FIO_IO_U_PLAT_BITS) * sizeof(int) | |
97 | * bytes. | |
98 | * | |
99 | * FIO_IO_U_PLAT_NR is the total number of buckets. | |
100 | * | |
101 | * DETAILS | |
102 | * | |
103 | * Suppose the clat varies from 0 to 999 (usec), the straightforward | |
104 | * method is to keep an array of (999 + 1) buckets, in which a counter | |
105 | * keeps the count of samples which fall in the bucket, e.g., | |
106 | * {[0],[1],...,[999]}. However this consumes a huge amount of space, | |
107 | * and can be avoided if an approximation is acceptable. | |
108 | * | |
109 | * One such method is to let the range of the bucket to be greater | |
110 | * than one. This method has low accuracy when the value is small. For | |
111 | * example, let the buckets be {[0,99],[100,199],...,[900,999]}, and | |
112 | * the represented value of each bucket be the mean of the range. Then | |
113 | * a value 0 has a round-off error of 49.5. To improve on this, we | |
114 | * use buckets with non-uniform ranges, while bounding the error of | |
115 | * each bucket within a ratio of the sample value. A simple example | |
116 | * would be when error_bound = 0.005, buckets are { | |
117 | * {[0],[1],...,[99]}, {[100,101],[102,103],...,[198,199]},.., | |
118 | * {[900,909],[910,919]...} }. The total range is partitioned into | |
119 | * groups with different ranges, then buckets with uniform ranges. An | |
120 | * upper bound of the error is (range_of_bucket/2)/value_of_bucket | |
121 | * | |
122 | * For better efficiency, we implement this using base two. We group | |
123 | * samples by their Most Significant Bit (MSB), extract the next M bits | |
124 | * of them as an index within the group, and discard the rest of the | |
125 | * bits. | |
126 | * | |
127 | * E.g., assume a sample 'x' whose MSB is bit n (starting from bit 0), | |
128 | * and use M bits for indexing | |
129 | * | |
130 | * | n | M bits | bit (n-M-1) ... bit 0 | | |
131 | * | |
132 | * Because x is at least 2^n, and bit 0 to bit (n-M-1) is at most | |
133 | * (2^(n-M) - 1), discarding bit 0 to (n-M-1) makes the round-off | |
134 | * error | |
135 | * | |
136 | * 2^(n-M)-1 2^(n-M) 1 | |
137 | * e <= --------- <= ------- = --- | |
138 | * 2^n 2^n 2^M | |
139 | * | |
140 | * Furthermore, we use "mean" of the range to represent the bucket, | |
141 | * the error e can be lowered by half to 1 / 2^(M+1). By using M bits | |
142 | * as the index, each group must contain 2^M buckets. | |
143 | * | |
144 | * E.g. Let M (FIO_IO_U_PLAT_BITS) be 6 | |
145 | * Error bound is 1/2^(6+1) = 0.0078125 (< 1%) | |
146 | * | |
147 | * Group MSB #discarded range of #buckets | |
148 | * error_bits value | |
149 | * ---------------------------------------------------------------- | |
150 | * 0* 0~5 0 [0,63] 64 | |
151 | * 1* 6 0 [64,127] 64 | |
152 | * 2 7 1 [128,255] 64 | |
153 | * 3 8 2 [256,511] 64 | |
154 | * 4 9 3 [512,1023] 64 | |
155 | * ... ... ... [...,...] ... | |
156 | * 18 23 17 [8388608,+inf]** 64 | |
157 | * | |
158 | * * Special cases: when n < M or when n == M, in both cases, | |
159 | * the value cannot be rounded off. Use all bits of the sample as | |
160 | * index. | |
161 | * | |
162 | * ** If a sample's MSB is greater than 23, it will be counted as 23. | |
163 | */ | |
164 | ||
165 | #define FIO_IO_U_PLAT_BITS 6 | |
166 | #define FIO_IO_U_PLAT_VAL (1 << FIO_IO_U_PLAT_BITS) | |
167 | #define FIO_IO_U_PLAT_GROUP_NR 19 | |
168 | #define FIO_IO_U_PLAT_NR (FIO_IO_U_PLAT_GROUP_NR * FIO_IO_U_PLAT_VAL) | |
169 | #define FIO_IO_U_LIST_MAX_LEN 20 /* The size of the default and user-specified | |
170 | list of percentiles */ | |
171 | ||
0e92f873 RR |
172 | #define MAX_PATTERN_SIZE 512 |
173 | ||
079ad09b | 174 | struct thread_stat { |
756867bd JA |
175 | char *name; |
176 | char *verror; | |
177 | int error; | |
178 | int groupid; | |
179 | pid_t pid; | |
180 | char *description; | |
6586ee89 | 181 | int members; |
756867bd | 182 | |
079ad09b JA |
183 | struct io_log *slat_log; |
184 | struct io_log *clat_log; | |
02af0988 | 185 | struct io_log *lat_log; |
079ad09b JA |
186 | struct io_log *bw_log; |
187 | ||
188 | /* | |
189 | * bandwidth and latency stats | |
190 | */ | |
191 | struct io_stat clat_stat[2]; /* completion latency */ | |
192 | struct io_stat slat_stat[2]; /* submission latency */ | |
02af0988 | 193 | struct io_stat lat_stat[2]; /* total latency */ |
079ad09b JA |
194 | struct io_stat bw_stat[2]; /* bandwidth stats */ |
195 | ||
196 | unsigned long long stat_io_bytes[2]; | |
197 | struct timeval stat_sample_time[2]; | |
198 | ||
199 | /* | |
200 | * fio system usage accounting | |
201 | */ | |
202 | struct rusage ru_start; | |
203 | struct rusage ru_end; | |
204 | unsigned long usr_time; | |
205 | unsigned long sys_time; | |
206 | unsigned long ctx; | |
81887d5d | 207 | unsigned long minf, majf; |
079ad09b | 208 | |
b2560f3c JA |
209 | /* |
210 | * IO depth and latency stats | |
211 | */ | |
83349190 YH |
212 | unsigned int clat_percentiles; |
213 | double* percentile_list; | |
214 | ||
b2560f3c | 215 | unsigned int io_u_map[FIO_IO_U_MAP_NR]; |
838bc709 JA |
216 | unsigned int io_u_submit[FIO_IO_U_MAP_NR]; |
217 | unsigned int io_u_complete[FIO_IO_U_MAP_NR]; | |
04a0feae JA |
218 | unsigned int io_u_lat_u[FIO_IO_U_LAT_U_NR]; |
219 | unsigned int io_u_lat_m[FIO_IO_U_LAT_M_NR]; | |
0a0b4900 | 220 | unsigned int io_u_plat[3][FIO_IO_U_PLAT_NR]; |
0d29de83 JA |
221 | unsigned long total_io_u[3]; |
222 | unsigned long short_io_u[3]; | |
838bc709 JA |
223 | unsigned long total_submit; |
224 | unsigned long total_complete; | |
756867bd JA |
225 | |
226 | unsigned long long io_bytes[2]; | |
cda99fa0 | 227 | unsigned long long runtime[2]; |
756867bd | 228 | unsigned long total_run_time; |
f2bba182 RR |
229 | |
230 | /* | |
231 | * IO Error related stats | |
232 | */ | |
233 | unsigned continue_on_error; | |
234 | unsigned long total_err_count; | |
235 | int first_error; | |
90fef2d1 JA |
236 | |
237 | unsigned int kb_base; | |
b2560f3c | 238 | }; |
71619dc2 | 239 | |
564ca972 JA |
240 | struct bssplit { |
241 | unsigned int bs; | |
242 | unsigned char perc; | |
243 | }; | |
244 | ||
2dc1bbeb | 245 | struct thread_options { |
b1ec1da6 | 246 | int pad; |
61697c37 | 247 | char *description; |
b4692828 | 248 | char *name; |
ef899b63 | 249 | char *directory; |
13f8e2d2 | 250 | char *filename; |
2dc1bbeb | 251 | char *opendir; |
09629a90 | 252 | char *ioengine; |
413dd459 | 253 | enum td_ddir td_ddir; |
38dad62d | 254 | unsigned int rw_seq; |
90fef2d1 | 255 | unsigned int kb_base; |
5736c10d | 256 | unsigned int ddir_seq_nr; |
2dc1bbeb JA |
257 | unsigned int iodepth; |
258 | unsigned int iodepth_low; | |
259 | unsigned int iodepth_batch; | |
4950421a | 260 | unsigned int iodepth_batch_complete; |
2dc1bbeb JA |
261 | |
262 | unsigned long long size; | |
7bb59102 | 263 | unsigned int size_percent; |
aa31f1f1 | 264 | unsigned int fill_device; |
2dc1bbeb JA |
265 | unsigned long long file_size_low; |
266 | unsigned long long file_size_high; | |
267 | unsigned long long start_offset; | |
268 | ||
269 | unsigned int bs[2]; | |
2b7a01d0 | 270 | unsigned int ba[2]; |
2dc1bbeb JA |
271 | unsigned int min_bs[2]; |
272 | unsigned int max_bs[2]; | |
720e84ad JA |
273 | struct bssplit *bssplit[2]; |
274 | unsigned int bssplit_nr[2]; | |
2dc1bbeb JA |
275 | |
276 | unsigned int nr_files; | |
277 | unsigned int open_files; | |
4d4e80f2 | 278 | enum file_lock_mode file_lock_mode; |
29c1349f | 279 | unsigned int lockfile_batch; |
e9c047a0 | 280 | |
9158d2f7 JA |
281 | unsigned int odirect; |
282 | unsigned int invalidate_cache; | |
283 | unsigned int create_serialize; | |
284 | unsigned int create_fsync; | |
814452bd | 285 | unsigned int create_on_open; |
9158d2f7 | 286 | unsigned int end_fsync; |
afad68f7 | 287 | unsigned int pre_read; |
9158d2f7 JA |
288 | unsigned int sync_io; |
289 | unsigned int verify; | |
e84c73a8 | 290 | unsigned int do_verify; |
160b966d | 291 | unsigned int verifysort; |
a59e170d JA |
292 | unsigned int verify_interval; |
293 | unsigned int verify_offset; | |
0e92f873 | 294 | char verify_pattern[MAX_PATTERN_SIZE]; |
90059d65 | 295 | unsigned int verify_pattern_bytes; |
a12a3b4d | 296 | unsigned int verify_fatal; |
b463e936 | 297 | unsigned int verify_dump; |
e8462bd8 | 298 | unsigned int verify_async; |
9e144189 JA |
299 | unsigned long long verify_backlog; |
300 | unsigned int verify_batch; | |
9158d2f7 JA |
301 | unsigned int use_thread; |
302 | unsigned int unlink; | |
303 | unsigned int do_disk_util; | |
304 | unsigned int override_sync; | |
305 | unsigned int rand_repeatable; | |
2615cc4b | 306 | unsigned int use_os_rand; |
9158d2f7 JA |
307 | unsigned int write_lat_log; |
308 | unsigned int write_bw_log; | |
bb8895e0 | 309 | unsigned int norandommap; |
2b386d25 | 310 | unsigned int softrandommap; |
690adba3 | 311 | unsigned int bs_unaligned; |
ebb1415f | 312 | unsigned int fsync_on_close; |
e9c047a0 | 313 | |
56bb17f2 | 314 | unsigned int hugepage_size; |
a00735e6 | 315 | unsigned int rw_min_bs; |
ebac4655 | 316 | unsigned int thinktime; |
48097d5c | 317 | unsigned int thinktime_spin; |
9c1f7434 | 318 | unsigned int thinktime_blocks; |
ebac4655 | 319 | unsigned int fsync_blocks; |
5f9099ea | 320 | unsigned int fdatasync_blocks; |
1ef2b6be | 321 | unsigned int barrier_blocks; |
dce8b847 | 322 | unsigned long long start_delay; |
0db26797 | 323 | unsigned long long timeout; |
721938ae | 324 | unsigned long long ramp_time; |
ebac4655 | 325 | unsigned int overwrite; |
ebac4655 | 326 | unsigned int bw_avg_time; |
ebac4655 | 327 | unsigned int loops; |
20dc95c4 JA |
328 | unsigned long long zone_size; |
329 | unsigned long long zone_skip; | |
e9c047a0 | 330 | enum fio_memtype mem_type; |
d529ee19 | 331 | unsigned int mem_align; |
2dc1bbeb | 332 | |
ebac4655 | 333 | unsigned int stonewall; |
b3d62a75 | 334 | unsigned int new_group; |
ebac4655 | 335 | unsigned int numjobs; |
ebac4655 | 336 | os_cpu_mask_t cpumask; |
375b2695 | 337 | unsigned int cpumask_set; |
e8462bd8 JA |
338 | os_cpu_mask_t verify_cpumask; |
339 | unsigned int verify_cpumask_set; | |
aea47d44 | 340 | unsigned int iolog; |
a6ccc7be | 341 | unsigned int rwmixcycle; |
e47f799f | 342 | unsigned int rwmix[2]; |
b6f4d880 | 343 | unsigned int nice; |
0aabe160 | 344 | unsigned int file_service_type; |
b2560f3c | 345 | unsigned int group_reporting; |
d2f3ac35 | 346 | unsigned int fadvise_hint; |
a596f047 | 347 | enum fio_fallocate_mode fallocate_mode; |
e9459e5a | 348 | unsigned int zero_buffers; |
5973cafb | 349 | unsigned int refill_buffers; |
cf4464ca | 350 | unsigned int time_based; |
02af0988 | 351 | unsigned int disable_lat; |
9520ebb9 JA |
352 | unsigned int disable_clat; |
353 | unsigned int disable_slat; | |
354 | unsigned int disable_bw; | |
993bf48b | 355 | unsigned int gtod_reduce; |
be4ecfdf JA |
356 | unsigned int gtod_cpu; |
357 | unsigned int gtod_offload; | |
c223da83 | 358 | enum fio_cs clocksource; |
64bbb865 | 359 | unsigned int no_stall; |
0d29de83 JA |
360 | unsigned int trim_percentage; |
361 | unsigned int trim_batch; | |
362 | unsigned int trim_zero; | |
363 | unsigned long long trim_backlog; | |
83349190 YH |
364 | unsigned int clat_percentiles; |
365 | unsigned int overwrite_plist; | |
366 | double percentile_list[FIO_IO_U_LIST_MAX_LEN]; | |
aea47d44 | 367 | |
076efc7c JA |
368 | char *read_iolog_file; |
369 | char *write_iolog_file; | |
e3cedca7 JA |
370 | char *bw_log_file; |
371 | char *lat_log_file; | |
d1c46c04 | 372 | char *replay_redirect; |
2dc1bbeb JA |
373 | |
374 | /* | |
375 | * Pre-run and post-run shell | |
376 | */ | |
377 | char *exec_prerun; | |
378 | char *exec_postrun; | |
379 | ||
581e7141 JA |
380 | unsigned int rate[2]; |
381 | unsigned int ratemin[2]; | |
2dc1bbeb | 382 | unsigned int ratecycle; |
581e7141 JA |
383 | unsigned int rate_iops[2]; |
384 | unsigned int rate_iops_min[2]; | |
2dc1bbeb JA |
385 | |
386 | char *ioscheduler; | |
387 | ||
388 | /* | |
389 | * CPU "io" cycle burner | |
390 | */ | |
391 | unsigned int cpuload; | |
392 | unsigned int cpucycle; | |
f2bba182 RR |
393 | |
394 | /* | |
395 | * I/O Error handling | |
396 | */ | |
397 | unsigned int continue_on_error; | |
9ac8a797 JA |
398 | |
399 | /* | |
400 | * Benchmark profile type | |
401 | */ | |
79d16311 | 402 | char *profile; |
a696fa2a JA |
403 | |
404 | /* | |
405 | * blkio cgroup support | |
406 | */ | |
a696fa2a JA |
407 | char *cgroup; |
408 | unsigned int cgroup_weight; | |
7de87099 | 409 | unsigned int cgroup_nodelete; |
e0b0d892 JA |
410 | |
411 | unsigned int uid; | |
412 | unsigned int gid; | |
44f29692 JA |
413 | |
414 | unsigned int sync_file_range; | |
2dc1bbeb JA |
415 | }; |
416 | ||
e4e33258 JA |
417 | #define FIO_VERROR_SIZE 128 |
418 | ||
2dc1bbeb JA |
419 | /* |
420 | * This describes a single thread/process executing a fio job. | |
421 | */ | |
422 | struct thread_data { | |
423 | struct thread_options o; | |
e4e33258 | 424 | char verror[FIO_VERROR_SIZE]; |
2dc1bbeb JA |
425 | pthread_t thread; |
426 | int thread_number; | |
427 | int groupid; | |
428 | struct thread_stat ts; | |
126d65c6 | 429 | struct fio_file **files; |
dd87b2c9 | 430 | unsigned int files_size; |
2dc1bbeb JA |
431 | unsigned int files_index; |
432 | unsigned int nr_open_files; | |
1020a139 | 433 | unsigned int nr_done_files; |
2dc1bbeb JA |
434 | unsigned int nr_normal_files; |
435 | union { | |
436 | unsigned int next_file; | |
437 | os_random_state_t next_file_state; | |
4c07ad86 | 438 | struct frand_state __next_file_state; |
2dc1bbeb JA |
439 | }; |
440 | int error; | |
20e354ef | 441 | int done; |
2dc1bbeb JA |
442 | pid_t pid; |
443 | char *orig_buffer; | |
444 | size_t orig_buffer_size; | |
445 | volatile int terminate; | |
446 | volatile int runstate; | |
447 | unsigned int ioprio; | |
ac684785 | 448 | unsigned int ioprio_set; |
2dc1bbeb | 449 | unsigned int last_was_sync; |
9e144189 | 450 | enum fio_ddir last_ddir; |
2dc1bbeb JA |
451 | |
452 | char *mmapfile; | |
453 | int mmapfd; | |
454 | ||
843a7413 JA |
455 | void *iolog_buf; |
456 | FILE *iolog_f; | |
ebac4655 | 457 | |
da86774e | 458 | char *sysfs_root; |
da86774e | 459 | |
0d29de83 | 460 | unsigned long rand_seeds[7]; |
5bfc35d7 | 461 | |
4c07ad86 JA |
462 | union { |
463 | os_random_state_t bsrange_state; | |
464 | struct frand_state __bsrange_state; | |
465 | }; | |
466 | union { | |
467 | os_random_state_t verify_state; | |
468 | struct frand_state __verify_state; | |
469 | }; | |
470 | union { | |
471 | os_random_state_t trim_state; | |
472 | struct frand_state __trim_state; | |
473 | }; | |
ebac4655 | 474 | |
9e144189 | 475 | unsigned int verify_batch; |
0d29de83 | 476 | unsigned int trim_batch; |
9e144189 | 477 | |
ebac4655 JA |
478 | int shm_id; |
479 | ||
e9c047a0 JA |
480 | /* |
481 | * IO engine hooks, contains everything needed to submit an io_u | |
482 | * to any of the available IO engines. | |
483 | */ | |
2866c82d | 484 | struct ioengine_ops *io_ops; |
ebac4655 | 485 | |
e9c047a0 JA |
486 | /* |
487 | * Current IO depth and list of free and busy io_u's. | |
488 | */ | |
ebac4655 | 489 | unsigned int cur_depth; |
d8005759 | 490 | unsigned int io_u_queued; |
01743ee1 JA |
491 | struct flist_head io_u_freelist; |
492 | struct flist_head io_u_busylist; | |
493 | struct flist_head io_u_requeues; | |
e8462bd8 JA |
494 | pthread_mutex_t io_u_lock; |
495 | pthread_cond_t free_cond; | |
496 | ||
497 | /* | |
498 | * async verify offload | |
499 | */ | |
500 | struct flist_head verify_list; | |
501 | pthread_t *verify_threads; | |
502 | unsigned int nr_verify_threads; | |
503 | pthread_cond_t verify_cond; | |
504 | int verify_thread_exit; | |
ebac4655 | 505 | |
e9c047a0 JA |
506 | /* |
507 | * Rate state | |
508 | */ | |
ba3e4e0c | 509 | unsigned long rate_nsec_cycle[2]; |
581e7141 JA |
510 | long rate_pending_usleep[2]; |
511 | unsigned long rate_bytes[2]; | |
512 | unsigned long rate_blocks[2]; | |
513 | struct timeval lastrate[2]; | |
ebac4655 | 514 | |
ebac4655 | 515 | unsigned long long total_io_size; |
2e3bd4c2 | 516 | unsigned long long fill_device_size; |
ebac4655 | 517 | |
755200a3 | 518 | unsigned long io_issues[2]; |
9104f874 JA |
519 | unsigned long long io_blocks[2]; |
520 | unsigned long long io_bytes[2]; | |
48f5abd3 | 521 | unsigned long long io_skip_bytes; |
9104f874 | 522 | unsigned long long this_io_bytes[2]; |
079ad09b | 523 | unsigned long long zone_bytes; |
cdd18ad8 | 524 | struct fio_mutex *mutex; |
ebac4655 | 525 | |
e9c047a0 JA |
526 | /* |
527 | * State for random io, a bitmap of blocks done vs not done | |
528 | */ | |
4c07ad86 JA |
529 | union { |
530 | os_random_state_t random_state; | |
531 | struct frand_state __random_state; | |
532 | }; | |
ebac4655 | 533 | |
ebac4655 JA |
534 | struct timeval start; /* start of this loop */ |
535 | struct timeval epoch; /* time job was started */ | |
a61eddec | 536 | struct timeval last_issue; |
993bf48b JA |
537 | struct timeval tv_cache; |
538 | unsigned int tv_cache_nr; | |
539 | unsigned int tv_cache_mask; | |
721938ae | 540 | unsigned int ramp_time_over; |
ebac4655 | 541 | |
e9c047a0 JA |
542 | /* |
543 | * read/write mixed workload state | |
544 | */ | |
4c07ad86 JA |
545 | union { |
546 | os_random_state_t rwmix_state; | |
547 | struct frand_state __rwmix_state; | |
548 | }; | |
e4928662 | 549 | unsigned long rwmix_issues; |
e9c047a0 | 550 | enum fio_ddir rwmix_ddir; |
5736c10d | 551 | unsigned int ddir_seq_nr; |
a6ccc7be | 552 | |
e9c047a0 | 553 | /* |
8de8f047 JA |
554 | * IO history logs for verification. We use a tree for sorting, |
555 | * if we are overwriting. Otherwise just use a fifo. | |
e9c047a0 | 556 | */ |
4b87898e | 557 | struct rb_root io_hist_tree; |
01743ee1 | 558 | struct flist_head io_hist_list; |
9e144189 | 559 | unsigned long io_hist_len; |
8de8f047 JA |
560 | |
561 | /* | |
562 | * For IO replaying | |
563 | */ | |
01743ee1 | 564 | struct flist_head io_log_list; |
433afcb4 | 565 | |
0d29de83 JA |
566 | /* |
567 | * For tracking/handling discards | |
568 | */ | |
569 | struct flist_head trim_list; | |
570 | unsigned long trim_entries; | |
571 | ||
1907dbc6 JA |
572 | /* |
573 | * for fileservice, how often to switch to a new file | |
574 | */ | |
575 | unsigned int file_service_nr; | |
576 | unsigned int file_service_left; | |
577 | struct fio_file *file_service_file; | |
9c60ce64 | 578 | |
44f29692 JA |
579 | unsigned int sync_file_range_nr; |
580 | ||
9c60ce64 JA |
581 | /* |
582 | * For generating file sizes | |
583 | */ | |
4c07ad86 JA |
584 | union { |
585 | os_random_state_t file_size_state; | |
586 | struct frand_state __file_size_state; | |
587 | }; | |
f2bba182 RR |
588 | |
589 | /* | |
590 | * Error counts | |
591 | */ | |
592 | unsigned int total_err_count; | |
593 | int first_error; | |
15dc1934 JA |
594 | |
595 | /* | |
596 | * Can be overloaded by profiles | |
597 | */ | |
7eb36574 | 598 | struct prof_io_ops prof_io_ops; |
58c55ba0 | 599 | void *prof_data; |
ebac4655 JA |
600 | }; |
601 | ||
e592a06b AC |
602 | /* |
603 | * when should interactive ETA output be generated | |
604 | */ | |
605 | enum { | |
606 | FIO_ETA_AUTO, | |
607 | FIO_ETA_ALWAYS, | |
608 | FIO_ETA_NEVER, | |
609 | }; | |
610 | ||
/*
 * Record an error on a thread, unless one is already recorded.
 *
 *   td   - pointer to the thread state; must have 'error', 'first_error'
 *          and 'verror' members
 *   err  - error code stored into td->error
 *   msg  - human readable description of the error
 *   func - name of the failing function/operation, used in the message
 *
 * If td->error is already non-zero the macro does nothing (the 'break'
 * leaves the do/while). Otherwise td->error is set to 'err' and, as long
 * as td->first_error is still zero, a "file:..., func=..., error=..."
 * string is formatted into td->verror.
 *
 * Every use of 'td' is parenthesized so that arguments such as '&obj'
 * expand correctly. The temporary has a macro-private name so that a
 * caller passing a variable called 'e' does not end up with a
 * self-initialized local. snprintf() always NUL-terminates, so the full
 * size of the buffer is passed.
 */
#define __td_verror(td, err, msg, func)					\
	do {								\
		if ((td)->error)					\
			break;						\
		int __td_err = (err);					\
		(td)->error = __td_err;					\
		if (!(td)->first_error)					\
			snprintf((td)->verror, sizeof((td)->verror),	\
				 "file:%s:%d, func=%s, error=%s",	\
				 __FILE__, __LINE__, (func), (msg));	\
	} while (0)
620 | ||
b990b5c0 | 621 | |
f2bba182 RR |
/*
 * Reset the error code recorded on a thread (td->error) to zero.
 *
 * Wrapped in do { } while (0) without a trailing semicolon so that
 * "td_clear_error(td);" is exactly one statement and can be used as the
 * body of an un-braced if/else.
 */
#define td_clear_error(td)		\
	do {				\
		(td)->error = 0;	\
	} while (0)
e1161c32 JA |
/*
 * Record error code 'err' for 'func' on thread 'td', using strerror(err)
 * as the message text. Forwards to __td_verror().
 *
 * Note that 'err' appears twice in the expansion, so it should not be an
 * expression with side effects.
 */
#define td_verror(td, err, func)					\
	__td_verror((td), (err), strerror((err)), (func))
/*
 * Record error code 'err' for 'func' on thread 'td' with a caller
 * supplied message 'msg'. Forwards to __td_verror() unchanged.
 */
#define td_vmsg(td, err, msg, func)					\
	__td_verror((td), (err), (msg), (func))
b990b5c0 | 628 | |
ebac4655 JA |
629 | extern int exitall_on_terminate; |
630 | extern int thread_number; | |
9cedf167 | 631 | extern int nr_process, nr_thread; |
ebac4655 JA |
632 | extern int shm_id; |
633 | extern int groupid; | |
c6ae0a5b | 634 | extern int terse_output; |
53cdc686 | 635 | extern int temp_stall_ts; |
1e97cce9 | 636 | extern unsigned long long mlock_size; |
cfc99db7 | 637 | extern unsigned long page_mask, page_size; |
4241ea8f | 638 | extern int read_only; |
e592a06b | 639 | extern int eta_print; |
d3eeeabc | 640 | extern unsigned long done_secs; |
01f06b63 | 641 | extern char *job_section; |
be4ecfdf JA |
642 | extern int fio_gtod_offload; |
643 | extern int fio_gtod_cpu; | |
c223da83 | 644 | extern enum fio_cs fio_clock_source; |
a9523c6f | 645 | extern int warnings_fatal; |
ebac4655 JA |
646 | |
647 | extern struct thread_data *threads; | |
648 | ||
7101d9c2 JA |
649 | static inline void fio_ro_check(struct thread_data *td, struct io_u *io_u) |
650 | { | |
651 | assert(!(io_u->ddir == DDIR_WRITE && !td_write(td))); | |
652 | } | |
653 | ||
/*
 * Helpers for addressing a block inside a bitmap made of unsigned longs.
 *
 * BLOCKS_PER_MAP  - number of blocks tracked by one map word
 *                   (8 bits per byte of an unsigned long)
 * TO_MAP_BLOCK    - block number used for the lookup; currently just 'b',
 *                   the 'f' argument is not used
 * RAND_MAP_IDX    - index of the map word holding block 'b'
 * RAND_MAP_BIT    - bit position of block 'b' inside that word; the mask
 *                   form relies on BLOCKS_PER_MAP being a power of two
 */
#define BLOCKS_PER_MAP		(sizeof(unsigned long) * 8)
#define TO_MAP_BLOCK(f, b)	(b)
#define RAND_MAP_IDX(f, b)	\
	(TO_MAP_BLOCK(f, b) / BLOCKS_PER_MAP)
#define RAND_MAP_BIT(f, b)	\
	(TO_MAP_BLOCK(f, b) & (BLOCKS_PER_MAP - 1))
ebac4655 | 658 | |
fca70358 | 659 | #define REAL_MAX_JOBS 2048 |
ebac4655 | 660 | |
/*
 * True when error code 'e' is one of the codes treated as non-fatal
 * here: EIO or EILSEQ. 'e' may be evaluated twice.
 */
#define td_non_fatal_error(e)	\
	((e) == EIO || (e) == EILSEQ)
f2bba182 RR |
662 | |
663 | static inline void update_error_count(struct thread_data *td, int err) | |
664 | { | |
665 | td->total_err_count++; | |
666 | if (td->total_err_count == 1) | |
667 | td->first_error = err; | |
668 | } | |
669 | ||
87dc1ab1 JA |
670 | static inline int should_fsync(struct thread_data *td) |
671 | { | |
672 | if (td->last_was_sync) | |
673 | return 0; | |
2dc1bbeb | 674 | if (td->o.odirect) |
87dc1ab1 | 675 | return 0; |
2dc1bbeb | 676 | if (td_write(td) || td_rw(td) || td->o.override_sync) |
87dc1ab1 JA |
677 | return 1; |
678 | ||
679 | return 0; | |
680 | } | |
681 | ||
8914a9d8 | 682 | /* |
214e1eca | 683 | * Init/option functions |
8914a9d8 | 684 | */ |
72cb971b | 685 | extern int __must_check parse_options(int, char **); |
3b8b7135 | 686 | extern int fio_options_parse(struct thread_data *, char **, int); |
74929ac2 | 687 | extern void fio_keywords_init(void); |
214e1eca JA |
688 | extern int fio_cmd_option_parse(struct thread_data *, const char *, char *); |
689 | extern void fio_fill_default_options(struct thread_data *); | |
690 | extern int fio_show_option_help(const char *); | |
691 | extern void fio_options_dup_and_init(struct option *); | |
d23bb327 JA |
692 | extern void options_mem_dupe(struct thread_data *); |
693 | extern void options_mem_free(struct thread_data *); | |
5bfc35d7 | 694 | extern void td_fill_rand_seeds(struct thread_data *); |
79d16311 | 695 | extern void add_job_opts(const char **); |
1ec3d69b JA |
696 | extern char *num2str(unsigned long, int, int, int); |
697 | ||
214e1eca | 698 | #define FIO_GETOPT_JOB 0x89988998 |
07b3232d | 699 | #define FIO_NR_OPTIONS (FIO_MAX_OPTS + 128) |
8914a9d8 | 700 | |
263e529f JA |
701 | /* |
702 | * ETA/status stuff | |
703 | */ | |
704 | extern void print_thread_status(void); | |
705 | extern void print_status_init(int); | |
706 | ||
707 | /* | |
708 | * Thread life cycle. Once a thread has a runstate beyond TD_INITIALIZED, it | |
709 | * will never go back again. It may cycle between running/verifying/fsyncing. | |
710 | * Once the thread reaches TD_EXITED, it is just waiting for the core to | |
711 | * reap it. | |
712 | */ | |
713 | enum { | |
714 | TD_NOT_CREATED = 0, | |
715 | TD_CREATED, | |
716 | TD_INITIALIZED, | |
b29ee5b3 | 717 | TD_RAMP, |
263e529f | 718 | TD_RUNNING, |
b0f65863 | 719 | TD_PRE_READING, |
263e529f JA |
720 | TD_VERIFYING, |
721 | TD_FSYNCING, | |
722 | TD_EXITED, | |
723 | TD_REAPED, | |
724 | }; | |
725 | ||
b29ee5b3 JA |
726 | extern void td_set_runstate(struct thread_data *, int); |
727 | ||
2f9ade3c JA |
728 | /* |
729 | * Memory helpers | |
730 | */ | |
b2fdda43 | 731 | extern int __must_check fio_pin_memory(void); |
2f9ade3c | 732 | extern void fio_unpin_memory(void); |
b2fdda43 | 733 | extern int __must_check allocate_io_mem(struct thread_data *); |
2f9ade3c JA |
734 | extern void free_io_mem(struct thread_data *); |
735 | ||
b29ee5b3 JA |
736 | /* |
737 | * Reset stats after ramp time completes | |
738 | */ | |
739 | extern void reset_all_stats(struct thread_data *); | |
740 | ||
fb7b71a3 JA |
741 | /* |
742 | * blktrace support | |
743 | */ | |
5e62c22a | 744 | #ifdef FIO_HAVE_BLKTRACE |
fb7b71a3 JA |
745 | extern int is_blktrace(const char *); |
746 | extern int load_blktrace(struct thread_data *, const char *); | |
5e62c22a | 747 | #endif |
fb7b71a3 | 748 | |
2866c82d JA |
/*
 * Compiler attribute shorthands (GCC-style __attribute__ syntax).
 *
 * fio_unused - mark variables passed to ops functions as unused, to
 *              silence gcc warnings
 * fio_init   - mark a function as a constructor
 * fio_exit   - mark a function as a destructor
 *
 * All three use the same __attribute__ spelling for consistency.
 */
#define fio_unused	__attribute__((__unused__))
#define fio_init	__attribute__((constructor))
#define fio_exit	__attribute__((destructor))
2866c82d | 755 | |
34572e28 JA |
/*
 * Iterate over all threads: 'td' walks the global 'threads' array from
 * its first element while 'i' counts from 0 up to (but not including)
 * thread_number. Must be followed by the loop body.
 */
#define for_each_td(td, i)						\
	for ((i) = 0, (td) = &threads[0];				\
	     (i) < (int) thread_number;					\
	     (i)++, (td)++)
/*
 * Iterate over the files of a thread. 'i' is the index and 'f' is set to
 * (td)->files[i] on every pass; iteration stops after o.nr_files entries
 * or at the first NULL entry. Nothing is touched when
 * (td)->files_index is zero. Must be followed by the loop body.
 *
 * The guard is written as "if (!...) { } else for (...)" so the macro
 * already owns its 'else': an 'else' written by the caller after the
 * loop body can no longer silently attach to the macro's internal 'if'.
 */
#define for_each_file(td, f, i)						\
	if (!(td)->files_index) {					\
	} else								\
		for ((i) = 0, (f) = (td)->files[0];			\
		     (i) < (td)->o.nr_files &&				\
		     ((f) = (td)->files[(i)]) != NULL;			\
		     (i)++)
53cdc686 | 763 | |
0032bf9f JA |
/*
 * Assertion that also updates thread state. If 'cond' is false:
 *   - prints "file:<file>:<line>, assert <cond> failed" to stderr,
 *   - moves the thread to TD_EXITED via td_set_runstate(),
 *   - sets (td)->error to EFAULT,
 *   - then writes through a NULL pointer to bring the process down
 *     (presumably so the fault is reported at the failing site).
 *
 * The pointer is volatile-qualified: a plain store through a null
 * pointer is undefined behaviour and compilers are allowed to delete it,
 * which would let execution continue past a failed assertion.
 */
#define fio_assert(td, cond)	do {					\
	if (!(cond)) {							\
		volatile int *__foo = NULL;				\
		fprintf(stderr, "file:%s:%d, assert %s failed\n", __FILE__, __LINE__, #cond);	\
		td_set_runstate((td), TD_EXITED);			\
		(td)->error = EFAULT;					\
		*__foo = 0;						\
	}								\
} while (0)
773 | ||
12d9d841 JA |
774 | static inline int fio_fill_issue_time(struct thread_data *td) |
775 | { | |
776 | if (td->o.read_iolog_file || | |
777 | !td->o.disable_clat || !td->o.disable_slat || !td->o.disable_bw) | |
778 | return 1; | |
779 | ||
780 | return 0; | |
781 | } | |
782 | ||
581e7141 JA |
783 | static inline int __should_check_rate(struct thread_data *td, |
784 | enum fio_ddir ddir) | |
785 | { | |
786 | struct thread_options *o = &td->o; | |
787 | ||
788 | /* | |
789 | * If some rate setting was given, we need to check it | |
790 | */ | |
791 | if (o->rate[ddir] || o->ratemin[ddir] || o->rate_iops[ddir] || | |
792 | o->rate_iops_min[ddir]) | |
793 | return 1; | |
794 | ||
795 | return 0; | |
796 | } | |
797 | ||
/*
 * Returns non-zero if rate checking is needed after this round of IO.
 *
 * 'bytes_done' holds the bytes completed for direction 0 and 1. Only
 * directions that actually completed bytes are considered; for those the
 * result of __should_check_rate() is OR-ed into the return value.
 */
static inline int should_check_rate(struct thread_data *td,
				    unsigned long *bytes_done)
{
	int need_check = 0;
	int ddir;

	for (ddir = 0; ddir < 2; ddir++) {
		if (!bytes_done[ddir])
			continue;
		need_check |= __should_check_rate(td, ddir);
	}

	return need_check;
}
810 | ||
d529ee19 JA |
/*
 * Returns 1 if 'val' is a power of two, 0 otherwise. Zero is not
 * considered a power of two.
 */
static inline int is_power_of_2(unsigned int val)
{
	if (!val)
		return 0;

	/* a power of two has exactly one bit set; val - 1 clears it */
	return !(val & (val - 1));
}
815 | ||
e8462bd8 JA |
816 | /* |
817 | * We currently only need to do locking if we have verifier threads | |
818 | * accessing our internal structures too | |
819 | */ | |
820 | static inline void td_io_u_lock(struct thread_data *td) | |
821 | { | |
822 | if (td->o.verify_async) | |
823 | pthread_mutex_lock(&td->io_u_lock); | |
824 | } | |
825 | ||
826 | static inline void td_io_u_unlock(struct thread_data *td) | |
827 | { | |
828 | if (td->o.verify_async) | |
829 | pthread_mutex_unlock(&td->io_u_lock); | |
830 | } | |
831 | ||
832 | static inline void td_io_u_free_notify(struct thread_data *td) | |
833 | { | |
834 | if (td->o.verify_async) | |
835 | pthread_cond_signal(&td->free_cond); | |
836 | } | |
837 | ||
ebac4655 | 838 | #endif |