[PATCH] Add 'bs_unaligned' option
[fio.git] / fio.h
CommitLineData
ebac4655
JA
1#ifndef FIO_H
2#define FIO_H
3
4#include <sched.h>
5#include <limits.h>
6#include <pthread.h>
7#include <sys/time.h>
8#include <sys/resource.h>
3c39a379
JA
9#include <errno.h>
10#include <stdlib.h>
11#include <stdio.h>
6d6f031f 12#include <unistd.h>
ebac4655
JA
13
14#include "list.h"
15#include "md5.h"
16#include "crc32.h"
17#include "arch.h"
18#include "os.h"
19
/*
 * Accumulator for one statistic.
 *
 * NOTE(review): judging by the field names, val/val_sq are a running sum and
 * sum of squares, max_val/min_val the extremes seen and samples the number of
 * values folded in; the code maintaining them is outside this header.
 */
struct io_stat {
	unsigned long val;
	unsigned long val_sq;
	unsigned long max_val;
	unsigned long min_val;
	unsigned long samples;
};
27
/*
 * One logged sample: a timestamp, the sampled value and the data direction
 * it belongs to (units are set by the logging code, not visible here).
 */
struct io_sample {
	unsigned long time;
	unsigned long val;
	unsigned int ddir;
};
33
/*
 * A growable array of io_sample entries: nr_samples are in use out of
 * max_samples slots pointed to by log.
 */
struct io_log {
	unsigned long nr_samples;
	unsigned long max_samples;
	struct io_sample *log;
};
39
40struct io_piece {
41 struct list_head list;
53cdc686 42 struct fio_file *file;
ebac4655
JA
43 unsigned long long offset;
44 unsigned int len;
aea47d44 45 int ddir;
ebac4655
JA
46};
47
48/*
49 * The io unit
50 */
51struct io_u {
52 union {
53#ifdef FIO_HAVE_LIBAIO
54 struct iocb iocb;
55#endif
56#ifdef FIO_HAVE_POSIXAIO
57 struct aiocb aiocb;
58#endif
59#ifdef FIO_HAVE_SGIO
60 struct sg_io_hdr hdr;
61#endif
62 };
63 struct timeval start_time;
64 struct timeval issue_time;
65
66 char *buf;
67 unsigned int buflen;
68 unsigned long long offset;
69
70 unsigned int resid;
71 unsigned int error;
72
ebac4655
JA
73 unsigned char ddir;
74
dfd7bc2c
JA
75 /*
76 * io engine private data
77 */
78 union {
79 unsigned int index;
80 unsigned int seen;
81 };
82
53cdc686
JA
83 struct fio_file *file;
84
ebac4655
JA
85 struct list_head list;
86};
87
/*
 * Magic number; presumably the value stored in verify_header.fio_magic
 * (confirm against the verify code).
 */
#define FIO_HDR_MAGIC	0xf00baaef
89
/*
 * Verification methods; VERIFY_NONE is 0 so a zeroed setting means
 * "no verification".
 */
enum {
	VERIFY_NONE = 0,
	VERIFY_MD5,
	VERIFY_CRC32,
};
95
96struct verify_header {
97 unsigned int fio_magic;
98 unsigned int len;
99 unsigned int verify_type;
100 union {
101 char md5_digest[MD5_HASH_WORDS * 4];
102 unsigned long crc32;
103 };
104};
105
/*
 * Aggregated statistics for a group of jobs. Every member is a two-element
 * array; presumably index 0/1 follow DDIR_READ/DDIR_WRITE (confirm against
 * the stat code).
 */
struct group_run_stats {
	unsigned long long max_run[2], min_run[2];
	unsigned long long max_bw[2], min_bw[2];
	unsigned long long io_kb[2];
	unsigned long long agg[2];
};
112
e9c047a0
JA
/*
 * Data direction of an io. READ and WRITE are 0 and 1, matching the
 * two-element arrays used throughout this header.
 */
enum fio_ddir {
	DDIR_READ = 0,
	DDIR_WRITE,
	DDIR_SYNC,
};
118
/*
 * What type of allocation to use for io buffers
 */
enum fio_memtype {
	MEM_MALLOC = 0,	/* ordinary malloc */
	MEM_SHM,	/* use shared memory segments */
	MEM_MMAP,	/* use anonymous mmap */
};
127
/*
 * The type of object we are working on. Values start at 1, so 0 is not a
 * valid type.
 */
enum fio_filetype {
	FIO_TYPE_FILE = 1,
	FIO_TYPE_BD,
	FIO_TYPE_CHAR,
};
136
/*
 * Bit flags describing an io engine; each value is a distinct bit so they
 * can be OR'ed together (see ioengine_ops.flags).
 */
enum fio_ioengine_flags {
	FIO_SYNCIO	= 1 << 0,
	FIO_CPUIO	= 1 << 1,
	FIO_MMAPIO	= 1 << 2,
	FIO_RAWIO	= 1 << 3,
};
143
53cdc686
JA
/*
 * Per-file state of a job.
 */
struct fio_file {
	/*
	 * A file may not be a file descriptor, let the io engine decide
	 */
	union {
		unsigned long file_data;
		int fd;
	};
	char *file_name;
	void *mmap;
	unsigned long long file_size;
	unsigned long long real_file_size;
	unsigned long long file_offset;
	unsigned long long last_pos;

	/*
	 * Block map of num_maps words, indexed through the RAND_MAP_IDX()
	 * and RAND_MAP_BIT() macros.
	 */
	unsigned long *file_map;
	unsigned int num_maps;
};
162
e9c047a0
JA
163/*
164 * This describes a single thread/process executing a fio job.
165 */
ebac4655 166struct thread_data {
b4692828 167 char *name;
ef899b63 168 char *directory;
13f8e2d2 169 char *filename;
ebac4655
JA
170 char verror[80];
171 pthread_t thread;
172 int thread_number;
173 int groupid;
e9c047a0 174 enum fio_filetype filetype;
53cdc686
JA
175 struct fio_file *files;
176 unsigned int nr_files;
13f8e2d2 177 unsigned int nr_uniq_files;
53cdc686 178 unsigned int next_file;
ebac4655 179 int error;
ebac4655
JA
180 pid_t pid;
181 char *orig_buffer;
182 size_t orig_buffer_size;
183 volatile int terminate;
184 volatile int runstate;
e9c047a0 185 enum fio_ddir ddir;
3d60d1ed 186 unsigned int iomix;
ebac4655 187 unsigned int ioprio;
87dc1ab1 188 unsigned int last_was_sync;
e9c047a0 189
9158d2f7
JA
190 unsigned int sequential;
191 unsigned int odirect;
192 unsigned int invalidate_cache;
193 unsigned int create_serialize;
194 unsigned int create_fsync;
195 unsigned int end_fsync;
196 unsigned int sync_io;
197 unsigned int verify;
198 unsigned int use_thread;
199 unsigned int unlink;
200 unsigned int do_disk_util;
201 unsigned int override_sync;
202 unsigned int rand_repeatable;
203 unsigned int write_lat_log;
204 unsigned int write_bw_log;
bb8895e0 205 unsigned int norandommap;
690adba3 206 unsigned int bs_unaligned;
e9c047a0 207
ebac4655
JA
208 unsigned int bs;
209 unsigned int min_bs;
210 unsigned int max_bs;
ebac4655
JA
211 unsigned int thinktime;
212 unsigned int fsync_blocks;
213 unsigned int start_delay;
906c8d75 214 unsigned long timeout;
ebac4655 215 unsigned int overwrite;
ebac4655 216 unsigned int bw_avg_time;
ebac4655 217 unsigned int loops;
20dc95c4
JA
218 unsigned long long zone_size;
219 unsigned long long zone_skip;
e9c047a0 220 enum fio_memtype mem_type;
ebac4655
JA
221 unsigned int stonewall;
222 unsigned int numjobs;
ebac4655
JA
223 unsigned int iodepth;
224 os_cpu_mask_t cpumask;
aea47d44 225 unsigned int iolog;
843a7413 226 unsigned int read_iolog;
a6ccc7be
JA
227 unsigned int rwmixcycle;
228 unsigned int rwmixread;
e1f36503 229 unsigned int rwmixwrite;
b6f4d880 230 unsigned int nice;
aea47d44 231
076efc7c
JA
232 char *read_iolog_file;
233 char *write_iolog_file;
843a7413
JA
234 void *iolog_buf;
235 FILE *iolog_f;
ebac4655 236
da86774e 237 char *sysfs_root;
da86774e
JA
238 char *ioscheduler;
239
6dfd46b9
JA
240 os_random_state_t bsrange_state;
241 os_random_state_t verify_state;
ebac4655
JA
242
243 int shm_id;
244
e9c047a0
JA
245 /*
246 * IO engine hooks, contains everything needed to submit an io_u
247 * to any of the available IO engines.
248 */
2866c82d 249 struct ioengine_ops *io_ops;
ebac4655 250
e9c047a0
JA
251 /*
252 * Current IO depth and list of free and busy io_u's.
253 */
ebac4655
JA
254 unsigned int cur_depth;
255 struct list_head io_u_freelist;
256 struct list_head io_u_busylist;
257
e9c047a0
JA
258 /*
259 * Rate state
260 */
ebac4655
JA
261 unsigned int rate;
262 unsigned int ratemin;
263 unsigned int ratecycle;
264 unsigned long rate_usec_cycle;
265 long rate_pending_usleep;
266 unsigned long rate_bytes;
267 struct timeval lastrate;
268
269 unsigned long runtime[2]; /* msec */
270 unsigned long long io_size;
53cdc686
JA
271 unsigned long long total_file_size;
272 unsigned long long start_offset;
ebac4655
JA
273 unsigned long long total_io_size;
274
9104f874
JA
275 unsigned long long io_blocks[2];
276 unsigned long long io_bytes[2];
277 unsigned long long zone_bytes;
278 unsigned long long this_io_bytes[2];
bbfd6b00 279 volatile int mutex;
ebac4655 280
e9c047a0
JA
281 /*
282 * State for random io, a bitmap of blocks done vs not done
283 */
6dfd46b9 284 os_random_state_t random_state;
ebac4655 285
b990b5c0
JA
286 /*
287 * CPU "io" cycle burner
288 */
289 unsigned int cpuload;
290 unsigned int cpucycle;
291
ebac4655
JA
292 /*
293 * bandwidth and latency stats
294 */
295 struct io_stat clat_stat[2]; /* completion latency */
296 struct io_stat slat_stat[2]; /* submission latency */
297 struct io_stat bw_stat[2]; /* bandwidth stats */
298
9104f874 299 unsigned long long stat_io_bytes[2];
ebac4655
JA
300 struct timeval stat_sample_time[2];
301
302 struct io_log *slat_log;
303 struct io_log *clat_log;
304 struct io_log *bw_log;
305
306 struct timeval start; /* start of this loop */
307 struct timeval epoch; /* time job was started */
308
e9c047a0
JA
309 /*
310 * fio system usage accounting
311 */
ebac4655
JA
312 struct rusage ru_start;
313 struct rusage ru_end;
314 unsigned long usr_time;
315 unsigned long sys_time;
316 unsigned long ctx;
317
e9c047a0
JA
318 /*
319 * read/write mixed workload state
320 */
6dfd46b9 321 os_random_state_t rwmix_state;
a6ccc7be 322 struct timeval rwmix_switch;
e9c047a0 323 enum fio_ddir rwmix_ddir;
a6ccc7be 324
4e0ba8af
JA
325 /*
326 * Pre-run and post-run shell
327 */
328 char *exec_prerun;
329 char *exec_postrun;
330
e9c047a0
JA
331 /*
332 * IO historic logs
333 */
ebac4655 334 struct list_head io_hist_list;
aea47d44 335 struct list_head io_log_list;
ebac4655
JA
336};
337
/*
 * Record an error on a job.
 *
 * __td_verror(td, err, msg) stores the numeric code 'err' in (td)->error and
 * formats "file:<source file>:<line>, error=<msg>" into (td)->verror, where
 * file and line are those of the call site. Output is truncated to fit the
 * verror buffer and is always NUL-terminated by snprintf().
 *
 * 'td' is expanded more than once, so it must be free of side effects. It is
 * fully parenthesized, so pointer expressions such as 'tds + 1' are fine.
 * 'err' is evaluated exactly once. The temporaries carry a trailing
 * underscore so they cannot capture a caller variable such as 'e' that
 * appears in the 'err' or 'msg' expression.
 */
#define __td_verror(td, err, msg)					\
	do {								\
		int td_verr_code_ = (err);				\
		(td)->error = td_verr_code_;				\
		snprintf((td)->verror, sizeof((td)->verror),		\
			 "file:%s:%d, error=%s", __FILE__, __LINE__,	\
			 (msg));					\
	} while (0)

/*
 * td_verror(td, err): record errno-style code 'err' with strerror(err) as the
 * message. 'err' is evaluated once and then reused for both the code and the
 * message, so passing 'errno' is safe.
 */
#define td_verror(td, err)						\
	do {								\
		int td_errnum_ = (err);					\
		__td_verror((td), td_errnum_, strerror(td_errnum_));	\
	} while (0)

/*
 * td_vmsg(td, err, msg): record code 'err' with a caller-supplied message.
 */
#define td_vmsg(td, err, msg)	__td_verror((td), (err), (msg))
348
ebac4655 349extern int rate_quit;
ebac4655
JA
350extern int exitall_on_terminate;
351extern int thread_number;
352extern int shm_id;
353extern int groupid;
c6ae0a5b 354extern int terse_output;
eb8bbf48
JA
355extern FILE *f_out;
356extern FILE *f_err;
c1d5725e 357extern char *fio_inst_prefix;
53cdc686 358extern int temp_stall_ts;
ebac4655
JA
359
360extern struct thread_data *threads;
361
ebac4655
JA
/*
 * Direction predicates for a job: td_read()/td_write() compare the job's
 * ddir, td_rw() is true when a read/write mix (iomix) is configured.
 */
#define td_read(td)		((td)->ddir == DDIR_READ)
#define td_write(td)		((td)->ddir == DDIR_WRITE)
#define td_rw(td)		((td)->iomix != 0)
ebac4655
JA
365
/*
 * Helpers for addressing a file's block map.
 *
 * BLOCKS_PER_MAP is the number of bits in one map word. TO_MAP_BLOCK()
 * rebases block number 'b' by the file's starting offset expressed in
 * min_bs-sized blocks; RAND_MAP_IDX()/RAND_MAP_BIT() split the rebased
 * block into a word index and a bit position within that word.
 * (td)->min_bs must be non-zero, since it is used as a divisor.
 */
#define BLOCKS_PER_MAP		(8 * sizeof(long))
#define TO_MAP_BLOCK(td, f, b)	((b) - ((f)->file_offset / (td)->min_bs))
#define RAND_MAP_IDX(td, f, b)	(TO_MAP_BLOCK(td, f, b) / BLOCKS_PER_MAP)
#define RAND_MAP_BIT(td, f, b)	(TO_MAP_BLOCK(td, f, b) & (BLOCKS_PER_MAP - 1))
ebac4655
JA
370
/* Job limit; presumably the size of the 'threads' array (confirm in init code) */
#define MAX_JOBS	(1024)
372
87dc1ab1
JA
373static inline int should_fsync(struct thread_data *td)
374{
375 if (td->last_was_sync)
376 return 0;
377 if (td->odirect)
378 return 0;
379 if (td_write(td) || td_rw(td) || td->override_sync)
380 return 1;
381
382 return 0;
383}
384
ebac4655
JA
/*
 * Raw per-disk counters. The two-element arrays presumably separate reads
 * from writes (confirm against the code that parses the disk stats).
 */
struct disk_util_stat {
	unsigned ios[2];
	unsigned merges[2];
	unsigned long long sectors[2];
	unsigned ticks[2];
	unsigned io_ticks;
	unsigned time_in_queue;
};
393
394struct disk_util {
395 struct list_head list;
396
397 char *name;
398 char path[256];
399 dev_t dev;
400
401 struct disk_util_stat dus;
402 struct disk_util_stat last_dus;
403
404 unsigned long msec;
405 struct timeval time;
406};
407
/*
 * Argument block for the completion helpers: the caller fills in 'nr',
 * the callee reports back through 'error' and 'bytes_done'.
 */
struct io_completion_data {
	int nr;				/* input */

	int error;			/* output */
	unsigned long bytes_done[2];	/* output */
};
414
/* Presumably the disk utilization sampling interval in msec -- confirm at the users */
#define DISK_UTIL_MSEC	(250)
416
6a0106a0
JA
/*
 * Smaller of two values, unless a min() macro is already defined. Each
 * argument may be evaluated twice, so avoid side effects such as min(i++, j).
 */
#ifndef min
#define min(a, b)	((a) < (b) ? (a) : (b))
#endif
420
6796209a
JA
421/*
422 * Log exports
423 */
424extern int read_iolog_get(struct thread_data *, struct io_u *);
425extern void write_iolog_put(struct thread_data *, struct io_u *);
426extern int init_iolog(struct thread_data *td);
427extern void log_io_piece(struct thread_data *, struct io_u *);
428extern void prune_io_piece_log(struct thread_data *);
429extern void write_iolog_close(struct thread_data *);
430
431/*
432 * Logging
433 */
434extern void add_clat_sample(struct thread_data *, int, unsigned long);
435extern void add_slat_sample(struct thread_data *, int, unsigned long);
436extern void add_bw_sample(struct thread_data *, int);
437extern void show_run_stats(void);
438extern void init_disk_util(struct thread_data *);
439extern void update_rusage_stat(struct thread_data *);
440extern void update_io_ticks(void);
441extern void disk_util_timer_arm(void);
8914a9d8
JA
442extern void setup_log(struct io_log **);
443extern void finish_log(struct thread_data *, struct io_log *, const char *);
444extern int setup_rate(struct thread_data *);
6796209a
JA
445
446/*
447 * Time functions
448 */
263e529f 449extern void time_init(void);
6796209a
JA
450extern unsigned long utime_since(struct timeval *, struct timeval *);
451extern unsigned long mtime_since(struct timeval *, struct timeval *);
452extern unsigned long mtime_since_now(struct timeval *);
453extern unsigned long time_since_now(struct timeval *);
263e529f 454extern unsigned long mtime_since_genesis(void);
b990b5c0 455extern void __usec_sleep(unsigned int);
6796209a
JA
456extern void usec_sleep(struct thread_data *, unsigned long);
457extern void rate_throttle(struct thread_data *, unsigned long, unsigned int);
458
8914a9d8
JA
459/*
460 * Init functions
461 */
462extern int parse_options(int, char **);
463extern int init_random_state(struct thread_data *);
464
53cdc686
JA
465/*
466 * File setup/shutdown
467 */
468extern void close_files(struct thread_data *);
469extern int setup_files(struct thread_data *);
e5b401d4 470extern int file_invalidate_cache(struct thread_data *, struct fio_file *);
53cdc686 471
263e529f
JA
472/*
473 * ETA/status stuff
474 */
475extern void print_thread_status(void);
476extern void print_status_init(int);
477
/*
 * Thread life cycle. Once a thread has a runstate beyond TD_INITIALIZED, it
 * will never go back again. It may cycle between running/verifying/fsyncing.
 * Once the thread reaches TD_EXITED, it is just waiting for the core to
 * reap it.
 */
enum {
	TD_NOT_CREATED = 0,
	TD_CREATED,
	TD_INITIALIZED,
	TD_RUNNING,
	TD_VERIFYING,
	TD_FSYNCING,
	TD_EXITED,
	TD_REAPED,
};
494
e29d1b70
JA
495/*
496 * Verify helpers
497 */
498extern void populate_verify_io_u(struct thread_data *, struct io_u *);
499extern int get_next_verify(struct thread_data *td, struct io_u *);
a9619d44 500extern int do_io_u_verify(struct thread_data *, struct io_u **);
e29d1b70 501
2f9ade3c
JA
502/*
503 * Memory helpers
504 */
505extern int fio_pin_memory(void);
506extern void fio_unpin_memory(void);
507extern int allocate_io_mem(struct thread_data *);
508extern void free_io_mem(struct thread_data *);
509
10ba535a
JA
510/*
511 * io unit handling
512 */
/* The queue is full when no free io_u is left on the job's free list */
#define queue_full(td)	list_empty(&(td)->io_u_freelist)
514extern struct io_u *__get_io_u(struct thread_data *);
515extern struct io_u *get_io_u(struct thread_data *, struct fio_file *);
516extern void put_io_u(struct thread_data *, struct io_u *);
517extern void ios_completed(struct thread_data *, struct io_completion_data *);
518extern void io_completed(struct thread_data *, struct io_u *, struct io_completion_data *);
519
520/*
521 * io engine entry points
522 */
8c16d840 523extern int td_io_init(struct thread_data *);
10ba535a
JA
524extern int td_io_prep(struct thread_data *, struct io_u *);
525extern int td_io_queue(struct thread_data *, struct io_u *);
526extern int td_io_sync(struct thread_data *, struct fio_file *);
527extern int td_io_getevents(struct thread_data *, int, int, struct timespec *);
528
bbfd6b00
JA
/*
 * This is a pretty crappy semaphore implementation, but with the use that fio
 * has (just signalling start/go conditions), it doesn't have to be better.
 * Naturally this would not work for any type of contended semaphore or
 * for real locking.
 */

/* Set the semaphore counter to 'val'. */
static inline void fio_sem_init(volatile int *sem, int val)
{
	*sem = val;
}
539
/*
 * Take the semaphore: poll every 10 msec while the counter is exactly 0,
 * then decrement it. The check and the decrement are separate, plain
 * accesses, so this is only suitable for simple uncontended signalling.
 */
static inline void fio_sem_down(volatile int *sem)
{
	while (*sem == 0)
		usleep(10000);

	(*sem)--;
}
547
/* Release the semaphore by incrementing the counter (plain, non-atomic). */
static inline void fio_sem_up(volatile int *sem)
{
	(*sem)++;
}
552
3b70d7e5
JA
/*
 * If logging output to a file, stderr should go to both stderr and f_err
 *
 * Takes a printf-style format plus arguments. The arguments are expanded
 * into both fprintf() calls, so they are evaluated twice whenever f_err is
 * not stderr; keep them free of side effects.
 */
#define log_err(...)	do {				\
	fprintf(f_err, __VA_ARGS__);			\
	if (f_err != stderr)				\
		fprintf(stderr, __VA_ARGS__);		\
	} while (0)
561
2866c82d
JA
/*
 * Operations table of an io engine: identification (name, version, flags),
 * the hook functions, and two opaque pointers.
 *
 * NOTE(review): 'version' is presumably checked against FIO_IOOPS_VERSION,
 * 'flags' presumably holds enum fio_ioengine_flags bits and 'dlhandle'
 * presumably is the handle of a dynamically loaded engine -- confirm in the
 * engine loader.
 */
struct ioengine_ops {
	char name[16];
	int version;
	int flags;
	int (*setup)(struct thread_data *);
	int (*init)(struct thread_data *);
	int (*prep)(struct thread_data *, struct io_u *);
	int (*queue)(struct thread_data *, struct io_u *);
	int (*getevents)(struct thread_data *, int, int, struct timespec *);
	struct io_u *(*event)(struct thread_data *, int);
	int (*cancel)(struct thread_data *, struct io_u *);
	void (*cleanup)(struct thread_data *);
	void *data;
	void *dlhandle;
};
577
/* Version of the ioengine_ops interface declared in this header */
#define FIO_IOOPS_VERSION	3
2866c82d 579
b4692828 580extern struct ioengine_ops *load_ioengine(struct thread_data *, const char *);
2866c82d
JA
581extern void close_ioengine(struct thread_data *);
582
/*
 * Mark unused variables passed to ops functions as unused, to silence gcc
 */
#define fio_unused	__attribute((__unused__))
587
34572e28
JA
/*
 * Iteration helpers, used as the head of a for statement.
 *
 * for_each_td(td, i) walks the global 'threads' array for 'thread_number'
 * entries; for_each_file(td, f, i) walks (td)->files for (td)->nr_files
 * entries. 'i' is the running index and is compared as an int.
 */
#define for_each_td(td, i)	\
	for ((i) = 0, (td) = &threads[0]; (i) < (int) thread_number; (i)++, (td)++)
#define for_each_file(td, f, i)	\
	for ((i) = 0, (f) = &(td)->files[0]; (i) < (int) (td)->nr_files; (i)++, (f)++)
53cdc686 592
ebac4655 593#endif