Fio 1.16.3
[fio.git] / init.c
... / ...
CommitLineData
1/*
2 * This file contains job initialization and setup functions.
3 */
4#include <stdio.h>
5#include <stdlib.h>
6#include <unistd.h>
7#include <fcntl.h>
8#include <ctype.h>
9#include <string.h>
10#include <errno.h>
11#include <getopt.h>
12#include <sys/ipc.h>
13#include <sys/shm.h>
14#include <sys/types.h>
15#include <sys/stat.h>
16
17#include "fio.h"
18#include "parse.h"
19
20static char fio_version_string[] = "fio 1.16.3";
21
22#define FIO_RANDSEED (0xb1899bedUL)
23
24static char **ini_file;
25static int max_jobs = MAX_JOBS;
26static int dump_cmdline;
27
28struct thread_data def_thread;
29struct thread_data *threads = NULL;
30
31int exitall_on_terminate = 0;
32int terse_output = 0;
33unsigned long long mlock_size = 0;
34FILE *f_out = NULL;
35FILE *f_err = NULL;
36
37int write_bw_log = 0;
38
39static int def_timeout = 0;
40static int write_lat_log = 0;
41
42static int prev_group_jobs;
43
44/*
45 * Command line options. These will contain the above, plus a few
46 * extra that only pertain to fio itself and not jobs.
47 */
48static struct option long_options[FIO_NR_OPTIONS] = {
49 {
50 .name = "output",
51 .has_arg = required_argument,
52 .val = 'o',
53 },
54 {
55 .name = "timeout",
56 .has_arg = required_argument,
57 .val = 't',
58 },
59 {
60 .name = "latency-log",
61 .has_arg = required_argument,
62 .val = 'l',
63 },
64 {
65 .name = "bandwidth-log",
66 .has_arg = required_argument,
67 .val = 'b',
68 },
69 {
70 .name = "minimal",
71 .has_arg = optional_argument,
72 .val = 'm',
73 },
74 {
75 .name = "version",
76 .has_arg = no_argument,
77 .val = 'v',
78 },
79 {
80 .name = "help",
81 .has_arg = no_argument,
82 .val = 'h',
83 },
84 {
85 .name = "cmdhelp",
86 .has_arg = optional_argument,
87 .val = 'c',
88 },
89 {
90 .name = "showcmd",
91 .has_arg = no_argument,
92 .val = 's'
93 },
94 {
95 .name = NULL,
96 },
97};
98
99FILE *get_f_out()
100{
101 return f_out;
102}
103
104FILE *get_f_err()
105{
106 return f_err;
107}
108
109/*
110 * Return a free job structure.
111 */
112static struct thread_data *get_new_job(int global, struct thread_data *parent)
113{
114 struct thread_data *td;
115
116 if (global)
117 return &def_thread;
118 if (thread_number >= max_jobs)
119 return NULL;
120
121 td = &threads[thread_number++];
122 *td = *parent;
123
124 dup_files(td, parent);
125 options_mem_dupe(td);
126
127 td->thread_number = thread_number;
128 return td;
129}
130
131static void put_job(struct thread_data *td)
132{
133 if (td == &def_thread)
134 return;
135
136 if (td->error)
137 log_info("fio: %s\n", td->verror);
138
139 memset(&threads[td->thread_number - 1], 0, sizeof(*td));
140 thread_number--;
141}
142
143static int setup_rate(struct thread_data *td)
144{
145 unsigned long nr_reads_per_msec;
146 unsigned long long rate;
147 unsigned int bs;
148
149 if (!td->o.rate && !td->o.rate_iops)
150 return 0;
151
152 if (td_rw(td))
153 bs = td->o.rw_min_bs;
154 else if (td_read(td))
155 bs = td->o.min_bs[DDIR_READ];
156 else
157 bs = td->o.min_bs[DDIR_WRITE];
158
159 if (td->o.rate) {
160 rate = td->o.rate;
161 nr_reads_per_msec = (rate * 1024 * 1000LL) / bs;
162 } else
163 nr_reads_per_msec = td->o.rate_iops * 1000UL;
164
165 if (!nr_reads_per_msec) {
166 log_err("rate lower than supported\n");
167 return -1;
168 }
169
170 td->rate_usec_cycle = 1000000000ULL / nr_reads_per_msec;
171 td->rate_pending_usleep = 0;
172 return 0;
173}
174
175/*
176 * Lazy way of fixing up options that depend on each other. We could also
177 * define option callback handlers, but this is easier.
178 */
179static int fixup_options(struct thread_data *td)
180{
181 struct thread_options *o = &td->o;
182
183 if (o->rwmix[DDIR_READ] + o->rwmix[DDIR_WRITE] > 100)
184 o->rwmix[DDIR_WRITE] = 100 - o->rwmix[DDIR_READ];
185
186 if (o->write_iolog_file && o->read_iolog_file) {
187 log_err("fio: read iolog overrides write_iolog\n");
188 free(o->write_iolog_file);
189 o->write_iolog_file = NULL;
190 }
191
192 if (td->io_ops->flags & FIO_SYNCIO)
193 o->iodepth = 1;
194 else {
195 if (!o->iodepth)
196 o->iodepth = o->open_files;
197 }
198
199 /*
200 * only really works for sequential io for now, and with 1 file
201 */
202 if (o->zone_size && td_random(td) && o->open_files == 1)
203 o->zone_size = 0;
204
205 /*
206 * Reads can do overwrites, we always need to pre-create the file
207 */
208 if (td_read(td) || td_rw(td))
209 o->overwrite = 1;
210
211 if (!o->min_bs[DDIR_READ])
212 o->min_bs[DDIR_READ]= o->bs[DDIR_READ];
213 if (!o->max_bs[DDIR_READ])
214 o->max_bs[DDIR_READ] = o->bs[DDIR_READ];
215 if (!o->min_bs[DDIR_WRITE])
216 o->min_bs[DDIR_WRITE]= o->bs[DDIR_WRITE];
217 if (!o->max_bs[DDIR_WRITE])
218 o->max_bs[DDIR_WRITE] = o->bs[DDIR_WRITE];
219
220 o->rw_min_bs = min(o->min_bs[DDIR_READ], o->min_bs[DDIR_WRITE]);
221
222 if (!o->file_size_high)
223 o->file_size_high = o->file_size_low;
224
225 if (td_read(td) && !td_rw(td))
226 o->verify = 0;
227
228 if (o->norandommap && o->verify != VERIFY_NONE) {
229 log_err("fio: norandommap given, verify disabled\n");
230 o->verify = VERIFY_NONE;
231 }
232 if (o->bs_unaligned && (o->odirect || td->io_ops->flags & FIO_RAWIO))
233 log_err("fio: bs_unaligned may not work with raw io\n");
234
235 /*
236 * thinktime_spin must be less than thinktime
237 */
238 if (o->thinktime_spin > o->thinktime)
239 o->thinktime_spin = o->thinktime;
240
241 /*
242 * The low water mark cannot be bigger than the iodepth
243 */
244 if (o->iodepth_low > o->iodepth || !o->iodepth_low) {
245 /*
246 * syslet work around - if the workload is sequential,
247 * we want to let the queue drain all the way down to
248 * avoid seeking between async threads
249 */
250 if (!strcmp(td->io_ops->name, "syslet-rw") && !td_random(td))
251 o->iodepth_low = 1;
252 else
253 o->iodepth_low = o->iodepth;
254 }
255
256 /*
257 * If batch number isn't set, default to the same as iodepth
258 */
259 if (o->iodepth_batch > o->iodepth || !o->iodepth_batch)
260 o->iodepth_batch = o->iodepth;
261
262 if (o->nr_files > td->files_index)
263 o->nr_files = td->files_index;
264
265 if (o->open_files > o->nr_files || !o->open_files)
266 o->open_files = o->nr_files;
267
268 if ((o->rate && o->rate_iops) || (o->ratemin && o->rate_iops_min)) {
269 log_err("fio: rate and rate_iops are mutually exclusive\n");
270 return 1;
271 }
272 if ((o->rate < o->ratemin) || (o->rate_iops < o->rate_iops_min)) {
273 log_err("fio: minimum rate exceeds rate\n");
274 return 1;
275 }
276
277 if (!o->timeout && o->time_based) {
278 log_err("fio: time_based requires a runtime/timeout setting\n");
279 o->time_based = 0;
280 }
281
282 return 0;
283}
284
/*
 * Format 'val' with the largest power-of-1024 suffix that divides it
 * evenly, e.g. 4096 -> "4K", 1048576 -> "1M", 1000 -> "1000".
 *
 * The result is a freshly malloc()ed string that the caller must free().
 * Returns NULL if the allocation fails.
 */
static char *to_kmg(unsigned int val)
{
	static const char suffix[] = { 'K', 'M', 'G', 'T', 'P', 'E' };
	const size_t buf_len = 32;
	size_t shifts = 0;
	char *buf;

	buf = malloc(buf_len);
	if (!buf)
		return NULL;

	/* zero divides by anything; stop right away so it prints as "0" */
	while (val && !(val & 1023) && shifts < sizeof(suffix)) {
		val >>= 10;
		shifts++;
	}

	/* only emit a suffix character when there is one */
	if (shifts)
		snprintf(buf, buf_len, "%u%c", val, suffix[shifts - 1]);
	else
		snprintf(buf, buf_len, "%u", val);

	return buf;
}
305
/*
 * External engines are specified as "external:name.o". Return the part
 * after the first ':' with surrounding blanks stripped, or the string
 * itself when it contains no ':'. The stripping is done in place.
 */
static const char *get_engine_name(const char *str)
{
	char *name = strchr(str, ':');

	if (name) {
		name++;
		strip_blank_front(&name);
		strip_blank_end(name);
		return name;
	}

	return str;
}
319
/*
 * Return 1 if 'filename' exists and is something other than a regular
 * file, 0 if it is a regular file or lstat() fails on it.
 */
static int exists_and_not_file(const char *filename)
{
	struct stat st;
	int found;

	found = lstat(filename, &st) != -1;

	return found && !S_ISREG(st.st_mode);
}
332
333/*
334 * Initialize the various random states we need (random io, block size ranges,
335 * read/write mix, etc).
336 */
337static int init_random_state(struct thread_data *td)
338{
339 unsigned long seeds[6];
340 int fd;
341
342 fd = open("/dev/urandom", O_RDONLY);
343 if (fd == -1) {
344 td_verror(td, errno, "open");
345 return 1;
346 }
347
348 if (read(fd, seeds, sizeof(seeds)) < (int) sizeof(seeds)) {
349 td_verror(td, EIO, "read");
350 close(fd);
351 return 1;
352 }
353
354 close(fd);
355
356 os_random_seed(seeds[0], &td->bsrange_state);
357 os_random_seed(seeds[1], &td->verify_state);
358 os_random_seed(seeds[2], &td->rwmix_state);
359
360 if (td->o.file_service_type == FIO_FSERVICE_RANDOM)
361 os_random_seed(seeds[3], &td->next_file_state);
362
363 os_random_seed(seeds[5], &td->file_size_state);
364
365 if (!td_random(td))
366 return 0;
367
368 if (td->o.rand_repeatable)
369 seeds[4] = FIO_RANDSEED * td->thread_number;
370
371 os_random_seed(seeds[4], &td->random_state);
372 return 0;
373}
374
375/*
376 * Adds a job to the list of things todo. Sanitizes the various options
377 * to make sure we don't have conflicts, and initializes various
378 * members of td.
379 */
380static int add_job(struct thread_data *td, const char *jobname, int job_add_num)
381{
382 const char *ddir_str[] = { NULL, "read", "write", "rw", NULL,
383 "randread", "randwrite", "randrw" };
384 unsigned int i;
385 const char *engine;
386 char fname[PATH_MAX];
387 int numjobs, file_alloced;
388
389 /*
390 * the def_thread is just for options, it's not a real job
391 */
392 if (td == &def_thread)
393 return 0;
394
395 /*
396 * if we are just dumping the output command line, don't add the job
397 */
398 if (dump_cmdline) {
399 put_job(td);
400 return 0;
401 }
402
403 engine = get_engine_name(td->o.ioengine);
404 td->io_ops = load_ioengine(td, engine);
405 if (!td->io_ops) {
406 log_err("fio: failed to load engine %s\n", engine);
407 goto err;
408 }
409
410 if (td->o.use_thread)
411 nr_thread++;
412 else
413 nr_process++;
414
415 if (td->o.odirect)
416 td->io_ops->flags |= FIO_RAWIO;
417
418 file_alloced = 0;
419 if (!td->o.filename && !td->files_index) {
420 file_alloced = 1;
421
422 if (td->o.nr_files == 1 && exists_and_not_file(jobname))
423 add_file(td, jobname);
424 else {
425 for (i = 0; i < td->o.nr_files; i++) {
426 sprintf(fname, "%s.%d.%d", jobname, td->thread_number, i);
427 add_file(td, fname);
428 }
429 }
430 }
431
432 if (fixup_options(td))
433 goto err;
434
435 if (td->io_ops->flags & FIO_DISKLESSIO) {
436 struct fio_file *f;
437
438 for_each_file(td, f, i)
439 f->real_file_size = -1ULL;
440 }
441
442 td->mutex = fio_sem_init(0);
443
444 td->ts.clat_stat[0].min_val = td->ts.clat_stat[1].min_val = ULONG_MAX;
445 td->ts.slat_stat[0].min_val = td->ts.slat_stat[1].min_val = ULONG_MAX;
446 td->ts.bw_stat[0].min_val = td->ts.bw_stat[1].min_val = ULONG_MAX;
447 td->ddir_nr = td->o.ddir_nr;
448
449 if ((td->o.stonewall || td->o.numjobs > 1 || td->o.new_group)
450 && prev_group_jobs) {
451 prev_group_jobs = 0;
452 groupid++;
453 }
454
455 td->groupid = groupid;
456 prev_group_jobs++;
457
458 if (init_random_state(td))
459 goto err;
460
461 if (setup_rate(td))
462 goto err;
463
464 if (td->o.write_lat_log) {
465 setup_log(&td->ts.slat_log);
466 setup_log(&td->ts.clat_log);
467 }
468 if (td->o.write_bw_log)
469 setup_log(&td->ts.bw_log);
470
471 if (!td->o.name)
472 td->o.name = strdup(jobname);
473
474 if (!terse_output) {
475 if (!job_add_num) {
476 if (!strcmp(td->io_ops->name, "cpuio"))
477 log_info("%s: ioengine=cpu, cpuload=%u, cpucycle=%u\n", td->o.name, td->o.cpuload, td->o.cpucycle);
478 else {
479 char *c1, *c2, *c3, *c4;
480
481 c1 = to_kmg(td->o.min_bs[DDIR_READ]);
482 c2 = to_kmg(td->o.max_bs[DDIR_READ]);
483 c3 = to_kmg(td->o.min_bs[DDIR_WRITE]);
484 c4 = to_kmg(td->o.max_bs[DDIR_WRITE]);
485
486 log_info("%s: (g=%d): rw=%s, bs=%s-%s/%s-%s, ioengine=%s, iodepth=%u\n", td->o.name, td->groupid, ddir_str[td->o.td_ddir], c1, c2, c3, c4, td->io_ops->name, td->o.iodepth);
487
488 free(c1);
489 free(c2);
490 free(c3);
491 free(c4);
492 }
493 } else if (job_add_num == 1)
494 log_info("...\n");
495 }
496
497 /*
498 * recurse add identical jobs, clear numjobs and stonewall options
499 * as they don't apply to sub-jobs
500 */
501 numjobs = td->o.numjobs;
502 while (--numjobs) {
503 struct thread_data *td_new = get_new_job(0, td);
504
505 if (!td_new)
506 goto err;
507
508 td_new->o.numjobs = 1;
509 td_new->o.stonewall = 0;
510 td_new->o.new_group = 0;
511
512 if (file_alloced) {
513 td_new->o.filename = NULL;
514 td_new->files_index = 0;
515 td_new->files = NULL;
516 }
517
518 job_add_num = numjobs - 1;
519
520 if (add_job(td_new, jobname, job_add_num))
521 goto err;
522 }
523
524 return 0;
525err:
526 put_job(td);
527 return -1;
528}
529
/*
 * Return 1 if 'line' holds nothing but blanks/control characters, or if
 * the first other character is a comment marker (';' or '#'). Return 0 as
 * soon as any other character is found.
 */
static int is_empty_or_comment(char *line)
{
	const unsigned char *c;

	/*
	 * Walk the bytes as unsigned char: the <ctype.h> classifiers are
	 * undefined for negative values, which plain char can produce for
	 * bytes >= 0x80.
	 */
	for (c = (const unsigned char *) line; *c; c++) {
		if (*c == ';' || *c == '#')
			return 1;
		if (!isspace(*c) && !iscntrl(*c))
			return 0;
	}

	return 1;
}
545
546/*
547 * This is our [ini] type file parser.
548 */
549static int parse_jobs_ini(char *file, int stonewall_flag)
550{
551 unsigned int global;
552 struct thread_data *td;
553 char *string, *name;
554 fpos_t off;
555 FILE *f;
556 char *p;
557 int ret = 0, stonewall;
558 int first_sect = 1;
559
560 f = fopen(file, "r");
561 if (!f) {
562 perror("fopen job file");
563 return 1;
564 }
565
566 string = malloc(4096);
567 name = malloc(256);
568 memset(name, 0, 256);
569
570 stonewall = stonewall_flag;
571 do {
572 p = fgets(string, 4095, f);
573 if (!p)
574 break;
575
576 strip_blank_front(&p);
577 strip_blank_end(p);
578
579 if (is_empty_or_comment(p))
580 continue;
581 if (sscanf(p, "[%255s]", name) != 1) {
582 log_err("fio: option <%s> outside of job section\n", p);
583 continue;
584 }
585
586 global = !strncmp(name, "global", 6);
587
588 name[strlen(name) - 1] = '\0';
589
590 if (dump_cmdline) {
591 if (first_sect)
592 log_info("fio ");
593 if (!global)
594 log_info("--name=%s ", name);
595 first_sect = 0;
596 }
597
598 td = get_new_job(global, &def_thread);
599 if (!td) {
600 ret = 1;
601 break;
602 }
603
604 /*
605 * Seperate multiple job files by a stonewall
606 */
607 if (!global && stonewall) {
608 td->o.stonewall = stonewall;
609 stonewall = 0;
610 }
611
612 fgetpos(f, &off);
613 while ((p = fgets(string, 4096, f)) != NULL) {
614 if (is_empty_or_comment(p))
615 continue;
616
617 strip_blank_front(&p);
618
619 if (p[0] == '[')
620 break;
621
622 strip_blank_end(p);
623
624 fgetpos(f, &off);
625
626 /*
627 * Don't break here, continue parsing options so we
628 * dump all the bad ones. Makes trial/error fixups
629 * easier on the user.
630 */
631 ret |= fio_option_parse(td, p);
632 if (!ret && dump_cmdline)
633 log_info("--%s ", p);
634 }
635
636 if (!ret) {
637 fsetpos(f, &off);
638 ret = add_job(td, name, 0);
639 } else {
640 log_err("fio: job %s dropped\n", name);
641 put_job(td);
642 }
643 } while (!ret);
644
645 if (dump_cmdline)
646 log_info("\n");
647
648 free(string);
649 free(name);
650 fclose(f);
651 return ret;
652}
653
654static int fill_def_thread(void)
655{
656 memset(&def_thread, 0, sizeof(def_thread));
657
658 fio_getaffinity(getpid(), &def_thread.o.cpumask);
659
660 /*
661 * fill default options
662 */
663 fio_fill_default_options(&def_thread);
664
665 def_thread.o.timeout = def_timeout;
666 def_thread.o.write_bw_log = write_bw_log;
667 def_thread.o.write_lat_log = write_lat_log;
668
669 return 0;
670}
671
672static void free_shm(void)
673{
674 struct shmid_ds sbuf;
675
676 if (threads) {
677 shmdt((void *) threads);
678 threads = NULL;
679 shmctl(shm_id, IPC_RMID, &sbuf);
680 }
681}
682
683/*
684 * The thread area is shared between the main process and the job
685 * threads/processes. So setup a shared memory segment that will hold
686 * all the job info.
687 */
688static int setup_thread_area(void)
689{
690 /*
691 * 1024 is too much on some machines, scale max_jobs if
692 * we get a failure that looks like too large a shm segment
693 */
694 do {
695 size_t size = max_jobs * sizeof(struct thread_data);
696
697 shm_id = shmget(0, size, IPC_CREAT | 0600);
698 if (shm_id != -1)
699 break;
700 if (errno != EINVAL) {
701 perror("shmget");
702 break;
703 }
704
705 max_jobs >>= 1;
706 } while (max_jobs);
707
708 if (shm_id == -1)
709 return 1;
710
711 threads = shmat(shm_id, NULL, 0);
712 if (threads == (void *) -1) {
713 perror("shmat");
714 return 1;
715 }
716
717 atexit(free_shm);
718 return 0;
719}
720
721static void usage(void)
722{
723 printf("%s\n", fio_version_string);
724 printf("\t--output\tWrite output to file\n");
725 printf("\t--timeout\tRuntime in seconds\n");
726 printf("\t--latency-log\tGenerate per-job latency logs\n");
727 printf("\t--bandwidth-log\tGenerate per-job bandwidth logs\n");
728 printf("\t--minimal\tMinimal (terse) output\n");
729 printf("\t--version\tPrint version info and exit\n");
730 printf("\t--help\t\tPrint this page\n");
731 printf("\t--cmdhelp=cmd\tPrint command help, \"all\" for all of them\n");
732 printf("\t--showcmd\tTurn a job file into command line options\n");
733}
734
735static int parse_cmd_line(int argc, char *argv[])
736{
737 struct thread_data *td = NULL;
738 int c, ini_idx = 0, lidx, ret, dont_add_job = 0;
739
740 while ((c = getopt_long_only(argc, argv, "", long_options, &lidx)) != -1) {
741 switch (c) {
742 case 't':
743 def_timeout = atoi(optarg);
744 break;
745 case 'l':
746 write_lat_log = 1;
747 break;
748 case 'w':
749 write_bw_log = 1;
750 break;
751 case 'o':
752 f_out = fopen(optarg, "w+");
753 if (!f_out) {
754 perror("fopen output");
755 exit(1);
756 }
757 f_err = f_out;
758 break;
759 case 'm':
760 terse_output = 1;
761 break;
762 case 'h':
763 usage();
764 exit(0);
765 case 'c':
766 exit(fio_show_option_help(optarg));
767 case 's':
768 dump_cmdline = 1;
769 break;
770 case 'v':
771 printf("%s\n", fio_version_string);
772 exit(0);
773 case FIO_GETOPT_JOB: {
774 const char *opt = long_options[lidx].name;
775 char *val = optarg;
776
777 if (!strncmp(opt, "name", 4) && td) {
778 ret = add_job(td, td->o.name ?: "fio", 0);
779 if (ret) {
780 put_job(td);
781 return 0;
782 }
783 td = NULL;
784 }
785 if (!td) {
786 int global = 0;
787
788 if (strncmp(opt, "name", 4) ||
789 !strncmp(val, "global", 6))
790 global = 1;
791
792 td = get_new_job(global, &def_thread);
793 if (!td)
794 return 0;
795 }
796
797 ret = fio_cmd_option_parse(td, opt, val);
798 if (ret)
799 dont_add_job = 1;
800 break;
801 }
802 default:
803 break;
804 }
805 }
806
807 if (td) {
808 if (dont_add_job)
809 put_job(td);
810 else {
811 ret = add_job(td, td->o.name ?: "fio", 0);
812 if (ret)
813 put_job(td);
814 }
815 }
816
817 while (optind < argc) {
818 ini_idx++;
819 ini_file = realloc(ini_file, ini_idx * sizeof(char *));
820 ini_file[ini_idx - 1] = strdup(argv[optind]);
821 optind++;
822 }
823
824 return ini_idx;
825}
826
827
828int parse_options(int argc, char *argv[])
829{
830 int job_files, i;
831
832 f_out = stdout;
833 f_err = stderr;
834
835 fio_options_dup_and_init(long_options);
836
837 if (setup_thread_area())
838 return 1;
839 if (fill_def_thread())
840 return 1;
841
842 job_files = parse_cmd_line(argc, argv);
843
844 for (i = 0; i < job_files; i++) {
845 if (fill_def_thread())
846 return 1;
847 if (parse_jobs_ini(ini_file[i], i))
848 return 1;
849 free(ini_file[i]);
850 }
851
852 free(ini_file);
853 options_mem_free(&def_thread);
854
855 if (!thread_number) {
856 if (dump_cmdline)
857 return 0;
858
859 log_err("No jobs defined(s)\n");
860 return 1;
861 }
862
863 return 0;
864}