Fix man page documentation for verify_pattern
[fio.git] / filesetup.c
1 #include <unistd.h>
2 #include <fcntl.h>
3 #include <string.h>
4 #include <assert.h>
5 #include <dirent.h>
6 #include <libgen.h>
7 #include <sys/stat.h>
8 #include <sys/mman.h>
9 #include <sys/types.h>
10
11 #include "fio.h"
12 #include "smalloc.h"
13 #include "filehash.h"
14
15 static int root_warn;
16
17 static inline void clear_error(struct thread_data *td)
18 {
19         td->error = 0;
20         td->verror[0] = '\0';
21 }
22
23 /*
24  * Leaves f->fd open on success, caller must close
25  */
26 static int extend_file(struct thread_data *td, struct fio_file *f)
27 {
28         int r, new_layout = 0, unlink_file = 0, flags;
29         unsigned long long left;
30         unsigned int bs;
31         char *b;
32
33         if (read_only) {
34                 log_err("fio: refusing extend of file due to read-only\n");
35                 return 0;
36         }
37
38         /*
39          * check if we need to lay the file out complete again. fio
40          * does that for operations involving reads, or for writes
41          * where overwrite is set
42          */
43         if (td_read(td) || (td_write(td) && td->o.overwrite) ||
44             (td_write(td) && td->io_ops->flags & FIO_NOEXTEND))
45                 new_layout = 1;
46         if (td_write(td) && !td->o.overwrite)
47                 unlink_file = 1;
48
49         if (unlink_file || new_layout) {
50                 dprint(FD_FILE, "layout unlink %s\n", f->file_name);
51                 if ((unlink(f->file_name) < 0) && (errno != ENOENT)) {
52                         td_verror(td, errno, "unlink");
53                         return 1;
54                 }
55         }
56
57         flags = O_WRONLY | O_CREAT;
58         if (new_layout)
59                 flags |= O_TRUNC;
60
61         dprint(FD_FILE, "open file %s, flags %x\n", f->file_name, flags);
62         f->fd = open(f->file_name, flags, 0644);
63         if (f->fd < 0) {
64                 td_verror(td, errno, "open");
65                 return 1;
66         }
67
68 #ifdef FIO_HAVE_FALLOCATE
69         if (td->o.fallocate && !td->o.fill_device) {
70                 dprint(FD_FILE, "fallocate file %s size %llu\n", f->file_name,
71                                                         f->real_file_size);
72
73                 r = posix_fallocate(f->fd, 0, f->real_file_size);
74                 if (r < 0) {
75                         log_err("fio: posix_fallocate fails: %s\n",
76                                         strerror(-r));
77                 }
78         }
79 #endif
80         
81         if (!new_layout)
82                 goto done;
83
84         /*
85          * The size will be -1ULL when fill_device is used, so don't truncate
86          * or fallocate this file, just write it
87          */
88         if (!td->o.fill_device) {
89                 dprint(FD_FILE, "truncate file %s, size %llu\n", f->file_name,
90                                                         f->real_file_size);
91                 if (ftruncate(f->fd, f->real_file_size) == -1) {
92                         td_verror(td, errno, "ftruncate");
93                         goto err;
94                 }
95         }
96
97         b = malloc(td->o.max_bs[DDIR_WRITE]);
98         memset(b, 0, td->o.max_bs[DDIR_WRITE]);
99
100         left = f->real_file_size;
101         while (left && !td->terminate) {
102                 bs = td->o.max_bs[DDIR_WRITE];
103                 if (bs > left)
104                         bs = left;
105
106                 r = write(f->fd, b, bs);
107
108                 if (r > 0) {
109                         left -= r;
110                         continue;
111                 } else {
112                         if (r < 0) {
113                                 int __e = errno;
114
115                                 if (__e == ENOSPC) {
116                                         if (td->o.fill_device)
117                                                 break;
118                                         log_info("fio: ENOSPC on laying out "
119                                                  "file, stopping\n");
120                                         break;
121                                 }
122                                 td_verror(td, errno, "write");
123                         } else
124                                 td_verror(td, EIO, "write");
125
126                         break;
127                 }
128         }
129
130         if (td->terminate) {
131                 dprint(FD_FILE, "terminate unlink %s\n", f->file_name);
132                 unlink(f->file_name);
133         } else if (td->o.create_fsync) {
134                 if (fsync(f->fd) < 0) {
135                         td_verror(td, errno, "fsync");
136                         goto err;
137                 }
138         }
139         if (td->o.fill_device && !td_write(td)) {
140                 fio_file_clear_size_known(f);
141                 if (td_io_get_file_size(td, f))
142                         goto err;
143                 if (f->io_size > f->real_file_size)
144                         f->io_size = f->real_file_size;
145         }
146
147         free(b);
148 done:
149         return 0;
150 err:
151         close(f->fd);
152         f->fd = -1;
153         return 1;
154 }
155
156 static int pre_read_file(struct thread_data *td, struct fio_file *f)
157 {
158         int r, did_open = 0, old_runstate;
159         unsigned long long left;
160         unsigned int bs;
161         char *b;
162
163         if (td->io_ops->flags & FIO_PIPEIO)
164                 return 0;
165
166         if (!fio_file_open(f)) {
167                 if (td->io_ops->open_file(td, f)) {
168                         log_err("fio: cannot pre-read, failed to open file\n");
169                         return 1;
170                 }
171                 did_open = 1;
172         }
173
174         old_runstate = td->runstate;
175         td_set_runstate(td, TD_PRE_READING);
176
177         bs = td->o.max_bs[DDIR_READ];
178         b = malloc(bs);
179         memset(b, 0, bs);
180
181         lseek(f->fd, f->file_offset, SEEK_SET);
182         left = f->io_size;
183
184         while (left && !td->terminate) {
185                 if (bs > left)
186                         bs = left;
187
188                 r = read(f->fd, b, bs);
189
190                 if (r == (int) bs) {
191                         left -= bs;
192                         continue;
193                 } else {
194                         td_verror(td, EIO, "pre_read");
195                         break;
196                 }
197         }
198
199         td_set_runstate(td, old_runstate);
200
201         if (did_open)
202                 td->io_ops->close_file(td, f);
203         free(b);
204         return 0;
205 }
206
207 static unsigned long long get_rand_file_size(struct thread_data *td)
208 {
209         unsigned long long ret, sized;
210         long r;
211
212         r = os_random_long(&td->file_size_state);
213         sized = td->o.file_size_high - td->o.file_size_low;
214         ret = (unsigned long long) ((double) sized * (r / (OS_RAND_MAX + 1.0)));
215         ret += td->o.file_size_low;
216         ret -= (ret % td->o.rw_min_bs);
217         return ret;
218 }
219
220 static int file_size(struct thread_data *td, struct fio_file *f)
221 {
222         struct stat st;
223
224         if (stat(f->file_name, &st) == -1) {
225                 td_verror(td, errno, "fstat");
226                 return 1;
227         }
228
229         f->real_file_size = st.st_size;
230         return 0;
231 }
232
233 static int bdev_size(struct thread_data *td, struct fio_file *f)
234 {
235         unsigned long long bytes;
236         int r;
237
238         if (td->io_ops->open_file(td, f)) {
239                 log_err("fio: failed opening blockdev %s for size check\n",
240                         f->file_name);
241                 return 1;
242         }
243
244         r = blockdev_size(f->fd, &bytes);
245         if (r) {
246                 td_verror(td, r, "blockdev_size");
247                 goto err;
248         }
249
250         if (!bytes) {
251                 log_err("%s: zero sized block device?\n", f->file_name);
252                 goto err;
253         }
254
255         f->real_file_size = bytes;
256         td->io_ops->close_file(td, f);
257         return 0;
258 err:
259         td->io_ops->close_file(td, f);
260         return 1;
261 }
262
263 static int get_file_size(struct thread_data *td, struct fio_file *f)
264 {
265         int ret = 0;
266
267         if (fio_file_size_known(f))
268                 return 0;
269
270         if (f->filetype == FIO_TYPE_FILE)
271                 ret = file_size(td, f);
272         else if (f->filetype == FIO_TYPE_BD)
273                 ret = bdev_size(td, f);
274         else
275                 f->real_file_size = -1;
276
277         if (ret)
278                 return ret;
279
280         if (f->file_offset > f->real_file_size) {
281                 log_err("%s: offset extends end (%Lu > %Lu)\n", td->o.name,
282                                         f->file_offset, f->real_file_size);
283                 return 1;
284         }
285
286         fio_file_set_size_known(f);
287         return 0;
288 }
289
290 static int __file_invalidate_cache(struct thread_data *td, struct fio_file *f,
291                                    unsigned long long off,
292                                    unsigned long long len)
293 {
294         int ret = 0;
295
296         if (len == -1ULL)
297                 len = f->io_size;
298         if (off == -1ULL)
299                 off = f->file_offset;
300
301         if (len == -1ULL || off == -1ULL)
302                 return 0;
303
304         dprint(FD_IO, "invalidate cache %s: %llu/%llu\n", f->file_name, off,
305                                                                 len);
306
307         /*
308          * FIXME: add blockdev flushing too
309          */
310         if (f->mmap_ptr) {
311                 ret = madvise(f->mmap_ptr, f->mmap_sz, MADV_DONTNEED);
312 #ifdef FIO_MADV_FREE
313                 (void) madvise(f->mmap_ptr, f->mmap_sz, FIO_MADV_FREE);
314 #endif
315         } else if (f->filetype == FIO_TYPE_FILE) {
316                 ret = fadvise(f->fd, off, len, POSIX_FADV_DONTNEED);
317         } else if (f->filetype == FIO_TYPE_BD) {
318                 ret = blockdev_invalidate_cache(f->fd);
319                 if (ret < 0 && errno == EACCES && geteuid()) {
320                         if (!root_warn) {
321                                 log_err("fio: only root may flush block "
322                                         "devices. Cache flush bypassed!\n");
323                                 root_warn = 1;
324                         }
325                         ret = 0;
326                 }
327         } else if (f->filetype == FIO_TYPE_CHAR || f->filetype == FIO_TYPE_PIPE)
328                 ret = 0;
329
330         if (ret < 0) {
331                 td_verror(td, errno, "invalidate_cache");
332                 return 1;
333         } else if (ret > 0) {
334                 td_verror(td, ret, "invalidate_cache");
335                 return 1;
336         }
337
338         return ret;
339
340 }
341
/*
 * Invalidate the cache for the file's default offset and io size.
 * A file that is not open is left alone and 0 is returned.
 */
int file_invalidate_cache(struct thread_data *td, struct fio_file *f)
{
	if (fio_file_open(f))
		return __file_invalidate_cache(td, f, -1ULL, -1ULL);

	return 0;
}
349
350 int generic_close_file(struct thread_data fio_unused *td, struct fio_file *f)
351 {
352         int ret = 0;
353
354         dprint(FD_FILE, "fd close %s\n", f->file_name);
355
356         remove_file_hash(f);
357
358         if (close(f->fd) < 0)
359                 ret = errno;
360
361         f->fd = -1;
362         return ret;
363 }
364
365 static int file_lookup_open(struct fio_file *f, int flags)
366 {
367         struct fio_file *__f;
368         int from_hash;
369
370         __f = lookup_file_hash(f->file_name);
371         if (__f) {
372                 dprint(FD_FILE, "found file in hash %s\n", f->file_name);
373                 /*
374                  * racy, need the __f->lock locked
375                  */
376                 f->lock = __f->lock;
377                 f->lock_owner = __f->lock_owner;
378                 f->lock_batch = __f->lock_batch;
379                 f->lock_ddir = __f->lock_ddir;
380                 from_hash = 1;
381         } else {
382                 dprint(FD_FILE, "file not found in hash %s\n", f->file_name);
383                 from_hash = 0;
384         }
385
386         f->fd = open(f->file_name, flags, 0600);
387         return from_hash;
388 }
389
390 int generic_open_file(struct thread_data *td, struct fio_file *f)
391 {
392         int is_std = 0;
393         int flags = 0;
394         int from_hash = 0;
395
396         dprint(FD_FILE, "fd open %s\n", f->file_name);
397
398         if (!strcmp(f->file_name, "-")) {
399                 if (td_rw(td)) {
400                         log_err("fio: can't read/write to stdin/out\n");
401                         return 1;
402                 }
403                 is_std = 1;
404
405                 /*
406                  * move output logging to stderr, if we are writing to stdout
407                  */
408                 if (td_write(td))
409                         f_out = stderr;
410         }
411
412         if (td->o.odirect)
413                 flags |= OS_O_DIRECT;
414         if (td->o.sync_io)
415                 flags |= O_SYNC;
416         if (f->filetype != FIO_TYPE_FILE)
417                 flags |= FIO_O_NOATIME;
418         if (td->o.create_on_open)
419                 flags |= O_CREAT;
420
421 open_again:
422         if (td_write(td)) {
423                 if (!read_only)
424                         flags |= O_RDWR;
425
426                 if (f->filetype == FIO_TYPE_FILE)
427                         flags |= O_CREAT;
428
429                 if (is_std)
430                         f->fd = dup(STDOUT_FILENO);
431                 else
432                         from_hash = file_lookup_open(f, flags);
433         } else {
434                 if (f->filetype == FIO_TYPE_CHAR && !read_only)
435                         flags |= O_RDWR;
436                 else
437                         flags |= O_RDONLY;
438
439                 if (is_std)
440                         f->fd = dup(STDIN_FILENO);
441                 else
442                         from_hash = file_lookup_open(f, flags);
443         }
444
445         if (f->fd == -1) {
446                 char buf[FIO_VERROR_SIZE];
447                 int __e = errno;
448
449                 if (__e == EPERM && (flags & FIO_O_NOATIME)) {
450                         flags &= ~FIO_O_NOATIME;
451                         goto open_again;
452                 }
453
454                 snprintf(buf, sizeof(buf) - 1, "open(%s)", f->file_name);
455
456                 td_verror(td, __e, buf);
457         }
458
459         if (!from_hash && f->fd != -1) {
460                 if (add_file_hash(f)) {
461                         int ret;
462
463                         /*
464                          * OK to ignore, we haven't done anything with it
465                          */
466                         ret = generic_close_file(td, f);
467                         goto open_again;
468                 }
469         }
470
471         return 0;
472 }
473
/*
 * Default size hook: exported entry point that forwards to
 * get_file_size() and passes its result through unchanged.
 */
int generic_get_file_size(struct thread_data *td, struct fio_file *f)
{
	const int ret = get_file_size(td, f);

	return ret;
}
478
479 /*
480  * open/close all files, so that ->real_file_size gets set
481  */
482 static int get_file_sizes(struct thread_data *td)
483 {
484         struct fio_file *f;
485         unsigned int i;
486         int err = 0;
487
488         for_each_file(td, f, i) {
489                 dprint(FD_FILE, "get file size for %p/%d/%p\n", f, i,
490                                                                 f->file_name);
491
492                 if (td_io_get_file_size(td, f)) {
493                         if (td->error != ENOENT) {
494                                 log_err("%s\n", td->verror);
495                                 err = 1;
496                         }
497                         clear_error(td);
498                 }
499
500                 if (f->real_file_size == -1ULL && td->o.size)
501                         f->real_file_size = td->o.size / td->o.nr_files;
502         }
503
504         return err;
505 }
506
507 struct fio_mount {
508         struct flist_head list;
509         const char *base;
510         char __base[256];
511         unsigned int key;
512 };
513
514 /*
515  * Get free number of bytes for each file on each unique mount.
516  */
517 static unsigned long long get_fs_free_counts(struct thread_data *td)
518 {
519         struct flist_head *n, *tmp;
520         unsigned long long ret;
521         struct fio_mount *fm;
522         FLIST_HEAD(list);
523         struct fio_file *f;
524         unsigned int i;
525
526         for_each_file(td, f, i) {
527                 struct stat sb;
528                 char buf[256];
529
530                 strcpy(buf, f->file_name);
531
532                 if (stat(buf, &sb) < 0) {
533                         if (errno != ENOENT)
534                                 break;
535                         strcpy(buf, ".");
536                         if (stat(buf, &sb) < 0)
537                                 break;
538                 }
539
540                 fm = NULL;
541                 flist_for_each(n, &list) {
542                         fm = flist_entry(n, struct fio_mount, list);
543                         if (fm->key == sb.st_dev)
544                                 break;
545
546                         fm = NULL;
547                 }
548
549                 if (fm)
550                         continue;
551
552                 fm = malloc(sizeof(*fm));
553                 strcpy(fm->__base, buf);
554                 fm->base = basename(fm->__base);
555                 fm->key = sb.st_dev;
556                 flist_add(&fm->list, &list);
557         }
558
559         ret = 0;
560         flist_for_each_safe(n, tmp, &list) {
561                 unsigned long long sz;
562
563                 fm = flist_entry(n, struct fio_mount, list);
564                 flist_del(&fm->list);
565
566                 sz = get_fs_size(fm->base);
567                 if (sz && sz != -1ULL)
568                         ret += sz;
569
570                 free(fm);
571         }
572
573         return ret;
574 }
575
576 /*
577  * Open the files and setup files sizes, creating files if necessary.
578  */
579 int setup_files(struct thread_data *td)
580 {
581         unsigned long long total_size, extend_size;
582         struct fio_file *f;
583         unsigned int i;
584         int err = 0, need_extend;
585
586         dprint(FD_FILE, "setup files\n");
587
588         if (td->o.read_iolog_file)
589                 return 0;
590
591         /*
592          * if ioengine defines a setup() method, it's responsible for
593          * opening the files and setting f->real_file_size to indicate
594          * the valid range for that file.
595          */
596         if (td->io_ops->setup)
597                 err = td->io_ops->setup(td);
598         else
599                 err = get_file_sizes(td);
600
601         if (err)
602                 return err;
603
604         /*
605          * check sizes. if the files/devices do not exist and the size
606          * isn't passed to fio, abort.
607          */
608         total_size = 0;
609         for_each_file(td, f, i) {
610                 if (f->real_file_size == -1ULL)
611                         total_size = -1ULL;
612                 else
613                         total_size += f->real_file_size;
614         }
615
616         if (td->o.fill_device)
617                 td->fill_device_size = get_fs_free_counts(td);
618
619         /*
620          * device/file sizes are zero and no size given, punt
621          */
622         if ((!total_size || total_size == -1ULL) && !td->o.size &&
623             !(td->io_ops->flags & FIO_NOIO) && !td->o.fill_device) {
624                 log_err("%s: you need to specify size=\n", td->o.name);
625                 td_verror(td, EINVAL, "total_file_size");
626                 return 1;
627         }
628
629         /*
630          * now file sizes are known, so we can set ->io_size. if size= is
631          * not given, ->io_size is just equal to ->real_file_size. if size
632          * is given, ->io_size is size / nr_files.
633          */
634         extend_size = total_size = 0;
635         need_extend = 0;
636         for_each_file(td, f, i) {
637                 f->file_offset = td->o.start_offset;
638
639                 if (!td->o.file_size_low) {
640                         /*
641                          * no file size range given, file size is equal to
642                          * total size divided by number of files. if that is
643                          * zero, set it to the real file size.
644                          */
645                         f->io_size = td->o.size / td->o.nr_files;
646                         if (!f->io_size)
647                                 f->io_size = f->real_file_size - f->file_offset;
648                 } else if (f->real_file_size < td->o.file_size_low ||
649                            f->real_file_size > td->o.file_size_high) {
650                         if (f->file_offset > td->o.file_size_low)
651                                 goto err_offset;
652                         /*
653                          * file size given. if it's fixed, use that. if it's a
654                          * range, generate a random size in-between.
655                          */
656                         if (td->o.file_size_low == td->o.file_size_high) {
657                                 f->io_size = td->o.file_size_low
658                                                 - f->file_offset;
659                         } else {
660                                 f->io_size = get_rand_file_size(td)
661                                                 - f->file_offset;
662                         }
663                 } else
664                         f->io_size = f->real_file_size - f->file_offset;
665
666                 if (f->io_size == -1ULL)
667                         total_size = -1ULL;
668                 else
669                         total_size += f->io_size;
670
671                 if (f->filetype == FIO_TYPE_FILE &&
672                     (f->io_size + f->file_offset) > f->real_file_size &&
673                     !(td->io_ops->flags & FIO_DISKLESSIO)) {
674                         if (!td->o.create_on_open) {
675                                 need_extend++;
676                                 extend_size += (f->io_size + f->file_offset);
677                         } else
678                                 f->real_file_size = f->io_size + f->file_offset;
679                         fio_file_set_extend(f);
680                 }
681         }
682
683         if (!td->o.size || td->o.size > total_size)
684                 td->o.size = total_size;
685
686         /*
687          * See if we need to extend some files
688          */
689         if (need_extend) {
690                 temp_stall_ts = 1;
691                 if (!terse_output)
692                         log_info("%s: Laying out IO file(s) (%u file(s) /"
693                                  " %LuMB)\n", td->o.name, need_extend,
694                                         extend_size >> 20);
695
696                 for_each_file(td, f, i) {
697                         unsigned long long old_len = -1ULL, extend_len = -1ULL;
698
699                         if (!fio_file_extend(f))
700                                 continue;
701
702                         assert(f->filetype == FIO_TYPE_FILE);
703                         fio_file_clear_extend(f);
704                         if (!td->o.fill_device) {
705                                 old_len = f->real_file_size;
706                                 extend_len = f->io_size + f->file_offset -
707                                                 old_len;
708                         }
709                         f->real_file_size = (f->io_size + f->file_offset);
710                         err = extend_file(td, f);
711                         if (err)
712                                 break;
713
714                         err = __file_invalidate_cache(td, f, old_len,
715                                                                 extend_len);
716                         close(f->fd);
717                         f->fd = -1;
718                         if (err)
719                                 break;
720                 }
721                 temp_stall_ts = 0;
722         }
723
724         if (err)
725                 return err;
726
727         if (!td->o.zone_size)
728                 td->o.zone_size = td->o.size;
729
730         /*
731          * iolog already set the total io size, if we read back
732          * stored entries.
733          */
734         if (!td->o.read_iolog_file)
735                 td->total_io_size = td->o.size * td->o.loops;
736         return 0;
737 err_offset:
738         log_err("%s: you need to specify valid offset=\n", td->o.name);
739         return 1;
740 }
741
742 int pre_read_files(struct thread_data *td)
743 {
744         struct fio_file *f;
745         unsigned int i;
746
747         dprint(FD_FILE, "pre_read files\n");
748
749         for_each_file(td, f, i) {
750                 pre_read_file(td, f);
751         }
752
753         return 1;
754 }
755
756 int init_random_map(struct thread_data *td)
757 {
758         unsigned long long blocks, num_maps;
759         struct fio_file *f;
760         unsigned int i;
761
762         if (td->o.norandommap || !td_random(td))
763                 return 0;
764
765         for_each_file(td, f, i) {
766                 blocks = (f->real_file_size + td->o.rw_min_bs - 1) /
767                                 (unsigned long long) td->o.rw_min_bs;
768                 num_maps = (blocks + BLOCKS_PER_MAP - 1) /
769                                 (unsigned long long) BLOCKS_PER_MAP;
770                 f->file_map = smalloc(num_maps * sizeof(int));
771                 if (f->file_map) {
772                         f->num_maps = num_maps;
773                         continue;
774                 }
775                 if (!td->o.softrandommap) {
776                         log_err("fio: failed allocating random map. If running"
777                                 " a large number of jobs, try the 'norandommap'"
778                                 " option or set 'softrandommap'. Or give"
779                                 " a larger --alloc-size to fio.\n");
780                         return 1;
781                 }
782
783                 log_info("fio: file %s failed allocating random map. Running "
784                          "job without.\n", f->file_name);
785                 f->num_maps = 0;
786         }
787
788         return 0;
789 }
790
791 void close_files(struct thread_data *td)
792 {
793         struct fio_file *f;
794         unsigned int i;
795
796         for_each_file(td, f, i) {
797                 if (fio_file_open(f))
798                         td_io_close_file(td, f);
799         }
800 }
801
802 void close_and_free_files(struct thread_data *td)
803 {
804         struct fio_file *f;
805         unsigned int i;
806
807         dprint(FD_FILE, "close files\n");
808
809         for_each_file(td, f, i) {
810                 if (td->o.unlink && f->filetype == FIO_TYPE_FILE) {
811                         dprint(FD_FILE, "free unlink %s\n", f->file_name);
812                         unlink(f->file_name);
813                 }
814
815                 if (fio_file_open(f))
816                         td_io_close_file(td, f);
817
818                 remove_file_hash(f);
819
820                 sfree(f->file_name);
821                 f->file_name = NULL;
822                 sfree(f->file_map);
823                 f->file_map = NULL;
824                 sfree(f);
825         }
826
827         td->o.filename = NULL;
828         free(td->files);
829         td->files_index = 0;
830         td->files = NULL;
831         td->o.nr_files = 0;
832 }
833
834 static void get_file_type(struct fio_file *f)
835 {
836         struct stat sb;
837
838         if (!strcmp(f->file_name, "-"))
839                 f->filetype = FIO_TYPE_PIPE;
840         else
841                 f->filetype = FIO_TYPE_FILE;
842
843         if (!stat(f->file_name, &sb)) {
844                 if (S_ISBLK(sb.st_mode))
845                         f->filetype = FIO_TYPE_BD;
846                 else if (S_ISCHR(sb.st_mode))
847                         f->filetype = FIO_TYPE_CHAR;
848                 else if (S_ISFIFO(sb.st_mode))
849                         f->filetype = FIO_TYPE_PIPE;
850         }
851 }
852
853 int add_file(struct thread_data *td, const char *fname)
854 {
855         int cur_files = td->files_index;
856         char file_name[PATH_MAX];
857         struct fio_file *f;
858         int len = 0;
859
860         dprint(FD_FILE, "add file %s\n", fname);
861
862         f = smalloc(sizeof(*f));
863         if (!f) {
864                 log_err("fio: smalloc OOM\n");
865                 assert(0);
866         }
867
868         f->fd = -1;
869
870         if (td->files_size <= td->files_index) {
871                 int new_size = td->o.nr_files + 1;
872
873                 dprint(FD_FILE, "resize file array to %d files\n", new_size);
874
875                 td->files = realloc(td->files, new_size * sizeof(f));
876                 td->files_size = new_size;
877         }
878         td->files[cur_files] = f;
879
880         /*
881          * init function, io engine may not be loaded yet
882          */
883         if (td->io_ops && (td->io_ops->flags & FIO_DISKLESSIO))
884                 f->real_file_size = -1ULL;
885
886         if (td->o.directory)
887                 len = sprintf(file_name, "%s/", td->o.directory);
888
889         sprintf(file_name + len, "%s", fname);
890         f->file_name = smalloc_strdup(file_name);
891         if (!f->file_name) {
892                 log_err("fio: smalloc OOM\n");
893                 assert(0);
894         }
895
896         get_file_type(f);
897
898         switch (td->o.file_lock_mode) {
899         case FILE_LOCK_NONE:
900                 break;
901         case FILE_LOCK_READWRITE:
902                 f->lock = fio_mutex_rw_init();
903                 break;
904         case FILE_LOCK_EXCLUSIVE:
905                 f->lock = fio_mutex_init(1);
906                 break;
907         default:
908                 log_err("fio: unknown lock mode: %d\n", td->o.file_lock_mode);
909                 assert(0);
910         }
911
912         td->files_index++;
913         if (f->filetype == FIO_TYPE_FILE)
914                 td->nr_normal_files++;
915
916         dprint(FD_FILE, "file %p \"%s\" added at %d\n", f, f->file_name,
917                                                         cur_files);
918
919         return cur_files;
920 }
921
922 void get_file(struct fio_file *f)
923 {
924         dprint(FD_FILE, "get file %s, ref=%d\n", f->file_name, f->references);
925         assert(fio_file_open(f));
926         f->references++;
927 }
928
929 int put_file(struct thread_data *td, struct fio_file *f)
930 {
931         int f_ret = 0, ret = 0;
932
933         dprint(FD_FILE, "put file %s, ref=%d\n", f->file_name, f->references);
934
935         if (!fio_file_open(f)) {
936                 assert(f->fd == -1);
937                 return 0;
938         }
939
940         assert(f->references);
941         if (--f->references)
942                 return 0;
943
944         if (should_fsync(td) && td->o.fsync_on_close)
945                 f_ret = fsync(f->fd);
946
947         if (td->io_ops->close_file)
948                 ret = td->io_ops->close_file(td, f);
949
950         if (!ret)
951                 ret = f_ret;
952
953         td->nr_open_files--;
954         fio_file_clear_open(f);
955         assert(f->fd == -1);
956         return ret;
957 }
958
959 void lock_file(struct thread_data *td, struct fio_file *f, enum fio_ddir ddir)
960 {
961         if (!f->lock || td->o.file_lock_mode == FILE_LOCK_NONE)
962                 return;
963
964         if (f->lock_owner == td && f->lock_batch--)
965                 return;
966
967         if (td->o.file_lock_mode == FILE_LOCK_READWRITE) {
968                 if (ddir == DDIR_READ)
969                         fio_mutex_down_read(f->lock);
970                 else
971                         fio_mutex_down_write(f->lock);
972         } else if (td->o.file_lock_mode == FILE_LOCK_EXCLUSIVE)
973                 fio_mutex_down(f->lock);
974
975         f->lock_owner = td;
976         f->lock_batch = td->o.lockfile_batch;
977         f->lock_ddir = ddir;
978 }
979
980 void unlock_file(struct thread_data *td, struct fio_file *f)
981 {
982         if (!f->lock || td->o.file_lock_mode == FILE_LOCK_NONE)
983                 return;
984         if (f->lock_batch)
985                 return;
986
987         if (td->o.file_lock_mode == FILE_LOCK_READWRITE) {
988                 const int is_read = f->lock_ddir == DDIR_READ;
989                 int val = fio_mutex_getval(f->lock);
990
991                 if ((is_read && val == 1) || (!is_read && val == -1))
992                         f->lock_owner = NULL;
993
994                 if (is_read)
995                         fio_mutex_up_read(f->lock);
996                 else
997                         fio_mutex_up_write(f->lock);
998         } else if (td->o.file_lock_mode == FILE_LOCK_EXCLUSIVE) {
999                 int val = fio_mutex_getval(f->lock);
1000
1001                 if (val == 0)
1002                         f->lock_owner = NULL;
1003
1004                 fio_mutex_up(f->lock);
1005         }
1006 }
1007
1008 void unlock_file_all(struct thread_data *td, struct fio_file *f)
1009 {
1010         if (f->lock_owner != td)
1011                 return;
1012
1013         f->lock_batch = 0;
1014         unlock_file(td, f);
1015 }
1016
1017 static int recurse_dir(struct thread_data *td, const char *dirname)
1018 {
1019         struct dirent *dir;
1020         int ret = 0;
1021         DIR *D;
1022
1023         D = opendir(dirname);
1024         if (!D) {
1025                 char buf[FIO_VERROR_SIZE];
1026
1027                 snprintf(buf, FIO_VERROR_SIZE - 1, "opendir(%s)", dirname);
1028                 td_verror(td, errno, buf);
1029                 return 1;
1030         }
1031
1032         while ((dir = readdir(D)) != NULL) {
1033                 char full_path[PATH_MAX];
1034                 struct stat sb;
1035
1036                 if (!strcmp(dir->d_name, ".") || !strcmp(dir->d_name, ".."))
1037                         continue;
1038
1039                 sprintf(full_path, "%s/%s", dirname, dir->d_name);
1040
1041                 if (lstat(full_path, &sb) == -1) {
1042                         if (errno != ENOENT) {
1043                                 td_verror(td, errno, "stat");
1044                                 return 1;
1045                         }
1046                 }
1047
1048                 if (S_ISREG(sb.st_mode)) {
1049                         add_file(td, full_path);
1050                         td->o.nr_files++;
1051                         continue;
1052                 }
1053                 if (!S_ISDIR(sb.st_mode))
1054                         continue;
1055
1056                 ret = recurse_dir(td, full_path);
1057                 if (ret)
1058                         break;
1059         }
1060
1061         closedir(D);
1062         return ret;
1063 }
1064
1065 int add_dir_files(struct thread_data *td, const char *path)
1066 {
1067         int ret = recurse_dir(td, path);
1068
1069         if (!ret)
1070                 log_info("fio: opendir added %d files\n", td->o.nr_files);
1071
1072         return ret;
1073 }
1074
1075 void dup_files(struct thread_data *td, struct thread_data *org)
1076 {
1077         struct fio_file *f;
1078         unsigned int i;
1079
1080         dprint(FD_FILE, "dup files: %d\n", org->files_index);
1081
1082         if (!org->files)
1083                 return;
1084
1085         td->files = malloc(org->files_index * sizeof(f));
1086
1087         for_each_file(org, f, i) {
1088                 struct fio_file *__f;
1089
1090                 __f = smalloc(sizeof(*__f));
1091                 if (!__f) {
1092                         log_err("fio: smalloc OOM\n");
1093                         assert(0);
1094                 }
1095                 __f->fd = -1;
1096
1097                 if (f->file_name) {
1098                         __f->file_name = smalloc_strdup(f->file_name);
1099                         if (!__f->file_name) {
1100                                 log_err("fio: smalloc OOM\n");
1101                                 assert(0);
1102                         }
1103
1104                         __f->filetype = f->filetype;
1105                 }
1106
1107                 td->files[i] = __f;
1108         }
1109 }
1110
1111 /*
1112  * Returns the index that matches the filename, or -1 if not there
1113  */
1114 int get_fileno(struct thread_data *td, const char *fname)
1115 {
1116         struct fio_file *f;
1117         unsigned int i;
1118
1119         for_each_file(td, f, i)
1120                 if (!strcmp(f->file_name, fname))
1121                         return i;
1122
1123         return -1;
1124 }
1125
1126 /*
1127  * For log usage, where we add/open/close files automatically
1128  */
1129 void free_release_files(struct thread_data *td)
1130 {
1131         close_files(td);
1132         td->files_index = 0;
1133         td->nr_normal_files = 0;
1134 }