X-Git-Url: https://git.kernel.dk/?p=fio.git;a=blobdiff_plain;f=io_u.c;h=6df4b5eee80190187aa0015b11aca7da73e714b4;hp=89ece538c570391b8812957f2e4a428d1ab1bb65;hb=5af1c6f3b46b40ef6b7021a34fd38889226e137f;hpb=bca4ed4de445a07af393ac8bfcb9dd6aad09e5df diff --git a/io_u.c b/io_u.c index 89ece538..6df4b5ee 100644 --- a/io_u.c +++ b/io_u.c @@ -8,6 +8,19 @@ #include "fio.h" #include "os.h" +/* + * Change this define to play with the timeout handling + */ +#undef FIO_USE_TIMEOUT + +struct io_completion_data { + int nr; /* input */ + + int error; /* output */ + unsigned long bytes_done[2]; /* output */ + struct timeval time; /* output */ +}; + /* * The ->file_map[] contains a map of blocks we have or have not done io * to yet. Used to make sure we cover the entire range in a fair fashion. @@ -24,10 +37,10 @@ static int random_map_free(struct thread_data *td, struct fio_file *f, /* * Mark a given offset as used in the map. */ -static void mark_random_map(struct thread_data *td, struct fio_file *f, - struct io_u *io_u) +static void mark_random_map(struct thread_data *td, struct io_u *io_u) { unsigned int min_bs = td->rw_min_bs; + struct fio_file *f = io_u->file; unsigned long long block; unsigned int blocks; unsigned int nr_blocks; @@ -45,7 +58,7 @@ static void mark_random_map(struct thread_data *td, struct fio_file *f, idx = RAND_MAP_IDX(td, f, block); bit = RAND_MAP_BIT(td, f, block); - assert(idx < f->num_maps); + fio_assert(td, idx < f->num_maps); f->file_map[idx] |= (1UL << bit); block++; @@ -85,14 +98,14 @@ static int get_next_free_block(struct thread_data *td, struct fio_file *f, * until we find a free one. For sequential io, just return the end of * the last io issued. */ -static int get_next_offset(struct thread_data *td, struct fio_file *f, - struct io_u *io_u) +static int get_next_offset(struct thread_data *td, struct io_u *io_u) { + struct fio_file *f = io_u->file; const int ddir = io_u->ddir; unsigned long long b, rb; long r; - if (!td->sequential) { + if (td_random(td)) { unsigned long long max_blocks = f->file_size / td->min_bs[ddir]; int loops = 5; @@ -121,9 +134,9 @@ static int get_next_offset(struct thread_data *td, struct fio_file *f, return 0; } -static unsigned int get_next_buflen(struct thread_data *td, struct fio_file *f, - struct io_u *io_u) +static unsigned int get_next_buflen(struct thread_data *td, struct io_u *io_u) { + struct fio_file *f = io_u->file; const int ddir = io_u->ddir; unsigned int buflen; long r; @@ -138,13 +151,6 @@ static unsigned int get_next_buflen(struct thread_data *td, struct fio_file *f, } while (buflen + io_u->offset > f->real_file_size) { - /* - * if using direct/raw io, we may not be able to - * shrink the size. so just fail it. - */ - if (td->io_ops->flags & FIO_RAWIO) - return 0; - if (buflen == td->min_bs[ddir]) return 0; @@ -192,14 +198,29 @@ static enum fio_ddir get_rw_ddir(struct thread_data *td) void put_io_u(struct thread_data *td, struct io_u *io_u) { + assert((io_u->flags & IO_U_F_FREE) == 0); + io_u->flags |= IO_U_F_FREE; + io_u->file = NULL; list_del(&io_u->list); list_add(&io_u->list, &td->io_u_freelist); td->cur_depth--; } -static int fill_io_u(struct thread_data *td, struct fio_file *f, - struct io_u *io_u) +void requeue_io_u(struct thread_data *td, struct io_u **io_u) +{ + struct io_u *__io_u = *io_u; + + __io_u->flags |= IO_U_F_FREE; + __io_u->flags &= ~IO_U_F_FLIGHT; + + list_del(&__io_u->list); + list_add_tail(&__io_u->list, &td->io_u_requeues); + td->cur_depth--; + *io_u = NULL; +} + +static int fill_io_u(struct thread_data *td, struct io_u *io_u) { /* * If using an iolog, grab next piece if any available. @@ -210,10 +231,9 @@ static int fill_io_u(struct thread_data *td, struct fio_file *f, /* * see if it's time to sync */ - if (td->fsync_blocks && !(td->io_blocks[DDIR_WRITE] % td->fsync_blocks) - && should_fsync(td)) { + if (td->fsync_blocks && !(td->io_issues[DDIR_WRITE] % td->fsync_blocks) + && td->io_issues[DDIR_WRITE] && should_fsync(td)) { io_u->ddir = DDIR_SYNC; - io_u->file = f; return 0; } @@ -223,18 +243,18 @@ static int fill_io_u(struct thread_data *td, struct fio_file *f, * No log, let the seq/rand engine retrieve the next buflen and * position. */ - if (get_next_offset(td, f, io_u)) + if (get_next_offset(td, io_u)) return 1; - io_u->buflen = get_next_buflen(td, f, io_u); + io_u->buflen = get_next_buflen(td, io_u); if (!io_u->buflen) return 1; /* * mark entry before potentially trimming io_u */ - if (!td->read_iolog && !td->sequential && !td->norandommap) - mark_random_map(td, f, io_u); + if (!td->read_iolog && td_random(td) && !td->norandommap) + mark_random_map(td, io_u); /* * If using a write iolog, store this entry. @@ -242,7 +262,6 @@ static int fill_io_u(struct thread_data *td, struct fio_file *f, if (td->write_iolog_file) write_iolog_put(td, io_u); - io_u->file = f; return 0; } @@ -271,16 +290,113 @@ static void io_u_mark_depth(struct thread_data *td) td->total_io_u++; } +static void io_u_mark_latency(struct thread_data *td, unsigned long msec) +{ + int index = 0; + + switch (msec) { + default: + index++; + case 1000 ... 1999: + index++; + case 750 ... 999: + index++; + case 500 ... 749: + index++; + case 250 ... 499: + index++; + case 100 ... 249: + index++; + case 50 ... 99: + index++; + case 20 ... 49: + index++; + case 10 ... 19: + index++; + case 4 ... 9: + index++; + case 2 ... 3: + index++; + case 0 ... 1: + break; + } + + td->io_u_lat[index]++; +} + +/* + * Get next file to service by choosing one at random + */ +static struct fio_file *get_next_file_rand(struct thread_data *td) +{ + unsigned int fileno; + struct fio_file *f; + + do { + long r = os_random_long(&td->next_file_state); + + fileno = (unsigned int) ((double) (td->nr_files - 1) * r / (RAND_MAX + 1.0)); + f = &td->files[fileno]; + if (f->fd != -1) + return f; + } while (1); +} + +/* + * Get next file to service by doing round robin between all available ones + */ +static struct fio_file *get_next_file_rr(struct thread_data *td) +{ + unsigned int old_next_file = td->next_file; + struct fio_file *f; + + do { + f = &td->files[td->next_file]; + + td->next_file++; + if (td->next_file >= td->nr_files) + td->next_file = 0; + + if (f->fd != -1) + break; + + f = NULL; + } while (td->next_file != old_next_file); + + return f; +} + +static struct fio_file *get_next_file(struct thread_data *td) +{ + if (!td->nr_open_files) + return NULL; + + if (td->file_service_type == FIO_FSERVICE_RR) + return get_next_file_rr(td); + else + return get_next_file_rand(td); +} + struct io_u *__get_io_u(struct thread_data *td) { struct io_u *io_u = NULL; - if (!queue_full(td)) { + if (!list_empty(&td->io_u_requeues)) + io_u = list_entry(td->io_u_requeues.next, struct io_u, list); + else if (!queue_full(td)) { io_u = list_entry(td->io_u_freelist.next, struct io_u, list); io_u->buflen = 0; - io_u->error = 0; io_u->resid = 0; + io_u->file = NULL; + io_u->end_io = NULL; + } + + if (io_u) { + assert(io_u->flags & IO_U_F_FREE); + io_u->flags &= ~IO_U_F_FREE; + + io_u->error = 0; list_del(&io_u->list); list_add(&io_u->list, &td->io_u_busylist); td->cur_depth++; @@ -294,24 +410,45 @@ struct io_u *__get_io_u(struct thread_data *td) * Return an io_u to be processed. Gets a buflen and offset, sets direction, * etc. The returned io_u is fully ready to be prepped and submitted. */ -struct io_u *get_io_u(struct thread_data *td, struct fio_file *f) +struct io_u *get_io_u(struct thread_data *td) { + struct fio_file *f; struct io_u *io_u; io_u = __get_io_u(td); if (!io_u) return NULL; + /* + * from a requeue, io_u already setup + */ + if (io_u->file) + goto out; + + do { + f = get_next_file(td); + if (!f) { + put_io_u(td, io_u); + return NULL; + } + + io_u->file = f; + + if (!fill_io_u(td, io_u)) + break; + + /* + * No more to do for this file, close it + */ + io_u->file = NULL; + close_file(td, f); + } while (1); + if (td->zone_bytes >= td->zone_size) { td->zone_bytes = 0; f->last_pos += td->zone_skip; } - if (fill_io_u(td, f, io_u)) { - put_io_u(td, io_u); - return NULL; - } - if (io_u->buflen + io_u->offset > f->real_file_size) { if (td->io_ops->flags & FIO_RAWIO) { put_io_u(td, io_u); @@ -327,32 +464,36 @@ struct io_u *get_io_u(struct thread_data *td, struct fio_file *f) return NULL; } - f->last_pos += io_u->buflen; + f->last_pos = io_u->offset + io_u->buflen; if (td->verify != VERIFY_NONE) populate_verify_io_u(td, io_u); } - if (td_io_prep(td, io_u)) { - put_io_u(td, io_u); - return NULL; - } - /* * Set io data pointers. */ +out: io_u->xfer_buf = io_u->buf; io_u->xfer_buflen = io_u->buflen; + if (td_io_prep(td, io_u)) { + put_io_u(td, io_u); + return NULL; + } + fio_gettime(&io_u->start_time, NULL); return io_u; } -void io_completed(struct thread_data *td, struct io_u *io_u, - struct io_completion_data *icd) +static void io_completed(struct thread_data *td, struct io_u *io_u, + struct io_completion_data *icd) { unsigned long msec; + assert(io_u->flags & IO_U_F_FLIGHT); + io_u->flags &= ~IO_U_F_FLIGHT; + if (io_u->ddir == DDIR_SYNC) { td->last_was_sync = 1; return; @@ -363,6 +504,7 @@ void io_completed(struct thread_data *td, struct io_u *io_u, if (!io_u->error) { unsigned int bytes = io_u->buflen - io_u->resid; const enum fio_ddir idx = io_u->ddir; + int ret; td->io_blocks[idx]++; td->io_bytes[idx] += bytes; @@ -375,24 +517,37 @@ void io_completed(struct thread_data *td, struct io_u *io_u, add_clat_sample(td, idx, msec); add_bw_sample(td, idx, &icd->time); + io_u_mark_latency(td, msec); if ((td_rw(td) || td_write(td)) && idx == DDIR_WRITE) log_io_piece(td, io_u); icd->bytes_done[idx] += bytes; + + if (io_u->end_io) { + ret = io_u->end_io(io_u); + if (ret && !icd->error) + icd->error = ret; + } } else icd->error = io_u->error; } -void ios_completed(struct thread_data *td, struct io_completion_data *icd) +static void init_icd(struct io_completion_data *icd, int nr) { - struct io_u *io_u; - int i; - fio_gettime(&icd->time, NULL); + icd->nr = nr; + icd->error = 0; icd->bytes_done[0] = icd->bytes_done[1] = 0; +} + +static void ios_completed(struct thread_data *td, + struct io_completion_data *icd) +{ + struct io_u *io_u; + int i; for (i = 0; i < icd->nr; i++) { io_u = td->io_ops->event(td, i); @@ -401,3 +556,141 @@ void ios_completed(struct thread_data *td, struct io_completion_data *icd) put_io_u(td, io_u); } } + +/* + * Complete a single io_u for the sync engines. + */ +long io_u_sync_complete(struct thread_data *td, struct io_u *io_u) +{ + struct io_completion_data icd; + + init_icd(&icd, 1); + io_completed(td, io_u, &icd); + put_io_u(td, io_u); + + if (!icd.error) + return icd.bytes_done[0] + icd.bytes_done[1]; + + return -1; +} + +/* + * Called to complete min_events number of io for the async engines. + */ +long io_u_queued_complete(struct thread_data *td, int min_events) +{ + struct io_completion_data icd; + struct timespec *tvp = NULL; + int ret; + + if (!min_events) { + struct timespec ts = { .tv_sec = 0, .tv_nsec = 0, }; + + tvp = &ts; + } + + ret = td_io_getevents(td, min_events, td->cur_depth, tvp); + if (ret < 0) { + td_verror(td, -ret, "td_io_getevents"); + return ret; + } else if (!ret) + return ret; + + init_icd(&icd, ret); + ios_completed(td, &icd); + if (!icd.error) + return icd.bytes_done[0] + icd.bytes_done[1]; + + return -1; +} + +/* + * Call when io_u is really queued, to update the submission latency. + */ +void io_u_queued(struct thread_data *td, struct io_u *io_u) +{ + unsigned long slat_time; + + slat_time = mtime_since(&io_u->start_time, &io_u->issue_time); + add_slat_sample(td, io_u->ddir, slat_time); +} + +#ifdef FIO_USE_TIMEOUT +void io_u_set_timeout(struct thread_data *td) +{ + assert(td->cur_depth); + + td->timer.it_interval.tv_sec = 0; + td->timer.it_interval.tv_usec = 0; + td->timer.it_value.tv_sec = IO_U_TIMEOUT + IO_U_TIMEOUT_INC; + td->timer.it_value.tv_usec = 0; + setitimer(ITIMER_REAL, &td->timer, NULL); + fio_gettime(&td->timeout_end, NULL); +} + +static void io_u_dump(struct io_u *io_u) +{ + unsigned long t_start = mtime_since_now(&io_u->start_time); + unsigned long t_issue = mtime_since_now(&io_u->issue_time); + + log_err("io_u=%p, t_start=%lu, t_issue=%lu\n", io_u, t_start, t_issue); + log_err(" buf=%p/%p, len=%lu/%lu, offset=%llu\n", io_u->buf, io_u->xfer_buf, io_u->buflen, io_u->xfer_buflen, io_u->offset); + log_err(" ddir=%d, fname=%s\n", io_u->ddir, io_u->file->file_name); +} +#else +void io_u_set_timeout(struct thread_data fio_unused *td) +{ +} +#endif + +#ifdef FIO_USE_TIMEOUT +static void io_u_timeout_handler(int fio_unused sig) +{ + struct thread_data *td, *__td; + pid_t pid = getpid(); + struct list_head *entry; + struct io_u *io_u; + int i; + + log_err("fio: io_u timeout\n"); + + /* + * TLS would be nice... + */ + td = NULL; + for_each_td(__td, i) { + if (__td->pid == pid) { + td = __td; + break; + } + } + + if (!td) { + log_err("fio: io_u timeout, can't find job\n"); + exit(1); + } + + if (!td->cur_depth) { + log_err("fio: timeout without pending work?\n"); + return; + } + + log_err("fio: io_u timeout: job=%s, pid=%d\n", td->name, td->pid); + + list_for_each(entry, &td->io_u_busylist) { + io_u = list_entry(entry, struct io_u, list); + + io_u_dump(io_u); + } + + td_verror(td, ETIMEDOUT, "io_u timeout"); + exit(1); +} +#endif + +void io_u_init_timeout(void) +{ +#ifdef FIO_USE_TIMEOUT + signal(SIGALRM, io_u_timeout_handler); +#endif +}