X-Git-Url: https://git.kernel.dk/?p=fio.git;a=blobdiff_plain;f=engines%2Fsyslet-rw.c;h=2a3095d405c7f0a80ef773877e24acbcdb0009f9;hp=d6d9943c0bee29b2b23463c3ea1751f76f198868;hb=7756b0d046ef74c32df134c8b716237cc5e16bad;hpb=2ca50be45bcacd652e2cefb6a69837e051cb297a diff --git a/engines/syslet-rw.c b/engines/syslet-rw.c index d6d9943c..2a3095d4 100644 --- a/engines/syslet-rw.c +++ b/engines/syslet-rw.c @@ -17,31 +17,45 @@ struct syslet_data { struct io_u **events; unsigned int nr_events; - struct async_head_user *ahu; + struct async_head_user ahu; struct syslet_uatom **ring; - unsigned int ring_index; + + struct syslet_uatom *head, *tail; + struct syslet_uatom **event_map; + unsigned int event_map_idx; }; -/* - * Inspect the ring to see if we have completed events - */ -static void fio_syslet_complete(struct thread_data *td) +static void fio_syslet_complete_atom(struct thread_data *td, + struct syslet_uatom *atom) { struct syslet_data *sd = td->io_ops->data; + struct io_u *io_u; + int i, end; - do { - struct syslet_uatom *atom; - struct io_u *io_u; - long ret; + if (!sd->event_map_idx) + return; - atom = sd->ring[sd->ring_index]; - if (!atom) + /* + * Find the start of the string of atoms for this sequence + */ + for (end = sd->event_map_idx - 1; end >= 0; end--) + if (atom == sd->event_map[end]) break; - sd->ring[sd->ring_index] = NULL; - if (++sd->ring_index == td->iodepth) - sd->ring_index = 0; + if (end < 0 || atom != sd->event_map[end]) { + printf("didn't find atom\n"); + return; + } + + //printf("end=%d, total %d\n", end, sd->event_map_idx); + + /* + * now complete in right order + */ + for (i = 0; i <= end; i++) { + long ret; + atom = sd->event_map[i]; io_u = atom->private; ret = *atom->ret_ptr; if (ret > 0) @@ -49,7 +63,42 @@ static void fio_syslet_complete(struct thread_data *td) else if (ret < 0) io_u->error = ret; + assert(sd->nr_events < td->iodepth); sd->events[sd->nr_events++] = io_u; + } + + /* + * Move later completions to the front, if we didn't complete all + */ + if (end == (int) sd->event_map_idx - 1) + sd->event_map_idx = 0; + else { + int nr = sd->event_map_idx - end - 1; + + memmove(sd->event_map, &sd->event_map[end + 1], nr * sizeof(struct syslet_uatom *)); + sd->event_map_idx = nr; + } +} + +/* + * Inspect the ring to see if we have completed events + */ +static void fio_syslet_complete(struct thread_data *td) +{ + struct syslet_data *sd = td->io_ops->data; + + do { + struct syslet_uatom *atom; + + atom = sd->ring[sd->ahu.user_ring_idx]; + if (!atom) + break; + + sd->ring[sd->ahu.user_ring_idx] = NULL; + if (++sd->ahu.user_ring_idx == td->iodepth) + sd->ahu.user_ring_idx = 0; + + fio_syslet_complete_atom(td, atom); } while (1); } @@ -58,7 +107,6 @@ static int fio_syslet_getevents(struct thread_data *td, int min, struct timespec fio_unused *t) { struct syslet_data *sd = td->io_ops->data; - int get_events; long ret; do { @@ -73,10 +121,9 @@ static int fio_syslet_getevents(struct thread_data *td, int min, /* * OK, we need to wait for some events... */ - get_events = min - sd->nr_events; - ret = async_wait(get_events); + ret = async_wait(1, sd->ahu.user_ring_idx, &sd->ahu); if (ret < 0) - return errno; + return -errno; } while (1); ret = sd->nr_events; @@ -113,7 +160,7 @@ static void init_atom(struct syslet_uatom *atom, int nr, void *arg0, static void fio_syslet_prep_sync(struct io_u *io_u, struct fio_file *f) { init_atom(&io_u->req.atom, __NR_fsync, &f->fd, NULL, NULL, NULL, - &io_u->req.ret, SYSLET_STOP_ON_NEGATIVE, io_u); + &io_u->req.ret, 0, io_u); } static void fio_syslet_prep_rw(struct io_u *io_u, struct fio_file *f) @@ -129,8 +176,7 @@ static void fio_syslet_prep_rw(struct io_u *io_u, struct fio_file *f) nr = __NR_pwrite64; init_atom(&io_u->req.atom, nr, &f->fd, &io_u->xfer_buf, - &io_u->xfer_buflen, &io_u->offset, &io_u->req.ret, - SYSLET_STOP_ON_NEGATIVE, io_u); + &io_u->xfer_buflen, &io_u->offset, &io_u->req.ret, 0, io_u); } static int fio_syslet_prep(struct thread_data fio_unused *td, struct io_u *io_u) @@ -145,67 +191,81 @@ static int fio_syslet_prep(struct thread_data fio_unused *td, struct io_u *io_u) return 0; } -static int fio_syslet_queue(struct thread_data *td, struct io_u *io_u) +static void cachemiss_thread_start(void) +{ + while (1) + async_thread(NULL, NULL); +} + +#define THREAD_STACK_SIZE (16384) + +static unsigned long thread_stack_alloc() +{ + return (unsigned long)malloc(THREAD_STACK_SIZE) + THREAD_STACK_SIZE; +} + +static int fio_syslet_commit(struct thread_data *td) { struct syslet_data *sd = td->io_ops->data; struct syslet_uatom *done; - long ret; - done = async_exec(&io_u->req.atom); - if (!done) + if (!sd->head) return 0; + if (!sd->ahu.new_thread_stack) + sd->ahu.new_thread_stack = thread_stack_alloc(); + /* - * completed sync + * On sync completion, the atom is returned. So on NULL return + * it's queued asynchronously. */ - ret = io_u->req.ret; - if (ret != (long) io_u->xfer_buflen) { - if (ret > 0) { - io_u->resid = io_u->xfer_buflen - ret; - io_u->error = 0; - return ret; - } else - io_u->error = errno; - } + done = async_exec(sd->head, &sd->ahu); - if (!io_u->error) - sd->events[sd->nr_events++] = io_u; - else - td_verror(td, io_u->error); + sd->head = sd->tail = NULL; + + if (done) + fio_syslet_complete_atom(td, done); + + return 0; +} - return io_u->error; +static int fio_syslet_queue(struct thread_data *td, struct io_u *io_u) +{ + struct syslet_data *sd = td->io_ops->data; + + if (sd->tail) { + sd->tail->next = &io_u->req.atom; + sd->tail = &io_u->req.atom; + } else + sd->head = sd->tail = &io_u->req.atom; + + sd->event_map[sd->event_map_idx++] = sd->tail; + return FIO_Q_QUEUED; } static int async_head_init(struct syslet_data *sd, unsigned int depth) { unsigned long ring_size; - sd->ahu = malloc(sizeof(struct async_head_user)); - memset(sd->ahu, 0, sizeof(struct async_head_user)); + memset(&sd->ahu, 0, sizeof(struct async_head_user)); ring_size = sizeof(struct syslet_uatom *) * depth; sd->ring = malloc(ring_size); memset(sd->ring, 0, ring_size); - sd->ahu->completion_ring = sd->ring; - sd->ahu->ring_size_bytes = ring_size; - sd->ahu->max_nr_threads = -1; - - if (async_register(sd->ahu, sizeof(*sd->ahu)) < 0) { - perror("async_register"); - fprintf(stderr, "fio: syslet likely not supported\n"); - free(sd->ring); - free(sd->ahu); - return 1; - } + sd->ahu.user_ring_idx = 0; + sd->ahu.completion_ring = sd->ring; + sd->ahu.ring_size_bytes = ring_size; + sd->ahu.head_stack = thread_stack_alloc(); + sd->ahu.head_eip = (unsigned long)cachemiss_thread_start; + sd->ahu.new_thread_eip = (unsigned long)cachemiss_thread_start; return 0; } static void async_head_exit(struct syslet_data *sd) { - if (async_unregister(sd->ahu, sizeof(*sd->ahu)) < 0) - perror("async_register"); + free(sd->ring); } static void fio_syslet_cleanup(struct thread_data *td) @@ -215,6 +275,7 @@ static void fio_syslet_cleanup(struct thread_data *td) if (sd) { async_head_exit(sd); free(sd->events); + free(sd->event_map); free(sd); td->io_ops->data = NULL; } @@ -229,6 +290,8 @@ static int fio_syslet_init(struct thread_data *td) memset(sd, 0, sizeof(*sd)); sd->events = malloc(sizeof(struct io_u *) * td->iodepth); memset(sd->events, 0, sizeof(struct io_u *) * td->iodepth); + sd->event_map = malloc(sizeof(struct syslet_uatom *) * td->iodepth); + memset(sd->event_map, 0, sizeof(struct syslet_uatom *) * td->iodepth); /* * This will handily fail for kernels where syslet isn't available @@ -249,6 +312,7 @@ static struct ioengine_ops ioengine = { .init = fio_syslet_init, .prep = fio_syslet_prep, .queue = fio_syslet_queue, + .commit = fio_syslet_commit, .getevents = fio_syslet_getevents, .event = fio_syslet_event, .cleanup = fio_syslet_cleanup,