X-Git-Url: https://git.kernel.dk/?p=fio.git;a=blobdiff_plain;f=engines%2Frbd.c;h=268b6ebdffad2b71e4da565ed90867e76f90947a;hp=87ed360f7c26a25fb401aac833b9fe05d0c288f4;hb=HEAD;hpb=ecfd2bb08cc87bc9a1b3d612258f1fdfb4d09698 diff --git a/engines/rbd.c b/engines/rbd.c index 87ed360f..2f25889a 100644 --- a/engines/rbd.c +++ b/engines/rbd.c @@ -10,6 +10,12 @@ #include "../fio.h" #include "../optgroup.h" +#ifdef CONFIG_RBD_POLL +/* add for poll */ +#include <poll.h> +#include <sys/eventfd.h> +#endif + struct fio_rbd_iou { struct io_u *io_u; rbd_completion_t completion; @@ -23,6 +29,8 @@ struct rbd_data { rbd_image_t image; struct io_u **aio_events; struct io_u **sort_events; + int fd; /* add for poll */ + bool connected; }; struct rbd_options { @@ -91,13 +99,18 @@ static int _fio_setup_rbd_data(struct thread_data *td, { struct rbd_data *rbd; - if (td->io_ops->data) + if (td->io_ops_data) return 0; rbd = calloc(1, sizeof(struct rbd_data)); if (!rbd) goto failed; + rbd->connected = false; + + /* add for poll, init fd: -1 */ + rbd->fd = -1; + rbd->aio_events = calloc(td->o.iodepth, sizeof(struct io_u *)); if (!rbd->aio_events) goto failed; @@ -110,15 +123,49 @@ static int _fio_setup_rbd_data(struct thread_data *td, return 0; failed: - if (rbd) + if (rbd) { + if (rbd->aio_events) + free(rbd->aio_events); + if (rbd->sort_events) + free(rbd->sort_events); free(rbd); + } return 1; } +#ifdef CONFIG_RBD_POLL +static bool _fio_rbd_setup_poll(struct rbd_data *rbd) +{ + int r; + + /* add for rbd poll */ + rbd->fd = eventfd(0, EFD_SEMAPHORE); + if (rbd->fd < 0) { + log_err("eventfd failed.\n"); + return false; + } + + r = rbd_set_image_notification(rbd->image, rbd->fd, EVENT_TYPE_EVENTFD); + if (r < 0) { + log_err("rbd_set_image_notification failed.\n"); + close(rbd->fd); + rbd->fd = -1; + return false; + } + + return true; +} +#else +static bool _fio_rbd_setup_poll(struct rbd_data *rbd) +{ + return true; +} +#endif + static int _fio_rbd_connect(struct thread_data *td) { - struct rbd_data *rbd = 
td->io_ops->data; + struct rbd_data *rbd = td->io_ops_data; struct rbd_options *o = td->eo; int r; @@ -126,18 +173,26 @@ static int _fio_rbd_connect(struct thread_data *td) char *client_name = NULL; /* - * If we specify cluser name, the rados_creat2 + * If we specify cluster name, the rados_create2 * will not assume 'client.'. name is considered * as a full type.id namestr */ - if (!index(o->client_name, '.')) { - client_name = calloc(1, strlen("client.") + - strlen(o->client_name) + 1); - strcat(client_name, "client."); - o->client_name = strcat(client_name, o->client_name); + if (o->client_name) { + if (!index(o->client_name, '.')) { + client_name = calloc(1, strlen("client.") + + strlen(o->client_name) + 1); + strcat(client_name, "client."); + strcat(client_name, o->client_name); + } else { + client_name = o->client_name; + } } + r = rados_create2(&rbd->cluster, o->cluster_name, - o->client_name, 0); + client_name, 0); + + if (client_name && !index(o->client_name, '.')) + free(client_name); } else r = rados_create(&rbd->cluster, o->client_name); @@ -145,6 +200,14 @@ static int _fio_rbd_connect(struct thread_data *td) log_err("rados_create failed.\n"); goto failed_early; } + if (o->pool_name == NULL) { + log_err("rbd pool name must be provided.\n"); + goto failed_early; + } + if (!o->rbd_name) { + log_err("rbdname must be provided.\n"); + goto failed_early; + } r = rados_conf_read_file(rbd->cluster, NULL); if (r < 0) { @@ -164,13 +227,38 @@ static int _fio_rbd_connect(struct thread_data *td) goto failed_shutdown; } + if (td->o.odirect) { + r = rados_conf_set(rbd->cluster, "rbd_cache", "false"); + if (r < 0) { + log_info("failed to disable RBD in-memory cache\n"); + } + } + r = rbd_open(rbd->io_ctx, o->rbd_name, &rbd->image, NULL /*snap */ ); if (r < 0) { log_err("rbd_open failed.\n"); goto failed_open; } + + if (!td->o.odirect) { + /* + * ensure cache enables writeback/around mode unless explicitly + * configured for writethrough mode + */ + r = 
rbd_flush(rbd->image); + if (r < 0) { + log_info("rbd: failed to issue initial flush\n"); + } + } + + if (!_fio_rbd_setup_poll(rbd)) + goto failed_poll; + return 0; +failed_poll: + rbd_close(rbd->image); + rbd->image = NULL; failed_open: rados_ioctx_destroy(rbd->io_ctx); rbd->io_ctx = NULL; @@ -186,6 +274,12 @@ static void _fio_rbd_disconnect(struct rbd_data *rbd) if (!rbd) return; + /* close eventfd */ + if (rbd->fd != -1) { + close(rbd->fd); + rbd->fd = -1; + } + /* shutdown everything */ if (rbd->image) { rbd_close(rbd->image); @@ -216,7 +310,7 @@ static void _fio_rbd_finish_aiocb(rbd_completion_t comp, void *data) */ ret = rbd_aio_get_return_value(fri->completion); if (ret < 0) { - io_u->error = ret; + io_u->error = -ret; io_u->resid = io_u->xfer_buflen; } else io_u->error = 0; @@ -226,7 +320,7 @@ static void _fio_rbd_finish_aiocb(rbd_completion_t comp, void *data) static struct io_u *fio_rbd_event(struct thread_data *td, int event) { - struct rbd_data *rbd = td->io_ops->data; + struct rbd_data *rbd = td->io_ops_data; return rbd->aio_events[event]; } @@ -248,12 +342,14 @@ static inline int fri_check_complete(struct rbd_data *rbd, struct io_u *io_u, return 0; } +#ifndef CONFIG_RBD_POLL static inline int rbd_io_u_seen(struct io_u *io_u) { struct fio_rbd_iou *fri = io_u->engine_data; return fri->io_seen; } +#endif static void rbd_io_u_wait_complete(struct io_u *io_u) { @@ -282,12 +378,46 @@ static int rbd_io_u_cmp(const void *p1, const void *p2) static int rbd_iter_events(struct thread_data *td, unsigned int *events, unsigned int min_evts, int wait) { - struct rbd_data *rbd = td->io_ops->data; + struct rbd_data *rbd = td->io_ops_data; unsigned int this_events = 0; struct io_u *io_u; - int i, sidx; + int i, sidx = 0; + +#ifdef CONFIG_RBD_POLL + int ret = 0; + int event_num = 0; + struct fio_rbd_iou *fri = NULL; + rbd_completion_t comps[min_evts]; + uint64_t counter; + bool completed; + + struct pollfd pfd; + pfd.fd = rbd->fd; + pfd.events = POLLIN; + + ret = 
poll(&pfd, 1, wait ? -1 : 0); + if (ret <= 0) + return 0; + if (!(pfd.revents & POLLIN)) + return 0; - sidx = 0; + event_num = rbd_poll_io_events(rbd->image, comps, min_evts); + + for (i = 0; i < event_num; i++) { + fri = rbd_aio_get_arg(comps[i]); + io_u = fri->io_u; + + /* best effort to decrement the semaphore */ + ret = read(rbd->fd, &counter, sizeof(counter)); + if (ret <= 0) + log_err("rbd_iter_events failed to decrement semaphore.\n"); + + completed = fri_check_complete(rbd, io_u, events); + assert(completed); + + this_events++; + } +#else io_u_qiter(&td->io_u_all, io_u, i) { if (!(io_u->flags & IO_U_F_FLIGHT)) continue; @@ -299,6 +429,7 @@ static int rbd_iter_events(struct thread_data *td, unsigned int *events, else if (wait) rbd->sort_events[sidx++] = io_u; } +#endif if (!wait || !sidx) return this_events; @@ -359,9 +490,10 @@ static int fio_rbd_getevents(struct thread_data *td, unsigned int min, return events; } -static int fio_rbd_queue(struct thread_data *td, struct io_u *io_u) +static enum fio_q_status fio_rbd_queue(struct thread_data *td, + struct io_u *io_u) { - struct rbd_data *rbd = td->io_ops->data; + struct rbd_data *rbd = td->io_ops_data; struct fio_rbd_iou *fri = io_u->engine_data; int r = -1; @@ -409,6 +541,7 @@ static int fio_rbd_queue(struct thread_data *td, struct io_u *io_u) } else { dprint(FD_IO, "%s: Warning: unhandled ddir: %d\n", __func__, io_u->ddir); + r = -EINVAL; goto failed_comp; } @@ -416,7 +549,7 @@ static int fio_rbd_queue(struct thread_data *td, struct io_u *io_u) failed_comp: rbd_aio_release(fri->completion); failed: - io_u->error = r; + io_u->error = -r; td_verror(td, io_u->error, "xfer"); return FIO_Q_COMPLETED; } @@ -424,6 +557,10 @@ failed: static int fio_rbd_init(struct thread_data *td) { int r; + struct rbd_data *rbd = td->io_ops_data; + + if (rbd->connected) + return 0; r = _fio_rbd_connect(td); if (r) { @@ -439,7 +576,7 @@ failed: static void fio_rbd_cleanup(struct thread_data *td) { - struct rbd_data *rbd = 
td->io_ops->data; + struct rbd_data *rbd = td->io_ops_data; if (rbd) { _fio_rbd_disconnect(rbd); @@ -454,20 +591,15 @@ static int fio_rbd_setup(struct thread_data *td) rbd_image_info_t info; struct fio_file *f; struct rbd_data *rbd = NULL; - int major, minor, extra; int r; - /* log version of librbd. No cluster connection required. */ - rbd_version(&major, &minor, &extra); - log_info("rbd engine: RBD version: %d.%d.%d\n", major, minor, extra); - /* allocate engine specific structure to deal with librbd. */ r = _fio_setup_rbd_data(td, &rbd); if (r) { log_err("fio_setup_rbd_data failed.\n"); goto cleanup; } - td->io_ops->data = rbd; + td->io_ops_data = rbd; /* librbd does not allow us to run first in the main thread and later * in a fork child. It needs to be the same process context all the @@ -484,18 +616,24 @@ static int fio_rbd_setup(struct thread_data *td) log_err("fio_rbd_connect failed.\n"); goto cleanup; } + rbd->connected = true; /* get size of the RADOS block device */ r = rbd_stat(rbd->image, &info, sizeof(info)); if (r < 0) { log_err("rbd_status failed.\n"); - goto disconnect; + goto cleanup; + } else if (info.size == 0) { + log_err("image size should be larger than zero.\n"); + r = -EINVAL; + goto cleanup; } - dprint(FD_IO, "rbd-engine: image size: %lu\n", info.size); + + dprint(FD_IO, "rbd-engine: image size: %" PRIu64 "\n", info.size); /* taken from "net" engine. Pretend we deal with files, * even if we do not have any ideas about files. - * The size of the RBD is set instead of a artificial file. + * The size of the RBD is set instead of an artificial file. */ if (!td->files_index) { add_file(td, td->o.filename ? : "rbd", 0, 0); @@ -505,14 +643,8 @@ static int fio_rbd_setup(struct thread_data *td) f = td->files[0]; f->real_file_size = info.size; - /* disconnect, then we were only connected to determine - * the size of the RBD. 
- */ - _fio_rbd_disconnect(rbd); return 0; -disconnect: - _fio_rbd_disconnect(rbd); cleanup: fio_rbd_cleanup(td); return r; @@ -526,7 +658,7 @@ static int fio_rbd_open(struct thread_data *td, struct fio_file *f) static int fio_rbd_invalidate(struct thread_data *td, struct fio_file *f) { #if defined(CONFIG_RBD_INVAL) - struct rbd_data *rbd = td->io_ops->data; + struct rbd_data *rbd = td->io_ops_data; return rbd_invalidate_cache(rbd->image); #else @@ -554,7 +686,7 @@ static int fio_rbd_io_u_init(struct thread_data *td, struct io_u *io_u) return 0; } -static struct ioengine_ops ioengine = { +FIO_STATIC struct ioengine_ops ioengine = { .name = "rbd", .version = FIO_IOOPS_VERSION, .setup = fio_rbd_setup,