posixaio: speedup by using aio_suspend() instead of manual waiting
[fio.git] / engines / posixaio.c
CommitLineData
2866c82d 1/*
da751ca9
JA
2 * posixaio engine
3 *
4 * IO engine that uses the posix defined aio interface.
2866c82d
JA
5 *
6 */
7#include <stdio.h>
8#include <stdlib.h>
9#include <unistd.h>
10#include <errno.h>
11#include <assert.h>
5f350952
JA
12
13#include "../fio.h"
2866c82d 14
34cfcdaf
JA
15#ifdef FIO_HAVE_POSIXAIO
16
2866c82d
JA
/*
 * Engine-private state. The init hook allocates one of these and stores it
 * in td->io_ops->data; the cleanup hook frees it.
 */
struct posixaio_data {
	/*
	 * Array of td->o.iodepth io_u pointers. The getevents hook fills it
	 * with completed requests and the event hook reads entries back out
	 * by index.
	 */
	struct io_u **aio_events;
};
20
/*
 * Read the CLOCK_MONOTONIC clock into *ts.
 *
 * Returns 0 on success. Returns 1 if clock_gettime() fails (the failure is
 * reported through perror()) or if _POSIX_TIMERS is not defined at compile
 * time, in which case ts is not used at all.
 */
static int fill_timespec(struct timespec *ts)
{
	int failed = 1;

#ifdef _POSIX_TIMERS
	if (clock_gettime(CLOCK_MONOTONIC, ts) == 0)
		failed = 0;
	else
		perror("clock_gettime");
#endif
	return failed;
}
31
/*
 * Microseconds elapsed between *t and the current time as reported by
 * fill_timespec().
 *
 * Returns 0 if the current time cannot be obtained.
 */
static unsigned long long ts_utime_since_now(struct timespec *t)
{
	struct timespec cur;
	long long d_sec, d_nsec;

	if (fill_timespec(&cur) != 0)
		return 0;

	d_sec = cur.tv_sec - t->tv_sec;
	d_nsec = cur.tv_nsec - t->tv_nsec;

	/* borrow one second when the nanosecond part went negative */
	if (d_nsec < 0 && d_sec > 0) {
		d_nsec += 1000000000;
		d_sec--;
	}

	/* seconds -> usec, nanoseconds -> usec */
	return (d_sec * 1000000) + (d_nsec / 1000);
}
51
7a16dd02
JA
52static int fio_posixaio_cancel(struct thread_data fio_unused *td,
53 struct io_u *io_u)
2866c82d 54{
53cdc686
JA
55 struct fio_file *f = io_u->file;
56 int r = aio_cancel(f->fd, &io_u->aiocb);
2866c82d
JA
57
58 if (r == 1 || r == AIO_CANCELED)
59 return 0;
60
61 return 1;
62}
63
7a16dd02
JA
64static int fio_posixaio_prep(struct thread_data fio_unused *td,
65 struct io_u *io_u)
2866c82d
JA
66{
67 struct aiocb *aiocb = &io_u->aiocb;
53cdc686 68 struct fio_file *f = io_u->file;
2866c82d 69
53cdc686 70 aiocb->aio_fildes = f->fd;
cec6b55d
JA
71 aiocb->aio_buf = io_u->xfer_buf;
72 aiocb->aio_nbytes = io_u->xfer_buflen;
2866c82d
JA
73 aiocb->aio_offset = io_u->offset;
74
75 io_u->seen = 0;
76 return 0;
77}
78
3c77037e
JA
79#define SUSPEND_ENTRIES 8
80
e7d2e616
JA
81static int fio_posixaio_getevents(struct thread_data *td, unsigned int min,
82 unsigned int max, struct timespec *t)
2866c82d
JA
83{
84 struct posixaio_data *pd = td->io_ops->data;
3c77037e 85 struct aiocb *suspend_list[SUSPEND_ENTRIES];
2866c82d
JA
86 struct list_head *entry;
87 struct timespec start;
a3cc770d 88 int have_timeout = 0;
3c77037e 89 int suspend_entries = 0;
a3cc770d 90 unsigned int r;
2866c82d
JA
91
92 if (t && !fill_timespec(&start))
93 have_timeout = 1;
94
95 r = 0;
3c77037e 96 suspend_list[0] = NULL;
2866c82d
JA
97restart:
98 list_for_each(entry, &td->io_u_busylist) {
99 struct io_u *io_u = list_entry(entry, struct io_u, list);
100 int err;
101
102 if (io_u->seen)
103 continue;
104
105 err = aio_error(&io_u->aiocb);
3c77037e
JA
106 if (err == EINPROGRESS) {
107 if (suspend_entries < SUSPEND_ENTRIES) {
108 suspend_list[suspend_entries] = &io_u->aiocb;
109 suspend_entries++;
110 }
3f344316 111 continue;
3c77037e 112 }
3f344316
JA
113
114 io_u->seen = 1;
115 pd->aio_events[r++] = io_u;
116
117 if (err == ECANCELED)
118 io_u->resid = io_u->xfer_buflen;
119 else if (!err) {
120 ssize_t retval = aio_return(&io_u->aiocb);
121
122 io_u->resid = io_u->xfer_buflen - retval;
123 } else
124 io_u->error = err;
2866c82d
JA
125
126 if (r >= max)
127 break;
128 }
129
130 if (r >= min)
131 return r;
132
133 if (have_timeout) {
134 unsigned long long usec;
135
136 usec = (t->tv_sec * 1000000) + (t->tv_nsec / 1000);
137 if (ts_utime_since_now(&start) > usec)
138 return r;
139 }
140
141 /*
3c77037e 142 * must have some in-flight, wait for at least one
2866c82d 143 */
3c77037e
JA
144 aio_suspend((const struct aiocb * const *)suspend_list,
145 suspend_entries, t);
2866c82d
JA
146 goto restart;
147}
148
149static struct io_u *fio_posixaio_event(struct thread_data *td, int event)
150{
151 struct posixaio_data *pd = td->io_ops->data;
152
153 return pd->aio_events[event];
154}
155
156static int fio_posixaio_queue(struct thread_data fio_unused *td,
157 struct io_u *io_u)
158{
159 struct aiocb *aiocb = &io_u->aiocb;
160 int ret;
161
7101d9c2
JA
162 fio_ro_check(td, io_u);
163
2866c82d
JA
164 if (io_u->ddir == DDIR_READ)
165 ret = aio_read(aiocb);
87dc1ab1 166 else if (io_u->ddir == DDIR_WRITE)
2866c82d 167 ret = aio_write(aiocb);
87dc1ab1
JA
168 else
169 ret = aio_fsync(O_SYNC, aiocb);
2866c82d 170
95bcd815 171 if (ret) {
2866c82d 172 io_u->error = errno;
e1161c32 173 td_verror(td, io_u->error, "xfer");
36167d82 174 return FIO_Q_COMPLETED;
95bcd815 175 }
36167d82
JA
176
177 return FIO_Q_QUEUED;
2866c82d
JA
178}
179
180static void fio_posixaio_cleanup(struct thread_data *td)
181{
182 struct posixaio_data *pd = td->io_ops->data;
183
184 if (pd) {
185 free(pd->aio_events);
186 free(pd);
187 td->io_ops->data = NULL;
188 }
189}
190
191static int fio_posixaio_init(struct thread_data *td)
192{
193 struct posixaio_data *pd = malloc(sizeof(*pd));
194
cb781c75 195 memset(pd, 0, sizeof(*pd));
2dc1bbeb
JA
196 pd->aio_events = malloc(td->o.iodepth * sizeof(struct io_u *));
197 memset(pd->aio_events, 0, td->o.iodepth * sizeof(struct io_u *));
2866c82d
JA
198
199 td->io_ops->data = pd;
200 return 0;
201}
202
5f350952 203static struct ioengine_ops ioengine = {
2866c82d
JA
204 .name = "posixaio",
205 .version = FIO_IOOPS_VERSION,
206 .init = fio_posixaio_init,
207 .prep = fio_posixaio_prep,
208 .queue = fio_posixaio_queue,
209 .cancel = fio_posixaio_cancel,
210 .getevents = fio_posixaio_getevents,
211 .event = fio_posixaio_event,
212 .cleanup = fio_posixaio_cleanup,
b5af8293
JA
213 .open_file = generic_open_file,
214 .close_file = generic_close_file,
2866c82d 215};
34cfcdaf
JA
216
217#else /* FIO_HAVE_POSIXAIO */
218
219/*
220 * When we have a proper configure system in place, we simply won't build
221 * and install this io engine. For now install a crippled version that
222 * just complains and fails to load.
223 */
224static int fio_posixaio_init(struct thread_data fio_unused *td)
225{
226 fprintf(stderr, "fio: posixaio not available\n");
227 return 1;
228}
229
5f350952 230static struct ioengine_ops ioengine = {
34cfcdaf
JA
231 .name = "posixaio",
232 .version = FIO_IOOPS_VERSION,
233 .init = fio_posixaio_init,
234};
235
236#endif
5f350952
JA
237
/*
 * Register whichever "posixaio" ioengine table was compiled in above.
 * NOTE(review): fio_init presumably marks this to run automatically at
 * program start - confirm against its definition.
 */
static void fio_init fio_posixaio_register(void)
{
	register_ioengine(&ioengine);
}
242
/*
 * Unregister the "posixaio" ioengine table again.
 * NOTE(review): fio_exit presumably marks this to run automatically at
 * program exit - confirm against its definition.
 */
static void fio_exit fio_posixaio_unregister(void)
{
	unregister_ioengine(&ioengine);
}