blob: 8ab88fbb1faf2821c442015f85f78e24cb1d244d [file] [log] [blame]
/*
 * posixaio engine
 *
 * IO engine that uses the POSIX-defined aio interface.
 *
 */
7#include <stdio.h>
8#include <stdlib.h>
9#include <unistd.h>
10#include <errno.h>
Jens Axboebc733f32008-06-02 12:25:12 +020011#include <fcntl.h>
Jens Axboe5f350952006-11-07 15:20:59 +010012
13#include "../fio.h"
Jens Axboe2866c822006-10-09 15:57:48 +020014
/*
 * Per-thread state of the posixaio engine, stored in td->io_ops->data.
 */
struct posixaio_data {
	/*
	 * Completed io_us collected by fio_posixaio_getevents() and handed
	 * out by index from fio_posixaio_event(); fio_posixaio_init()
	 * allocates td->o.iodepth slots.
	 */
	struct io_u **aio_events;

	/*
	 * Requests submitted by fio_posixaio_queue() that have not yet been
	 * reaped by fio_posixaio_getevents().
	 */
	unsigned queued;
};
19
/*
 * Store the current time in *ts.
 *
 * With CONFIG_CLOCK_GETTIME the time comes from clock_gettime(), using
 * CLOCK_MONOTONIC when CONFIG_CLOCK_MONOTONIC is defined and CLOCK_REALTIME
 * otherwise. Without CONFIG_CLOCK_GETTIME it comes from gettimeofday(),
 * with the microsecond part scaled to nanoseconds.
 *
 * Returns 0 on success, or 1 if clock_gettime() failed (the failure is
 * reported through perror()).
 */
static int fill_timespec(struct timespec *ts)
{
#ifndef CONFIG_CLOCK_GETTIME
	struct timeval now;

	gettimeofday(&now, NULL);
	ts->tv_sec = now.tv_sec;
	ts->tv_nsec = now.tv_usec * 1000;
	return 0;
#else
#ifdef CONFIG_CLOCK_MONOTONIC
	clockid_t clock_id = CLOCK_MONOTONIC;
#else
	clockid_t clock_id = CLOCK_REALTIME;
#endif

	if (clock_gettime(clock_id, ts) != 0) {
		perror("clock_gettime");
		return 1;
	}

	return 0;
#endif
}
42
/*
 * Return the number of microseconds between *t and the current time as
 * reported by fill_timespec().
 *
 * Returns 0 when the current time cannot be obtained. The difference is
 * computed in signed arithmetic and converted to unsigned on return, so a
 * start time that lies in the future yields a very large value.
 */
static unsigned long long ts_utime_since_now(struct timespec *t)
{
	struct timespec cur;
	long long delta_sec, delta_nsec;

	if (fill_timespec(&cur) != 0)
		return 0;

	delta_sec = cur.tv_sec - t->tv_sec;
	delta_nsec = cur.tv_nsec - t->tv_nsec;

	/* borrow one second when only the nanosecond part went negative */
	if (delta_nsec < 0 && delta_sec > 0) {
		delta_sec -= 1;
		delta_nsec += 1000000000;
	}

	/* seconds -> usec, nanoseconds -> usec */
	return delta_sec * 1000000 + delta_nsec / 1000;
}
62
Jens Axboe7a16dd02006-10-18 17:21:58 +020063static int fio_posixaio_cancel(struct thread_data fio_unused *td,
64 struct io_u *io_u)
Jens Axboe2866c822006-10-09 15:57:48 +020065{
Jens Axboe53cdc682006-10-18 11:50:58 +020066 struct fio_file *f = io_u->file;
67 int r = aio_cancel(f->fd, &io_u->aiocb);
Jens Axboe2866c822006-10-09 15:57:48 +020068
YAMAMOTO Takashi2faf9ec2010-06-11 09:21:33 +020069 if (r == AIO_ALLDONE || r == AIO_CANCELED)
Jens Axboe2866c822006-10-09 15:57:48 +020070 return 0;
71
72 return 1;
73}
74
Jens Axboe7a16dd02006-10-18 17:21:58 +020075static int fio_posixaio_prep(struct thread_data fio_unused *td,
76 struct io_u *io_u)
Jens Axboe2866c822006-10-09 15:57:48 +020077{
Jens Axboee97c1442011-09-21 09:38:01 +020078 os_aiocb_t *aiocb = &io_u->aiocb;
Jens Axboe53cdc682006-10-18 11:50:58 +020079 struct fio_file *f = io_u->file;
Jens Axboe2866c822006-10-09 15:57:48 +020080
Jens Axboe53cdc682006-10-18 11:50:58 +020081 aiocb->aio_fildes = f->fd;
Jens Axboecec6b552007-02-06 20:15:38 +010082 aiocb->aio_buf = io_u->xfer_buf;
83 aiocb->aio_nbytes = io_u->xfer_buflen;
Jens Axboe2866c822006-10-09 15:57:48 +020084 aiocb->aio_offset = io_u->offset;
Jens Axboe9918be52011-07-09 13:33:38 +020085 aiocb->aio_sigevent.sigev_notify = SIGEV_NONE;
Jens Axboe2866c822006-10-09 15:57:48 +020086
87 io_u->seen = 0;
88 return 0;
89}
90
Jens Axboe3c770372008-03-10 18:45:57 +010091#define SUSPEND_ENTRIES 8
92
Jens Axboee7d2e612007-12-11 10:49:39 +010093static int fio_posixaio_getevents(struct thread_data *td, unsigned int min,
Jens Axboe0cbbc392014-09-30 16:04:12 -060094 unsigned int max, const struct timespec *t)
Jens Axboe2866c822006-10-09 15:57:48 +020095{
96 struct posixaio_data *pd = td->io_ops->data;
Jens Axboee97c1442011-09-21 09:38:01 +020097 os_aiocb_t *suspend_list[SUSPEND_ENTRIES];
Jens Axboe2866c822006-10-09 15:57:48 +020098 struct timespec start;
Jens Axboea3cc7702007-12-11 13:23:27 +010099 int have_timeout = 0;
Jens Axboef8326422013-03-22 15:23:20 -0600100 int suspend_entries;
Jens Axboe2ae0b202013-05-28 14:16:55 +0200101 struct io_u *io_u;
Jens Axboea3cc7702007-12-11 13:23:27 +0100102 unsigned int r;
Jens Axboe2ae0b202013-05-28 14:16:55 +0200103 int i;
Jens Axboe2866c822006-10-09 15:57:48 +0200104
105 if (t && !fill_timespec(&start))
106 have_timeout = 1;
Jens Axboe5351f562013-01-23 14:02:23 -0700107 else
108 memset(&start, 0, sizeof(start));
Jens Axboe2866c822006-10-09 15:57:48 +0200109
110 r = 0;
111restart:
Jens Axboef8326422013-03-22 15:23:20 -0600112 memset(suspend_list, 0, sizeof(*suspend_list));
113 suspend_entries = 0;
Jens Axboe2ae0b202013-05-28 14:16:55 +0200114 io_u_qiter(&td->io_u_all, io_u, i) {
Jens Axboe2866c822006-10-09 15:57:48 +0200115 int err;
116
Jens Axboe2ae0b202013-05-28 14:16:55 +0200117 if (io_u->seen || !(io_u->flags & IO_U_F_FLIGHT))
Jens Axboe2866c822006-10-09 15:57:48 +0200118 continue;
119
120 err = aio_error(&io_u->aiocb);
Jens Axboe3c770372008-03-10 18:45:57 +0100121 if (err == EINPROGRESS) {
122 if (suspend_entries < SUSPEND_ENTRIES) {
123 suspend_list[suspend_entries] = &io_u->aiocb;
124 suspend_entries++;
125 }
Jens Axboe3f344312007-03-14 14:14:48 +0100126 continue;
Jens Axboe3c770372008-03-10 18:45:57 +0100127 }
Jens Axboe3f344312007-03-14 14:14:48 +0100128
129 io_u->seen = 1;
Jens Axboe207cb0f2008-06-02 12:28:02 +0200130 pd->queued--;
Jens Axboe3f344312007-03-14 14:14:48 +0100131 pd->aio_events[r++] = io_u;
132
133 if (err == ECANCELED)
134 io_u->resid = io_u->xfer_buflen;
135 else if (!err) {
136 ssize_t retval = aio_return(&io_u->aiocb);
137
138 io_u->resid = io_u->xfer_buflen - retval;
139 } else
140 io_u->error = err;
Jens Axboe2866c822006-10-09 15:57:48 +0200141 }
142
143 if (r >= min)
144 return r;
145
146 if (have_timeout) {
147 unsigned long long usec;
148
149 usec = (t->tv_sec * 1000000) + (t->tv_nsec / 1000);
150 if (ts_utime_since_now(&start) > usec)
151 return r;
152 }
153
154 /*
Jens Axboe3c770372008-03-10 18:45:57 +0100155 * must have some in-flight, wait for at least one
Jens Axboe2866c822006-10-09 15:57:48 +0200156 */
Jens Axboee97c1442011-09-21 09:38:01 +0200157 aio_suspend((const os_aiocb_t * const *)suspend_list,
Jens Axboe3c770372008-03-10 18:45:57 +0100158 suspend_entries, t);
Jens Axboe2866c822006-10-09 15:57:48 +0200159 goto restart;
160}
161
162static struct io_u *fio_posixaio_event(struct thread_data *td, int event)
163{
164 struct posixaio_data *pd = td->io_ops->data;
165
166 return pd->aio_events[event];
167}
168
Bruce Cran03e20d62011-01-02 20:14:54 +0100169static int fio_posixaio_queue(struct thread_data *td,
Jens Axboe2866c822006-10-09 15:57:48 +0200170 struct io_u *io_u)
171{
Jens Axboe207cb0f2008-06-02 12:28:02 +0200172 struct posixaio_data *pd = td->io_ops->data;
Jens Axboee97c1442011-09-21 09:38:01 +0200173 os_aiocb_t *aiocb = &io_u->aiocb;
Jens Axboe2866c822006-10-09 15:57:48 +0200174 int ret;
175
Jens Axboe7101d9c2007-09-12 13:12:39 +0200176 fio_ro_check(td, io_u);
177
Jens Axboe2866c822006-10-09 15:57:48 +0200178 if (io_u->ddir == DDIR_READ)
179 ret = aio_read(aiocb);
Jens Axboe87dc1ab2006-10-24 14:41:26 +0200180 else if (io_u->ddir == DDIR_WRITE)
Jens Axboe2866c822006-10-09 15:57:48 +0200181 ret = aio_write(aiocb);
Jens Axboea5f30272010-07-19 16:19:55 -0600182 else if (io_u->ddir == DDIR_TRIM) {
183 if (pd->queued)
184 return FIO_Q_BUSY;
185
186 do_io_u_trim(td, io_u);
187 return FIO_Q_COMPLETED;
188 } else {
Jens Axboe67bf9822013-01-10 11:23:19 +0100189#ifdef CONFIG_POSIXAIO_FSYNC
Jens Axboe87dc1ab2006-10-24 14:41:26 +0200190 ret = aio_fsync(O_SYNC, aiocb);
Jens Axboe207cb0f2008-06-02 12:28:02 +0200191#else
192 if (pd->queued)
193 return FIO_Q_BUSY;
Jens Axboe2866c822006-10-09 15:57:48 +0200194
Jens Axboef0115312010-03-09 21:47:15 +0100195 do_io_u_sync(td, io_u);
Jens Axboe207cb0f2008-06-02 12:28:02 +0200196 return FIO_Q_COMPLETED;
197#endif
198 }
Jens Axboe4c057b32013-11-06 14:47:22 -0700199
Jens Axboe95bcd812007-02-11 01:01:57 +0100200 if (ret) {
Jens Axboe4c057b32013-11-06 14:47:22 -0700201 int aio_err = aio_error(aiocb);
202
Jens Axboeafa16402011-07-07 21:06:40 +0200203 /*
204 * At least OSX has a very low limit on the number of pending
Jens Axboedef1d8e2011-07-08 08:33:37 +0200205 * IOs, so if it returns EAGAIN, we are out of resources
206 * to queue more. Just return FIO_Q_BUSY to naturally
207 * drop off at this depth.
Jens Axboeafa16402011-07-07 21:06:40 +0200208 */
Jens Axboe4c057b32013-11-06 14:47:22 -0700209 if (aio_err == EAGAIN)
Jens Axboeafa16402011-07-07 21:06:40 +0200210 return FIO_Q_BUSY;
211
Jens Axboe4c057b32013-11-06 14:47:22 -0700212 io_u->error = aio_err;
Jens Axboee1161c32007-02-22 19:36:48 +0100213 td_verror(td, io_u->error, "xfer");
Jens Axboe36167d82007-02-18 05:41:31 +0100214 return FIO_Q_COMPLETED;
Jens Axboe95bcd812007-02-11 01:01:57 +0100215 }
Jens Axboe36167d82007-02-18 05:41:31 +0100216
Jens Axboe207cb0f2008-06-02 12:28:02 +0200217 pd->queued++;
Jens Axboe36167d82007-02-18 05:41:31 +0100218 return FIO_Q_QUEUED;
Jens Axboe2866c822006-10-09 15:57:48 +0200219}
220
221static void fio_posixaio_cleanup(struct thread_data *td)
222{
223 struct posixaio_data *pd = td->io_ops->data;
224
225 if (pd) {
226 free(pd->aio_events);
227 free(pd);
Jens Axboe2866c822006-10-09 15:57:48 +0200228 }
229}
230
231static int fio_posixaio_init(struct thread_data *td)
232{
233 struct posixaio_data *pd = malloc(sizeof(*pd));
234
Jens Axboecb781c72006-11-07 14:02:48 +0100235 memset(pd, 0, sizeof(*pd));
Jens Axboe2dc1bbe2007-03-15 15:01:33 +0100236 pd->aio_events = malloc(td->o.iodepth * sizeof(struct io_u *));
237 memset(pd->aio_events, 0, td->o.iodepth * sizeof(struct io_u *));
Jens Axboe2866c822006-10-09 15:57:48 +0200238
239 td->io_ops->data = pd;
240 return 0;
241}
242
Jens Axboe5f350952006-11-07 15:20:59 +0100243static struct ioengine_ops ioengine = {
Jens Axboe2866c822006-10-09 15:57:48 +0200244 .name = "posixaio",
245 .version = FIO_IOOPS_VERSION,
246 .init = fio_posixaio_init,
247 .prep = fio_posixaio_prep,
248 .queue = fio_posixaio_queue,
249 .cancel = fio_posixaio_cancel,
250 .getevents = fio_posixaio_getevents,
251 .event = fio_posixaio_event,
252 .cleanup = fio_posixaio_cleanup,
Jens Axboeb5af8292007-03-08 12:43:13 +0100253 .open_file = generic_open_file,
254 .close_file = generic_close_file,
Jens Axboedf9c26b2009-03-05 10:13:58 +0100255 .get_file_size = generic_get_file_size,
Jens Axboe2866c822006-10-09 15:57:48 +0200256};
Jens Axboe34cfcda2006-11-03 14:00:45 +0100257
Jens Axboe5f350952006-11-07 15:20:59 +0100258static void fio_init fio_posixaio_register(void)
259{
260 register_ioengine(&ioengine);
261}
262
263static void fio_exit fio_posixaio_unregister(void)
264{
265 unregister_ioengine(&ioengine);
266}