blob: 7bb1be83618959ee5b7a87ec8e79bdfbbfb095a2 [file] [log] [blame]
/*
 * syslet engine
 *
 * IO engine that does regular pread(2)/pwrite(2) to transfer data, but
 * with syslets to make the execution async.
 *
 */
8#include <stdio.h>
9#include <stdlib.h>
10#include <unistd.h>
11#include <errno.h>
12#include <assert.h>
Jens Axboe12cbb462007-12-10 20:24:44 +010013#include <malloc.h>
Jens Axboeb8846352007-03-14 14:29:16 +010014#include <asm/unistd.h>
Jens Axboea4f4fdd2007-02-14 01:16:39 +010015
16#include "../fio.h"
Jens Axboe12cbb462007-12-10 20:24:44 +010017#include "../indirect.h"
18#include "../syslet.h"
Jens Axboee6026f92007-12-12 19:39:59 +010019#include "../fls.h"
Jens Axboea4f4fdd2007-02-14 01:16:39 +010020
21#ifdef FIO_HAVE_SYSLET
22
/*
 * Pick the syscall numbers used for positional reads and writes: use the
 * 64-bit variants when the platform headers define __NR_pread64, and the
 * plain ones otherwise.
 */
#ifndef __NR_pread64
#define __NR_fio_pread		__NR_pread
#define __NR_fio_pwrite		__NR_pwrite
#else
#define __NR_fio_pread		__NR_pread64
#define __NR_fio_pwrite		__NR_pwrite64
#endif
30
/*
 * Per-thread private state of the syslet engine.
 */
struct syslet_data {
	/* reaped io_u's waiting to be handed back via ->event() */
	struct io_u **events;
	/* number of valid entries in events[] */
	unsigned int nr_events;

	/* completion ring handed to the syslet syscalls */
	struct syslet_ring *ring;
	/* number of ring entries minus one, used to wrap ring indices */
	unsigned int ring_mask;
	/* stack buffer handed to fill_syslet_args() along with the ring */
	void *stack;
};
39
Jens Axboec6effc32007-12-11 08:46:16 +010040static void fio_syslet_add_event(struct thread_data *td, struct io_u *io_u)
Jens Axboe9ff9de62007-02-23 13:21:45 +010041{
42 struct syslet_data *sd = td->io_ops->data;
Jens Axboe9ff9de62007-02-23 13:21:45 +010043
Jens Axboe12cbb462007-12-10 20:24:44 +010044 assert(sd->nr_events < td->o.iodepth);
45 sd->events[sd->nr_events++] = io_u;
Jens Axboe9ff9de62007-02-23 13:21:45 +010046}
47
Jens Axboec6effc32007-12-11 08:46:16 +010048static void fio_syslet_add_events(struct thread_data *td, unsigned int nr)
Jens Axboea4f4fdd2007-02-14 01:16:39 +010049{
50 struct syslet_data *sd = td->io_ops->data;
Jens Axboedb6defc2007-12-11 08:55:53 +010051 unsigned int i, uidx;
52
53 uidx = sd->ring->user_tail;
54 read_barrier();
Jens Axboea4f4fdd2007-02-14 01:16:39 +010055
Jens Axboe12cbb462007-12-10 20:24:44 +010056 for (i = 0; i < nr; i++) {
Jens Axboedb6defc2007-12-11 08:55:53 +010057 unsigned int idx = (i + uidx) & sd->ring_mask;
Jens Axboe12cbb462007-12-10 20:24:44 +010058 struct syslet_completion *comp = &sd->ring->comp[idx];
59 struct io_u *io_u = (struct io_u *) (long) comp->caller_data;
Jens Axboec6effc32007-12-11 08:46:16 +010060 long ret;
Jens Axboe12cbb462007-12-10 20:24:44 +010061
Jens Axboec6effc32007-12-11 08:46:16 +010062 ret = comp->status;
63 if (ret <= 0) {
64 io_u->resid = io_u->xfer_buflen;
65 io_u->error = -ret;
66 } else {
67 io_u->resid = io_u->xfer_buflen - ret;
68 io_u->error = 0;
69 }
70
71 fio_syslet_add_event(td, io_u);
Jens Axboe12cbb462007-12-10 20:24:44 +010072 }
73}
74
Jens Axboe12cbb462007-12-10 20:24:44 +010075static void fio_syslet_wait_for_events(struct thread_data *td)
76{
77 struct syslet_data *sd = td->io_ops->data;
78 struct syslet_ring *ring = sd->ring;
Jens Axboe12cbb462007-12-10 20:24:44 +010079
Jens Axboea4f4fdd2007-02-14 01:16:39 +010080 do {
Jens Axboe12cbb462007-12-10 20:24:44 +010081 unsigned int kh = ring->kernel_head;
82 int ret;
Jens Axboea4f4fdd2007-02-14 01:16:39 +010083
Jens Axboe12cbb462007-12-10 20:24:44 +010084 /*
85 * first reap events that are already completed
86 */
87 if (ring->user_tail != kh) {
88 unsigned int nr = kh - ring->user_tail;
Jens Axboea4f4fdd2007-02-14 01:16:39 +010089
Jens Axboec6effc32007-12-11 08:46:16 +010090 fio_syslet_add_events(td, nr);
Jens Axboe12cbb462007-12-10 20:24:44 +010091 ring->user_tail = kh;
Jens Axboe4a88edf2007-12-11 10:45:36 +010092 break;
Jens Axboe12cbb462007-12-10 20:24:44 +010093 }
Jens Axboea4f4fdd2007-02-14 01:16:39 +010094
Jens Axboe12cbb462007-12-10 20:24:44 +010095 /*
96 * block waiting for at least one event
97 */
98 ret = syscall(__NR_syslet_ring_wait, ring, ring->user_tail);
99 assert(!ret);
Jens Axboe4a88edf2007-12-11 10:45:36 +0100100 } while (1);
Jens Axboea4f4fdd2007-02-14 01:16:39 +0100101}
102
Jens Axboee7d2e612007-12-11 10:49:39 +0100103static int fio_syslet_getevents(struct thread_data *td, unsigned int min,
104 unsigned int fio_unused max,
Jens Axboea4f4fdd2007-02-14 01:16:39 +0100105 struct timespec fio_unused *t)
106{
107 struct syslet_data *sd = td->io_ops->data;
Jens Axboea4f4fdd2007-02-14 01:16:39 +0100108 long ret;
109
Jens Axboe4a88edf2007-12-11 10:45:36 +0100110 /*
111 * While we have less events than requested, block waiting for them
Jens Axboea3cc7702007-12-11 13:23:27 +0100112 * (if we have to, there may already be more completed events ready
113 * for us - see fio_syslet_wait_for_events()
Jens Axboe4a88edf2007-12-11 10:45:36 +0100114 */
Jens Axboea3cc7702007-12-11 13:23:27 +0100115 while (sd->nr_events < min)
Jens Axboe12cbb462007-12-10 20:24:44 +0100116 fio_syslet_wait_for_events(td);
Jens Axboea4f4fdd2007-02-14 01:16:39 +0100117
118 ret = sd->nr_events;
119 sd->nr_events = 0;
120 return ret;
121}
122
123static struct io_u *fio_syslet_event(struct thread_data *td, int event)
124{
125 struct syslet_data *sd = td->io_ops->data;
126
127 return sd->events[event];
128}
129
Jens Axboe12cbb462007-12-10 20:24:44 +0100130static void fio_syslet_prep_sync(struct fio_file *f,
131 struct indirect_registers *regs)
Jens Axboea4f4fdd2007-02-14 01:16:39 +0100132{
Jens Axboe12cbb462007-12-10 20:24:44 +0100133 FILL_IN(*regs, __NR_fsync, (long) f->fd);
Jens Axboea4f4fdd2007-02-14 01:16:39 +0100134}
135
Jens Axboe12cbb462007-12-10 20:24:44 +0100136static void fio_syslet_prep_rw(struct io_u *io_u, struct fio_file *f,
137 struct indirect_registers *regs)
Jens Axboea4f4fdd2007-02-14 01:16:39 +0100138{
Jens Axboe12cbb462007-12-10 20:24:44 +0100139 long nr;
Jens Axboea4f4fdd2007-02-14 01:16:39 +0100140
141 /*
Jens Axboea4f4fdd2007-02-14 01:16:39 +0100142 * prepare rw
143 */
144 if (io_u->ddir == DDIR_READ)
Jens Axboe1760e672007-03-14 20:41:42 +0100145 nr = __NR_fio_pread;
Jens Axboea4f4fdd2007-02-14 01:16:39 +0100146 else
Jens Axboe1760e672007-03-14 20:41:42 +0100147 nr = __NR_fio_pwrite;
Jens Axboea4f4fdd2007-02-14 01:16:39 +0100148
Jens Axboe12cbb462007-12-10 20:24:44 +0100149 FILL_IN(*regs, nr, (long) f->fd, (long) io_u->xfer_buf,
150 (long) io_u->xfer_buflen, (long) io_u->offset);
Jens Axboea4f4fdd2007-02-14 01:16:39 +0100151}
152
Jens Axboe12cbb462007-12-10 20:24:44 +0100153static void fio_syslet_prep(struct io_u *io_u, struct indirect_registers *regs)
Jens Axboea4f4fdd2007-02-14 01:16:39 +0100154{
155 struct fio_file *f = io_u->file;
156
157 if (io_u->ddir == DDIR_SYNC)
Jens Axboe12cbb462007-12-10 20:24:44 +0100158 fio_syslet_prep_sync(f, regs);
Jens Axboea4f4fdd2007-02-14 01:16:39 +0100159 else
Jens Axboe12cbb462007-12-10 20:24:44 +0100160 fio_syslet_prep_rw(io_u, f, regs);
Jens Axboea4f4fdd2007-02-14 01:16:39 +0100161}
162
/*
 * Function handed to fill_syslet_args() together with the syslet stack;
 * it terminates the calling thread through the raw exit syscall.
 *
 * The exit syscall takes a status argument. Pass an explicit 0 rather
 * than leaving the argument register holding an unspecified value.
 */
static void ret_func(void)
{
	syscall(__NR_exit, 0);
}
Ingo Molnarbf0dc8f2007-02-21 23:25:44 +0100167
Jens Axboe9ff9de62007-02-23 13:21:45 +0100168static int fio_syslet_queue(struct thread_data *td, struct io_u *io_u)
169{
170 struct syslet_data *sd = td->io_ops->data;
Jens Axboe12cbb462007-12-10 20:24:44 +0100171 union indirect_params params;
172 struct indirect_registers regs;
173 int ret;
Jens Axboea4f4fdd2007-02-14 01:16:39 +0100174
Jens Axboe7101d9c2007-09-12 13:12:39 +0200175 fio_ro_check(td, io_u);
176
Jens Axboe12cbb462007-12-10 20:24:44 +0100177 memset(&params, 0, sizeof(params));
178 fill_syslet_args(&params.syslet, sd->ring, (long)io_u, ret_func, sd->stack);
Jens Axboe9ff9de62007-02-23 13:21:45 +0100179
Jens Axboe12cbb462007-12-10 20:24:44 +0100180 fio_syslet_prep(io_u, &regs);
Jens Axboea4f4fdd2007-02-14 01:16:39 +0100181
Jens Axboe12cbb462007-12-10 20:24:44 +0100182 ret = syscall(__NR_indirect, &regs, &params, sizeof(params), 0);
183 if (ret == (int) io_u->xfer_buflen) {
184 /*
185 * completed sync, account. this also catches fsync().
186 */
187 return FIO_Q_COMPLETED;
188 } else if (ret < 0) {
189 /*
190 * queued for async execution
191 */
192 if (errno == ESYSLETPENDING)
193 return FIO_Q_QUEUED;
194 }
Jens Axboea4f4fdd2007-02-14 01:16:39 +0100195
Jens Axboe12cbb462007-12-10 20:24:44 +0100196 io_u->error = errno;
197 td_verror(td, io_u->error, "xfer");
198 return FIO_Q_COMPLETED;
Jens Axboea4f4fdd2007-02-14 01:16:39 +0100199}
200
Jens Axboe76f58b92007-03-29 13:26:17 +0200201static int check_syslet_support(struct syslet_data *sd)
202{
Jens Axboe12cbb462007-12-10 20:24:44 +0100203 union indirect_params params;
204 struct indirect_registers regs;
205 pid_t pid, my_pid = getpid();
Jens Axboe76f58b92007-03-29 13:26:17 +0200206
Jens Axboe12cbb462007-12-10 20:24:44 +0100207 memset(&params, 0, sizeof(params));
208 fill_syslet_args(&params.syslet, sd->ring, 0, ret_func, sd->stack);
Jens Axboe76f58b92007-03-29 13:26:17 +0200209
Jens Axboe12cbb462007-12-10 20:24:44 +0100210 FILL_IN(regs, __NR_getpid);
211
212 pid = syscall(__NR_indirect, &regs, &params, sizeof(params), 0);
213 if (pid == my_pid)
214 return 0;
215
216 return 1;
Jens Axboe76f58b92007-03-29 13:26:17 +0200217}
218
Jens Axboea4f4fdd2007-02-14 01:16:39 +0100219static void fio_syslet_cleanup(struct thread_data *td)
220{
221 struct syslet_data *sd = td->io_ops->data;
222
223 if (sd) {
Jens Axboea4f4fdd2007-02-14 01:16:39 +0100224 free(sd->events);
Jens Axboe12cbb462007-12-10 20:24:44 +0100225 free(sd->ring);
Jens Axboea4f4fdd2007-02-14 01:16:39 +0100226 free(sd);
227 td->io_ops->data = NULL;
228 }
229}
230
231static int fio_syslet_init(struct thread_data *td)
232{
233 struct syslet_data *sd;
Jens Axboee81f7342007-12-10 20:35:10 +0100234 void *ring = NULL, *stack = NULL;
Jens Axboe05f6a172007-12-11 08:22:53 +0100235 unsigned int ring_size, ring_nr;
Jens Axboea4f4fdd2007-02-14 01:16:39 +0100236
237 sd = malloc(sizeof(*sd));
238 memset(sd, 0, sizeof(*sd));
Jens Axboe12cbb462007-12-10 20:24:44 +0100239
Jens Axboe2dc1bbe2007-03-15 15:01:33 +0100240 sd->events = malloc(sizeof(struct io_u *) * td->o.iodepth);
241 memset(sd->events, 0, sizeof(struct io_u *) * td->o.iodepth);
Jens Axboe05f6a172007-12-11 08:22:53 +0100242
243 /*
244 * The ring needs to be a power-of-2, so round it up if we have to
245 */
246 ring_nr = td->o.iodepth;
Jens Axboee6026f92007-12-12 19:39:59 +0100247 if (ring_nr & (ring_nr - 1))
248 ring_nr = 1 << fls(ring_nr);
Jens Axboe05f6a172007-12-11 08:22:53 +0100249
250 ring_size = sizeof(struct syslet_ring) +
251 ring_nr * sizeof(struct syslet_completion);
252 if (posix_memalign(&ring, sizeof(uint64_t), ring_size))
Jens Axboee81f7342007-12-10 20:35:10 +0100253 goto err_mem;
Jens Axboe12cbb462007-12-10 20:24:44 +0100254 if (posix_memalign(&stack, page_size, page_size))
Jens Axboee81f7342007-12-10 20:35:10 +0100255 goto err_mem;
Jens Axboe12cbb462007-12-10 20:24:44 +0100256
257 sd->ring = ring;
Jens Axboedb6defc2007-12-11 08:55:53 +0100258 sd->ring_mask = ring_nr - 1;
Jens Axboe12cbb462007-12-10 20:24:44 +0100259 sd->stack = stack;
260
Jens Axboe05f6a172007-12-11 08:22:53 +0100261 memset(sd->ring, 0, ring_size);
262 sd->ring->elements = ring_nr;
Jens Axboedb64e9b2007-02-14 02:10:59 +0100263
Jens Axboee81f7342007-12-10 20:35:10 +0100264 if (!check_syslet_support(sd)) {
265 td->io_ops->data = sd;
266 return 0;
Jens Axboe76f58b92007-03-29 13:26:17 +0200267 }
268
Jens Axboee81f7342007-12-10 20:35:10 +0100269 log_err("fio: syslets do not appear to work\n");
270err_mem:
271 free(sd->events);
272 if (ring)
273 free(ring);
274 if (stack)
275 free(stack);
276 free(sd);
277 return 1;
Jens Axboea4f4fdd2007-02-14 01:16:39 +0100278}
279
280static struct ioengine_ops ioengine = {
281 .name = "syslet-rw",
282 .version = FIO_IOOPS_VERSION,
283 .init = fio_syslet_init,
Jens Axboea4f4fdd2007-02-14 01:16:39 +0100284 .queue = fio_syslet_queue,
Jens Axboea4f4fdd2007-02-14 01:16:39 +0100285 .getevents = fio_syslet_getevents,
286 .event = fio_syslet_event,
287 .cleanup = fio_syslet_cleanup,
Jens Axboeb5af8292007-03-08 12:43:13 +0100288 .open_file = generic_open_file,
289 .close_file = generic_close_file,
Jens Axboea4f4fdd2007-02-14 01:16:39 +0100290};
291
292#else /* FIO_HAVE_SYSLET */
293
294/*
295 * When we have a proper configure system in place, we simply wont build
296 * and install this io engine. For now install a crippled version that
297 * just complains and fails to load.
298 */
299static int fio_syslet_init(struct thread_data fio_unused *td)
300{
301 fprintf(stderr, "fio: syslet not available\n");
302 return 1;
303}
304
305static struct ioengine_ops ioengine = {
306 .name = "syslet-rw",
307 .version = FIO_IOOPS_VERSION,
308 .init = fio_syslet_init,
309};
310
311#endif /* FIO_HAVE_SYSLET */
312
313static void fio_init fio_syslet_register(void)
314{
315 register_ioengine(&ioengine);
316}
317
318static void fio_exit fio_syslet_unregister(void)
319{
320 unregister_ioengine(&ioengine);
321}