blob: 8f2c415d56a4a8aa6d61d2d25e2a279d436b88a3 [file] [log] [blame]
Jens Axboea4f4fdd2007-02-14 01:16:39 +01001/*
Jens Axboeda751ca2007-03-14 10:59:33 +01002 * syslet engine
3 *
4 * IO engine that does regular pread(2)/pwrite(2) to transfer data, but
5 * with syslets to make the execution async.
Jens Axboea4f4fdd2007-02-14 01:16:39 +01006 *
7 */
8#include <stdio.h>
9#include <stdlib.h>
10#include <unistd.h>
11#include <errno.h>
12#include <assert.h>
Jens Axboe12cbb462007-12-10 20:24:44 +010013#include <malloc.h>
Jens Axboeb8846352007-03-14 14:29:16 +010014#include <asm/unistd.h>
Jens Axboea4f4fdd2007-02-14 01:16:39 +010015
16#include "../fio.h"
Jens Axboe12cbb462007-12-10 20:24:44 +010017#include "../indirect.h"
18#include "../syslet.h"
Jens Axboea4f4fdd2007-02-14 01:16:39 +010019
20#ifdef FIO_HAVE_SYSLET
21
/*
 * Select the syscall numbers used for positional reads and writes: the
 * 64-bit variants when __NR_pread64 is defined, the plain ones otherwise.
 */
#if defined(__NR_pread64)
#define __NR_fio_pread		__NR_pread64
#define __NR_fio_pwrite		__NR_pwrite64
#else
#define __NR_fio_pread		__NR_pread
#define __NR_fio_pwrite		__NR_pwrite
#endif
29
/*
 * Private per-thread state of the syslet engine, stored in
 * td->io_ops->data by the init hook.
 */
struct syslet_data {
	/* io_us that completed and have not yet been handed back */
	struct io_u **events;
	/* number of valid entries in events[] */
	unsigned int nr_events;

	/* completion ring handed to the syslet syscalls */
	struct syslet_ring *ring;
	/* ring entry count minus one, used to wrap ring indexes */
	unsigned int ring_mask;
	/* stack buffer passed to fill_syslet_args() */
	void *stack;
};
38
Jens Axboec6effc32007-12-11 08:46:16 +010039static void fio_syslet_add_event(struct thread_data *td, struct io_u *io_u)
Jens Axboe9ff9de62007-02-23 13:21:45 +010040{
41 struct syslet_data *sd = td->io_ops->data;
Jens Axboe9ff9de62007-02-23 13:21:45 +010042
Jens Axboe12cbb462007-12-10 20:24:44 +010043 assert(sd->nr_events < td->o.iodepth);
44 sd->events[sd->nr_events++] = io_u;
Jens Axboe9ff9de62007-02-23 13:21:45 +010045}
46
Jens Axboec6effc32007-12-11 08:46:16 +010047static void fio_syslet_add_events(struct thread_data *td, unsigned int nr)
Jens Axboea4f4fdd2007-02-14 01:16:39 +010048{
49 struct syslet_data *sd = td->io_ops->data;
Jens Axboedb6defc2007-12-11 08:55:53 +010050 unsigned int i, uidx;
51
52 uidx = sd->ring->user_tail;
53 read_barrier();
Jens Axboea4f4fdd2007-02-14 01:16:39 +010054
Jens Axboe12cbb462007-12-10 20:24:44 +010055 for (i = 0; i < nr; i++) {
Jens Axboedb6defc2007-12-11 08:55:53 +010056 unsigned int idx = (i + uidx) & sd->ring_mask;
Jens Axboe12cbb462007-12-10 20:24:44 +010057 struct syslet_completion *comp = &sd->ring->comp[idx];
58 struct io_u *io_u = (struct io_u *) (long) comp->caller_data;
Jens Axboec6effc32007-12-11 08:46:16 +010059 long ret;
Jens Axboe12cbb462007-12-10 20:24:44 +010060
Jens Axboec6effc32007-12-11 08:46:16 +010061 ret = comp->status;
62 if (ret <= 0) {
63 io_u->resid = io_u->xfer_buflen;
64 io_u->error = -ret;
65 } else {
66 io_u->resid = io_u->xfer_buflen - ret;
67 io_u->error = 0;
68 }
69
70 fio_syslet_add_event(td, io_u);
Jens Axboe12cbb462007-12-10 20:24:44 +010071 }
72}
73
Jens Axboe12cbb462007-12-10 20:24:44 +010074static void fio_syslet_wait_for_events(struct thread_data *td)
75{
76 struct syslet_data *sd = td->io_ops->data;
77 struct syslet_ring *ring = sd->ring;
Jens Axboe12cbb462007-12-10 20:24:44 +010078
Jens Axboea4f4fdd2007-02-14 01:16:39 +010079 do {
Jens Axboe12cbb462007-12-10 20:24:44 +010080 unsigned int kh = ring->kernel_head;
81 int ret;
Jens Axboea4f4fdd2007-02-14 01:16:39 +010082
Jens Axboe12cbb462007-12-10 20:24:44 +010083 /*
84 * first reap events that are already completed
85 */
86 if (ring->user_tail != kh) {
87 unsigned int nr = kh - ring->user_tail;
Jens Axboea4f4fdd2007-02-14 01:16:39 +010088
Jens Axboec6effc32007-12-11 08:46:16 +010089 fio_syslet_add_events(td, nr);
Jens Axboe12cbb462007-12-10 20:24:44 +010090 ring->user_tail = kh;
Jens Axboe4a88edf2007-12-11 10:45:36 +010091 break;
Jens Axboe12cbb462007-12-10 20:24:44 +010092 }
Jens Axboea4f4fdd2007-02-14 01:16:39 +010093
Jens Axboe12cbb462007-12-10 20:24:44 +010094 /*
95 * block waiting for at least one event
96 */
97 ret = syscall(__NR_syslet_ring_wait, ring, ring->user_tail);
98 assert(!ret);
Jens Axboe4a88edf2007-12-11 10:45:36 +010099 } while (1);
Jens Axboea4f4fdd2007-02-14 01:16:39 +0100100}
101
Jens Axboee7d2e612007-12-11 10:49:39 +0100102static int fio_syslet_getevents(struct thread_data *td, unsigned int min,
103 unsigned int fio_unused max,
Jens Axboea4f4fdd2007-02-14 01:16:39 +0100104 struct timespec fio_unused *t)
105{
106 struct syslet_data *sd = td->io_ops->data;
Jens Axboea4f4fdd2007-02-14 01:16:39 +0100107 long ret;
108
Jens Axboe4a88edf2007-12-11 10:45:36 +0100109 /*
110 * While we have less events than requested, block waiting for them
111 */
112 while (sd->nr_events < (unsigned int) min)
Jens Axboe12cbb462007-12-10 20:24:44 +0100113 fio_syslet_wait_for_events(td);
Jens Axboea4f4fdd2007-02-14 01:16:39 +0100114
115 ret = sd->nr_events;
116 sd->nr_events = 0;
117 return ret;
118}
119
120static struct io_u *fio_syslet_event(struct thread_data *td, int event)
121{
122 struct syslet_data *sd = td->io_ops->data;
123
124 return sd->events[event];
125}
126
Jens Axboe12cbb462007-12-10 20:24:44 +0100127static void fio_syslet_prep_sync(struct fio_file *f,
128 struct indirect_registers *regs)
Jens Axboea4f4fdd2007-02-14 01:16:39 +0100129{
Jens Axboe12cbb462007-12-10 20:24:44 +0100130 FILL_IN(*regs, __NR_fsync, (long) f->fd);
Jens Axboea4f4fdd2007-02-14 01:16:39 +0100131}
132
Jens Axboe12cbb462007-12-10 20:24:44 +0100133static void fio_syslet_prep_rw(struct io_u *io_u, struct fio_file *f,
134 struct indirect_registers *regs)
Jens Axboea4f4fdd2007-02-14 01:16:39 +0100135{
Jens Axboe12cbb462007-12-10 20:24:44 +0100136 long nr;
Jens Axboea4f4fdd2007-02-14 01:16:39 +0100137
138 /*
Jens Axboea4f4fdd2007-02-14 01:16:39 +0100139 * prepare rw
140 */
141 if (io_u->ddir == DDIR_READ)
Jens Axboe1760e672007-03-14 20:41:42 +0100142 nr = __NR_fio_pread;
Jens Axboea4f4fdd2007-02-14 01:16:39 +0100143 else
Jens Axboe1760e672007-03-14 20:41:42 +0100144 nr = __NR_fio_pwrite;
Jens Axboea4f4fdd2007-02-14 01:16:39 +0100145
Jens Axboe12cbb462007-12-10 20:24:44 +0100146 FILL_IN(*regs, nr, (long) f->fd, (long) io_u->xfer_buf,
147 (long) io_u->xfer_buflen, (long) io_u->offset);
Jens Axboea4f4fdd2007-02-14 01:16:39 +0100148}
149
Jens Axboe12cbb462007-12-10 20:24:44 +0100150static void fio_syslet_prep(struct io_u *io_u, struct indirect_registers *regs)
Jens Axboea4f4fdd2007-02-14 01:16:39 +0100151{
152 struct fio_file *f = io_u->file;
153
154 if (io_u->ddir == DDIR_SYNC)
Jens Axboe12cbb462007-12-10 20:24:44 +0100155 fio_syslet_prep_sync(f, regs);
Jens Axboea4f4fdd2007-02-14 01:16:39 +0100156 else
Jens Axboe12cbb462007-12-10 20:24:44 +0100157 fio_syslet_prep_rw(io_u, f, regs);
Jens Axboea4f4fdd2007-02-14 01:16:39 +0100158}
159
/*
 * Function handed to fill_syslet_args(); all it does is issue the raw
 * exit syscall.
 */
static void ret_func(void)
{
	(void) syscall(__NR_exit);
}
Ingo Molnarbf0dc8f2007-02-21 23:25:44 +0100164
Jens Axboe9ff9de62007-02-23 13:21:45 +0100165static int fio_syslet_queue(struct thread_data *td, struct io_u *io_u)
166{
167 struct syslet_data *sd = td->io_ops->data;
Jens Axboe12cbb462007-12-10 20:24:44 +0100168 union indirect_params params;
169 struct indirect_registers regs;
170 int ret;
Jens Axboea4f4fdd2007-02-14 01:16:39 +0100171
Jens Axboe7101d9c2007-09-12 13:12:39 +0200172 fio_ro_check(td, io_u);
173
Jens Axboe12cbb462007-12-10 20:24:44 +0100174 memset(&params, 0, sizeof(params));
175 fill_syslet_args(&params.syslet, sd->ring, (long)io_u, ret_func, sd->stack);
Jens Axboe9ff9de62007-02-23 13:21:45 +0100176
Jens Axboe12cbb462007-12-10 20:24:44 +0100177 fio_syslet_prep(io_u, &regs);
Jens Axboea4f4fdd2007-02-14 01:16:39 +0100178
Jens Axboe12cbb462007-12-10 20:24:44 +0100179 ret = syscall(__NR_indirect, &regs, &params, sizeof(params), 0);
180 if (ret == (int) io_u->xfer_buflen) {
181 /*
182 * completed sync, account. this also catches fsync().
183 */
184 return FIO_Q_COMPLETED;
185 } else if (ret < 0) {
186 /*
187 * queued for async execution
188 */
189 if (errno == ESYSLETPENDING)
190 return FIO_Q_QUEUED;
191 }
Jens Axboea4f4fdd2007-02-14 01:16:39 +0100192
Jens Axboe12cbb462007-12-10 20:24:44 +0100193 io_u->error = errno;
194 td_verror(td, io_u->error, "xfer");
195 return FIO_Q_COMPLETED;
Jens Axboea4f4fdd2007-02-14 01:16:39 +0100196}
197
Jens Axboe76f58b92007-03-29 13:26:17 +0200198static int check_syslet_support(struct syslet_data *sd)
199{
Jens Axboe12cbb462007-12-10 20:24:44 +0100200 union indirect_params params;
201 struct indirect_registers regs;
202 pid_t pid, my_pid = getpid();
Jens Axboe76f58b92007-03-29 13:26:17 +0200203
Jens Axboe12cbb462007-12-10 20:24:44 +0100204 memset(&params, 0, sizeof(params));
205 fill_syslet_args(&params.syslet, sd->ring, 0, ret_func, sd->stack);
Jens Axboe76f58b92007-03-29 13:26:17 +0200206
Jens Axboe12cbb462007-12-10 20:24:44 +0100207 FILL_IN(regs, __NR_getpid);
208
209 pid = syscall(__NR_indirect, &regs, &params, sizeof(params), 0);
210 if (pid == my_pid)
211 return 0;
212
213 return 1;
Jens Axboe76f58b92007-03-29 13:26:17 +0200214}
215
Jens Axboea4f4fdd2007-02-14 01:16:39 +0100216static void fio_syslet_cleanup(struct thread_data *td)
217{
218 struct syslet_data *sd = td->io_ops->data;
219
220 if (sd) {
Jens Axboea4f4fdd2007-02-14 01:16:39 +0100221 free(sd->events);
Jens Axboe12cbb462007-12-10 20:24:44 +0100222 free(sd->ring);
223 free(sd->stack);
Jens Axboea4f4fdd2007-02-14 01:16:39 +0100224 free(sd);
225 td->io_ops->data = NULL;
226 }
227}
228
229static int fio_syslet_init(struct thread_data *td)
230{
231 struct syslet_data *sd;
Jens Axboee81f7342007-12-10 20:35:10 +0100232 void *ring = NULL, *stack = NULL;
Jens Axboe05f6a172007-12-11 08:22:53 +0100233 unsigned int ring_size, ring_nr;
Jens Axboea4f4fdd2007-02-14 01:16:39 +0100234
235 sd = malloc(sizeof(*sd));
236 memset(sd, 0, sizeof(*sd));
Jens Axboe12cbb462007-12-10 20:24:44 +0100237
Jens Axboe2dc1bbe2007-03-15 15:01:33 +0100238 sd->events = malloc(sizeof(struct io_u *) * td->o.iodepth);
239 memset(sd->events, 0, sizeof(struct io_u *) * td->o.iodepth);
Jens Axboe05f6a172007-12-11 08:22:53 +0100240
241 /*
242 * The ring needs to be a power-of-2, so round it up if we have to
243 */
244 ring_nr = td->o.iodepth;
245 if (ring_nr & (ring_nr - 1)) {
246 int bits = 1;
247
248 while (ring_nr >>= 1)
249 bits++;
250
251 ring_nr = 1 << bits;
252 }
253
254 ring_size = sizeof(struct syslet_ring) +
255 ring_nr * sizeof(struct syslet_completion);
256 if (posix_memalign(&ring, sizeof(uint64_t), ring_size))
Jens Axboee81f7342007-12-10 20:35:10 +0100257 goto err_mem;
Jens Axboe12cbb462007-12-10 20:24:44 +0100258 if (posix_memalign(&stack, page_size, page_size))
Jens Axboee81f7342007-12-10 20:35:10 +0100259 goto err_mem;
Jens Axboe12cbb462007-12-10 20:24:44 +0100260
261 sd->ring = ring;
Jens Axboedb6defc2007-12-11 08:55:53 +0100262 sd->ring_mask = ring_nr - 1;
Jens Axboe12cbb462007-12-10 20:24:44 +0100263 sd->stack = stack;
264
Jens Axboe05f6a172007-12-11 08:22:53 +0100265 memset(sd->ring, 0, ring_size);
266 sd->ring->elements = ring_nr;
Jens Axboedb64e9b2007-02-14 02:10:59 +0100267
Jens Axboee81f7342007-12-10 20:35:10 +0100268 if (!check_syslet_support(sd)) {
269 td->io_ops->data = sd;
270 return 0;
Jens Axboe76f58b92007-03-29 13:26:17 +0200271 }
272
Jens Axboee81f7342007-12-10 20:35:10 +0100273 log_err("fio: syslets do not appear to work\n");
274err_mem:
275 free(sd->events);
276 if (ring)
277 free(ring);
278 if (stack)
279 free(stack);
280 free(sd);
281 return 1;
Jens Axboea4f4fdd2007-02-14 01:16:39 +0100282}
283
284static struct ioengine_ops ioengine = {
285 .name = "syslet-rw",
286 .version = FIO_IOOPS_VERSION,
287 .init = fio_syslet_init,
Jens Axboea4f4fdd2007-02-14 01:16:39 +0100288 .queue = fio_syslet_queue,
Jens Axboea4f4fdd2007-02-14 01:16:39 +0100289 .getevents = fio_syslet_getevents,
290 .event = fio_syslet_event,
291 .cleanup = fio_syslet_cleanup,
Jens Axboeb5af8292007-03-08 12:43:13 +0100292 .open_file = generic_open_file,
293 .close_file = generic_close_file,
Jens Axboea4f4fdd2007-02-14 01:16:39 +0100294};
295
296#else /* FIO_HAVE_SYSLET */
297
/*
 * When we have a proper configure system in place, we simply won't build
 * and install this io engine. For now install a crippled version that
 * just complains and fails to load.
 */
303static int fio_syslet_init(struct thread_data fio_unused *td)
304{
305 fprintf(stderr, "fio: syslet not available\n");
306 return 1;
307}
308
309static struct ioengine_ops ioengine = {
310 .name = "syslet-rw",
311 .version = FIO_IOOPS_VERSION,
312 .init = fio_syslet_init,
313};
314
315#endif /* FIO_HAVE_SYSLET */
316
317static void fio_init fio_syslet_register(void)
318{
319 register_ioengine(&ioengine);
320}
321
322static void fio_exit fio_syslet_unregister(void)
323{
324 unregister_ioengine(&ioengine);
325}