blob: c94062279989285ed20a0326e2297f86bf94029b [file] [log] [blame]
#include <stdio.h>
#include <stdlib.h>
#include <unistd.h>
#include <fcntl.h>
#include <ctype.h>
#include <string.h>
#include <errno.h>
#include <sys/ipc.h>
#include <sys/shm.h>
#include <sys/types.h>
#include <sys/stat.h>
#include "fio.h"
#define DEF_BS (4096)
#define DEF_TIMEOUT (0)
#define DEF_RATE_CYCLE (1000)
#define DEF_ODIRECT (1)
#define DEF_IO_ENGINE (FIO_SYNCIO)
#define DEF_IO_ENGINE_NAME "sync"
#define DEF_SEQUENTIAL (1)
#define DEF_RAND_REPEAT (1)
#define DEF_OVERWRITE (1)
#define DEF_CREATE (1)
#define DEF_INVALIDATE (1)
#define DEF_SYNCIO (0)
#define DEF_RANDSEED (0xb1899bedUL)
#define DEF_BWAVGTIME (500)
#define DEF_CREATE_SER (1)
#define DEF_CREATE_FSYNC (1)
#define DEF_LOOPS (1)
#define DEF_VERIFY (0)
#define DEF_STONEWALL (0)
#define DEF_NUMJOBS (1)
#define DEF_USE_THREAD (0)
#define DEF_FILE_SIZE (1024 * 1024 * 1024UL)
#define DEF_ZONE_SIZE (0)
#define DEF_ZONE_SKIP (0)
static char fio_version_string[] = "fio 1.1";
static int repeatable = DEF_RAND_REPEAT;
static char *ini_file;
static int max_jobs = MAX_JOBS;
struct thread_data def_thread;
struct thread_data *threads = NULL;
int rate_quit = 0;
int write_lat_log = 0;
int write_bw_log = 0;
int exitall_on_terminate = 0;
static int setup_rate(struct thread_data *td)
{
int nr_reads_per_sec;
if (!td->rate)
return 0;
if (td->rate < td->ratemin) {
fprintf(stderr, "min rate larger than nominal rate\n");
return -1;
}
nr_reads_per_sec = (td->rate * 1024) / td->min_bs;
td->rate_usec_cycle = 1000000 / nr_reads_per_sec;
td->rate_pending_usleep = 0;
return 0;
}
static void setup_log(struct io_log **log)
{
struct io_log *l = malloc(sizeof(*l));
l->nr_samples = 0;
l->max_samples = 1024;
l->log = malloc(l->max_samples * sizeof(struct io_sample));
*log = l;
}
void finish_log(struct thread_data *td, struct io_log *log, const char *name)
{
char file_name[128];
FILE *f;
unsigned int i;
sprintf(file_name, "client%d_%s.log", td->thread_number, name);
f = fopen(file_name, "w");
if (!f) {
perror("fopen log");
return;
}
for (i = 0; i < log->nr_samples; i++)
fprintf(f, "%lu, %lu, %u\n", log->log[i].time, log->log[i].val, log->log[i].ddir);
fclose(f);
free(log->log);
free(log);
}
static struct thread_data *get_new_job(int global, struct thread_data *parent)
{
struct thread_data *td;
if (global)
return &def_thread;
if (thread_number >= max_jobs)
return NULL;
td = &threads[thread_number++];
memset(td, 0, sizeof(*td));
td->fd = -1;
td->thread_number = thread_number;
td->ddir = parent->ddir;
td->ioprio = parent->ioprio;
td->sequential = parent->sequential;
td->bs = parent->bs;
td->min_bs = parent->min_bs;
td->max_bs = parent->max_bs;
td->odirect = parent->odirect;
td->thinktime = parent->thinktime;
td->fsync_blocks = parent->fsync_blocks;
td->start_delay = parent->start_delay;
td->timeout = parent->timeout;
td->io_engine = parent->io_engine;
td->create_file = parent->create_file;
td->overwrite = parent->overwrite;
td->invalidate_cache = parent->invalidate_cache;
td->file_size = parent->file_size;
td->file_offset = parent->file_offset;
td->zone_size = parent->zone_size;
td->zone_skip = parent->zone_skip;
td->rate = parent->rate;
td->ratemin = parent->ratemin;
td->ratecycle = parent->ratecycle;
td->iodepth = parent->iodepth;
td->sync_io = parent->sync_io;
td->mem_type = parent->mem_type;
td->bw_avg_time = parent->bw_avg_time;
td->create_serialize = parent->create_serialize;
td->create_fsync = parent->create_fsync;
td->loops = parent->loops;
td->verify = parent->verify;
td->stonewall = parent->stonewall;
td->numjobs = parent->numjobs;
td->use_thread = parent->use_thread;
td->do_disk_util = parent->do_disk_util;
memcpy(&td->cpumask, &parent->cpumask, sizeof(td->cpumask));
strcpy(td->io_engine_name, parent->io_engine_name);
return td;
}
static void put_job(struct thread_data *td)
{
memset(&threads[td->thread_number - 1], 0, sizeof(*td));
thread_number--;
}
static int add_job(struct thread_data *td, const char *jobname, int prioclass,
int prio)
{
char *ddir_str[] = { "read", "write", "randread", "randwrite" };
struct stat sb;
int numjobs, ddir;
#ifndef FIO_HAVE_LIBAIO
if (td->io_engine == FIO_LIBAIO) {
fprintf(stderr, "Linux libaio not available\n");
return 1;
}
#endif
#ifndef FIO_HAVE_POSIXAIO
if (td->io_engine == FIO_POSIXAIO) {
fprintf(stderr, "posix aio not available\n");
return 1;
}
#endif
#ifdef FIO_HAVE_IOPRIO
td->ioprio = (prioclass << IOPRIO_CLASS_SHIFT) | prio;
#endif
/*
* the def_thread is just for options, it's not a real job
*/
if (td == &def_thread)
return 0;
if (td->io_engine & FIO_SYNCIO)
td->iodepth = 1;
else {
if (!td->iodepth)
td->iodepth = 1;
}
/*
* only really works for sequential io for now
*/
if (td->zone_size && !td->sequential)
td->zone_size = 0;
td->filetype = FIO_TYPE_FILE;
if (!stat(jobname, &sb)) {
if (S_ISBLK(sb.st_mode))
td->filetype = FIO_TYPE_BD;
else if (S_ISCHR(sb.st_mode))
td->filetype = FIO_TYPE_CHAR;
}
if (td->filetype == FIO_TYPE_FILE) {
if (td->directory[0] != '\0')
sprintf(td->file_name, "%s/%s.%d", td->directory, jobname, td->thread_number);
else
sprintf(td->file_name, "%s.%d", jobname, td->thread_number);
} else
strcpy(td->file_name, jobname);
sem_init(&td->mutex, 0, 0);
td->clat_stat[0].min_val = td->clat_stat[1].min_val = ULONG_MAX;
td->slat_stat[0].min_val = td->slat_stat[1].min_val = ULONG_MAX;
td->bw_stat[0].min_val = td->bw_stat[1].min_val = ULONG_MAX;
if (td->min_bs == -1U)
td->min_bs = td->bs;
if (td->max_bs == -1U)
td->max_bs = td->bs;
if (td_read(td))
td->verify = 0;
if (td->stonewall && td->thread_number > 1)
groupid++;
td->groupid = groupid;
if (setup_rate(td))
goto err;
if (write_lat_log) {
setup_log(&td->slat_log);
setup_log(&td->clat_log);
}
if (write_bw_log)
setup_log(&td->bw_log);
ddir = td->ddir + (!td->sequential << 1);
printf("Client%d (g=%d): rw=%s, prio=%d/%d, odir=%d, bs=%d-%d, rate=%d, ioengine=%s, iodepth=%d\n", td->thread_number, td->groupid, ddir_str[ddir], prioclass, prio, td->odirect, td->min_bs, td->max_bs, td->rate, td->io_engine_name, td->iodepth);
/*
* recurse add identical jobs, clear numjobs and stonewall options
* as they don't apply to sub-jobs
*/
numjobs = td->numjobs;
while (--numjobs) {
struct thread_data *td_new = get_new_job(0, td);
if (!td_new)
goto err;
td_new->numjobs = 1;
td_new->stonewall = 0;
if (add_job(td_new, jobname, prioclass, prio))
goto err;
}
return 0;
err:
put_job(td);
return -1;
}
int init_random_state(struct thread_data *td)
{
unsigned long seed;
int fd, num_maps, blocks;
fd = open("/dev/random", O_RDONLY);
if (fd == -1) {
td_verror(td, errno);
return 1;
}
if (read(fd, &seed, sizeof(seed)) < (int) sizeof(seed)) {
td_verror(td, EIO);
close(fd);
return 1;
}
close(fd);
srand48_r(seed, &td->bsrange_state);
srand48_r(seed, &td->verify_state);
if (td->sequential)
return 0;
if (repeatable)
seed = DEF_RANDSEED;
blocks = (td->io_size + td->min_bs - 1) / td->min_bs;
num_maps = blocks / BLOCKS_PER_MAP;
td->file_map = malloc(num_maps * sizeof(long));
td->num_maps = num_maps;
memset(td->file_map, 0, num_maps * sizeof(long));
srand48_r(seed, &td->random_state);
return 0;
}
static void fill_cpu_mask(os_cpu_mask_t cpumask, int cpu)
{
#ifdef FIO_HAVE_CPU_AFFINITY
unsigned int i;
CPU_ZERO(&cpumask);
for (i = 0; i < sizeof(int) * 8; i++) {
if ((1 << i) & cpu)
CPU_SET(i, &cpumask);
}
#endif
}
static unsigned long get_mult(char c)
{
switch (c) {
case 'k':
case 'K':
return 1024;
case 'm':
case 'M':
return 1024 * 1024;
case 'g':
case 'G':
return 1024 * 1024 * 1024;
default:
return 1;
}
}
/*
* convert string after '=' into decimal value, noting any size suffix
*/
static int str_cnv(char *p, unsigned long long *val)
{
char *str;
int len;
str = strchr(p, '=');
if (!str)
return 1;
str++;
len = strlen(str);
*val = strtoul(str, NULL, 10);
if (*val == ULONG_MAX && errno == ERANGE)
return 1;
*val *= get_mult(str[len - 2]);
return 0;
}
static int check_strcnv(char *p, char *name, unsigned long long *val)
{
if (strncmp(p, name, strlen(name) - 1))
return 1;
return str_cnv(p, val);
}
static void strip_blank_front(char **p)
{
char *s = *p;
while (isblank(*s))
s++;
}
static void strip_blank_end(char *p)
{
while (isblank(*p)) {
*p = '\0';
p--;
}
}
typedef int (str_cb_fn)(struct thread_data *, char *);
static int check_str(char *p, char *name, str_cb_fn *cb, struct thread_data *td)
{
char *s = strstr(p, name);
if (!s)
return 1;
s = strchr(s, '=');
if (!s)
return 1;
s++;
strip_blank_front(&s);
return cb(td, s);
}
static int check_strstore(char *p, char *name, char *dest)
{
char *s = strstr(p, name);
if (!s)
return 1;
s = strchr(p, '=');
if (!s)
return 1;
s++;
strip_blank_front(&s);
strcpy(dest, s);
s = dest + strlen(dest) - 1;
strip_blank_end(s);
return 0;
}
static int __check_range(char *str, unsigned long *val)
{
char suffix;
if (sscanf(str, "%lu%c", val, &suffix) == 2) {
*val *= get_mult(suffix);
return 0;
}
if (sscanf(str, "%lu", val) == 1)
return 0;
return 1;
}
static int check_range(char *p, char *name, unsigned long *s, unsigned long *e)
{
char option[128];
char *str, *p1, *p2;
strcpy(option, p);
p = option;
str = strstr(p, name);
if (!str)
return 1;
p += strlen(name);
str = strchr(p, '=');
if (!str)
return 1;
/*
* 'p' now holds whatever is after the '=' sign
*/
p1 = str + 1;
/*
* terminate p1 at the '-' sign
*/
p = strchr(p1, '-');
if (!p)
return 1;
p2 = p + 1;
*p = '\0';
if (!__check_range(p1, s) && !__check_range(p2, e))
return 0;
return 1;
}
static int check_int(char *p, char *name, unsigned int *val)
{
char *str;
str = strstr(p, name);
if (!str)
return 1;
str = strchr(p, '=');
if (!str)
return 1;
str++;
if (sscanf(str, "%u", val) == 1)
return 0;
return 1;
}
static int check_strset(char *p, char *name)
{
return strncmp(p, name, strlen(name));
}
static int is_empty_or_comment(char *line)
{
unsigned int i;
for (i = 0; i < strlen(line); i++) {
if (line[i] == ';')
return 1;
if (!isspace(line[i]) && !iscntrl(line[i]))
return 0;
}
return 1;
}
static int str_rw_cb(struct thread_data *td, char *mem)
{
if (!strncmp(mem, "read", 4) || !strncmp(mem, "0", 1)) {
td->ddir = DDIR_READ;
td->sequential = 1;
return 0;
} else if (!strncmp(mem, "randread", 8)) {
td->ddir = DDIR_READ;
td->sequential = 0;
return 0;
} else if (!strncmp(mem, "write", 5) || !strncmp(mem, "1", 1)) {
td->ddir = DDIR_WRITE;
td->sequential = 1;
return 0;
} else if (!strncmp(mem, "randwrite", 9)) {
td->ddir = DDIR_WRITE;
td->sequential = 0;
return 0;
}
fprintf(stderr, "bad data direction: %s\n", mem);
return 1;
}
static int str_verify_cb(struct thread_data *td, char *mem)
{
if (!strncmp(mem, "0", 1)) {
td->verify = VERIFY_NONE;
return 0;
} else if (!strncmp(mem, "md5", 3) || !strncmp(mem, "1", 1)) {
td->verify = VERIFY_MD5;
return 0;
} else if (!strncmp(mem, "crc32", 5)) {
td->verify = VERIFY_CRC32;
return 0;
}
fprintf(stderr, "bad verify type: %s\n", mem);
return 1;
}
static int str_mem_cb(struct thread_data *td, char *mem)
{
if (!strncmp(mem, "malloc", 6)) {
td->mem_type = MEM_MALLOC;
return 0;
} else if (!strncmp(mem, "shm", 3)) {
td->mem_type = MEM_SHM;
return 0;
} else if (!strncmp(mem, "mmap", 4)) {
td->mem_type = MEM_MMAP;
return 0;
}
fprintf(stderr, "bad mem type: %s\n", mem);
return 1;
}
static int str_ioengine_cb(struct thread_data *td, char *str)
{
if (!strncmp(str, "linuxaio", 8) || !strncmp(str, "aio", 3) ||
!strncmp(str, "libaio", 6)) {
strcpy(td->io_engine_name, "libaio");
td->io_engine = FIO_LIBAIO;
return 0;
} else if (!strncmp(str, "posixaio", 8)) {
strcpy(td->io_engine_name, "posixaio");
td->io_engine = FIO_POSIXAIO;
return 0;
} else if (!strncmp(str, "sync", 4)) {
strcpy(td->io_engine_name, "sync");
td->io_engine = FIO_SYNCIO;
return 0;
} else if (!strncmp(str, "mmap", 4)) {
strcpy(td->io_engine_name, "mmap");
td->io_engine = FIO_MMAPIO;
return 0;
} else if (!strncmp(str, "sgio", 4)) {
strcpy(td->io_engine_name, "sgio");
td->io_engine = FIO_SGIO;
return 0;
}
fprintf(stderr, "bad ioengine type: %s\n", str);
return 1;
}
int parse_jobs_ini(char *file)
{
unsigned int prioclass, prio, cpu, global;
unsigned long long ull;
unsigned long ul1, ul2;
struct thread_data *td;
char *string, *name;
fpos_t off;
FILE *f;
char *p;
f = fopen(file, "r");
if (!f) {
perror("fopen");
return 1;
}
string = malloc(4096);
name = malloc(256);
while ((p = fgets(string, 4096, f)) != NULL) {
if (is_empty_or_comment(p))
continue;
if (sscanf(p, "[%s]", name) != 1)
continue;
global = !strncmp(name, "global", 6);
name[strlen(name) - 1] = '\0';
td = get_new_job(global, &def_thread);
if (!td)
return 1;
prioclass = 2;
prio = 4;
fgetpos(f, &off);
while ((p = fgets(string, 4096, f)) != NULL) {
if (is_empty_or_comment(p))
continue;
if (strstr(p, "["))
break;
if (!check_int(p, "prio", &prio)) {
#ifndef FIO_HAVE_IOPRIO
fprintf(stderr, "io priorities not available\n");
return 1;
#endif
fgetpos(f, &off);
continue;
}
if (!check_int(p, "prioclass", &prioclass)) {
#ifndef FIO_HAVE_IOPRIO
fprintf(stderr, "io priorities not available\n");
return 1;
#endif
fgetpos(f, &off);
continue;
}
if (!check_int(p, "direct", &td->odirect)) {
fgetpos(f, &off);
continue;
}
if (!check_int(p, "rate", &td->rate)) {
fgetpos(f, &off);
continue;
}
if (!check_int(p, "ratemin", &td->ratemin)) {
fgetpos(f, &off);
continue;
}
if (!check_int(p, "ratecycle", &td->ratecycle)) {
fgetpos(f, &off);
continue;
}
if (!check_int(p, "thinktime", &td->thinktime)) {
fgetpos(f, &off);
continue;
}
if (!check_int(p, "cpumask", &cpu)) {
#ifndef FIO_HAVE_CPU_AFFINITY
fprintf(stderr, "cpu affinity not available\n");
return 1;
#endif
fill_cpu_mask(td->cpumask, cpu);
fgetpos(f, &off);
continue;
}
if (!check_int(p, "fsync", &td->fsync_blocks)) {
fgetpos(f, &off);
continue;
}
if (!check_int(p, "startdelay", &td->start_delay)) {
fgetpos(f, &off);
continue;
}
if (!check_int(p, "timeout", &td->timeout)) {
fgetpos(f, &off);
continue;
}
if (!check_int(p, "invalidate",&td->invalidate_cache)) {
fgetpos(f, &off);
continue;
}
if (!check_int(p, "iodepth", &td->iodepth)) {
fgetpos(f, &off);
continue;
}
if (!check_int(p, "sync", &td->sync_io)) {
fgetpos(f, &off);
continue;
}
if (!check_int(p, "bwavgtime", &td->bw_avg_time)) {
fgetpos(f, &off);
continue;
}
if (!check_int(p, "create_serialize", &td->create_serialize)) {
fgetpos(f, &off);
continue;
}
if (!check_int(p, "create_fsync", &td->create_fsync)) {
fgetpos(f, &off);
continue;
}
if (!check_int(p, "loops", &td->loops)) {
fgetpos(f, &off);
continue;
}
if (!check_int(p, "numjobs", &td->numjobs)) {
fgetpos(f, &off);
continue;
}
if (!check_int(p, "overwrite", &td->overwrite)) {
fgetpos(f, &off);
continue;
}
if (!check_range(p, "bsrange", &ul1, &ul2)) {
if (ul1 > ul2) {
td->max_bs = ul1;
td->min_bs = ul2;
} else {
td->max_bs = ul2;
td->min_bs = ul1;
}
fgetpos(f, &off);
continue;
}
if (!check_strcnv(p, "bs", &ull)) {
td->bs = ull;
fgetpos(f, &off);
continue;
}
if (!check_strcnv(p, "size", &td->file_size)) {
fgetpos(f, &off);
continue;
}
if (!check_strcnv(p, "offset", &td->file_offset)) {
fgetpos(f, &off);
continue;
}
if (!check_strcnv(p, "zonesize", &td->zone_size)) {
fgetpos(f, &off);
continue;
}
if (!check_strcnv(p, "zoneskip", &td->zone_skip)) {
fgetpos(f, &off);
continue;
}
if (!check_strstore(p, "directory", td->directory)) {
fgetpos(f, &off);
continue;
}
if (!check_str(p, "mem", str_mem_cb, td)) {
fgetpos(f, &off);
continue;
}
if (!check_str(p, "verify", str_verify_cb, td)) {
fgetpos(f, &off);
continue;
}
if (!check_str(p, "rw", str_rw_cb, td)) {
fgetpos(f, &off);
continue;
}
if (!check_str(p, "ioengine", str_ioengine_cb, td)) {
fgetpos(f, &off);
continue;
}
if (!check_strset(p, "create")) {
td->create_file = 1;
fgetpos(f, &off);
continue;
}
if (!check_strset(p, "exitall")) {
exitall_on_terminate = 1;
fgetpos(f, &off);
continue;
}
if (!check_strset(p, "stonewall")) {
td->stonewall = 1;
fgetpos(f, &off);
continue;
}
if (!check_strset(p, "thread")) {
td->use_thread = 1;
fgetpos(f, &off);
continue;
}
printf("Client%d: bad option %s\n",td->thread_number,p);
}
fsetpos(f, &off);
if (add_job(td, name, prioclass, prio))
return 1;
}
free(string);
free(name);
fclose(f);
return 0;
}
static int fill_def_thread(void)
{
memset(&def_thread, 0, sizeof(def_thread));
if (fio_getaffinity(getpid(), &def_thread.cpumask) == -1) {
perror("sched_getaffinity");
return 1;
}
/*
* fill globals
*/
def_thread.ddir = DDIR_READ;
def_thread.bs = DEF_BS;
def_thread.min_bs = -1;
def_thread.max_bs = -1;
def_thread.io_engine = DEF_IO_ENGINE;
strcpy(def_thread.io_engine_name, DEF_IO_ENGINE_NAME);
def_thread.odirect = DEF_ODIRECT;
def_thread.ratecycle = DEF_RATE_CYCLE;
def_thread.sequential = DEF_SEQUENTIAL;
def_thread.timeout = DEF_TIMEOUT;
def_thread.create_file = DEF_CREATE;
def_thread.overwrite = DEF_OVERWRITE;
def_thread.invalidate_cache = DEF_INVALIDATE;
def_thread.sync_io = DEF_SYNCIO;
def_thread.mem_type = MEM_MALLOC;
def_thread.bw_avg_time = DEF_BWAVGTIME;
def_thread.create_serialize = DEF_CREATE_SER;
def_thread.create_fsync = DEF_CREATE_FSYNC;
def_thread.loops = DEF_LOOPS;
def_thread.verify = DEF_VERIFY;
def_thread.stonewall = DEF_STONEWALL;
def_thread.numjobs = DEF_NUMJOBS;
def_thread.use_thread = DEF_USE_THREAD;
#ifdef FIO_HAVE_DISK_UTIL
def_thread.do_disk_util = 1;
#endif
return 0;
}
static void parse_cmd_line(int argc, char *argv[])
{
int c;
while ((c = getopt(argc, argv, "s:b:t:r:R:o:f:lwv")) != EOF) {
switch (c) {
case 's':
def_thread.sequential = !!atoi(optarg);
break;
case 'b':
def_thread.bs = atoi(optarg);
def_thread.bs <<= 10;
if (!def_thread.bs) {
printf("bad block size\n");
def_thread.bs = DEF_BS;
}
break;
case 't':
def_thread.timeout = atoi(optarg);
break;
case 'r':
repeatable = !!atoi(optarg);
break;
case 'R':
rate_quit = !!atoi(optarg);
break;
case 'o':
def_thread.odirect = !!atoi(optarg);
break;
case 'f':
ini_file = strdup(optarg);
break;
case 'l':
write_lat_log = 1;
break;
case 'w':
write_bw_log = 1;
break;
case 'v':
printf("%s\n", fio_version_string);
exit(0);
}
}
}
static void free_shm(void)
{
struct shmid_ds sbuf;
if (threads) {
shmdt(threads);
threads = NULL;
shmctl(shm_id, IPC_RMID, &sbuf);
}
}
static int setup_thread_area(void)
{
/*
* 1024 is too much on some machines, scale max_jobs if
* we get a failure that looks like too large a shm segment
*/
do {
int s = max_jobs * sizeof(struct thread_data);
shm_id = shmget(0, s, IPC_CREAT | 0600);
if (shm_id != -1)
break;
if (errno != EINVAL) {
perror("shmget");
break;
}
max_jobs >>= 1;
} while (max_jobs);
if (shm_id == -1)
return 1;
threads = shmat(shm_id, NULL, 0);
if (threads == (void *) -1) {
perror("shmat");
return 1;
}
atexit(free_shm);
return 0;
}
int parse_options(int argc, char *argv[])
{
if (setup_thread_area())
return 1;
if (fill_def_thread())
return 1;
parse_cmd_line(argc, argv);
if (!ini_file) {
printf("Need job file\n");
return 1;
}
if (parse_jobs_ini(ini_file))
return 1;
return 0;
}