init.c revision 0a839f308177e95c4c45c41ee1d4fa2b8f231f24
1/*
2 * This file contains job initialization and setup functions.
3 */
4#include <stdio.h>
5#include <stdlib.h>
6#include <unistd.h>
7#include <fcntl.h>
8#include <ctype.h>
9#include <string.h>
10#include <errno.h>
11#include <getopt.h>
12#include <sys/ipc.h>
13#include <sys/shm.h>
14#include <sys/types.h>
15#include <sys/stat.h>
16
17#include "fio.h"
18#include "parse.h"
19
20static char fio_version_string[] = "fio 1.16";
21
22#define FIO_RANDSEED		(0xb1899bedUL)
23
24static char **ini_file;
25static int max_jobs = MAX_JOBS;
26static int dump_cmdline;
27
28struct thread_data def_thread;
29struct thread_data *threads = NULL;
30
31int exitall_on_terminate = 0;
32int terse_output = 0;
33unsigned long long mlock_size = 0;
34FILE *f_out = NULL;
35FILE *f_err = NULL;
36
37int write_bw_log = 0;
38
39static int def_timeout = 0;
40static int write_lat_log = 0;
41
42static int prev_group_jobs;
43
44/*
45 * Command line options. These will contain the above, plus a few
46 * extra that only pertain to fio itself and not jobs.
47 */
48static struct option long_options[FIO_NR_OPTIONS] = {
49	{
50		.name		= "output",
51		.has_arg	= required_argument,
52		.val		= 'o',
53	},
54	{
55		.name		= "timeout",
56		.has_arg	= required_argument,
57		.val		= 't',
58	},
59	{
60		.name		= "latency-log",
61		.has_arg	= required_argument,
62		.val		= 'l',
63	},
64	{
65		.name		= "bandwidth-log",
66		.has_arg	= required_argument,
67		.val		= 'b',
68	},
69	{
70		.name		= "minimal",
71		.has_arg	= optional_argument,
72		.val		= 'm',
73	},
74	{
75		.name		= "version",
76		.has_arg	= no_argument,
77		.val		= 'v',
78	},
79	{
80		.name		= "help",
81		.has_arg	= no_argument,
82		.val		= 'h',
83	},
84	{
85		.name		= "cmdhelp",
86		.has_arg	= optional_argument,
87		.val		= 'c',
88	},
89	{
90		.name		= "showcmd",
91		.has_arg	= no_argument,
92		.val		= 's'
93	},
94	{
95		.name		= NULL,
96	},
97};
98
99FILE *get_f_out()
100{
101	return f_out;
102}
103
104FILE *get_f_err()
105{
106	return f_err;
107}
108
109/*
110 * Return a free job structure.
111 */
112static struct thread_data *get_new_job(int global, struct thread_data *parent)
113{
114	struct thread_data *td;
115
116	if (global)
117		return &def_thread;
118	if (thread_number >= max_jobs)
119		return NULL;
120
121	td = &threads[thread_number++];
122	*td = *parent;
123
124	dup_files(td, parent);
125	options_mem_dupe(td);
126
127	td->thread_number = thread_number;
128	return td;
129}
130
131static void put_job(struct thread_data *td)
132{
133	if (td == &def_thread)
134		return;
135
136	if (td->error)
137		log_info("fio: %s\n", td->verror);
138
139	memset(&threads[td->thread_number - 1], 0, sizeof(*td));
140	thread_number--;
141}
142
143static int setup_rate(struct thread_data *td)
144{
145	unsigned long nr_reads_per_msec;
146	unsigned long long rate;
147	unsigned int bs;
148
149	if (!td->o.rate && !td->o.rate_iops)
150		return 0;
151
152	if (td_rw(td))
153		bs = td->o.rw_min_bs;
154	else if (td_read(td))
155		bs = td->o.min_bs[DDIR_READ];
156	else
157		bs = td->o.min_bs[DDIR_WRITE];
158
159	if (td->o.rate) {
160		rate = td->o.rate;
161		nr_reads_per_msec = (rate * 1024 * 1000LL) / bs;
162	} else
163		nr_reads_per_msec = td->o.rate_iops * 1000UL;
164
165	if (!nr_reads_per_msec) {
166		log_err("rate lower than supported\n");
167		return -1;
168	}
169
170	td->rate_usec_cycle = 1000000000ULL / nr_reads_per_msec;
171	td->rate_pending_usleep = 0;
172	return 0;
173}
174
175/*
176 * Lazy way of fixing up options that depend on each other. We could also
177 * define option callback handlers, but this is easier.
178 */
179static int fixup_options(struct thread_data *td)
180{
181	struct thread_options *o = &td->o;
182
183	if (o->rwmix[DDIR_READ] + o->rwmix[DDIR_WRITE] > 100)
184		o->rwmix[DDIR_WRITE] = 100 - o->rwmix[DDIR_READ];
185
186	if (o->write_iolog_file && o->read_iolog_file) {
187		log_err("fio: read iolog overrides write_iolog\n");
188		free(o->write_iolog_file);
189		o->write_iolog_file = NULL;
190	}
191
192	if (td->io_ops->flags & FIO_SYNCIO)
193		o->iodepth = 1;
194	else {
195		if (!o->iodepth)
196			o->iodepth = o->open_files;
197	}
198
199	/*
200	 * only really works for sequential io for now, and with 1 file
201	 */
202	if (o->zone_size && td_random(td) && o->open_files == 1)
203		o->zone_size = 0;
204
205	/*
206	 * Reads can do overwrites, we always need to pre-create the file
207	 */
208	if (td_read(td) || td_rw(td))
209		o->overwrite = 1;
210
211	if (!o->min_bs[DDIR_READ])
212		o->min_bs[DDIR_READ]= o->bs[DDIR_READ];
213	if (!o->max_bs[DDIR_READ])
214		o->max_bs[DDIR_READ] = o->bs[DDIR_READ];
215	if (!o->min_bs[DDIR_WRITE])
216		o->min_bs[DDIR_WRITE]= o->bs[DDIR_WRITE];
217	if (!o->max_bs[DDIR_WRITE])
218		o->max_bs[DDIR_WRITE] = o->bs[DDIR_WRITE];
219
220	o->rw_min_bs = min(o->min_bs[DDIR_READ], o->min_bs[DDIR_WRITE]);
221
222	if (!o->file_size_high)
223		o->file_size_high = o->file_size_low;
224
225	if (td_read(td) && !td_rw(td))
226		o->verify = 0;
227
228	if (o->norandommap && o->verify != VERIFY_NONE) {
229		log_err("fio: norandommap given, verify disabled\n");
230		o->verify = VERIFY_NONE;
231	}
232	if (o->bs_unaligned && (o->odirect || td->io_ops->flags & FIO_RAWIO))
233		log_err("fio: bs_unaligned may not work with raw io\n");
234
235	/*
236	 * thinktime_spin must be less than thinktime
237	 */
238	if (o->thinktime_spin > o->thinktime)
239		o->thinktime_spin = o->thinktime;
240
241	/*
242	 * The low water mark cannot be bigger than the iodepth
243	 */
244	if (o->iodepth_low > o->iodepth || !o->iodepth_low) {
245		/*
246		 * syslet work around - if the workload is sequential,
247		 * we want to let the queue drain all the way down to
248		 * avoid seeking between async threads
249		 */
250		if (!strcmp(td->io_ops->name, "syslet-rw") && !td_random(td))
251			o->iodepth_low = 1;
252		else
253			o->iodepth_low = o->iodepth;
254	}
255
256	/*
257	 * If batch number isn't set, default to the same as iodepth
258	 */
259	if (o->iodepth_batch > o->iodepth || !o->iodepth_batch)
260		o->iodepth_batch = o->iodepth;
261
262	if (o->nr_files > td->files_index)
263		o->nr_files = td->files_index;
264
265	if (o->open_files > o->nr_files || !o->open_files)
266		o->open_files = o->nr_files;
267
268	if ((o->rate && o->rate_iops) || (o->ratemin && o->rate_iops_min)) {
269		log_err("fio: rate and rate_iops are mutually exclusive\n");
270		return 1;
271	}
272	if ((o->rate < o->ratemin) || (o->rate_iops < o->rate_iops_min)) {
273		log_err("fio: minimum rate exceeds rate\n");
274		return 1;
275	}
276
277	if (!o->timeout && o->time_based) {
278		log_err("fio: time_based requires a runtime/timeout setting\n");
279		o->time_based = 0;
280	}
281
282	return 0;
283}
284
/*
 * Format 'val' with the largest power-of-1024 suffix that divides it
 * evenly, e.g. 4096 -> "4K", 1048576 -> "1M", 1000 -> "1000".
 *
 * Returns a malloc()ed string that the caller must free(), or NULL if the
 * allocation fails.
 */
static char *to_kmg(unsigned int val)
{
	/* first entry means "no suffix", the trailing 0 stops the scan */
	static const char post[] = { 0, 'K', 'M', 'G', 'T', 'P', 'E', 0 };
	const size_t len = 32;
	const char *p = post;
	char *buf;

	buf = malloc(len);
	if (!buf)
		return NULL;

	do {
		if (val & 1023)
			break;

		val >>= 10;
		p++;
	} while (*p);

	if (*p)
		snprintf(buf, len, "%u%c", val, *p);
	else
		snprintf(buf, len, "%u", val);

	return buf;
}
305
/*
 * External engines are specified by "external:name.o".
 *
 * When 'str' contains a colon, return the part after the first one with
 * blanks stripped at both ends (the stripping goes through
 * strip_blank_end(), which is handed a pointer into the caller's string).
 * Without a colon 'str' is returned unchanged.
 */
static const char *get_engine_name(const char *str)
{
	char *name = strstr(str, ":");

	if (name) {
		name++;
		strip_blank_front(&name);
		strip_blank_end(name);
		return name;
	}

	return str;
}
319
/*
 * Return 1 if 'filename' can be lstat()ed and is something other than a
 * regular file, 0 if it is a regular file or cannot be lstat()ed at all.
 */
static int exists_and_not_file(const char *filename)
{
	struct stat st;
	int found = (lstat(filename, &st) != -1);

	return found && !S_ISREG(st.st_mode);
}
332
333/*
334 * Initialize the various random states we need (random io, block size ranges,
335 * read/write mix, etc).
336 */
337static int init_random_state(struct thread_data *td)
338{
339	unsigned long seeds[6];
340	int fd;
341
342	fd = open("/dev/urandom", O_RDONLY);
343	if (fd == -1) {
344		td_verror(td, errno, "open");
345		return 1;
346	}
347
348	if (read(fd, seeds, sizeof(seeds)) < (int) sizeof(seeds)) {
349		td_verror(td, EIO, "read");
350		close(fd);
351		return 1;
352	}
353
354	close(fd);
355
356	os_random_seed(seeds[0], &td->bsrange_state);
357	os_random_seed(seeds[1], &td->verify_state);
358	os_random_seed(seeds[2], &td->rwmix_state);
359
360	if (td->o.file_service_type == FIO_FSERVICE_RANDOM)
361		os_random_seed(seeds[3], &td->next_file_state);
362
363	os_random_seed(seeds[5], &td->file_size_state);
364
365	if (!td_random(td))
366		return 0;
367
368	if (td->o.rand_repeatable)
369		seeds[4] = FIO_RANDSEED * td->thread_number;
370
371	os_random_seed(seeds[4], &td->random_state);
372	return 0;
373}
374
375/*
376 * Adds a job to the list of things todo. Sanitizes the various options
377 * to make sure we don't have conflicts, and initializes various
378 * members of td.
379 */
380static int add_job(struct thread_data *td, const char *jobname, int job_add_num)
381{
382	const char *ddir_str[] = { NULL, "read", "write", "rw", NULL,
383				   "randread", "randwrite", "randrw" };
384	unsigned int i;
385	const char *engine;
386	char fname[PATH_MAX];
387	int numjobs, file_alloced;
388
389	/*
390	 * the def_thread is just for options, it's not a real job
391	 */
392	if (td == &def_thread)
393		return 0;
394
395	/*
396	 * if we are just dumping the output command line, don't add the job
397	 */
398	if (dump_cmdline) {
399		put_job(td);
400		return 0;
401	}
402
403	engine = get_engine_name(td->o.ioengine);
404	td->io_ops = load_ioengine(td, engine);
405	if (!td->io_ops) {
406		log_err("fio: failed to load engine %s\n", engine);
407		goto err;
408	}
409
410	if (td->o.use_thread)
411		nr_thread++;
412	else
413		nr_process++;
414
415	if (td->o.odirect)
416		td->io_ops->flags |= FIO_RAWIO;
417
418	file_alloced = 0;
419	if (!td->o.filename && !td->files_index) {
420		file_alloced = 1;
421
422		if (td->o.nr_files == 1 && exists_and_not_file(jobname))
423			add_file(td, jobname);
424		else {
425			for (i = 0; i < td->o.nr_files; i++) {
426				sprintf(fname, "%s.%d.%d", jobname, td->thread_number, i);
427				add_file(td, fname);
428			}
429		}
430	}
431
432	if (fixup_options(td))
433		goto err;
434
435	if (td->io_ops->flags & FIO_DISKLESSIO) {
436		struct fio_file *f;
437
438		for_each_file(td, f, i)
439			f->real_file_size = -1ULL;
440	}
441
442	td->mutex = fio_sem_init(0);
443
444	td->ts.clat_stat[0].min_val = td->ts.clat_stat[1].min_val = ULONG_MAX;
445	td->ts.slat_stat[0].min_val = td->ts.slat_stat[1].min_val = ULONG_MAX;
446	td->ts.bw_stat[0].min_val = td->ts.bw_stat[1].min_val = ULONG_MAX;
447	td->ddir_nr = td->o.ddir_nr;
448
449	if ((td->o.stonewall || td->o.numjobs > 1 || td->o.new_group)
450	     && prev_group_jobs) {
451		prev_group_jobs = 0;
452		groupid++;
453	}
454
455	td->groupid = groupid;
456	prev_group_jobs++;
457
458	if (init_random_state(td))
459		goto err;
460
461	if (setup_rate(td))
462		goto err;
463
464	if (td->o.write_lat_log) {
465		setup_log(&td->ts.slat_log);
466		setup_log(&td->ts.clat_log);
467	}
468	if (td->o.write_bw_log)
469		setup_log(&td->ts.bw_log);
470
471	if (!td->o.name)
472		td->o.name = strdup(jobname);
473
474	if (!terse_output) {
475		if (!job_add_num) {
476			if (!strcmp(td->io_ops->name, "cpuio"))
477				log_info("%s: ioengine=cpu, cpuload=%u, cpucycle=%u\n", td->o.name, td->o.cpuload, td->o.cpucycle);
478			else {
479				char *c1, *c2, *c3, *c4;
480
481				c1 = to_kmg(td->o.min_bs[DDIR_READ]);
482				c2 = to_kmg(td->o.max_bs[DDIR_READ]);
483				c3 = to_kmg(td->o.min_bs[DDIR_WRITE]);
484				c4 = to_kmg(td->o.max_bs[DDIR_WRITE]);
485
486				log_info("%s: (g=%d): rw=%s, bs=%s-%s/%s-%s, ioengine=%s, iodepth=%u\n", td->o.name, td->groupid, ddir_str[td->o.td_ddir], c1, c2, c3, c4, td->io_ops->name, td->o.iodepth);
487
488				free(c1);
489				free(c2);
490				free(c3);
491				free(c4);
492			}
493		} else if (job_add_num == 1)
494			log_info("...\n");
495	}
496
497	/*
498	 * recurse add identical jobs, clear numjobs and stonewall options
499	 * as they don't apply to sub-jobs
500	 */
501	numjobs = td->o.numjobs;
502	while (--numjobs) {
503		struct thread_data *td_new = get_new_job(0, td);
504
505		if (!td_new)
506			goto err;
507
508		td_new->o.numjobs = 1;
509		td_new->o.stonewall = 0;
510		td_new->o.new_group = 0;
511
512		if (file_alloced) {
513			td_new->o.filename = NULL;
514			td_new->files_index = 0;
515			td_new->files = NULL;
516		}
517
518		job_add_num = numjobs - 1;
519
520		if (add_job(td_new, jobname, job_add_num))
521			goto err;
522	}
523
524	return 0;
525err:
526	put_job(td);
527	return -1;
528}
529
/*
 * Return 1 if 'line' holds nothing but whitespace/control characters, or
 * if the first other character is a comment marker (';' or '#').
 * Return 0 as soon as any other character is seen first.
 */
static int is_empty_or_comment(const char *line)
{
	const unsigned char *c;

	/*
	 * Walk the bytes as unsigned char: the <ctype.h> classifiers are
	 * undefined for negative values other than EOF.
	 */
	for (c = (const unsigned char *) line; *c; c++) {
		if (*c == ';' || *c == '#')
			return 1;
		if (!isspace(*c) && !iscntrl(*c))
			return 0;
	}

	return 1;
}
545
546/*
547 * This is our [ini] type file parser.
548 */
549static int parse_jobs_ini(char *file, int stonewall_flag)
550{
551	unsigned int global;
552	struct thread_data *td;
553	char *string, *name;
554	fpos_t off;
555	FILE *f;
556	char *p;
557	int ret = 0, stonewall;
558	int first_sect = 1;
559
560	f = fopen(file, "r");
561	if (!f) {
562		perror("fopen job file");
563		return 1;
564	}
565
566	string = malloc(4096);
567	name = malloc(256);
568	memset(name, 0, 256);
569
570	stonewall = stonewall_flag;
571	do {
572		p = fgets(string, 4095, f);
573		if (!p)
574			break;
575
576		strip_blank_front(&p);
577		strip_blank_end(p);
578
579		if (is_empty_or_comment(p))
580			continue;
581		if (sscanf(p, "[%255s]", name) != 1) {
582			log_err("fio: option <%s> outside of job section\n", p);
583			continue;
584		}
585
586		global = !strncmp(name, "global", 6);
587
588		name[strlen(name) - 1] = '\0';
589
590		if (dump_cmdline) {
591			if (first_sect)
592				log_info("fio ");
593			if (!global)
594				log_info("--name=%s ", name);
595			first_sect = 0;
596		}
597
598		td = get_new_job(global, &def_thread);
599		if (!td) {
600			ret = 1;
601			break;
602		}
603
604		/*
605		 * Seperate multiple job files by a stonewall
606		 */
607		if (!global && stonewall) {
608			td->o.stonewall = stonewall;
609			stonewall = 0;
610		}
611
612		fgetpos(f, &off);
613		while ((p = fgets(string, 4096, f)) != NULL) {
614			if (is_empty_or_comment(p))
615				continue;
616
617			strip_blank_front(&p);
618
619			if (p[0] == '[')
620				break;
621
622			strip_blank_end(p);
623
624			fgetpos(f, &off);
625
626			/*
627			 * Don't break here, continue parsing options so we
628			 * dump all the bad ones. Makes trial/error fixups
629			 * easier on the user.
630			 */
631			ret |= fio_option_parse(td, p);
632			if (!ret && dump_cmdline)
633				log_info("--%s ", p);
634		}
635
636		if (!ret) {
637			fsetpos(f, &off);
638			ret = add_job(td, name, 0);
639		} else {
640			log_err("fio: job %s dropped\n", name);
641			put_job(td);
642		}
643	} while (!ret);
644
645	if (dump_cmdline)
646		log_info("\n");
647
648	free(string);
649	free(name);
650	fclose(f);
651	return ret;
652}
653
654static int fill_def_thread(void)
655{
656	memset(&def_thread, 0, sizeof(def_thread));
657
658	if (fio_getaffinity(getpid(), &def_thread.o.cpumask) == -1) {
659		perror("sched_getaffinity");
660		return 1;
661	}
662
663	/*
664	 * fill default options
665	 */
666	fio_fill_default_options(&def_thread);
667
668	def_thread.o.timeout = def_timeout;
669	def_thread.o.write_bw_log = write_bw_log;
670	def_thread.o.write_lat_log = write_lat_log;
671
672	return 0;
673}
674
675static void free_shm(void)
676{
677	struct shmid_ds sbuf;
678
679	if (threads) {
680		shmdt((void *) threads);
681		threads = NULL;
682		shmctl(shm_id, IPC_RMID, &sbuf);
683	}
684}
685
686/*
687 * The thread area is shared between the main process and the job
688 * threads/processes. So setup a shared memory segment that will hold
689 * all the job info.
690 */
691static int setup_thread_area(void)
692{
693	/*
694	 * 1024 is too much on some machines, scale max_jobs if
695	 * we get a failure that looks like too large a shm segment
696	 */
697	do {
698		size_t size = max_jobs * sizeof(struct thread_data);
699
700		shm_id = shmget(0, size, IPC_CREAT | 0600);
701		if (shm_id != -1)
702			break;
703		if (errno != EINVAL) {
704			perror("shmget");
705			break;
706		}
707
708		max_jobs >>= 1;
709	} while (max_jobs);
710
711	if (shm_id == -1)
712		return 1;
713
714	threads = shmat(shm_id, NULL, 0);
715	if (threads == (void *) -1) {
716		perror("shmat");
717		return 1;
718	}
719
720	atexit(free_shm);
721	return 0;
722}
723
724static void usage(void)
725{
726	printf("%s\n", fio_version_string);
727	printf("\t--output\tWrite output to file\n");
728	printf("\t--timeout\tRuntime in seconds\n");
729	printf("\t--latency-log\tGenerate per-job latency logs\n");
730	printf("\t--bandwidth-log\tGenerate per-job bandwidth logs\n");
731	printf("\t--minimal\tMinimal (terse) output\n");
732	printf("\t--version\tPrint version info and exit\n");
733	printf("\t--help\t\tPrint this page\n");
734	printf("\t--cmdhelp=cmd\tPrint command help, \"all\" for all of them\n");
735	printf("\t--showcmd\tTurn a job file into command line options\n");
736}
737
738static int parse_cmd_line(int argc, char *argv[])
739{
740	struct thread_data *td = NULL;
741	int c, ini_idx = 0, lidx, ret, dont_add_job = 0;
742
743	while ((c = getopt_long_only(argc, argv, "", long_options, &lidx)) != -1) {
744		switch (c) {
745		case 't':
746			def_timeout = atoi(optarg);
747			break;
748		case 'l':
749			write_lat_log = 1;
750			break;
751		case 'w':
752			write_bw_log = 1;
753			break;
754		case 'o':
755			f_out = fopen(optarg, "w+");
756			if (!f_out) {
757				perror("fopen output");
758				exit(1);
759			}
760			f_err = f_out;
761			break;
762		case 'm':
763			terse_output = 1;
764			break;
765		case 'h':
766			usage();
767			exit(0);
768		case 'c':
769			exit(fio_show_option_help(optarg));
770		case 's':
771			dump_cmdline = 1;
772			break;
773		case 'v':
774			printf("%s\n", fio_version_string);
775			exit(0);
776		case FIO_GETOPT_JOB: {
777			const char *opt = long_options[lidx].name;
778			char *val = optarg;
779
780			if (!strncmp(opt, "name", 4) && td) {
781				ret = add_job(td, td->o.name ?: "fio", 0);
782				if (ret) {
783					put_job(td);
784					return 0;
785				}
786				td = NULL;
787			}
788			if (!td) {
789				int global = 0;
790
791				if (strncmp(opt, "name", 4) ||
792				    !strncmp(val, "global", 6))
793					global = 1;
794
795				td = get_new_job(global, &def_thread);
796				if (!td)
797					return 0;
798			}
799
800			ret = fio_cmd_option_parse(td, opt, val);
801			if (ret)
802				dont_add_job = 1;
803			break;
804		}
805		default:
806			break;
807		}
808	}
809
810	if (td) {
811		if (dont_add_job)
812			put_job(td);
813		else {
814			ret = add_job(td, td->o.name ?: "fio", 0);
815			if (ret)
816				put_job(td);
817		}
818	}
819
820	while (optind < argc) {
821		ini_idx++;
822		ini_file = realloc(ini_file, ini_idx * sizeof(char *));
823		ini_file[ini_idx - 1] = strdup(argv[optind]);
824		optind++;
825	}
826
827	return ini_idx;
828}
829
830
831int parse_options(int argc, char *argv[])
832{
833	int job_files, i;
834
835	f_out = stdout;
836	f_err = stderr;
837
838	fio_options_dup_and_init(long_options);
839
840	if (setup_thread_area())
841		return 1;
842	if (fill_def_thread())
843		return 1;
844
845	job_files = parse_cmd_line(argc, argv);
846
847	for (i = 0; i < job_files; i++) {
848		if (fill_def_thread())
849			return 1;
850		if (parse_jobs_ini(ini_file[i], i))
851			return 1;
852		free(ini_file[i]);
853	}
854
855	free(ini_file);
856	options_mem_free(&def_thread);
857
858	if (!thread_number) {
859		if (dump_cmdline)
860			return 0;
861
862		log_err("No jobs defined(s)\n");
863		return 1;
864	}
865
866	return 0;
867}
868