init.c revision 0a839f308177e95c4c45c41ee1d4fa2b8f231f24
1/* 2 * This file contains job initialization and setup functions. 3 */ 4#include <stdio.h> 5#include <stdlib.h> 6#include <unistd.h> 7#include <fcntl.h> 8#include <ctype.h> 9#include <string.h> 10#include <errno.h> 11#include <getopt.h> 12#include <sys/ipc.h> 13#include <sys/shm.h> 14#include <sys/types.h> 15#include <sys/stat.h> 16 17#include "fio.h" 18#include "parse.h" 19 20static char fio_version_string[] = "fio 1.16"; 21 22#define FIO_RANDSEED (0xb1899bedUL) 23 24static char **ini_file; 25static int max_jobs = MAX_JOBS; 26static int dump_cmdline; 27 28struct thread_data def_thread; 29struct thread_data *threads = NULL; 30 31int exitall_on_terminate = 0; 32int terse_output = 0; 33unsigned long long mlock_size = 0; 34FILE *f_out = NULL; 35FILE *f_err = NULL; 36 37int write_bw_log = 0; 38 39static int def_timeout = 0; 40static int write_lat_log = 0; 41 42static int prev_group_jobs; 43 44/* 45 * Command line options. These will contain the above, plus a few 46 * extra that only pertain to fio itself and not jobs. 47 */ 48static struct option long_options[FIO_NR_OPTIONS] = { 49 { 50 .name = "output", 51 .has_arg = required_argument, 52 .val = 'o', 53 }, 54 { 55 .name = "timeout", 56 .has_arg = required_argument, 57 .val = 't', 58 }, 59 { 60 .name = "latency-log", 61 .has_arg = required_argument, 62 .val = 'l', 63 }, 64 { 65 .name = "bandwidth-log", 66 .has_arg = required_argument, 67 .val = 'b', 68 }, 69 { 70 .name = "minimal", 71 .has_arg = optional_argument, 72 .val = 'm', 73 }, 74 { 75 .name = "version", 76 .has_arg = no_argument, 77 .val = 'v', 78 }, 79 { 80 .name = "help", 81 .has_arg = no_argument, 82 .val = 'h', 83 }, 84 { 85 .name = "cmdhelp", 86 .has_arg = optional_argument, 87 .val = 'c', 88 }, 89 { 90 .name = "showcmd", 91 .has_arg = no_argument, 92 .val = 's' 93 }, 94 { 95 .name = NULL, 96 }, 97}; 98 99FILE *get_f_out() 100{ 101 return f_out; 102} 103 104FILE *get_f_err() 105{ 106 return f_err; 107} 108 109/* 110 * Return a free job structure. 111 */ 112static struct thread_data *get_new_job(int global, struct thread_data *parent) 113{ 114 struct thread_data *td; 115 116 if (global) 117 return &def_thread; 118 if (thread_number >= max_jobs) 119 return NULL; 120 121 td = &threads[thread_number++]; 122 *td = *parent; 123 124 dup_files(td, parent); 125 options_mem_dupe(td); 126 127 td->thread_number = thread_number; 128 return td; 129} 130 131static void put_job(struct thread_data *td) 132{ 133 if (td == &def_thread) 134 return; 135 136 if (td->error) 137 log_info("fio: %s\n", td->verror); 138 139 memset(&threads[td->thread_number - 1], 0, sizeof(*td)); 140 thread_number--; 141} 142 143static int setup_rate(struct thread_data *td) 144{ 145 unsigned long nr_reads_per_msec; 146 unsigned long long rate; 147 unsigned int bs; 148 149 if (!td->o.rate && !td->o.rate_iops) 150 return 0; 151 152 if (td_rw(td)) 153 bs = td->o.rw_min_bs; 154 else if (td_read(td)) 155 bs = td->o.min_bs[DDIR_READ]; 156 else 157 bs = td->o.min_bs[DDIR_WRITE]; 158 159 if (td->o.rate) { 160 rate = td->o.rate; 161 nr_reads_per_msec = (rate * 1024 * 1000LL) / bs; 162 } else 163 nr_reads_per_msec = td->o.rate_iops * 1000UL; 164 165 if (!nr_reads_per_msec) { 166 log_err("rate lower than supported\n"); 167 return -1; 168 } 169 170 td->rate_usec_cycle = 1000000000ULL / nr_reads_per_msec; 171 td->rate_pending_usleep = 0; 172 return 0; 173} 174 175/* 176 * Lazy way of fixing up options that depend on each other. We could also 177 * define option callback handlers, but this is easier. 178 */ 179static int fixup_options(struct thread_data *td) 180{ 181 struct thread_options *o = &td->o; 182 183 if (o->rwmix[DDIR_READ] + o->rwmix[DDIR_WRITE] > 100) 184 o->rwmix[DDIR_WRITE] = 100 - o->rwmix[DDIR_READ]; 185 186 if (o->write_iolog_file && o->read_iolog_file) { 187 log_err("fio: read iolog overrides write_iolog\n"); 188 free(o->write_iolog_file); 189 o->write_iolog_file = NULL; 190 } 191 192 if (td->io_ops->flags & FIO_SYNCIO) 193 o->iodepth = 1; 194 else { 195 if (!o->iodepth) 196 o->iodepth = o->open_files; 197 } 198 199 /* 200 * only really works for sequential io for now, and with 1 file 201 */ 202 if (o->zone_size && td_random(td) && o->open_files == 1) 203 o->zone_size = 0; 204 205 /* 206 * Reads can do overwrites, we always need to pre-create the file 207 */ 208 if (td_read(td) || td_rw(td)) 209 o->overwrite = 1; 210 211 if (!o->min_bs[DDIR_READ]) 212 o->min_bs[DDIR_READ]= o->bs[DDIR_READ]; 213 if (!o->max_bs[DDIR_READ]) 214 o->max_bs[DDIR_READ] = o->bs[DDIR_READ]; 215 if (!o->min_bs[DDIR_WRITE]) 216 o->min_bs[DDIR_WRITE]= o->bs[DDIR_WRITE]; 217 if (!o->max_bs[DDIR_WRITE]) 218 o->max_bs[DDIR_WRITE] = o->bs[DDIR_WRITE]; 219 220 o->rw_min_bs = min(o->min_bs[DDIR_READ], o->min_bs[DDIR_WRITE]); 221 222 if (!o->file_size_high) 223 o->file_size_high = o->file_size_low; 224 225 if (td_read(td) && !td_rw(td)) 226 o->verify = 0; 227 228 if (o->norandommap && o->verify != VERIFY_NONE) { 229 log_err("fio: norandommap given, verify disabled\n"); 230 o->verify = VERIFY_NONE; 231 } 232 if (o->bs_unaligned && (o->odirect || td->io_ops->flags & FIO_RAWIO)) 233 log_err("fio: bs_unaligned may not work with raw io\n"); 234 235 /* 236 * thinktime_spin must be less than thinktime 237 */ 238 if (o->thinktime_spin > o->thinktime) 239 o->thinktime_spin = o->thinktime; 240 241 /* 242 * The low water mark cannot be bigger than the iodepth 243 */ 244 if (o->iodepth_low > o->iodepth || !o->iodepth_low) { 245 /* 246 * syslet work around - if the workload is sequential, 247 * we want to let the queue drain all the way down to 248 * avoid seeking between async threads 249 */ 250 if (!strcmp(td->io_ops->name, "syslet-rw") && !td_random(td)) 251 o->iodepth_low = 1; 252 else 253 o->iodepth_low = o->iodepth; 254 } 255 256 /* 257 * If batch number isn't set, default to the same as iodepth 258 */ 259 if (o->iodepth_batch > o->iodepth || !o->iodepth_batch) 260 o->iodepth_batch = o->iodepth; 261 262 if (o->nr_files > td->files_index) 263 o->nr_files = td->files_index; 264 265 if (o->open_files > o->nr_files || !o->open_files) 266 o->open_files = o->nr_files; 267 268 if ((o->rate && o->rate_iops) || (o->ratemin && o->rate_iops_min)) { 269 log_err("fio: rate and rate_iops are mutually exclusive\n"); 270 return 1; 271 } 272 if ((o->rate < o->ratemin) || (o->rate_iops < o->rate_iops_min)) { 273 log_err("fio: minimum rate exceeds rate\n"); 274 return 1; 275 } 276 277 if (!o->timeout && o->time_based) { 278 log_err("fio: time_based requires a runtime/timeout setting\n"); 279 o->time_based = 0; 280 } 281 282 return 0; 283} 284 285/* 286 * This function leaks the buffer 287 */ 288static char *to_kmg(unsigned int val) 289{ 290 char *buf = malloc(32); 291 char post[] = { 0, 'K', 'M', 'G', 'P', 'E', 0 }; 292 char *p = post; 293 294 do { 295 if (val & 1023) 296 break; 297 298 val >>= 10; 299 p++; 300 } while (*p); 301 302 snprintf(buf, 31, "%u%c", val, *p); 303 return buf; 304} 305 306/* External engines are specified by "external:name.o") */ 307static const char *get_engine_name(const char *str) 308{ 309 char *p = strstr(str, ":"); 310 311 if (!p) 312 return str; 313 314 p++; 315 strip_blank_front(&p); 316 strip_blank_end(p); 317 return p; 318} 319 320static int exists_and_not_file(const char *filename) 321{ 322 struct stat sb; 323 324 if (lstat(filename, &sb) == -1) 325 return 0; 326 327 if (S_ISREG(sb.st_mode)) 328 return 0; 329 330 return 1; 331} 332 333/* 334 * Initialize the various random states we need (random io, block size ranges, 335 * read/write mix, etc). 336 */ 337static int init_random_state(struct thread_data *td) 338{ 339 unsigned long seeds[6]; 340 int fd; 341 342 fd = open("/dev/urandom", O_RDONLY); 343 if (fd == -1) { 344 td_verror(td, errno, "open"); 345 return 1; 346 } 347 348 if (read(fd, seeds, sizeof(seeds)) < (int) sizeof(seeds)) { 349 td_verror(td, EIO, "read"); 350 close(fd); 351 return 1; 352 } 353 354 close(fd); 355 356 os_random_seed(seeds[0], &td->bsrange_state); 357 os_random_seed(seeds[1], &td->verify_state); 358 os_random_seed(seeds[2], &td->rwmix_state); 359 360 if (td->o.file_service_type == FIO_FSERVICE_RANDOM) 361 os_random_seed(seeds[3], &td->next_file_state); 362 363 os_random_seed(seeds[5], &td->file_size_state); 364 365 if (!td_random(td)) 366 return 0; 367 368 if (td->o.rand_repeatable) 369 seeds[4] = FIO_RANDSEED * td->thread_number; 370 371 os_random_seed(seeds[4], &td->random_state); 372 return 0; 373} 374 375/* 376 * Adds a job to the list of things todo. Sanitizes the various options 377 * to make sure we don't have conflicts, and initializes various 378 * members of td. 379 */ 380static int add_job(struct thread_data *td, const char *jobname, int job_add_num) 381{ 382 const char *ddir_str[] = { NULL, "read", "write", "rw", NULL, 383 "randread", "randwrite", "randrw" }; 384 unsigned int i; 385 const char *engine; 386 char fname[PATH_MAX]; 387 int numjobs, file_alloced; 388 389 /* 390 * the def_thread is just for options, it's not a real job 391 */ 392 if (td == &def_thread) 393 return 0; 394 395 /* 396 * if we are just dumping the output command line, don't add the job 397 */ 398 if (dump_cmdline) { 399 put_job(td); 400 return 0; 401 } 402 403 engine = get_engine_name(td->o.ioengine); 404 td->io_ops = load_ioengine(td, engine); 405 if (!td->io_ops) { 406 log_err("fio: failed to load engine %s\n", engine); 407 goto err; 408 } 409 410 if (td->o.use_thread) 411 nr_thread++; 412 else 413 nr_process++; 414 415 if (td->o.odirect) 416 td->io_ops->flags |= FIO_RAWIO; 417 418 file_alloced = 0; 419 if (!td->o.filename && !td->files_index) { 420 file_alloced = 1; 421 422 if (td->o.nr_files == 1 && exists_and_not_file(jobname)) 423 add_file(td, jobname); 424 else { 425 for (i = 0; i < td->o.nr_files; i++) { 426 sprintf(fname, "%s.%d.%d", jobname, td->thread_number, i); 427 add_file(td, fname); 428 } 429 } 430 } 431 432 if (fixup_options(td)) 433 goto err; 434 435 if (td->io_ops->flags & FIO_DISKLESSIO) { 436 struct fio_file *f; 437 438 for_each_file(td, f, i) 439 f->real_file_size = -1ULL; 440 } 441 442 td->mutex = fio_sem_init(0); 443 444 td->ts.clat_stat[0].min_val = td->ts.clat_stat[1].min_val = ULONG_MAX; 445 td->ts.slat_stat[0].min_val = td->ts.slat_stat[1].min_val = ULONG_MAX; 446 td->ts.bw_stat[0].min_val = td->ts.bw_stat[1].min_val = ULONG_MAX; 447 td->ddir_nr = td->o.ddir_nr; 448 449 if ((td->o.stonewall || td->o.numjobs > 1 || td->o.new_group) 450 && prev_group_jobs) { 451 prev_group_jobs = 0; 452 groupid++; 453 } 454 455 td->groupid = groupid; 456 prev_group_jobs++; 457 458 if (init_random_state(td)) 459 goto err; 460 461 if (setup_rate(td)) 462 goto err; 463 464 if (td->o.write_lat_log) { 465 setup_log(&td->ts.slat_log); 466 setup_log(&td->ts.clat_log); 467 } 468 if (td->o.write_bw_log) 469 setup_log(&td->ts.bw_log); 470 471 if (!td->o.name) 472 td->o.name = strdup(jobname); 473 474 if (!terse_output) { 475 if (!job_add_num) { 476 if (!strcmp(td->io_ops->name, "cpuio")) 477 log_info("%s: ioengine=cpu, cpuload=%u, cpucycle=%u\n", td->o.name, td->o.cpuload, td->o.cpucycle); 478 else { 479 char *c1, *c2, *c3, *c4; 480 481 c1 = to_kmg(td->o.min_bs[DDIR_READ]); 482 c2 = to_kmg(td->o.max_bs[DDIR_READ]); 483 c3 = to_kmg(td->o.min_bs[DDIR_WRITE]); 484 c4 = to_kmg(td->o.max_bs[DDIR_WRITE]); 485 486 log_info("%s: (g=%d): rw=%s, bs=%s-%s/%s-%s, ioengine=%s, iodepth=%u\n", td->o.name, td->groupid, ddir_str[td->o.td_ddir], c1, c2, c3, c4, td->io_ops->name, td->o.iodepth); 487 488 free(c1); 489 free(c2); 490 free(c3); 491 free(c4); 492 } 493 } else if (job_add_num == 1) 494 log_info("...\n"); 495 } 496 497 /* 498 * recurse add identical jobs, clear numjobs and stonewall options 499 * as they don't apply to sub-jobs 500 */ 501 numjobs = td->o.numjobs; 502 while (--numjobs) { 503 struct thread_data *td_new = get_new_job(0, td); 504 505 if (!td_new) 506 goto err; 507 508 td_new->o.numjobs = 1; 509 td_new->o.stonewall = 0; 510 td_new->o.new_group = 0; 511 512 if (file_alloced) { 513 td_new->o.filename = NULL; 514 td_new->files_index = 0; 515 td_new->files = NULL; 516 } 517 518 job_add_num = numjobs - 1; 519 520 if (add_job(td_new, jobname, job_add_num)) 521 goto err; 522 } 523 524 return 0; 525err: 526 put_job(td); 527 return -1; 528} 529 530static int is_empty_or_comment(char *line) 531{ 532 unsigned int i; 533 534 for (i = 0; i < strlen(line); i++) { 535 if (line[i] == ';') 536 return 1; 537 if (line[i] == '#') 538 return 1; 539 if (!isspace(line[i]) && !iscntrl(line[i])) 540 return 0; 541 } 542 543 return 1; 544} 545 546/* 547 * This is our [ini] type file parser. 548 */ 549static int parse_jobs_ini(char *file, int stonewall_flag) 550{ 551 unsigned int global; 552 struct thread_data *td; 553 char *string, *name; 554 fpos_t off; 555 FILE *f; 556 char *p; 557 int ret = 0, stonewall; 558 int first_sect = 1; 559 560 f = fopen(file, "r"); 561 if (!f) { 562 perror("fopen job file"); 563 return 1; 564 } 565 566 string = malloc(4096); 567 name = malloc(256); 568 memset(name, 0, 256); 569 570 stonewall = stonewall_flag; 571 do { 572 p = fgets(string, 4095, f); 573 if (!p) 574 break; 575 576 strip_blank_front(&p); 577 strip_blank_end(p); 578 579 if (is_empty_or_comment(p)) 580 continue; 581 if (sscanf(p, "[%255s]", name) != 1) { 582 log_err("fio: option <%s> outside of job section\n", p); 583 continue; 584 } 585 586 global = !strncmp(name, "global", 6); 587 588 name[strlen(name) - 1] = '\0'; 589 590 if (dump_cmdline) { 591 if (first_sect) 592 log_info("fio "); 593 if (!global) 594 log_info("--name=%s ", name); 595 first_sect = 0; 596 } 597 598 td = get_new_job(global, &def_thread); 599 if (!td) { 600 ret = 1; 601 break; 602 } 603 604 /* 605 * Seperate multiple job files by a stonewall 606 */ 607 if (!global && stonewall) { 608 td->o.stonewall = stonewall; 609 stonewall = 0; 610 } 611 612 fgetpos(f, &off); 613 while ((p = fgets(string, 4096, f)) != NULL) { 614 if (is_empty_or_comment(p)) 615 continue; 616 617 strip_blank_front(&p); 618 619 if (p[0] == '[') 620 break; 621 622 strip_blank_end(p); 623 624 fgetpos(f, &off); 625 626 /* 627 * Don't break here, continue parsing options so we 628 * dump all the bad ones. Makes trial/error fixups 629 * easier on the user. 630 */ 631 ret |= fio_option_parse(td, p); 632 if (!ret && dump_cmdline) 633 log_info("--%s ", p); 634 } 635 636 if (!ret) { 637 fsetpos(f, &off); 638 ret = add_job(td, name, 0); 639 } else { 640 log_err("fio: job %s dropped\n", name); 641 put_job(td); 642 } 643 } while (!ret); 644 645 if (dump_cmdline) 646 log_info("\n"); 647 648 free(string); 649 free(name); 650 fclose(f); 651 return ret; 652} 653 654static int fill_def_thread(void) 655{ 656 memset(&def_thread, 0, sizeof(def_thread)); 657 658 if (fio_getaffinity(getpid(), &def_thread.o.cpumask) == -1) { 659 perror("sched_getaffinity"); 660 return 1; 661 } 662 663 /* 664 * fill default options 665 */ 666 fio_fill_default_options(&def_thread); 667 668 def_thread.o.timeout = def_timeout; 669 def_thread.o.write_bw_log = write_bw_log; 670 def_thread.o.write_lat_log = write_lat_log; 671 672 return 0; 673} 674 675static void free_shm(void) 676{ 677 struct shmid_ds sbuf; 678 679 if (threads) { 680 shmdt((void *) threads); 681 threads = NULL; 682 shmctl(shm_id, IPC_RMID, &sbuf); 683 } 684} 685 686/* 687 * The thread area is shared between the main process and the job 688 * threads/processes. So setup a shared memory segment that will hold 689 * all the job info. 690 */ 691static int setup_thread_area(void) 692{ 693 /* 694 * 1024 is too much on some machines, scale max_jobs if 695 * we get a failure that looks like too large a shm segment 696 */ 697 do { 698 size_t size = max_jobs * sizeof(struct thread_data); 699 700 shm_id = shmget(0, size, IPC_CREAT | 0600); 701 if (shm_id != -1) 702 break; 703 if (errno != EINVAL) { 704 perror("shmget"); 705 break; 706 } 707 708 max_jobs >>= 1; 709 } while (max_jobs); 710 711 if (shm_id == -1) 712 return 1; 713 714 threads = shmat(shm_id, NULL, 0); 715 if (threads == (void *) -1) { 716 perror("shmat"); 717 return 1; 718 } 719 720 atexit(free_shm); 721 return 0; 722} 723 724static void usage(void) 725{ 726 printf("%s\n", fio_version_string); 727 printf("\t--output\tWrite output to file\n"); 728 printf("\t--timeout\tRuntime in seconds\n"); 729 printf("\t--latency-log\tGenerate per-job latency logs\n"); 730 printf("\t--bandwidth-log\tGenerate per-job bandwidth logs\n"); 731 printf("\t--minimal\tMinimal (terse) output\n"); 732 printf("\t--version\tPrint version info and exit\n"); 733 printf("\t--help\t\tPrint this page\n"); 734 printf("\t--cmdhelp=cmd\tPrint command help, \"all\" for all of them\n"); 735 printf("\t--showcmd\tTurn a job file into command line options\n"); 736} 737 738static int parse_cmd_line(int argc, char *argv[]) 739{ 740 struct thread_data *td = NULL; 741 int c, ini_idx = 0, lidx, ret, dont_add_job = 0; 742 743 while ((c = getopt_long_only(argc, argv, "", long_options, &lidx)) != -1) { 744 switch (c) { 745 case 't': 746 def_timeout = atoi(optarg); 747 break; 748 case 'l': 749 write_lat_log = 1; 750 break; 751 case 'w': 752 write_bw_log = 1; 753 break; 754 case 'o': 755 f_out = fopen(optarg, "w+"); 756 if (!f_out) { 757 perror("fopen output"); 758 exit(1); 759 } 760 f_err = f_out; 761 break; 762 case 'm': 763 terse_output = 1; 764 break; 765 case 'h': 766 usage(); 767 exit(0); 768 case 'c': 769 exit(fio_show_option_help(optarg)); 770 case 's': 771 dump_cmdline = 1; 772 break; 773 case 'v': 774 printf("%s\n", fio_version_string); 775 exit(0); 776 case FIO_GETOPT_JOB: { 777 const char *opt = long_options[lidx].name; 778 char *val = optarg; 779 780 if (!strncmp(opt, "name", 4) && td) { 781 ret = add_job(td, td->o.name ?: "fio", 0); 782 if (ret) { 783 put_job(td); 784 return 0; 785 } 786 td = NULL; 787 } 788 if (!td) { 789 int global = 0; 790 791 if (strncmp(opt, "name", 4) || 792 !strncmp(val, "global", 6)) 793 global = 1; 794 795 td = get_new_job(global, &def_thread); 796 if (!td) 797 return 0; 798 } 799 800 ret = fio_cmd_option_parse(td, opt, val); 801 if (ret) 802 dont_add_job = 1; 803 break; 804 } 805 default: 806 break; 807 } 808 } 809 810 if (td) { 811 if (dont_add_job) 812 put_job(td); 813 else { 814 ret = add_job(td, td->o.name ?: "fio", 0); 815 if (ret) 816 put_job(td); 817 } 818 } 819 820 while (optind < argc) { 821 ini_idx++; 822 ini_file = realloc(ini_file, ini_idx * sizeof(char *)); 823 ini_file[ini_idx - 1] = strdup(argv[optind]); 824 optind++; 825 } 826 827 return ini_idx; 828} 829 830 831int parse_options(int argc, char *argv[]) 832{ 833 int job_files, i; 834 835 f_out = stdout; 836 f_err = stderr; 837 838 fio_options_dup_and_init(long_options); 839 840 if (setup_thread_area()) 841 return 1; 842 if (fill_def_thread()) 843 return 1; 844 845 job_files = parse_cmd_line(argc, argv); 846 847 for (i = 0; i < job_files; i++) { 848 if (fill_def_thread()) 849 return 1; 850 if (parse_jobs_ini(ini_file[i], i)) 851 return 1; 852 free(ini_file[i]); 853 } 854 855 free(ini_file); 856 options_mem_free(&def_thread); 857 858 if (!thread_number) { 859 if (dump_cmdline) 860 return 0; 861 862 log_err("No jobs defined(s)\n"); 863 return 1; 864 } 865 866 return 0; 867} 868