/* init.c revision e6203e9e73039537d41810e91e3dfe6abeb919d9 */
1/* 2 * This file contains job initialization and setup functions. 3 */ 4#include <stdio.h> 5#include <stdlib.h> 6#include <unistd.h> 7#include <fcntl.h> 8#include <ctype.h> 9#include <string.h> 10#include <errno.h> 11#include <getopt.h> 12#include <sys/ipc.h> 13#include <sys/shm.h> 14#include <sys/types.h> 15#include <sys/stat.h> 16 17#include "fio.h" 18#include "parse.h" 19 20static char fio_version_string[] = "fio 1.17.1"; 21 22#define FIO_RANDSEED (0xb1899bedUL) 23 24static char **ini_file; 25static int max_jobs = MAX_JOBS; 26static int dump_cmdline; 27 28struct thread_data def_thread; 29struct thread_data *threads = NULL; 30 31int exitall_on_terminate = 0; 32int terse_output = 0; 33unsigned long long mlock_size = 0; 34FILE *f_out = NULL; 35FILE *f_err = NULL; 36 37int write_bw_log = 0; 38 39static int def_timeout = 0; 40static int write_lat_log = 0; 41 42static int prev_group_jobs; 43 44/* 45 * Command line options. These will contain the above, plus a few 46 * extra that only pertain to fio itself and not jobs. 47 */ 48static struct option long_options[FIO_NR_OPTIONS] = { 49 { 50 .name = "output", 51 .has_arg = required_argument, 52 .val = 'o', 53 }, 54 { 55 .name = "timeout", 56 .has_arg = required_argument, 57 .val = 't', 58 }, 59 { 60 .name = "latency-log", 61 .has_arg = required_argument, 62 .val = 'l', 63 }, 64 { 65 .name = "bandwidth-log", 66 .has_arg = required_argument, 67 .val = 'b', 68 }, 69 { 70 .name = "minimal", 71 .has_arg = optional_argument, 72 .val = 'm', 73 }, 74 { 75 .name = "version", 76 .has_arg = no_argument, 77 .val = 'v', 78 }, 79 { 80 .name = "help", 81 .has_arg = no_argument, 82 .val = 'h', 83 }, 84 { 85 .name = "cmdhelp", 86 .has_arg = optional_argument, 87 .val = 'c', 88 }, 89 { 90 .name = "showcmd", 91 .has_arg = no_argument, 92 .val = 's' 93 }, 94 { 95 .name = NULL, 96 }, 97}; 98 99FILE *get_f_out() 100{ 101 return f_out; 102} 103 104FILE *get_f_err() 105{ 106 return f_err; 107} 108 109/* 110 * Return a free job structure. 
111 */ 112static struct thread_data *get_new_job(int global, struct thread_data *parent) 113{ 114 struct thread_data *td; 115 116 if (global) 117 return &def_thread; 118 if (thread_number >= max_jobs) 119 return NULL; 120 121 td = &threads[thread_number++]; 122 *td = *parent; 123 124 dup_files(td, parent); 125 options_mem_dupe(td); 126 127 td->thread_number = thread_number; 128 return td; 129} 130 131static void put_job(struct thread_data *td) 132{ 133 if (td == &def_thread) 134 return; 135 136 if (td->error) 137 log_info("fio: %s\n", td->verror); 138 139 memset(&threads[td->thread_number - 1], 0, sizeof(*td)); 140 thread_number--; 141} 142 143static int setup_rate(struct thread_data *td) 144{ 145 unsigned long nr_reads_per_msec; 146 unsigned long long rate; 147 unsigned int bs; 148 149 if (!td->o.rate && !td->o.rate_iops) 150 return 0; 151 152 if (td_rw(td)) 153 bs = td->o.rw_min_bs; 154 else if (td_read(td)) 155 bs = td->o.min_bs[DDIR_READ]; 156 else 157 bs = td->o.min_bs[DDIR_WRITE]; 158 159 if (td->o.rate) { 160 rate = td->o.rate; 161 nr_reads_per_msec = (rate * 1024 * 1000LL) / bs; 162 } else 163 nr_reads_per_msec = td->o.rate_iops * 1000UL; 164 165 if (!nr_reads_per_msec) { 166 log_err("rate lower than supported\n"); 167 return -1; 168 } 169 170 td->rate_usec_cycle = 1000000000ULL / nr_reads_per_msec; 171 td->rate_pending_usleep = 0; 172 return 0; 173} 174 175/* 176 * Lazy way of fixing up options that depend on each other. We could also 177 * define option callback handlers, but this is easier. 
178 */ 179static int fixup_options(struct thread_data *td) 180{ 181 struct thread_options *o = &td->o; 182 183 if (o->rwmix[DDIR_READ] + o->rwmix[DDIR_WRITE] > 100) 184 o->rwmix[DDIR_WRITE] = 100 - o->rwmix[DDIR_READ]; 185 186 if (o->write_iolog_file && o->read_iolog_file) { 187 log_err("fio: read iolog overrides write_iolog\n"); 188 free(o->write_iolog_file); 189 o->write_iolog_file = NULL; 190 } 191 192 if (td->io_ops->flags & FIO_SYNCIO) 193 o->iodepth = 1; 194 else { 195 if (!o->iodepth) 196 o->iodepth = o->open_files; 197 } 198 199 /* 200 * only really works for sequential io for now, and with 1 file 201 */ 202 if (o->zone_size && td_random(td) && o->open_files == 1) 203 o->zone_size = 0; 204 205 /* 206 * Reads can do overwrites, we always need to pre-create the file 207 */ 208 if (td_read(td) || td_rw(td)) 209 o->overwrite = 1; 210 211 if (!o->min_bs[DDIR_READ]) 212 o->min_bs[DDIR_READ]= o->bs[DDIR_READ]; 213 if (!o->max_bs[DDIR_READ]) 214 o->max_bs[DDIR_READ] = o->bs[DDIR_READ]; 215 if (!o->min_bs[DDIR_WRITE]) 216 o->min_bs[DDIR_WRITE]= o->bs[DDIR_WRITE]; 217 if (!o->max_bs[DDIR_WRITE]) 218 o->max_bs[DDIR_WRITE] = o->bs[DDIR_WRITE]; 219 220 o->rw_min_bs = min(o->min_bs[DDIR_READ], o->min_bs[DDIR_WRITE]); 221 222 if (!o->file_size_high) 223 o->file_size_high = o->file_size_low; 224 225 if (o->norandommap && o->verify != VERIFY_NONE) { 226 log_err("fio: norandommap given, verify disabled\n"); 227 o->verify = VERIFY_NONE; 228 } 229 if (o->bs_unaligned && (o->odirect || td->io_ops->flags & FIO_RAWIO)) 230 log_err("fio: bs_unaligned may not work with raw io\n"); 231 232 /* 233 * thinktime_spin must be less than thinktime 234 */ 235 if (o->thinktime_spin > o->thinktime) 236 o->thinktime_spin = o->thinktime; 237 238 /* 239 * The low water mark cannot be bigger than the iodepth 240 */ 241 if (o->iodepth_low > o->iodepth || !o->iodepth_low) { 242 /* 243 * syslet work around - if the workload is sequential, 244 * we want to let the queue drain all the way down to 245 
* avoid seeking between async threads 246 */ 247 if (!strcmp(td->io_ops->name, "syslet-rw") && !td_random(td)) 248 o->iodepth_low = 1; 249 else 250 o->iodepth_low = o->iodepth; 251 } 252 253 /* 254 * If batch number isn't set, default to the same as iodepth 255 */ 256 if (o->iodepth_batch > o->iodepth || !o->iodepth_batch) 257 o->iodepth_batch = o->iodepth; 258 259 if (o->nr_files > td->files_index) 260 o->nr_files = td->files_index; 261 262 if (o->open_files > o->nr_files || !o->open_files) 263 o->open_files = o->nr_files; 264 265 if ((o->rate && o->rate_iops) || (o->ratemin && o->rate_iops_min)) { 266 log_err("fio: rate and rate_iops are mutually exclusive\n"); 267 return 1; 268 } 269 if ((o->rate < o->ratemin) || (o->rate_iops < o->rate_iops_min)) { 270 log_err("fio: minimum rate exceeds rate\n"); 271 return 1; 272 } 273 274 if (!o->timeout && o->time_based) { 275 log_err("fio: time_based requires a runtime/timeout setting\n"); 276 o->time_based = 0; 277 } 278 279 return 0; 280} 281 282/* 283 * This function leaks the buffer 284 */ 285static char *to_kmg(unsigned int val) 286{ 287 char *buf = malloc(32); 288 char post[] = { 0, 'K', 'M', 'G', 'P', 'E', 0 }; 289 char *p = post; 290 291 do { 292 if (val & 1023) 293 break; 294 295 val >>= 10; 296 p++; 297 } while (*p); 298 299 snprintf(buf, 31, "%u%c", val, *p); 300 return buf; 301} 302 303/* External engines are specified by "external:name.o") */ 304static const char *get_engine_name(const char *str) 305{ 306 char *p = strstr(str, ":"); 307 308 if (!p) 309 return str; 310 311 p++; 312 strip_blank_front(&p); 313 strip_blank_end(p); 314 return p; 315} 316 317static int exists_and_not_file(const char *filename) 318{ 319 struct stat sb; 320 321 if (lstat(filename, &sb) == -1) 322 return 0; 323 324 if (S_ISREG(sb.st_mode)) 325 return 0; 326 327 return 1; 328} 329 330/* 331 * Initialize the various random states we need (random io, block size ranges, 332 * read/write mix, etc). 
333 */ 334static int init_random_state(struct thread_data *td) 335{ 336 unsigned long seeds[6]; 337 int fd; 338 339 fd = open("/dev/urandom", O_RDONLY); 340 if (fd == -1) { 341 td_verror(td, errno, "open"); 342 return 1; 343 } 344 345 if (read(fd, seeds, sizeof(seeds)) < (int) sizeof(seeds)) { 346 td_verror(td, EIO, "read"); 347 close(fd); 348 return 1; 349 } 350 351 close(fd); 352 353 os_random_seed(seeds[0], &td->bsrange_state); 354 os_random_seed(seeds[1], &td->verify_state); 355 os_random_seed(seeds[2], &td->rwmix_state); 356 357 if (td->o.file_service_type == FIO_FSERVICE_RANDOM) 358 os_random_seed(seeds[3], &td->next_file_state); 359 360 os_random_seed(seeds[5], &td->file_size_state); 361 362 if (!td_random(td)) 363 return 0; 364 365 if (td->o.rand_repeatable) 366 seeds[4] = FIO_RANDSEED * td->thread_number; 367 368 os_random_seed(seeds[4], &td->random_state); 369 return 0; 370} 371 372/* 373 * Adds a job to the list of things todo. Sanitizes the various options 374 * to make sure we don't have conflicts, and initializes various 375 * members of td. 
376 */ 377static int add_job(struct thread_data *td, const char *jobname, int job_add_num) 378{ 379 const char *ddir_str[] = { NULL, "read", "write", "rw", NULL, 380 "randread", "randwrite", "randrw" }; 381 unsigned int i; 382 const char *engine; 383 char fname[PATH_MAX]; 384 int numjobs, file_alloced; 385 386 /* 387 * the def_thread is just for options, it's not a real job 388 */ 389 if (td == &def_thread) 390 return 0; 391 392 /* 393 * if we are just dumping the output command line, don't add the job 394 */ 395 if (dump_cmdline) { 396 put_job(td); 397 return 0; 398 } 399 400 engine = get_engine_name(td->o.ioengine); 401 td->io_ops = load_ioengine(td, engine); 402 if (!td->io_ops) { 403 log_err("fio: failed to load engine %s\n", engine); 404 goto err; 405 } 406 407 if (td->o.use_thread) 408 nr_thread++; 409 else 410 nr_process++; 411 412 if (td->o.odirect) 413 td->io_ops->flags |= FIO_RAWIO; 414 415 file_alloced = 0; 416 if (!td->o.filename && !td->files_index) { 417 file_alloced = 1; 418 419 if (td->o.nr_files == 1 && exists_and_not_file(jobname)) 420 add_file(td, jobname); 421 else { 422 for (i = 0; i < td->o.nr_files; i++) { 423 sprintf(fname, "%s.%d.%d", jobname, td->thread_number, i); 424 add_file(td, fname); 425 } 426 } 427 } 428 429 if (fixup_options(td)) 430 goto err; 431 432 if (td->io_ops->flags & FIO_DISKLESSIO) { 433 struct fio_file *f; 434 435 for_each_file(td, f, i) 436 f->real_file_size = -1ULL; 437 } 438 439 td->mutex = fio_sem_init(0); 440 441 td->ts.clat_stat[0].min_val = td->ts.clat_stat[1].min_val = ULONG_MAX; 442 td->ts.slat_stat[0].min_val = td->ts.slat_stat[1].min_val = ULONG_MAX; 443 td->ts.bw_stat[0].min_val = td->ts.bw_stat[1].min_val = ULONG_MAX; 444 td->ddir_nr = td->o.ddir_nr; 445 446 if ((td->o.stonewall || td->o.numjobs > 1 || td->o.new_group) 447 && prev_group_jobs) { 448 prev_group_jobs = 0; 449 groupid++; 450 } 451 452 td->groupid = groupid; 453 prev_group_jobs++; 454 455 if (init_random_state(td)) 456 goto err; 457 458 if 
(setup_rate(td)) 459 goto err; 460 461 if (td->o.write_lat_log) { 462 setup_log(&td->ts.slat_log); 463 setup_log(&td->ts.clat_log); 464 } 465 if (td->o.write_bw_log) 466 setup_log(&td->ts.bw_log); 467 468 if (!td->o.name) 469 td->o.name = strdup(jobname); 470 471 if (!terse_output) { 472 if (!job_add_num) { 473 if (!strcmp(td->io_ops->name, "cpuio")) 474 log_info("%s: ioengine=cpu, cpuload=%u, cpucycle=%u\n", td->o.name, td->o.cpuload, td->o.cpucycle); 475 else { 476 char *c1, *c2, *c3, *c4; 477 478 c1 = to_kmg(td->o.min_bs[DDIR_READ]); 479 c2 = to_kmg(td->o.max_bs[DDIR_READ]); 480 c3 = to_kmg(td->o.min_bs[DDIR_WRITE]); 481 c4 = to_kmg(td->o.max_bs[DDIR_WRITE]); 482 483 log_info("%s: (g=%d): rw=%s, bs=%s-%s/%s-%s, ioengine=%s, iodepth=%u\n", td->o.name, td->groupid, ddir_str[td->o.td_ddir], c1, c2, c3, c4, td->io_ops->name, td->o.iodepth); 484 485 free(c1); 486 free(c2); 487 free(c3); 488 free(c4); 489 } 490 } else if (job_add_num == 1) 491 log_info("...\n"); 492 } 493 494 /* 495 * recurse add identical jobs, clear numjobs and stonewall options 496 * as they don't apply to sub-jobs 497 */ 498 numjobs = td->o.numjobs; 499 while (--numjobs) { 500 struct thread_data *td_new = get_new_job(0, td); 501 502 if (!td_new) 503 goto err; 504 505 td_new->o.numjobs = 1; 506 td_new->o.stonewall = 0; 507 td_new->o.new_group = 0; 508 509 if (file_alloced) { 510 td_new->o.filename = NULL; 511 td_new->files_index = 0; 512 td_new->files = NULL; 513 } 514 515 job_add_num = numjobs - 1; 516 517 if (add_job(td_new, jobname, job_add_num)) 518 goto err; 519 } 520 521 return 0; 522err: 523 put_job(td); 524 return -1; 525} 526 527static int is_empty_or_comment(char *line) 528{ 529 unsigned int i; 530 531 for (i = 0; i < strlen(line); i++) { 532 if (line[i] == ';') 533 return 1; 534 if (line[i] == '#') 535 return 1; 536 if (!isspace(line[i]) && !iscntrl(line[i])) 537 return 0; 538 } 539 540 return 1; 541} 542 543/* 544 * This is our [ini] type file parser. 
545 */ 546static int parse_jobs_ini(char *file, int stonewall_flag) 547{ 548 unsigned int global; 549 struct thread_data *td; 550 char *string, *name; 551 fpos_t off; 552 FILE *f; 553 char *p; 554 int ret = 0, stonewall; 555 int first_sect = 1; 556 557 f = fopen(file, "r"); 558 if (!f) { 559 perror("fopen job file"); 560 return 1; 561 } 562 563 string = malloc(4096); 564 565 /* 566 * it's really 256 + small bit, 280 should suffice 567 */ 568 name = malloc(280); 569 memset(name, 0, 280); 570 571 stonewall = stonewall_flag; 572 do { 573 p = fgets(string, 4095, f); 574 if (!p) 575 break; 576 577 strip_blank_front(&p); 578 strip_blank_end(p); 579 580 if (is_empty_or_comment(p)) 581 continue; 582 if (sscanf(p, "[%255s]", name) != 1) { 583 log_err("fio: option <%s> outside of [] job section\n", p); 584 break; 585 } 586 587 global = !strncmp(name, "global", 6); 588 589 name[strlen(name) - 1] = '\0'; 590 591 if (dump_cmdline) { 592 if (first_sect) 593 log_info("fio "); 594 if (!global) 595 log_info("--name=%s ", name); 596 first_sect = 0; 597 } 598 599 td = get_new_job(global, &def_thread); 600 if (!td) { 601 ret = 1; 602 break; 603 } 604 605 /* 606 * Seperate multiple job files by a stonewall 607 */ 608 if (!global && stonewall) { 609 td->o.stonewall = stonewall; 610 stonewall = 0; 611 } 612 613 fgetpos(f, &off); 614 while ((p = fgets(string, 4096, f)) != NULL) { 615 if (is_empty_or_comment(p)) 616 continue; 617 618 strip_blank_front(&p); 619 620 if (p[0] == '[') 621 break; 622 623 strip_blank_end(p); 624 625 fgetpos(f, &off); 626 627 /* 628 * Don't break here, continue parsing options so we 629 * dump all the bad ones. Makes trial/error fixups 630 * easier on the user. 
631 */ 632 ret |= fio_option_parse(td, p); 633 if (!ret && dump_cmdline) 634 log_info("--%s ", p); 635 } 636 637 if (!ret) { 638 fsetpos(f, &off); 639 ret = add_job(td, name, 0); 640 } else { 641 log_err("fio: job %s dropped\n", name); 642 put_job(td); 643 } 644 } while (!ret); 645 646 if (dump_cmdline) 647 log_info("\n"); 648 649 free(string); 650 free(name); 651 fclose(f); 652 return ret; 653} 654 655static int fill_def_thread(void) 656{ 657 memset(&def_thread, 0, sizeof(def_thread)); 658 659 fio_getaffinity(getpid(), &def_thread.o.cpumask); 660 661 /* 662 * fill default options 663 */ 664 fio_fill_default_options(&def_thread); 665 666 def_thread.o.timeout = def_timeout; 667 def_thread.o.write_bw_log = write_bw_log; 668 def_thread.o.write_lat_log = write_lat_log; 669 670 return 0; 671} 672 673static void free_shm(void) 674{ 675 struct shmid_ds sbuf; 676 677 if (threads) { 678 shmdt((void *) threads); 679 threads = NULL; 680 shmctl(shm_id, IPC_RMID, &sbuf); 681 } 682} 683 684/* 685 * The thread area is shared between the main process and the job 686 * threads/processes. So setup a shared memory segment that will hold 687 * all the job info. 
688 */ 689static int setup_thread_area(void) 690{ 691 /* 692 * 1024 is too much on some machines, scale max_jobs if 693 * we get a failure that looks like too large a shm segment 694 */ 695 do { 696 size_t size = max_jobs * sizeof(struct thread_data); 697 698 shm_id = shmget(0, size, IPC_CREAT | 0600); 699 if (shm_id != -1) 700 break; 701 if (errno != EINVAL) { 702 perror("shmget"); 703 break; 704 } 705 706 max_jobs >>= 1; 707 } while (max_jobs); 708 709 if (shm_id == -1) 710 return 1; 711 712 threads = shmat(shm_id, NULL, 0); 713 if (threads == (void *) -1) { 714 perror("shmat"); 715 return 1; 716 } 717 718 atexit(free_shm); 719 return 0; 720} 721 722static void usage(void) 723{ 724 printf("%s\n", fio_version_string); 725 printf("\t--output\tWrite output to file\n"); 726 printf("\t--timeout\tRuntime in seconds\n"); 727 printf("\t--latency-log\tGenerate per-job latency logs\n"); 728 printf("\t--bandwidth-log\tGenerate per-job bandwidth logs\n"); 729 printf("\t--minimal\tMinimal (terse) output\n"); 730 printf("\t--version\tPrint version info and exit\n"); 731 printf("\t--help\t\tPrint this page\n"); 732 printf("\t--cmdhelp=cmd\tPrint command help, \"all\" for all of them\n"); 733 printf("\t--showcmd\tTurn a job file into command line options\n"); 734} 735 736static int parse_cmd_line(int argc, char *argv[]) 737{ 738 struct thread_data *td = NULL; 739 int c, ini_idx = 0, lidx, ret, dont_add_job = 0; 740 741 while ((c = getopt_long_only(argc, argv, "", long_options, &lidx)) != -1) { 742 switch (c) { 743 case 't': 744 def_timeout = atoi(optarg); 745 break; 746 case 'l': 747 write_lat_log = 1; 748 break; 749 case 'w': 750 write_bw_log = 1; 751 break; 752 case 'o': 753 f_out = fopen(optarg, "w+"); 754 if (!f_out) { 755 perror("fopen output"); 756 exit(1); 757 } 758 f_err = f_out; 759 break; 760 case 'm': 761 terse_output = 1; 762 break; 763 case 'h': 764 usage(); 765 exit(0); 766 case 'c': 767 exit(fio_show_option_help(optarg)); 768 case 's': 769 dump_cmdline = 1; 770 
break; 771 case 'v': 772 printf("%s\n", fio_version_string); 773 exit(0); 774 case FIO_GETOPT_JOB: { 775 const char *opt = long_options[lidx].name; 776 char *val = optarg; 777 778 if (!strncmp(opt, "name", 4) && td) { 779 ret = add_job(td, td->o.name ?: "fio", 0); 780 if (ret) { 781 put_job(td); 782 return 0; 783 } 784 td = NULL; 785 } 786 if (!td) { 787 int global = 0; 788 789 if (strncmp(opt, "name", 4) || 790 !strncmp(val, "global", 6)) 791 global = 1; 792 793 td = get_new_job(global, &def_thread); 794 if (!td) 795 return 0; 796 } 797 798 ret = fio_cmd_option_parse(td, opt, val); 799 if (ret) 800 dont_add_job = 1; 801 break; 802 } 803 default: 804 break; 805 } 806 } 807 808 if (td) { 809 if (dont_add_job) 810 put_job(td); 811 else { 812 ret = add_job(td, td->o.name ?: "fio", 0); 813 if (ret) 814 put_job(td); 815 } 816 } 817 818 while (optind < argc) { 819 ini_idx++; 820 ini_file = realloc(ini_file, ini_idx * sizeof(char *)); 821 ini_file[ini_idx - 1] = strdup(argv[optind]); 822 optind++; 823 } 824 825 return ini_idx; 826} 827 828 829int parse_options(int argc, char *argv[]) 830{ 831 int job_files, i; 832 833 f_out = stdout; 834 f_err = stderr; 835 836 fio_options_dup_and_init(long_options); 837 838 if (setup_thread_area()) 839 return 1; 840 if (fill_def_thread()) 841 return 1; 842 843 job_files = parse_cmd_line(argc, argv); 844 845 for (i = 0; i < job_files; i++) { 846 if (fill_def_thread()) 847 return 1; 848 if (parse_jobs_ini(ini_file[i], i)) 849 return 1; 850 free(ini_file[i]); 851 } 852 853 free(ini_file); 854 options_mem_free(&def_thread); 855 856 if (!thread_number) { 857 if (dump_cmdline) 858 return 0; 859 860 log_err("No jobs defined(s)\n"); 861 return 1; 862 } 863 864 return 0; 865} 866