toolchain-utils/crosperf/results_organizer.py

# Copyright (c) 2013 The Chromium OS Authors. All rights reserved.
# Use of this source code is governed by a BSD-style license that can be
# found in the LICENSE file.
"""Parse data from benchmark_runs for tabulator."""
89d263c7cf9773129cbe8e8858ad21ea539a2ba0Luis Lozano
from __future__ import print_function

import errno
import json
import os
import re
import sys

from cros_utils import misc
44a44befd1f500b9a227ebfd849702efce83ef6acmtice
# File name of the JSON summary that _ReadSummaryFile loads.
_TELEMETRY_RESULT_DEFAULTS_FILE = 'default-telemetry-results.json'
# Matches result keys that start with `name{i}`; group 1 is the base name and
# group 2 is the decimal duplicate index i.
_DUP_KEY_REGEX = re.compile(r'(\w+)\{(\d+)\}')
f2a3ef46f75d2196a93d3ed27f4d1fcf22b54fbeLuis Lozano
f395c26437cbdabc2960447fba89b226f4409e82Ahmad Sharif
def _AdjustIteration(benchmarks, max_dup, bench):
  """Adjust the iteration numbers if they have keys like ABCD{i}.

  Args:
    benchmarks: iterable of benchmark objects exposing `name`,
      `iteration_adjusted` and `iterations` attributes; matching entries are
      modified in place.
    max_dup: largest duplicate index i seen among the benchmark's result keys.
    bench: name of the benchmark whose iteration count should be scaled.
  """
  for benchmark in benchmarks:
    if benchmark.name != bench or benchmark.iteration_adjusted:
      continue
    # Flag the benchmark so a later call never multiplies its count again.
    benchmark.iteration_adjusted = True
    # Every original iteration becomes itself plus max_dup split-out runs.
    benchmark.iterations *= (max_dup + 1)
afb8cc77e82c35faedfe541d097fc01fd1d7ca3dGeorge Burgess IV
afb8cc77e82c35faedfe541d097fc01fd1d7ca3dGeorge Burgess IV
def _GetMaxDup(data):
  """Find the maximum i inside ABCD{i}.

  Args:
    data: a [[[Key]]] -- a list of labels, each a list of runs, each an
      iterable of string keys (e.g. a dict keyed by result name). A key may
      look like ABCD{i}.

  Returns:
    The largest integer i found in any key matching _DUP_KEY_REGEX, or 0 when
    no key matches.
  """
  max_dup = 0
  for label in data:
    for run in label:
      for key in run:
        match = _DUP_KEY_REGEX.match(key)
        if match:
          # Group 2 is the numeric index between the braces.
          max_dup = max(max_dup, int(match.group(2)))
  return max_dup
afb8cc77e82c35faedfe541d097fc01fd1d7ca3dGeorge Burgess IV
afb8cc77e82c35faedfe541d097fc01fd1d7ca3dGeorge Burgess IV
def _Repeat(func, times):
  """Returns a list holding the results of calling func() `times` times.

  func is invoked afresh for every element, so _Repeat(dict, n) yields n
  distinct dicts rather than n references to the same one.
  """
  # `range` behaves the same as `xrange` here and exists on Python 2 and 3.
  return [func() for _ in range(times)]
afb8cc77e82c35faedfe541d097fc01fd1d7ca3dGeorge Burgess IV
afb8cc77e82c35faedfe541d097fc01fd1d7ca3dGeorge Burgess IV
def _GetNonDupLabel(max_dup, runs):
  """Create new list for the runs of the same label.

  Specifically, this will split out keys like foo{1}, foo{2} from one run into
  their own runs. Keys without a {i} suffix stay in the original run with
  their value untouched; a key `name{i}` is stored as `name` in the i-th extra
  run, with its value converted via str(). For example, with max_dup == 2 and
  a run like:
    {"foo": 1, "bar{1}": 2, "baz": 3, "qux{2}": 4, "pirate{1}": 5}

  You'll get:
    [{"foo": 1, "baz": 3}, {"bar": "2", "pirate": "5"}, {"qux": "4"}]

  NOTE(review): the index is used 1-based (`i - 1`), so a key `name{0}` lands
  in the *last* extra run through negative indexing. Confirm that `{0}` keys
  never occur in practice.

  Args:
    max_dup: number of extra runs to create per input run.
    runs: list of {key: value} dicts belonging to one label.

  Returns:
    The lists of transformed runs, all concatenated together: for each input
    run, its non-duplicate dict followed by its max_dup extra dicts.
  """
  new_runs = []
  for run in runs:
    new_run = {}
    added_runs = _Repeat(dict, max_dup)
    # `items()` works on Python 2 and 3 alike.
    for key, value in run.items():
      match = _DUP_KEY_REGEX.match(key)
      if not match:
        new_run[key] = value
      else:
        new_key, index_str = match.groups()
        added_runs[int(index_str) - 1][new_key] = str(value)
    new_runs.append(new_run)
    new_runs += added_runs
  return new_runs
afb8cc77e82c35faedfe541d097fc01fd1d7ca3dGeorge Burgess IV
afb8cc77e82c35faedfe541d097fc01fd1d7ca3dGeorge Burgess IV
def _DuplicatePass(result, benchmarks):
  """Properly expands keys like `foo{1}` in `result`.

  Args:
    result: dict of {benchmark_name: [[{key: val}]]}; the per-label run lists
      are replaced in place with their expanded versions.
    benchmarks: benchmark objects whose iteration counts are scaled to match
      the expansion (see _AdjustIteration).
  """
  # Only list elements are reassigned below; the dict's key set is untouched,
  # so iterating over items() while updating is safe.
  for bench, data in result.items():
    max_dup = _GetMaxDup(data)
    # If there's nothing to expand, there's nothing to do.
    if not max_dup:
      continue
    for i, runs in enumerate(data):
      data[i] = _GetNonDupLabel(max_dup, runs)
    _AdjustIteration(benchmarks, max_dup, bench)
afb8cc77e82c35faedfe541d097fc01fd1d7ca3dGeorge Burgess IV
afb8cc77e82c35faedfe541d097fc01fd1d7ca3dGeorge Burgess IV
def _ReadSummaryFile(filename):
  """Reads the summary file that belongs with `filename`.

  `filename` itself is not opened. _TELEMETRY_RESULT_DEFAULTS_FILE is joined
  onto the first element returned by misc.GetRoot(filename) (presumably the
  directory containing `filename` -- confirm against cros_utils.misc).

  Args:
    filename: path handed to misc.GetRoot to locate the summary's directory.

  Returns:
    The parsed JSON content, or an empty dict if the summary file does not
    exist.

  Raises:
    IOError: if opening the file fails for any reason other than ENOENT.
    ValueError: if json.load rejects the file's content.
  """
  dirname, _ = misc.GetRoot(filename)
  fullname = os.path.join(dirname, _TELEMETRY_RESULT_DEFAULTS_FILE)
  try:
    # Slurp the summary file into a dictionary. The keys in the dictionary are
    # the benchmark names. The value for a key is a list containing the names
    # of all the result fields that should be returned in a 'default' report.
    with open(fullname) as in_file:
      return json.load(in_file)
  except IOError as e:
    # ENOENT means "no such file or directory"; a missing summary is not an
    # error, it simply means there are no defaults.
    if e.errno == errno.ENOENT:
      return {}
    raise
afb8cc77e82c35faedfe541d097fc01fd1d7ca3dGeorge Burgess IV
afb8cc77e82c35faedfe541d097fc01fd1d7ca3dGeorge Burgess IV
def _MakeOrganizeResultOutline(benchmark_runs, labels):
  """Creates the "outline" of the OrganizeResults result for a set of runs.

  Report generation returns lists of different sizes, depending on the input
  data. Depending on the order in which we iterate through said input data, we
  may populate the Nth index of a list, then the N-1st, then the N+Mth, ...

  It's cleaner to figure out the "skeleton"/"outline" ahead of time, so we don't
  have to worry about resizing while computing results.

  Args:
    benchmark_runs: iterable of runs exposing `benchmark.name` and `iteration`.
    labels: sized collection of labels; only its length is used here.

  Returns:
    A dict {benchmark_name: [[{}]]} with one inner list per label, each holding
    one distinct empty dict per iteration of that benchmark.
  """
  # Find the highest iteration number seen for each benchmark.
  # We can't simply count up, since we may be given an incomplete set of
  # iterations (e.g. [r.iteration for r in benchmark_runs] == [1, 3])
  iteration_count = {}
  for run in benchmark_runs:
    name = run.benchmark.name
    # N.B. run.iteration starts at 1, not 0.
    iteration_count[name] = max(iteration_count.get(name, -1), run.iteration)

  # Result structure: {benchmark_name: [[{key: val}]]}
  # Built once per benchmark; every slot gets its own fresh dict.
  num_labels = len(labels)
  return {
      name: [[{} for _ in range(num_iterations)] for _ in range(num_labels)]
      for name, num_iterations in iteration_count.items()
  }
afb8cc77e82c35faedfe541d097fc01fd1d7ca3dGeorge Burgess IV
def OrganizeResults(benchmark_runs, labels, benchmarks=None, json_report=False):
  """Create a dict from benchmark_runs.

  The structure of the output dict is as follows:
  {"benchmark_1":[
    [{"key1":"v1", "key2":"v2"},{"key1":"v1", "key2":"v2"}]
    #one label
    []
    #the other label
    ]
   "benchmark_2":
    [
    ]}.

  Args:
    benchmark_runs: runs exposing `benchmark`, `label`, `iteration`, `result`
      (with a `keyvals` mapping) and `machine`. Runs whose `result` is falsy
      are skipped.
    labels: labels exposing `name`; their order fixes the label index in the
      output lists.
    benchmarks: optional benchmark objects whose iteration counts are adjusted
      when duplicate keys (foo{i}) are expanded. Defaults to no benchmarks.
    json_report: when true, every key is kept and machine details are added to
      each run's dict.

  Returns:
    A dict {benchmark_name: [[{key: val}]]} as sketched above.
  """
  result = _MakeOrganizeResultOutline(benchmark_runs, labels)
  label_indices = {label.name: i for i, label in enumerate(labels)}
  summary_file = _ReadSummaryFile(sys.argv[0])
  if benchmarks is None:
    benchmarks = []

  for benchmark_run in benchmark_runs:
    if not benchmark_run.result:
      continue
    benchmark = benchmark_run.benchmark
    label_index = label_indices[benchmark_run.label.name]
    cur_label_list = result[benchmark.name][label_index]
    cur_dict = cur_label_list[benchmark_run.iteration - 1]
    keyvals = benchmark_run.result.keyvals

    show_all_results = json_report or benchmark.show_all_results
    summary_list = None
    if not show_all_results:
      summary_list = summary_file.get(benchmark.test_name)
      if summary_list:
        # Extend a copy: appending to the list stored in summary_file would
        # add another 'retval' on every run of the same test.
        summary_list = summary_list + ['retval']
      else:
        # Did not find test_name in json file; show everything.
        show_all_results = True
    for test_key in keyvals:
      if show_all_results or test_key in summary_list:
        cur_dict[test_key] = keyvals[test_key]
    # Occasionally Telemetry tests will not fail but they will not return a
    # result, either.  Look for those cases, and force them to be a fail.
    # (This can happen if, for example, the test has been disabled.)
    # .get() keeps this from raising when the single stored key is not
    # 'retval'.
    if len(cur_dict) == 1 and cur_dict.get('retval') == 0:
      cur_dict['retval'] = 1
      # TODO: This output should be sent via logger.
      print("WARNING: Test '%s' appears to have succeeded but returned"
            ' no results.' % benchmark.name,
            file=sys.stderr)
    if json_report and benchmark_run.machine:
      cur_dict['machine'] = benchmark_run.machine.name
      cur_dict['machine_checksum'] = benchmark_run.machine.checksum
      cur_dict['machine_string'] = benchmark_run.machine.checksum_string
  _DuplicatePass(result, benchmarks)
  return result