#!/usr/bin/python3
#
# Copyright 2018, The Android Open Source Project
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

"""MLTS benchmark result generator.

Reads a CSV produced by the MLTS benchmark and generates
an HTML page with a results summary.

Usage:
  generate_result [csv input file] [html output file]
"""

import argparse
import collections
import csv
import math
import os
import re

class ScoreException(Exception):
  """Generator base exception type."""
  pass

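# A LatencyResult's `time_freq_sec` field is a latency histogram: bucket i
# counts the iterations whose latency fell within
#   [time_freq_start_sec + i * time_freq_step_sec,
#    time_freq_start_sec + (i + 1) * time_freq_step_sec)
# (this is the layout assumed by get_frequency_graph() below).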
LatencyResult = collections.namedtuple(
    'LatencyResult',
    ['iterations', 'total_time_sec', 'time_freq_start_sec',
     'time_freq_step_sec', 'time_freq_sec'])

COMPILATION_TYPES = ['compile_without_cache', 'save_to_cache',
                     'prepare_from_cache']
BASELINE_COMPILATION_TYPE = COMPILATION_TYPES[0]
CompilationResult = collections.namedtuple(
    'CompilationResult',
    ['cache_size_bytes'] + COMPILATION_TYPES)

BenchmarkResult = collections.namedtuple(
    'BenchmarkResult',
    ['name', 'backend_type', 'inference_latency', 'max_single_error',
     'testset_size', 'evaluator_keys', 'evaluator_values',
     'validation_errors', 'compilation_results'])

ResultsWithBaseline = collections.namedtuple(
    'ResultsWithBaseline',
    ['baseline', 'other'])

BASELINE_BACKEND = 'TFLite_CPU'
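# Entries are tried in order and the first regex that matches a model name
# wins (see group_results() below), so the more specific quantized patterns
# must precede their float counterparts.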
KNOWN_GROUPS = [
    (re.compile('mobilenet_v1.*quant.*'), 'MobileNet v1 Quantized'),
    (re.compile('mobilenet_v1.*'), 'MobileNet v1 Float'),
    (re.compile('mobilenet_v2.*quant.*'), 'MobileNet v2 Quantized'),
    (re.compile('mobilenet_v2.*'), 'MobileNet v2 Float'),
    (re.compile('mobilenet_v3.*uint8.*'), 'MobileNet v3 Quantized'),
    (re.compile('mobilenet_v3.*'), 'MobileNet v3 Float'),
    (re.compile('tts.*'), 'LSTM Text-to-speech'),
    (re.compile('asr.*'), 'LSTM Automatic Speech Recognition'),
]

class BenchmarkResultParser:
  """A helper class to parse the input CSV file."""

  def __init__(self, csvfile):
    # The filter skips comment lines; `line` is a raw text line here, so
    # line[0] is its first character.
    self.csv_reader = csv.reader(filter(lambda line: line[0] != '#', csvfile))
    self.row = None
    self.index = 0

  def next(self):
    """Advance to the next row; return it, or None at the end of the file."""
    try:
      self.row = next(self.csv_reader)
    except StopIteration:
      self.row = None
    finally:
      self.index = 0
    return self.row

  def read_boolean(self):
    """Read the next CSV cell as a boolean."""
    s = self.read_typed(str).lower()
    if s == 'true':
      return True
    elif s == 'false':
      return False
    else:
      raise ValueError('Cannot convert \'%s\' to a boolean' % s)

  def read_typed(self, Type):
    """Read the next CSV cell as the given type."""
    if Type is bool:
      return self.read_boolean()
    entry = self.row[self.index]
    self.index += 1
    return Type(entry)

  def read_typed_array(self, Type, length):
    """Read the next CSV cells as a typed array."""
    return [self.read_typed(Type) for _ in range(length)]

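  # CSV layout of a LatencyResult: iterations, total_time_sec,
  # time_freq_start_sec, time_freq_step_sec, N, then N histogram buckets.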
  def read_latency_result(self):
    """Read the next CSV cells as a LatencyResult."""
    result = {}
    result['iterations'] = self.read_typed(int)
    result['total_time_sec'] = self.read_typed(float)
    result['time_freq_start_sec'] = self.read_typed(float)
    result['time_freq_step_sec'] = self.read_typed(float)
    time_freq_sec_count = self.read_typed(int)
    result['time_freq_sec'] = self.read_typed_array(float, time_freq_sec_count)
    return LatencyResult(**result)

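  # CSV layout of a CompilationResult: for each compilation type, a boolean
  # "has results" cell followed by a LatencyResult when true; the final cell
  # is the compilation cache size in bytes.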
  def read_compilation_result(self):
    """Read the next CSV cells as a CompilationResult."""
    result = {}
    for compilation_type in COMPILATION_TYPES:
      has_results = self.read_typed(bool)
      result[compilation_type] = (
          self.read_latency_result() if has_results else None)
    result['cache_size_bytes'] = self.read_typed(int)
    return CompilationResult(**result)

  def read_benchmark_result(self):
    """Read the next CSV cells as a BenchmarkResult."""
    result = {}
    result['name'] = self.read_typed(str)
    result['backend_type'] = self.read_typed(str)
    result['inference_latency'] = self.read_latency_result()
    result['max_single_error'] = self.read_typed(float)
    result['testset_size'] = self.read_typed(int)
    evaluator_keys_count = self.read_typed(int)
    validation_error_count = self.read_typed(int)
    result['evaluator_keys'] = self.read_typed_array(str, evaluator_keys_count)
    result['evaluator_values'] = self.read_typed_array(
        float, evaluator_keys_count)
    result['validation_errors'] = self.read_typed_array(
        str, validation_error_count)
    result['compilation_results'] = self.read_compilation_result()
    return BenchmarkResult(**result)

def parse_csv_input(input_filename):
  """Parse the input CSV file; return (benchmark_info, [BenchmarkResult])."""
  with open(input_filename, 'r') as csvfile:
    parser = BenchmarkResultParser(csvfile)

    # First line contains device info.
    benchmark_info = parser.next()

    results = []
    while parser.next():
      results.append(parser.read_benchmark_result())

    return (benchmark_info, results)

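# The returned structure looks like (illustrative values):
#   [('MobileNet v1 Float',
#     [ResultsWithBaseline(baseline=<TFLite_CPU result>, other=[...]), ...]),
#    ...]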
def group_results(results):
  """Group results by name; return a list of (group name, [ResultsWithBaseline])."""
  # Group by name
  groupings = collections.defaultdict(list)
  for result in results:
    groupings[result.name].append(result)

  # Find the baseline for each group, make a ResultsWithBaseline for each name
  groupings_baseline = {}
  for name, name_results in groupings.items():
    baseline = next(filter(lambda x: x.backend_type == BASELINE_BACKEND,
                           name_results))
    other = sorted(filter(lambda x: x is not baseline, name_results),
                   key=lambda x: x.backend_type)
    groupings_baseline[name] = ResultsWithBaseline(
        baseline=baseline,
        other=other)

  # Merge ResultsWithBaseline for known groups
  known_groupings_baseline = collections.defaultdict(list)
  for name, results_with_bl in sorted(groupings_baseline.items()):
    group_name = name
    for known_group in KNOWN_GROUPS:
      if known_group[0].match(results_with_bl.baseline.name):
        group_name = known_group[1]
        break
    known_groupings_baseline[group_name].append(results_with_bl)

  # Turn into a list sorted by group name
  groupings_list = []
  for name, results_wbl in sorted(known_groupings_baseline.items()):
    groupings_list.append((name, results_wbl))
  return groupings_list

def get_frequency_graph_min_max(latencies):
  """Get the overall min and max times across latency histograms."""
  mins = []
  maxs = []
  for latency in latencies:
    mins.append(latency.time_freq_start_sec)
    to_add = len(latency.time_freq_sec) * latency.time_freq_step_sec
    maxs.append(latency.time_freq_start_sec + to_add)
  return min(mins), max(maxs)

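# For example (hypothetical numbers): a histogram starting at 0.02 s with a
# 0.005 s bucket width, drawn on an axis that starts at 0.01 s, is padded
# with int((0.02 - 0.01) / 0.005) = 2 empty buckets on the left so that all
# graphs in a group share the same x axis.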
def get_frequency_graph(time_freq_start_sec, time_freq_step_sec, time_freq_sec,
                        start_sec, end_sec):
  """Generate input x/y data for a latency frequency graph."""
  left_to_pad = (int((time_freq_start_sec - start_sec) / time_freq_step_sec)
                 if time_freq_step_sec != 0
                 else math.inf)
  end_time = time_freq_start_sec + len(time_freq_sec) * time_freq_step_sec
  right_to_pad = (int((end_sec - end_time) / time_freq_step_sec)
                  if time_freq_step_sec != 0
                  else math.inf)

  # After padding more than 64 values, graphs start to look messy;
  # bail out in that case.
  if (left_to_pad + right_to_pad) < 64:
    left_pad = (['{:.2f}ms'.format(
        (start_sec + x * time_freq_step_sec) * 1000.0)
                 for x in range(left_to_pad)], [0] * left_to_pad)

    right_pad = (['{:.2f}ms'.format(
        (end_time + x * time_freq_step_sec) * 1000.0)
                  for x in range(right_to_pad)], [0] * right_to_pad)
  else:
    left_pad = [[], []]
    right_pad = [[], []]

  data = (['{:.2f}ms'.format(
      (time_freq_start_sec + x * time_freq_step_sec) * 1000.0)
           for x in range(len(time_freq_sec))], time_freq_sec)

  return (left_pad[0] + data[0] + right_pad[0],
          left_pad[1] + data[1] + right_pad[1])

def is_topk_evaluator(evaluator_keys):
  """Are these evaluator keys from the TopK evaluator?"""
  return (len(evaluator_keys) == 5 and
          evaluator_keys[0] == 'top_1' and
          evaluator_keys[1] == 'top_2' and
          evaluator_keys[2] == 'top_3' and
          evaluator_keys[3] == 'top_4' and
          evaluator_keys[4] == 'top_5')

def is_melceplogf0_evaluator(evaluator_keys):
  """Are these evaluator keys from the MelCepLogF0 evaluator?"""
  return (len(evaluator_keys) == 2 and
          evaluator_keys[0] == 'max_mel_cep_distortion' and
          evaluator_keys[1] == 'max_log_f0_error')

def is_phone_error_rate_evaluator(evaluator_keys):
  """Are these evaluator keys from the PhoneErrorRate evaluator?"""
  return (len(evaluator_keys) == 1 and
          evaluator_keys[0] == 'max_phone_error_rate')

def generate_accuracy_headers(result):
  """Accuracy-related headers for the result table."""
  if is_topk_evaluator(result.evaluator_keys):
    return ACCURACY_HEADERS_TOPK_TEMPLATE
  elif is_melceplogf0_evaluator(result.evaluator_keys):
    return ACCURACY_HEADERS_MELCEPLOGF0_TEMPLATE
  elif is_phone_error_rate_evaluator(result.evaluator_keys):
    return ACCURACY_HEADERS_PHONE_ERROR_RATE_TEMPLATE
  else:
    return ACCURACY_HEADERS_BASIC_TEMPLATE

def get_diff_span(value, same_delta, positive_is_better):
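  """Classify a diff as 'same', 'better' or 'worse' (used as a CSS class).

  For example, get_diff_span(0.5, 1.0, positive_is_better=True) -> 'same',
  get_diff_span(2.0, 1.0, positive_is_better=True) -> 'better', and
  get_diff_span(-2.0, 1.0, positive_is_better=True) -> 'worse'.
  """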
  if abs(value) < same_delta:
    return 'same'
  if ((positive_is_better and value > 0) or
      (not positive_is_better and value < 0)):
    return 'better'
  return 'worse'

def generate_accuracy_values(baseline, result):
  """Accuracy-related data for the result table."""
  if is_topk_evaluator(result.evaluator_keys):
    val = [float(x) * 100.0 for x in result.evaluator_values]
    if result is baseline:
      topk = [TOPK_BASELINE_TEMPLATE.format(val=x) for x in val]
      return ACCURACY_VALUES_TOPK_TEMPLATE.format(
          top1=topk[0], top2=topk[1], top3=topk[2], top4=topk[3],
          top5=topk[4]
      )
    else:
      base = [float(x) * 100.0 for x in baseline.evaluator_values]
      diff = [a - b for a, b in zip(val, base)]
      topk = [TOPK_DIFF_TEMPLATE.format(
          val=v, diff=d, span=get_diff_span(d, 1.0, positive_is_better=True))
              for v, d in zip(val, diff)]
      return ACCURACY_VALUES_TOPK_TEMPLATE.format(
          top1=topk[0], top2=topk[1], top3=topk[2], top4=topk[3],
          top5=topk[4]
      )
  elif is_melceplogf0_evaluator(result.evaluator_keys):
    val = [float(x) for x in
           result.evaluator_values + [result.max_single_error]]
    if result is baseline:
      return ACCURACY_VALUES_MELCEPLOGF0_TEMPLATE.format(
          max_log_f0=MELCEPLOGF0_BASELINE_TEMPLATE.format(
              val=val[0]),
          max_mel_cep_distortion=MELCEPLOGF0_BASELINE_TEMPLATE.format(
              val=val[1]),
          max_single_error=MELCEPLOGF0_BASELINE_TEMPLATE.format(
              val=val[2]),
      )
    else:
      base = [float(x) for x in
              baseline.evaluator_values + [baseline.max_single_error]]
      diff = [a - b for a, b in zip(val, base)]
      v = [MELCEPLOGF0_DIFF_TEMPLATE.format(
          val=v, diff=d, span=get_diff_span(d, 1.0, positive_is_better=False))
           for v, d in zip(val, diff)]
      return ACCURACY_VALUES_MELCEPLOGF0_TEMPLATE.format(
          max_log_f0=v[0],
          max_mel_cep_distortion=v[1],
          max_single_error=v[2],
      )
  elif is_phone_error_rate_evaluator(result.evaluator_keys):
    val = [float(x) for x in
           result.evaluator_values + [result.max_single_error]]
    if result is baseline:
      return ACCURACY_VALUES_PHONE_ERROR_RATE_TEMPLATE.format(
          max_phone_error_rate=PHONE_ERROR_RATE_BASELINE_TEMPLATE.format(
              val=val[0]),
          max_single_error=PHONE_ERROR_RATE_BASELINE_TEMPLATE.format(
              val=val[1]),
      )
    else:
      base = [float(x) for x in
              baseline.evaluator_values + [baseline.max_single_error]]
      diff = [a - b for a, b in zip(val, base)]
      v = [PHONE_ERROR_RATE_DIFF_TEMPLATE.format(
          val=v, diff=d, span=get_diff_span(d, 1.0, positive_is_better=False))
           for v, d in zip(val, diff)]
      return ACCURACY_VALUES_PHONE_ERROR_RATE_TEMPLATE.format(
          max_phone_error_rate=v[0],
          max_single_error=v[1],
      )
  else:
    return ACCURACY_VALUES_BASIC_TEMPLATE.format(
        max_single_error=result.max_single_error,
    )

def getchartjs_source():
  """Return the contents of the bundled Chart.js file."""
  chart_js_path = os.path.join(os.path.dirname(os.path.abspath(__file__)),
                               CHART_JS_FILE)
  with open(chart_js_path) as f:
    return f.read()

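# For example (hypothetical numbers): 100 iterations over 2.0 s total render
# as "20.00ms"; a non-baseline latency also gets a diff span, e.g.
# "20.00ms (2.00ms, 11.1%)" against an 18 ms baseline.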
def generate_avg_ms(baseline, latency):
  """Generate the average latency value, with a diff against the baseline."""
  if latency is None:
    latency = baseline

  result_avg_ms = (latency.total_time_sec / latency.iterations) * 1000.0
  if latency is baseline:
    return LATENCY_BASELINE_TEMPLATE.format(val=result_avg_ms)
  baseline_avg_ms = (baseline.total_time_sec / baseline.iterations) * 1000.0
  diff = (result_avg_ms / baseline_avg_ms - 1.0) * 100.0
  diff_val = result_avg_ms - baseline_avg_ms
  return LATENCY_DIFF_TEMPLATE.format(
      val=result_avg_ms,
      diff=diff,
      diff_val=diff_val,
      span=get_diff_span(diff, same_delta=1.0, positive_is_better=False))

def generate_result_entry(baseline, result):
  """Generate a single row of the inference results table."""
  if result is None:
    result = baseline

  return RESULT_ENTRY_TEMPLATE.format(
      row_class='failed' if result.validation_errors else 'normal',
      name=result.name,
      backend=result.backend_type,
      iterations=result.inference_latency.iterations,
      testset_size=result.testset_size,
      accuracy_values=generate_accuracy_values(baseline, result),
      avg_ms=generate_avg_ms(baseline.inference_latency,
                             result.inference_latency))

def generate_latency_graph_entry(tag, latency, tmin, tmax):
  """Generate a single latency graph."""
  return LATENCY_GRAPH_ENTRY_TEMPLATE.format(
      tag=tag,
      # id() gives each chart canvas a unique DOM id.
      i=id(latency),
      freq_data=get_frequency_graph(latency.time_freq_start_sec,
                                    latency.time_freq_step_sec,
                                    latency.time_freq_sec,
                                    tmin, tmax))

def generate_latency_graphs_group(tags, latencies):
  """Generate a group of latency graphs with the same tmin and tmax."""
  tmin, tmax = get_frequency_graph_min_max(latencies)
  return ''.join(
      generate_latency_graph_entry(tag, latency, tmin, tmax)
      for tag, latency in zip(tags, latencies))

def snake_case_to_title(string):
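  """Turn 'save_to_cache' into 'Save To Cache' for graph captions."""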
  return string.replace('_', ' ').title()

def generate_inference_latency_graph_entry(results_with_bl):
  """Generate a group of latency graphs for inference latencies."""
  results = [results_with_bl.baseline] + results_with_bl.other
  tags = [result.backend_type for result in results]
  latencies = [result.inference_latency for result in results]
  return generate_latency_graphs_group(tags, latencies)

def generate_compilation_latency_graph_entry(results_with_bl):
  """Generate a group of latency graphs for compilation latencies."""
  tags = [
      result.backend_type + ', ' + snake_case_to_title(compilation_type)
      for result in results_with_bl.other
      for compilation_type in COMPILATION_TYPES
      if getattr(result.compilation_results, compilation_type)
  ]
  latencies = [
      getattr(result.compilation_results, compilation_type)
      for result in results_with_bl.other
      for compilation_type in COMPILATION_TYPES
      if getattr(result.compilation_results, compilation_type)
  ]
  return generate_latency_graphs_group(tags, latencies)

def generate_validation_errors(entries_group):
  """Generate the validation errors table."""
  errors = []
  for result_and_bl in entries_group:
    for result in [result_and_bl.baseline] + result_and_bl.other:
      for error in result.validation_errors:
        errors.append((result.name, result.backend_type, error))

  if errors:
    return VALIDATION_ERRORS_TEMPLATE.format(
        results=''.join(
            VALIDATION_ERRORS_ENTRY_TEMPLATE.format(
                name=name,
                backend=backend,
                error=error) for name, backend, error in errors))
  return ''

def generate_compilation_result_entry(result):
  """Generate a single row of the compilation results table."""
  format_args = {
      'row_class': 'failed' if result.validation_errors else 'normal',
      'name': result.name,
      'backend': result.backend_type,
      'cache_size': (f'{result.compilation_results.cache_size_bytes:,}'
                     if result.compilation_results.cache_size_bytes > 0
                     else '-')
  }
  for compilation_type in COMPILATION_TYPES:
    latency = getattr(result.compilation_results, compilation_type)
    if latency:
      format_args[compilation_type + '_iterations'] = f'{latency.iterations}'
      format_args[compilation_type + '_avg_ms'] = generate_avg_ms(
          result.compilation_results.compile_without_cache, latency)
    else:
      format_args[compilation_type + '_iterations'] = '-'
      format_args[compilation_type + '_avg_ms'] = '-'
  return COMPILATION_RESULT_ENTRY_TEMPLATE.format(**format_args)

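# generate_result() stitches the full page together: one RESULT_GROUP_TEMPLATE
# per model group, each holding the inference table, validation errors,
# latency graphs, and the compilation table and graphs.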
def generate_result(benchmark_info, data):
  """Turn a list of results into HTML."""
  return MAIN_TEMPLATE.format(
      jsdeps=getchartjs_source(),
      device_info=DEVICE_INFO_TEMPLATE.format(
          benchmark_time=benchmark_info[0],
          device_info=benchmark_info[1],
      ),
      results_list=''.join((
          RESULT_GROUP_TEMPLATE.format(
              group_name=entries_name,
              accuracy_headers=generate_accuracy_headers(
                  entries_group[0].baseline),
              results=''.join(
                  RESULT_ENTRY_WITH_BASELINE_TEMPLATE.format(
                      baseline=generate_result_entry(
                          result_and_bl.baseline, None),
                      other=''.join(
                          generate_result_entry(
                              result_and_bl.baseline, x)
                          for x in result_and_bl.other)
                  ) for result_and_bl in entries_group),
              validation_errors=generate_validation_errors(entries_group),
              latency_graphs=LATENCY_GRAPHS_TEMPLATE.format(
                  results=''.join(
                      LATENCY_GRAPH_ENTRY_GROUP_TEMPLATE.format(
                          name=result_and_bl.baseline.name,
                          results=generate_inference_latency_graph_entry(
                              result_and_bl)
                      ) for result_and_bl in entries_group)
              ),
              compilation_results=''.join(
                  COMPILATION_RESULT_ENTRIES_TEMPLATE.format(
                      entries=''.join(
                          generate_compilation_result_entry(x)
                          for x in result_and_bl.other)
                  ) for result_and_bl in entries_group),
              compilation_latency_graphs=LATENCY_GRAPHS_TEMPLATE.format(
                  results=''.join(
                      LATENCY_GRAPH_ENTRY_GROUP_TEMPLATE.format(
                          name=result_and_bl.baseline.name,
                          results=generate_compilation_latency_graph_entry(
                              result_and_bl)
                      ) for result_and_bl in entries_group)
              ),
          ) for entries_name, entries_group in group_results(data))
      ))

def main():
  parser = argparse.ArgumentParser()
  parser.add_argument('input', help='input csv filename')
  parser.add_argument('output', help='output html filename')
  args = parser.parse_args()

  benchmark_info, data = parse_csv_input(args.input)

  with open(args.output, 'w') as htmlfile:
    htmlfile.write(generate_result(benchmark_info, data))

# -----------------
# Templates below

MAIN_TEMPLATE = """<!doctype html>
<html lang='en-US'>
<head>
  <meta http-equiv='Content-Type' content='text/html; charset=utf-8'>
  <script src='https://ajax.googleapis.com/ajax/libs/jquery/3.3.1/jquery.min.js'></script>
  <script>{jsdeps}</script>
  <title>MLTS results</title>
  <style>
    .results {{
      border-collapse: collapse;
      width: 100%;
    }}
    .results td, .results th {{
      border: 1px solid #ddd;
      padding: 6px;
    }}
    .results tbody.values {{
      border-bottom: 8px solid #333;
    }}
    span.better {{
      color: #070;
    }}
    span.worse {{
      color: #700;
    }}
    span.same {{
      color: #000;
    }}
    .results tr:nth-child(even) {{background-color: #eee;}}
    .results tr:hover {{background-color: #ddd;}}
    .results th {{
      padding: 10px;
      font-weight: bold;
      text-align: left;
      background-color: #333;
      color: white;
    }}
    .results tr.failed {{
      background-color: #ffc4ca;
    }}
    .group {{
      padding-top: 25px;
    }}
    .group_name {{
      padding-left: 10px;
      font-size: 140%;
      font-weight: bold;
    }}
    .section_name {{
      padding: 10px;
      font-size: 120%;
      font-weight: bold;
    }}
    .latency_results {{
      padding: 10px;
      border: 1px solid #ddd;
      overflow: hidden;
    }}
    .latency_with_baseline {{
      padding: 10px;
      border: 1px solid #ddd;
      overflow: hidden;
    }}
  </style>
</head>
<body>
{device_info}
{results_list}
</body>
</html>"""

DEVICE_INFO_TEMPLATE = """<div id='device_info'>
Benchmark for {device_info}, started at {benchmark_time}
</div>"""

RESULT_GROUP_TEMPLATE = """<div class="group">
<div class="group_name">{group_name}</div>
<div class="section_name">Inference results</div>
<table class="results">
  <tr>
    <th>Name</th>
    <th>Backend</th>
    <th>Iterations</th>
    <th>Test set size</th>
    <th>Average latency ms</th>
    {accuracy_headers}
  </tr>
  {results}
</table>
{validation_errors}
{latency_graphs}
<div class="section_name">Compilation results</div>
<table class="results">
  <tr>
    <th rowspan="2">Name</th>
    <th rowspan="2">Backend</th>
    <th colspan="2">Compile Without Cache</th>
    <th colspan="2">Save To Cache</th>
    <th colspan="2">Prepare From Cache</th>
    <th rowspan="2">Cache size bytes</th>
  </tr>
  <tr>
    <th>Iterations</th>
    <th>Average latency ms</th>
    <th>Iterations</th>
    <th>Average latency ms</th>
    <th>Iterations</th>
    <th>Average latency ms</th>
  </tr>
  {compilation_results}
</table>
{compilation_latency_graphs}
</div>"""

VALIDATION_ERRORS_TEMPLATE = """
<table class="results">
  <tr>
    <th>Name</th>
    <th>Backend</th>
    <th>Error</th>
  </tr>
  {results}
</table>"""
VALIDATION_ERRORS_ENTRY_TEMPLATE = """
<tr class="failed">
  <td>{name}</td>
  <td>{backend}</td>
  <td>{error}</td>
</tr>
"""

LATENCY_GRAPHS_TEMPLATE = """
<div class="latency_results">
{results}
</div>
<div style="clear: left;"></div>
"""

LATENCY_GRAPH_ENTRY_GROUP_TEMPLATE = """
<div class="latency_with_baseline" style="float: left;">
<b>{name}</b>
{results}
</div>
"""

LATENCY_GRAPH_ENTRY_TEMPLATE = """
<div class="latency_result" style='width: 350px;'>
{tag}
<canvas id='latency_chart{i}' class='latency_chart'></canvas>
<script>
$(function() {{
  var freqData = {{
    labels: {freq_data[0]},
    datasets: [{{
      data: {freq_data[1]},
      backgroundColor: 'rgba(255, 99, 132, 0.6)',
      borderColor: 'rgba(255, 0, 0, 0.6)',
      borderWidth: 1,
    }}]
  }};
  var ctx = $('#latency_chart{i}')[0].getContext('2d');
  window.latency_chart{i} = new Chart(ctx,
    {{
      type: 'bar',
      data: freqData,
      options: {{
        responsive: true,
        title: {{
          display: false,
          text: 'Latency frequency'
        }},
        legend: {{
          display: false
        }},
        scales: {{
          xAxes: [{{
            barPercentage: 1.0,
            categoryPercentage: 0.9,
          }}],
          yAxes: [{{
            scaleLabel: {{
              display: false,
              labelString: 'Iterations Count'
            }}
          }}]
        }}
      }}
    }});
}});
</script>
</div>
"""

RESULT_ENTRY_WITH_BASELINE_TEMPLATE = """
<tbody class="values">
{baseline}
{other}
</tbody>
"""
RESULT_ENTRY_TEMPLATE = """
<tr class="{row_class}">
  <td>{name}</td>
  <td>{backend}</td>
  <td>{iterations:d}</td>
  <td>{testset_size:d}</td>
  <td>{avg_ms}</td>
  {accuracy_values}
</tr>"""

COMPILATION_RESULT_ENTRIES_TEMPLATE = """
<tbody class="values">
{entries}
</tbody>
"""
COMPILATION_RESULT_ENTRY_TEMPLATE = """
<tr class="{row_class}">
  <td>{name}</td>
  <td>{backend}</td>
  <td>{compile_without_cache_iterations}</td>
  <td>{compile_without_cache_avg_ms}</td>
  <td>{save_to_cache_iterations}</td>
  <td>{save_to_cache_avg_ms}</td>
  <td>{prepare_from_cache_iterations}</td>
  <td>{prepare_from_cache_avg_ms}</td>
  <td>{cache_size}</td>
</tr>"""

LATENCY_BASELINE_TEMPLATE = """{val:.2f}ms"""
LATENCY_DIFF_TEMPLATE = """{val:.2f}ms <span class='{span}'>
({diff_val:.2f}ms, {diff:.1f}%)</span>"""

ACCURACY_HEADERS_TOPK_TEMPLATE = """
<th>Top 1</th>
<th>Top 2</th>
<th>Top 3</th>
<th>Top 4</th>
<th>Top 5</th>
"""
ACCURACY_VALUES_TOPK_TEMPLATE = """
<td>{top1}</td>
<td>{top2}</td>
<td>{top3}</td>
<td>{top4}</td>
<td>{top5}</td>
"""
TOPK_BASELINE_TEMPLATE = """{val:.3f}%"""
TOPK_DIFF_TEMPLATE = """{val:.3f}% <span class='{span}'>({diff:.1f}%)</span>"""

ACCURACY_HEADERS_MELCEPLOGF0_TEMPLATE = """
<th>Max log(F0) error</th>
<th>Max Mel Cep distortion</th>
<th>Max scalar error</th>
"""

ACCURACY_VALUES_MELCEPLOGF0_TEMPLATE = """
<td>{max_log_f0}</td>
<td>{max_mel_cep_distortion}</td>
<td>{max_single_error}</td>
"""

MELCEPLOGF0_BASELINE_TEMPLATE = """{val:.2E}"""
MELCEPLOGF0_DIFF_TEMPLATE = \
    """{val:.2E} <span class='{span}'>({diff:.1f}%)</span>"""

ACCURACY_HEADERS_PHONE_ERROR_RATE_TEMPLATE = """
<th>Max phone error rate</th>
<th>Max scalar error</th>
"""

ACCURACY_VALUES_PHONE_ERROR_RATE_TEMPLATE = """
<td>{max_phone_error_rate}</td>
<td>{max_single_error}</td>
"""

PHONE_ERROR_RATE_BASELINE_TEMPLATE = """{val:.3f}"""
PHONE_ERROR_RATE_DIFF_TEMPLATE = \
    """{val:.3f} <span class='{span}'>({diff:.1f}%)</span>"""

ACCURACY_HEADERS_BASIC_TEMPLATE = """
<th>Max single scalar error</th>
"""

ACCURACY_VALUES_BASIC_TEMPLATE = """
<td>{max_single_error:.2f}</td>
"""

CHART_JS_FILE = 'Chart.bundle.min.js'

if __name__ == '__main__':
  main()