blob: 21f46632df32b23565dd87dc1e363e7b29aa469a [file] [log] [blame]
#!/usr/bin/env python
# Copyright 2016 Google Inc.
#
# Use of this source code is governed by a BSD-style license that can be
# found in the LICENSE file.
from __future__ import print_function
from _benchresult import BenchResult
from argparse import ArgumentParser
from datetime import datetime
import collections
import operator
import os
import sys
import tempfile
import urllib
import urlparse
import webbrowser
__argparse = ArgumentParser(description="""
Parses output files from skpbench.py into csv.
This script can also be used to generate a Google sheet:
(1) Install the "Office Editing for Docs, Sheets & Slides" Chrome extension:
https://chrome.google.com/webstore/detail/office-editing-for-docs-s/gbkeegbaiigmenfmjfclcdgdpimamgkj
(2) Designate Chrome os-wide as the default application for opening .csv files.
(3) Run parseskpbench.py with the --open flag.
""")
__argparse.add_argument('-r', '--result',
choices=['median', 'accum', 'max', 'min'], default='median',
help='result to use for cell values')
__argparse.add_argument('-f', '--force',
action='store_true', help='silently ignore warnings')
__argparse.add_argument('-o', '--open',
action='store_true',
help='generate a temp file and open it (theoretically in a web browser)')
__argparse.add_argument('-n', '--name',
default='skpbench_%s' % datetime.now().strftime('%Y-%m-%d_%H.%M.%S.csv'),
help='if using --open, a name for the temp file')
__argparse.add_argument('sources',
nargs='+', help='source files with skpbench results ("-" for stdin)')
FLAGS = __argparse.parse_args()
class Parser:
def __init__(self):
self.configs = list() # use list to preserve the order configs appear in.
self.rows = collections.defaultdict(dict)
self.cols = collections.defaultdict(dict)
self.metric = None
self.samples = None
self.sample_ms = None
def parse_file(self, infile):
for line in infile:
match = BenchResult.match(line)
if not match:
continue
if self.metric is None:
self.metric = match.metric
elif match.metric != self.metric:
raise ValueError('results have mismatched metrics (%s and %s)' %
(self.metric, match.metric))
if self.samples is None:
self.samples = match.samples
elif not FLAGS.force and match.samples != self.samples:
raise ValueError('results have mismatched number of samples. '
'(use --force to ignore)')
if self.sample_ms is None:
self.sample_ms = match.sample_ms
elif not FLAGS.force and match.sample_ms != self.sample_ms:
raise ValueError('results have mismatched sampling times. '
'(use --force to ignore)')
if not match.config in self.configs:
self.configs.append(match.config)
self.rows[match.bench][match.config] = match.get_string(FLAGS.result)
self.cols[match.config][match.bench] = getattr(match, FLAGS.result)
def print_csv(self, outfile=sys.stdout):
print('%s_%s' % (FLAGS.result, self.metric), file=outfile)
# Write the header.
outfile.write('bench,')
for config in self.configs:
outfile.write('%s,' % config)
outfile.write('\n')
# Write the rows.
for bench, row in self.rows.items():
outfile.write('%s,' % bench)
for config in self.configs:
if config in row:
outfile.write('%s,' % row[config])
elif FLAGS.force:
outfile.write(',')
else:
raise ValueError('%s: missing value for %s. (use --force to ignore)' %
(bench, config))
outfile.write('\n')
# Add simple, literal averages.
if len(self.rows) > 1:
outfile.write('\n')
self.__print_computed_row('MEAN',
lambda col: reduce(operator.add, col.values()) / len(col),
outfile=outfile)
self.__print_computed_row('GEOMEAN',
lambda col: reduce(operator.mul, col.values()) ** (1.0 / len(col)),
outfile=outfile)
def __print_computed_row(self, name, func, outfile=sys.stdout):
outfile.write('%s,' % name)
for config in self.configs:
assert(len(self.cols[config]) == len(self.rows))
outfile.write('%.4g,' % func(self.cols[config]))
outfile.write('\n')
def main():
parser = Parser()
# Parse the input files.
for src in FLAGS.sources:
if src == '-':
parser.parse_file(sys.stdin)
else:
with open(src, mode='r') as infile:
parser.parse_file(infile)
# Print the csv.
if not FLAGS.open:
parser.print_csv()
else:
dirname = tempfile.mkdtemp()
basename = FLAGS.name
if os.path.splitext(basename)[1] != '.csv':
basename += '.csv';
pathname = os.path.join(dirname, basename)
with open(pathname, mode='w') as tmpfile:
parser.print_csv(outfile=tmpfile)
fileuri = urlparse.urljoin('file:', urllib.pathname2url(pathname))
print('opening %s' % fileuri)
webbrowser.open(fileuri)
if __name__ == '__main__':
main()