tools/profiling/microbenchmarks/bm2bq.py - platform/external/grpc-grpc - Gitiles

 #!/usr/bin/env python2.7
 #
 # Convert google-benchmark json output to something that can be uploaded to
 # BigQuery
 #
 #
 # Copyright 2017, Google Inc.
 # All rights reserved.
 #
 # Redistribution and use in source and binary forms, with or without
 # modification, are permitted provided that the following conditions are
 # met:
 #
 #     * Redistributions of source code must retain the above copyright
 # notice, this list of conditions and the following disclaimer.
 #     * Redistributions in binary form must reproduce the above
 # copyright notice, this list of conditions and the following disclaimer
 # in the documentation and/or other materials provided with the
 # distribution.
 #     * Neither the name of Google Inc. nor the names of its
 # contributors may be used to endorse or promote products derived from
 # this software without specific prior written permission.
 #
 # THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
 # "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
 # LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
 # A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
 # OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
 # SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
 # LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
 # DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
 # THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
 # (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
 # OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

 import sys
 import json
 import csv
 import os

 # Output schema as (column name, column type) pairs.  The order here is also
 # the field order handed to the CSV writer further down.
 columns = [
     # Taken from the BUILD_NUMBER / JOB_NAME environment variables.
     ('jenkins_build', 'integer'),
     ('jenkins_job', 'string'),

     # NOTE(review): presumably copied from the JSON 'context' object - confirm.
     ('date', 'timestamp'),
     ('cpu_scaling_enabled', 'boolean'),
     ('num_cpus', 'integer'),
     ('mhz_per_cpu', 'integer'),
     ('library_build_type', 'string'),

     # Bare benchmark name plus the arguments parsed out of the full name
     # (the argument columns are the ones listed in bm_specs).
     ('name', 'string'),
     ('fixture', 'string'),
     ('client_mutator', 'string'),
     ('server_mutator', 'string'),
     ('request_size', 'integer'),
     ('response_size', 'integer'),
     ('request_count', 'integer'),

     # NOTE(review): presumably per-benchmark fields of the JSON - confirm.
     ('iterations', 'integer'),
     ('time_unit', 'string'),
     ('real_time', 'integer'),
     ('cpu_time', 'integer'),
     ('bytes_per_second', 'float'),

     # '<key>/iter' label keys are renamed to '<key>_per_iteration'.
     ('allocs_per_iteration', 'float'),
     ('locks_per_iteration', 'float'),
     ('writes_per_iteration', 'float'),

     # Another name-derived argument (listed in bm_specs).
     ('bandwidth_kilobits', 'integer'),

     ('cli_transport_stalls_per_iteration', 'float'),
     ('cli_stream_stalls_per_iteration', 'float'),
     ('svr_transport_stalls_per_iteration', 'float'),
     ('svr_stream_stalls_per_iteration', 'float'),
 ]

 # Usage: <script> --schema          print the column schema and exit
 #        <script> <benchmark.json>  convert the given JSON file to CSV
 if len(sys.argv) < 2:
   # Exit with a readable message instead of an IndexError traceback.
   sys.exit('usage: %s (--schema | <benchmark.json>)' % sys.argv[0])

 if sys.argv[1] == '--schema':
   # One 'name:TYPE' entry per column, joined with ',\n'.
   # A parenthesised single-argument print produces the same output as the
   # Python 2 print statement and is also valid Python 3.
   print(',\n'.join('%s:%s' % (k, t.upper()) for k, t in columns))
   sys.exit(0)

 # Load the whole benchmark JSON document named on the command line.
 with open(sys.argv[1]) as f:
   js = json.loads(f.read())

 # Rows go to stdout as CSV, with fields in the order given by `columns`.
 writer = csv.DictWriter(sys.stdout, [c for c, _ in columns])

 # Argument layout for each known benchmark, used when parsing its full name:
 #   tpl - column names for the template arguments (the '<...>' part), in order
 #   dyn - column names for the '/'-separated arguments, in order
 bm_specs = {
     'BM_UnaryPingPong': dict(
         tpl=['fixture', 'client_mutator', 'server_mutator'],
         dyn=['request_size', 'response_size']),
     'BM_PumpStreamClientToServer': dict(
         tpl=['fixture'],
         dyn=['request_size']),
     'BM_PumpStreamServerToClient': dict(
         tpl=['fixture'],
         dyn=['request_size']),
     'BM_StreamingPingPong': dict(
         tpl=['fixture', 'client_mutator', 'server_mutator'],
         dyn=['request_size', 'request_count']),
     'BM_StreamingPingPongMsgs': dict(
         tpl=['fixture', 'client_mutator', 'server_mutator'],
         dyn=['request_size']),
     'BM_PumpStreamServerToClient_Trickle': dict(
         tpl=[],
         dyn=['request_size', 'bandwidth_kilobits']),
 }

 def numericalize(s):
   """Convert a size argument such as '8', '4k' or '2M' to an integer.

   Args:
     s: string of decimal digits, optionally followed by 'k' (multiply by
       1024) or 'M' (multiply by 1024 * 1024).  May be empty.

   Returns:
     '' when s is empty, otherwise the integer value.

   Raises:
     ValueError: if s does not end in a digit, 'k' or 'M', or if the numeric
       part cannot be parsed by int().
   """
   if not s:
     return ''
   multipliers = {'k': 1024, 'M': 1024 * 1024}
   last = s[-1]
   if last in multipliers:
     return int(s[:-1]) * multipliers[last]
   if '0' <= last <= '9':
     return int(s)
   # A bare `assert '<message>'` always passes (non-empty strings are truthy)
   # and would let bad input fall through as None, so raise explicitly.
   raise ValueError('not a number: %s' % s)

 def parse_name(name):
   """Split a full benchmark name into the columns described by bm_specs.

   A full name has the shape 'BM_Name<TplArg, ...>/dyn_arg/...', where both
   the '<...>' part and the '/...' part are optional.

   Args:
     name: the benchmark name string.

   Returns:
     A dict holding 'name' (the bare benchmark name) plus one entry per
     template argument (kept as a string) and per '/'-separated argument
     (passed through numericalize), keyed by the column names listed in
     bm_specs.  A name with no '<', no '/' and no bm_specs entry is returned
     unchanged as {'name': name}.

   Raises:
     AssertionError: if the bare name has no bm_specs entry, or the number of
       template or '/'-separated arguments differs from that entry.
   """
   has_args = '<' in name or '/' in name
   if not has_args and name not in bm_specs:
     return {'name': name}

   base = name
   tpl_args = []
   dyn_args = []

   if '<' in base:
     # Template arguments sit between the first '<' and the last '>'.
     lt = base.find('<')
     gt = base.rfind('>')
     depth = 0
     current = []
     for ch in base[lt + 1:gt]:
       if ch == ',' and depth == 0:
         # A comma outside nested '<...>' ends the current argument.
         tpl_args.append(''.join(current).strip())
         current = []
         continue
       if ch == '<':
         depth += 1
       elif ch == '>':
         depth -= 1
       current.append(ch)
     tpl_args.append(''.join(current).strip())
     # Cut the whole '<...>' section out of the name.
     base = base[:lt] + base[gt + 1:]

   if '/' in base:
     pieces = base.split('/')
     base = pieces[0]
     dyn_args = pieces[1:]

   assert base in bm_specs, 'bm_specs needs to be expanded for %s' % base
   spec = bm_specs[base]
   assert len(dyn_args) == len(spec['dyn'])
   assert len(tpl_args) == len(spec['tpl'])

   out = {'name': base}
   for key, raw in zip(spec['dyn'], dyn_args):
     out[key] = numericalize(raw)
   for key, value in zip(spec['tpl'], tpl_args):
     out[key] = value
   return out

 # Emit one CSV row per entry of js['benchmarks'].
 for bm in js['benchmarks']:
   context = js['context']

   labels = {}
   if 'label' in bm:
     # The label is a space-separated list of 'key:value' items; '/iter' in
     # a key is rewritten to '_per_iteration'.
     pairs = []
     for item in bm['label'].split(' '):
       fields = item.split(':')
       fields[0] = fields[0].replace('/iter', '_per_iteration')
       pairs.append(fields)
     labels = dict(pairs)

   row = dict(
       jenkins_build=os.environ.get('BUILD_NUMBER', ''),
       jenkins_job=os.environ.get('JOB_NAME', ''))
   # Later sources win on key clashes: context, then the benchmark entry,
   # then the values parsed from its name, then the label values.
   row.update(context)
   row.update(bm)
   row.update(parse_name(row['name']))
   row.update(labels)
   # Drop the raw label string if the benchmark entry carried one.
   row.pop('label', None)
   writer.writerow(row)
	#!/usr/bin/env python2.7
	#
	# Convert google-benchmark json output to something that can be uploaded to
	# BigQuery
	#
	#
	# Copyright 2017, Google Inc.
	# All rights reserved.
	#
	# Redistribution and use in source and binary forms, with or without
	# modification, are permitted provided that the following conditions are
	# met:
	#
	# * Redistributions of source code must retain the above copyright
	# notice, this list of conditions and the following disclaimer.
	# * Redistributions in binary form must reproduce the above
	# copyright notice, this list of conditions and the following disclaimer
	# in the documentation and/or other materials provided with the
	# distribution.
	# * Neither the name of Google Inc. nor the names of its
	# contributors may be used to endorse or promote products derived from
	# this software without specific prior written permission.
	#
	# THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
	# "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
	# LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
	# A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
	# OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
	# SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
	# LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
	# DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
	# THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
	# (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
	# OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

	import sys
	import json
	import csv
	import os

	# Output schema as (column name, column type) pairs.  The order here is also
	# the field order handed to the CSV writer further down.
	columns = [
	    # Taken from the BUILD_NUMBER / JOB_NAME environment variables.
	    ('jenkins_build', 'integer'),
	    ('jenkins_job', 'string'),

	    # NOTE(review): presumably copied from the JSON 'context' object - confirm.
	    ('date', 'timestamp'),
	    ('cpu_scaling_enabled', 'boolean'),
	    ('num_cpus', 'integer'),
	    ('mhz_per_cpu', 'integer'),
	    ('library_build_type', 'string'),

	    # Bare benchmark name plus the arguments parsed out of the full name
	    # (the argument columns are the ones listed in bm_specs).
	    ('name', 'string'),
	    ('fixture', 'string'),
	    ('client_mutator', 'string'),
	    ('server_mutator', 'string'),
	    ('request_size', 'integer'),
	    ('response_size', 'integer'),
	    ('request_count', 'integer'),

	    # NOTE(review): presumably per-benchmark fields of the JSON - confirm.
	    ('iterations', 'integer'),
	    ('time_unit', 'string'),
	    ('real_time', 'integer'),
	    ('cpu_time', 'integer'),
	    ('bytes_per_second', 'float'),

	    # '<key>/iter' label keys are renamed to '<key>_per_iteration'.
	    ('allocs_per_iteration', 'float'),
	    ('locks_per_iteration', 'float'),
	    ('writes_per_iteration', 'float'),

	    # Another name-derived argument (listed in bm_specs).
	    ('bandwidth_kilobits', 'integer'),

	    ('cli_transport_stalls_per_iteration', 'float'),
	    ('cli_stream_stalls_per_iteration', 'float'),
	    ('svr_transport_stalls_per_iteration', 'float'),
	    ('svr_stream_stalls_per_iteration', 'float'),
	]

	# Usage: <script> --schema          print the column schema and exit
	#        <script> <benchmark.json>  convert the given JSON file to CSV
	if len(sys.argv) < 2:
	  # Exit with a readable message instead of an IndexError traceback.
	  sys.exit('usage: %s (--schema | <benchmark.json>)' % sys.argv[0])

	if sys.argv[1] == '--schema':
	  # One 'name:TYPE' entry per column, joined with ',\n'.
	  # A parenthesised single-argument print produces the same output as the
	  # Python 2 print statement and is also valid Python 3.
	  print(',\n'.join('%s:%s' % (k, t.upper()) for k, t in columns))
	  sys.exit(0)

	# Load the whole benchmark JSON document named on the command line.
	with open(sys.argv[1]) as f:
	  js = json.loads(f.read())

	# Rows go to stdout as CSV, with fields in the order given by `columns`.
	writer = csv.DictWriter(sys.stdout, [c for c, _ in columns])

	# Argument layout for each known benchmark, used when parsing its full name:
	#   tpl - column names for the template arguments (the '<...>' part), in order
	#   dyn - column names for the '/'-separated arguments, in order
	bm_specs = {
	    'BM_UnaryPingPong': dict(
	        tpl=['fixture', 'client_mutator', 'server_mutator'],
	        dyn=['request_size', 'response_size']),
	    'BM_PumpStreamClientToServer': dict(
	        tpl=['fixture'],
	        dyn=['request_size']),
	    'BM_PumpStreamServerToClient': dict(
	        tpl=['fixture'],
	        dyn=['request_size']),
	    'BM_StreamingPingPong': dict(
	        tpl=['fixture', 'client_mutator', 'server_mutator'],
	        dyn=['request_size', 'request_count']),
	    'BM_StreamingPingPongMsgs': dict(
	        tpl=['fixture', 'client_mutator', 'server_mutator'],
	        dyn=['request_size']),
	    'BM_PumpStreamServerToClient_Trickle': dict(
	        tpl=[],
	        dyn=['request_size', 'bandwidth_kilobits']),
	}

	def numericalize(s):
	  """Convert a size argument such as '8', '4k' or '2M' to an integer.

	  Args:
	    s: string of decimal digits, optionally followed by 'k' (multiply by
	      1024) or 'M' (multiply by 1024 * 1024).  May be empty.

	  Returns:
	    '' when s is empty, otherwise the integer value.

	  Raises:
	    ValueError: if s does not end in a digit, 'k' or 'M', or if the numeric
	      part cannot be parsed by int().
	  """
	  if not s:
	    return ''
	  multipliers = {'k': 1024, 'M': 1024 * 1024}
	  last = s[-1]
	  if last in multipliers:
	    return int(s[:-1]) * multipliers[last]
	  if '0' <= last <= '9':
	    return int(s)
	  # A bare `assert '<message>'` always passes (non-empty strings are truthy)
	  # and would let bad input fall through as None, so raise explicitly.
	  raise ValueError('not a number: %s' % s)

	def parse_name(name):
	  """Split a full benchmark name into the columns described by bm_specs.

	  A full name has the shape 'BM_Name<TplArg, ...>/dyn_arg/...', where both
	  the '<...>' part and the '/...' part are optional.

	  Args:
	    name: the benchmark name string.

	  Returns:
	    A dict holding 'name' (the bare benchmark name) plus one entry per
	    template argument (kept as a string) and per '/'-separated argument
	    (passed through numericalize), keyed by the column names listed in
	    bm_specs.  A name with no '<', no '/' and no bm_specs entry is returned
	    unchanged as {'name': name}.

	  Raises:
	    AssertionError: if the bare name has no bm_specs entry, or the number of
	      template or '/'-separated arguments differs from that entry.
	  """
	  if '<' not in name and '/' not in name and name not in bm_specs:
	    return {'name': name}

	  rest = name
	  out = {}
	  tpl_args = []
	  dyn_args = []

	  if '<' in rest:
	    # Template arguments sit between the first '<' and the last '>'.
	    lt = rest.find('<')
	    gt = rest.rfind('>')
	    arg = ''
	    nesting = 0
	    for c in rest[lt + 1:gt]:
	      if c == ',' and nesting == 0:
	        # A comma outside nested '<...>' ends the current argument.
	        tpl_args.append(arg.strip())
	        arg = ''
	        continue
	      if c == '<':
	        nesting += 1
	      elif c == '>':
	        nesting -= 1
	      arg += c
	    tpl_args.append(arg.strip())
	    # Cut the whole '<...>' section out of the name.
	    rest = rest[:lt] + rest[gt + 1:]

	  if '/' in rest:
	    s = rest.split('/')
	    rest = s[0]
	    dyn_args = s[1:]

	  name = rest
	  assert name in bm_specs, 'bm_specs needs to be expanded for %s' % name
	  assert len(dyn_args) == len(bm_specs[name]['dyn'])
	  assert len(tpl_args) == len(bm_specs[name]['tpl'])

	  out['name'] = name
	  out.update(dict((k, numericalize(v))
	                  for k, v in zip(bm_specs[name]['dyn'], dyn_args)))
	  out.update(dict(zip(bm_specs[name]['tpl'], tpl_args)))
	  return out

	# Emit one CSV row per entry of js['benchmarks'].
	for bm in js['benchmarks']:
	  context = js['context']
	  if 'label' in bm:
	    # The label is a space-separated list of 'key:value' items; '/iter' in
	    # a key is rewritten to '_per_iteration'.
	    labels_list = [s.split(':') for s in bm['label'].split(' ')]
	    for el in labels_list:
	      el[0] = el[0].replace('/iter', '_per_iteration')
	    labels = dict(labels_list)
	  else:
	    labels = {}
	  row = {
	      'jenkins_build': os.environ.get('BUILD_NUMBER', ''),
	      'jenkins_job': os.environ.get('JOB_NAME', ''),
	  }
	  # Later sources win on key clashes: context, then the benchmark entry,
	  # then the values parsed from its name, then the label values.
	  row.update(context)
	  row.update(bm)
	  row.update(parse_name(row['name']))
	  row.update(labels)
	  # Drop the raw label string if the benchmark entry carried one.
	  if 'label' in row:
	    del row['label']
	  writer.writerow(row)