#!/usr/bin/env python2.7 # # Convert google-benchmark json output to something that can be uploaded to # BigQuery # # # Copyright 2017, Google Inc. # All rights reserved. # # Redistribution and use in source and binary forms, with or without # modification, are permitted provided that the following conditions are # met: # # * Redistributions of source code must retain the above copyright # notice, this list of conditions and the following disclaimer. # * Redistributions in binary form must reproduce the above # copyright notice, this list of conditions and the following disclaimer # in the documentation and/or other materials provided with the # distribution. # * Neither the name of Google Inc. nor the names of its # contributors may be used to endorse or promote products derived from # this software without specific prior written permission. # # THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS # "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT # LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR # A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT # OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, # SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT # LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, # DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY # THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT # (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE # OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 
import sys
import json
import csv
import os

# Output schema: (column name, BigQuery type) pairs, in CSV column order.
columns = [
    ('jenkins_build', 'integer'),
    ('jenkins_job', 'string'),
    ('date', 'timestamp'),
    ('cpu_scaling_enabled', 'boolean'),
    ('num_cpus', 'integer'),
    ('mhz_per_cpu', 'integer'),
    ('library_build_type', 'string'),
    ('name', 'string'),
    ('fixture', 'string'),
    ('client_mutator', 'string'),
    ('server_mutator', 'string'),
    ('request_size', 'integer'),
    ('response_size', 'integer'),
    ('request_count', 'integer'),
    ('iterations', 'integer'),
    ('time_unit', 'string'),
    ('real_time', 'integer'),
    ('cpu_time', 'integer'),
    ('bytes_per_second', 'float'),
    ('allocs_per_iteration', 'float'),
    ('locks_per_iteration', 'float'),
    ('writes_per_iteration', 'float'),
    ('bandwidth_kilobits', 'integer'),
    ('cli_transport_stalls_per_iteration', 'float'),
    ('cli_stream_stalls_per_iteration', 'float'),
    ('svr_transport_stalls_per_iteration', 'float'),
    ('svr_stream_stalls_per_iteration', 'float'),
    ('atm_cas_per_iteration', 'float'),
    ('atm_add_per_iteration', 'float'),
]

# For each known benchmark, the column names that its template arguments
# ('tpl', the comma-separated list inside <...>) and its dynamic arguments
# ('dyn', the '/'-separated suffixes) are mapped onto, in positional order.
bm_specs = {
    'BM_UnaryPingPong': {
        'tpl': ['fixture', 'client_mutator', 'server_mutator'],
        'dyn': ['request_size', 'response_size'],
    },
    'BM_PumpStreamClientToServer': {
        'tpl': ['fixture'],
        'dyn': ['request_size'],
    },
    'BM_PumpStreamServerToClient': {
        'tpl': ['fixture'],
        'dyn': ['request_size'],
    },
    'BM_StreamingPingPong': {
        'tpl': ['fixture', 'client_mutator', 'server_mutator'],
        'dyn': ['request_size', 'request_count'],
    },
    'BM_StreamingPingPongMsgs': {
        'tpl': ['fixture', 'client_mutator', 'server_mutator'],
        'dyn': ['request_size'],
    },
    'BM_PumpStreamServerToClient_Trickle': {
        'tpl': [],
        'dyn': ['request_size', 'bandwidth_kilobits'],
    },
}


def numericalize(s):
    """Convert a benchmark argument string to an integer.

    A trailing 'k' multiplies by 1024 and a trailing 'M' by 1024 * 1024;
    a string ending in a decimal digit is passed to int() as-is.

    Returns '' for an empty (falsy) argument, otherwise an int.
    Raises ValueError if the argument is not a number.
    """
    if not s:
        return ''
    suffix = s[-1]
    if suffix == 'k':
        return int(s[:-1]) * 1024
    if suffix == 'M':
        return int(s[:-1]) * 1024 * 1024
    if '0' <= suffix <= '9':
        return int(s)
    # The original ended with `assert '<message>'`, which asserts a non-empty
    # string and therefore never fires; raise so bad input is not silently
    # turned into None.
    raise ValueError('not a number: %s' % s)


def _split_template_args(tpl_bit):
    """Split a template argument list on its top-level commas only."""
    args = []
    current = ''
    nesting = 0
    for c in tpl_bit:
        if c == ',' and nesting == 0:
            args.append(current.strip())
            current = ''
            continue
        # Track <...> depth so commas inside nested templates are kept.
        if c == '<':
            nesting += 1
        elif c == '>':
            nesting -= 1
        current += c
    args.append(current.strip())
    return args


def parse_name(name):
    """Break a benchmark name into a dict of column values.

    A name shaped like 'BM_Foo<TplA, TplB>/dyn1/dyn2' yields the bare name
    under 'name' plus one entry per template / dynamic argument, keyed by
    the column names listed for that benchmark in bm_specs. Dynamic
    arguments are converted with numericalize(); template arguments are
    kept as strings.

    A name with no '<', no '/' and no bm_specs entry is returned unchanged
    as {'name': name}.

    Raises AssertionError if the benchmark is missing from bm_specs or the
    argument counts do not match its spec.
    """
    if '<' not in name and '/' not in name and name not in bm_specs:
        return {'name': name}

    rest = name
    tpl_args = []
    dyn_args = []
    if '<' in rest:
        # Template arguments span the first '<' to the last '>'.
        open_idx = rest.find('<')
        close_idx = rest.rfind('>')
        tpl_args = _split_template_args(rest[open_idx + 1:close_idx])
        rest = rest[:open_idx] + rest[close_idx + 1:]
    if '/' in rest:
        parts = rest.split('/')
        rest = parts[0]
        dyn_args = parts[1:]

    name = rest
    assert name in bm_specs, 'bm_specs needs to be expanded for %s' % name
    spec = bm_specs[name]
    assert len(dyn_args) == len(spec['dyn']), (
        'expected %d dynamic args for %s, got %d'
        % (len(spec['dyn']), name, len(dyn_args)))
    assert len(tpl_args) == len(spec['tpl']), (
        'expected %d template args for %s, got %d'
        % (len(spec['tpl']), name, len(tpl_args)))

    out = {'name': name}
    out.update(dict((k, numericalize(v))
                    for k, v in zip(spec['dyn'], dyn_args)))
    out.update(dict(zip(spec['tpl'], tpl_args)))
    return out


def _parse_labels(label):
    """Parse a 'key:value key:value' label string into a dict.

    '/iter' in a key is rewritten to '_per_iteration'. Empty tokens (from
    an empty label or repeated spaces) are skipped; a token that does not
    contain exactly one ':' raises ValueError.
    """
    labels = {}
    for token in label.strip().split(' '):
        if not token:
            continue
        key, value = token.split(':')
        labels[key.replace('/iter', '_per_iteration')] = value
    return labels


def _build_row(bm, context):
    """Merge the run context, one benchmark entry and its labels into a row."""
    row = {
        'jenkins_build': os.environ.get('BUILD_NUMBER', ''),
        'jenkins_job': os.environ.get('JOB_NAME', ''),
    }
    # Later updates win: benchmark fields override context fields, parsed
    # name fields override the raw name, labels override everything.
    row.update(context)
    row.update(bm)
    row.update(parse_name(row['name']))
    if 'label' in bm:
        row.update(_parse_labels(bm['label']))
    # The raw label string is not a column.
    row.pop('label', None)
    return row


def main(argv):
    """Run the converter; returns the process exit status.

    argv[1] is either '--schema' (print the column schema and stop) or the
    path of a benchmark JSON file whose rows are written to stdout as CSV.
    """
    if len(argv) < 2:
        prog = argv[0] if argv else '<script>'
        sys.stderr.write('usage: %s (--schema | <benchmark.json>)\n' % prog)
        return 1

    if argv[1] == '--schema':
        print(',\n'.join('%s:%s' % (k, t.upper()) for k, t in columns))
        return 0

    with open(argv[1]) as f:
        js = json.load(f)

    # No header row is written. DictWriter's default extrasaction raises
    # ValueError if a row contains a key that is not listed in columns.
    writer = csv.DictWriter(sys.stdout, [c for c, t in columns])
    for bm in js['benchmarks']:
        writer.writerow(_build_row(bm, js['context']))
    return 0


if __name__ == '__main__':
    sys.exit(main(sys.argv))