tools/run_tests/run_microbenchmark.py - third_party/grpc - Git at Google

 #!/usr/bin/env python
 # Copyright 2017 gRPC authors.
 #
 # Licensed under the Apache License, Version 2.0 (the "License");
 # you may not use this file except in compliance with the License.
 # You may obtain a copy of the License at
 #
 #     http://www.apache.org/licenses/LICENSE-2.0
 #
 # Unless required by applicable law or agreed to in writing, software
 # distributed under the License is distributed on an "AS IS" BASIS,
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.

 import cgi
 import multiprocessing
 import os
 import subprocess
 import sys
 import argparse

 import python_utils.jobset as jobset
 import python_utils.start_port_server as start_port_server

 sys.path.append(os.path.join(os.path.dirname(sys.argv[0]), '..', 'profiling', 'microbenchmarks', 'bm_diff'))
 import bm_constants

 # Location of a FlameGraph checkout in the current user's home directory.
 # NOTE(review): nothing else visible in this file reads this name --
 # presumably it documents where the flamegraph helper script expects the
 # tools to live; confirm before removing.
 flamegraph_dir = os.path.join(os.path.expanduser('~'), 'FlameGraph')

 # Work from two directories above this script so that the relative paths
 # used below ('bins/...', 'tools/...', 'reports/...') resolve.
 os.chdir(os.path.join(os.path.dirname(sys.argv[0]), '../..'))
 # Generated reports and the index page are written under ./reports.
 if not os.path.exists('reports'):
   os.makedirs('reports')

 # NOTE(review): start_port_server lives in python_utils and is not shown
 # here; presumably it launches the port server the benchmark binaries rely
 # on -- confirm against that module.
 start_port_server.start_port_server()

 def fnize(s):
   """Turn a benchmark name into a string usable as a file name.

   Each of the characters '<', '>', ',', ' ' and '/' is replaced by '_'.
   A replacement is dropped when the output built so far already ends in
   '_', so runs of such characters (or one following a literal '_')
   collapse into a single underscore.

   Args:
     s: The benchmark name.

   Returns:
     The sanitized name.
   """
   pieces = []
   for ch in s:
     if ch not in '<>, /':
       pieces.append(ch)
     elif not pieces or pieces[-1] != '_':
       pieces.append('_')
   return ''.join(pieces)

 # Accumulated HTML for reports/index.html. heading(), link() and text()
 # append to this string; the end of the script appends the closing
 # </body>/</html> tags and writes the result to disk.
 index_html = """
 <html>
 <head>
 <title>Microbenchmark Results</title>
 </head>
 <body>
 """

 def heading(name):
   """Append an <h1> section heading to the report index page.

   Args:
     name: Plain-text heading. It is HTML-escaped before insertion, the
       same way link() and text() treat their arguments, so characters such
       as '<' or '&' cannot corrupt the page markup.
   """
   global index_html
   index_html += "<h1>%s</h1>\n" % cgi.escape(name)

 def link(txt, tgt):
   """Append a paragraph containing one hyperlink to the report index page.

   Args:
     txt: Link label; HTML-escaped (quotes left as-is).
     tgt: Link target placed in the href attribute; HTML-escaped including
       double quotes so it cannot terminate the attribute early.
   """
   global index_html
   href = cgi.escape(tgt, quote=True)
   label = cgi.escape(txt)
   index_html = index_html + '<p><a href="%s">%s</a></p>\n' % (href, label)

 def text(txt):
   """Append a block of preformatted text to the report index page.

   Args:
     txt: Raw text; HTML-escaped and wrapped in <p><pre>...</pre></p>.
   """
   global index_html
   escaped = cgi.escape(txt)
   index_html = index_html + "<p><pre>%s</pre></p>\n" % escaped

 def _run_latency_batch(benchmarks, profile_analysis, cleanup):
   """Run one batch of latency jobs in three sequential phases.

   The phases must not overlap: every analysis job is pointed (--source) at
   the trace file named in its benchmark job's LATENCY_TRACE variable, and
   every cleanup job deletes that same file.

   Args:
     benchmarks: JobSpecs running the instrumented benchmark binary.
     profile_analysis: JobSpecs turning each trace into a text report.
     cleanup: JobSpecs removing the trace files.
   """
   cpus = multiprocessing.cpu_count()
   # run up to half the cpu count: each benchmark can use up to two cores
   # (one for the microbenchmark, one for the data flush). Floor division
   # keeps maxjobs an integer even where '/' is true division.
   jobset.run(benchmarks, maxjobs=max(1, cpus // 2))
   jobset.run(profile_analysis, maxjobs=cpus)
   jobset.run(cleanup, maxjobs=cpus)


 def collect_latency(bm_name, args):
   """generate latency profiles

   Builds bm_name with CONFIG=basicprof, asks the binary for its list of
   benchmarks, and for each one queues a profiling run, an analysis job that
   writes reports/<name>.txt, and a job that deletes the intermediate trace.
   A link to every report is added to the index page.

   Args:
     bm_name: Name of the microbenchmark make target / binary.
     args: Parsed command-line arguments. Unused here; accepted because all
       collectors are invoked with the same (bm_name, args) signature.

   Raises:
     subprocess.CalledProcessError: If the build or the benchmark listing
       exits with a non-zero status.
   """
   heading('Latency Profiles: %s' % bm_name)
   subprocess.check_call(
       ['make', bm_name,
        'CONFIG=basicprof', '-j', '%d' % multiprocessing.cpu_count()])
   binary = 'bins/basicprof/%s' % bm_name
   # periodically flush out the list of jobs: profile_analysis jobs at least
   # consume upwards of five gigabytes of ram in some cases, and so analysing
   # hundreds of them at once is impractical -- but we want at least some
   # concurrency or the work takes too long
   batch_size = min(16, multiprocessing.cpu_count())
   benchmarks = []
   profile_analysis = []
   cleanup = []
   listing = subprocess.check_output([binary, '--benchmark_list_tests'])
   for line in listing.splitlines():
     safe_name = fnize(line)
     trace_file = '%s.trace' % safe_name
     link(line, '%s.txt' % safe_name)
     benchmarks.append(
         jobset.JobSpec([binary,
                         '--benchmark_filter=^%s$' % line,
                         '--benchmark_min_time=0.05'],
                        environ={'LATENCY_TRACE': trace_file},
                        shortname='profile-%s' % safe_name))
     profile_analysis.append(
         jobset.JobSpec([sys.executable,
                         'tools/profiling/latency_profile/profile_analyzer.py',
                         '--source', trace_file, '--fmt', 'simple',
                         '--out', 'reports/%s.txt' % safe_name],
                        timeout_seconds=20*60,
                        shortname='analyze-%s' % safe_name))
     cleanup.append(jobset.JobSpec(['rm', trace_file]))
     if len(benchmarks) >= batch_size:
       _run_latency_batch(benchmarks, profile_analysis, cleanup)
       benchmarks = []
       profile_analysis = []
       cleanup = []
   # run the remaining benchmarks that weren't flushed
   if benchmarks:
     _run_latency_batch(benchmarks, profile_analysis, cleanup)

 def _run_perf_batch(benchmarks, profile_analysis, cleanup):
   """Run one batch of perf jobs in three sequential phases.

   Args:
     benchmarks: JobSpecs running the benchmark under 'perf record'.
     profile_analysis: JobSpecs running the flamegraph post-processing
       script.
     cleanup: JobSpecs removing the intermediate perf files.
   """
   # perf recordings run strictly one at a time (maxjobs=1).
   # NOTE(review): presumably so concurrent benchmarks do not perturb each
   # other's samples -- the original code does not state the reason.
   jobset.run(benchmarks, maxjobs=1)
   cpus = multiprocessing.cpu_count()
   jobset.run(profile_analysis, maxjobs=cpus)
   jobset.run(cleanup, maxjobs=cpus)


 def collect_perf(bm_name, args):
   """generate flamegraphs

   Builds bm_name with CONFIG=mutrace, asks the binary for its list of
   benchmarks, and for each one queues a 'perf record' run, a flamegraph
   post-processing job (configured with OUTPUT_DIR=reports), and jobs that
   delete the intermediate '<name>-perf.data' and '<name>-out.perf' files.
   A link to '<name>.svg' is added to the index page for every benchmark.

   Args:
     bm_name: Name of the microbenchmark make target / binary.
     args: Parsed command-line arguments. Unused here; accepted because all
       collectors are invoked with the same (bm_name, args) signature.

   Raises:
     subprocess.CalledProcessError: If the build or the benchmark listing
       exits with a non-zero status.
   """
   heading('Flamegraphs: %s' % bm_name)
   subprocess.check_call(
       ['make', bm_name,
        'CONFIG=mutrace', '-j', '%d' % multiprocessing.cpu_count()])
   binary = 'bins/mutrace/%s' % bm_name
   benchmarks = []
   profile_analysis = []
   cleanup = []
   listing = subprocess.check_output([binary, '--benchmark_list_tests'])
   for line in listing.splitlines():
     safe_name = fnize(line)
     perf_data = '%s-perf.data' % safe_name
     link(line, '%s.svg' % safe_name)
     benchmarks.append(
         jobset.JobSpec(['perf', 'record', '-o', perf_data,
                         '-g', '-F', '997',
                         binary,
                         '--benchmark_filter=^%s$' % line,
                         '--benchmark_min_time=10'],
                        shortname='perf-%s' % safe_name))
     profile_analysis.append(
         jobset.JobSpec(['tools/run_tests/performance/process_local_perf_flamegraphs.sh'],
                        environ={
                            'PERF_BASE_NAME': safe_name,
                            'OUTPUT_DIR': 'reports',
                            'OUTPUT_FILENAME': safe_name,
                        },
                        shortname='flame-%s' % safe_name))
     cleanup.append(jobset.JobSpec(['rm', perf_data]))
     cleanup.append(jobset.JobSpec(['rm', '%s-out.perf' % safe_name]))
     # periodically flush out the list of jobs: temporary space required for
     # this processing is large
     if len(benchmarks) >= 20:
       _run_perf_batch(benchmarks, profile_analysis, cleanup)
       benchmarks = []
       profile_analysis = []
       cleanup = []
   # run the remaining benchmarks that weren't flushed
   if benchmarks:
     _run_perf_batch(benchmarks, profile_analysis, cleanup)

 def run_summary(bm_name, cfg, base_json_name):
   """Build one benchmark configuration, run it, and return its output.

   The benchmark also writes JSON results to '<base_json_name>.<cfg>.json'.
   When the module-level command-line option args.summary_time is set, it
   is forwarded as --benchmark_min_time.

   Args:
     bm_name: Name of the microbenchmark make target / binary.
     cfg: Build configuration, used for CONFIG=<cfg> and the bins/<cfg>/
       directory.
     base_json_name: Prefix of the JSON output file name.

   Returns:
     Whatever the benchmark binary printed on stdout.

   Raises:
     subprocess.CalledProcessError: If the build or the benchmark run exits
       with a non-zero status.
   """
   jobs_flag = '%d' % multiprocessing.cpu_count()
   subprocess.check_call(['make', bm_name, 'CONFIG=%s' % cfg, '-j', jobs_flag])
   cmd = [
       'bins/%s/%s' % (cfg, bm_name),
       '--benchmark_out=%s.%s.json' % (base_json_name, cfg),
       '--benchmark_out_format=json',
   ]
   # 'args' is the module-level parse result, not a parameter of this
   # function.
   min_time = args.summary_time
   if min_time is not None:
     cmd.append('--benchmark_min_time=%d' % min_time)
   return subprocess.check_output(cmd)

 def collect_summary(bm_name, args):
   """Run the 'opt' and 'counters' builds and add their output to the index.

   When args.bigquery_upload is set, the two JSON result files are converted
   to '<bm_name>.csv' with bm2bq.py and loaded into the
   microbenchmarks.microbenchmarks table with the 'bq' command-line tool.

   Args:
     bm_name: Name of the microbenchmark make target / binary.
     args: Parsed command-line arguments; bigquery_upload is read here.

   Raises:
     subprocess.CalledProcessError: If any invoked command exits with a
       non-zero status.
   """
   summaries = (
       ('opt', 'Summary: %s [no counters]'),
       ('counters', 'Summary: %s [with counters]'),
   )
   for cfg, title in summaries:
     heading(title % bm_name)
     text(run_summary(bm_name, cfg, bm_name))
   if not args.bigquery_upload:
     return
   csv_name = '%s.csv' % bm_name
   # The file is opened before the converter runs, exactly as before, so a
   # failing conversion still leaves an (empty) csv behind.
   with open(csv_name, 'w') as csv_file:
     converter_cmd = ['tools/profiling/microbenchmarks/bm2bq.py',
                      '%s.counters.json' % bm_name,
                      '%s.opt.json' % bm_name]
     csv_file.write(subprocess.check_output(converter_cmd))
   subprocess.check_call(['bq', 'load', 'microbenchmarks.microbenchmarks', csv_name])

 # Maps each --collect choice to the function that gathers that kind of data.
 # Every collector is called as collector(bm_name, args).
 collectors = dict(
     latency=collect_latency,
     perf=collect_perf,
     summary=collect_summary,
 )

 argp = argparse.ArgumentParser(description='Collect data from microbenchmarks')
 argp.add_argument(
     '-c', '--collect',
     nargs='*',
     choices=sorted(collectors),
     default=sorted(collectors),
     help='Which collectors should be run against each benchmark')
 argp.add_argument(
     '-b', '--benchmarks',
     nargs='+',
     type=str,
     choices=bm_constants._AVAILABLE_BENCHMARK_TESTS,
     default=bm_constants._AVAILABLE_BENCHMARK_TESTS,
     help='Which microbenchmarks should be run')
 argp.add_argument(
     '--bigquery_upload',
     action='store_true',
     help='Upload results from summary collection to bigquery')
 argp.add_argument(
     '--summary_time',
     type=int,
     default=None,
     help='Minimum time to run benchmarks for the summary collection')
 args = argp.parse_args()

 try:
   # Collector-major order: one collector runs over every requested
   # benchmark before the next collector starts.
   for collector_name in args.collect:
     run_collector = collectors[collector_name]
     for bm_name in args.benchmarks:
       run_collector(bm_name, args)
 finally:
   # Write the index page even when a collector raised, so that whatever was
   # gathered up to that point is still browsable.
   if not os.path.exists('reports'):
     os.makedirs('reports')
   index_html = index_html + "</body>\n</html>\n"
   with open('reports/index.html', 'w') as index_file:
     index_file.write(index_html)
	#!/usr/bin/env python
	# Copyright 2017 gRPC authors.
	#
	# Licensed under the Apache License, Version 2.0 (the "License");
	# you may not use this file except in compliance with the License.
	# You may obtain a copy of the License at
	#
	# http://www.apache.org/licenses/LICENSE-2.0
	#
	# Unless required by applicable law or agreed to in writing, software
	# distributed under the License is distributed on an "AS IS" BASIS,
	# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
	# See the License for the specific language governing permissions and
	# limitations under the License.

	import cgi
	import multiprocessing
	import os
	import subprocess
	import sys
	import argparse

	import python_utils.jobset as jobset
	import python_utils.start_port_server as start_port_server

	sys.path.append(os.path.join(os.path.dirname(sys.argv[0]), '..', 'profiling', 'microbenchmarks', 'bm_diff'))
	import bm_constants

	# Location of a FlameGraph checkout in the current user's home directory.
	# NOTE(review): nothing else visible in this file reads this name --
	# presumably it documents where the flamegraph helper script expects the
	# tools to live; confirm before removing.
	flamegraph_dir = os.path.join(os.path.expanduser('~'), 'FlameGraph')

	# Work from two directories above this script so that the relative paths
	# used below ('bins/...', 'tools/...', 'reports/...') resolve.
	os.chdir(os.path.join(os.path.dirname(sys.argv[0]), '../..'))
	# Generated reports and the index page are written under ./reports.
	if not os.path.exists('reports'):
	  os.makedirs('reports')

	# NOTE(review): start_port_server lives in python_utils and is not shown
	# here; presumably it launches the port server the benchmark binaries rely
	# on -- confirm against that module.
	start_port_server.start_port_server()

	def fnize(s):
	  """Turn a benchmark name into a string usable as a file name.

	  Each of the characters '<', '>', ',', ' ' and '/' is replaced by '_'.
	  A replacement is dropped when the output built so far already ends in
	  '_', so runs of such characters (or one following a literal '_')
	  collapse into a single underscore.

	  Args:
	    s: The benchmark name.

	  Returns:
	    The sanitized name.
	  """
	  pieces = []
	  for ch in s:
	    if ch not in '<>, /':
	      pieces.append(ch)
	    elif not pieces or pieces[-1] != '_':
	      pieces.append('_')
	  return ''.join(pieces)

	# Accumulated HTML for reports/index.html. heading(), link() and text()
	# append to this string; the end of the script appends the closing
	# </body>/</html> tags and writes the result to disk.
	index_html = """
	<html>
	<head>
	<title>Microbenchmark Results</title>
	</head>
	<body>
	"""

	def heading(name):
	  """Append an <h1> section heading to the report index page.

	  Args:
	    name: Plain-text heading. It is HTML-escaped before insertion, the
	      same way link() and text() treat their arguments, so characters
	      such as '<' or '&' cannot corrupt the page markup.
	  """
	  global index_html
	  index_html += "<h1>%s</h1>\n" % cgi.escape(name)

	def link(txt, tgt):
	  """Append a paragraph containing one hyperlink to the report index page.

	  Args:
	    txt: Link label; HTML-escaped (quotes left as-is).
	    tgt: Link target placed in the href attribute; HTML-escaped including
	      double quotes so it cannot terminate the attribute early.
	  """
	  global index_html
	  index_html += "<p><a href=\"%s\">%s</a></p>\n" % (
	      cgi.escape(tgt, quote=True), cgi.escape(txt))

	def text(txt):
	  """Append a block of preformatted text to the report index page.

	  Args:
	    txt: Raw text; HTML-escaped and wrapped in <p><pre>...</pre></p>.
	  """
	  global index_html
	  index_html += "<p><pre>%s</pre></p>\n" % cgi.escape(txt)

	def _run_latency_batch(benchmarks, profile_analysis, cleanup):
	  """Run one batch of latency jobs in three sequential phases.

	  The phases must not overlap: every analysis job is pointed (--source) at
	  the trace file named in its benchmark job's LATENCY_TRACE variable, and
	  every cleanup job deletes that same file.

	  Args:
	    benchmarks: JobSpecs running the instrumented benchmark binary.
	    profile_analysis: JobSpecs turning each trace into a text report.
	    cleanup: JobSpecs removing the trace files.
	  """
	  cpus = multiprocessing.cpu_count()
	  # run up to half the cpu count: each benchmark can use up to two cores
	  # (one for the microbenchmark, one for the data flush). Floor division
	  # keeps maxjobs an integer even where '/' is true division.
	  jobset.run(benchmarks, maxjobs=max(1, cpus // 2))
	  jobset.run(profile_analysis, maxjobs=cpus)
	  jobset.run(cleanup, maxjobs=cpus)


	def collect_latency(bm_name, args):
	  """generate latency profiles

	  Builds bm_name with CONFIG=basicprof, asks the binary for its list of
	  benchmarks, and for each one queues a profiling run, an analysis job that
	  writes reports/<name>.txt, and a job that deletes the intermediate trace.
	  A link to every report is added to the index page.

	  Args:
	    bm_name: Name of the microbenchmark make target / binary.
	    args: Parsed command-line arguments. Unused here; accepted because all
	      collectors are invoked with the same (bm_name, args) signature.

	  Raises:
	    subprocess.CalledProcessError: If the build or the benchmark listing
	      exits with a non-zero status.
	  """
	  heading('Latency Profiles: %s' % bm_name)
	  subprocess.check_call(
	      ['make', bm_name,
	       'CONFIG=basicprof', '-j', '%d' % multiprocessing.cpu_count()])
	  binary = 'bins/basicprof/%s' % bm_name
	  # periodically flush out the list of jobs: profile_analysis jobs at least
	  # consume upwards of five gigabytes of ram in some cases, and so analysing
	  # hundreds of them at once is impractical -- but we want at least some
	  # concurrency or the work takes too long
	  batch_size = min(16, multiprocessing.cpu_count())
	  benchmarks = []
	  profile_analysis = []
	  cleanup = []
	  listing = subprocess.check_output([binary, '--benchmark_list_tests'])
	  for line in listing.splitlines():
	    safe_name = fnize(line)
	    trace_file = '%s.trace' % safe_name
	    link(line, '%s.txt' % safe_name)
	    benchmarks.append(
	        jobset.JobSpec([binary,
	                        '--benchmark_filter=^%s$' % line,
	                        '--benchmark_min_time=0.05'],
	                       environ={'LATENCY_TRACE': trace_file},
	                       shortname='profile-%s' % safe_name))
	    profile_analysis.append(
	        jobset.JobSpec([sys.executable,
	                        'tools/profiling/latency_profile/profile_analyzer.py',
	                        '--source', trace_file, '--fmt', 'simple',
	                        '--out', 'reports/%s.txt' % safe_name],
	                       timeout_seconds=20*60,
	                       shortname='analyze-%s' % safe_name))
	    cleanup.append(jobset.JobSpec(['rm', trace_file]))
	    if len(benchmarks) >= batch_size:
	      _run_latency_batch(benchmarks, profile_analysis, cleanup)
	      benchmarks = []
	      profile_analysis = []
	      cleanup = []
	  # run the remaining benchmarks that weren't flushed
	  if benchmarks:
	    _run_latency_batch(benchmarks, profile_analysis, cleanup)

	def _run_perf_batch(benchmarks, profile_analysis, cleanup):
	  """Run one batch of perf jobs in three sequential phases.

	  Args:
	    benchmarks: JobSpecs running the benchmark under 'perf record'.
	    profile_analysis: JobSpecs running the flamegraph post-processing
	      script.
	    cleanup: JobSpecs removing the intermediate perf files.
	  """
	  # perf recordings run strictly one at a time (maxjobs=1).
	  # NOTE(review): presumably so concurrent benchmarks do not perturb each
	  # other's samples -- the original code does not state the reason.
	  jobset.run(benchmarks, maxjobs=1)
	  cpus = multiprocessing.cpu_count()
	  jobset.run(profile_analysis, maxjobs=cpus)
	  jobset.run(cleanup, maxjobs=cpus)


	def collect_perf(bm_name, args):
	  """generate flamegraphs

	  Builds bm_name with CONFIG=mutrace, asks the binary for its list of
	  benchmarks, and for each one queues a 'perf record' run, a flamegraph
	  post-processing job (configured with OUTPUT_DIR=reports), and jobs that
	  delete the intermediate '<name>-perf.data' and '<name>-out.perf' files.
	  A link to '<name>.svg' is added to the index page for every benchmark.

	  Args:
	    bm_name: Name of the microbenchmark make target / binary.
	    args: Parsed command-line arguments. Unused here; accepted because all
	      collectors are invoked with the same (bm_name, args) signature.

	  Raises:
	    subprocess.CalledProcessError: If the build or the benchmark listing
	      exits with a non-zero status.
	  """
	  heading('Flamegraphs: %s' % bm_name)
	  subprocess.check_call(
	      ['make', bm_name,
	       'CONFIG=mutrace', '-j', '%d' % multiprocessing.cpu_count()])
	  binary = 'bins/mutrace/%s' % bm_name
	  benchmarks = []
	  profile_analysis = []
	  cleanup = []
	  listing = subprocess.check_output([binary, '--benchmark_list_tests'])
	  for line in listing.splitlines():
	    safe_name = fnize(line)
	    perf_data = '%s-perf.data' % safe_name
	    link(line, '%s.svg' % safe_name)
	    benchmarks.append(
	        jobset.JobSpec(['perf', 'record', '-o', perf_data,
	                        '-g', '-F', '997',
	                        binary,
	                        '--benchmark_filter=^%s$' % line,
	                        '--benchmark_min_time=10'],
	                       shortname='perf-%s' % safe_name))
	    profile_analysis.append(
	        jobset.JobSpec(['tools/run_tests/performance/process_local_perf_flamegraphs.sh'],
	                       environ={
	                           'PERF_BASE_NAME': safe_name,
	                           'OUTPUT_DIR': 'reports',
	                           'OUTPUT_FILENAME': safe_name,
	                       },
	                       shortname='flame-%s' % safe_name))
	    cleanup.append(jobset.JobSpec(['rm', perf_data]))
	    cleanup.append(jobset.JobSpec(['rm', '%s-out.perf' % safe_name]))
	    # periodically flush out the list of jobs: temporary space required for
	    # this processing is large
	    if len(benchmarks) >= 20:
	      _run_perf_batch(benchmarks, profile_analysis, cleanup)
	      benchmarks = []
	      profile_analysis = []
	      cleanup = []
	  # run the remaining benchmarks that weren't flushed
	  if benchmarks:
	    _run_perf_batch(benchmarks, profile_analysis, cleanup)

	def run_summary(bm_name, cfg, base_json_name):
	  """Build one benchmark configuration, run it, and return its output.

	  The benchmark also writes JSON results to '<base_json_name>.<cfg>.json'.
	  When the module-level command-line option args.summary_time is set, it
	  is forwarded as --benchmark_min_time.

	  Args:
	    bm_name: Name of the microbenchmark make target / binary.
	    cfg: Build configuration, used for CONFIG=<cfg> and the bins/<cfg>/
	      directory.
	    base_json_name: Prefix of the JSON output file name.

	  Returns:
	    Whatever the benchmark binary printed on stdout.

	  Raises:
	    subprocess.CalledProcessError: If the build or the benchmark run exits
	      with a non-zero status.
	  """
	  subprocess.check_call(
	      ['make', bm_name,
	       'CONFIG=%s' % cfg, '-j', '%d' % multiprocessing.cpu_count()])
	  cmd = ['bins/%s/%s' % (cfg, bm_name),
	         '--benchmark_out=%s.%s.json' % (base_json_name, cfg),
	         '--benchmark_out_format=json']
	  # 'args' is the module-level parse result, not a parameter of this
	  # function.
	  if args.summary_time is not None:
	    cmd += ['--benchmark_min_time=%d' % args.summary_time]
	  return subprocess.check_output(cmd)

	def collect_summary(bm_name, args):
	  """Run the 'opt' and 'counters' builds and add their output to the index.

	  When args.bigquery_upload is set, the two JSON result files are converted
	  to '<bm_name>.csv' with bm2bq.py and loaded into the
	  microbenchmarks.microbenchmarks table with the 'bq' command-line tool.

	  Args:
	    bm_name: Name of the microbenchmark make target / binary.
	    args: Parsed command-line arguments; bigquery_upload is read here.

	  Raises:
	    subprocess.CalledProcessError: If any invoked command exits with a
	      non-zero status.
	  """
	  heading('Summary: %s [no counters]' % bm_name)
	  text(run_summary(bm_name, 'opt', bm_name))
	  heading('Summary: %s [with counters]' % bm_name)
	  text(run_summary(bm_name, 'counters', bm_name))
	  if args.bigquery_upload:
	    with open('%s.csv' % bm_name, 'w') as f:
	      f.write(subprocess.check_output(['tools/profiling/microbenchmarks/bm2bq.py',
	                                       '%s.counters.json' % bm_name,
	                                       '%s.opt.json' % bm_name]))
	    subprocess.check_call(['bq', 'load', 'microbenchmarks.microbenchmarks', '%s.csv' % bm_name])

	# Maps each --collect choice to the function that gathers that kind of data.
	# Every collector is called as collector(bm_name, args).
	collectors = {
	  'latency': collect_latency,
	  'perf': collect_perf,
	  'summary': collect_summary,
	}

	argp = argparse.ArgumentParser(description='Collect data from microbenchmarks')
	argp.add_argument('-c', '--collect',
	                  choices=sorted(collectors.keys()),
	                  nargs='*',
	                  default=sorted(collectors.keys()),
	                  help='Which collectors should be run against each benchmark')
	argp.add_argument('-b', '--benchmarks',
	                  choices=bm_constants._AVAILABLE_BENCHMARK_TESTS,
	                  default=bm_constants._AVAILABLE_BENCHMARK_TESTS,
	                  nargs='+',
	                  type=str,
	                  help='Which microbenchmarks should be run')
	argp.add_argument('--bigquery_upload',
	                  default=False,
	                  action='store_const',
	                  const=True,
	                  help='Upload results from summary collection to bigquery')
	argp.add_argument('--summary_time',
	                  default=None,
	                  type=int,
	                  help='Minimum time to run benchmarks for the summary collection')
	args = argp.parse_args()

	try:
	  # Collector-major order: one collector runs over every requested
	  # benchmark before the next collector starts.
	  for collect in args.collect:
	    for bm_name in args.benchmarks:
	      collectors[collect](bm_name, args)
	finally:
	  # Write the index page even when a collector raised, so that whatever was
	  # gathered up to that point is still browsable.
	  if not os.path.exists('reports'):
	    os.makedirs('reports')
	  index_html += "</body>\n</html>\n"
	  with open('reports/index.html', 'w') as f:
	    f.write(index_html)