Speed up latency profiling (and tune down the memory usage)

commit: ece502fa12ae9db7fc969f0bae1f7c26ece1dce3 [log] [tgz]
author: Craig Tiller <ctiller@google.com> Fri Feb 17 16:20:50 2017 -0800
committer: Craig Tiller <ctiller@google.com> Fri Feb 17 16:20:50 2017 -0800
tree: 278a8706a3522790ef68cc2b078502c91f593e0b
parent: 9c30e98ce5c5df7ad08cfb06919e213a32f87485 [diff] [blame]
diff --git a/tools/run_tests/run_microbenchmark.py b/tools/run_tests/run_microbenchmark.py
index a9a563c..1cafffb 100755
--- a/tools/run_tests/run_microbenchmark.py
+++ b/tools/run_tests/run_microbenchmark.py

@@ -91,7 +91,9 @@
                                        '--benchmark_list_tests']).splitlines():
     link(line, '%s.txt' % fnize(line))
     benchmarks.append(
-        jobset.JobSpec(['bins/basicprof/%s' % bm_name, '--benchmark_filter=^%s$' % line],
+        jobset.JobSpec(['bins/basicprof/%s' % bm_name,
+                        '--benchmark_filter=^%s$' % line,
+                        '--benchmark_min_time=0.05'],
                        environ={'LATENCY_TRACE': '%s.trace' % fnize(line)}))
     profile_analysis.append(
         jobset.JobSpec([sys.executable,
@@ -103,7 +105,7 @@
     # consume upwards of five gigabytes of ram in some cases, and so analysing
     # hundreds of them at once is impractical -- but we want at least some
     # concurrency or the work takes too long
-    if len(benchmarks) >= min(4, multiprocessing.cpu_count()):
+    if len(benchmarks) >= min(16, multiprocessing.cpu_count()):
       # run up to half the cpu count: each benchmark can use up to two cores
       # (one for the microbenchmark, one for the data flush)
       jobset.run(benchmarks, maxjobs=max(1, multiprocessing.cpu_count()/2),
commit	ece502fa12ae9db7fc969f0bae1f7c26ece1dce3	[log] [tgz]
author	Craig Tiller <ctiller@google.com>	Fri Feb 17 16:20:50 2017 -0800
committer	Craig Tiller <ctiller@google.com>	Fri Feb 17 16:20:50 2017 -0800
tree	278a8706a3522790ef68cc2b078502c91f593e0b
parent	9c30e98ce5c5df7ad08cfb06919e213a32f87485 [diff] [blame]