Commit d3bf2a16 authored by Juan Antonio Navarro Perez, committed by Commit Bot

[tools/perf] Add BenchmarkRunnerIntegrationTest

Add an integration test for benchmark running and results processing.
This includes writing traces and running metrics on them.

The test can also serve as an example for writing other integration
tests (e.g. for ad hoc measurements).
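For instance, a hypothetical ad hoc measurement test could reuse the
RunBenchmark helper by adding another test method to
BenchmarkRunnerIntegrationTest. The sketch below is illustrative only:
the method name, AdHocBenchmark class, 'someAdHocMetric' and
'ad_hoc_story' are placeholders not included in this change, and it
assumes test_stories.SinglePageStorySet can be called with a name only.

  def testAdHocMeasurement(self):
    class AdHocBenchmark(perf_benchmark.PerfBenchmark):
      """Hypothetical benchmark that runs a custom TBMv2 metric."""

      def CreateCoreTimelineBasedMeasurementOptions(self):
        options = timeline_based_measurement.Options()
        options.config.enable_chrome_trace = True
        # Placeholder metric name; substitute a real TBMv2 metric here.
        options.SetTimelineBasedMetrics(['someAdHocMetric'])
        return options

      def CreateStorySet(self, _):
        return test_stories.SinglePageStorySet(name='ad_hoc_story')

      @classmethod
      def Name(cls):
        return 'test_benchmark.ad_hoc'

    histograms = self.RunBenchmark(AdHocBenchmark)
    # Assert on whichever histograms the chosen metric is expected to emit.

Trace recording, results processing, and loading of histograms.json are
all handled by the shared RunBenchmark helper.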

This test is intended to replace the existing testTBM2ForSmoke:
https://cs.chromium.org/chromium/src/third_party/catapult/telemetry/telemetry/web_perf/timeline_based_measurement_unittest.py?rcl=0b1af463167af25923a31dd190b41a32841e05fe&l=99

Note: depends on first landing
https://chromium-review.googlesource.com/c/catapult/+/1847392

Bug: 1012227
Change-Id: I784a0e08a495f3489e46ac4c8b9e83857ff8cc98
Reviewed-on: https://chromium-review.googlesource.com/c/chromium/src/+/1847340
Commit-Queue: Juan Antonio Navarro Pérez <perezju@chromium.org>
Reviewed-by: Caleb Rouleau <crouleau@chromium.org>
Cr-Commit-Position: refs/heads/master@{#705534}
parent dd4c10b0
# Copyright 2019 The Chromium Authors. All rights reserved.
# Use of this source code is governed by a BSD-style license that can be
# found in the LICENSE file.

import json
import os
import shutil
import tempfile
import unittest

import mock

from telemetry.testing import options_for_unittests
from telemetry.testing import test_stories
from telemetry.web_perf import timeline_based_measurement
from tracing.value.diagnostics import all_diagnostics
from tracing.value.diagnostics import reserved_infos
from tracing.value import histogram_set

from core import benchmark_runner
from core import perf_benchmark
from core import results_processor


def _FakeParseArgs(environment, args, results_arg_parser):
  del environment  # Unused.
  options, _ = results_arg_parser.parse_known_args(args)
  return options
class BenchmarkRunnerUnittest(unittest.TestCase):
  """Tests for benchmark_runner.main which mock out benchmark running."""

  def testMain_ReturnCode(self):
    """Test that benchmark_runner.main() respects return code from Telemetry."""
    config = mock.Mock()
    with mock.patch('core.benchmark_runner.command_line') as telemetry_cli:
      telemetry_cli.ParseArgs.side_effect = _FakeParseArgs
      telemetry_cli.RunCommand.return_value = 42
      # Note: We pass `--output-format none` and a non-existent output
      # dir to prevent the results processor from processing any results.
      return_code = benchmark_runner.main(config, [
          'run', 'some.benchmark', '--browser', 'stable',
          '--output-dir', '/does/not/exist', '--output-format', 'none'])
      self.assertEqual(return_code, 42)
class BenchmarkRunnerIntegrationTest(unittest.TestCase):
  """Integration tests for benchmark running and results processing.

  Note, however, no command line processing is tested.
  """

  def setUp(self):
    self.options = options_for_unittests.GetRunOptions(
        output_dir=tempfile.mkdtemp())
    self.options.output_formats = ['histograms']

  def tearDown(self):
    shutil.rmtree(self.options.output_dir)

  def assertHasDiagnostic(self, hist, diag_info, value=None):
    """Assert that a histogram is associated with the given diagnostic."""
    self.assertIn(diag_info.name, hist.diagnostics)
    diag = hist.diagnostics[diag_info.name]
    self.assertIsInstance(
        diag, all_diagnostics.GetDiagnosticClassForName(diag_info.type))
    if value is not None:
      # Assume we expect singleton GenericSet with the given value.
      self.assertEqual(len(diag), 1)
      self.assertEqual(next(iter(diag)), value)

  def RunBenchmark(self, benchmark_class):
    """Run a benchmark, process results, and return generated histograms."""
    # TODO(crbug.com/985712): Ideally we should be able to just call
    # telemetry.command_line.RunCommand(self.options) with the right set
    # of options chosen. However, argument parsing and command running are
    # currently tangled in Telemetry. In particular the class property
    # Run._benchmark is not set when we skip argument parsing, and the Run.Run
    # method call fails. Simplify this when argument parsing and command
    # running are no longer intertwined like this.
    run_return_code = benchmark_class().Run(self.options)
    self.assertEqual(run_return_code, 0)

    process_return_code = results_processor.ProcessResults(self.options)
    self.assertEqual(process_return_code, 0)

    histograms_file = os.path.join(self.options.output_dir, 'histograms.json')
    self.assertTrue(os.path.exists(histograms_file))

    with open(histograms_file) as f:
      dicts = json.load(f)
    histograms = histogram_set.HistogramSet()
    histograms.ImportDicts(dicts)
    return histograms
  def testTimelineBasedEndToEnd(self):
    class TestTimelineBasedBenchmark(perf_benchmark.PerfBenchmark):
      """A dummy benchmark that records a trace and runs consoleErrorMetric on it."""

      def CreateCoreTimelineBasedMeasurementOptions(self):
        options = timeline_based_measurement.Options()
        options.config.enable_chrome_trace = True
        options.SetTimelineBasedMetrics(['consoleErrorMetric'])
        return options

      def CreateStorySet(self, _):
        def log_error(action_runner):
          action_runner.EvaluateJavaScript('console.error("foo!")')
        return test_stories.SinglePageStorySet(
            name='log_error_story', story_run_side_effect=log_error)

      @classmethod
      def Name(cls):
        return 'test_benchmark.timeline_based'

    histograms = self.RunBenchmark(TestTimelineBasedBenchmark)

    # Verify that the injected console.error call was counted by the metric.
    hist = histograms.GetHistogramNamed('console:error:js')
    self.assertEqual(hist.average, 1)
    self.assertHasDiagnostic(hist, reserved_infos.BENCHMARKS,
                             'test_benchmark.timeline_based')
    self.assertHasDiagnostic(hist, reserved_infos.STORIES, 'log_error_story')
    self.assertHasDiagnostic(hist, reserved_infos.STORYSET_REPEATS, 0)
    self.assertHasDiagnostic(hist, reserved_infos.TRACE_START)
# Copyright 2019 The Chromium Authors. All rights reserved.
# Use of this source code is governed by a BSD-style license that can be
# found in the LICENSE file.

import unittest

import mock

from core import benchmark_runner


def _FakeParseArgs(environment, args, results_arg_parser):
  del environment  # Unused.
  options, _ = results_arg_parser.parse_known_args(args)
  return options


class BenchmarkRunnerUnittest(unittest.TestCase):
  def testMain_returnCode(self):
    """Test that benchmark_runner.main() respects return code from Telemetry."""
    # TODO(crbug.com/985712): Ideally we should write a more "integration" kind
    # of test, where we don't mock out the Telemetry command line. This is
    # hard to do now, however, because we need a way to convert the browser
    # selection done by the test runner, back to a suitable --browser arg for
    # the command line below. Namely, we need an equivalent of
    # options_for_unittests.GetCopy() that returns a list of string args
    # rather than the parsed options object.
    config = mock.Mock()
    with mock.patch('core.benchmark_runner.command_line') as telemetry_cli:
      telemetry_cli.ParseArgs.side_effect = _FakeParseArgs
      telemetry_cli.RunCommand.return_value = 42
      # Note: For now we pass `--output-format none` and a non-existent output
      # dir to prevent the results processor from processing any results.
      return_code = benchmark_runner.main(config, [
          'run', 'some.benchmark', '--browser', 'stable',
          '--output-dir', '/does/not/exist', '--output-format', 'none'])
      self.assertEqual(return_code, 42)