Diffstat (limited to 'testing/jsshell/benchmark.py')
-rw-r--r--  testing/jsshell/benchmark.py  433
1 file changed, 433 insertions, 0 deletions
diff --git a/testing/jsshell/benchmark.py b/testing/jsshell/benchmark.py
new file mode 100644
index 0000000000..41a8db460e
--- /dev/null
+++ b/testing/jsshell/benchmark.py
@@ -0,0 +1,433 @@
+# This Source Code Form is subject to the terms of the Mozilla Public
+# License, v. 2.0. If a copy of the MPL was not distributed with this
+# file, You can obtain one at http://mozilla.org/MPL/2.0/.
+
+import six
+import json
+import os
+import re
+import shutil
+import sys
+from abc import ABCMeta, abstractmethod, abstractproperty
+from argparse import ArgumentParser
+from collections import defaultdict
+
+from mozbuild.base import MozbuildObject, BuildEnvironmentNotFoundException
+from mozprocess import run_and_wait
+
+here = os.path.abspath(os.path.dirname(__file__))
+build = MozbuildObject.from_environment(cwd=here)
+
+JSSHELL_NOT_FOUND = """
+Could not detect a JS shell. Either make sure you have a non-artifact build
+with `ac_add_options --enable-js-shell` or specify it with `--binary`.
+""".strip()
+
+
+@six.add_metaclass(ABCMeta)
+class Benchmark(object):
+    lower_is_better = True
+    should_alert = True
+
+    def __init__(self, shell, args=None, shell_name=None):
+        self.shell = shell
+        self.args = args
+        self.shell_name = shell_name
+
+    @abstractproperty
+    def unit(self):
+        """Returns the unit of measurement of the benchmark."""
+
+    @abstractproperty
+    def name(self):
+        """Returns the string name of the benchmark."""
+
+    @abstractproperty
+    def path(self):
+        """Return the path to the benchmark relative to topsrcdir."""
+
+    @abstractmethod
+    def process_line(self, proc, line):
+        """Process a line of stdout from the benchmark."""
+
+    @abstractmethod
+    def collect_results(self):
+        """Build the result after the process has finished."""
+
+    @property
+    def command(self):
+        """Returns the command to run as a list."""
+        cmd = [self.shell]
+        if self.args:
+            cmd += self.args
+        return cmd
+
+    @property
+    def version(self):
+        if self._version:
+            return self._version
+
+        with open(os.path.join(self.path, "VERSION"), "r") as fh:
+            self._version = fh.read().strip("\r\n\r\n \t")
+        return self._version
+
+    def reset(self):
+        """Resets state between runs."""
+        name = self.name
+        if self.shell_name:
+            name = "{}-{}".format(name, self.shell_name)
+
+        self.perfherder_data = {
+            "framework": {
+                "name": "js-bench",
+            },
+            "suites": [
+                {
+                    "lowerIsBetter": self.lower_is_better,
+                    "name": name,
+                    "shouldAlert": self.should_alert,
+                    "subtests": [],
+                    "unit": self.unit,
+                    "value": None,
+                },
+            ],
+        }
+        self.suite = self.perfherder_data["suites"][0]
+
+    def _provision_benchmark_script(self):
+        if os.path.isdir(self.path):
+            return
+
+        # Some benchmarks may have been downloaded from a fetch task, make
+        # sure they get copied over.
+        fetches_dir = os.environ.get("MOZ_FETCHES_DIR")
+        if fetches_dir and os.path.isdir(fetches_dir):
+            fetchdir = os.path.join(fetches_dir, self.name)
+            if os.path.isdir(fetchdir):
+                shutil.copytree(fetchdir, self.path)
+
+    def run(self):
+        self.reset()
+
+        # Update the environment variables
+        env = os.environ.copy()
+
+        process_args = {
+            "args": self.command,
+            "cwd": self.path,
+            "env": env,
+            "output_line_handler": self.process_line,
+        }
+        proc = run_and_wait(**process_args)
+        self.collect_results()
+        return proc.returncode
+
+
+class RunOnceBenchmark(Benchmark):
+    def collect_results(self):
+        bench_total = 0
+        # NOTE: for this benchmark we run the test once, so we have a single value array
+        for bench, scores in self.scores.items():
+            for score, values in scores.items():
+                test_name = "{}-{}".format(self.name, score)
+                # pylint --py3k W1619
+                mean = sum(values) / len(values)
+                self.suite["subtests"].append({"name": test_name, "value": mean})
+                bench_total += int(sum(values))
+        self.suite["value"] = bench_total
+
+
+class Ares6(Benchmark):
+    name = "ares6"
+    path = os.path.join("third_party", "webkit", "PerformanceTests", "ARES-6")
+    unit = "ms"
+
+    @property
+    def command(self):
+        cmd = super(Ares6, self).command
+        return cmd + ["cli.js"]
+
+    def reset(self):
+        super(Ares6, self).reset()
+
+        self.bench_name = None
+        self.last_summary = None
+        # Scores are of the form:
+        # {<bench_name>: {<score_name>: [<values>]}}
+        self.scores = defaultdict(lambda: defaultdict(list))
+
+    def _try_find_score(self, score_name, line):
+        m = re.search(score_name + r":\s*(\d+\.?\d*?) (\+-)?.+", line)
+        if not m:
+            return False
+
+        score = m.group(1)
+        self.scores[self.bench_name][score_name].append(float(score))
+        return True
+
+    def process_line(self, proc, line):
+        line = line.strip("\n")
+        print(line)
+        m = re.search(r"Running... (.+) \(.+\)", line)
+        if m:
+            self.bench_name = m.group(1)
+            return
+
+        if self._try_find_score("firstIteration", line):
+            return
+
+        if self._try_find_score("averageWorstCase", line):
+            return
+
+        if self._try_find_score("steadyState", line):
+            return
+
+        m = re.search(r"summary:\s*(\d+\.?\d*?) (\+-)?.+", line)
+        if m:
+            self.last_summary = float(m.group(1))
+
+    def collect_results(self):
+        for bench, scores in self.scores.items():
+            for score, values in scores.items():
+                # pylint --py3k W1619
+                mean = sum(values) / len(values)
+                test_name = "{}-{}".format(bench, score)
+                self.suite["subtests"].append({"name": test_name, "value": mean})
+
+        if self.last_summary:
+            self.suite["value"] = self.last_summary
+
+
+class SixSpeed(RunOnceBenchmark):
+    name = "six-speed"
+    path = os.path.join("third_party", "webkit", "PerformanceTests", "six-speed")
+    unit = "ms"
+
+    @property
+    def command(self):
+        cmd = super(SixSpeed, self).command
+        return cmd + ["test.js"]
+
+    def reset(self):
+        super(SixSpeed, self).reset()
+
+        # Scores are of the form:
+        # {<bench_name>: {<score_name>: [<values>]}}
+        self.scores = defaultdict(lambda: defaultdict(list))
+
+    def process_line(self, proc, output):
+        output = output.strip("\n")
+        print(output)
+        m = re.search(r"(.+): (\d+)", output)
+        if not m:
+            return
+        subtest = m.group(1)
+        score = m.group(2)
+        if subtest not in self.scores[self.name]:
+            self.scores[self.name][subtest] = []
+        self.scores[self.name][subtest].append(int(score))
+
+
+class SunSpider(RunOnceBenchmark):
+    name = "sunspider"
+    path = os.path.join(
+        "third_party", "webkit", "PerformanceTests", "SunSpider", "sunspider-0.9.1"
+    )
+    unit = "ms"
+
+    @property
+    def command(self):
+        cmd = super(SunSpider, self).command
+        return cmd + ["sunspider-standalone-driver.js"]
+
+    def reset(self):
+        super(SunSpider, self).reset()
+
+        # Scores are of the form:
+        # {<bench_name>: {<score_name>: [<values>]}}
+        self.scores = defaultdict(lambda: defaultdict(list))
+
+    def process_line(self, proc, output):
+        output = output.strip("\n")
+        print(output)
+        m = re.search(r"(.+): (\d+)", output)
+        if not m:
+            return
+        subtest = m.group(1)
+        score = m.group(2)
+        if subtest not in self.scores[self.name]:
+            self.scores[self.name][subtest] = []
+        self.scores[self.name][subtest].append(int(score))
+
+
+class WebToolingBenchmark(Benchmark):
+    name = "web-tooling-benchmark"
+    path = os.path.join(
+        "third_party", "webkit", "PerformanceTests", "web-tooling-benchmark"
+    )
+    main_js = "cli.js"
+    unit = "score"
+    lower_is_better = False
+    subtests_lower_is_better = False
+
+    @property
+    def command(self):
+        cmd = super(WebToolingBenchmark, self).command
+        return cmd + [self.main_js]
+
+    def reset(self):
+        super(WebToolingBenchmark, self).reset()
+
+        # Scores are of the form:
+        # {<bench_name>: {<score_name>: [<values>]}}
+        self.scores = defaultdict(lambda: defaultdict(list))
+
+    def process_line(self, proc, output):
+        output = output.strip("\n")
+        print(output)
+        m = re.search(r" +([a-zA-Z].+): +([.0-9]+) +runs/sec", output)
+        if not m:
+            return
+        subtest = m.group(1)
+        score = m.group(2)
+        if subtest not in self.scores[self.name]:
+            self.scores[self.name][subtest] = []
+        self.scores[self.name][subtest].append(float(score))
+
+    def collect_results(self):
+        # NOTE: for this benchmark we run the test once, so we have a single value array
+        bench_mean = None
+        for bench, scores in self.scores.items():
+            for score_name, values in scores.items():
+                test_name = "{}-{}".format(self.name, score_name)
+                # pylint --py3k W1619
+                mean = sum(values) / len(values)
+                self.suite["subtests"].append(
+                    {
+                        "lowerIsBetter": self.subtests_lower_is_better,
+                        "name": test_name,
+                        "value": mean,
+                    }
+                )
+                if score_name == "mean":
+                    bench_mean = mean
+        self.suite["value"] = bench_mean
+
+    def run(self):
+        self._provision_benchmark_script()
+        return super(WebToolingBenchmark, self).run()
+
+
+class Octane(RunOnceBenchmark):
+    name = "octane"
+    path = os.path.join("third_party", "webkit", "PerformanceTests", "octane")
+    unit = "score"
+    lower_is_better = False
+
+    @property
+    def command(self):
+        cmd = super(Octane, self).command
+        return cmd + ["run.js"]
+
+    def reset(self):
+        super(Octane, self).reset()
+
+        # Scores are of the form:
+        # {<bench_name>: {<score_name>: [<values>]}}
+        self.scores = defaultdict(lambda: defaultdict(list))
+
+    def process_line(self, proc, output):
+        output = output.strip("\n")
+        print(output)
+        m = re.search(r"(.+): (\d+)", output)
+        if not m:
+            return
+        subtest = m.group(1)
+        score = m.group(2)
+        if subtest.startswith("Score"):
+            subtest = "score"
+        if subtest not in self.scores[self.name]:
+            self.scores[self.name][subtest] = []
+        self.scores[self.name][subtest].append(int(score))
+
+    def collect_results(self):
+        bench_score = None
+        # NOTE: for this benchmark we run the test once, so we have a single value array
+        for bench, scores in self.scores.items():
+            for score_name, values in scores.items():
+                test_name = "{}-{}".format(self.name, score_name)
+                # pylint --py3k W1619
+                mean = sum(values) / len(values)
+                self.suite["subtests"].append({"name": test_name, "value": mean})
+                if score_name == "score":
+                    bench_score = mean
+        self.suite["value"] = bench_score
+
+    def run(self):
+        self._provision_benchmark_script()
+        return super(Octane, self).run()
+
+
+all_benchmarks = {
+    "ares6": Ares6,
+    "six-speed": SixSpeed,
+    "sunspider": SunSpider,
+    "web-tooling-benchmark": WebToolingBenchmark,
+    "octane": Octane,
+}
+
+
+def run(benchmark, binary=None, extra_args=None, perfherder=None):
+    if not binary:
+        try:
+            binary = os.path.join(build.bindir, "js" + build.substs["BIN_SUFFIX"])
+        except BuildEnvironmentNotFoundException:
+            binary = None
+
+        if not binary or not os.path.isfile(binary):
+            print(JSSHELL_NOT_FOUND)
+            return 1
+
+    bench = all_benchmarks.get(benchmark)(
+        binary, args=extra_args, shell_name=perfherder
+    )
+    res = bench.run()
+
+    if perfherder:
+        print("PERFHERDER_DATA: {}".format(json.dumps(bench.perfherder_data)))
+    return res
+
+
+def get_parser():
+    parser = ArgumentParser()
+    parser.add_argument(
+        "benchmark",
+        choices=list(all_benchmarks),
+        help="The name of the benchmark to run.",
+    )
+    parser.add_argument(
+        "-b", "--binary", default=None, help="Path to the JS shell binary to use."
+    )
+    parser.add_argument(
+        "--arg",
+        dest="extra_args",
+        action="append",
+        default=None,
+        help="Extra arguments to pass to the JS shell.",
+    )
+    parser.add_argument(
+        "--perfherder",
+        default=None,
+        help="Log PERFHERDER_DATA to stdout using the given suite name.",
+    )
+    return parser
+
+
+def cli(args=sys.argv[1:]):
+    parser = get_parser()
+    args = parser.parse_args(args)
+    return run(**vars(args))
+
+
+if __name__ == "__main__":
+    sys.exit(cli())