gecko-dev/testing/jsshell/benchmark.py

# This Source Code Form is subject to the terms of the Mozilla Public
# License, v. 2.0. If a copy of the MPL was not distributed with this
# file, You can obtain one at http://mozilla.org/MPL/2.0/.

from __future__ import absolute_import, print_function

import json
import os
import re
import shutil
import sys
from abc import ABCMeta, abstractmethod, abstractproperty
from argparse import ArgumentParser
from collections import defaultdict

from mozbuild.base import MozbuildObject, BuildEnvironmentNotFoundException
from mozprocess import ProcessHandler

here = os.path.abspath(os.path.dirname(__file__))
build = MozbuildObject.from_environment(cwd=here)

JSSHELL_NOT_FOUND = """
Could not detect a JS shell. Either make sure you have a non-artifact build
with `ac_add_options --enable-js-shell` or specify it with `--binary`.
""".strip()


class Benchmark(object):
    __metaclass__ = ABCMeta
    lower_is_better = True
    should_alert = False

    def __init__(self, shell, args=None, shell_name=None):
        self.shell = shell
        self.args = args
        self.shell_name = shell_name

    @abstractproperty
    def units(self):
        """Returns the unit of measurement of the benchmark."""

    @abstractproperty
    def name(self):
        """Returns the string name of the benchmark."""

    @abstractproperty
    def path(self):
        """Return the path to the benchmark relative to topsrcdir."""

    @abstractmethod
    def process_line(self, line):
        """Process a line of stdout from the benchmark."""

    @abstractmethod
    def collect_results(self):
        """Build the result after the process has finished."""

    @property
    def command(self):
        """Returns the command to run as a list."""
        cmd = [self.shell]
        if self.args:
            cmd += self.args
        return cmd

    @property
    def version(self):
        if self._version:
            return self._version

        with open(os.path.join(self.path, 'VERSION'), 'r') as fh:
            self._version = fh.read().strip("\r\n\r\n \t")
        return self._version

    def reset(self):
        """Resets state between runs."""
        name = self.name
        if self.shell_name:
            name = '{}-{}'.format(name, self.shell_name)

        self.perfherder_data = {
            'framework': {
                'name': 'js-bench',
            },
            'suites': [
                {
                    'lowerIsBetter': self.lower_is_better,
                    'name': name,
                    'shouldAlert': self.should_alert,
                    'subtests': [],
                    'units': self.units,
                    'value': None
                },
            ],
        }
        self.suite = self.perfherder_data['suites'][0]

    def _provision_benchmark_script(self):
        if os.path.isdir(self.path):
            return

        # Some benchmarks may have been downloaded from a fetch task, make
        # sure they get copied over.
        fetches_dir = os.environ.get('MOZ_FETCHES_DIR')
        if fetches_dir and os.path.isdir(fetches_dir):
            fetchdir = os.path.join(fetches_dir, self.name)
            if os.path.isdir(fetchdir):
                shutil.copytree(fetchdir, self.path)

    def run(self):
        self.reset()

        # Update the environment variables
        env = os.environ.copy()

        # disable "GC poisoning" Bug# 1499043
        env['JSGC_DISABLE_POISONING'] = '1'

        process_args = {
            'cmd': self.command,
            'cwd': self.path,
            'onFinish': self.collect_results,
            'processOutputLine': self.process_line,
            'stream': sys.stdout,
            'env': env,
        }
        proc = ProcessHandler(**process_args)
        proc.run()
        return proc.wait()


class RunOnceBenchmark(Benchmark):
    def collect_results(self):
        bench_total = 0
        # NOTE: for this benchmark we run the test once, so we have a single value array
        for bench, scores in self.scores.items():
            for score, values in scores.items():
                test_name = "{}-{}".format(self.name, score)
                mean = sum(values) / len(values)
                self.suite['subtests'].append({'name': test_name, 'value': mean})
                bench_total += int(sum(values))
        self.suite['value'] = bench_total


class Ares6(Benchmark):
    name = 'ares6'
    path = os.path.join('third_party', 'webkit', 'PerformanceTests', 'ARES-6')
    units = 'ms'

    @property
    def command(self):
        cmd = super(Ares6, self).command
        return cmd + ['cli.js']

    def reset(self):
        super(Ares6, self).reset()

        self.bench_name = None
        self.last_summary = None
        # Scores are of the form:
        # {<bench_name>: {<score_name>: [<values>]}}
        self.scores = defaultdict(lambda: defaultdict(list))

    def _try_find_score(self, score_name, line):
        m = re.search(score_name + ':\s*(\d+\.?\d*?) (\+-)?.+', line)
        if not m:
            return False

        score = m.group(1)
        self.scores[self.bench_name][score_name].append(float(score))
        return True

    def process_line(self, line):
        m = re.search("Running... (.+) \(.+\)", line)
        if m:
            self.bench_name = m.group(1)
            return

        if self._try_find_score('firstIteration', line):
            return

        if self._try_find_score('averageWorstCase', line):
            return

        if self._try_find_score('steadyState', line):
            return

        m = re.search('summary:\s*(\d+\.?\d*?) (\+-)?.+', line)
        if m:
            self.last_summary = float(m.group(1))

    def collect_results(self):
        for bench, scores in self.scores.items():
            for score, values in scores.items():
                mean = sum(values) / len(values)
                test_name = "{}-{}".format(bench, score)
                self.suite['subtests'].append({'name': test_name, 'value': mean})

        if self.last_summary:
            self.suite['value'] = self.last_summary


class SixSpeed(RunOnceBenchmark):
    name = 'six-speed'
    path = os.path.join('third_party', 'webkit', 'PerformanceTests', 'six-speed')
    units = 'ms'

    @property
    def command(self):
        cmd = super(SixSpeed, self).command
        return cmd + ['test.js']

    def reset(self):
        super(SixSpeed, self).reset()

        # Scores are of the form:
        # {<bench_name>: {<score_name>: [<values>]}}
        self.scores = defaultdict(lambda: defaultdict(list))

    def process_line(self, output):
        m = re.search("(.+): (\d+)", output)
        if not m:
            return
        subtest = m.group(1)
        score = m.group(2)
        if subtest not in self.scores[self.name]:
            self.scores[self.name][subtest] = []
        self.scores[self.name][subtest].append(int(score))


class SunSpider(RunOnceBenchmark):
    name = 'sunspider'
    path = os.path.join('third_party', 'webkit', 'PerformanceTests', 'SunSpider', 'sunspider-0.9.1')
    units = 'ms'

    @property
    def command(self):
        cmd = super(SunSpider, self).command
        return cmd + ['sunspider-standalone-driver.js']

    def reset(self):
        super(SunSpider, self).reset()

        # Scores are of the form:
        # {<bench_name>: {<score_name>: [<values>]}}
        self.scores = defaultdict(lambda: defaultdict(list))

    def process_line(self, output):
        m = re.search("(.+): (\d+)", output)
        if not m:
            return
        subtest = m.group(1)
        score = m.group(2)
        if subtest not in self.scores[self.name]:
            self.scores[self.name][subtest] = []
        self.scores[self.name][subtest].append(int(score))


class WebToolingBenchmark(Benchmark):
    name = 'web-tooling-benchmark'
    path = os.path.join('third_party', 'webkit', 'PerformanceTests', 'web-tooling-benchmark')
    main_js = 'cli.js'
    units = 'score'
    lower_is_better = False

    @property
    def command(self):
        cmd = super(WebToolingBenchmark, self).command
        return cmd + [self.main_js]

    def reset(self):
        super(WebToolingBenchmark, self).reset()

        # Scores are of the form:
        # {<bench_name>: {<score_name>: [<values>]}}
        self.scores = defaultdict(lambda: defaultdict(list))

    def process_line(self, output):
        m = re.search(" +([a-zA-Z].+): +([.0-9]+) +runs/sec", output)
        if not m:
            return
        subtest = m.group(1)
        score = m.group(2)
        if subtest not in self.scores[self.name]:
            self.scores[self.name][subtest] = []
        self.scores[self.name][subtest].append(float(score))

    def collect_results(self):
        # NOTE: for this benchmark we run the test once, so we have a single value array
        for bench, scores in self.scores.items():
            for score_name, values in scores.items():
                test_name = "{}-{}".format(self.name, score_name)
                mean = sum(values) / len(values)
                self.suite['subtests'].append({'name': test_name, 'value': mean})
                if score_name == 'mean':
                    bench_mean = mean
        self.suite['value'] = bench_mean

    def run(self):
        self._provision_benchmark_script()
        return super(WebToolingBenchmark, self).run()


class Octane(RunOnceBenchmark):
    name = 'octane'
    path = os.path.join('third_party', 'webkit', 'PerformanceTests', 'octane')
    units = 'score'
    lower_is_better = False

    @property
    def command(self):
        cmd = super(Octane, self).command
        return cmd + ['run.js']

    def reset(self):
        super(Octane, self).reset()

        # Scores are of the form:
        # {<bench_name>: {<score_name>: [<values>]}}
        self.scores = defaultdict(lambda: defaultdict(list))

    def process_line(self, output):
        m = re.search("(.+): (\d+)", output)
        if not m:
            return
        subtest = m.group(1)
        score = m.group(2)
        if subtest.startswith('Score'):
            subtest = 'score'
        if subtest not in self.scores[self.name]:
            self.scores[self.name][subtest] = []
        self.scores[self.name][subtest].append(int(score))

    def collect_results(self):
        # NOTE: for this benchmark we run the test once, so we have a single value array
        for bench, scores in self.scores.items():
            for score_name, values in scores.items():
                test_name = "{}-{}".format(self.name, score_name)
                mean = sum(values) / len(values)
                self.suite['subtests'].append({'name': test_name, 'value': mean})
                if score_name == 'score':
                    bench_score = mean
        self.suite['value'] = bench_score

    def run(self):
        self._provision_benchmark_script()
        return super(Octane, self).run()


all_benchmarks = {
    'ares6': Ares6,
    'six-speed': SixSpeed,
    'sunspider': SunSpider,
    'web-tooling-benchmark': WebToolingBenchmark,
    'octane': Octane
}


def run(benchmark, binary=None, extra_args=None, perfherder=None):
    if not binary:
        try:
            binary = os.path.join(build.bindir, 'js' + build.substs['BIN_SUFFIX'])
        except BuildEnvironmentNotFoundException:
            binary = None

        if not binary or not os.path.isfile(binary):
            print(JSSHELL_NOT_FOUND)
            return 1

    bench = all_benchmarks.get(benchmark)(binary, args=extra_args, shell_name=perfherder)
    res = bench.run()

    if perfherder:
        print("PERFHERDER_DATA: {}".format(json.dumps(bench.perfherder_data)))
    return res


def get_parser():
    parser = ArgumentParser()
    parser.add_argument('benchmark', choices=all_benchmarks.keys(),
                        help="The name of the benchmark to run.")
    parser.add_argument('-b', '--binary', default=None,
                        help="Path to the JS shell binary to use.")
    parser.add_argument('--arg', dest='extra_args', action='append', default=None,
                        help="Extra arguments to pass to the JS shell.")
    parser.add_argument('--perfherder', default=None,
                        help="Log PERFHERDER_DATA to stdout using the given suite name.")
    return parser


def cli(args=sys.argv[1:]):
    parser = get_parser()
    args = parser.parser_args(args)
    return run(**vars(args))


if __name__ == '__main__':
    sys.exit(cli())