gecko-dev/testing/web-platform/update/fetchlogs.py

# This Source Code Form is subject to the terms of the Mozilla Public
# License, v. 2.0. If a copy of the MPL was not distributed with this
# file, You can obtain one at http://mozilla.org/MPL/2.0/.

import argparse
import os
import requests
import urlparse

treeherder_base = "https://treeherder.mozilla.org/"

"""Simple script for downloading structured logs from treeherder.

For the moment this is specialised to work with web-platform-tests
logs; in due course it should move somewhere generic and get hooked
up to mach or similar"""

# Interpretation of the "job" list from
# https://github.com/mozilla/treeherder-service/blob/master/treeherder/webapp/api/utils.py#L18


def create_parser():
    """Build the command-line parser for this script.

    The parser takes two required positional arguments, in this order:
    ``branch`` and ``commit``.

    :returns: the configured ``argparse.ArgumentParser``.
    """
    positionals = (
        ("branch", "Branch on which jobs ran"),
        ("commit", "Commit hash for push"),
    )

    cli = argparse.ArgumentParser()
    for arg_name, arg_help in positionals:
        cli.add_argument(arg_name, action="store", help=arg_help)
    return cli


def download(url, prefix, dest, force_suffix=True):
    """Download ``url`` into a new ``.log`` file inside ``dest``.

    An existing file is never overwritten: a counter is incremented until
    the generated file name does not exist yet.

    :param url: URL of the log to fetch.
    :param prefix: Base of the file name. May be empty or None, in which
                   case the file is named after the counter alone
                   (``1.log``, ``2.log``, ...).
    :param dest: Directory to write into; None means the current directory.
    :param force_suffix: When true (the default) the name is always
                         ``<prefix>-<n>.log``. When false, ``<prefix>.log``
                         is tried first and numbering is only used if that
                         file already exists.
    :raises requests.HTTPError: if the server answers with an error status.
    """
    if dest is None:
        dest = "."

    # Treat a missing prefix like an empty one so the string concatenation
    # below cannot fail with a TypeError.
    prefix = prefix or ""

    if prefix and not force_suffix:
        name = os.path.join(dest, prefix + ".log")
    else:
        name = None
    counter = 0

    while not name or os.path.exists(name):
        counter += 1
        sep = "-" if prefix else ""
        name = os.path.join(dest, prefix + sep + str(counter) + ".log")

    # Issue the request before creating the file so that a failed download
    # does not leave an empty or bogus log behind. The timeout matches the
    # one used by fetch_json.
    resp = requests.get(url, stream=True, timeout=30)
    try:
        # Refuse to store an HTTP error page as if it were a log.
        resp.raise_for_status()
        with open(name, "wb") as f:
            for chunk in resp.iter_content(1024):
                f.write(chunk)
    finally:
        # A streamed response holds its connection until it is closed.
        resp.close()


def fetch_json(url, params=None):
    """GET ``url`` and return the decoded JSON body.

    The request asks for JSON, identifies itself with the
    ``wpt-fetchlogs`` user agent and uses a 30 second timeout.

    :param url: URL to request.
    :param params: Optional query-string parameters passed to requests.
    :returns: whatever ``response.json()`` yields for the reply.
    :raises requests.HTTPError: via ``raise_for_status`` on an error status.
    """
    request_headers = {'Accept': 'application/json', 'User-Agent': 'wpt-fetchlogs'}
    reply = requests.get(url=url,
                         params=params,
                         headers=request_headers,
                         timeout=30)
    reply.raise_for_status()
    payload = reply.json()
    return payload


def get_blobber_url(branch, job):
    """Return the URL of the raw structured log recorded for ``job``.

    Queries the ``/api/jobdetail/`` endpoint for the job's guid and returns
    the ``url`` of the first detail whose ``value`` is ``wpt_raw.log`` or
    ``log_raw.log``.

    :param branch: Not used by this function; kept so existing callers
                   keep working.
    :param job: Job dictionary; must contain a ``job_guid`` key.
    :returns: The log URL, or None when the response is empty, has no
              matching detail, or does not have the expected structure.
    """
    job_guid = job["job_guid"]
    artifact_url = urlparse.urljoin(treeherder_base, "/api/jobdetail/")
    artifact_params = {
        'job_guid': job_guid,
    }
    job_data = fetch_json(artifact_url, params=artifact_params)

    if not job_data:
        return None

    try:
        for item in job_data["results"]:
            if item["value"] in ("wpt_raw.log", "log_raw.log"):
                return item["url"]
    except (KeyError, TypeError):
        # The response did not have the expected shape. Only these lookup
        # errors are treated as "no log"; anything else (including
        # KeyboardInterrupt) is allowed to propagate.
        return None

    return None


def get_structured_logs(branch, commit, dest=None):
    """Download the raw logs of every web-platform-tests job of a push.

    Looks up the result set for ``commit`` on ``branch``, lists its jobs
    (up to 2000) and, for each job whose type name starts with
    ``W3C Web Platform`` or looks like ``test-...-web-platform-tests-...``,
    downloads the log returned by ``get_blobber_url``. Files are named
    after the job's ``platform`` value.

    :param branch: Project/branch name used in the API URLs.
    :param commit: Revision to look up.
    :param dest: Directory to store the logs in; None lets ``download``
                 pick its default.
    :raises IndexError: if no result set is returned for the revision.
    """
    resultset_url = urlparse.urljoin(treeherder_base, "/api/project/%s/resultset/" % branch)
    resultset_params = {
        'revision': commit,
    }
    revision_data = fetch_json(resultset_url, params=resultset_params)
    result_sets = revision_data["results"]
    if not result_sets:
        # Same exception type as indexing the empty list would raise, but
        # with a message that says what actually went wrong.
        raise IndexError("No result set found on %s for revision %s" % (branch, commit))
    result_set = result_sets[0]["id"]

    jobs_url = urlparse.urljoin(treeherder_base, "/api/project/%s/jobs/" % branch)
    jobs_params = {
        'result_set_id': result_set,
        'count': 2000,
        'exclusion_profile': 'false',
    }
    job_data = fetch_json(jobs_url, params=jobs_params)

    for result in job_data["results"]:
        job_type_name = result["job_type_name"]
        # Two naming schemes are accepted; the parentheses spell out the
        # precedence the condition relies on.
        is_wpt_job = (job_type_name.startswith("W3C Web Platform") or
                      (job_type_name.startswith("test-") and
                       "-web-platform-tests-" in job_type_name))
        if not is_wpt_job:
            continue

        url = get_blobber_url(branch, result)
        if url:
            prefix = result["platform"]
            # Honour the caller's destination instead of discarding it.
            download(url, prefix, dest)


def main():
    """Parse the command line and fetch the logs for the requested push."""
    options = create_parser().parse_args()
    get_structured_logs(options.branch, options.commit)

# Run the downloader only when this file is executed as a script, so that
# importing the module has no side effects.
if __name__ == "__main__":
    main()
Bug 945222 - Initial import of web-platform-tests testsuite 4/4 : Integration with build system, mach and mozharness, r=ahal,gps --HG-- extra : rebase_source : 0d704f5a3edcbcef56d15b76ef26aae1b7232c4d 2014-09-04 15:52:43 +04:00			`# This Source Code Form is subject to the terms of the Mozilla Public`
			`# License, v. 2.0. If a copy of the MPL was not distributed with this`
			`# file, You can obtain one at http://mozilla.org/MPL/2.0/.`

			`import argparse`
			`import os`
			`import requests`
			`import urlparse`

			`treeherder_base = "https://treeherder.mozilla.org/"`

			`"""Simple script for downloading structured logs from treeherder.`

			`For the moment this is specialised to work with web-platform-tests`
			`logs; in due course it should move somewhere generic and get hooked`
			`up to mach or similar"""`

			`# Interpretation of the "job" list from`
			`# https://github.com/mozilla/treeherder-service/blob/master/treeherder/webapp/api/utils.py#L18`

Bug 1248710 - Add a User Agent to fetchlogs.py's requests to Treeherder Also removes some unused imports and whitespace flake8 warnings. 2016-02-21 23:14:56 +03:00
Bug 945222 - Initial import of web-platform-tests testsuite 4/4 : Integration with build system, mach and mozharness, r=ahal,gps --HG-- extra : rebase_source : 0d704f5a3edcbcef56d15b76ef26aae1b7232c4d 2014-09-04 15:52:43 +04:00			`def create_parser():`
			`parser = argparse.ArgumentParser()`
			`parser.add_argument("branch", action="store",`
			`help="Branch on which jobs ran")`
			`parser.add_argument("commit",`
			`action="store",`
			`help="Commit hash for push")`

			`return parser`

Bug 1248710 - Add a User Agent to fetchlogs.py's requests to Treeherder Also removes some unused imports and whitespace flake8 warnings. 2016-02-21 23:14:56 +03:00
Bug 945222 - Initial import of web-platform-tests testsuite 4/4 : Integration with build system, mach and mozharness, r=ahal,gps --HG-- extra : rebase_source : 0d704f5a3edcbcef56d15b76ef26aae1b7232c4d 2014-09-04 15:52:43 +04:00			`def download(url, prefix, dest, force_suffix=True):`
			`if dest is None:`
			`dest = "."`

			`if prefix and not force_suffix:`
			`name = os.path.join(dest, prefix + ".log")`
			`else:`
			`name = None`
			`counter = 0`

			`while not name or os.path.exists(name):`
			`counter += 1`
			`sep = "" if not prefix else "-"`
			`name = os.path.join(dest, prefix + sep + str(counter) + ".log")`

			`with open(name, "wb") as f:`
Bug 1102907 - Script for allowing web-platform-tests changes to be upstreamed, r=ahal This extends the upstream update script with steps for pushing local changes to upstream. The general approach is to look for all commits to the tests directory since the last sync, rewrite those so they apply to upstream at the last sync point, then rebase onto the sync commit, before creating and merging a PR for each in turn. --HG-- rename : testing/web-platform/fetchlogs.py => testing/web-platform/update/fetchlogs.py 2015-01-13 12:42:40 +03:00			`resp = requests.get(url, stream=True)`
			`for chunk in resp.iter_content(1024):`
			`f.write(chunk)`
Bug 945222 - Initial import of web-platform-tests testsuite 4/4 : Integration with build system, mach and mozharness, r=ahal,gps --HG-- extra : rebase_source : 0d704f5a3edcbcef56d15b76ef26aae1b7232c4d 2014-09-04 15:52:43 +04:00
Bug 1248710 - Add a User Agent to fetchlogs.py's requests to Treeherder Also removes some unused imports and whitespace flake8 warnings. 2016-02-21 23:14:56 +03:00
			`def fetch_json(url, params=None):`
			`headers = {`
			`'Accept': 'application/json',`
			`'User-Agent': 'wpt-fetchlogs',`
			`}`
			`response = requests.get(url=url, params=params, headers=headers, timeout=30)`
			`response.raise_for_status()`
			`return response.json()`


Bug 945222 - Initial import of web-platform-tests testsuite 4/4 : Integration with build system, mach and mozharness, r=ahal,gps --HG-- extra : rebase_source : 0d704f5a3edcbcef56d15b76ef26aae1b7232c4d 2014-09-04 15:52:43 +04:00			`def get_blobber_url(branch, job):`
Bug 1279534 - Update wpt log fetching script for treeherder changes, r=wlach MozReview-Commit-ID: J52eCZJUp6Q 2016-06-10 15:16:56 +03:00			`job_guid = job["job_guid"]`
			`artifact_url = urlparse.urljoin(treeherder_base, "/api/jobdetail/")`
Bug 1248710 - Add a User Agent to fetchlogs.py's requests to Treeherder Also removes some unused imports and whitespace flake8 warnings. 2016-02-21 23:14:56 +03:00			`artifact_params = {`
Bug 1279534 - Update wpt log fetching script for treeherder changes, r=wlach MozReview-Commit-ID: J52eCZJUp6Q 2016-06-10 15:16:56 +03:00			`'job_guid': job_guid,`
Bug 1248710 - Add a User Agent to fetchlogs.py's requests to Treeherder Also removes some unused imports and whitespace flake8 warnings. 2016-02-21 23:14:56 +03:00			`}`
			`job_data = fetch_json(artifact_url, params=artifact_params)`
Bug 1140143 - Fix wpt log fetching script for treeherder changes, r=edmorley 2015-03-02 17:07:09 +03:00
Bug 945222 - Initial import of web-platform-tests testsuite 4/4 : Integration with build system, mach and mozharness, r=ahal,gps --HG-- extra : rebase_source : 0d704f5a3edcbcef56d15b76ef26aae1b7232c4d 2014-09-04 15:52:43 +04:00			`if job_data:`
			`try:`
Bug 1279534 - Update wpt log fetching script for treeherder changes, r=wlach MozReview-Commit-ID: J52eCZJUp6Q 2016-06-10 15:16:56 +03:00			`for item in job_data["results"]:`
Bug 1331899 - Update fetchlogs script to work with taskcluster, r=emorley MozReview-Commit-ID: 3ENwyvJaXJY 2017-01-16 21:32:16 +03:00			`if item["value"] == "wpt_raw.log" or item["value"] == "log_raw.log":`
Bug 945222 - Initial import of web-platform-tests testsuite 4/4 : Integration with build system, mach and mozharness, r=ahal,gps --HG-- extra : rebase_source : 0d704f5a3edcbcef56d15b76ef26aae1b7232c4d 2014-09-04 15:52:43 +04:00			`return item["url"]`
			`except:`
			`return None`


			`def get_structured_logs(branch, commit, dest=None):`
Bug 1248710 - Add a User Agent to fetchlogs.py's requests to Treeherder Also removes some unused imports and whitespace flake8 warnings. 2016-02-21 23:14:56 +03:00			`resultset_url = urlparse.urljoin(treeherder_base, "/api/project/%s/resultset/" % branch)`
			`resultset_params = {`
			`'revision': commit,`
			`}`
			`revision_data = fetch_json(resultset_url, params=resultset_params)`
Bug 1140143 - Fix wpt log fetching script for treeherder changes, r=edmorley 2015-03-02 17:07:09 +03:00			`result_set = revision_data["results"][0]["id"]`

Bug 1248710 - Add a User Agent to fetchlogs.py's requests to Treeherder Also removes some unused imports and whitespace flake8 warnings. 2016-02-21 23:14:56 +03:00			`jobs_url = urlparse.urljoin(treeherder_base, "/api/project/%s/jobs/" % branch)`
			`jobs_params = {`
			`'result_set_id': result_set,`
			`'count': 2000,`
			`'exclusion_profile': 'false',`
			`}`
			`job_data = fetch_json(jobs_url, params=jobs_params)`
Bug 945222 - Initial import of web-platform-tests testsuite 4/4 : Integration with build system, mach and mozharness, r=ahal,gps --HG-- extra : rebase_source : 0d704f5a3edcbcef56d15b76ef26aae1b7232c4d 2014-09-04 15:52:43 +04:00
			`for result in job_data["results"]:`
Bug 1140143 - Fix wpt log fetching script for treeherder changes, r=edmorley 2015-03-02 17:07:09 +03:00			`job_type_name = result["job_type_name"]`
Bug 1331899 - Update fetchlogs script to work with taskcluster, r=emorley MozReview-Commit-ID: 3ENwyvJaXJY 2017-01-16 21:32:16 +03:00			`if (job_type_name.startswith("W3C Web Platform") or`
			`job_type_name.startswith("test-") and "-web-platform-tests-" in job_type_name):`
Bug 1140143 - Fix wpt log fetching script for treeherder changes, r=edmorley 2015-03-02 17:07:09 +03:00			`url = get_blobber_url(branch, result)`
			`if url:`
			`prefix = result["platform"] # platform`
			`download(url, prefix, None)`
Bug 945222 - Initial import of web-platform-tests testsuite 4/4 : Integration with build system, mach and mozharness, r=ahal,gps --HG-- extra : rebase_source : 0d704f5a3edcbcef56d15b76ef26aae1b7232c4d 2014-09-04 15:52:43 +04:00
Bug 1248710 - Add a User Agent to fetchlogs.py's requests to Treeherder Also removes some unused imports and whitespace flake8 warnings. 2016-02-21 23:14:56 +03:00
Bug 945222 - Initial import of web-platform-tests testsuite 4/4 : Integration with build system, mach and mozharness, r=ahal,gps --HG-- extra : rebase_source : 0d704f5a3edcbcef56d15b76ef26aae1b7232c4d 2014-09-04 15:52:43 +04:00			`def main():`
			`parser = create_parser()`
			`args = parser.parse_args()`

			`get_structured_logs(args.branch, args.commit)`

			`if __name__ == "__main__":`
			`main()`