gecko-dev/testing/web-platform/manifestdownload.py

136 строки
4.3 KiB
Python

from __future__ import absolute_import
import argparse
import json
import os
from datetime import datetime, timedelta
import tarfile
import vcs
import requests
from cStringIO import StringIO
def abs_path(path):
return os.path.abspath(os.path.expanduser(path))
def hg_commits(repo_root):
hg = vcs.Mercurial.get_func(repo_root)
for item in hg("log", "-fl50", "--template={node}\n", "testing/web-platform/tests",
"testing/web-platform/mozilla/tests").splitlines():
yield item
def git_commits(repo_root):
git = vcs.Git.get_func(repo_root)
for item in git("log", "--format=%H", "-n50", "testing/web-platform/tests",
"testing/web-platform/mozilla/tests").splitlines():
yield git("cinnabar", "git2hg", item)
def get_commits(logger, repo_root):
if vcs.Mercurial.is_hg_repo(repo_root):
return hg_commits(repo_root)
elif vcs.Git.is_git_repo(repo_root):
return git_commits(repo_root)
logger.warning("No VCS found")
return False
def should_download(logger, manifest_path, rebuild_time=timedelta(days=5)):
# TODO: Improve logic for when to download. Maybe if x revisions behind?
if not os.path.exists(manifest_path):
return True
mtime = datetime.fromtimestamp(os.path.getmtime(manifest_path))
if mtime < datetime.now() - rebuild_time:
return True
logger.info("Skipping manifest download because existing file is recent")
return False
def taskcluster_url(logger, commits):
cset_url = ('https://hg.mozilla.org/mozilla-central/json-pushes?'
'changeset={changeset}&version=2&tipsonly=1')
tc_url = ('https://index.taskcluster.net/v1/task/gecko.v2.mozilla-central.'
'revision.{changeset}.source.manifest-upload')
for revision in commits:
req = requests.get(cset_url.format(changeset=revision),
headers={'Accept': 'application/json'})
req.raise_for_status()
result = req.json()
[cset] = result['pushes'].values()[0]['changesets']
req = requests.get(tc_url.format(changeset=cset))
if req.status_code == 200:
return tc_url.format(changeset=cset)
logger.info("Can't find a commit-specific manifest so just using the most"
"recent one")
return ("https://index.taskcluster.net/v1/task/gecko.v2.mozilla-central."
"latest.source.manifest-upload")
def download_manifest(logger, wpt_dir, commits_func, url_func, force=False):
if not force and not should_download(logger, os.path.join(wpt_dir, "meta", "MANIFEST.json")):
return False
commits = commits_func()
if not commits:
return False
url = url_func(logger, commits) + "/artifacts/public/manifests.tar.gz"
if not url:
logger.warning("No generated manifest found")
return False
logger.info("Downloading manifest from %s" % url)
try:
req = requests.get(url)
except Exception:
logger.warning("Downloading pregenerated manifest failed")
return False
if req.status_code != 200:
logger.warning("Downloading pregenerated manifest failed; got"
"HTTP status %d" % req.status_code)
return False
tar = tarfile.open(mode="r:gz", fileobj=StringIO(req.content))
try:
tar.extractall(path=wpt_dir)
except IOError:
logger.warning("Failed to decompress downloaded file")
return False
os.utime(os.path.join(wpt_dir, "meta", "MANIFEST.json"), None)
os.utime(os.path.join(wpt_dir, "mozilla", "meta", "MANIFEST.json"), None)
logger.info("Manifest downloaded")
return True
def create_parser():
parser = argparse.ArgumentParser()
parser.add_argument(
"-p", "--path", type=abs_path, help="Path to manifest file.")
parser.add_argument(
"--force", action="store_true",
help="Always download, even if the existing manifest is recent")
return parser
def download_from_taskcluster(logger, wpt_dir, repo_root, force=False):
return download_manifest(logger, wpt_dir, lambda: get_commits(logger, repo_root),
taskcluster_url, force)
def run(logger, wpt_dir, repo_root, force=False):
success = download_from_taskcluster(logger, wpt_dir, repo_root, force)
return 0 if success else 1