2014-09-04 04:52:43 -07:00
|
|
|
# This Source Code Form is subject to the terms of the Mozilla Public
|
|
|
|
# License, v. 2.0. If a copy of the MPL was not distributed with this
|
|
|
|
# file, You can obtain one at http://mozilla.org/MPL/2.0/.
|
|
|
|
|
|
|
|
import argparse
|
|
|
|
import cStringIO
|
|
|
|
import gzip
|
|
|
|
import json
|
|
|
|
import os
|
|
|
|
import requests
|
|
|
|
import urlparse
|
|
|
|
|
|
|
|
treeherder_base = "https://treeherder.mozilla.org/"
|
|
|
|
|
|
|
|
"""Simple script for downloading structured logs from treeherder.
|
|
|
|
|
|
|
|
For the moment this is specialised to work with web-platform-tests
|
|
|
|
logs; in due course it should move somewhere generic and get hooked
|
|
|
|
up to mach or similar"""
|
|
|
|
|
|
|
|
# Interpretation of the "job" list from
|
|
|
|
# https://github.com/mozilla/treeherder-service/blob/master/treeherder/webapp/api/utils.py#L18
|
|
|
|
|
|
|
|
def create_parser():
    """Build the argument parser for this script.

    Two positional arguments are required: the branch the jobs ran on
    and the commit hash identifying the push.
    """
    parser = argparse.ArgumentParser()
    # Both arguments are plain stored positionals; register them from a
    # table to keep name and help text side by side.
    for arg_name, help_text in (("branch", "Branch on which jobs ran"),
                                ("commit", "Commit hash for push")):
        parser.add_argument(arg_name, action="store", help=help_text)
    return parser
|
|
|
|
|
|
|
|
def _choose_log_name(prefix, dest, force_suffix):
    """Pick a non-existing *.log path under dest.

    With force_suffix False and a non-empty prefix, try "<prefix>.log"
    first; otherwise (and on collision) append "-<counter>" (or just
    "<counter>" when prefix is empty) until an unused name is found.
    """
    if prefix and not force_suffix:
        name = os.path.join(dest, prefix + ".log")
    else:
        name = None
    counter = 0
    while not name or os.path.exists(name):
        counter += 1
        sep = "" if not prefix else "-"
        name = os.path.join(dest, prefix + sep + str(counter) + ".log")
    return name


def download(url, prefix, dest, force_suffix=True):
    """Download url to a uniquely-named <prefix>*.log file under dest.

    :param url: URL to fetch.
    :param prefix: Filename prefix for the saved log.
    :param dest: Destination directory (defaults to the current directory
                 when None).
    :param force_suffix: When True, always append a numeric suffix to the
                         filename even if "<prefix>.log" is free.
    """
    if dest is None:
        dest = "."

    name = _choose_log_name(prefix, dest, force_suffix)

    # Issue the request before opening the output file so that a failed
    # request does not leave an empty file behind (the original opened
    # the file first).
    resp = requests.get(url, stream=True)
    with open(name, "wb") as f:
        # Stream in 1 KiB chunks to avoid holding the whole log in memory.
        for chunk in resp.iter_content(1024):
            f.write(chunk)
|
2014-09-04 04:52:43 -07:00
|
|
|
|
|
|
|
def get_blobber_url(branch, job):
    """Return the blobber URL of the wpt_raw.log artifact for a job.

    Queries the Treeherder "Job Info" artifact for the given job and
    scans its job_details for an entry whose value is "wpt_raw.log".

    :param branch: Branch (Treeherder project) name.
    :param job: Job dict as returned by the Treeherder jobs API; only
                its "id" key is used here.
    :return: The artifact URL as a string, or None when the artifact is
             missing or the response is not shaped as expected.
    """
    job_id = job["id"]
    resp = requests.get(urlparse.urljoin(
        treeherder_base,
        "/api/project/%s/artifact/?job_id=%i&name=Job%%20Info" % (branch,
                                                                  job_id)))
    job_data = resp.json()

    if job_data:
        # The name filter should match exactly one artifact.
        assert len(job_data) == 1
        job_data = job_data[0]
        try:
            details = job_data["blob"]["job_details"]
            for item in details:
                if item["value"] == "wpt_raw.log":
                    return item["url"]
        # Narrowed from a bare except: malformed artifact JSON surfaces
        # as KeyError (missing key) or TypeError (wrong shape); anything
        # else (e.g. KeyboardInterrupt) should propagate.
        except (KeyError, TypeError):
            return None
    # No artifact data, or no wpt_raw.log entry found.
    return None
|
|
|
|
|
|
|
|
|
|
|
|
def get_structured_logs(branch, commit, dest=None):
    """Download wpt_raw.log for every web-platform-tests job in a push.

    :param branch: Branch (Treeherder project) name.
    :param commit: Commit hash identifying the push.
    :param dest: Directory to save logs into; None means the current
                 directory.
    """
    # Resolve the commit to a Treeherder result set (push) id.
    resp = requests.get(urlparse.urljoin(treeherder_base, "/api/project/%s/resultset/?revision=%s" % (branch, commit)))
    revision_data = resp.json()
    result_set = revision_data["results"][0]["id"]

    # Fetch all jobs for the push; exclusion_profile=false includes jobs
    # that would otherwise be hidden by the default exclusion profile.
    resp = requests.get(urlparse.urljoin(treeherder_base, "/api/project/%s/jobs/?result_set_id=%s&count=2000&exclusion_profile=false" % (branch, result_set)))
    job_data = resp.json()

    for result in job_data["results"]:
        job_type_name = result["job_type_name"]
        if job_type_name.startswith("W3C Web Platform"):
            url = get_blobber_url(branch, result)
            if url:
                prefix = result["platform"]  # platform
                # Bug fix: dest was previously dropped here (download was
                # called with None), so logs always landed in the cwd.
                download(url, prefix, dest)
|
2014-09-04 04:52:43 -07:00
|
|
|
|
|
|
|
def main():
    """Entry point: parse the command line and fetch the logs."""
    args = create_parser().parse_args()
    get_structured_logs(args.branch, args.commit)


if __name__ == "__main__":
    main()
|