skia2/gm/rebaseline_server/download_actuals.py
bungeman 842ab70966 Fix "Add support for rebaselining from trybots."
Commit d09ade4b44 was missing a needed edit.
2014-11-11 15:28:02 -05:00

287 lines
11 KiB
Python
Executable File

#!/usr/bin/python
"""
Copyright 2014 Google Inc.
Use of this source code is governed by a BSD-style license that can be
found in the LICENSE file.
Download actual GM results for a particular builder.
"""
# System-level imports
import httplib
import logging
import optparse
import os
import posixpath
import re
import urllib2
# Must fix up PYTHONPATH before importing from within Skia
import rs_fixpypath # pylint: disable=W0611
# Imports from within Skia
from py.utils import gs_utils
from py.utils import url_utils
import buildbot_globals
import gm_json
GM_SUMMARIES_BUCKET = buildbot_globals.Get('gm_summaries_bucket')
DEFAULT_ACTUALS_BASE_URL = (
'http://storage.googleapis.com/%s' % GM_SUMMARIES_BUCKET)
DEFAULT_JSON_FILENAME = 'actual-results.json'
class Download(object):
def __init__(self, actuals_base_url=DEFAULT_ACTUALS_BASE_URL,
json_filename=DEFAULT_JSON_FILENAME,
gm_actuals_root_url=gm_json.GM_ACTUALS_ROOT_HTTP_URL):
"""
Args:
actuals_base_url: URL pointing at the root directory
containing all actual-results.json files, e.g.,
http://domain.name/path/to/dir OR
file:///absolute/path/to/localdir
json_filename: The JSON filename to read from within each directory.
gm_actuals_root_url: Base URL under which the actually-generated-by-bots
GM images are stored.
"""
self._actuals_base_url = actuals_base_url
self._json_filename = json_filename
self._gm_actuals_root_url = gm_actuals_root_url
self._image_filename_re = re.compile(gm_json.IMAGE_FILENAME_PATTERN)
def fetch(self, builder_name, dest_dir):
""" Downloads actual GM results for a particular builder.
Args:
builder_name: which builder to download results of
dest_dir: path to directory where the image files will be written;
if the directory does not exist yet, it will be created
TODO(epoger): Display progress info. Right now, it can take a long time
to download all of the results, and there is no indication of progress.
TODO(epoger): Download multiple images in parallel to speed things up.
"""
json_url = posixpath.join(self._actuals_base_url, builder_name,
self._json_filename)
json_contents = urllib2.urlopen(json_url).read()
results_dict = gm_json.LoadFromString(json_contents)
actual_results_dict = results_dict[gm_json.JSONKEY_ACTUALRESULTS]
for result_type in sorted(actual_results_dict.keys()):
results_of_this_type = actual_results_dict[result_type]
if not results_of_this_type:
continue
for image_name in sorted(results_of_this_type.keys()):
(test, config) = self._image_filename_re.match(image_name).groups()
(hash_type, hash_digest) = results_of_this_type[image_name]
source_url = gm_json.CreateGmActualUrl(
test_name=test, hash_type=hash_type, hash_digest=hash_digest,
gm_actuals_root_url=self._gm_actuals_root_url)
dest_path = os.path.join(dest_dir, config, test + '.png')
url_utils.copy_contents(source_url=source_url, dest_path=dest_path,
create_subdirs_if_needed=True)
def get_builders_list(summaries_bucket=GM_SUMMARIES_BUCKET):
""" Returns the list of builders we have actual results for.
Args:
summaries_bucket: Google Cloud Storage bucket containing the summary
JSON files
"""
dirs, _ = gs_utils.GSUtils().list_bucket_contents(bucket=GM_SUMMARIES_BUCKET)
return dirs
class ActualLocation(object):
def __init__(self, bucket, path, generation):
self.bucket = bucket
self.path = path
self.generation = generation
class TipOfTreeActuals(object):
def __init__(self, summaries_bucket=GM_SUMMARIES_BUCKET,
json_filename=DEFAULT_JSON_FILENAME):
"""
Args:
summaries_bucket: URL pointing at the root directory
containing all actual-results.json files, e.g.,
http://domain.name/path/to/dir OR
file:///absolute/path/to/localdir
json_filename: The JSON filename to read from within each directory.
"""
self._json_filename = json_filename
self._summaries_bucket = summaries_bucket
def description(self):
return 'gm_summaries_bucket %s' % (self._summaries_bucket,)
def get_builders(self):
""" Returns the list of builders we have actual results for.
{builder:string -> ActualLocation}
"""
dirs = get_builders_list(self._summaries_bucket)
result = dict()
for builder in dirs:
result[builder] = ActualLocation(
self._summaries_bucket,
"%s/%s" % (builder, self._json_filename),
None)
return result
class RietveldIssueActuals(object):
def __init__(self, issue, json_filename=DEFAULT_JSON_FILENAME):
"""
Args:
issue: The rietveld issue from which to obtain actuals.
json_filename: The JSON filename to read from within each directory.
"""
self._issue = issue
self._json_filename = json_filename
def description(self):
return 'rietveld issue %s' % (self._issue,)
def get_builders(self):
""" Returns the actuals for the given rietveld issue's tryjobs.
{builder:string -> ActualLocation}
e.g.
{'Test-Android-Xoom-Tegra2-Arm7-Release': (
'chromium-skia-gm-summaries',
'Test-Android-Xoom-Tegra2-Arm7-Release-Trybot/actual-results.json',
'1415041165535000')}
"""
result = dict()
json_filename_re = re.compile(
'^Created: gs://([^/]+)/((?:[^/]+/)+%s)#(\d+)$'
% re.escape(self._json_filename), re.MULTILINE)
codereview_api_url = 'https://codereview.chromium.org/api'
upload_gm_step_url = '/steps/Upload GM Results/logs/stdio'
logging.info('Fetching issue %s ...' % (self._issue,))
json_issue_url = '%s/%s' % (codereview_api_url, self._issue)
json_issue_data = urllib2.urlopen(json_issue_url).read()
issue_dict = gm_json.LoadFromString(json_issue_data)
patchsets = issue_dict.get("patchsets", [])
patchset = patchsets[-1]
if not patchset:
logging.warning('No patchsets for rietveld issue %s.' % (self._issue,))
return result
logging.info('Fetching issue %s patch %s...' % (self._issue, patchset))
json_patchset_url = '%s/%s/%s' % (codereview_api_url, self._issue, patchset)
json_patchset_data = urllib2.urlopen(json_patchset_url).read()
patchset_dict = gm_json.LoadFromString(json_patchset_data)
# try_job_results is ordered reverse chronologically
try_job_results = patchset_dict.get('try_job_results', [])
for try_job_result in try_job_results:
try_builder = try_job_result.get('builder', '<bad builder>')
if not try_builder.endswith('-Trybot'):
logging.warning('Builder %s is not a trybot?' % (try_builder,))
continue
builder = try_builder[:-len('-Trybot')]
if builder in result:
continue
logging.info('Fetching issue %s patch %s try %s...' %
(self._issue, patchset, try_builder))
build_url = try_job_result.get('url', '<bad url>')
gm_upload_output_url = build_url + urllib2.quote(upload_gm_step_url)
logging.info('Fetching %s ...' % (gm_upload_output_url,))
# Tryjobs might not produce the step, but don't let that fail everything.
gm_upload_output = None
try:
gm_upload_output = urllib2.urlopen(gm_upload_output_url).read()
except (urllib2.HTTPError, urllib2.URLError, httplib.HTTPException) as e:
logging.warning(e)
except Exception:
logging.exception('Error opening %s .' % (gm_upload_output_url,))
if not gm_upload_output:
logging.warning('Could not fetch %s .' % (gm_upload_output_url,))
continue
json_filename_match = json_filename_re.search(gm_upload_output)
if json_filename_match:
logging.info('Found issue %s patch %s try %s result gs://%s/%s#%s .' %
(self._issue, patchset, builder,
json_filename_match.group(1),
json_filename_match.group(2),
json_filename_match.group(3)))
result[builder] = ActualLocation(json_filename_match.group(1),
json_filename_match.group(2),
json_filename_match.group(3))
else:
logging.warning('Did not find %s for issue %s patch %s try %s.' %
(self._json_filename, self._issue, patchset, try_builder))
return result
def main():
parser = optparse.OptionParser()
required_params = []
parser.add_option('--actuals-base-url',
action='store', type='string',
default=DEFAULT_ACTUALS_BASE_URL,
help=('Base URL from which to read files containing JSON '
'summaries of actual GM results; defaults to '
'"%default".'))
required_params.append('builder')
# TODO(epoger): Before https://codereview.chromium.org/309653005 , when this
# tool downloaded the JSON summaries from skia-autogen, it had the ability
# to get results as of a specific revision number. We should add similar
# functionality when retrieving the summaries from Google Storage.
parser.add_option('--builder',
action='store', type='string',
help=('REQUIRED: Which builder to download results for. '
'To see a list of builders, run with the '
'--list-builders option set.'))
required_params.append('dest_dir')
parser.add_option('--dest-dir',
action='store', type='string',
help=('REQUIRED: Directory where all images should be '
'written. If this directory does not exist yet, it '
'will be created.'))
parser.add_option('--json-filename',
action='store', type='string',
default=DEFAULT_JSON_FILENAME,
help=('JSON summary filename to read for each builder; '
'defaults to "%default".'))
parser.add_option('--list-builders', action='store_true',
help=('List all available builders.'))
(params, remaining_args) = parser.parse_args()
if params.list_builders:
print '\n'.join(get_builders_list())
return
# Make sure all required options were set,
# and that there were no items left over in the command line.
for required_param in required_params:
if not getattr(params, required_param):
raise Exception('required option \'%s\' was not set' % required_param)
if len(remaining_args) is not 0:
raise Exception('extra items specified in the command line: %s' %
remaining_args)
downloader = Download(actuals_base_url=params.actuals_base_url)
downloader.fetch(builder_name=params.builder,
dest_dir=params.dest_dir)
if __name__ == '__main__':
main()