/bench/tile_analyze.py
Python | 279 lines | 261 code | 8 blank | 10 comment | 0 complexity | 8688473ed9627e8e904e134c324a099f MD5 | raw file
- #!/usr/bin/env python
- # Copyright (c) 2013 The Chromium Authors. All rights reserved.
- # Use of this source code is governed by a BSD-style license that can be found
- # in the LICENSE file.
- """ Analyze per-tile and viewport bench data, and output visualized results.
- """
- __author__ = 'bensong@google.com (Ben Chen)'
- import bench_util
- import boto
- import math
- import optparse
- import os
- import re
- import shutil
- from oauth2_plugin import oauth2_plugin
# Google Storage location of the bot bench data: URI scheme and bucket name.
GOOGLE_STORAGE_URI_SCHEME, URI_BUCKET = 'gs', 'chromium-skia-gm'

# Platform analyzed when the OPTION_PLATFORM flag is not supplied.
DEFAULT_PLATFORM = 'Nexus10_4-1_Float_Bench_32'

# Upper bound on the number of tile rows tracked for viewport covering.
MAX_TILE_ROWS = 8
# Text and flag names handed to optparse.
USAGE_STRING = 'USAGE: %s [options]'

# Reminder about the library needed for reading from Google Storage.
HOWTO_STRING = (
    '\n'
    'Note: to read bench data stored in Google Storage, you will need to set '
    'up the\n'
    'corresponding Python library.\n'
    'See http://developers.google.com/storage/docs/gspythonlibrary for '
    'details.\n')

# Full description shown in the usage message; ends with HOWTO_STRING.
HELP_STRING = (
    '\n'
    'For the given platform and revision number, find corresponding viewport '
    'and\n'
    'tile benchmarks for each available picture bench, and output '
    'visualization and\n'
    "analysis in HTML. By default it reads from Skia's Google Storage "
    'location where\n'
    'bot data are stored, but if --dir is given, will read from local '
    'directory\n'
    'instead.\n') + HOWTO_STRING

# Long and short spellings of each command-line flag.
OPTION_DIR, OPTION_DIR_SHORT = '--dir', '-d'
OPTION_REVISION, OPTION_REVISION_SHORT = '--rev', '-r'
OPTION_PLATFORM, OPTION_PLATFORM_SHORT = '--platform', '-p'
# Default algorithm for turning a bench's samples into one representative
# value. See trunk/bench/bench_util.py.
REPRESENTATION_ALG = bench_util.ALGORITHM_25TH_PERCENTILE

# Long and short spellings of the flag that overrides REPRESENTATION_ALG.
OPTION_REPRESENTATION_ALG, OPTION_REPRESENTATION_ALG_SHORT = '--algorithm', '-a'
# Constants for bench file matching.
# Name prefix of the bench data objects inside the Google Storage bucket.
GOOGLE_STORAGE_OBJECT_NAME_PREFIX = 'perfdata/Skia_'
# Bench file name prefix; takes the revision number.
BENCH_FILE_PREFIX_TEMPLATE = 'bench_r%s_'
# Substrings marking a file name as a tiled or a viewport bench.
TILING_FILE_NAME_INDICATOR = '_tile_'
VIEWPORT_FILE_NAME_INDICATOR = '_viewport_'

# Regular expression for matching format '<integer>x<integer>'.
# Raw string: '\d' is not a valid escape in a normal string literal and newer
# Python versions warn about it.
DIMENSIONS_RE = r'(\d+)x(\d+)'
# HTML and JS output templates.

# Page head up to the opening brace of drawVisualization(); the generated JS
# and the closing '}</script></head><body>' are appended by the caller.
HTML_PREFIX = '\n'.join((
    '',
    '<html><head><script type="text/javascript" src="https://www.google.com/jsapi">',
    '</script><script type="text/javascript">google.load("visualization", "1.1",',
    '{packages:["table"]});google.load("prototype", "1.6");</script>',
    '<script type="text/javascript" src="https://systemsbiology-visualizations.googlecode.com/svn/trunk/src/main/js/load.js"></script><script',
    'type="text/javascript"> systemsbiology.load("visualization", "1.0",',
    '{packages:["bioheatmap"]});</script><script type="text/javascript">',
    'google.setOnLoadCallback(drawVisualization); function drawVisualization() {',
    ''))

HTML_SUFFIX = '</body></html>'

# Chart image URL, one query parameter per line. The two %s slots take the
# '|'-separated legends and the '|'-separated values, in that order.
BAR_CHART_TEMPLATE = (
    '<img src="https://chart.googleapis.com/chart'
    '?chxr=0,0,300'
    '&chxt=x'
    '&chbh=15,0'
    '&chs=600x150'
    '&cht=bhg'
    '&chco=80C65A,224499,FF0000,0A8C8A,EBB671,DE091A,000000,00ffff'
    '&chds=a'
    '&chdl=%s'
    '&chd=t:%s'
    '" /><br>\n')

# Options object literal passed to the heatmap's draw() call.
DRAW_OPTIONS = '{%s}' % ','.join((
    'passThroughBlack:false',
    'useRowLabels:false',
    'cellWidth:30',
    'cellHeight:30'))

# Options object literal passed to the data table's draw() call.
TABLE_OPTIONS = '{%s}' % ','.join((
    'showRowNumber:true',
    'firstRowNumber:" "',
    'sort:"disable"'))
def GetFiles(rev, bench_dir, platform):
  """Reads in bench files of interest into a dictionary.

  If bench_dir is not empty, reads local bench files from that directory;
  otherwise scans the Google Storage bucket. Files that are neither tile nor
  viewport benches, or that do not belong to revision rev, are ignored.

  Args:
    rev: revision number substituted into BENCH_FILE_PREFIX_TEMPLATE.
    bench_dir: local directory holding bench files, or an empty value to read
        from Google Storage.
    platform: platform name that a Google Storage object name must contain.
        Not used when reading from a local directory.

  Returns:
    Dictionary [filename] -> [file content].

  Raises:
    Exception: if no matching bench file is found.
  """
  rev_prefix = BENCH_FILE_PREFIX_TEMPLATE % rev
  file_dic = {}
  if not bench_dir:
    uri = boto.storage_uri(URI_BUCKET, GOOGLE_STORAGE_URI_SCHEME)
    # The boto API does not allow prefix/wildcard matching of Google Storage
    # objects. And Google Storage has a flat structure instead of being
    # organized in directories. Therefore, we have to scan all objects in the
    # Google Storage bucket to find the files we need, which is slow.
    # The option of implementing prefix matching as in gsutil seems to be
    # overkill, but gsutil does not provide an API ready for use. If speed is a
    # big concern, we suggest copying bot bench data from Google Storage using
    # gsutil and use --dir for fast local data reading.
    for obj in uri.get_bucket():
      name = obj.name
      # Filters out files of no interest.
      if (not name.startswith(GOOGLE_STORAGE_OBJECT_NAME_PREFIX) or
          (TILING_FILE_NAME_INDICATOR not in name and
           VIEWPORT_FILE_NAME_INDICATOR not in name) or
          platform not in name or
          rev_prefix not in name):
        continue
      # Keys are base names: everything after the last '/' of the object name.
      file_dic[name[name.rfind('/') + 1:]] = obj.get_contents_as_string()
  else:
    for file_name in os.listdir(bench_dir):
      path = os.path.join(bench_dir, file_name)
      if (not os.path.isfile(path) or
          (TILING_FILE_NAME_INDICATOR not in file_name and
           VIEWPORT_FILE_NAME_INDICATOR not in file_name) or
          not file_name.startswith(rev_prefix)):
        continue
      # Close each file promptly instead of leaking the handle.
      with open(path) as bench_file:
        file_dic[file_name] = bench_file.read()
  if not file_dic:
    raise Exception('No bench file found in "%s" or Google Storage.' %
                    bench_dir)
  return file_dic
def GetTileMatrix(layout, tile_size, values, viewport, max_tile_rows=None):
  """Builds the matrix of per-tile bench values that cover the viewport.

  Tiles outside the given viewport are set to 0. Tile rows are truncated to
  max_tile_rows to adjust for very long skp's.

  Args:
    layout: string '<w>x<h>' where <w> is the number of tile columns and <h>
        the number of tile rows.
    tile_size: string '<w>x<h>' giving the width and height of one tile.
    values: per-tile benches ordered row-by-row, starting from the top-left
        tile.
    viewport: string '<w>x<h>' giving the viewport width and height.
    max_tile_rows: maximum number of tile rows kept in the matrix. Defaults to
        MAX_TILE_ROWS when None.

  Returns:
    [sum, matrix] where sum is the total bench tile time that covers the
    viewport, and matrix (a list of rows) is used for visualizing the tiles.
  """
  if max_tile_rows is None:
    max_tile_rows = MAX_TILE_ROWS
  tile_cols, tile_rows = [int(i) for i in layout.split('x')]
  tile_width, tile_height = [int(i) for i in tile_size.split('x')]
  viewport_width, viewport_height = [int(i) for i in viewport.split('x')]
  # Integer ceiling division: number of tiles needed to span the viewport.
  viewport_cols = -(-viewport_width // tile_width)
  viewport_rows = -(-viewport_height // tile_height)
  truncated_tile_rows = min(tile_rows, max_tile_rows)
  covered_cols = min(viewport_cols, tile_cols)
  covered_rows = min(truncated_tile_rows, viewport_rows)

  matrix = [[0] * tile_cols for _ in range(truncated_tile_rows)]
  viewport_tile_sum = 0
  # Column-major traversal keeps the summation order of the values stable.
  for col in range(covered_cols):
    for row in range(covered_rows):
      tile_value = values[row * tile_cols + col]
      matrix[row][col] = tile_value
      viewport_tile_sum += tile_value
  return [viewport_tile_sum, matrix]
def GetTileVisCodes(suffix, matrix):
  """Produces the JS and HTML snippets that visualize one tile matrix.

  Args:
    suffix: string appended to every generated JS variable name and element id
        so that names do not clash across the whole html output.
    matrix: list of rows of bench values; the first row determines the number
        of columns.

  Returns:
    [js_codes, row1, row2]: js_codes fills a DataTable and draws it as a
    heatmap and as a table; row1 is the table cell hosting the heatmap; row2
    is the table cell hosting the data table.
  """
  column_count = len(matrix[0])

  js_parts = ['var data_%s=new google.visualization.DataTable();' % suffix]
  js_parts.extend(
      'data_%s.addColumn("number","%s");' % (suffix, column)
      for column in range(column_count))
  js_parts.append('data_%s.addRows(%s);' % (suffix, str(matrix)))

  # Heatmap chart, drawn into the element whose id is the suffix itself.
  js_parts.append('var heat_%s=new org.systemsbiology.visualization' % suffix)
  js_parts.append('.BioHeatMap(document.getElementById("%s"));' % suffix)
  js_parts.append(
      'heat_%s.draw(data_%s,%s);' % (suffix, suffix, DRAW_OPTIONS))

  # Data table chart, drawn into the element whose id is 't' + suffix.
  js_parts.append(
      'var table_%s=new google.visualization.Table(document.' % suffix)
  js_parts.append(
      'getElementById("t%s"));table_%s.draw(data_%s,%s);\n' % (
          suffix, suffix, suffix, TABLE_OPTIONS))

  heatmap_cell = '<td>%s<div id="%s"></div></td>' % (suffix, suffix)
  table_cell = '<td><div id="t%s"></div></td>' % suffix
  return [''.join(js_parts), heatmap_cell, table_cell]
def OutputTileAnalysis(rev, representation_alg, bench_dir, platform):
  """Reads skp bench data and outputs tile vs. viewport analysis.

  Args:
    rev: revision to analyze; data with other revisions is ignored.
    representation_alg: algorithm passed to bench_util.parse for calculating
        bench representations.
    bench_dir: if not empty, read from this local directory instead of Google
        Storage.
    platform: platform to analyze.

  Returns:
    (js_codes, body_codes): strings of js/html codes for stats and
    visualization. Benches without viewport data are omitted entirely.
  """
  js_codes = ''
  body_parts = ['}</script></head><body>'
                '<h3>PLATFORM: %s REVISION: %s</h3><br>' % (platform, rev)]
  bench_dic = {}  # [bench][config] -> [layout, [values]]
  file_dic = GetFiles(rev, bench_dir, platform)
  for f in file_dic:
    for point in bench_util.parse('', file_dic[f].split('\n'),
                                  representation_alg):
      if point.time_type:  # Ignores non-walltime time_type.
        continue
      bench = point.bench.replace('.skp', '')
      config = point.config.replace('simple_', '')
      components = config.split('_')
      if components[0] == 'viewport':
        # For viewport configs the "layout" slot holds the viewport size.
        entry = [components[1], [point.time]]
      else:  # Stores per-tile benches.
        entry = [point.tile_layout, point.per_tile_values]
      bench_dic.setdefault(bench, {})[config] = entry

  # sorted() works on both Python 2 lists and Python 3 dict views.
  for bench in sorted(bench_dic):
    configs = bench_dic[bench]
    keys = sorted(configs)
    # Checked before any markup is emitted so that a skipped bench does not
    # leave an unclosed <table><tr> in the output.
    if not keys[-1].startswith('viewport'):  # No viewport to analyze; skip.
      continue
    # Extracts viewport size, which for all viewport configs is the same.
    viewport = configs[keys[-1]][0]

    heat_plots = []  # For table row of heatmap plots.
    table_plots = []  # For table row of data table plots.
    # For bar plot legends and values in URL string.
    legends = []
    values = []
    for config in keys:
      layout, value_li = configs[config]
      if config.startswith('tile_'):  # For per-tile data, visualize tiles.
        tile_size = config.split('_')[1]
        if (not re.search(DIMENSIONS_RE, layout) or
            not re.search(DIMENSIONS_RE, tile_size) or
            not re.search(DIMENSIONS_RE, viewport)):
          continue  # Skip unrecognized formats.
        viewport_tile_sum, matrix = GetTileMatrix(
            layout, tile_size, value_li, viewport)
        values.append('%s' % viewport_tile_sum)
        this_js, row1, row2 = GetTileVisCodes(config + '_' + bench, matrix)
        heat_plots.append(row1)
        table_plots.append(row2)
        js_codes += this_js
      else:  # For viewport data, there is only one element in value_li.
        values.append('%s' % sum(value_li))
      # One legend per charted value so legends and data series line up.
      legends.append('%s:%s' % (config, sum(value_li)))

    body_parts.append('<h4>%s</h4><br><table><tr>' % bench)
    body_parts.append(
        ''.join(heat_plots) + '</tr><tr>' + ''.join(table_plots) +
        '</tr></table>' + '<br>' +
        BAR_CHART_TEMPLATE % ('|'.join(legends), '|'.join(values)))
  return (js_codes, ''.join(body_parts))
def main():
  """Parses flags and outputs expected Skia picture bench results.

  Prints the complete HTML page to standard output. Exits through
  parser.error() when the revision flag is missing or is not a number.
  """
  parser = optparse.OptionParser(USAGE_STRING % '%prog' + HELP_STRING)
  parser.add_option(OPTION_PLATFORM_SHORT, OPTION_PLATFORM,
      dest='plat', default=DEFAULT_PLATFORM,
      help=('Platform to analyze. '
            'Default to "%s".' % DEFAULT_PLATFORM))
  parser.add_option(OPTION_REVISION_SHORT, OPTION_REVISION,
      dest='rev',
      help='(Mandatory) revision number to analyze.')
  parser.add_option(OPTION_DIR_SHORT, OPTION_DIR,
      dest='log_dir', default='',
      help=('(Optional) local directory where bench log files reside. If left '
            'empty (by default), will try to read from Google Storage.'))
  parser.add_option(OPTION_REPRESENTATION_ALG_SHORT, OPTION_REPRESENTATION_ALG,
      dest='alg', default=REPRESENTATION_ALG,
      help=('Bench representation algorithm. '
            'Default to "%s".' % REPRESENTATION_ALG))
  # Positional arguments are not used.
  options, _ = parser.parse_args()
  if not (options.rev and options.rev.isdigit()):
    # parser.error() prints the message and exits; it does not return.
    parser.error('Please provide correct mandatory flag %s' % OPTION_REVISION)
  rev = int(options.rev)
  js_codes, body_codes = OutputTileAnalysis(
      rev, options.alg, options.log_dir, options.plat)
  # Single parenthesized argument: valid as both the Python 2 print statement
  # and the Python 3 print function.
  print(HTML_PREFIX + js_codes + body_codes + HTML_SUFFIX)
# Run the analysis only when executed as a script, not when imported.
if __name__ == '__main__':
  main()