callstats.py 28 KB
Newer Older
1 2 3 4 5
#!/usr/bin/env python
# Copyright 2016 the V8 project authors. All rights reserved.
# Use of this source code is governed by a BSD-style license that can be
# found in the LICENSE file.
'''
6
Usage: callstats.py [-h] <command> ...
7 8 9 10 11 12 13 14 15 16 17 18 19

Optional arguments:
  -h, --help  show this help message and exit

Commands:
  run         run chrome with --runtime-call-stats and generate logs
  stats       process logs and print statistics
  json        process logs from several versions and generate JSON
  help        help information

For each command, you can try ./runtime-call-stats.py help command.
'''

20 21 22
# for py2/py3 compatibility
from __future__ import print_function

23 24 25 26 27 28 29 30
import argparse
import json
import os
import re
import shutil
import subprocess
import sys
import tempfile
31
import operator
32
from callstats_groups import RUNTIME_CALL_STATS_GROUPS
33 34 35 36 37

import numpy
from math import sqrt


38 39 40
MAX_NOF_RETRIES = 5


41 42 43 44 45 46 47 48 49 50
# Run benchmarks.

def print_command(cmd_args):
  def fix_for_printing(arg):
    m = re.match(r'^--([^=]+)=(.*)$', arg)
    if m and (' ' in m.group(2) or m.group(2).startswith('-')):
      arg = "--{}='{}'".format(m.group(1), m.group(2))
    elif ' ' in arg:
      arg = "'{}'".format(arg)
    return arg
51
  print(" ".join(map(fix_for_printing, cmd_args)))
52 53


54
def start_replay_server(args, sites, discard_output=True):
55 56 57
  with tempfile.NamedTemporaryFile(prefix='callstats-inject-', suffix='.js',
                                   mode='wt', delete=False) as f:
    injection = f.name
58
    generate_injection(f, sites, args.refresh)
59 60
  http_port = 4080 + args.port_offset
  https_port = 4443 + args.port_offset
61 62
  cmd_args = [
      args.replay_bin,
63 64
      "--port=%s" % http_port,
      "--ssl_port=%s" % https_port,
65 66 67
      "--no-dns_forwarding",
      "--use_closest_match",
      "--no-diff_unknown_requests",
68
      "--inject_scripts=deterministic.js,{}".format(injection),
69 70
      args.replay_wpr,
  ]
71
  print("=" * 80)
72
  print_command(cmd_args)
73 74 75 76 77
  if discard_output:
    with open(os.devnull, 'w') as null:
      server = subprocess.Popen(cmd_args, stdout=null, stderr=null)
  else:
      server = subprocess.Popen(cmd_args)
78 79
  print("RUNNING REPLAY SERVER: %s with PID=%s" % (args.replay_bin, server.pid))
  print("=" * 80)
80
  return {'process': server, 'injection': injection}
81 82 83


def stop_replay_server(server):
84 85 86 87 88
  print("SHUTTING DOWN REPLAY SERVER %s" % server['process'].pid)
  server['process'].terminate()
  os.remove(server['injection'])


89
def generate_injection(f, sites, refreshes=0):
90
  print("""\
91
(function() {
92 93 94 95
  var s = window.sessionStorage.getItem("refreshCounter");
  var refreshTotal = """, refreshes, """;
  var refreshCounter = s ? parseInt(s) : refreshTotal;
  var refreshId = refreshTotal - refreshCounter;
96 97 98
  if (refreshCounter > 0) {
    window.sessionStorage.setItem("refreshCounter", refreshCounter-1);
  }
99
  function match(url, item) {
100 101 102
    if ('regexp' in item) { return url.match(item.regexp) !== null };
    var url_wanted = item.url;
    /* Allow automatic redirections from http to https. */
103 104 105 106
    if (url_wanted.startsWith("http://") && url.startsWith("https://")) {
      url_wanted = "https://" + url_wanted.substr(7);
    }
    return url.startsWith(url_wanted);
107
  };
108 109
  function onLoad(url) {
    for (var item of sites) {
110
      if (!match(url, item)) continue;
111
      var timeout = 'timeline' in item ? 2000 * item.timeline
112 113 114
                  : 'timeout'  in item ? 1000 * (item.timeout - 3)
                  : 10000;
      console.log("Setting time out of " + timeout + " for: " + url);
115
      window.setTimeout(function() {
116
        console.log("Time is out for: " + url);
117
        var msg = "STATS: (" + refreshId + ") " + url;
118 119
        %GetAndResetRuntimeCallStats(1, msg);
        if (refreshCounter > 0) {
120 121
          console.log(
              "Refresh counter is " + refreshCounter + ", refreshing: " + url);
122 123
          window.location.reload();
        }
124 125 126 127 128
      }, timeout);
      return;
    }
    console.log("Ignoring: " + url);
  };
129 130 131
  var sites =
    """, json.dumps(sites), """;
  onLoad(window.location.href);
132
})();""", file=f)
133

134
def get_chrome_flags(js_flags, user_data_dir, arg_delimiter=""):
135 136 137 138 139
  return [
      "--no-default-browser-check",
      "--no-sandbox",
      "--disable-translate",
      "--enable-benchmarking",
140 141
      "--enable-stats-table",
      "--js-flags={}{}{}".format(arg_delimiter, js_flags, arg_delimiter),
142
      "--no-first-run",
143 144
      "--user-data-dir={}{}{}".format(arg_delimiter, user_data_dir,
                                      arg_delimiter),
145 146
      "--data-path={}{}{}".format(arg_delimiter,
          os.path.join(user_data_dir, 'content-shell-data'), arg_delimiter),
147 148
    ]

149
def get_chrome_replay_flags(args, arg_delimiter=""):
150 151 152
  http_port = 4080 + args.port_offset
  https_port = 4443 + args.port_offset
  return [
153 154 155 156 157
      "--host-resolver-rules=%sMAP *:80 localhost:%s, "  \
                              "MAP *:443 localhost:%s, " \
                              "EXCLUDE localhost%s" % (
                               arg_delimiter, http_port, https_port,
                               arg_delimiter),
158 159 160 161 162 163
      "--ignore-certificate-errors",
      "--disable-seccomp-sandbox",
      "--disable-web-security",
      "--reduce-security-for-testing",
      "--allow-insecure-localhost",
    ]
164 165

def run_site(site, domain, args, timeout=None):
166 167 168
  print("="*80)
  print("RUNNING DOMAIN %s" % domain)
  print("="*80)
169 170
  result_template = "{domain}#{count}.txt" if args.repeat else "{domain}.txt"
  count = 0
171
  if timeout is None: timeout = args.timeout
172 173 174
  if args.replay_wpr:
    timeout *= 1 + args.refresh
    timeout += 1
175
  retries_since_good_run = 0
176 177 178 179 180 181 182
  while count == 0 or args.repeat is not None and count < args.repeat:
    count += 1
    result = result_template.format(domain=domain, count=count)
    retries = 0
    while args.retries is None or retries < args.retries:
      retries += 1
      try:
183 184 185
        if args.user_data_dir:
          user_data_dir = args.user_data_dir
        else:
186
          user_data_dir = tempfile.mkdtemp(prefix="chr_")
187
        js_flags = "--runtime-call-stats"
188
        if args.replay_wpr: js_flags += " --allow-natives-syntax"
189
        if args.js_flags: js_flags += " " + args.js_flags
190
        chrome_flags = get_chrome_flags(js_flags, user_data_dir)
191
        if args.replay_wpr:
192
          chrome_flags += get_chrome_replay_flags(args)
193
        else:
194
          chrome_flags += [ "--single-process", ]
195 196 197 198 199 200
        if args.chrome_flags:
          chrome_flags += args.chrome_flags.split()
        cmd_args = [
            "timeout", str(timeout),
            args.with_chrome
        ] + chrome_flags + [ site ]
201
        print("- " * 40)
202
        print_command(cmd_args)
203
        print("- " * 40)
204
        with open(result, "wt") as f:
205 206
          with open(args.log_stderr or os.devnull, 'at') as err:
            status = subprocess.call(cmd_args, stdout=f, stderr=err)
207 208 209 210 211 212 213 214 215 216
        # 124 means timeout killed chrome, 0 means the user was bored first!
        # If none of these two happened, then chrome apparently crashed, so
        # it must be called again.
        if status != 124 and status != 0:
          print("CHROME CRASHED, REPEATING RUN");
          continue
        # If the stats file is empty, chrome must be called again.
        if os.path.isfile(result) and os.path.getsize(result) > 0:
          if args.print_url:
            with open(result, "at") as f:
217 218
              print(file=f)
              print("URL: {}".format(site), file=f)
219
          retries_since_good_run = 0
220
          break
221 222 223 224
        if retries_since_good_run > MAX_NOF_RETRIES:
          # Abort after too many retries, no point in ever increasing the
          # timeout.
          print("TOO MANY EMPTY RESULTS ABORTING RUN")
225
          return
226 227
        timeout += 2 ** retries_since_good_run
        retries_since_good_run += 1
228 229
        print("EMPTY RESULT, REPEATING RUN ({})".format(
            retries_since_good_run));
230
      finally:
231
        if not args.user_data_dir:
232 233 234 235 236 237 238 239 240 241 242
          shutil.rmtree(user_data_dir)


def read_sites_file(args):
  try:
    sites = []
    try:
      with open(args.sites_file, "rt") as f:
        for item in json.load(f):
          if 'timeout' not in item:
            # This is more-or-less arbitrary.
243
            item['timeout'] = int(1.5 * item['timeline'] + 7)
244 245 246
          if item['timeout'] > args.timeout: item['timeout'] = args.timeout
          sites.append(item)
    except ValueError:
247 248
      args.error("Warning: Could not read sites file as JSON, falling back to "
                 "primitive file")
249 250 251 252 253 254 255 256 257 258 259
      with open(args.sites_file, "rt") as f:
        for line in f:
          line = line.strip()
          if not line or line.startswith('#'): continue
          sites.append({'url': line, 'timeout': args.timeout})
    return sites
  except IOError as e:
    args.error("Cannot read from {}. {}.".format(args.sites_file, e.strerror))
    sys.exit(1)


260
def read_sites(args):
261 262
  # Determine the websites to benchmark.
  if args.sites_file:
263 264 265 266 267 268
    return read_sites_file(args)
  return [{'url': site, 'timeout': args.timeout} for site in args.sites]

def do_run(args):
  sites = read_sites(args)
  replay_server = start_replay_server(args, sites) if args.replay_wpr else None
269 270 271 272 273
  # Disambiguate domains, if needed.
  L = []
  domains = {}
  for item in sites:
    site = item['url']
274 275 276 277 278 279 280 281 282 283 284
    domain = None
    if args.domain:
      domain = args.domain
    elif 'domain' in item:
      domain = item['domain']
    else:
      m = re.match(r'^(https?://)?([^/]+)(/.*)?$', site)
      if not m:
        args.error("Invalid URL {}.".format(site))
        continue
      domain = m.group(2)
285 286 287 288 289 290 291 292 293 294 295 296 297 298
    entry = [site, domain, None, item['timeout']]
    if domain not in domains:
      domains[domain] = entry
    else:
      if not isinstance(domains[domain], int):
        domains[domain][2] = 1
        domains[domain] = 1
      domains[domain] += 1
      entry[2] = domains[domain]
    L.append(entry)
  try:
    # Run them.
    for site, domain, count, timeout in L:
      if count is not None: domain = "{}%{}".format(domain, count)
299
      print((site, domain, timeout))
300 301 302 303 304 305
      run_site(site, domain, args, timeout)
  finally:
    if replay_server:
      stop_replay_server(replay_server)


306 307 308 309 310 311 312 313
def do_run_replay_server(args):
  sites = read_sites(args)
  print("- " * 40)
  print("Available URLs:")
  for site in sites:
    print("    "+site['url'])
  print("- " * 40)
  print("Launch chromium with the following commands for debugging:")
314 315 316 317
  flags = get_chrome_flags("--runtime-call-stats --allow-natives-syntax",
                           "/var/tmp/`date +%s`", '"')
  flags += get_chrome_replay_flags(args, "'")
  print("    $CHROMIUM_DIR/out/Release/chrome " + (" ".join(flags)) + " <URL>")
318
  print("- " * 40)
319
  replay_server = start_replay_server(args, sites, discard_output=False)
320 321 322 323 324 325
  try:
    replay_server['process'].wait()
  finally:
   stop_replay_server(replay_server)


326 327 328
# Calculate statistics.

def statistics(data):
329 330 331 332
  # NOTE(V8:10269): imports moved here to mitigate the outage.
  import scipy
  import scipy.stats

333 334 335 336 337 338 339 340 341 342 343 344 345 346 347 348 349 350 351 352 353 354 355 356 357 358 359 360 361
  N = len(data)
  average = numpy.average(data)
  median = numpy.median(data)
  low = numpy.min(data)
  high= numpy.max(data)
  if N > 1:
    # evaluate sample variance by setting delta degrees of freedom (ddof) to
    # 1. The degree used in calculations is N - ddof
    stddev = numpy.std(data, ddof=1)
    # Get the endpoints of the range that contains 95% of the distribution
    t_bounds = scipy.stats.t.interval(0.95, N-1)
    #assert abs(t_bounds[0] + t_bounds[1]) < 1e-6
    # sum mean to the confidence interval
    ci = {
        'abs': t_bounds[1] * stddev / sqrt(N),
        'low': average + t_bounds[0] * stddev / sqrt(N),
        'high': average + t_bounds[1] * stddev / sqrt(N)
    }
  else:
    stddev = 0
    ci = { 'abs': 0, 'low': average, 'high': average }
  if abs(stddev) > 0.0001 and abs(average) > 0.0001:
    ci['perc'] = t_bounds[1] * stddev / sqrt(N) / average * 100
  else:
    ci['perc'] = 0
  return { 'samples': N, 'average': average, 'median': median,
           'stddev': stddev, 'min': low, 'max': high, 'ci': ci }


362 363 364 365 366 367 368 369 370
def add_category_total(entries, groups, category_prefix):
  group_data = { 'time': 0, 'count': 0 }
  for group_name, regexp in groups:
    if not group_name.startswith('Group-' + category_prefix): continue
    group_data['time'] += entries[group_name]['time']
    group_data['count'] += entries[group_name]['count']
  entries['Group-' + category_prefix + '-Total'] = group_data


371 372 373 374
def read_stats(path, domain, args):
  groups = [];
  if args.aggregate:
    groups = [
375
        ('Group-IC', re.compile(".*IC_.*")),
376
        ('Group-OptimizeBackground', re.compile(".*OptimizeBackground.*")),
377 378
        ('Group-Optimize',
         re.compile("StackGuard|.*Optimize.*|.*Deoptimize.*|Recompile.*")),
379
        ('Group-CompileBackground', re.compile("(.*CompileBackground.*)")),
380
        ('Group-Compile', re.compile("(^Compile.*)|(.*_Compile.*)")),
381
        ('Group-ParseBackground', re.compile(".*ParseBackground.*")),
382 383 384
        ('Group-Parse', re.compile(".*Parse.*")),
        ('Group-Callback', re.compile(".*Callback.*")),
        ('Group-API', re.compile(".*API.*")),
385
        ('Group-GC-Custom', re.compile("GC_Custom_.*")),
386
        ('Group-GC-Background', re.compile(".*GC.*BACKGROUND.*")),
387
        ('Group-GC', re.compile("GC_.*|AllocateInTargetSpace")),
388 389
        ('Group-JavaScript', re.compile("JS_Execution")),
        ('Group-Runtime', re.compile(".*"))]
390 391
  with open(path, "rt") as f:
    # Process the whole file and sum repeating entries.
392 393 394
    entries = { 'Sum': {'time': 0, 'count': 0} }
    for group_name, regexp in groups:
      entries[group_name] = { 'time': 0, 'count': 0 }
395 396 397 398 399 400 401 402
    for line in f:
      line = line.strip()
      # Discard headers and footers.
      if not line: continue
      if line.startswith("Runtime Function"): continue
      if line.startswith("===="): continue
      if line.startswith("----"): continue
      if line.startswith("URL:"): continue
403
      if line.startswith("STATS:"): continue
404 405 406 407 408
      # We have a regular line.
      fields = line.split()
      key = fields[0]
      time = float(fields[1].replace("ms", ""))
      count = int(fields[3])
409 410 411
      if key not in entries: entries[key] = { 'time': 0, 'count': 0 }
      entries[key]['time'] += time
      entries[key]['count'] += count
412 413
      # We calculate the sum, if it's not the "total" line.
      if key != "Total":
414 415 416 417 418 419 420
        entries['Sum']['time'] += time
        entries['Sum']['count'] += count
        for group_name, regexp in groups:
          if not regexp.match(key): continue
          entries[group_name]['time'] += time
          entries[group_name]['count'] += count
          break
421
    # Calculate the V8-Total (all groups except Callback)
422
    group_data = { 'time': 0, 'count': 0 }
423 424
    for group_name, regexp in groups:
      if group_name == 'Group-Callback': continue
425 426 427
      group_data['time'] += entries[group_name]['time']
      group_data['count'] += entries[group_name]['count']
    entries['Group-Total-V8'] = group_data
428 429 430 431
    # Calculate the Parse-Total, Compile-Total and Optimize-Total groups
    add_category_total(entries, groups, 'Parse')
    add_category_total(entries, groups, 'Compile')
    add_category_total(entries, groups, 'Optimize')
432
    # Append the sums as single entries to domain.
433
    for key in entries:
434 435 436
      if key not in domain: domain[key] = { 'time_list': [], 'count_list': [] }
      domain[key]['time_list'].append(entries[key]['time'])
      domain[key]['count_list'].append(entries[key]['count'])
437 438 439 440 441 442 443 444 445 446 447 448 449 450 451 452 453 454 455 456 457 458 459 460 461 462 463 464 465 466


def print_stats(S, args):
  # Sort by ascending/descending time average, then by ascending/descending
  # count average, then by ascending name.
  def sort_asc_func(item):
    return (item[1]['time_stat']['average'],
            item[1]['count_stat']['average'],
            item[0])
  def sort_desc_func(item):
    return (-item[1]['time_stat']['average'],
            -item[1]['count_stat']['average'],
            item[0])
  # Sorting order is in the commend-line arguments.
  sort_func = sort_asc_func if args.sort == "asc" else sort_desc_func
  # Possibly limit how many elements to print.
  L = [item for item in sorted(S.items(), key=sort_func)
       if item[0] not in ["Total", "Sum"]]
  N = len(L)
  if args.limit == 0:
    low, high = 0, N
  elif args.sort == "desc":
    low, high = 0, args.limit
  else:
    low, high = N-args.limit, N
  # How to print entries.
  def print_entry(key, value):
    def stats(s, units=""):
      conf = "{:0.1f}({:0.2f}%)".format(s['ci']['abs'], s['ci']['perc'])
      return "{:8.1f}{} +/- {:15s}".format(s['average'], units, conf)
467
    print("{:>50s}  {}  {}".format(
468 469 470
      key,
      stats(value['time_stat'], units="ms"),
      stats(value['count_stat'])
471
    ))
472 473 474
  # Print and calculate partial sums, if necessary.
  for i in range(low, high):
    print_entry(*L[i])
475
    if args.totals and args.limit != 0 and not args.aggregate:
476 477 478 479 480 481 482 483 484 485 486
      if i == low:
        partial = { 'time_list': [0] * len(L[i][1]['time_list']),
                    'count_list': [0] * len(L[i][1]['count_list']) }
      assert len(partial['time_list']) == len(L[i][1]['time_list'])
      assert len(partial['count_list']) == len(L[i][1]['count_list'])
      for j, v in enumerate(L[i][1]['time_list']):
        partial['time_list'][j] += v
      for j, v in enumerate(L[i][1]['count_list']):
        partial['count_list'][j] += v
  # Print totals, if necessary.
  if args.totals:
487
    print('-' * 80)
488
    if args.limit != 0 and not args.aggregate:
489 490 491 492 493 494 495 496
      partial['time_stat'] = statistics(partial['time_list'])
      partial['count_stat'] = statistics(partial['count_list'])
      print_entry("Partial", partial)
    print_entry("Sum", S["Sum"])
    print_entry("Total", S["Total"])


def do_stats(args):
497
  domains = {}
498 499 500 501
  for path in args.logfiles:
    filename = os.path.basename(path)
    m = re.match(r'^([^#]+)(#.*)?$', filename)
    domain = m.group(1)
502 503 504 505 506 507
    if domain not in domains: domains[domain] = {}
    read_stats(path, domains[domain], args)
  if args.aggregate:
    create_total_page_stats(domains, args)
  for i, domain in enumerate(sorted(domains)):
    if len(domains) > 1:
508 509 510
      if i > 0: print()
      print("{}:".format(domain))
      print('=' * 80)
511 512 513 514 515 516 517 518 519 520 521 522 523 524 525 526 527 528 529
    domain_stats = domains[domain]
    for key in domain_stats:
      domain_stats[key]['time_stat'] = \
          statistics(domain_stats[key]['time_list'])
      domain_stats[key]['count_stat'] = \
          statistics(domain_stats[key]['count_list'])
    print_stats(domain_stats, args)


# Create a Total page with all entries summed up.
def create_total_page_stats(domains, args):
  total = {}
  def sum_up(parent, key, other):
    sums = parent[key]
    for i, item in enumerate(other[key]):
      if i >= len(sums):
        sums.extend([0] * (i - len(sums) + 1))
      if item is not None:
        sums[i] += item
530 531 532 533 534 535
  # Exclude adwords and speedometer pages from aggrigate total, since adwords
  # dominates execution time and speedometer is measured elsewhere.
  excluded_domains = ['adwords.google.com', 'speedometer-angular',
                      'speedometer-jquery', 'speedometer-backbone',
                      'speedometer-ember', 'speedometer-vanilla'];
  # Sum up all the entries/metrics from all non-excluded domains
536
  for domain, entries in domains.items():
537 538
    if domain in excluded_domains:
      continue;
539 540 541 542 543 544 545 546 547 548
    for key, domain_stats in entries.items():
      if key not in total:
        total[key] = {}
        total[key]['time_list'] = list(domain_stats['time_list'])
        total[key]['count_list'] = list(domain_stats['count_list'])
      else:
        sum_up(total[key], 'time_list', domain_stats)
        sum_up(total[key], 'count_list', domain_stats)
  # Add a new "Total" page containing the summed up metrics.
  domains['Total'] = total
549

550 551
# Generate Raw JSON file.

552
def _read_logs(args):
553 554 555 556 557 558 559 560 561 562 563 564 565 566
  versions = {}
  for path in args.logdirs:
    if os.path.isdir(path):
      for root, dirs, files in os.walk(path):
        version = os.path.basename(root)
        if version not in versions: versions[version] = {}
        for filename in files:
          if filename.endswith(".txt"):
            m = re.match(r'^([^#]+)(#.*)?\.txt$', filename)
            domain = m.group(1)
            if domain not in versions[version]: versions[version][domain] = {}
            read_stats(os.path.join(root, filename),
                       versions[version][domain], args)

567 568 569 570 571
  return versions

def do_raw_json(args):
  versions = _read_logs(args)

572 573 574 575 576 577 578 579 580 581 582 583 584 585 586 587 588 589
  for version, domains in versions.items():
    if args.aggregate:
      create_total_page_stats(domains, args)
    for domain, entries in domains.items():
      raw_entries = []
      for name, value in entries.items():
        # We don't want the calculated sum in the JSON file.
        if name == "Sum": continue
        raw_entries.append({
          'name': name,
          'duration': value['time_list'],
          'count': value['count_list'],
        })

      domains[domain] = raw_entries

  print(json.dumps(versions, separators=(',', ':')))

590 591 592 593

# Generate JSON file.

def do_json(args):
594 595
  versions = _read_logs(args)

596 597 598 599 600 601
  for version, domains in versions.items():
    if args.aggregate:
      create_total_page_stats(domains, args)
    for domain, entries in domains.items():
      stats = []
      for name, value in entries.items():
602 603 604 605
        # We don't want the calculated sum in the JSON file.
        if name == "Sum": continue
        entry = [name]
        for x in ['time_list', 'count_list']:
606
          s = statistics(entries[name][x])
607 608 609
          entry.append(round(s['average'], 1))
          entry.append(round(s['ci']['abs'], 1))
          entry.append(round(s['ci']['perc'], 2))
610 611
        stats.append(entry)
      domains[domain] = stats
612
  print(json.dumps(versions, separators=(',', ':')))
613 614 615 616 617 618 619 620 621 622 623 624 625 626 627 628


# Help.

def do_help(parser, subparsers, args):
  if args.help_cmd:
    if args.help_cmd in subparsers:
      subparsers[args.help_cmd].print_help()
    else:
      args.error("Unknown command '{}'".format(args.help_cmd))
  else:
    parser.print_help()


# Main program, parse command line and execute.

629 630 631 632
def coexist(*l):
  given = sum(1 for x in l if x)
  return given == 0 or given == len(l)

633 634 635 636 637 638 639
def main():
  parser = argparse.ArgumentParser()
  subparser_adder = parser.add_subparsers(title="commands", dest="command",
                                          metavar="<command>")
  subparsers = {}
  # Command: run.
  subparsers["run"] = subparser_adder.add_parser(
640
      "run", help="Replay websites and collect runtime stats data.")
641 642 643 644 645 646 647 648 649 650 651 652 653 654 655
  subparsers["run"].set_defaults(
      func=do_run, error=subparsers["run"].error)
  subparsers["run"].add_argument(
      "--chrome-flags", type=str, default="",
      help="specify additional chrome flags")
  subparsers["run"].add_argument(
      "--js-flags", type=str, default="",
      help="specify additional V8 flags")
  subparsers["run"].add_argument(
      "-u", "--user-data-dir", type=str, metavar="<path>",
      help="specify user data dir (default is temporary)")
  subparsers["run"].add_argument(
      "-c", "--with-chrome", type=str, metavar="<path>",
      default="/usr/bin/google-chrome",
      help="specify chrome executable to use")
656
  subparsers["run"].add_argument(
657 658 659 660 661 662 663 664
      "-r", "--retries", type=int, metavar="<num>",
      help="specify retries if website is down (default: forever)")
  subparsers["run"].add_argument(
      "--no-url", dest="print_url", action="store_false", default=True,
      help="do not include url in statistics file")
  subparsers["run"].add_argument(
      "--domain", type=str, default="",
      help="specify the output file domain name")
665
  subparsers["run"].add_argument(
666 667 668 669 670 671 672 673 674 675 676 677 678 679 680 681 682 683 684 685 686 687 688 689 690 691 692
      "-n", "--repeat", type=int, metavar="<num>",
      help="specify iterations for each website (default: once)")

  def add_replay_args(subparser):
    subparser.add_argument(
        "-k", "--refresh", type=int, metavar="<num>", default=0,
        help="specify refreshes for each iteration (default: 0)")
    subparser.add_argument(
        "--replay-wpr", type=str, metavar="<path>",
        help="use the specified web page replay (.wpr) archive")
    subparser.add_argument(
        "--replay-bin", type=str, metavar="<path>",
        help="specify the replay.py script typically located in " \
             "$CHROMIUM/src/third_party/webpagereplay/replay.py")
    subparser.add_argument(
        "-f", "--sites-file", type=str, metavar="<path>",
        help="specify file containing benchmark websites")
    subparser.add_argument(
        "-t", "--timeout", type=int, metavar="<seconds>", default=60,
        help="specify seconds before chrome is killed")
    subparser.add_argument(
        "-p", "--port-offset", type=int, metavar="<offset>", default=0,
        help="specify the offset for the replay server's default ports")
    subparser.add_argument(
        "-l", "--log-stderr", type=str, metavar="<path>",
        help="specify where chrome's stderr should go (default: /dev/null)")
    subparser.add_argument(
693
        "--sites", type=str, metavar="<URL>", nargs="*",
694 695 696 697 698 699 700 701 702 703
        help="specify benchmark website")
  add_replay_args(subparsers["run"])

  # Command: replay-server
  subparsers["replay"] = subparser_adder.add_parser(
      "replay", help="Run the replay server for debugging purposes")
  subparsers["replay"].set_defaults(
      func=do_run_replay_server, error=subparsers["replay"].error)
  add_replay_args(subparsers["replay"])

704 705
  # Command: stats.
  subparsers["stats"] = subparser_adder.add_parser(
706
      "stats", help="Analize the results file create by the 'run' command.")
707 708 709 710 711 712 713 714 715 716 717 718 719 720
  subparsers["stats"].set_defaults(
      func=do_stats, error=subparsers["stats"].error)
  subparsers["stats"].add_argument(
      "-l", "--limit", type=int, metavar="<num>", default=0,
      help="limit how many items to print (default: none)")
  subparsers["stats"].add_argument(
      "-s", "--sort", choices=["asc", "desc"], default="asc",
      help="specify sorting order (default: ascending)")
  subparsers["stats"].add_argument(
      "-n", "--no-total", dest="totals", action="store_false", default=True,
      help="do not print totals")
  subparsers["stats"].add_argument(
      "logfiles", type=str, metavar="<logfile>", nargs="*",
      help="specify log files to parse")
721 722
  subparsers["stats"].add_argument(
      "--aggregate", dest="aggregate", action="store_true", default=False,
723
      help="Create aggregated entries. Adds Group-* entries at the toplevel. " \
724
      "Additionally creates a Total page with all entries.")
725

726 727
  # Command: json.
  subparsers["json"] = subparser_adder.add_parser(
728 729
      "json", help="Collect results file created by the 'run' command into" \
          "a single json file.")
730 731 732 733 734
  subparsers["json"].set_defaults(
      func=do_json, error=subparsers["json"].error)
  subparsers["json"].add_argument(
      "logdirs", type=str, metavar="<logdir>", nargs="*",
      help="specify directories with log files to parse")
735 736
  subparsers["json"].add_argument(
      "--aggregate", dest="aggregate", action="store_true", default=False,
737
      help="Create aggregated entries. Adds Group-* entries at the toplevel. " \
738 739 740 741 742 743 744 745 746 747 748 749 750 751
      "Additionally creates a Total page with all entries.")

  # Command: raw-json.
  subparsers["raw-json"] = subparser_adder.add_parser(
      "raw-json", help="Collect raw results from 'run' command into" \
          "a single json file.")
  subparsers["raw-json"].set_defaults(
      func=do_raw_json, error=subparsers["json"].error)
  subparsers["raw-json"].add_argument(
      "logdirs", type=str, metavar="<logdir>", nargs="*",
      help="specify directories with log files to parse")
  subparsers["raw-json"].add_argument(
      "--aggregate", dest="aggregate", action="store_true", default=False,
      help="Create aggregated entries. Adds Group-* entries at the toplevel. " \
752
      "Additionally creates a Total page with all entries.")
753

754 755 756 757 758 759 760 761 762
  # Command: help.
  subparsers["help"] = subparser_adder.add_parser(
      "help", help="help information")
  subparsers["help"].set_defaults(
      func=lambda args: do_help(parser, subparsers, args),
      error=subparsers["help"].error)
  subparsers["help"].add_argument(
      "help_cmd", type=str, metavar="<command>", nargs="?",
      help="command for which to display help")
763

764 765
  # Execute the command.
  args = parser.parse_args()
766 767 768
  setattr(args, 'script_path', os.path.dirname(sys.argv[0]))
  if args.command == "run" and coexist(args.sites_file, args.sites):
    args.error("use either option --sites-file or site URLs")
769
    sys.exit(1)
770 771
  elif args.command == "run" and not coexist(args.replay_wpr, args.replay_bin):
    args.error("options --replay-wpr and --replay-bin must be used together")
772 773 774 775 776 777
    sys.exit(1)
  else:
    args.func(args)

if __name__ == "__main__":
  sys.exit(main())