| Index: testing/buildbot/timeouts.py
|
| diff --git a/testing/buildbot/timeouts.py b/testing/buildbot/timeouts.py
|
| new file mode 100755
|
| index 0000000000000000000000000000000000000000..f3204b1a3e65f92ebc8c9f73e84dee9d45d00858
|
| --- /dev/null
|
| +++ b/testing/buildbot/timeouts.py
|
| @@ -0,0 +1,199 @@
|
| +#!/usr/bin/env python
|
| +# Copyright 2016 The Chromium Authors. All rights reserved.
|
| +# Use of this source code is governed by a BSD-style license that can be
|
| +# found in the LICENSE file.
|
| +
|
| +"""Calculate reasonable timeout for each step as analysed by the actual runtimes
|
| +on the Swarming server.
|
| +"""
|
| +
|
| +import Queue
|
| +import argparse
|
| +import json
|
| +import os
|
| +import subprocess
|
| +import sys
|
| +import threading
|
| +import time
|
| +import urllib
|
| +
|
| +
|
| +THIS_DIR = os.path.dirname(os.path.abspath(__file__))
|
| +
|
| +
|
| +def human_int(s):
|
| + """Returns human readable time rounded to the second."""
|
| + s = int(round(s))
|
| + if s <= 60:
|
| + return '%ds' % s
|
| + m = s/60
|
| + if m <= 60:
|
| + return '%dm%02ds' % (m, s%60)
|
| + return '%dh%02dm%02ds' % (m/60, m%60, s%60)
|
| +
|
| +
|
| +def human(s):
|
| + """Returns human readable time rounded to the tenth of second."""
|
| + if s <= 60:
|
| + return '%.1fs' % s
|
| + m = int(round(s/60))
|
| + if m <= 60:
|
| + return '%dm%04.1fs' % (m, s%60)
|
| + return '%dh%02dm%04.1fs' % (m/60, m%60, s%60)
|
| +
|
| +
|
| +class Stats(object):
|
| + """Holds runtimes statistics for a step run on a builder."""
|
| + def __init__(self, builder, step, durations):
|
| + self.builder = builder
|
| + self.step = step
|
| + self.durations = durations
|
| + self.avg = sum(durations) / float(len(durations))
|
| + self.len = len(durations)
|
| + self.max = max(durations)
|
| + self.timeout = max(120, int(round(self.max / 60.)) * 120)
|
| +
|
| + def __str__(self):
|
| + return 'avg: %4ds max: %4ds timeout: %4ds' % (
|
| + round(self.avg), round(self.max), self.timeout)
|
| +
|
| +
|
| +class Pool(object):
|
| + def __init__(self, size):
|
| + self._durations = []
|
| + self._inputs = Queue.Queue()
|
| + self._lock = threading.Lock()
|
| + self._outputs = []
|
| + self._start = time.time()
|
| + self._total = 0
|
| + self._threads = [
|
| + threading.Thread(name=str(i), target=self._run) for i in xrange(size)
|
| + ]
|
| + for t in self._threads:
|
| + t.start()
|
| +
|
| + def put(self, f):
|
| + self._inputs.put(f)
|
| + with self._lock:
|
| + self._total += 1
|
| +
|
| + def join(self):
|
| + for _ in xrange(len(self._threads)):
|
| + self._inputs.put(None)
|
| + try:
|
| + for t in self._threads:
|
| + while t.isAlive():
|
| + t.join(0.1)
|
| + self._print_eta()
|
| + except KeyboardInterrupt:
|
| + sys.stderr.write('\nInterrupted!\n')
|
| + with self._lock:
|
| + return self._outputs[:]
|
| +
|
| + def _print_eta(self):
|
| + elapsed = human(time.time() - self._start)
|
| + with self._lock:
|
| + out = '\r%d/%d Elapsed: %s' % (len(self._outputs), self._total, elapsed)
|
| + if self._durations:
|
| + avg = sum(self._durations) / float(len(self._durations))
|
| + rem = self._total - len(self._outputs)
|
| + eta = avg * rem / float(len(self._threads))
|
| + out += ' ETA: %s ' % human_int(eta)
|
| + sys.stderr.write(out)
|
| + sys.stderr.flush()
|
| +
|
| + def _run(self):
|
| + while True:
|
| + f = self._inputs.get()
|
| + if not f:
|
| + return
|
| + s = time.time()
|
| + o = f()
|
| + e = time.time() - s
|
| + with self._lock:
|
| + self._durations.append(e)
|
| + self._outputs.append(o)
|
| +
|
| +
|
| +def query(server, number, builder, step):
|
| + q = 'tasks/list?%s' % urllib.urlencode([
|
| + ('tags', 'buildername:%s' % builder),
|
| + ('tags', 'name:%s' % step),
|
| + ])
|
| + cmd = [
|
| + sys.executable, '../../tools/swarming_client/swarming.py', 'query',
|
| + '-S', server, '--limit', str(number), q,
|
| + ]
|
| + out = subprocess.check_output(cmd, stderr=subprocess.PIPE)
|
| + try:
|
| + data = json.loads(out)
|
| + except ValueError:
|
| + sys.stderr.write(out)
|
| + return None
|
| + if not 'items' in data:
|
| + # No task with this pattern.
|
| + return None
|
| + durations = [i['duration'] for i in data['items'] if i.get('duration')]
|
| + if not durations:
|
| + # There was tasks but none completed correctly, i.e. internal_failure.
|
| + return None
|
| + return Stats(builder, step, durations)
|
| +
|
| +
|
| +def extract_tags(data, test_name):
|
| + """Returns all the tags that should be queried from a json file."""
|
| + out = []
|
| + for b, d in sorted(data.iteritems()):
|
| + if not 'gtest_tests' in d:
|
| + continue
|
| + for t in d['gtest_tests']:
|
| + if not t.get('swarming', {}).get('can_use_on_swarming_builders'):
|
| + continue
|
| + if test_name and t['test'] != test_name:
|
| + continue
|
| + out.append((b, t['test']))
|
| + return out
|
| +
|
| +
|
| +def query_server(server, number, data):
|
| + """Query the Swarming server to steps durations."""
|
| + def _get_func(builder, step):
|
| + return lambda: query(server, number, builder, step)
|
| + # Limit to 256 threads, otherwise some OSes have trouble with it.
|
| + p = Pool(min(len(data), 256))
|
| + for builder, step in data:
|
| + p.put(_get_func(builder, step))
|
| + return p.join()
|
| +
|
| +
|
| +def main():
|
| + os.chdir(THIS_DIR)
|
| + parser = argparse.ArgumentParser(description=sys.modules[__name__].__doc__)
|
| + parser.add_argument(
|
| + '-f', metavar='chromium.foo.json', help='file to open', required=True)
|
| + parser.add_argument('-s', metavar='foo_unittest', help='step to process')
|
| + parser.add_argument(
|
| + '-N', metavar='200', default=200, type=int,
|
| + help='number of executions to look at')
|
| + parser.add_argument(
|
| + '-S', metavar='chromium-swarm.appspot.com',
|
| + default='chromium-swarm.appspot.com', help='server to use')
|
| + args = parser.parse_args()
|
| +
|
| + with open(args.f) as f:
|
| + d = json.load(f)
|
| + tags = extract_tags(d, args.s)
|
| + if not tags:
|
| + print('No step to process found')
|
| + return 1
|
| + out = [i for i in query_server(args.S, args.N, tags) if i]
|
| + print('')
|
| + maxbuilder = max(len(i.builder) for i in out)
|
| + maxstep = max(len(i.step) for i in out)
|
| + for i in sorted(out, key=lambda i: (i.builder, i.step)):
|
| + print('%-*s / %-*s %s' % (maxbuilder, i.builder, maxstep, i.step, i))
|
| + return 0
|
| +
|
| +
|
| +if __name__ == "__main__":
|
| + sys.exit(main())
|
|
|