Chromium Code Reviews
chromiumcodereview-hr@appspot.gserviceaccount.com (chromiumcodereview-hr) | Please choose your nickname with Settings | Help | Chromium Project | Gerrit Changes | Sign out
(3054)

Unified Diff: build/android/pylib/local/device/local_device_perf_test_run.py

Issue 2012323002: [Android] Implement perf tests to platform mode. (Closed) Base URL: https://chromium.googlesource.com/chromium/src.git@master
Patch Set: add retry logic and some clean up Created 4 years, 7 months ago
Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.
Jump to:
View side-by-side diff with in-line comments
Download patch
Index: build/android/pylib/local/device/local_device_perf_test_run.py
diff --git a/build/android/pylib/local/device/local_device_perf_test_run.py b/build/android/pylib/local/device/local_device_perf_test_run.py
new file mode 100644
index 0000000000000000000000000000000000000000..fb8b2590173f33ded1696a7ae0e5bb8cf2e5803d
--- /dev/null
+++ b/build/android/pylib/local/device/local_device_perf_test_run.py
@@ -0,0 +1,429 @@
+# Copyright 2015 The Chromium Authors. All rights reserved.
mikecase (-- gone --) 2016/06/01 17:40:27 nit 2016
rnephew (Reviews Here) 2016/06/01 20:32:04 Done.
+# Use of this source code is governed by a BSD-style license that can be
+# found in the LICENSE file.
+
+import io
+import json
+import logging
+import os
+import pickle
+import re
+import shutil
+import sys
+import tempfile
+import threading
+import time
+import zipfile
+
+from devil.android import battery_utils
+from devil.android import device_errors
+from devil.android import device_list
+from devil.android import device_utils
+from devil.android import forwarder
+from devil.utils import cmd_helper
+from devil.utils import reraiser_thread
+from devil.utils import watchdog_timer
+from pylib import constants
+from pylib.base import base_test_result
+from pylib.constants import host_paths
+from pylib.local.device import local_device_test_run
+
+
+# Regex for the master branch commit position.
+_GIT_CR_POS_RE = re.compile(r'^Cr-Commit-Position: refs/heads/master@{#(\d+)}$')
+
+
+class _HeartBeatLogger(object):
+ # How often to print the heartbeat on flush().
mikecase (-- gone --) 2016/06/01 17:40:28 nit: add "in <time_unit>" (Im guessing it is secon
rnephew (Reviews Here) 2016/06/01 20:32:04 Done.
+ _PRINT_INTERVAL = 30.0
+
+ def __init__(self):
+ """A file-like class for keeping the buildbot alive."""
+ self._len = 0
+ self._tick = time.time()
+ self._stopped = threading.Event()
+ self._timer = threading.Thread(target=self._runner)
+ self._timer.start()
+
+ def _runner(self):
+ while not self._stopped.is_set():
+ self.flush()
+ self._stopped.wait(_HeartBeatLogger._PRINT_INTERVAL)
+
+ def write(self, data):
+ self._len += len(data)
+
+ def flush(self):
+ now = time.time()
+ if now - self._tick >= _HeartBeatLogger._PRINT_INTERVAL:
+ self._tick = now
+ print '--single-step output length %d' % self._len
mikecase (-- gone --) 2016/06/01 17:40:28 Since you are doing this on a separate thread I wo
rnephew (Reviews Here) 2016/06/01 20:32:04 Done.
+ sys.stdout.flush()
+
+ def stop(self):
+ self._stopped.set()
+
+
+def _GetChromiumRevision():
+ # pylint: disable=line-too-long
+ """Get the git hash and commit position of the chromium master branch.
+
+ See: https://chromium.googlesource.com/chromium/tools/build/+/master/scripts/slave/runtest.py#212
mikecase (-- gone --) 2016/06/01 17:40:28 This comment is probably going to get out of date
+
+ Returns:
+ A dictionary with 'revision' and 'commit_pos' keys.
+ """
+ # pylint: enable=line-too-long
+ status, output = cmd_helper.GetCmdStatusAndOutput(
mikecase (-- gone --) 2016/06/01 17:40:28 you will have to set cwd=CHROMIUM_SRC_DIR or somet
rnephew (Reviews Here) 2016/06/01 20:32:04 It already does, the host_paths.DIR_SOURCE_ROOT pa
+ ['git', 'log', '-n', '1', '--pretty=format:%H%n%B', 'HEAD'],
+ host_paths.DIR_SOURCE_ROOT)
+ revision = None
+ commit_pos = None
+ if not status:
+ lines = output.splitlines()
+ revision = lines[0]
+ for line in reversed(lines):
+ m = _GIT_CR_POS_RE.match(line.strip())
+ if m:
+ commit_pos = int(m.group(1))
+ break
+ return {'revision': revision, 'commit_pos': commit_pos}
+
+
+class TestShard(object):
+ def __init__(self, test_instance, device, index, tests, results, watcher=None,
+ retries=3):
+ logging.info('Create shard %s for device %s to run the following tests:',
+ index, device)
+ for t in tests:
+ logging.info(' %s', t)
+ self._battery = battery_utils.BatteryUtils(device)
+ self._device = device
+ self._index = index
+ self._tests = tests
+ self._watcher = watcher
+ self._test_instance = test_instance
+ self._output_dir = None
+ self._results = results
+ self._retries = retries
mikecase (-- gone --) 2016/06/01 17:40:28 nit: probably just alphabetize all of the things O
rnephew (Reviews Here) 2016/06/01 20:32:05 Done.
+
+ def _WriteBuildBotJson(self):
+ """Write metadata about the buildbot environment to the output dir."""
+ if not self._output_dir:
+ return
+ data = {
+ 'chromium': _GetChromiumRevision(),
+ 'environment': dict(os.environ)
+ }
+ with open(os.path.join(self._output_dir, 'buildbot.json'), 'w') as f:
+ json.dump(data, f, sort_keys=True, indent=2, separators=(',', ': '))
+
+ def _TestSetUp(self):
+ self._ResetWatcher()
+ try:
+ logging.info('Unmapping device ports.')
+ forwarder.Forwarder.UnmapAllDevicePorts(self._device)
+ self._device.RestartAdbd()
+ except Exception: # pylint: disable=broad-except
+ logging.exception('Exception when resetting ports.')
mikecase (-- gone --) 2016/06/01 17:40:27 I would say this is fine except you also have Rest
rnephew (Reviews Here) 2016/06/01 20:32:04 Done.
+
+ self._BatteryLevelCheck()
+ self._BatteryTempCheck()
+ self._ScreenCheck()
+
+ if not self._device.IsOnline():
+ msg = 'Device %s is unresponsive.' % str(self._device)
+ logging.warning(msg)
+ raise device_errors.DeviceUnreachableError(msg)
+ self._ResetWatcher()
+
+ def _CleanupOutputDirectory(self):
+ if self._output_dir:
+ shutil.rmtree(self._output_dir, ignore_errors=True)
+ self._output_dir = None
+
+ def _CreateCmd(self, test):
+ cmd = '%s --device %s' % (self._tests[test]['cmd'], str(self._device))
+ if (self._test_instance.collect_chartjson_data
+ or self._tests[test].get('archive_output_dir')):
+ self._output_dir = tempfile.mkdtemp()
+ cmd = cmd + ' --output-dir=%s' % self._output_dir
+ if self._test_instance.dry_run:
+ cmd = 'echo %s' % cmd
+ return cmd
+
+ def _ReadChartjsonOutput(self):
+ if not self._output_dir:
+ return ''
+ json_output_path = os.path.join(self._output_dir, 'results-chart.json')
+ try:
+ with open(json_output_path) as f:
+ return f.read()
+ except IOError:
+ logging.exception('Exception when reading chartjson.')
+ logging.error('This usually means that telemetry did not run, so it could'
+ ' not generate the file. Please check the device running'
+ ' the test.')
+ return ''
+
+ def _RunSingleTest(self, test):
+
+ logging.info('Running %s on shard %s', test, self._index)
+ timeout = (
+ None if self._test_instance.no_timeout
+ else self._tests[test].get('timeout', 3600))
mikecase (-- gone --) 2016/06/01 17:40:27 probably factor out this 3600 somewhere and make i
rnephew (Reviews Here) 2016/06/01 20:32:05 Switched it to use the class varialbe _timeout whi
+ logging.info('Timeout for %s test: %s', test, timeout)
+
+ logfile = sys.stdout
+ if self._test_instance.single_step:
+ logfile = _HeartBeatLogger()
+ cmd = self._CreateCmd(test)
+ self._WriteBuildBotJson()
+ cwd = os.path.abspath(host_paths.DIR_SOURCE_ROOT)
+ if cmd.startswith('src/'):
+ cwd = os.path.abspath(os.path.join(host_paths.DIR_SOURCE_ROOT, os.pardir))
mikecase (-- gone --) 2016/06/01 17:40:28 Im not a fan of things like this. Probably would b
rnephew (Reviews Here) 2016/06/01 20:32:05 This is from the old test runner. I want to eventu
jbudorick 2016/06/01 20:46:06 In general, I'd prefer to make these breaking sani
rnephew (Reviews Here) 2016/06/01 22:14:14 Done.
+
+ try:
+ logging.debug('Running test with command \'%s\'', cmd)
+ exit_code, output = cmd_helper.GetCmdStatusAndOutputWithTimeout(
+ cmd, timeout, cwd=cwd, shell=True, logfile=logfile)
+ json_output = self._ReadChartjsonOutput()
+ except cmd_helper.TimeoutError as e:
+ exit_code = -1
+ output = e.output
+ json_output = ''
+ finally:
+ if self._test_instance.single_step:
+ logfile.stop()
+ return cmd, exit_code, output, json_output
+
+ def _ProcessTestResult(
+ self, test, cmd, start_time, end_time, exit_code, output, json_output):
+ if exit_code is None:
+ exit_code = -1
+ logging.info('%s : exit_code=%d in %d secs on device %s',
+ test, exit_code, end_time - start_time,
+ str(self._device))
+ if exit_code == 0:
+ result_type = base_test_result.ResultType.PASS
+ else:
+ result_type = base_test_result.ResultType.FAIL
+ # TODO(rnephew): Improve device recovery logic.
+ try:
+ self._device.WaitUntilFullyBooted(timeout=120)
mikecase (-- gone --) 2016/06/01 17:40:27 We should probably have some shared GetDeviceBootT
rnephew (Reviews Here) 2016/06/01 20:32:04 Done.
+ except device_errors.CommandTimeoutError:
+ logging.exception('Device failed to return after %s.', test)
+ actual_exit_code = exit_code
+ if (self._test_instance.flaky_steps
+ and test in self._test_instance.flaky_steps):
+ exit_code = 0
+ archive_bytes = (self._ArchiveOutputDir()
+ if self._tests[test].get('archive_output_dir')
+ else None)
+ persisted_result = {
+ 'name': test,
+ 'output': [output],
+ 'chartjson': json_output,
+ 'archive_bytes': archive_bytes,
+ 'exit_code': exit_code,
+ 'actual_exit_code': actual_exit_code,
+ 'result_type': result_type,
+ 'start_time': start_time,
+ 'end_time': end_time,
+ 'total_time': end_time - start_time,
+ 'device': str(self._device),
+ 'cmd': cmd,
+ }
+ self._SaveResult(persisted_result)
+ return result_type
+
+ def RunTestsOnShard(self):
+ for test in self._tests:
+ self._TestSetUp()
+
+ try:
+ exit_code = None
+ tries_left = self._retries
+
+ while exit_code != 0 and tries_left > 0:
+ tries_left = tries_left - 1
+ start_time = time.time()
+ cmd, exit_code, output, json_output = self._RunSingleTest(test)
+ end_time = time.time()
+ result_type = self._ProcessTestResult(
+ test, cmd, start_time, end_time, exit_code, output, json_output)
+
+ result = base_test_result.TestRunResults()
+ result.AddResult(base_test_result.BaseTestResult(test, result_type))
+ self._results.append(result)
+ finally:
+ self._CleanupOutputDirectory()
+
+ @staticmethod
+ def _SaveResult(result):
+ pickled = os.path.join(constants.PERF_OUTPUT_DIR, result['name'])
+ if os.path.exists(pickled):
+ with file(pickled, 'r') as f:
+ previous = pickle.loads(f.read())
+ result['output'] = previous['output'] + result['output']
mikecase (-- gone --) 2016/06/01 17:40:28 Do this save files ever get cleared? It looks like
rnephew (Reviews Here) 2016/06/01 20:32:05 That.. that is a bug. It should be deleted in the
+ with file(pickled, 'w') as f:
+ f.write(pickle.dumps(result))
+
+ def _ArchiveOutputDir(self):
+ """Archive all files in the output dir, and return as compressed bytes."""
+ with io.BytesIO() as archive:
+ with zipfile.ZipFile(archive, 'w', zipfile.ZIP_DEFLATED) as contents:
+ num_files = 0
+ for absdir, _, files in os.walk(self._output_dir):
+ reldir = os.path.relpath(absdir, self._output_dir)
+ for filename in files:
+ src_path = os.path.join(absdir, filename)
+ # We use normpath to turn './file.txt' into just 'file.txt'.
+ dst_path = os.path.normpath(os.path.join(reldir, filename))
+ contents.write(src_path, dst_path)
+ num_files += 1
+ if num_files:
+ logging.info('%d files in the output dir were archived.', num_files)
+ else:
+ logging.warning('No files in the output dir. Archive is empty.')
+ return archive.getvalue()
+
+ def _ResetWatcher(self):
+ if self._watcher:
+ self._watcher.Reset()
+
+ def _BatteryLevelCheck(self):
+ logging.info('Charge level: %s%%',
+ str(self._battery.GetBatteryInfo().get('level')))
+ if self._test_instance.min_battery_level:
+ self._battery.ChargeDeviceToLevel(self._test_instance.min_battery_level)
+
+ def _ScreenCheck(self):
+ if not self._device.IsScreenOn():
+ self._device.SetScreen(True)
+
+ def _BatteryTempCheck(self):
+ logging.info('temperature: %s (0.1 C)',
+ str(self._battery.GetBatteryInfo().get('temperature')))
+ if self._test_instance.max_battery_temp:
+ self._battery.LetBatteryCoolToTemperature(
+ self._test_instance.max_battery_temp)
+
+
+class LocalDevicePerfTestRun(local_device_test_run.LocalDeviceTestRun):
+ def __init__(self, env, test_instance):
+ super(LocalDevicePerfTestRun, self).__init__(env, test_instance)
+ self._test_instance = test_instance
+ self._env = env
+ self._timeout = 10 * 60 # Ten minutes
+ self._devices = None
+ self._test_buckets = []
+ self._watcher = None
+
+ def SetUp(self):
+ self._devices = self._GetAllDevices(self._env.devices,
+ self._test_instance.known_devices_file)
+ self._watcher = watchdog_timer.WatchdogTimer(self._timeout)
+
+ def TearDown(self):
+ pass
+
+ def _GetStepsFromDict(self):
+ if self._test_instance.single_step:
+ return {
+ 'version': 1,
+ 'steps': {
+ 'single_step': {
+ 'device_affinity': 0,
+ 'cmd': self._test_instance.single_step
+ },
+ }
+ }
+ if self._test_instance.steps:
+ with file(self._test_instance.steps, 'r') as f:
+ steps = json.load(f)
+ assert steps['version'] == 1
+ return steps
+
+ def _SplitTestsByAffinity(self):
+ test_dict = self._GetStepsFromDict()
+ for test in test_dict['steps']:
+ affinity = test_dict['steps'][test]['device_affinity']
+ if len(self._test_buckets) < affinity + 1:
+ while len(self._test_buckets) != affinity + 1:
+ self._test_buckets.append({})
+ self._test_buckets[affinity][test] = test_dict['steps'][test]
+ return self._test_buckets
+
+ @staticmethod
+ def _GetAllDevices(active_devices, devices_path):
+ if not devices_path:
+ logging.warning('Known devices file path not being passed. For device '
+ 'affinity to work properly, it must be passed.')
+ try:
+ if devices_path:
+ devices = [device_utils.DeviceUtils(s)
+ for s in device_list.GetPersistentDeviceList(devices_path)]
+ else:
+ logging.warning('Known devices file path not being passed. For device '
+ 'affinity to work properly, it must be passed.')
+ devices = active_devices
+ except IOError as e:
+ logging.error('Unable to find %s [%s]', devices_path, e)
+ devices = active_devices
+ return sorted(devices)
+
+
+ def RunTests(self):
+ # Option selected for saving a json file with a list of test names.
+ if self._test_instance.output_json_list:
+ return self._test_instance.OutputJsonList()
+
+ # Just print the results from a single previously executed step.
+ if self._test_instance.print_step:
+ return self._test_instance.PrintTestOutput()
+
+ # Affinitize the tests.
+ test_buckets = self._SplitTestsByAffinity()
+ if not test_buckets:
+ raise NotImplementedError('No tests found!')
+
+ threads = []
+ results = []
+ for x in xrange(len(self._devices)):
+ new_shard = TestShard(self._test_instance, self._devices[x], x,
+ test_buckets[x], results, watcher=self._watcher)
+ threads.append(reraiser_thread.ReraiserThread(new_shard.RunTestsOnShard))
+
+ workers = reraiser_thread.ReraiserThreadGroup(threads)
+ workers.StartAll()
+
+ try:
+ workers.JoinAll(self._watcher)
+ except device_errors.CommandFailedError:
+ logging.exception('Command failed on device.')
+ except device_errors.CommandTimeoutError:
+ logging.exception('Command timed out on device.')
+ except device_errors.DeviceUnreachableError:
+ logging.exception('Device became unreachable.')
+ return results
+
+ # override
+ def TestPackage(self):
+ return 'Perf'
+
+ # override
+ def _CreateShards(self, _tests):
+ raise NotImplementedError
+
+ # override
+ def _GetTests(self):
+ return self._test_buckets
+
+ # override
+ def _RunTest(self, _device, _test):
+ raise NotImplementedError
+
+ # override
+ def _ShouldShard(self):
+ return False

Powered by Google App Engine
This is Rietveld 408576698