Chromium Code Reviews| Index: scripts/slave/recipes/findit/chromium/test.py |
| diff --git a/scripts/slave/recipes/findit/chromium/test.py b/scripts/slave/recipes/findit/chromium/test.py |
| index 5f3a2cceb5781af954205650576c97e2950ebd4d..3dbbe4b63ae1d7fb24599dc15fef1210f954e8d6 100644 |
| --- a/scripts/slave/recipes/findit/chromium/test.py |
| +++ b/scripts/slave/recipes/findit/chromium/test.py |
| @@ -2,9 +2,11 @@ |
| # Use of this source code is governed by a BSD-style license that can be |
| # found in the LICENSE file. |
| +from collections import defaultdict |
| import json |
| from recipe_engine.config import Dict |
| +from recipe_engine.config import List |
| from recipe_engine.config import Single |
| from recipe_engine.recipe_api import Property |
| @@ -53,6 +55,9 @@ PROPERTIES = { |
| 'use_analyze': Property( |
| kind=Single(bool, empty_val=False, required=False), default=True, |
| help='Use analyze to skip commits that do not affect tests.'), |
| + 'suspected_revisions': Property( |
| + kind=List(basestring), default=[], |
| + help='A list of suspected revisions from heuristic analysis.'), |
| } |
| @@ -126,6 +131,7 @@ def _compile_and_test_at_revision(api, target_mastername, target_buildername, |
| override_bot_type='builder_tester') |
| # Run the tests. |
| + failed_tests_dict = defaultdict(list) |
| with api.chromium_tests.wrap_chromium_tests( |
| bot_config, actual_tests_to_run): |
| failed_tests = api.test_utils.run_tests( |
| @@ -140,8 +146,9 @@ def _compile_and_test_at_revision(api, target_mastername, target_buildername, |
| 'valid': valid, |
| } |
| if valid: |
| - results[failed_test.name]['failures'] = list( |
| - failed_test.failures(api, suffix=revision)) |
| + test_list = list(failed_test.failures(api, suffix=revision)) |
| + results[failed_test.name]['failures'] = test_list |
| + failed_tests_dict[failed_test.name].extend(test_list) |
| # Process passed tests. |
| for test in actual_tests_to_run: |
| @@ -161,11 +168,26 @@ def _compile_and_test_at_revision(api, target_mastername, target_buildername, |
| 'valid': True, |
| } |
| - return results |
| + return results, failed_tests_dict |
| -def RunSteps(api, target_mastername, target_testername, |
| - good_revision, bad_revision, tests, use_analyze): |
| +def _get_subtracted_test_dict(original_test_dict, failed_tests_dict): |
|
lijeffrey
2016/05/04 19:15:19
Naming this one's tricky, how about 'reduced' instead?
chanli
2016/05/04 22:52:43
Done.
|
| + # Remove tests that are in both dicts from the original test dict. |
| + if not failed_tests_dict: |
| + return original_test_dict |
| + subtracted_dict = defaultdict(list) |
| + for step, tests in original_test_dict.iteritems(): |
| + if step in failed_tests_dict: |
| + for test in tests: |
| + if test not in failed_tests_dict[step]: |
| + subtracted_dict[step].append(test) |
| + else: |
| + subtracted_dict[step].extend(tests) |
| + return subtracted_dict |
| + |
| + |
| +def RunSteps(api, target_mastername, target_testername, good_revision, |
| + bad_revision, tests, use_analyze, suspected_revisions): |
| assert tests, 'No failed tests were specified.' |
| # Figure out which builder configuration we should match for compile config. |
| @@ -197,6 +219,36 @@ def RunSteps(api, target_mastername, target_testername, |
| root_solution_revision=bad_revision) |
| revisions_to_check = api.findit.revisions_between(good_revision, bad_revision) |
| + suspected_revision_index = [ |
| + revisions_to_check.index(r) |
| + for r in set(suspected_revisions) if r in revisions_to_check] |
| + |
| + # Segments revisions_to_check by suspected_revisions. |
| + # Each sub_range will contain following elements: |
| + # 1. Revision before a suspected_revision or None as a placeholder |
| + # when no such revision |
| + # 2. Suspected_revision |
| + # 3. Revisions between a suspected_revision and the revision before next |
| + # suspected_revision, or remaining revisions before all suspect_revisions. |
| + # For example, if revisions_to_check are [r0, r1, ..., r6] and |
| + # suspected_revisions are [r2, r5], sub_ranges will be: |
| + # [[None, r0], [r1, r2, r3], [r4, r5, r6]] |
| + if suspected_revision_index: |
| + sub_ranges = [] |
| + remaining_revisions = revisions_to_check[:] |
| + for index in sorted(suspected_revision_index, reverse=True): |
| + if index > 0: |
| + if index < len(remaining_revisions): |
| + sub_ranges.append(remaining_revisions[index - 1:]) |
| + else: # Consecutive revisions are suspected, merges them in one range. |
| + sub_ranges[-1].insert(0, remaining_revisions[index - 1]) |
|
stgao
2016/05/04 21:35:28
Can we handle this separately by operating just on
chanli
2016/05/04 22:52:43
I don't really understand what you're suggesting here.
|
| + remaining_revisions = remaining_revisions[:index - 1] |
| + # None is a placeholder for the last known good revision. |
| + sub_ranges.append([None] + remaining_revisions) |
| + else: |
| + # Treats the entire regression range as a single sub-range. |
| + sub_ranges = [[None] + revisions_to_check] |
| + |
| test_results = {} |
| try_job_metadata = { |
| 'regression_range_size': len(revisions_to_check) |
| @@ -207,19 +259,50 @@ def RunSteps(api, target_mastername, target_testername, |
| } |
| try: |
| - # We compile & run tests from the first revision to the last revision in the |
| - # regression range serially instead of a typical bisecting, because jumping |
| - # between new and old revisions might affect Goma capacity and build cycle |
| - # times. Thus we plan to go with this simple serial approach first so that |
| - # compile would be fast due to incremental compile. |
| - # If this won't work out, we will figure out a better solution for speed of |
| - # both compile and test. |
| - for current_revision in revisions_to_check: |
| - test_results[current_revision] = _compile_and_test_at_revision( |
| - api, target_mastername, target_buildername, target_testername, |
| - current_revision, tests, use_analyze) |
| - # TODO(http://crbug.com/566975): check whether culprits for all failed |
| - # tests are found and stop running tests at later revisions if so. |
| + # Tests that haven't found culprits in tested revision(s). |
| + no_culprit_tests = tests |
|
stgao
2016/05/04 21:35:28
naming nit: this name seems misleading -- these tests are ones whose culprits just haven't been found yet.
chanli
2016/05/04 22:52:43
Done.
|
| + # Iterates through sub_ranges and find culprits for each failed test. |
| + for sub_range in sub_ranges: |
|
stgao
2016/05/04 21:35:28
Can we have a comment on why sub-ranges with newer revisions are processed first?
chanli
2016/05/04 22:52:43
Done.
|
| + if not no_culprit_tests: # All tests have found culprits. |
| + break |
| + |
| + # The revision right before the suspected revision provided by |
| + # the heuristic result. |
| + potential_green_rev = sub_range[0] |
| + following_revisions = sub_range[1:] |
| + if potential_green_rev: |
| + test_results[potential_green_rev], tests_failed_in_potential_green = ( |
| + _compile_and_test_at_revision( |
| + api, target_mastername, target_buildername, target_testername, |
| + potential_green_rev, no_culprit_tests, use_analyze)) |
| + else: |
| + tests_failed_in_potential_green = {} |
| + |
| + tests_passed_in_potential_green = _get_subtracted_test_dict( |
| + no_culprit_tests, tests_failed_in_potential_green) |
| + |
| + # Culprits for tests that failed in potential green should be earlier, so |
| + # takes out passed tests and only runs failed ones in following revisions. |
|
lijeffrey
2016/05/04 19:15:19
nit: 'remove' instead of 'takes out'
chanli
2016/05/04 22:52:43
Done.
|
| + if tests_passed_in_potential_green: |
| + tests_to_run = tests_passed_in_potential_green |
| + for revision in following_revisions: |
|
stgao
2016/05/04 21:35:28
Maybe add a comment on the general idea of how this works?
chanli
2016/05/04 22:52:43
Done.
|
| + test_results[revision], tests_failed_in_revision = ( |
| + _compile_and_test_at_revision( |
| + api, target_mastername, target_buildername, target_testername, |
| + revision, tests_to_run, use_analyze)) |
| + |
| + # Takes out tests that passed in potential green and failed in |
| + # following revisions: culprits have been found for them. |
| + no_culprit_tests = _get_subtracted_test_dict( |
| + no_culprit_tests, tests_failed_in_revision) |
| + |
| + # Only runs tests that have not found culprits in later revisions. |
| + tests_to_run = _get_subtracted_test_dict( |
| + tests_to_run, tests_failed_in_revision) |
| + |
| + if not tests_to_run: |
| + break |
| + |
| finally: |
| # Give the full report including test results and metadata. |
| step_result = api.python.succeeding_step( |
| @@ -233,7 +316,9 @@ def RunSteps(api, target_mastername, target_testername, |
| def GenTests(api): |
| - def props(tests, platform_name, tester_name, use_analyze=False): |
| + def props( |
| + tests, platform_name, tester_name, use_analyze=False, good_revision=None, |
| + bad_revision=None, suspected_revisions=None): |
| properties = { |
| 'mastername': 'tryserver.chromium.%s' % platform_name, |
| 'buildername': '%s_chromium_variable' % platform_name, |
| @@ -241,11 +326,13 @@ def GenTests(api): |
| 'buildnumber': 1, |
| 'target_mastername': 'chromium.%s' % platform_name, |
| 'target_testername': tester_name, |
| - 'good_revision': 'r0', |
| - 'bad_revision': 'r1', |
| + 'good_revision': good_revision or 'r0', |
| + 'bad_revision': bad_revision or 'r1', |
| 'tests': tests, |
| 'use_analyze': use_analyze, |
| } |
| + if suspected_revisions: |
| + properties['suspected_revisions'] = suspected_revisions |
| return api.properties(**properties) + api.platform.name(platform_name) |
| def simulated_gtest_output(failed_test_names=(), passed_test_names=()): |
| @@ -467,3 +554,319 @@ def GenTests(api): |
| simulated_gtest_output(passed_test_names=['Test.One']) |
| ) |
| ) |
| + |
| + yield ( |
| + api.test('findit_culprit_in_last_sub_range') + |
| + props( |
| + {'gl_tests': ['Test.One']}, 'mac', 'Mac10.9 Tests', use_analyze=False, |
| + good_revision='r0', bad_revision='r6', suspected_revisions=['r3']) + |
| + api.override_step_data('test r2.read test spec', api.json.output({ |
| + 'Mac10.9 Tests': { |
| + 'gtest_tests': [ |
| + { |
| + 'test': 'gl_tests', |
| + 'swarming': {'can_use_on_swarming_builders': True}, |
| + }, |
| + ], |
| + }, |
| + })) + |
| + api.override_step_data('test r3.read test spec', api.json.output({ |
| + 'Mac10.9 Tests': { |
| + 'gtest_tests': [ |
| + { |
| + 'test': 'gl_tests', |
| + 'swarming': {'can_use_on_swarming_builders': True}, |
| + }, |
| + ], |
| + }, |
| + })) + |
| + api.override_step_data( |
| + 'git commits in range', |
| + api.raw_io.stream_output( |
| + '\n'.join('r%d' % i for i in reversed(range(1, 7))))) + |
| + api.override_step_data( |
| + 'test r2.gl_tests (r2) on Mac-10.9', |
| + simulated_gtest_output(passed_test_names=['Test.One'])) + |
| + api.override_step_data( |
| + 'test r3.gl_tests (r3) on Mac-10.9', |
| + simulated_gtest_output(failed_test_names=['Test.One'])) |
| + ) |
| + |
| + yield ( |
| + api.test('findit_culprit_in_middle_sub_range') + |
| + props( |
| + {'gl_tests': ['Test.One']}, 'mac', 'Mac10.9 Tests', use_analyze=False, |
| + good_revision='r0', bad_revision='r6', |
| + suspected_revisions=['r3', 'r6']) + |
| + api.override_step_data('test r2.read test spec', api.json.output({ |
| + 'Mac10.9 Tests': { |
| + 'gtest_tests': [ |
| + { |
| + 'test': 'gl_tests', |
| + 'swarming': {'can_use_on_swarming_builders': True}, |
| + }, |
| + ], |
| + }, |
| + })) + |
| + api.override_step_data('test r3.read test spec', api.json.output({ |
| + 'Mac10.9 Tests': { |
| + 'gtest_tests': [ |
| + { |
| + 'test': 'gl_tests', |
| + 'swarming': {'can_use_on_swarming_builders': True}, |
| + }, |
| + ], |
| + }, |
| + })) + |
| + api.override_step_data('test r5.read test spec', api.json.output({ |
| + 'Mac10.9 Tests': { |
| + 'gtest_tests': [ |
| + { |
| + 'test': 'gl_tests', |
| + 'swarming': {'can_use_on_swarming_builders': True}, |
| + }, |
| + ], |
| + }, |
| + })) + |
| + api.override_step_data('test r6.read test spec', api.json.output({ |
| + 'Mac10.9 Tests': { |
| + 'gtest_tests': [ |
| + { |
| + 'test': 'gl_tests', |
| + 'swarming': {'can_use_on_swarming_builders': True}, |
| + }, |
| + ], |
| + }, |
| + })) + |
| + api.override_step_data( |
| + 'git commits in range', |
| + api.raw_io.stream_output( |
| + '\n'.join('r%d' % i for i in reversed(range(1, 7))))) + |
| + api.override_step_data( |
| + 'test r2.gl_tests (r2) on Mac-10.9', |
| + simulated_gtest_output(passed_test_names=['Test.One'])) + |
| + api.override_step_data( |
| + 'test r3.gl_tests (r3) on Mac-10.9', |
| + simulated_gtest_output(failed_test_names=['Test.One'])) + |
| + api.override_step_data( |
| + 'test r5.gl_tests (r5) on Mac-10.9', |
| + simulated_gtest_output(passed_test_names=['Test.One'])) + |
| + api.override_step_data( |
| + 'test r6.gl_tests (r6) on Mac-10.9', |
| + simulated_gtest_output(passed_test_names=['Test.One'])) |
| + ) |
| + |
| + yield ( |
| + api.test('findit_culprit_in_first_sub_range') + |
| + props( |
| + {'gl_tests': ['Test.One']}, 'mac', 'Mac10.9 Tests', use_analyze=False, |
| + good_revision='r0', bad_revision='r6', |
| + suspected_revisions=['r6']) + |
| + api.override_step_data('test r1.read test spec', api.json.output({ |
| + 'Mac10.9 Tests': { |
| + 'gtest_tests': [ |
| + { |
| + 'test': 'gl_tests', |
| + 'swarming': {'can_use_on_swarming_builders': True}, |
| + }, |
| + ], |
| + }, |
| + })) + |
| + api.override_step_data('test r5.read test spec', api.json.output({ |
| + 'Mac10.9 Tests': { |
| + 'gtest_tests': [ |
| + { |
| + 'test': 'gl_tests', |
| + 'swarming': {'can_use_on_swarming_builders': True}, |
| + }, |
| + ], |
| + }, |
| + })) + |
| + api.override_step_data('test r6.read test spec', api.json.output({ |
| + 'Mac10.9 Tests': { |
| + 'gtest_tests': [ |
| + { |
| + 'test': 'gl_tests', |
| + 'swarming': {'can_use_on_swarming_builders': True}, |
| + }, |
| + ], |
| + }, |
| + })) + |
| + api.override_step_data( |
| + 'git commits in range', |
| + api.raw_io.stream_output( |
| + '\n'.join('r%d' % i for i in reversed(range(1, 7))))) + |
| + api.override_step_data( |
| + 'test r1.gl_tests (r1) on Mac-10.9', |
| + simulated_gtest_output(failed_test_names=['Test.One'])) + |
| + api.override_step_data( |
| + 'test r5.gl_tests (r5) on Mac-10.9', |
| + simulated_gtest_output(passed_test_names=['Test.One'])) + |
| + api.override_step_data( |
| + 'test r6.gl_tests (r6) on Mac-10.9', |
| + simulated_gtest_output(passed_test_names=['Test.One'])) |
| + ) |
| + |
| + yield ( |
| + api.test('findit_steps_multiple_culprits') + |
| + props( |
| + {'gl_tests': ['Test.gl_One'], 'browser_tests': ['Test.browser_One']}, |
| + 'mac', 'Mac10.9 Tests', use_analyze=False, |
| + good_revision='r0', bad_revision='r6', |
| + suspected_revisions=['r3','r6']) + |
| + api.override_step_data('test r2.read test spec', api.json.output({ |
| + 'Mac10.9 Tests': { |
| + 'gtest_tests': [ |
| + { |
| + 'test': 'gl_tests', |
| + 'swarming': {'can_use_on_swarming_builders': True}, |
| + }, |
| + { |
| + 'test': 'browser_tests', |
| + 'swarming': {'can_use_on_swarming_builders': True}, |
| + }, |
| + ], |
| + }, |
| + })) + |
| + api.override_step_data('test r3.read test spec', api.json.output({ |
| + 'Mac10.9 Tests': { |
| + 'gtest_tests': [ |
| + { |
| + 'test': 'gl_tests', |
| + 'swarming': {'can_use_on_swarming_builders': True}, |
| + }, |
| + { |
| + 'test': 'browser_tests', |
| + 'swarming': {'can_use_on_swarming_builders': True}, |
| + }, |
| + ], |
| + }, |
| + })) + |
| + api.override_step_data('test r5.read test spec', api.json.output({ |
| + 'Mac10.9 Tests': { |
| + 'gtest_tests': [ |
| + { |
| + 'test': 'gl_tests', |
| + 'swarming': {'can_use_on_swarming_builders': True}, |
| + }, |
| + { |
| + 'test': 'browser_tests', |
| + 'swarming': {'can_use_on_swarming_builders': True}, |
| + }, |
| + ], |
| + }, |
| + })) + |
| + api.override_step_data('test r6.read test spec', api.json.output({ |
| + 'Mac10.9 Tests': { |
| + 'gtest_tests': [ |
| + { |
| + 'test': 'gl_tests', |
| + 'swarming': {'can_use_on_swarming_builders': True}, |
| + }, |
| + { |
| + 'test': 'browser_tests', |
| + 'swarming': {'can_use_on_swarming_builders': True}, |
| + }, |
| + ], |
| + }, |
| + })) + |
| + api.override_step_data( |
| + 'git commits in range', |
| + api.raw_io.stream_output( |
| + '\n'.join('r%d' % i for i in reversed(range(1, 7))))) + |
| + api.override_step_data( |
| + 'test r5.gl_tests (r5) on Mac-10.9', |
| + simulated_gtest_output(failed_test_names=['Test.gl_One'])) + |
| + api.override_step_data( |
| + 'test r5.browser_tests (r5) on Mac-10.9', |
| + simulated_gtest_output(passed_test_names=['Test.browser_One'])) + |
| + api.override_step_data( |
| + 'test r6.browser_tests (r6) on Mac-10.9', |
| + simulated_gtest_output(failed_test_names=['Test.browser_One']))+ |
| + api.override_step_data( |
| + 'test r2.gl_tests (r2) on Mac-10.9', |
| + simulated_gtest_output(passed_test_names=['Test.gl_One'])) + |
| + api.override_step_data( |
| + 'test r3.gl_tests (r3) on Mac-10.9', |
| + simulated_gtest_output(failed_test_names=['Test.gl_One'])) |
| + ) |
| + |
| + yield ( |
| + api.test('findit_tests_multiple_culprits') + |
| + props( |
| + {'gl_tests': ['Test.One', 'Test.Two', 'Test.Three']}, |
| + 'mac', 'Mac10.9 Tests', use_analyze=False, |
| + good_revision='r0', bad_revision='r6', |
| + suspected_revisions=['r3', 'r5']) + |
| + api.override_step_data('test r2.read test spec', api.json.output({ |
| + 'Mac10.9 Tests': { |
| + 'gtest_tests': [ |
| + { |
| + 'test': 'gl_tests', |
| + 'swarming': {'can_use_on_swarming_builders': True}, |
| + }, |
| + ], |
| + }, |
| + })) + |
| + api.override_step_data('test r3.read test spec', api.json.output({ |
| + 'Mac10.9 Tests': { |
| + 'gtest_tests': [ |
| + { |
| + 'test': 'gl_tests', |
| + 'swarming': {'can_use_on_swarming_builders': True}, |
| + }, |
| + ], |
| + }, |
| + })) + |
| + api.override_step_data('test r4.read test spec', api.json.output({ |
| + 'Mac10.9 Tests': { |
| + 'gtest_tests': [ |
| + { |
| + 'test': 'gl_tests', |
| + 'swarming': {'can_use_on_swarming_builders': True}, |
| + }, |
| + ], |
| + }, |
| + })) + |
| + api.override_step_data('test r5.read test spec', api.json.output({ |
| + 'Mac10.9 Tests': { |
| + 'gtest_tests': [ |
| + { |
| + 'test': 'gl_tests', |
| + 'swarming': {'can_use_on_swarming_builders': True}, |
| + }, |
| + ], |
| + }, |
| + })) + |
| + api.override_step_data('test r6.read test spec', api.json.output({ |
| + 'Mac10.9 Tests': { |
| + 'gtest_tests': [ |
| + { |
| + 'test': 'gl_tests', |
| + 'swarming': {'can_use_on_swarming_builders': True}, |
| + }, |
| + ], |
| + }, |
| + })) + |
| + api.override_step_data( |
| + 'git commits in range', |
| + api.raw_io.stream_output( |
| + '\n'.join('r%d' % i for i in reversed(range(1, 7))))) + |
| + api.override_step_data( |
| + 'test r4.gl_tests (r4) on Mac-10.9', |
| + simulated_gtest_output(passed_test_names=['Test.One', 'Test.Three'], |
| + failed_test_names=['Test.Two'])) + |
| + api.override_step_data( |
| + 'test r5.gl_tests (r5) on Mac-10.9', |
| + simulated_gtest_output(passed_test_names=['Test.One'], |
| + failed_test_names=['Test.Three'])) + |
| + api.override_step_data( |
| + 'test r6.gl_tests (r6) on Mac-10.9', |
| + simulated_gtest_output(failed_test_names=['Test.One']))+ |
| + api.override_step_data( |
| + 'test r2.gl_tests (r2) on Mac-10.9', |
| + simulated_gtest_output(passed_test_names=['Test.Two'])) + |
| + api.override_step_data( |
| + 'test r3.gl_tests (r3) on Mac-10.9', |
| + simulated_gtest_output(failed_test_names=['Test.Two'])) |
| + ) |