Chromium Code Reviews
chromiumcodereview-hr@appspot.gserviceaccount.com (chromiumcodereview-hr) | Please choose your nickname with Settings | Help | Chromium Project | Gerrit Changes | Sign out
(9)

Side by Side Diff: tools/auto_bisect/bisect_perf_regression_test.py

Issue 644323002: Requiring confidence in initial regression range before bisecting. (Closed) Base URL: https://chromium.googlesource.com/chromium/src.git@master
Patch Set: Rebasing. Created 6 years, 2 months ago
Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.
Jump to:
View unified diff | Download patch
« no previous file with comments | « tools/auto_bisect/bisect_perf_regression.py ('k') | no next file » | no next file with comments »
Toggle Intra-line Diffs ('i') | Expand Comments ('e') | Collapse Comments ('c') | Show Comments Hide Comments ('s')
OLDNEW
1 # Copyright 2014 The Chromium Authors. All rights reserved. 1 # Copyright 2014 The Chromium Authors. All rights reserved.
2 # Use of this source code is governed by a BSD-style license that can be 2 # Use of this source code is governed by a BSD-style license that can be
3 # found in the LICENSE file. 3 # found in the LICENSE file.
4 4
5 import os 5 import os
6 import re 6 import re
7 import shutil 7 import shutil
8 import sys 8 import sys
9 import unittest 9 import unittest
10 10
11 SRC = os.path.join(os.path.dirname(__file__), os.path.pardir, os.path.pardir) 11 SRC = os.path.join(os.path.dirname(__file__), os.path.pardir, os.path.pardir)
12 sys.path.append(os.path.join(SRC, 'third_party', 'pymock')) 12 sys.path.append(os.path.join(SRC, 'third_party', 'pymock'))
13 13
14 import bisect_perf_regression 14 import bisect_perf_regression
15 import bisect_results 15 import bisect_results
16 import mock 16 import mock
17 import source_control 17 import source_control
18 18
19 19
20 # Regression confidence: 0%
21 CLEAR_NON_REGRESSION = [
22 # Mean: 30.223 Std. Dev.: 11.383
23 [[16.886], [16.909], [16.99], [17.723], [17.952], [18.118], [19.028],
24 [19.552], [21.954], [38.573], [38.839], [38.965], [40.007], [40.572],
25 [41.491], [42.002], [42.33], [43.109], [43.238]],
26 # Mean: 34.76 Std. Dev.: 11.516
27 [[16.426], [17.347], [20.593], [21.177], [22.791], [27.843], [28.383],
28 [28.46], [29.143], [40.058], [40.303], [40.558], [41.918], [42.44],
29 [45.223], [46.494], [50.002], [50.625], [50.839]]
30 ]
31 # Regression confidence: ~ 90%
32 ALMOST_REGRESSION = [
33 # Mean: 30.042 Std. Dev.: 2.002
34 [[26.146], [28.04], [28.053], [28.074], [28.168], [28.209], [28.471],
35 [28.652], [28.664], [30.862], [30.973], [31.002], [31.897], [31.929],
36 [31.99], [32.214], [32.323], [32.452], [32.696]],
37 # Mean: 33.008 Std. Dev.: 4.265
38 [[34.963], [30.741], [39.677], [39.512], [34.314], [31.39], [34.361],
39 [25.2], [30.489], [29.434]]
40 ]
41 # Regression confidence: ~ 98%
42 BARELY_REGRESSION = [
43 # Mean: 28.828 Std. Dev.: 1.993
44 [[26.96], [27.605], [27.768], [27.829], [28.006], [28.206], [28.393],
45 [28.911], [28.933], [30.38], [30.462], [30.808], [31.74], [31.805],
46 [31.899], [32.077], [32.454], [32.597], [33.155]],
47 # Mean: 31.156 Std. Dev.: 1.980
48 [[28.729], [29.112], [29.258], [29.454], [29.789], [30.036], [30.098],
49 [30.174], [30.534], [32.285], [32.295], [32.552], [32.572], [32.967],
50 [33.165], [33.403], [33.588], [33.744], [34.147], [35.84]]
51 ]
52 # Regression confidence: 99.5%
53 CLEAR_REGRESSION = [
54 # Mean: 30.254 Std. Dev.: 2.987
55 [[26.494], [26.621], [26.701], [26.997], [26.997], [27.05], [27.37],
56 [27.488], [27.556], [31.846], [32.192], [32.21], [32.586], [32.596],
57 [32.618], [32.95], [32.979], [33.421], [33.457], [34.97]],
58 # Mean: 33.190 Std. Dev.: 2.972
59 [[29.547], [29.713], [29.835], [30.132], [30.132], [30.33], [30.406],
60 [30.592], [30.72], [34.486], [35.247], [35.253], [35.335], [35.378],
61 [35.934], [36.233], [36.41], [36.947], [37.982]]
62 ]
20 # Default options for the dry run 63 # Default options for the dry run
21 DEFAULT_OPTIONS = { 64 DEFAULT_OPTIONS = {
22 'debug_ignore_build': True, 65 'debug_ignore_build': True,
23 'debug_ignore_sync': True, 66 'debug_ignore_sync': True,
24 'debug_ignore_perf_test': True, 67 'debug_ignore_perf_test': True,
68 'debug_ignore_regression_confidence': True,
25 'command': 'fake_command', 69 'command': 'fake_command',
26 'metric': 'fake/metric', 70 'metric': 'fake/metric',
27 'good_revision': 280000, 71 'good_revision': 280000,
28 'bad_revision': 280005, 72 'bad_revision': 280005,
29 } 73 }
30 74
75 # This global is a placeholder for a generator to be defined by the testcases
76 # that use _MockRunTests.
77 _MockResultsGenerator = (x for x in [])
78
79 def _FakeTestResult(values):
80 result_dict = {'mean': 0.0, 'std_err': 0.0, 'std_dev': 0.0, 'values': values}
81 success_code = 0
82 return (result_dict, success_code)
83
84
85 def _MockRunTests(*args, **kwargs):
86 _, _ = args, kwargs
87 return _FakeTestResult(_MockResultsGenerator.next())
88
31 89
32 def _GetBisectPerformanceMetricsInstance(options_dict): 90 def _GetBisectPerformanceMetricsInstance(options_dict):
33 """Returns an instance of the BisectPerformanceMetrics class.""" 91 """Returns an instance of the BisectPerformanceMetrics class."""
34 bisect_options = bisect_perf_regression.BisectOptions.FromDict(options_dict) 92 bisect_options = bisect_perf_regression.BisectOptions.FromDict(options_dict)
35 bisect_instance = bisect_perf_regression.BisectPerformanceMetrics( 93 bisect_instance = bisect_perf_regression.BisectPerformanceMetrics(
36 bisect_options) 94 bisect_options)
37 return bisect_instance 95 return bisect_instance
38 96
39 97
40 def _GetExtendedOptions(d, f): 98 def _GetExtendedOptions(improvement_dir, fake_first, ignore_confidence=True):
41 """Returns a copy of the default options dict plus some options.""" 99 """Returns a copy of the default options dict plus some options."""
42 result = dict(DEFAULT_OPTIONS) 100 result = dict(DEFAULT_OPTIONS)
43 result.update({ 101 result.update({
44 'improvement_direction': d, 102 'improvement_direction': improvement_dir,
45 'debug_fake_first_test_mean': f}) 103 'debug_fake_first_test_mean': fake_first,
104 'debug_ignore_regression_confidence': ignore_confidence})
46 return result 105 return result
47 106
48 107
49 def _GenericDryRun(options, print_results=False): 108 def _GenericDryRun(options, print_results=False):
50 """Performs a dry run of the bisector. 109 """Performs a dry run of the bisector.
51 110
52 Args: 111 Args:
53 options: Dictionary containing the options for the bisect instance. 112 options: Dictionary containing the options for the bisect instance.
54 print_results: Boolean telling whether to call FormatAndPrintResults. 113 print_results: Boolean telling whether to call FormatAndPrintResults.
55 114
(...skipping 238 matching lines...) Expand 10 before | Expand all | Expand 10 after
294 def testDryRun(self): 353 def testDryRun(self):
295 """Does a dry run of the bisect script. 354 """Does a dry run of the bisect script.
296 355
297 This serves as a smoke test to catch errors in the basic execution of the 356 This serves as a smoke test to catch errors in the basic execution of the
298 script. 357 script.
299 """ 358 """
300 _GenericDryRun(DEFAULT_OPTIONS, True) 359 _GenericDryRun(DEFAULT_OPTIONS, True)
301 360
302 def testBisectImprovementDirectionFails(self): 361 def testBisectImprovementDirectionFails(self):
303 """Dry run of a bisect with an improvement instead of regression.""" 362 """Dry run of a bisect with an improvement instead of regression."""
304
305 # Test result goes from 0 to 100 where higher is better 363 # Test result goes from 0 to 100 where higher is better
306 results = _GenericDryRun(_GetExtendedOptions(1, 100)) 364 results = _GenericDryRun(_GetExtendedOptions(1, 100))
307 self.assertIsNotNone(results.error) 365 self.assertIsNotNone(results.error)
308 self.assertIn('not a regression', results.error) 366 self.assertIn('not a regression', results.error)
367
309 # Test result goes from 0 to -100 where lower is better 368 # Test result goes from 0 to -100 where lower is better
310 results = _GenericDryRun(_GetExtendedOptions(-1, -100)) 369 results = _GenericDryRun(_GetExtendedOptions(-1, -100))
311 self.assertIsNotNone(results.error) 370 self.assertIsNotNone(results.error)
312 self.assertIn('not a regression', results.error) 371 self.assertIn('not a regression', results.error)
313 372
314 def testBisectImprovementDirectionSucceeds(self): 373 def testBisectImprovementDirectionSucceeds(self):
315 """Bisects with improvement direction matching regression range.""" 374 """Bisects with improvement direction matching regression range."""
316 # Test result goes from 0 to 100 where lower is better 375 # Test result goes from 0 to 100 where lower is better
317 results = _GenericDryRun(_GetExtendedOptions(-1, 100)) 376 results = _GenericDryRun(_GetExtendedOptions(-1, 100))
318 self.assertIsNone(results.error) 377 self.assertIsNone(results.error)
319 # Test result goes from 0 to -100 where higher is better 378 # Test result goes from 0 to -100 where higher is better
320 results = _GenericDryRun(_GetExtendedOptions(1, -100)) 379 results = _GenericDryRun(_GetExtendedOptions(1, -100))
321 self.assertIsNone(results.error) 380 self.assertIsNone(results.error)
322 381
382 @mock.patch('bisect_perf_regression.BisectPerformanceMetrics.'
383 'RunPerformanceTestAndParseResults', _MockRunTests)
384 def testBisectStopsOnDoubtfulRegression(self):
385 global _MockResultsGenerator
386 _MockResultsGenerator = (rs for rs in CLEAR_NON_REGRESSION)
387 results = _GenericDryRun(_GetExtendedOptions(0, 0, False))
388 self.assertIsNotNone(results.error)
389 self.assertIn('could not reproduce the regression', results.error)
390
391 _MockResultsGenerator = (rs for rs in ALMOST_REGRESSION)
392 results = _GenericDryRun(_GetExtendedOptions(0, 0, False))
393 self.assertIsNotNone(results.error)
394 self.assertIn('could not reproduce the regression', results.error)
395
396 @mock.patch('bisect_perf_regression.BisectPerformanceMetrics.'
397 'RunPerformanceTestAndParseResults', _MockRunTests)
398 def testBisectContinuesOnClearRegression(self):
399 global _MockResultsGenerator
400 _MockResultsGenerator = (rs for rs in CLEAR_REGRESSION)
401 with self.assertRaises(StopIteration):
402 _GenericDryRun(_GetExtendedOptions(0, 0, False))
403
404 _MockResultsGenerator = (rs for rs in BARELY_REGRESSION)
405 with self.assertRaises(StopIteration):
406 _GenericDryRun(_GetExtendedOptions(0, 0, False))
323 407
324 def testGetCommitPosition(self): 408 def testGetCommitPosition(self):
325 cp_git_rev = '7017a81991de983e12ab50dfc071c70e06979531' 409 cp_git_rev = '7017a81991de983e12ab50dfc071c70e06979531'
326 self.assertEqual(291765, source_control.GetCommitPosition(cp_git_rev)) 410 self.assertEqual(291765, source_control.GetCommitPosition(cp_git_rev))
327 411
328 svn_git_rev = 'e6db23a037cad47299a94b155b95eebd1ee61a58' 412 svn_git_rev = 'e6db23a037cad47299a94b155b95eebd1ee61a58'
329 self.assertEqual(291467, source_control.GetCommitPosition(svn_git_rev)) 413 self.assertEqual(291467, source_control.GetCommitPosition(svn_git_rev))
330 414
331 def testGetCommitPositionForV8(self): 415 def testGetCommitPositionForV8(self):
332 bisect_instance = _GetBisectPerformanceMetricsInstance(DEFAULT_OPTIONS) 416 bisect_instance = _GetBisectPerformanceMetricsInstance(DEFAULT_OPTIONS)
(...skipping 209 matching lines...) Expand 10 before | Expand all | Expand 10 after
542 '--diff=%s' % patch_content 626 '--diff=%s' % patch_content
543 ], (None, 0)) 627 ], (None, 0))
544 ] 628 ]
545 self._SetupRunGitMock(try_cmd) 629 self._SetupRunGitMock(try_cmd)
546 bisect_perf_regression._BuilderTryjob( 630 bisect_perf_regression._BuilderTryjob(
547 git_revision, bot_name, bisect_job_name, patch) 631 git_revision, bot_name, bisect_job_name, patch)
548 632
549 633
550 if __name__ == '__main__': 634 if __name__ == '__main__':
551 unittest.main() 635 unittest.main()
OLDNEW
« no previous file with comments | « tools/auto_bisect/bisect_perf_regression.py ('k') | no next file » | no next file with comments »

Powered by Google App Engine
This is Rietveld 408576698