tools/bisect-builds.py - Issue 7329005: Add programmatic interface

Unified Diff: tools/bisect-builds.py

Issue 7329005: Add programmatic interface (Closed) Base URL: http://git.chromium.org/git/chromium.git@trunk

Patch Set: Created 9 years, 5 months ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View side-by-side diff with in-line comments

Index: tools/bisect-builds.py

diff --git a/tools/bisect-builds.py b/tools/bisect-builds.py

index d9c056904b113b295266d6b2b5716e7eae0a9222..549d4228f86809ad58977ced0af03b012c0c7822 100755

--- a/tools/bisect-builds.py

+++ b/tools/bisect-builds.py

@@ -13,7 +13,7 @@ it will ask you whether it is good or bad before continuing the search.

"""

# The root URL for storage.

-BASE_URL = 'http://commondatastorage.googleapis.com/chromium-browser-continuous'

+BASE_URL = 'http://commondatastorage.googleapis.com/chromium-browser-snapshots'

# URL to the ViewVC commit page.

BUILD_VIEWVC_URL = 'http://src.chromium.org/viewvc/chrome?view=rev&revision=%d'

@@ -35,6 +35,8 @@ import tempfile

import urllib

from xml.etree import ElementTree

import zipfile

+import subprocess

+import threading

Evan Martin 2011/07/14 18:57:52 I think this list is alphabetized.

szager 2011/07/14 19:23:03 Done.

class PathContext(object):

"""A PathContext is used to carry the information used to construct URLs and

@@ -53,13 +55,13 @@ class PathContext(object):

# _listing_platform_dir = Directory that holds revisions. Ends with a '/'.

# _archive_extract_dir = Uncompressed directory in the archive_name file.

# _binary_name = The name of the executable to run.

- if self.platform == 'linux' or self.platform == 'linux-64':

+ if self.platform == 'linux' or self.platform == 'linux64':

self._listing_platform_dir = 'Linux/'

self.archive_name = 'chrome-linux.zip'

self._archive_extract_dir = 'chrome-linux'

self._binary_name = 'chrome'

# Linux and x64 share all the same path data except for the archive dir.

- if self.platform == 'linux-64':

+ if self.platform == 'linux64':

self._listing_platform_dir = 'Linux_x64/'

elif self.platform == 'mac':

self._listing_platform_dir = 'Mac/'

@@ -84,8 +86,8 @@ class PathContext(object):

def GetDownloadURL(self, revision):

"""Gets the download URL for a build archive of a specific revision."""

- return BASE_URL + '/' + self._listing_platform_dir + str(revision) + '/' + \

- self.archive_name

+ return "%s/%s%d/%s" % (

+ BASE_URL, self._listing_platform_dir, revision, self.archive_name)

def GetLastChangeURL(self):

"""Returns a URL to the LAST_CHANGE file."""

@@ -99,9 +101,11 @@ class PathContext(object):

def UnzipFilenameToDir(filename, dir):

"""Unzip |filename| to directory |dir|."""

+ pushd = os.getcwd()

+ if not os.path.isabs(filename):

+ filename = os.path.join(pushd, filename)

zf = zipfile.ZipFile(filename)

# Make base.

- pushd = os.getcwd()

try:

if not os.path.isdir(dir):

os.mkdir(dir)

@@ -161,7 +165,15 @@ def ParseDirectoryIndex(context):

# The <Prefix> nodes have content of the form of

# |_listing_platform_dir/revision/|. Strip off the platform dir and the

# trailing slash to just have a number.

- revisions = map(lambda x: x.text[len(prefix):-1], all_prefixes)

+ #revisions = map(lambda x: x.text[len(prefix):-1], all_prefixes)

Evan Martin 2011/07/14 18:57:52 Did you mean to leave in this commented-out code?

szager 2011/07/14 19:23:03 Deleted!

+ revisions = []

+ for pf in all_prefixes:

Robert Sesek 2011/07/15 16:27:14 What's "pf"? |prefix| is fine.

+ revnum = pf.text[len(prefix):-1]

+ try:

+ revnum = int(revnum)

+ revisions.append(revnum)

+ except ValueError:

+ pass

return (revisions, next_marker)

# Fetch the first list of revisions.

@@ -186,63 +198,164 @@ def GetRevList(context):

revlist.sort()

return revlist

+def FetchRevision(context, rev, filename, quit_event=None) :

+ """Downloads and unzips revision |rev|"""

-def TryRevision(context, rev, profile, args):

- """Downloads revision |rev|, unzips it, and opens it for the user to test.

- |profile| is the profile to use."""

- # Do this in a temp dir so we don't collide with user files.

- cwd = os.getcwd()

- tempdir = tempfile.mkdtemp(prefix='bisect_tmp')

- os.chdir(tempdir)

+ def ReportHook(blocknum, blocksize, totalsize):

+ if quit_event and quit_event.is_set():

+ raise RuntimeError("Aborting download of revision %d" % rev)

- # Download the file.

download_url = context.GetDownloadURL(rev)

- def _ReportHook(blocknum, blocksize, totalsize):

- size = blocknum * blocksize

- if totalsize == -1: # Total size not known.

- progress = "Received %d bytes" % size

- else:

- size = min(totalsize, size)

- progress = "Received %d of %d bytes, %.2f%%" % (

- size, totalsize, 100.0 * size / totalsize)

- # Send a \r to let all progress messages use just one line of output.

- sys.stdout.write("\r" + progress)

- sys.stdout.flush()

try:

- print 'Fetching ' + download_url

- urllib.urlretrieve(download_url, context.archive_name, _ReportHook)

- print

- except Exception, e:

- print('Could not retrieve the download. Sorry.')

- sys.exit(-1)

+ urllib.urlretrieve(download_url, filename, ReportHook)

+ except RuntimeError, e:

+ pass

+def RunRevision(context, revision, zipfile, profile, args) :

+ """Given a zipped revision, unzip it and run the test"""

+ print "Trying revision %d..." % revision

- # Unzip the file.

- print 'Unzipping ...'

- UnzipFilenameToDir(context.archive_name, os.curdir)

+ # Create a temp directory and unzip the revision into it

+ cwd = os.getcwd()

+ tempdir = tempfile.mkdtemp(prefix='bisect_tmp')

+ UnzipFilenameToDir(zipfile, tempdir)

+ os.chdir(tempdir)

- # Tell the system to open the app.

- args = ['--user-data-dir=%s' % profile] + args

- flags = ' '.join(map(pipes.quote, args))

- cmd = '%s %s' % (context.GetLaunchPath(), flags)

- print 'Running %s' % cmd

- os.system(cmd)

+ # Run the test

+ testargs = [context.GetLaunchPath(), '--user-data-dir=%s' % profile] + args

+ subproc = subprocess.Popen(testargs,

+ bufsize=-1,

+ stdout=subprocess.PIPE,

+ stderr=subprocess.PIPE)

+ (stdout, stderr) = subproc.communicate()

os.chdir(cwd)

- print 'Cleaning temp dir ...'

try:

shutil.rmtree(tempdir, True)

except Exception, e:

pass

+ return (subproc.returncode, stdout, stderr)

-def AskIsGoodBuild(rev):

+def ResultIsGood(status, stdout, stderr) :

"""Ask the user whether build |rev| is good or bad."""

# Loop until we get a response that we can parse.

while True:

- response = raw_input('\nBuild %d is [(g)ood/(b)ad]: ' % int(rev))

+ response = raw_input('Build is [(g)ood/(b)ad/(q)uit]: ')

if response and response in ('g', 'b'):

return response == 'g'

+ if response and response == 'q':

+ raise SystemExit()

+def bisect(platform=None,

Evan Martin 2011/07/14 18:57:52 Capital B on function names. (Our Python style is

szager 2011/07/14 19:23:03 Done.

+ profile="",

+ run_args=(),

+ good_rev=0,

+ bad_rev=0,

+ predicate=ResultIsGood):

+ """Given known good and known bad revisions, run a binary search on all

+ archived revisions to determine the last known good revision."""

+ context = PathContext(platform, good_rev, bad_rev)

+ cwd = os.getcwd()

+ revlist = GetRevList(context)

+ # Get a list of revisions to bisect across.

+ if len(revlist) < 2: # Don't have enough builds to bisect

+ msg = 'We don\'t have enough builds to bisect. revlist: %s' % revlist

+ raise RuntimeError(msg)

+ # If we don't have a |good_rev|, set it to be the first revision possible.

+ if good_rev == 0:

+ good_rev = revlist[0]

+ # Figure out our bookends and first pivot point; fetch the pivot revision

+ good = 0

+ bad = len(revlist) - 1

+ pivot = bad/2

+ rev = revlist[pivot]

+ zipfile = os.path.join(cwd, '%d-%s' % (rev, context.archive_name))

+ FetchRevision(context, rev, zipfile)

+ # Binary search time!

+ while zipfile and bad - good > 1:

+ print "iterating with good=%d bad=%d pivot=%d" % (

+ revlist[good], revlist[bad], revlist[pivot])

+ # Pre-fetch next two possible pivots

+ down_pivot = int((pivot - good) / 2) + good

+ down_thread = None

+ if down_pivot != pivot and down_pivot != good :

+ down_rev = revlist[down_pivot]

+ zipfile_base = '%d-%s' % (down_rev, context.archive_name)

+ down_zipfile = os.path.join(cwd, zipfile_base)

+ down_event = threading.Event()

+ fetchargs = (context, down_rev, down_zipfile, down_event)

+ down_thread = threading.Thread(target=FetchRevision,

+ name='down_fetch',

+ args=fetchargs)

+ down_thread.start()

+ up_pivot = int((bad - pivot) / 2) + pivot

+ up_thread = None

+ if up_pivot != pivot and up_pivot != bad :

+ up_rev = revlist[up_pivot]

+ zipfile_base = '%d-%s' % (up_rev, context.archive_name)

+ up_zipfile = os.path.join(cwd, zipfile_base)

+ up_event = threading.Event()

+ fetchargs = (context, up_rev, up_zipfile, up_event)

+ up_thread = threading.Thread(target=FetchRevision,

+ name='up_fetch',

+ args=fetchargs)

+ up_thread.start()

+ # Run test on the pivot revision

+ (status, stdout, stderr) = RunRevision(context,

+ rev,

+ zipfile,

+ profile,

+ run_args)

+ os.unlink(zipfile)

+ zipfile = None

+ try:

+ if predicate(status, stdout, stderr) :

+ good = pivot

+ if down_thread :

+ down_event.set() # Kill the download of older revision

+ down_thread.join()

+ os.unlink(down_zipfile)

+ if up_thread :

+ print "Downloading revision %d..." % up_rev

+ up_thread.join() # Wait for newer revision to finish downloading

+ pivot = up_pivot

+ zipfile = up_zipfile

+ else :

+ bad = pivot

+ if up_thread :

+ up_event.set() # Kill download of newer revision

+ up_thread.join()

+ os.unlink(up_zipfile)

+ if down_thread :

+ print "Downloading revision %d..." % down_rev

+ down_thread.join() # Wait for older revision to finish downloading

+ pivot = down_pivot

+ zipfile = down_zipfile

+ except SystemExit:

+ for f in [down_zipfile, up_zipfile]:

+ try:

+ os.unlink(f)

+ except OSError:

+ pass

+ sys.exit(0)

Evan Martin 2011/07/14 18:57:52 Is this both moving the code and making changes to

szager 2011/07/14 19:23:03 I had move the main loop out of main() to enable t

+ rev = revlist[pivot]

+ return (good, bad)

+################################################################################

def main():

usage = ('%prog [options] [-- chromium-options]\n'

@@ -281,11 +394,7 @@ def main():

# Create the context. Initialize 0 for the revisions as they are set below.

context = PathContext(opts.archive, 0, 0)

- # Pick a starting point, try to get HEAD for this.

- if opts.bad:

- bad_rev = opts.bad

- else:

- bad_rev = 0

+ if not opts.bad :

try:

# Location of the latest build revision number

nh = urllib.urlopen(context.GetLastChangeURL())

@@ -294,71 +403,30 @@ def main():

bad_rev = raw_input('Bad revision [HEAD:%d]: ' % latest)

if (bad_rev == ''):

bad_rev = latest

- bad_rev = int(bad_rev)

+ opts.bad = int(bad_rev)

except Exception, e:

print('Could not determine latest revision. This could be bad...')

- bad_rev = int(raw_input('Bad revision: '))

+ opts.bad = int(raw_input('Bad revision: '))

- # Find out when we were good.

- if opts.good:

- good_rev = opts.good

- else:

- good_rev = 0

+ if not opts.good :

try:

- good_rev = int(raw_input('Last known good [0]: '))

+ opts.good = int(raw_input('Last known good [0]: '))

except Exception, e:

pass

- # Set the input parameters now that they've been validated.

- context.good_revision = good_rev

- context.bad_revision = bad_rev

- # Get a list of revisions to bisect across.

- revlist = GetRevList(context)

- if len(revlist) < 2: # Don't have enough builds to bisect

- print 'We don\'t have enough builds to bisect. revlist: %s' % revlist

- sys.exit(1)

- # If we don't have a |good_rev|, set it to be the first revision possible.

- if good_rev == 0:

- good_rev = revlist[0]

- # These are indexes of |revlist|.

- good = 0

- bad = len(revlist) - 1

- last_known_good_rev = revlist[good]

+ try :

+ (good, bad) = bisect(opts.archive, opts.profile, args, opts.good, opts.bad)

+ # We're done. Let the user know the results in an official manner.

+ print('You are probably looking for build %d.' % bad)

+ clog_url = CHANGELOG_URL % (good, bad)

+ print('CHANGELOG URL: %s' % clog_url)

+ build_url = BUILD_VIEWVC_URL % bad

+ print('Built at revision: %s' % build_url)

+ return 0

+ except Exception, e:

+ print e

+ return 1

- # Binary search time!

- while good < bad:

- candidates = revlist[good:bad]

- num_poss = len(candidates)

- if num_poss > 10:

- print('%d candidates. %d tries left.' %

- (num_poss, round(math.log(num_poss, 2))))

- else:

- print('Candidates: %s' % revlist[good:bad])

- # Cut the problem in half...

- test = int((bad - good) / 2) + good

- test_rev = revlist[test]

- # Let the user give this rev a spin (in her own profile, if she wants).

- profile = opts.profile

- if not profile:

- profile = 'profile' # In a temp dir.

- TryRevision(context, test_rev, profile, args)

- if AskIsGoodBuild(test_rev):

- last_known_good_rev = revlist[good]

- good = test + 1

- else:

- bad = test

- # We're done. Let the user know the results in an official manner.

- print('You are probably looking for build %d.' % revlist[bad])

- print('CHANGELOG URL:')

- print(CHANGELOG_URL % (last_known_good_rev, revlist[bad]))

- print('Built at revision:')

- print(BUILD_VIEWVC_URL % revlist[bad])

if __name__ == '__main__':

sys.exit(main())

« no previous file with comments | « no previous file | no next file » | no next file with comments »