Chromium Code Reviews| Index: tools/bisect-builds.py |
| diff --git a/tools/bisect-builds.py b/tools/bisect-builds.py |
| index 4aa177279052db497244d634e8f26194a47b330e..d41c1c227ff427e14151671630a55625f00b5d71 100755 |
| --- a/tools/bisect-builds.py |
| +++ b/tools/bisect-builds.py |
| @@ -12,33 +12,13 @@ unzipping, and opening Chromium for you. After testing the specific revision, |
| it will ask you whether it is good or bad before continuing the search. |
| """ |
| -# Base URL to download snapshots from. |
| -BUILD_BASE_URL = 'http://build.chromium.org/f/chromium/continuous/' |
| - |
| -# The index file that lists all the builds. This lives in BUILD_BASE_URL. |
| -BUILD_INDEX_FILE = 'all_builds.txt' |
| - |
| -# The type (platform) of the build archive. This is what's passed in to the |
| -# '-a/--archive' option. |
| -BUILD_ARCHIVE_TYPE = '' |
| - |
| -# The location of the builds. Format this with a (date, revision) tuple, which |
| -# can be obtained through ParseIndexLine(). |
| -BUILD_ARCHIVE_URL = '/%s/%d/' |
| - |
| -# Name of the build archive. |
| -BUILD_ZIP_NAME = '' |
| - |
| -# Directory name inside the archive. |
| -BUILD_DIR_NAME = '' |
| - |
| -# Name of the executable. |
| -BUILD_EXE_NAME = '' |
| +# The root URL for storage. |
| +BASE_URL = 'http://commondatastorage.googleapis.com/chromium-browser-continuous' |
| # URL to the ViewVC commit page. |
| BUILD_VIEWVC_URL = 'http://src.chromium.org/viewvc/chrome?view=rev&revision=%d' |
| -# Changelogs URL |
| +# Changelogs URL. |
| CHANGELOG_URL = 'http://build.chromium.org/f/chromium/' \ |
| 'perf/dashboard/ui/changelog.html?url=/trunk/src&range=%d:%d' |
| @@ -53,8 +33,71 @@ import shutil |
| import sys |
| import tempfile |
| import urllib |
| +from xml.etree import ElementTree |
| import zipfile |
| +class PathContext(object): |
| + """A PathContext is used to carry the information used to construct URLs and |
| + paths when dealing with the storage server and archives.""" |
| + def __init__(self, platform, good_revision, bad_revision): |
| + super(PathContext, self).__init__() |
| + # Store off the input parameters. |
| + self.platform = platform # What's passed in to the '-a/--archive' option. |
| + self.good_revision = good_revision |
| + self.bad_revision = bad_revision |
| + |
| + # The name of the ZIP file in a revision directory on the server. |
| + self.archive_name = None |
| + |
| + # Set some internal members: |
| + # _listing_platform_dir = Directory that holds revisions. Ends with a '/'. |
| + # _archive_extract_dir = Uncompressed directory in the archive_name file. |
| + # _binary_name = The name of the executable to run. |
| + if self.platform == 'linux' or self.platform == 'linux-64': |
| + self._listing_platform_dir = 'Linux/' |
| + self.archive_name = 'chrome-linux.zip' |
| + self._archive_extract_dir = 'chrome-linux' |
| + self._binary_name = 'chrome' |
| + # Linux and x64 share all the same path data except for the archive dir. |
| + if self.platform == 'linux-64': |
| + self._listing_platform_dir = 'Linux_x64/' |
| + elif self.platform == 'mac': |
| + self._listing_platform_dir = 'Mac/' |
| + self.archive_name = 'chrome-mac.zip' |
| + self._archive_extract_dir = 'chrome-mac' |
| + self._binary_name = 'Chromium.app/Contents/MacOS/Chromium' |
| + elif self.platform == 'win': |
| + self._listing_platform_dir = 'Win/' |
| + self.archive_name = 'chrome-win32.zip' |
| + self._archive_extract_dir = 'chrome-win32' |
| + self._binary_name = 'chrome.exe' |
| + else: |
| + raise Exception("Invalid platform") |
| + |
| + def GetListingURL(self, revision_offset=None): |
| + """Returns the URL for a directory listing, with an optional starting |
| + revision.""" |
| + marker = '' |
| + if revision_offset: |
| + marker = '&marker=' + self._listing_platform_dir + \ |
| + str(revision_offset) + '/' |
| + return BASE_URL + '/?delimiter=/&prefix=' + self._listing_platform_dir + \ |
| + marker |
| + |
| + def GetDownloadURL(self, revision): |
| + """Gets the download URL for a build archive of a specific revision.""" |
| + return BASE_URL + '/' + self._listing_platform_dir + str(revision) + '/' + \ |
| + self.archive_name |
| + |
| + def GetLastChangeURL(self): |
| + """Returns a URL to the LAST_CHANGE file.""" |
| + return BASE_URL + '/' + self._listing_platform_dir + 'LAST_CHANGE' |
| + |
| + def GetLaunchPath(self): |
| + """Returns a relative path (presumably from the archive extraction location) |
| + that is used to run the executable.""" |
| + return os.path.join(self._archive_extract_dir, self._binary_name) |
| + |
| def UnzipFilenameToDir(filename, dir): |
| """Unzip |filename| to directory |dir|.""" |
| @@ -86,89 +129,78 @@ def UnzipFilenameToDir(filename, dir): |
| sys.exit(1) |
| -def SetArchiveVars(archive): |
| - """Set a bunch of global variables appropriate for the specified archive.""" |
| - global BUILD_ARCHIVE_TYPE |
| - global BUILD_ZIP_NAME |
| - global BUILD_DIR_NAME |
| - global BUILD_EXE_NAME |
| - global BUILD_BASE_URL |
| - |
| - BUILD_ARCHIVE_TYPE = archive |
| - |
| - if BUILD_ARCHIVE_TYPE in ('linux', 'linux64', 'linux-chromiumos'): |
| - BUILD_ZIP_NAME = 'chrome-linux.zip' |
| - BUILD_DIR_NAME = 'chrome-linux' |
| - BUILD_EXE_NAME = 'chrome' |
| - elif BUILD_ARCHIVE_TYPE in ('mac'): |
| - BUILD_ZIP_NAME = 'chrome-mac.zip' |
| - BUILD_DIR_NAME = 'chrome-mac' |
| - BUILD_EXE_NAME = 'Chromium.app/Contents/MacOS/Chromium' |
| - elif BUILD_ARCHIVE_TYPE in ('win'): |
| - BUILD_ZIP_NAME = 'chrome-win32.zip' |
| - BUILD_DIR_NAME = 'chrome-win32' |
| - BUILD_EXE_NAME = 'chrome.exe' |
| - |
| - |
| -def ParseDirectoryIndex(url): |
| - """Parses the all_builds.txt index file. The format of this file is: |
| - mac/2011-02-16/75130 |
| - mac/2011-02-16/75218 |
| - mac/2011-02-16/75226 |
| - mac/2011-02-16/75234 |
| - mac/2011-02-16/75184 |
| - This function will return a list of DATE/REVISION strings for the platform |
| - specified by BUILD_ARCHIVE_TYPE. |
| - """ |
| - handle = urllib.urlopen(url) |
| - dirindex = handle.readlines() |
| - handle.close() |
| - |
| - # Only return values for the specified platform. Include the trailing slash to |
| - # not confuse linux and linux64. |
| - archtype = BUILD_ARCHIVE_TYPE + '/' |
| - dirindex = filter(lambda l: l.startswith(archtype), dirindex) |
| - |
| - # Remove the newline separator and the platform token. |
| - dirindex = map(lambda l: l[len(archtype):].strip(), dirindex) |
| - dirindex.sort() |
| - return dirindex |
| - |
| - |
| -def ParseIndexLine(iline): |
| - """Takes an index line returned by ParseDirectoryIndex() and returns a |
| - 2-tuple of (date, revision). |date| is a string and |revision| is an int.""" |
| - split = iline.split('/') |
| - assert(len(split) == 2) |
| - return (split[0], int(split[1])) |
| - |
| - |
| -def GetRevision(iline): |
| - """Takes an index line, parses it, and returns the revision.""" |
| - return ParseIndexLine(iline)[1] |
| - |
| - |
| -def GetRevList(good, bad): |
| - """Gets the list of revision numbers between |good| and |bad|.""" |
| - # Download the main revlist. |
| - revlist = ParseDirectoryIndex(BUILD_BASE_URL + BUILD_INDEX_FILE) |
| - revrange = range(good, bad) |
| - revlist = filter(lambda r: GetRevision(r) in revrange, revlist) |
| +def ParseDirectoryIndex(context): |
| + """Parses the Google Storage directory listing into a list of revision |
| + numbers. The range starts with context.good_revision and goes until the latest |
| + revision.""" |
| + def _FetchAndParse(url): |
| + """Fetches a URL and returns a 2-Tuple of ([revisions], next-marker). If |
| + next-marker is not None, then the listing is a partial listing and another |
| + fetch should be performed with next-marker being the marker= GET |
| + parameter.""" |
| + handle = urllib.urlopen(url) |
| + document = ElementTree.parse(handle) |
| + |
| + # All nodes in the tree are namespaced. Get the root's tag name to extract |
| + # the namespace. Etree does namespaces as |{namespace}tag|. |
| + root_tag = document.getroot().tag |
| + end_ns_pos = root_tag.find('}') |
| + if end_ns_pos == -1: |
| + raise Exception("Could not locate end namespace for directory index") |
| + namespace = root_tag[:end_ns_pos + 1] |
| + |
| + # Find the prefix (_listing_platform_dir) and whether or not the list is |
| + # truncated. |
| + prefix = document.find(namespace + 'Prefix').text |
| + next_marker = None |
| + is_truncated = document.find(namespace + 'IsTruncated') |
| + if is_truncated is not None and is_truncated.text.lower() == 'true': |
| + next_marker = document.find(namespace + 'NextMarker').text |
| + |
| + # Get a list of all the revisions. |
| + all_prefixes = document.findall(namespace + 'CommonPrefixes/' + |
| + namespace + 'Prefix') |
| + # The <Prefix> nodes have content of the form of |
| + # |_listing_platform_dir/revision/|. Strip off the platform dir and the |
| + # trailing slash to just have a number. |
| + revisions = map(lambda x: x.text[len(prefix):-1], all_prefixes) |
| + return (revisions, next_marker) |
| + |
| + # Set the marker to be the good revision, as bisecting before that is not |
| + # necessary. |
| + (revisions, next_marker) = _FetchAndParse( |
| + context.GetListingURL(context.good_revision)) |
|
nsylvain
2011/06/09 21:12:03
I'm not sure this works well. I don't think the o
Robert Sesek
2011/06/09 23:38:58
Ah, thanks. I didn't realize that; was just trying
|
| + # If the result list was truncated, refetch with the next marker. Do this |
| + # until an entire directory listing is done. |
| + while next_marker: |
| + (new_revisions, next_marker) = _FetchAndParse( |
| + context.GetListingURL(next_marker)) |
| + revisions.extend(new_revisions) |
| + |
| + return revisions |
| + |
| + |
| +def GetRevList(context): |
| + """Gets the list of revision numbers between |good_revision| and |
| + |bad_revision| of the |context|.""" |
| + # Download the revlist and filter for just the range between good and bad. |
| + rev_range = range(context.good_revision, context.bad_revision) |
| + revlist = map(int, ParseDirectoryIndex(context)) |
| + revlist = filter(lambda r: r in rev_range, revlist) |
| revlist.sort() |
| return revlist |
| -def TryRevision(iline, profile, args): |
| - """Downloads revision from |iline|, unzips it, and opens it for the user to |
| - test. |profile| is the profile to use.""" |
| +def TryRevision(context, rev, profile, args): |
| + """Downloads revision |rev|, unzips it, and opens it for the user to test. |
| + |profile| is the profile to use.""" |
| # Do this in a temp dir so we don't collide with user files. |
| cwd = os.getcwd() |
| tempdir = tempfile.mkdtemp(prefix='bisect_tmp') |
| os.chdir(tempdir) |
| # Download the file. |
| - download_url = BUILD_BASE_URL + BUILD_ARCHIVE_TYPE + \ |
| - (BUILD_ARCHIVE_URL % ParseIndexLine(iline)) + BUILD_ZIP_NAME |
| + download_url = context.GetDownloadURL(rev) |
| def _ReportHook(blocknum, blocksize, totalsize): |
| size = blocknum * blocksize |
| if totalsize == -1: # Total size not known. |
| @@ -182,7 +214,7 @@ def TryRevision(iline, profile, args): |
| sys.stdout.flush() |
| try: |
| print 'Fetching ' + download_url |
| - urllib.urlretrieve(download_url, BUILD_ZIP_NAME, _ReportHook) |
| + urllib.urlretrieve(download_url, context.archive_name, _ReportHook) |
| except Exception, e: |
| print('Could not retrieve the download. Sorry.') |
| @@ -190,13 +222,12 @@ def TryRevision(iline, profile, args): |
| # Unzip the file. |
| print 'Unzipping ...' |
| - UnzipFilenameToDir(BUILD_ZIP_NAME, os.curdir) |
| + UnzipFilenameToDir(context.archive_name, os.curdir) |
| # Tell the system to open the app. |
| args = ['--user-data-dir=%s' % profile] + args |
| flags = ' '.join(map(pipes.quote, args)) |
| - exe = os.path.join(os.getcwd(), BUILD_DIR_NAME, BUILD_EXE_NAME) |
| - cmd = '%s %s' % (exe, flags) |
| + cmd = '%s %s' % (context.GetLaunchPath(), flags) |
| print 'Running %s' % cmd |
| os.system(cmd) |
| @@ -208,14 +239,15 @@ def TryRevision(iline, profile, args): |
| pass |
| -def AskIsGoodBuild(iline): |
| - """Ask the user whether build from index line |iline| is good or bad.""" |
| +def AskIsGoodBuild(rev): |
| + """Ask the user whether build |rev| is good or bad.""" |
| # Loop until we get a response that we can parse. |
| while True: |
| - response = raw_input('\nBuild %d is [(g)ood/(b)ad]: ' % GetRevision(iline)) |
| + response = raw_input('\nBuild %d is [(g)ood/(b)ad]: ' % int(rev)) |
| if response and response in ('g', 'b'): |
| return response == 'g' |
| + |
| def main(): |
| usage = ('%prog [options] [-- chromium-options]\n' |
| 'Perform binary search on the snapshot builds.\n' |
| @@ -250,7 +282,8 @@ def main(): |
| parser.print_help() |
| return 1 |
| - SetArchiveVars(opts.archive) |
| + # Create the context. Initialize 0 for the revisions as they are set below. |
| + context = PathContext(opts.archive, 0, 0) |
| # Pick a starting point, try to get HEAD for this. |
| if opts.bad: |
| @@ -259,8 +292,7 @@ def main(): |
| bad_rev = 0 |
| try: |
| # Location of the latest build revision number |
| - BUILD_LATEST_URL = '%s/LATEST/REVISION' % (BUILD_BASE_URL) |
| - nh = urllib.urlopen(BUILD_LATEST_URL) |
| + nh = urllib.urlopen(context.GetLastChangeURL()) |
| latest = int(nh.read()) |
| nh.close() |
| bad_rev = raw_input('Bad revision [HEAD:%d]: ' % latest) |
| @@ -281,8 +313,12 @@ def main(): |
| except Exception, e: |
| pass |
| + # Set the input parameters now that they've been validated. |
| + context.good_revision = good_rev |
| + context.bad_revision = bad_rev |
| + |
| # Get a list of revisions to bisect across. |
| - revlist = GetRevList(good_rev, bad_rev) |
| + revlist = GetRevList(context) |
| if len(revlist) < 2: # Don't have enough builds to bisect |
| print 'We don\'t have enough builds to bisect. revlist: %s' % revlist |
| sys.exit(1) |
| @@ -304,7 +340,7 @@ def main(): |
| print('%d candidates. %d tries left.' % |
| (num_poss, round(math.log(num_poss, 2)))) |
| else: |
| - print('Candidates: %s' % map(GetRevision, revlist[good:bad])) |
| + print('Candidates: %s' % revlist[good:bad]) |
| # Cut the problem in half... |
| test = int((bad - good) / 2) + good |
| @@ -314,7 +350,7 @@ def main(): |
| profile = opts.profile |
| if not profile: |
| profile = 'profile' # In a temp dir. |
| - TryRevision(test_rev, profile, args) |
| + TryRevision(context, test_rev, profile, args) |
| if AskIsGoodBuild(test_rev): |
| last_known_good_rev = revlist[good] |
| good = test + 1 |
| @@ -322,12 +358,11 @@ def main(): |
| bad = test |
| # We're done. Let the user know the results in an official manner. |
| - bad_revision = GetRevision(revlist[bad]) |
| - print('You are probably looking for build %d.' % bad_revision) |
| + print('You are probably looking for build %d.' % revlist[bad]) |
| print('CHANGELOG URL:') |
| - print(CHANGELOG_URL % (GetRevision(last_known_good_rev), bad_revision)) |
| + print(CHANGELOG_URL % (last_known_good_rev, revlist[bad])) |
| print('Built at revision:') |
| - print(BUILD_VIEWVC_URL % bad_revision) |
| + print(BUILD_VIEWVC_URL % revlist[bad]) |
| if __name__ == '__main__': |
| sys.exit(main()) |