tools/bisect-builds.py - Issue 6995117: bisect-builds.py: Use Google Common Data Storage instead of build.chromium.org.

Unified Diff: tools/bisect-builds.py

Issue 6995117: bisect-builds.py: Use Google Common Data Storage instead of build.chromium.org. (Closed) Base URL: svn://svn.chromium.org/chrome/trunk/src

Patch Set: Created 9 years, 6 months ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View side-by-side diff with in-line comments

Download patch

Index: tools/bisect-builds.py

diff --git a/tools/bisect-builds.py b/tools/bisect-builds.py

index 4aa177279052db497244d634e8f26194a47b330e..d41c1c227ff427e14151671630a55625f00b5d71 100755

--- a/tools/bisect-builds.py

+++ b/tools/bisect-builds.py

@@ -12,33 +12,13 @@ unzipping, and opening Chromium for you. After testing the specific revision,

it will ask you whether it is good or bad before continuing the search.

"""

-# Base URL to download snapshots from.

-BUILD_BASE_URL = 'http://build.chromium.org/f/chromium/continuous/'

-# The index file that lists all the builds. This lives in BUILD_BASE_URL.

-BUILD_INDEX_FILE = 'all_builds.txt'

-# The type (platform) of the build archive. This is what's passed in to the

-# '-a/--archive' option.

-BUILD_ARCHIVE_TYPE = ''

-# The location of the builds. Format this with a (date, revision) tuple, which

-# can be obtained through ParseIndexLine().

-BUILD_ARCHIVE_URL = '/%s/%d/'

-# Name of the build archive.

-BUILD_ZIP_NAME = ''

-# Directory name inside the archive.

-BUILD_DIR_NAME = ''

-# Name of the executable.

-BUILD_EXE_NAME = ''

+# The root URL for storage.

+BASE_URL = 'http://commondatastorage.googleapis.com/chromium-browser-continuous'

# URL to the ViewVC commit page.

BUILD_VIEWVC_URL = 'http://src.chromium.org/viewvc/chrome?view=rev&revision=%d'

-# Changelogs URL

+# Changelogs URL.

CHANGELOG_URL = 'http://build.chromium.org/f/chromium/' \

'perf/dashboard/ui/changelog.html?url=/trunk/src&range=%d:%d'

@@ -53,8 +33,71 @@ import shutil

import sys

import tempfile

import urllib

+from xml.etree import ElementTree

import zipfile

+class PathContext(object):

+ """A PathContext is used to carry the information used to construct URLs and

+ paths when dealing with the storage server and archives."""

+ def __init__(self, platform, good_revision, bad_revision):

+ super(PathContext, self).__init__()

+ # Store off the input parameters.

+ self.platform = platform # What's passed in to the '-a/--archive' option.

+ self.good_revision = good_revision

+ self.bad_revision = bad_revision

+ # The name of the ZIP file in a revision directory on the server.

+ self.archive_name = None

+ # Set some internal members:

+ # _listing_platform_dir = Directory that holds revisions. Ends with a '/'.

+ # _archive_extract_dir = Uncompressed directory in the archive_name file.

+ # _binary_name = The name of the executable to run.

+ if self.platform == 'linux' or self.platform == 'linux-64':

+ self._listing_platform_dir = 'Linux/'

+ self.archive_name = 'chrome-linux.zip'

+ self._archive_extract_dir = 'chrome-linux'

+ self._binary_name = 'chrome'

+ # Linux and x64 share all the same path data except for the archive dir.

+ if self.platform == 'linux-64':

+ self._listing_platform_dir = 'Linux_x64/'

+ elif self.platform == 'mac':

+ self._listing_platform_dir = 'Mac/'

+ self.archive_name = 'chrome-mac.zip'

+ self._archive_extract_dir = 'chrome-mac'

+ self._binary_name = 'Chromium.app/Contents/MacOS/Chromium'

+ elif self.platform == 'win':

+ self._listing_platform_dir = 'Win/'

+ self.archive_name = 'chrome-win32.zip'

+ self._archive_extract_dir = 'chrome-win32'

+ self._binary_name = 'chrome.exe'

+ else:

+ raise Exception("Invalid platform")

+ def GetListingURL(self, revision_offset=None):

+ """Returns the URL for a directory listing, with an optional starting

+ revision."""

+ marker = ''

+ if revision_offset:

+ marker = '&marker=' + self._listing_platform_dir + \

+ str(revision_offset) + '/'

+ return BASE_URL + '/?delimiter=/&prefix=' + self._listing_platform_dir + \

+ marker

+ def GetDownloadURL(self, revision):

+ """Gets the download URL for a build archive of a specific revision."""

+ return BASE_URL + '/' + self._listing_platform_dir + str(revision) + '/' + \

+ self.archive_name

+ def GetLastChangeURL(self):

+ """Returns a URL to the LAST_CHANGE file."""

+ return BASE_URL + '/' + self._listing_platform_dir + 'LAST_CHANGE'

+ def GetLaunchPath(self):

+ """Returns a relative path (presumably from the archive extraction location)

+ that is used to run the executable."""

+ return os.path.join(self._archive_extract_dir, self._binary_name)

def UnzipFilenameToDir(filename, dir):

"""Unzip |filename| to directory |dir|."""

@@ -86,89 +129,78 @@ def UnzipFilenameToDir(filename, dir):

sys.exit(1)

-def SetArchiveVars(archive):

- """Set a bunch of global variables appropriate for the specified archive."""

- global BUILD_ARCHIVE_TYPE

- global BUILD_ZIP_NAME

- global BUILD_DIR_NAME

- global BUILD_EXE_NAME

- global BUILD_BASE_URL

- BUILD_ARCHIVE_TYPE = archive

- if BUILD_ARCHIVE_TYPE in ('linux', 'linux64', 'linux-chromiumos'):

- BUILD_ZIP_NAME = 'chrome-linux.zip'

- BUILD_DIR_NAME = 'chrome-linux'

- BUILD_EXE_NAME = 'chrome'

- elif BUILD_ARCHIVE_TYPE in ('mac'):

- BUILD_ZIP_NAME = 'chrome-mac.zip'

- BUILD_DIR_NAME = 'chrome-mac'

- BUILD_EXE_NAME = 'Chromium.app/Contents/MacOS/Chromium'

- elif BUILD_ARCHIVE_TYPE in ('win'):

- BUILD_ZIP_NAME = 'chrome-win32.zip'

- BUILD_DIR_NAME = 'chrome-win32'

- BUILD_EXE_NAME = 'chrome.exe'

-def ParseDirectoryIndex(url):

- """Parses the all_builds.txt index file. The format of this file is:

- mac/2011-02-16/75130

- mac/2011-02-16/75218

- mac/2011-02-16/75226

- mac/2011-02-16/75234

- mac/2011-02-16/75184

- This function will return a list of DATE/REVISION strings for the platform

- specified by BUILD_ARCHIVE_TYPE.

- """

- handle = urllib.urlopen(url)

- dirindex = handle.readlines()

- handle.close()

- # Only return values for the specified platform. Include the trailing slash to

- # not confuse linux and linux64.

- archtype = BUILD_ARCHIVE_TYPE + '/'

- dirindex = filter(lambda l: l.startswith(archtype), dirindex)

- # Remove the newline separator and the platform token.

- dirindex = map(lambda l: l[len(archtype):].strip(), dirindex)

- dirindex.sort()

- return dirindex

-def ParseIndexLine(iline):

- """Takes an index line returned by ParseDirectoryIndex() and returns a

- 2-tuple of (date, revision). |date| is a string and |revision| is an int."""

- split = iline.split('/')

- assert(len(split) == 2)

- return (split[0], int(split[1]))

-def GetRevision(iline):

- """Takes an index line, parses it, and returns the revision."""

- return ParseIndexLine(iline)[1]

-def GetRevList(good, bad):

- """Gets the list of revision numbers between |good| and |bad|."""

- # Download the main revlist.

- revlist = ParseDirectoryIndex(BUILD_BASE_URL + BUILD_INDEX_FILE)

- revrange = range(good, bad)

- revlist = filter(lambda r: GetRevision(r) in revrange, revlist)

+def ParseDirectoryIndex(context):

+ """Parses the Google Storage directory listing into a list of revision

+ numbers. The range starts with context.good_revision and goes until the latest

+ revision."""

+ def _FetchAndParse(url):

+ """Fetches a URL and returns a 2-Tuple of ([revisions], next-marker). If

+ next-marker is not None, then the listing is a partial listing and another

+ fetch should be performed with next-marker being the marker= GET

+ parameter."""

+ handle = urllib.urlopen(url)

+ document = ElementTree.parse(handle)

+ # All nodes in the tree are namespaced. Get the root's tag name to extract

+ # the namespace. Etree does namespaces as |{namespace}tag|.

+ root_tag = document.getroot().tag

+ end_ns_pos = root_tag.find('}')

+ if end_ns_pos == -1:

+ raise Exception("Could not locate end namespace for directory index")

+ namespace = root_tag[:end_ns_pos + 1]

+ # Find the prefix (_listing_platform_dir) and whether or not the list is

+ # truncated.

+ prefix = document.find(namespace + 'Prefix').text

+ next_marker = None

+ is_truncated = document.find(namespace + 'IsTruncated')

+ if is_truncated is not None and is_truncated.text.lower() == 'true':

+ next_marker = document.find(namespace + 'NextMarker').text

+ # Get a list of all the revisions.

+ all_prefixes = document.findall(namespace + 'CommonPrefixes/' +

+ namespace + 'Prefix')

+ # The <Prefix> nodes have content of the form of

+ # |_listing_platform_dir/revision/|. Strip off the platform dir and the

+ # trailing slash to just have a number.

+ revisions = map(lambda x: x.text[len(prefix):-1], all_prefixes)

+ return (revisions, next_marker)

+ # Set the marker to be the good revision, as bisecting before that is not

+ # necessary.

+ (revisions, next_marker) = _FetchAndParse(

+ context.GetListingURL(context.good_revision))

nsylvain 2011/06/09 21:12:03 I'm not sure this works well. I don't think the o

Robert Sesek 2011/06/09 23:38:58 Ah, thanks. I didn't realize that; was just trying

+ # If the result list was truncated, refetch with the next marker. Do this

+ # until an entire directory listing is done.

+ while next_marker:

+ (new_revisions, next_marker) = _FetchAndParse(

+ context.GetListingURL(next_marker))

+ revisions.extend(new_revisions)

+ return revisions

+def GetRevList(context):

+ """Gets the list of revision numbers between |good_revision| and

+ |bad_revision| of the |context|."""

+ # Download the revlist and filter for just the range between good and bad.

+ rev_range = range(context.good_revision, context.bad_revision)

+ revlist = map(int, ParseDirectoryIndex(context))

+ revlist = filter(lambda r: r in rev_range, revlist)

revlist.sort()

return revlist

-def TryRevision(iline, profile, args):

- """Downloads revision from |iline|, unzips it, and opens it for the user to

- test. |profile| is the profile to use."""

+def TryRevision(context, rev, profile, args):

+ """Downloads revision |rev|, unzips it, and opens it for the user to test.

+ |profile| is the profile to use."""

# Do this in a temp dir so we don't collide with user files.

cwd = os.getcwd()

tempdir = tempfile.mkdtemp(prefix='bisect_tmp')

os.chdir(tempdir)

# Download the file.

- download_url = BUILD_BASE_URL + BUILD_ARCHIVE_TYPE + \

- (BUILD_ARCHIVE_URL % ParseIndexLine(iline)) + BUILD_ZIP_NAME

+ download_url = context.GetDownloadURL(rev)

def _ReportHook(blocknum, blocksize, totalsize):

size = blocknum * blocksize

if totalsize == -1: # Total size not known.

@@ -182,7 +214,7 @@ def TryRevision(iline, profile, args):

sys.stdout.flush()

try:

print 'Fetching ' + download_url

- urllib.urlretrieve(download_url, BUILD_ZIP_NAME, _ReportHook)

+ urllib.urlretrieve(download_url, context.archive_name, _ReportHook)

except Exception, e:

print('Could not retrieve the download. Sorry.')

@@ -190,13 +222,12 @@ def TryRevision(iline, profile, args):

# Unzip the file.

print 'Unzipping ...'

- UnzipFilenameToDir(BUILD_ZIP_NAME, os.curdir)

+ UnzipFilenameToDir(context.archive_name, os.curdir)

# Tell the system to open the app.

args = ['--user-data-dir=%s' % profile] + args

flags = ' '.join(map(pipes.quote, args))

- exe = os.path.join(os.getcwd(), BUILD_DIR_NAME, BUILD_EXE_NAME)

- cmd = '%s %s' % (exe, flags)

+ cmd = '%s %s' % (context.GetLaunchPath(), flags)

print 'Running %s' % cmd

os.system(cmd)

@@ -208,14 +239,15 @@ def TryRevision(iline, profile, args):

pass

-def AskIsGoodBuild(iline):

- """Ask the user whether build from index line |iline| is good or bad."""

+def AskIsGoodBuild(rev):

+ """Ask the user whether build |rev| is good or bad."""

# Loop until we get a response that we can parse.

while True:

- response = raw_input('\nBuild %d is [(g)ood/(b)ad]: ' % GetRevision(iline))

+ response = raw_input('\nBuild %d is [(g)ood/(b)ad]: ' % int(rev))

if response and response in ('g', 'b'):

return response == 'g'

def main():

usage = ('%prog [options] [-- chromium-options]\n'

'Perform binary search on the snapshot builds.\n'

@@ -250,7 +282,8 @@ def main():

parser.print_help()

return 1

- SetArchiveVars(opts.archive)

+ # Create the context. Initialize 0 for the revisions as they are set below.

+ context = PathContext(opts.archive, 0, 0)

# Pick a starting point, try to get HEAD for this.

if opts.bad:

@@ -259,8 +292,7 @@ def main():

bad_rev = 0

try:

# Location of the latest build revision number

- BUILD_LATEST_URL = '%s/LATEST/REVISION' % (BUILD_BASE_URL)

- nh = urllib.urlopen(BUILD_LATEST_URL)

+ nh = urllib.urlopen(context.GetLastChangeURL())

latest = int(nh.read())

nh.close()

bad_rev = raw_input('Bad revision [HEAD:%d]: ' % latest)

@@ -281,8 +313,12 @@ def main():

except Exception, e:

pass

+ # Set the input parameters now that they've been validated.

+ context.good_revision = good_rev

+ context.bad_revision = bad_rev

# Get a list of revisions to bisect across.

- revlist = GetRevList(good_rev, bad_rev)

+ revlist = GetRevList(context)

if len(revlist) < 2: # Don't have enough builds to bisect

print 'We don\'t have enough builds to bisect. revlist: %s' % revlist

sys.exit(1)

@@ -304,7 +340,7 @@ def main():

print('%d candidates. %d tries left.' %

(num_poss, round(math.log(num_poss, 2))))

else:

- print('Candidates: %s' % map(GetRevision, revlist[good:bad]))

+ print('Candidates: %s' % revlist[good:bad])

# Cut the problem in half...

test = int((bad - good) / 2) + good

@@ -314,7 +350,7 @@ def main():

profile = opts.profile

if not profile:

profile = 'profile' # In a temp dir.

- TryRevision(test_rev, profile, args)

+ TryRevision(context, test_rev, profile, args)

if AskIsGoodBuild(test_rev):

last_known_good_rev = revlist[good]

good = test + 1

@@ -322,12 +358,11 @@ def main():

bad = test

# We're done. Let the user know the results in an official manner.

- bad_revision = GetRevision(revlist[bad])

- print('You are probably looking for build %d.' % bad_revision)

+ print('You are probably looking for build %d.' % revlist[bad])

print('CHANGELOG URL:')

- print(CHANGELOG_URL % (GetRevision(last_known_good_rev), bad_revision))

+ print(CHANGELOG_URL % (last_known_good_rev, revlist[bad]))

print('Built at revision:')

- print(BUILD_VIEWVC_URL % bad_revision)

+ print(BUILD_VIEWVC_URL % revlist[bad])

if __name__ == '__main__':

sys.exit(main())

« no previous file with comments | « no previous file | no next file » | no next file with comments »