summary | refs | log | tree | commit | diff | stats
path: root/tools/bisect-builds.py
diff options
context:
space:
mode:
author: rsesek@chromium.org <rsesek@chromium.org@0039d316-1c4b-4281-b951-d872f2087c98> 2011-06-10 13:06:22 +0000
committer: rsesek@chromium.org <rsesek@chromium.org@0039d316-1c4b-4281-b951-d872f2087c98> 2011-06-10 13:06:22 +0000
commit: 183706d96a9ccedeb0c442e272f0f71db2978bcc (patch)
tree: e96ea01f816c59ab1e475a850ab78852a257073a /tools/bisect-builds.py
parent: a1d266f3291a4ae75be8f89a1f3681a28ebaca4d (diff)
download: chromium_src-183706d96a9ccedeb0c442e272f0f71db2978bcc.zip
chromium_src-183706d96a9ccedeb0c442e272f0f71db2978bcc.tar.gz
chromium_src-183706d96a9ccedeb0c442e272f0f71db2978bcc.tar.bz2
bisect-builds.py: Use Google Common Data Storage instead of build.chromium.org.
The continuous archive's index file appears to be incomplete/problematic for some platforms and revision ranges, so go back to just using directory lists via the CDS API. This also cleans up the code by using a PathContext object rather than a slew of global variables to format/create the various URLs.

BUG=85498
TEST=See bug.
Review URL: http://codereview.chromium.org/6995117

git-svn-id: svn://svn.chromium.org/chrome/trunk/src@88658 0039d316-1c4b-4281-b951-d872f2087c98
Diffstat (limited to 'tools/bisect-builds.py')
-rwxr-xr-x tools/bisect-builds.py 257
1 files changed, 144 insertions, 113 deletions
diff --git a/tools/bisect-builds.py b/tools/bisect-builds.py
index 4aa1772..d9c0569 100755
--- a/tools/bisect-builds.py
+++ b/tools/bisect-builds.py
@@ -12,33 +12,13 @@ unzipping, and opening Chromium for you. After testing the specific revision,
it will ask you whether it is good or bad before continuing the search.
"""
-# Base URL to download snapshots from.
-BUILD_BASE_URL = 'http://build.chromium.org/f/chromium/continuous/'
-
-# The index file that lists all the builds. This lives in BUILD_BASE_URL.
-BUILD_INDEX_FILE = 'all_builds.txt'
-
-# The type (platform) of the build archive. This is what's passed in to the
-# '-a/--archive' option.
-BUILD_ARCHIVE_TYPE = ''
-
-# The location of the builds. Format this with a (date, revision) tuple, which
-# can be obtained through ParseIndexLine().
-BUILD_ARCHIVE_URL = '/%s/%d/'
-
-# Name of the build archive.
-BUILD_ZIP_NAME = ''
-
-# Directory name inside the archive.
-BUILD_DIR_NAME = ''
-
-# Name of the executable.
-BUILD_EXE_NAME = ''
+# The root URL for storage.
+BASE_URL = 'http://commondatastorage.googleapis.com/chromium-browser-continuous'
# URL to the ViewVC commit page.
BUILD_VIEWVC_URL = 'http://src.chromium.org/viewvc/chrome?view=rev&revision=%d'
-# Changelogs URL
+# Changelogs URL.
CHANGELOG_URL = 'http://build.chromium.org/f/chromium/' \
'perf/dashboard/ui/changelog.html?url=/trunk/src&range=%d:%d'
@@ -53,8 +33,69 @@ import shutil
import sys
import tempfile
import urllib
+from xml.etree import ElementTree
import zipfile
+class PathContext(object):
+ """A PathContext is used to carry the information used to construct URLs and
+ paths when dealing with the storage server and archives."""
+ def __init__(self, platform, good_revision, bad_revision):
+ super(PathContext, self).__init__()
+ # Store off the input parameters.
+ self.platform = platform # What's passed in to the '-a/--archive' option.
+ self.good_revision = good_revision
+ self.bad_revision = bad_revision
+
+ # The name of the ZIP file in a revision directory on the server.
+ self.archive_name = None
+
+ # Set some internal members:
+ # _listing_platform_dir = Directory that holds revisions. Ends with a '/'.
+ # _archive_extract_dir = Uncompressed directory in the archive_name file.
+ # _binary_name = The name of the executable to run.
+ if self.platform == 'linux' or self.platform == 'linux-64':
+ self._listing_platform_dir = 'Linux/'
+ self.archive_name = 'chrome-linux.zip'
+ self._archive_extract_dir = 'chrome-linux'
+ self._binary_name = 'chrome'
+ # Linux and x64 share all the same path data except for the archive dir.
+ if self.platform == 'linux-64':
+ self._listing_platform_dir = 'Linux_x64/'
+ elif self.platform == 'mac':
+ self._listing_platform_dir = 'Mac/'
+ self.archive_name = 'chrome-mac.zip'
+ self._archive_extract_dir = 'chrome-mac'
+ self._binary_name = 'Chromium.app/Contents/MacOS/Chromium'
+ elif self.platform == 'win':
+ self._listing_platform_dir = 'Win/'
+ self.archive_name = 'chrome-win32.zip'
+ self._archive_extract_dir = 'chrome-win32'
+ self._binary_name = 'chrome.exe'
+ else:
+ raise Exception("Invalid platform")
+
+ def GetListingURL(self, marker=None):
+ """Returns the URL for a directory listing, with an optional marker."""
+ marker_param = ''
+ if marker:
+ marker_param = '&marker=' + str(marker)
+ return BASE_URL + '/?delimiter=/&prefix=' + self._listing_platform_dir + \
+ marker_param
+
+ def GetDownloadURL(self, revision):
+ """Gets the download URL for a build archive of a specific revision."""
+ return BASE_URL + '/' + self._listing_platform_dir + str(revision) + '/' + \
+ self.archive_name
+
+ def GetLastChangeURL(self):
+ """Returns a URL to the LAST_CHANGE file."""
+ return BASE_URL + '/' + self._listing_platform_dir + 'LAST_CHANGE'
+
+ def GetLaunchPath(self):
+ """Returns a relative path (presumably from the archive extraction location)
+ that is used to run the executable."""
+ return os.path.join(self._archive_extract_dir, self._binary_name)
+
def UnzipFilenameToDir(filename, dir):
"""Unzip |filename| to directory |dir|."""
@@ -86,89 +127,76 @@ def UnzipFilenameToDir(filename, dir):
sys.exit(1)
-def SetArchiveVars(archive):
- """Set a bunch of global variables appropriate for the specified archive."""
- global BUILD_ARCHIVE_TYPE
- global BUILD_ZIP_NAME
- global BUILD_DIR_NAME
- global BUILD_EXE_NAME
- global BUILD_BASE_URL
-
- BUILD_ARCHIVE_TYPE = archive
-
- if BUILD_ARCHIVE_TYPE in ('linux', 'linux64', 'linux-chromiumos'):
- BUILD_ZIP_NAME = 'chrome-linux.zip'
- BUILD_DIR_NAME = 'chrome-linux'
- BUILD_EXE_NAME = 'chrome'
- elif BUILD_ARCHIVE_TYPE in ('mac'):
- BUILD_ZIP_NAME = 'chrome-mac.zip'
- BUILD_DIR_NAME = 'chrome-mac'
- BUILD_EXE_NAME = 'Chromium.app/Contents/MacOS/Chromium'
- elif BUILD_ARCHIVE_TYPE in ('win'):
- BUILD_ZIP_NAME = 'chrome-win32.zip'
- BUILD_DIR_NAME = 'chrome-win32'
- BUILD_EXE_NAME = 'chrome.exe'
-
-
-def ParseDirectoryIndex(url):
- """Parses the all_builds.txt index file. The format of this file is:
- mac/2011-02-16/75130
- mac/2011-02-16/75218
- mac/2011-02-16/75226
- mac/2011-02-16/75234
- mac/2011-02-16/75184
- This function will return a list of DATE/REVISION strings for the platform
- specified by BUILD_ARCHIVE_TYPE.
- """
- handle = urllib.urlopen(url)
- dirindex = handle.readlines()
- handle.close()
-
- # Only return values for the specified platform. Include the trailing slash to
- # not confuse linux and linux64.
- archtype = BUILD_ARCHIVE_TYPE + '/'
- dirindex = filter(lambda l: l.startswith(archtype), dirindex)
-
- # Remove the newline separator and the platform token.
- dirindex = map(lambda l: l[len(archtype):].strip(), dirindex)
- dirindex.sort()
- return dirindex
-
-
-def ParseIndexLine(iline):
- """Takes an index line returned by ParseDirectoryIndex() and returns a
- 2-tuple of (date, revision). |date| is a string and |revision| is an int."""
- split = iline.split('/')
- assert(len(split) == 2)
- return (split[0], int(split[1]))
-
-
-def GetRevision(iline):
- """Takes an index line, parses it, and returns the revision."""
- return ParseIndexLine(iline)[1]
-
-
-def GetRevList(good, bad):
- """Gets the list of revision numbers between |good| and |bad|."""
- # Download the main revlist.
- revlist = ParseDirectoryIndex(BUILD_BASE_URL + BUILD_INDEX_FILE)
- revrange = range(good, bad)
- revlist = filter(lambda r: GetRevision(r) in revrange, revlist)
+def ParseDirectoryIndex(context):
+ """Parses the Google Storage directory listing into a list of revision
+ numbers. The range starts with context.good_revision and goes until the latest
+ revision."""
+ def _FetchAndParse(url):
+ """Fetches a URL and returns a 2-Tuple of ([revisions], next-marker). If
+ next-marker is not None, then the listing is a partial listing and another
+ fetch should be performed with next-marker being the marker= GET
+ parameter."""
+ handle = urllib.urlopen(url)
+ document = ElementTree.parse(handle)
+
+ # All nodes in the tree are namespaced. Get the root's tag name to extract
+ # the namespace. Etree does namespaces as |{namespace}tag|.
+ root_tag = document.getroot().tag
+ end_ns_pos = root_tag.find('}')
+ if end_ns_pos == -1:
+ raise Exception("Could not locate end namespace for directory index")
+ namespace = root_tag[:end_ns_pos + 1]
+
+ # Find the prefix (_listing_platform_dir) and whether or not the list is
+ # truncated.
+ prefix = document.find(namespace + 'Prefix').text
+ next_marker = None
+ is_truncated = document.find(namespace + 'IsTruncated')
+ if is_truncated is not None and is_truncated.text.lower() == 'true':
+ next_marker = document.find(namespace + 'NextMarker').text
+
+ # Get a list of all the revisions.
+ all_prefixes = document.findall(namespace + 'CommonPrefixes/' +
+ namespace + 'Prefix')
+ # The <Prefix> nodes have content of the form of
+ # |_listing_platform_dir/revision/|. Strip off the platform dir and the
+ # trailing slash to just have a number.
+ revisions = map(lambda x: x.text[len(prefix):-1], all_prefixes)
+ return (revisions, next_marker)
+
+ # Fetch the first list of revisions.
+ (revisions, next_marker) = _FetchAndParse(context.GetListingURL())
+ # If the result list was truncated, refetch with the next marker. Do this
+ # until an entire directory listing is done.
+ while next_marker:
+ (new_revisions, next_marker) = _FetchAndParse(
+ context.GetListingURL(next_marker))
+ revisions.extend(new_revisions)
+
+ return revisions
+
+
+def GetRevList(context):
+ """Gets the list of revision numbers between |good_revision| and
+ |bad_revision| of the |context|."""
+ # Download the revlist and filter for just the range between good and bad.
+ rev_range = range(context.good_revision, context.bad_revision)
+ revlist = map(int, ParseDirectoryIndex(context))
+ revlist = filter(lambda r: r in rev_range, revlist)
revlist.sort()
return revlist
-def TryRevision(iline, profile, args):
- """Downloads revision from |iline|, unzips it, and opens it for the user to
- test. |profile| is the profile to use."""
+def TryRevision(context, rev, profile, args):
+ """Downloads revision |rev|, unzips it, and opens it for the user to test.
+ |profile| is the profile to use."""
# Do this in a temp dir so we don't collide with user files.
cwd = os.getcwd()
tempdir = tempfile.mkdtemp(prefix='bisect_tmp')
os.chdir(tempdir)
# Download the file.
- download_url = BUILD_BASE_URL + BUILD_ARCHIVE_TYPE + \
- (BUILD_ARCHIVE_URL % ParseIndexLine(iline)) + BUILD_ZIP_NAME
+ download_url = context.GetDownloadURL(rev)
def _ReportHook(blocknum, blocksize, totalsize):
size = blocknum * blocksize
if totalsize == -1: # Total size not known.
@@ -182,7 +210,7 @@ def TryRevision(iline, profile, args):
sys.stdout.flush()
try:
print 'Fetching ' + download_url
- urllib.urlretrieve(download_url, BUILD_ZIP_NAME, _ReportHook)
+ urllib.urlretrieve(download_url, context.archive_name, _ReportHook)
print
except Exception, e:
print('Could not retrieve the download. Sorry.')
@@ -190,13 +218,12 @@ def TryRevision(iline, profile, args):
# Unzip the file.
print 'Unzipping ...'
- UnzipFilenameToDir(BUILD_ZIP_NAME, os.curdir)
+ UnzipFilenameToDir(context.archive_name, os.curdir)
# Tell the system to open the app.
args = ['--user-data-dir=%s' % profile] + args
flags = ' '.join(map(pipes.quote, args))
- exe = os.path.join(os.getcwd(), BUILD_DIR_NAME, BUILD_EXE_NAME)
- cmd = '%s %s' % (exe, flags)
+ cmd = '%s %s' % (context.GetLaunchPath(), flags)
print 'Running %s' % cmd
os.system(cmd)
@@ -208,14 +235,15 @@ def TryRevision(iline, profile, args):
pass
-def AskIsGoodBuild(iline):
- """Ask the user whether build from index line |iline| is good or bad."""
+def AskIsGoodBuild(rev):
+ """Ask the user whether build |rev| is good or bad."""
# Loop until we get a response that we can parse.
while True:
- response = raw_input('\nBuild %d is [(g)ood/(b)ad]: ' % GetRevision(iline))
+ response = raw_input('\nBuild %d is [(g)ood/(b)ad]: ' % int(rev))
if response and response in ('g', 'b'):
return response == 'g'
+
def main():
usage = ('%prog [options] [-- chromium-options]\n'
'Perform binary search on the snapshot builds.\n'
@@ -250,7 +278,8 @@ def main():
parser.print_help()
return 1
- SetArchiveVars(opts.archive)
+ # Create the context. Initialize 0 for the revisions as they are set below.
+ context = PathContext(opts.archive, 0, 0)
# Pick a starting point, try to get HEAD for this.
if opts.bad:
@@ -259,8 +288,7 @@ def main():
bad_rev = 0
try:
# Location of the latest build revision number
- BUILD_LATEST_URL = '%s/LATEST/REVISION' % (BUILD_BASE_URL)
- nh = urllib.urlopen(BUILD_LATEST_URL)
+ nh = urllib.urlopen(context.GetLastChangeURL())
latest = int(nh.read())
nh.close()
bad_rev = raw_input('Bad revision [HEAD:%d]: ' % latest)
@@ -281,8 +309,12 @@ def main():
except Exception, e:
pass
+ # Set the input parameters now that they've been validated.
+ context.good_revision = good_rev
+ context.bad_revision = bad_rev
+
# Get a list of revisions to bisect across.
- revlist = GetRevList(good_rev, bad_rev)
+ revlist = GetRevList(context)
if len(revlist) < 2: # Don't have enough builds to bisect
print 'We don\'t have enough builds to bisect. revlist: %s' % revlist
sys.exit(1)
@@ -304,7 +336,7 @@ def main():
print('%d candidates. %d tries left.' %
(num_poss, round(math.log(num_poss, 2))))
else:
- print('Candidates: %s' % map(GetRevision, revlist[good:bad]))
+ print('Candidates: %s' % revlist[good:bad])
# Cut the problem in half...
test = int((bad - good) / 2) + good
@@ -314,7 +346,7 @@ def main():
profile = opts.profile
if not profile:
profile = 'profile' # In a temp dir.
- TryRevision(test_rev, profile, args)
+ TryRevision(context, test_rev, profile, args)
if AskIsGoodBuild(test_rev):
last_known_good_rev = revlist[good]
good = test + 1
@@ -322,12 +354,11 @@ def main():
bad = test
# We're done. Let the user know the results in an official manner.
- bad_revision = GetRevision(revlist[bad])
- print('You are probably looking for build %d.' % bad_revision)
+ print('You are probably looking for build %d.' % revlist[bad])
print('CHANGELOG URL:')
- print(CHANGELOG_URL % (GetRevision(last_known_good_rev), bad_revision))
+ print(CHANGELOG_URL % (last_known_good_rev, revlist[bad]))
print('Built at revision:')
- print(BUILD_VIEWVC_URL % bad_revision)
+ print(BUILD_VIEWVC_URL % revlist[bad])
if __name__ == '__main__':
sys.exit(main())