| Index: git_cache.py
|
| diff --git a/git_cache.py b/git_cache.py
|
| new file mode 100755
|
| index 0000000000000000000000000000000000000000..77463a6013780b98e6e63b91bb082a1b6947a7a3
|
| --- /dev/null
|
| +++ b/git_cache.py
|
| @@ -0,0 +1,303 @@
|
| +#!/usr/bin/env python
|
| +# Copyright 2014 The Chromium Authors. All rights reserved.
|
| +# Use of this source code is governed by a BSD-style license that can be
|
| +# found in the LICENSE file.
|
| +
|
| +"""A git command for managing a local cache of git repositories."""
|
| +
|
| +import errno
|
| +import logging
|
| +import optparse
|
| +import os
|
| +import tempfile
|
| +import subprocess
|
| +import sys
|
| +import urlparse
|
| +
|
| +import gclient_utils
|
| +import subcommand
|
| +
|
| +
|
# Name of the git executable to spawn: 'git.bat' when sys.platform starts with
# 'win', plain 'git' on every other platform.
if sys.platform.startswith('win'):
  GIT_EXECUTABLE = 'git.bat'
else:
  GIT_EXECUTABLE = 'git'
|
| +
|
| +
|
def NormalizeUrl(url):
  """Convert a git url to a normalized form.

  The result always uses the https scheme, keeps the host and path of |url|
  and always ends in '.git'. Everything else in |url| (original scheme,
  params, query, fragment) is discarded.

  Trailing slashes on the path are stripped before the suffix check, so
  'https://host/repo/' becomes 'https://host/repo.git' instead of
  'https://host/repo/.git'.

  Args:
    url: The repository url to normalize.

  Returns:
    The normalized url as a string.
  """
  parsed = urlparse.urlparse(url)
  norm_url = 'https://' + parsed.netloc + parsed.path.rstrip('/')
  if not norm_url.endswith('.git'):
    norm_url += '.git'
  return norm_url
|
| +
|
| +
|
def UrlToCacheDir(url):
  """Map a git url onto the flat directory name used inside the cache.

  The name is built from the host and path of |url| with a trailing '.git'
  removed. Existing dashes are doubled, path separators become single
  dashes, and the result is lower-cased.

  Args:
    url: The repository url.

  Returns:
    The directory name (not a full path) as a string.
  """
  pieces = urlparse.urlparse(url)
  name = pieces.netloc + pieces.path
  suffix = '.git'
  if name.endswith(suffix):
    name = name[:len(name) - len(suffix)]
  # Double the real dashes first so they stay distinguishable from the
  # dashes that replace '/' below.
  escaped = name.replace('-', '--')
  return escaped.replace('/', '-').lower()
|
| +
|
| +
|
def RunGit(cmd, **kwargs):
  """Run a git command through gclient_utils.CheckCallAndFilter.

  Args:
    cmd: List of git arguments (everything after the executable name).
    **kwargs: Forwarded to gclient_utils.CheckCallAndFilter. The keys read or
        defaulted here are 'cwd' (defaults to the current directory),
        'filter_fn', 'print_stdout', 'env' and 'stdout'.
  """
  kwargs.setdefault('cwd', os.getcwd())
  line_filter = kwargs.get('filter_fn')
  if not line_filter:
    kwargs.setdefault('print_stdout', True)
  else:
    kwargs['filter_fn'] = gclient_utils.GitFilter(line_filter)
    kwargs.setdefault('print_stdout', False)
    # Reuse a caller-supplied environment, otherwise install a copy of ours.
    git_env = kwargs.get('env') or kwargs.setdefault('env', os.environ.copy())
    # NOTE(review): pointing the askpass helpers at 'true' presumably keeps
    # git/ssh from blocking on an interactive credential prompt -- confirm.
    git_env.setdefault('GIT_ASKPASS', 'true')
    git_env.setdefault('SSH_ASKPASS', 'true')

  out = kwargs.get('stdout', sys.stdout)
  banner = 'running "git %s" in "%s"' % (' '.join(cmd), kwargs['cwd'])
  print >> out, banner
  gclient_utils.CheckCallAndFilter([GIT_EXECUTABLE] + cmd, **kwargs)
|
| +
|
| +
|
class LockError(Exception):
  """Raised when a lockfile cannot be acquired or released."""
|
| +
|
| +
|
class Lockfile(object):
  """Class to represent a cross-platform process-specific lockfile.

  The lock for |path| is a sibling file named |path| + '.lock' that contains
  the pid of the process holding it. Instances work as context managers:
  entering acquires the lock, exiting releases it.
  """

  def __init__(self, path):
    """Prepare (but do not acquire) the lock for |path|.

    Args:
      path: The file or directory to guard; it is converted to an absolute
          path.
    """
    self.path = os.path.abspath(path)
    self.lockfile = self.path + ".lock"
    self.pid = os.getpid()

  def _read_pid(self):
    """Read the pid stored in the lockfile.

    Note: This method is potentially racy. By the time it returns the lockfile
    may have been unlocked, removed, or stolen by some other process.

    Returns:
      The pid as an int, or None if the lockfile cannot be read or its first
      line is not an integer.
    """
    try:
      with open(self.lockfile, 'r') as f:
        pid = int(f.readline().strip())
    except (IOError, ValueError):
      pid = None
    return pid

  def _make_lockfile(self):
    """Safely creates a lockfile containing the current pid.

    Raises:
      OSError: If the lockfile cannot be created; errno is EEXIST when it
          already exists, because of O_CREAT | O_EXCL.
    """
    open_flags = (os.O_CREAT | os.O_EXCL | os.O_WRONLY)
    fd = os.open(self.lockfile, open_flags, 0o644)
    # The with-block closes the descriptor even if the write raises.
    with os.fdopen(fd, 'w') as f:
      f.write('%d\n' % self.pid)

  def _remove_lockfile(self):
    """Delete the lockfile. Complains (implicitly) if it doesn't exist."""
    os.remove(self.lockfile)

  def lock(self):
    """Acquire the lock.

    Note: This is a NON-BLOCKING FAIL-FAST operation.
    Do. Or do not. There is no try.

    Raises:
      LockError: If the lockfile already exists or cannot be created.
    """
    try:
      self._make_lockfile()
    except OSError as e:
      if e.errno == errno.EEXIST:
        raise LockError("%s is already locked" % self.path)
      else:
        # Name the lockfile here: that is the file that could not be created.
        raise LockError("Failed to create %s (err %s)" %
                        (self.lockfile, e.errno))

  def unlock(self):
    """Release the lock.

    Raises:
      LockError: If nothing holds the lock, or the pid stored in the lockfile
          is not this process's pid.
    """
    if not self.is_locked():
      raise LockError("%s is not locked" % self.path)
    if not self.i_am_locking():
      raise LockError("%s is locked, but not by me" % self.path)
    self._remove_lockfile()

  def break_lock(self):
    """Remove the lock, even if it was created by someone else.

    Returns:
      True if a lockfile was removed, False if there was none to remove.

    Raises:
      OSError: If removal fails for any reason other than ENOENT.
    """
    try:
      self._remove_lockfile()
      return True
    except OSError as exc:
      if exc.errno == errno.ENOENT:
        return False
      else:
        raise

  def is_locked(self):
    """Test if the file is locked by anyone.

    Note: This method is potentially racy. By the time it returns the lockfile
    may have been unlocked, removed, or stolen by some other process.
    """
    return os.path.exists(self.lockfile)

  def i_am_locking(self):
    """Test if the file is locked by this process."""
    return self.is_locked() and self.pid == self._read_pid()

  def __enter__(self):
    """Acquire the lock and return this instance."""
    self.lock()
    return self

  def __exit__(self, *_exc):
    """Release the lock; exceptions from the with-body are not suppressed."""
    self.unlock()
|
| +
|
| +
|
| +@subcommand.usage('[url of repo to check for caching]')
|
| +def CMDexists(parser, args):
|
| + """Check to see if there already is a cache of the given repo."""
|
| + options, args = parser.parse_args(args)
|
| + if not len(args) == 1:
|
| + parser.error('git cache exists only takes exactly one repo url.')
|
| + url = args[0]
|
| + repo_dir = os.path.join(options.cache_dir, UrlToCacheDir(url))
|
| + flag_file = os.path.join(repo_dir, 'config')
|
| + if os.path.isdir(repo_dir) and os.path.isfile(flag_file):
|
| + print repo_dir
|
| + return 0
|
| + return 1
|
| +
|
| +
|
@subcommand.usage('[url of repo to add to or update in cache]')
def CMDpopulate(parser, args):
  """Ensure that the cache has all up-to-date objects for the given repo."""
  # A repo without a 'config' file is rebuilt from scratch in a temporary
  # directory and renamed into place once the fetch succeeds. An existing
  # repo is re-configured and fetched in place. Both happen under the repo's
  # Lockfile.
  parser.add_option('--depth', type='int',
                    help='Only cache DEPTH commits of history')
  parser.add_option('--shallow', '-s', action='store_true',
                    help='Only cache 10000 commits of history')
  parser.add_option('--ref', action='append',
                    help='Specify additional refs to be fetched')
  options, args = parser.parse_args(args)
  if options.shallow and not options.depth:
    options.depth = 10000
  if len(args) != 1:
    parser.error('git cache populate only takes exactly one repo url.')
  url = args[0]

  gclient_utils.safe_makedirs(options.cache_dir)
  repo_dir = os.path.join(options.cache_dir, UrlToCacheDir(url))

  # Without --verbose, lines containing '[up to date]' are filtered out of
  # the fetch output; with it, git is asked for progress and nothing is
  # filtered.
  verbose_flags = []
  filter_fn = lambda l: '[up to date]' not in l
  if options.verbose:
    verbose_flags = ['-v', '--progress']
    filter_fn = None

  depth_flags = []
  if options.depth:
    depth_flags = ['--depth', '%d' % options.depth]

  def _config(directory):
    """Write the cache's git configuration into the repo at |directory|."""
    RunGit(['config', 'core.deltaBaseCacheLimit', '2g'],
           cwd=directory)
    RunGit(['config', 'remote.origin.url', NormalizeUrl(url)],
           cwd=directory)
    # --replace-all resets the fetch refspecs; extra --ref values are then
    # appended one by one.
    RunGit(['config', '--replace-all', 'remote.origin.fetch',
            '+refs/heads/*:refs/heads/*'],
           cwd=directory)
    for ref in options.ref or []:
      ref = ref.rstrip('/')
      refspec = '+refs/%s/*:refs/%s/*' % (ref, ref)
      RunGit(['config', '--add', 'remote.origin.fetch', refspec],
             cwd=directory)

  with Lockfile(repo_dir):
    # Setup from scratch if the repo is new or is in a bad state.
    if not os.path.exists(os.path.join(repo_dir, 'config')):
      gclient_utils.rmtree(repo_dir)
      tempdir = tempfile.mkdtemp(suffix=UrlToCacheDir(url),
                                 dir=options.cache_dir)
      populated = False
      try:
        RunGit(['init', '--bare'], cwd=tempdir)
        _config(tempdir)
        fetch_cmd = (['fetch'] + verbose_flags + depth_flags +
                     ['--tags', 'origin'])
        RunGit(fetch_cmd, filter_fn=filter_fn, cwd=tempdir, retry=True)
        os.rename(tempdir, repo_dir)
        populated = True
      finally:
        # Every attempt gets a fresh temp dir, so a half-populated one is
        # never reused; remove it instead of leaving it in the cache dir.
        if not populated:
          gclient_utils.rmtree(tempdir)
    else:
      _config(repo_dir)
      if options.depth and os.path.exists(os.path.join(repo_dir, 'shallow')):
        logging.warning(
            'Shallow fetch requested, but repo cache already exists.')
      fetch_cmd = (['fetch'] + verbose_flags +
                   ['--update-shallow', '--tags', 'origin'])
      RunGit(fetch_cmd, filter_fn=filter_fn, cwd=repo_dir, retry=True)
|
| +
|
| +
|
| +@subcommand.usage('[url of repo to unlock, or -a|--all]')
|
| +def CMDunlock(parser, args):
|
| + """Unlock one or all repos if their lock files are still around."""
|
| + parser.add_option('--force', '-f', action='store_true',
|
| + help='Actually perform the action')
|
| + parser.add_option('--all', '-a', action='store_true',
|
| + help='Unlock all repository caches')
|
| + options, args = parser.parse_args(args)
|
| + if len(args) > 1 or (len(args) == 0 and not options.all):
|
| + parser.error('git cache unlock takes exactly one repo url, or --all')
|
| +
|
| + if not options.all:
|
| + url = args[0]
|
| + repo_dirs = [os.path.join(options.cache_dir, UrlToCacheDir(url))]
|
| + else:
|
| + repo_dirs = [path for path in os.listdir(options.cache_dir)
|
| + if os.path.isdir(path)]
|
| + lockfiles = [repo_dir + '.lock' for repo_dir in repo_dirs
|
| + if os.path.exists(repo_dir + '.lock')]
|
| +
|
| + if not options.force:
|
| + parser.error('git cache unlock requires -f|--force to do anything. '
|
| + 'Refusing to unlock the following repo caches: '
|
| + ', '.join(lockfiles))
|
| +
|
| + unlocked = []
|
| + untouched = []
|
| + for repo_dir in repo_dirs:
|
| + lf = Lockfile(repo_dir)
|
| + if lf.break_lock():
|
| + unlocked.append(repo_dir)
|
| + else:
|
| + untouched.append(repo_dir)
|
| +
|
| + if unlocked:
|
| + logging.info('Broke locks on these caches: %s' % unlocked)
|
| + if untouched:
|
| + logging.debug('Did not touch these caches: %s' % untouched)
|
| +
|
| +
|
class OptionParser(optparse.OptionParser):
  """Wrapper class for OptionParser to handle global options.

  Adds -c/--cache-dir and -v/--verbose to every command and, in parse_args(),
  configures logging and resolves the cache directory.
  """

  def __init__(self, *args, **kwargs):
    """Create the parser with prog set to 'git cache' and the global options."""
    optparse.OptionParser.__init__(self, *args, prog='git cache', **kwargs)
    self.add_option('-c', '--cache-dir',
                    help='Path to the directory containing the cache')
    self.add_option('-v', '--verbose', action='count', default=0,
                    help='Increase verbosity (can be passed multiple times)')

  def parse_args(self, args=None, values=None):
    """Parse |args|, set up logging and resolve options.cache_dir.

    The cache directory comes from --cache-dir when given, otherwise from the
    global git config key cache.cachepath. Parsing fails through self.error()
    when neither is available. The resolved directory is made absolute.

    Returns:
      The (options, args) pair from optparse.OptionParser.parse_args().
    """
    options, args = optparse.OptionParser.parse_args(self, args, values)

    # Configure logging before anything below can log: the first logging call
    # on an unconfigured root logger installs a default handler, after which
    # basicConfig() is a no-op and the requested verbosity would be ignored.
    levels = [logging.WARNING, logging.INFO, logging.DEBUG]
    logging.basicConfig(level=levels[min(options.verbose, len(levels) - 1)])

    try:
      global_cache_dir = subprocess.check_output(
          [GIT_EXECUTABLE, 'config', '--global', 'cache.cachepath']).strip()
      if options.cache_dir:
        logging.warning('Overriding globally-configured cache directory.')
      else:
        options.cache_dir = global_cache_dir
    except subprocess.CalledProcessError:
      # git exited non-zero, so no usable global setting is available.
      if not options.cache_dir:
        self.error('No cache directory specified on command line '
                   'or in cache.cachepath.')
    options.cache_dir = os.path.abspath(options.cache_dir)

    return options, args
|
| +
|
| +
|
def main(argv):
  """Dispatch |argv| to the matching command of this module.

  Args:
    argv: Command-line arguments without the program name.

  Returns:
    Whatever the command dispatcher's execute() returns.
  """
  commands = subcommand.CommandDispatcher(__name__)
  parser = OptionParser()
  return commands.execute(parser, argv)
|
| +
|
| +
|
if __name__ == '__main__':
  # Run as a script: hand main()'s return value to sys.exit().
  exit_code = main(sys.argv[1:])
  sys.exit(exit_code)
|
|
|