Index: git_common.py |
diff --git a/git_common.py b/git_common.py |
new file mode 100644 |
index 0000000000000000000000000000000000000000..a8229cf5ff30066f0c432767327296cbdcd4b4b4 |
--- /dev/null |
+++ b/git_common.py |
@@ -0,0 +1,301 @@ |
+# Copyright (c) 2013 The Chromium Authors. All rights reserved. |
+# Use of this source code is governed by a BSD-style license that can be |
+# found in the LICENSE file. |
+ |
+# Monkeypatch IMapIterator so that Ctrl-C can kill everything properly. |
+# Derived from https://gist.github.com/aljungberg/626518 |
+import multiprocessing.pool |
+from multiprocessing.pool import IMapIterator |
+def wrapper(func): |
+ def wrap(self, timeout=None): |
+ return func(self, timeout=timeout or 1e100) |
+ return wrap |
+IMapIterator.next = wrapper(IMapIterator.next) |
+IMapIterator.__next__ = IMapIterator.next |
+# TODO(iannucci): Monkeypatch all other 'wait' methods too. |
+ |
+ |
+import binascii |
+import contextlib |
+import functools |
+import logging |
+import signal |
+import sys |
+import tempfile |
+import threading |
+ |
+import subprocess2 |
+ |
+ |
+GIT_EXE = 'git.bat' if sys.platform.startswith('win') else 'git' |
+ |
+ |
+class BadCommitRefException(Exception): |
+ def __init__(self, refs): |
+ msg = ('one of %s does not seem to be a valid commitref.' % |
+ str(refs)) |
+ super(BadCommitRefException, self).__init__(msg) |
+ |
+ |
+def memoize_one(**kwargs): |
+ """Memoizes a single-argument pure function. |
+ |
+ Values of None are not cached. |
+ |
+ Kwargs: |
+ threadsafe (bool) - REQUIRED. Specifies whether to use locking around |
+ cache manipulation functions. This is a kwarg so that users of memoize_one |
+ are forced to explicitly and verbosely pick True or False. |
+ |
+ Adds three methods to the decorated function: |
+ * get(key, default=None) - Gets the value for this key from the cache. |
+ * set(key, value) - Sets the value for this key from the cache. |
+ * clear() - Drops the entire contents of the cache. Useful for unittests. |
+ * update(other) - Updates the contents of the cache from another dict. |
+ """ |
+ assert 'threadsafe' in kwargs, 'Must specify threadsafe={True,False}' |
+ threadsafe = kwargs['threadsafe'] |
+ |
+ if threadsafe: |
+ def withlock(lock, f): |
+ def inner(*args, **kwargs): |
+ with lock: |
+ return f(*args, **kwargs) |
+ return inner |
+ else: |
+ def withlock(_lock, f): |
+ return f |
+ |
+ def decorator(f): |
+ # Instantiate the lock in decorator, in case users of memoize_one do: |
+ # |
+ # memoizer = memoize_one(threadsafe=True) |
+ # |
+ # @memoizer |
+ # def fn1(val): ... |
+ # |
+ # @memoizer |
+ # def fn2(val): ... |
+ |
+ lock = threading.Lock() if threadsafe else None |
+ cache = {} |
+ _get = withlock(lock, cache.get) |
+ _set = withlock(lock, cache.__setitem__) |
+ |
+ @functools.wraps(f) |
+ def inner(arg): |
+ ret = _get(arg) |
+ if ret is None: |
+ ret = f(arg) |
+ if ret is not None: |
+ _set(arg, ret) |
+ return ret |
+ inner.get = _get |
+ inner.set = _set |
+ inner.clear = withlock(lock, cache.clear) |
+ inner.update = withlock(lock, cache.update) |
+ return inner |
+ return decorator |
+ |
+ |
+def _ScopedPool_initer(orig, orig_args): # pragma: no cover |
+ """Initializer method for ScopedPool's subprocesses. |
+ |
+ This helps ScopedPool handle Ctrl-C's correctly. |
+ """ |
+ signal.signal(signal.SIGINT, signal.SIG_IGN) |
+ if orig: |
+ orig(*orig_args) |
+ |
+ |
+@contextlib.contextmanager |
+def ScopedPool(*args, **kwargs): |
+ """Context Manager which returns a multiprocessing.pool instance which |
+ correctly deals with thrown exceptions. |
+ |
+ *args - Arguments to multiprocessing.pool |
+ |
+ Kwargs: |
+ kind ('threads', 'procs') - The type of underlying coprocess to use. |
+ **etc - Arguments to multiprocessing.pool |
+ """ |
+ if kwargs.pop('kind', None) == 'threads': |
+ pool = multiprocessing.pool.ThreadPool(*args, **kwargs) |
+ else: |
+ orig, orig_args = kwargs.get('initializer'), kwargs.get('initargs', ()) |
+ kwargs['initializer'] = _ScopedPool_initer |
+ kwargs['initargs'] = orig, orig_args |
+ pool = multiprocessing.pool.Pool(*args, **kwargs) |
+ |
+ try: |
+ yield pool |
+ pool.close() |
+ except: |
+ pool.terminate() |
+ raise |
+ finally: |
+ pool.join() |
+ |
+ |
+class ProgressPrinter(object): |
+ """Threaded single-stat status message printer.""" |
+ def __init__(self, fmt, enabled=None, stream=sys.stderr, period=0.5): |
+ """Create a ProgressPrinter. |
+ |
+ Use it as a context manager which produces a simple 'increment' method: |
+ |
+ with ProgressPrinter('(%%(count)d/%d)' % 1000) as inc: |
+ for i in xrange(1000): |
+ # do stuff |
+ if i % 10 == 0: |
+ inc(10) |
+ |
+ Args: |
+ fmt - String format with a single '%(count)d' where the counter value |
+ should go. |
+ enabled (bool) - If this is None, will default to True if |
+ logging.getLogger() is set to INFO or more verbose. |
+ stream (file-like) - The stream to print status messages to. |
+ period (float) - The time in seconds for the printer thread to wait |
+ between printing. |
+ """ |
+ self.fmt = fmt |
+ if enabled is None: # pragma: no cover |
+ self.enabled = logging.getLogger().isEnabledFor(logging.INFO) |
+ else: |
+ self.enabled = enabled |
+ |
+ self._count = 0 |
+ self._dead = False |
+ self._dead_cond = threading.Condition() |
+ self._stream = stream |
+ self._thread = threading.Thread(target=self._run) |
+ self._period = period |
+ |
+ def _emit(self, s): |
+ if self.enabled: |
+ self._stream.write('\r' + s) |
+ self._stream.flush() |
+ |
+ def _run(self): |
+ with self._dead_cond: |
+ while not self._dead: |
+ self._emit(self.fmt % {'count': self._count}) |
+ self._dead_cond.wait(self._period) |
+ self._emit((self.fmt + '\n') % {'count': self._count}) |
+ |
+ def inc(self, amount=1): |
+ self._count += amount |
+ |
+ def __enter__(self): |
+ self._thread.start() |
+ return self.inc |
+ |
+ def __exit__(self, _exc_type, _exc_value, _traceback): |
+ self._dead = True |
+ with self._dead_cond: |
+ self._dead_cond.notifyAll() |
+ self._thread.join() |
+ del self._thread |
+ |
+ |
+def parse_commitrefs(*commitrefs): |
+ """Returns binary encoded commit hashes for one or more commitrefs. |
+ |
+ A commitref is anything which can resolve to a commit. Popular examples: |
+ * 'HEAD' |
+ * 'origin/master' |
+ * 'cool_branch~2' |
+ """ |
+ try: |
+ return map(binascii.unhexlify, hashes(*commitrefs)) |
+ except subprocess2.CalledProcessError: |
+ raise BadCommitRefException(commitrefs) |
+ |
+ |
+def run(*cmd, **kwargs): |
+ """Runs a git command. Returns stdout as a string. |
+ |
+ If logging is DEBUG, we'll print the command before we run it. |
+ |
+ kwargs |
+ autostrip (bool) - Strip the output. Defaults to True. |
+ Output string is always strip()'d. |
+ """ |
+ autostrip = kwargs.pop('autostrip', True) |
+ cmd = (GIT_EXE,) + cmd |
+ logging.debug('Running %s', ' '.join(repr(tok) for tok in cmd)) |
+ ret = subprocess2.check_output(cmd, stderr=subprocess2.PIPE, **kwargs) |
+ if autostrip: |
+ ret = (ret or '').strip() |
+ return ret |
+ |
+ |
+def hashes(*reflike): |
+ return run('rev-parse', *reflike).splitlines() |
+ |
+ |
+def intern_f(f, kind='blob'): |
+ """Interns a file object into the git object store. |
+ |
+ Args: |
+ f (file-like object) - The file-like object to intern |
+ kind (git object type) - One of 'blob', 'commit', 'tree', 'tag'. |
+ |
+ Returns the git hash of the interned object (hex encoded). |
+ """ |
+ ret = run('hash-object', '-t', kind, '-w', '--stdin', stdin=f) |
+ f.close() |
+ return ret |
+ |
+ |
+def tree(treeref, recurse=False): |
+ """Returns a dict representation of a git tree object. |
+ |
+ Args: |
+ treeref (str) - a git ref which resolves to a tree (commits count as trees). |
+ recurse (bool) - include all of the tree's decendants too. File names will |
+ take the form of 'some/path/to/file'. |
+ |
+ Return format: |
+ { 'file_name': (mode, type, ref) } |
+ |
+ mode is an integer where: |
+ * 0040000 - Directory |
+ * 0100644 - Regular non-executable file |
+ * 0100664 - Regular non-executable group-writeable file |
+ * 0100755 - Regular executable file |
+ * 0120000 - Symbolic link |
+ * 0160000 - Gitlink |
+ |
+ type is a string where it's one of 'blob', 'commit', 'tree', 'tag'. |
+ |
+ ref is the hex encoded hash of the entry. |
+ """ |
+ ret = {} |
+ opts = ['ls-tree', '--full-tree'] |
+ if recurse: |
+ opts.append('-r') |
+ opts.append(treeref) |
+ try: |
+ for line in run(*opts).splitlines(): |
+ mode, typ, ref, name = line.split(None, 3) |
+ ret[name] = (mode, typ, ref) |
+ except subprocess2.CalledProcessError: |
+ return None |
+ return ret |
+ |
+ |
+def mktree(treedict): |
+ """Makes a git tree object and returns its hash. |
+ |
+ See |tree()| for the values of mode, type, and ref. |
+ |
+ Args: |
+ treedict - { name: (mode, type, ref) } |
+ """ |
+ with tempfile.TemporaryFile() as f: |
+ for name, (mode, typ, ref) in treedict.iteritems(): |
+ f.write('%s %s %s\t%s\0' % (mode, typ, ref, name)) |
+ f.seek(0) |
+ return run('mktree', '-z', stdin=f) |