| # Copyright 2013 The Chromium Authors. All rights reserved. |
| # Use of this source code is governed by a BSD-style license that can be |
| # found in the LICENSE file. |
| |
| # Monkeypatch IMapIterator so that Ctrl-C can kill everything properly. |
| # Derived from https://gist.github.com/aljungberg/626518 |
| import multiprocessing.pool |
| from multiprocessing.pool import IMapIterator |
| def wrapper(func): |
| def wrap(self, timeout=None): |
| return func(self, timeout=timeout or 1e100) |
| return wrap |
| IMapIterator.next = wrapper(IMapIterator.next) |
| IMapIterator.__next__ = IMapIterator.next |
| # TODO(iannucci): Monkeypatch all other 'wait' methods too. |
| |
| |
| import binascii |
| import contextlib |
| import functools |
| import logging |
| import signal |
| import sys |
| import tempfile |
| import threading |
| |
| import subprocess2 |
| |
| |
| GIT_EXE = 'git.bat' if sys.platform.startswith('win') else 'git' |
| |
| |
| class BadCommitRefException(Exception): |
| def __init__(self, refs): |
| msg = ('one of %s does not seem to be a valid commitref.' % |
| str(refs)) |
| super(BadCommitRefException, self).__init__(msg) |
| |
| |
| def memoize_one(**kwargs): |
| """Memoizes a single-argument pure function. |
| |
| Values of None are not cached. |
| |
| Kwargs: |
| threadsafe (bool) - REQUIRED. Specifies whether to use locking around |
| cache manipulation functions. This is a kwarg so that users of memoize_one |
| are forced to explicitly and verbosely pick True or False. |
| |
| Adds three methods to the decorated function: |
| * get(key, default=None) - Gets the value for this key from the cache. |
| * set(key, value) - Sets the value for this key from the cache. |
| * clear() - Drops the entire contents of the cache. Useful for unittests. |
| * update(other) - Updates the contents of the cache from another dict. |
| """ |
| assert 'threadsafe' in kwargs, 'Must specify threadsafe={True,False}' |
| threadsafe = kwargs['threadsafe'] |
| |
| if threadsafe: |
| def withlock(lock, f): |
| def inner(*args, **kwargs): |
| with lock: |
| return f(*args, **kwargs) |
| return inner |
| else: |
| def withlock(_lock, f): |
| return f |
| |
| def decorator(f): |
| # Instantiate the lock in decorator, in case users of memoize_one do: |
| # |
| # memoizer = memoize_one(threadsafe=True) |
| # |
| # @memoizer |
| # def fn1(val): ... |
| # |
| # @memoizer |
| # def fn2(val): ... |
| |
| lock = threading.Lock() if threadsafe else None |
| cache = {} |
| _get = withlock(lock, cache.get) |
| _set = withlock(lock, cache.__setitem__) |
| |
| @functools.wraps(f) |
| def inner(arg): |
| ret = _get(arg) |
| if ret is None: |
| ret = f(arg) |
| if ret is not None: |
| _set(arg, ret) |
| return ret |
| inner.get = _get |
| inner.set = _set |
| inner.clear = withlock(lock, cache.clear) |
| inner.update = withlock(lock, cache.update) |
| return inner |
| return decorator |
| |
| |
| def _ScopedPool_initer(orig, orig_args): # pragma: no cover |
| """Initializer method for ScopedPool's subprocesses. |
| |
| This helps ScopedPool handle Ctrl-C's correctly. |
| """ |
| signal.signal(signal.SIGINT, signal.SIG_IGN) |
| if orig: |
| orig(*orig_args) |
| |
| |
| @contextlib.contextmanager |
| def ScopedPool(*args, **kwargs): |
| """Context Manager which returns a multiprocessing.pool instance which |
| correctly deals with thrown exceptions. |
| |
| *args - Arguments to multiprocessing.pool |
| |
| Kwargs: |
| kind ('threads', 'procs') - The type of underlying coprocess to use. |
| **etc - Arguments to multiprocessing.pool |
| """ |
| if kwargs.pop('kind', None) == 'threads': |
| pool = multiprocessing.pool.ThreadPool(*args, **kwargs) |
| else: |
| orig, orig_args = kwargs.get('initializer'), kwargs.get('initargs', ()) |
| kwargs['initializer'] = _ScopedPool_initer |
| kwargs['initargs'] = orig, orig_args |
| pool = multiprocessing.pool.Pool(*args, **kwargs) |
| |
| try: |
| yield pool |
| pool.close() |
| except: |
| pool.terminate() |
| raise |
| finally: |
| pool.join() |
| |
| |
| class ProgressPrinter(object): |
| """Threaded single-stat status message printer.""" |
| def __init__(self, fmt, enabled=None, stream=sys.stderr, period=0.5): |
| """Create a ProgressPrinter. |
| |
| Use it as a context manager which produces a simple 'increment' method: |
| |
| with ProgressPrinter('(%%(count)d/%d)' % 1000) as inc: |
| for i in xrange(1000): |
| # do stuff |
| if i % 10 == 0: |
| inc(10) |
| |
| Args: |
| fmt - String format with a single '%(count)d' where the counter value |
| should go. |
| enabled (bool) - If this is None, will default to True if |
| logging.getLogger() is set to INFO or more verbose. |
| stream (file-like) - The stream to print status messages to. |
| period (float) - The time in seconds for the printer thread to wait |
| between printing. |
| """ |
| self.fmt = fmt |
| if enabled is None: # pragma: no cover |
| self.enabled = logging.getLogger().isEnabledFor(logging.INFO) |
| else: |
| self.enabled = enabled |
| |
| self._count = 0 |
| self._dead = False |
| self._dead_cond = threading.Condition() |
| self._stream = stream |
| self._thread = threading.Thread(target=self._run) |
| self._period = period |
| |
| def _emit(self, s): |
| if self.enabled: |
| self._stream.write('\r' + s) |
| self._stream.flush() |
| |
| def _run(self): |
| with self._dead_cond: |
| while not self._dead: |
| self._emit(self.fmt % {'count': self._count}) |
| self._dead_cond.wait(self._period) |
| self._emit((self.fmt + '\n') % {'count': self._count}) |
| |
| def inc(self, amount=1): |
| self._count += amount |
| |
| def __enter__(self): |
| self._thread.start() |
| return self.inc |
| |
| def __exit__(self, _exc_type, _exc_value, _traceback): |
| self._dead = True |
| with self._dead_cond: |
| self._dead_cond.notifyAll() |
| self._thread.join() |
| del self._thread |
| |
| |
| def parse_commitrefs(*commitrefs): |
| """Returns binary encoded commit hashes for one or more commitrefs. |
| |
| A commitref is anything which can resolve to a commit. Popular examples: |
| * 'HEAD' |
| * 'origin/master' |
| * 'cool_branch~2' |
| """ |
| try: |
| return map(binascii.unhexlify, hashes(*commitrefs)) |
| except subprocess2.CalledProcessError: |
| raise BadCommitRefException(commitrefs) |
| |
| |
| def run(*cmd, **kwargs): |
| """Runs a git command. Returns stdout as a string. |
| |
| If logging is DEBUG, we'll print the command before we run it. |
| |
| kwargs |
| autostrip (bool) - Strip the output. Defaults to True. |
| Output string is always strip()'d. |
| """ |
| autostrip = kwargs.pop('autostrip', True) |
| cmd = (GIT_EXE,) + cmd |
| logging.debug('Running %s', ' '.join(repr(tok) for tok in cmd)) |
| ret = subprocess2.check_output(cmd, stderr=subprocess2.PIPE, **kwargs) |
| if autostrip: |
| ret = (ret or '').strip() |
| return ret |
| |
| |
| def hashes(*reflike): |
| return run('rev-parse', *reflike).splitlines() |
| |
| |
| def intern_f(f, kind='blob'): |
| """Interns a file object into the git object store. |
| |
| Args: |
| f (file-like object) - The file-like object to intern |
| kind (git object type) - One of 'blob', 'commit', 'tree', 'tag'. |
| |
| Returns the git hash of the interned object (hex encoded). |
| """ |
| ret = run('hash-object', '-t', kind, '-w', '--stdin', stdin=f) |
| f.close() |
| return ret |
| |
| |
| def tree(treeref, recurse=False): |
| """Returns a dict representation of a git tree object. |
| |
| Args: |
| treeref (str) - a git ref which resolves to a tree (commits count as trees). |
| recurse (bool) - include all of the tree's decendants too. File names will |
| take the form of 'some/path/to/file'. |
| |
| Return format: |
| { 'file_name': (mode, type, ref) } |
| |
| mode is an integer where: |
| * 0040000 - Directory |
| * 0100644 - Regular non-executable file |
| * 0100664 - Regular non-executable group-writeable file |
| * 0100755 - Regular executable file |
| * 0120000 - Symbolic link |
| * 0160000 - Gitlink |
| |
| type is a string where it's one of 'blob', 'commit', 'tree', 'tag'. |
| |
| ref is the hex encoded hash of the entry. |
| """ |
| ret = {} |
| opts = ['ls-tree', '--full-tree'] |
| if recurse: |
| opts.append('-r') |
| opts.append(treeref) |
| try: |
| for line in run(*opts).splitlines(): |
| mode, typ, ref, name = line.split(None, 3) |
| ret[name] = (mode, typ, ref) |
| except subprocess2.CalledProcessError: |
| return None |
| return ret |
| |
| |
| def mktree(treedict): |
| """Makes a git tree object and returns its hash. |
| |
| See |tree()| for the values of mode, type, and ref. |
| |
| Args: |
| treedict - { name: (mode, type, ref) } |
| """ |
| with tempfile.TemporaryFile() as f: |
| for name, (mode, typ, ref) in treedict.iteritems(): |
| f.write('%s %s %s\t%s\0' % (mode, typ, ref, name)) |
| f.seek(0) |
| return run('mktree', '-z', stdin=f) |