blob: c1e4f0bac0ba4df6ef6d3d4226117cc92e43b939 [file] [log] [blame]
iannucci@chromium.orgaa74cf62013-11-19 20:00:49 +00001# Copyright 2013 The Chromium Authors. All rights reserved.
2# Use of this source code is governed by a BSD-style license that can be
3# found in the LICENSE file.
4
5# Monkeypatch IMapIterator so that Ctrl-C can kill everything properly.
6# Derived from https://gist.github.com/aljungberg/626518
7import multiprocessing.pool
8from multiprocessing.pool import IMapIterator
9def wrapper(func):
10 def wrap(self, timeout=None):
11 return func(self, timeout=timeout or 1e100)
12 return wrap
13IMapIterator.next = wrapper(IMapIterator.next)
14IMapIterator.__next__ = IMapIterator.next
15# TODO(iannucci): Monkeypatch all other 'wait' methods too.
16
17
18import binascii
19import contextlib
20import functools
21import logging
22import signal
23import sys
24import tempfile
25import threading
26
27import subprocess2
28
29
30GIT_EXE = 'git.bat' if sys.platform.startswith('win') else 'git'
31
32
33class BadCommitRefException(Exception):
34 def __init__(self, refs):
35 msg = ('one of %s does not seem to be a valid commitref.' %
36 str(refs))
37 super(BadCommitRefException, self).__init__(msg)
38
39
40def memoize_one(**kwargs):
41 """Memoizes a single-argument pure function.
42
43 Values of None are not cached.
44
45 Kwargs:
46 threadsafe (bool) - REQUIRED. Specifies whether to use locking around
47 cache manipulation functions. This is a kwarg so that users of memoize_one
48 are forced to explicitly and verbosely pick True or False.
49
50 Adds three methods to the decorated function:
51 * get(key, default=None) - Gets the value for this key from the cache.
52 * set(key, value) - Sets the value for this key from the cache.
53 * clear() - Drops the entire contents of the cache. Useful for unittests.
54 * update(other) - Updates the contents of the cache from another dict.
55 """
56 assert 'threadsafe' in kwargs, 'Must specify threadsafe={True,False}'
57 threadsafe = kwargs['threadsafe']
58
59 if threadsafe:
60 def withlock(lock, f):
61 def inner(*args, **kwargs):
62 with lock:
63 return f(*args, **kwargs)
64 return inner
65 else:
66 def withlock(_lock, f):
67 return f
68
69 def decorator(f):
70 # Instantiate the lock in decorator, in case users of memoize_one do:
71 #
72 # memoizer = memoize_one(threadsafe=True)
73 #
74 # @memoizer
75 # def fn1(val): ...
76 #
77 # @memoizer
78 # def fn2(val): ...
79
80 lock = threading.Lock() if threadsafe else None
81 cache = {}
82 _get = withlock(lock, cache.get)
83 _set = withlock(lock, cache.__setitem__)
84
85 @functools.wraps(f)
86 def inner(arg):
87 ret = _get(arg)
88 if ret is None:
89 ret = f(arg)
90 if ret is not None:
91 _set(arg, ret)
92 return ret
93 inner.get = _get
94 inner.set = _set
95 inner.clear = withlock(lock, cache.clear)
96 inner.update = withlock(lock, cache.update)
97 return inner
98 return decorator
99
100
101def _ScopedPool_initer(orig, orig_args): # pragma: no cover
102 """Initializer method for ScopedPool's subprocesses.
103
104 This helps ScopedPool handle Ctrl-C's correctly.
105 """
106 signal.signal(signal.SIGINT, signal.SIG_IGN)
107 if orig:
108 orig(*orig_args)
109
110
111@contextlib.contextmanager
112def ScopedPool(*args, **kwargs):
113 """Context Manager which returns a multiprocessing.pool instance which
114 correctly deals with thrown exceptions.
115
116 *args - Arguments to multiprocessing.pool
117
118 Kwargs:
119 kind ('threads', 'procs') - The type of underlying coprocess to use.
120 **etc - Arguments to multiprocessing.pool
121 """
122 if kwargs.pop('kind', None) == 'threads':
123 pool = multiprocessing.pool.ThreadPool(*args, **kwargs)
124 else:
125 orig, orig_args = kwargs.get('initializer'), kwargs.get('initargs', ())
126 kwargs['initializer'] = _ScopedPool_initer
127 kwargs['initargs'] = orig, orig_args
128 pool = multiprocessing.pool.Pool(*args, **kwargs)
129
130 try:
131 yield pool
132 pool.close()
133 except:
134 pool.terminate()
135 raise
136 finally:
137 pool.join()
138
139
140class ProgressPrinter(object):
141 """Threaded single-stat status message printer."""
142 def __init__(self, fmt, enabled=None, stream=sys.stderr, period=0.5):
143 """Create a ProgressPrinter.
144
145 Use it as a context manager which produces a simple 'increment' method:
146
147 with ProgressPrinter('(%%(count)d/%d)' % 1000) as inc:
148 for i in xrange(1000):
149 # do stuff
150 if i % 10 == 0:
151 inc(10)
152
153 Args:
154 fmt - String format with a single '%(count)d' where the counter value
155 should go.
156 enabled (bool) - If this is None, will default to True if
157 logging.getLogger() is set to INFO or more verbose.
158 stream (file-like) - The stream to print status messages to.
159 period (float) - The time in seconds for the printer thread to wait
160 between printing.
161 """
162 self.fmt = fmt
163 if enabled is None: # pragma: no cover
164 self.enabled = logging.getLogger().isEnabledFor(logging.INFO)
165 else:
166 self.enabled = enabled
167
168 self._count = 0
169 self._dead = False
170 self._dead_cond = threading.Condition()
171 self._stream = stream
172 self._thread = threading.Thread(target=self._run)
173 self._period = period
174
175 def _emit(self, s):
176 if self.enabled:
177 self._stream.write('\r' + s)
178 self._stream.flush()
179
180 def _run(self):
181 with self._dead_cond:
182 while not self._dead:
183 self._emit(self.fmt % {'count': self._count})
184 self._dead_cond.wait(self._period)
185 self._emit((self.fmt + '\n') % {'count': self._count})
186
187 def inc(self, amount=1):
188 self._count += amount
189
190 def __enter__(self):
191 self._thread.start()
192 return self.inc
193
194 def __exit__(self, _exc_type, _exc_value, _traceback):
195 self._dead = True
196 with self._dead_cond:
197 self._dead_cond.notifyAll()
198 self._thread.join()
199 del self._thread
200
201
iannucci@chromium.org8bc9b5c2014-03-12 01:36:18 +0000202def branches(*args):
203 NO_BRANCH = ('* (no branch)', '* (detached from ')
204 for line in run('branch', *args).splitlines():
205 if line.startswith(NO_BRANCH):
206 continue
207 yield line.split()[-1]
208
209
210def config_list(option):
211 try:
212 return run('config', '--get-all', option).split()
213 except subprocess2.CalledProcessError:
214 return []
215
216
217def current_branch():
218 return run('rev-parse', '--abbrev-ref', 'HEAD')
219
220
iannucci@chromium.orgaa74cf62013-11-19 20:00:49 +0000221def parse_commitrefs(*commitrefs):
222 """Returns binary encoded commit hashes for one or more commitrefs.
223
224 A commitref is anything which can resolve to a commit. Popular examples:
225 * 'HEAD'
226 * 'origin/master'
227 * 'cool_branch~2'
228 """
229 try:
iannucci@chromium.org8bc9b5c2014-03-12 01:36:18 +0000230 return map(binascii.unhexlify, hash_multi(*commitrefs))
iannucci@chromium.orgaa74cf62013-11-19 20:00:49 +0000231 except subprocess2.CalledProcessError:
232 raise BadCommitRefException(commitrefs)
233
234
235def run(*cmd, **kwargs):
236 """Runs a git command. Returns stdout as a string.
237
238 If logging is DEBUG, we'll print the command before we run it.
239
240 kwargs
241 autostrip (bool) - Strip the output. Defaults to True.
242 Output string is always strip()'d.
243 """
244 autostrip = kwargs.pop('autostrip', True)
245 cmd = (GIT_EXE,) + cmd
246 logging.debug('Running %s', ' '.join(repr(tok) for tok in cmd))
247 ret = subprocess2.check_output(cmd, stderr=subprocess2.PIPE, **kwargs)
248 if autostrip:
249 ret = (ret or '').strip()
250 return ret
251
252
iannucci@chromium.org8bc9b5c2014-03-12 01:36:18 +0000253def hash_one(reflike):
254 return run('rev-parse', reflike)
255
256
257def hash_multi(*reflike):
iannucci@chromium.orgaa74cf62013-11-19 20:00:49 +0000258 return run('rev-parse', *reflike).splitlines()
259
260
261def intern_f(f, kind='blob'):
262 """Interns a file object into the git object store.
263
264 Args:
265 f (file-like object) - The file-like object to intern
266 kind (git object type) - One of 'blob', 'commit', 'tree', 'tag'.
267
268 Returns the git hash of the interned object (hex encoded).
269 """
270 ret = run('hash-object', '-t', kind, '-w', '--stdin', stdin=f)
271 f.close()
272 return ret
273
274
iannucci@chromium.org8bc9b5c2014-03-12 01:36:18 +0000275def tags(*args):
276 return run('tag', *args).splitlines()
277
278
iannucci@chromium.orgaa74cf62013-11-19 20:00:49 +0000279def tree(treeref, recurse=False):
280 """Returns a dict representation of a git tree object.
281
282 Args:
283 treeref (str) - a git ref which resolves to a tree (commits count as trees).
284 recurse (bool) - include all of the tree's decendants too. File names will
285 take the form of 'some/path/to/file'.
286
287 Return format:
288 { 'file_name': (mode, type, ref) }
289
290 mode is an integer where:
291 * 0040000 - Directory
292 * 0100644 - Regular non-executable file
293 * 0100664 - Regular non-executable group-writeable file
294 * 0100755 - Regular executable file
295 * 0120000 - Symbolic link
296 * 0160000 - Gitlink
297
298 type is a string where it's one of 'blob', 'commit', 'tree', 'tag'.
299
300 ref is the hex encoded hash of the entry.
301 """
302 ret = {}
303 opts = ['ls-tree', '--full-tree']
304 if recurse:
305 opts.append('-r')
306 opts.append(treeref)
307 try:
308 for line in run(*opts).splitlines():
309 mode, typ, ref, name = line.split(None, 3)
310 ret[name] = (mode, typ, ref)
311 except subprocess2.CalledProcessError:
312 return None
313 return ret
314
315
iannucci@chromium.org8bc9b5c2014-03-12 01:36:18 +0000316def upstream(branch):
317 try:
318 return run('rev-parse', '--abbrev-ref', '--symbolic-full-name',
319 branch+'@{upstream}')
320 except subprocess2.CalledProcessError:
321 return None
322
323
iannucci@chromium.orgaa74cf62013-11-19 20:00:49 +0000324def mktree(treedict):
325 """Makes a git tree object and returns its hash.
326
327 See |tree()| for the values of mode, type, and ref.
328
329 Args:
330 treedict - { name: (mode, type, ref) }
331 """
332 with tempfile.TemporaryFile() as f:
333 for name, (mode, typ, ref) in treedict.iteritems():
334 f.write('%s %s %s\t%s\0' % (mode, typ, ref, name))
335 f.seek(0)
336 return run('mktree', '-z', stdin=f)