blob: b8a05d68f17ef29f1ab2a5ca04afc51be05e11cb [file] [log] [blame]
Kuang-che Wu6e4beca2018-06-27 17:45:02 +08001# -*- coding: utf-8 -*-
Kuang-che Wu3eb6b502018-06-06 16:15:18 +08002# Copyright 2018 The Chromium OS Authors. All rights reserved.
3# Use of this source code is governed by a BSD-style license that can be
4# found in the LICENSE file.
"""Model of source code organization and changes.

This module models complex source code organization, i.e. nested git repos,
and their version relationships, i.e. pinned or floating git repos. In other
words, it is an abstraction of chrome's gclient DEPS, and of chromeos and
Android's repo manifest.
"""
12
13from __future__ import print_function
Kuang-che Wu13acc7b2020-06-15 10:45:35 +080014import collections
Kuang-che Wu3eb6b502018-06-06 16:15:18 +080015import copy
16import json
17import logging
18import os
19import re
20import shutil
21
22from bisect_kit import cli
Kuang-che Wue121fae2018-11-09 16:18:39 +080023from bisect_kit import errors
Kuang-che Wu3eb6b502018-06-06 16:15:18 +080024from bisect_kit import git_util
25
logger = logging.getLogger(__name__)

# Pattern of an intra-rev string, "<start>~<end>/<index>", i.e. the format
# produced by make_intra_rev(). Neither version part may contain a comma.
_re_intra_rev = r'^([^,]+)~([^,]+)/(\d+)$'

# Values for Spec.spec_type: pinned code versions vs. versions that may change
# over time.
SPEC_FIXED = 'fixed'
SPEC_FLOAT = 'float'
# NOTE(review): not referenced in the visible part of this module; presumably
# the name of an on-disk cache directory -- confirm against its users.
_DIFF_CACHE_DIR = 'bisectkit-cache'
33
34
def make_intra_rev(a, b, index):
  """Builds the "intra-rev" name of a change between two named versions.

  Many small changes (commits) lie between two major "named" versions a and
  b. bisect-kit enumerates those intermediate states and bisects them; the
  name given to each state is called an "intra-rev", i.e. a minor version
  number within two major versions.

  The end version b is part of the name because a+index alone is ambiguous
  when branches exist. Taking chromeos as example, both 9900.1.0 and 9901.0.0
  derive from 9900.0.0, so "9900.0.0 plus 100 changes" could refer to a state
  on the way to either of them.

  Args:
    a: the start version
    b: the end version
    index: the index number of the change between a and b

  Returns:
    the intra-rev version string, formatted as "<a>~<b>/<index>"
  """
  endpoints = '%s~%s' % (a, b)
  return endpoints + '/%d' % (index,)
57
58
def parse_intra_rev(rev):
  """Splits a version string into its intra-rev components.

  See make_intra_rev for the definition of intra-rev.

  Args:
    rev: intra-rev string or normal version number

  Returns:
    (start, end, index). A string that is not in intra-rev form is treated as
    a normal version number and yields (rev, rev, 0).
  """
  matched = re.match(_re_intra_rev, rev)
  if matched:
    start, end, index = matched.groups()
    return start, end, int(index)

  # A plain version denotes itself, with no offset.
  return rev, rev, 0
76
Kuang-che Wu3eb6b502018-06-06 16:15:18 +080077
def argtype_intra_rev(argtype):
  """Wraps a version validator so that it also accepts intra-rev strings.

  Args:
    argtype: argtype function which validates major version number

  Returns:
    A new argtype function. It returns argtype(s) when s is a valid major
    version, returns s itself when s is an intra-rev whose two versions both
    pass argtype, and raises cli.ArgTypeError (with example values) otherwise.
  """

  def argtype_function(s):
    # First choice: the value is a plain major version.
    try:
      return argtype(s)
    except cli.ArgTypeError as e:
      examples = list(e.example)

    matched = re.match(_re_intra_rev, s)
    if not matched:
      examples.append(make_intra_rev('<rev1>', '<rev2>', 10))
      raise cli.ArgTypeError('Invalid rev', examples)

    # It looks like an intra-rev; both endpoints must be valid versions.
    try:
      argtype(matched.group(1))
      argtype(matched.group(2))
    except cli.ArgTypeError as e:
      examples.extend(
          make_intra_rev(example, example, 10) for example in e.example)
      raise cli.ArgTypeError('Invalid intra rev', examples)
    return s

  return argtype_function
110
111
112def _normalize_repo_url(repo_url):
113 repo_url = re.sub(r'https://chrome-internal.googlesource.com/a/',
114 r'https://chrome-internal.googlesource.com/', repo_url)
115 repo_url = re.sub(r'\.git$', '', repo_url)
116 return repo_url
117
118
class PathSpec:
  """Specified code version of one path.

  Two PathSpec objects are equal when their path and version are identical
  and their repo URLs are the same after normalization. Comparison with any
  other kind of object is simply "not equal".

  Attributes:
    path: local path, relative to project base dir
    repo_url: code repository location
    at: code version, could be git hash or branch name
  """

  def __init__(self, path, repo_url, at):
    self.path = path
    self.repo_url = repo_url
    self.at = at

  def is_static(self):
    """Returns whether `at` is a git revision, as judged by git_util."""
    return git_util.is_git_rev(self.at)

  def __eq__(self, rhs):
    # Let Python fall back to its default handling for foreign types instead
    # of failing with AttributeError on the attribute lookups below.
    if not isinstance(rhs, PathSpec):
      return NotImplemented
    if self.path != rhs.path or self.at != rhs.at:
      return False
    # The same repo may be spelled with slightly different URLs.
    return (_normalize_repo_url(self.repo_url) == _normalize_repo_url(
        rhs.repo_url))

  def __ne__(self, rhs):
    return not self == rhs
147
148
class Spec:
  """A set of PathSpec objects keyed by path.

  Spec plays the role of gclient's DEPS and repo's manifest.

  Attributes:
    spec_type: type of spec, SPEC_FIXED or SPEC_FLOAT. SPEC_FIXED means code
        version is pinned and fixed. On the other hand, SPEC_FLOAT is not
        pinned and the actual version (git commit) may change over time.
    name: name of this spec, for debugging purpose. usually version number
        or git hash
    timestamp: timestamp of this spec
    path: path of spec
    entries: paths to PathSpec dict
    revision: a commit id of manifest-internal indicates the manifest
        revision, this argument is not used in DEPS.
  """

  def __init__(self,
               spec_type,
               name,
               timestamp,
               path,
               entries=None,
               revision=None):
    self.spec_type = spec_type
    self.name = name
    self.timestamp = timestamp
    self.path = path
    self.entries = entries
    self.revision = revision

  def copy(self):
    """Returns a deep copy of this spec."""
    return copy.deepcopy(self)

  def similar_score(self, rhs):
    """Measures how different this spec is from another one.

    Returns:
      score of similarity. Smaller value is more similar.
    """
    mine = set(self.entries)
    theirs = set(rhs.entries)

    score = 0
    for path in mine & theirs:
      ours, other = self[path], rhs[path]
      if other == ours:
        continue
      # Same version but otherwise different: it's often that the remote repo
      # moved around but should be treated as the same one, so this costs
      # much less than a version mismatch.
      score += 0.1 if other.at == ours.at else 1

    # Every path present on only one side counts as one full difference.
    score += len(mine ^ theirs)
    return score

  def is_static(self):
    """Returns True if every entry is static."""
    for path_spec in self.entries.values():
      if not path_spec.is_static():
        return False
    return True

  def is_subset(self, rhs):
    """Returns True if all paths of this spec are also paths of `rhs`."""
    return set(self.entries.keys()).issubset(set(rhs.entries.keys()))

  def __getitem__(self, path):
    return self.entries[path]

  def __contains__(self, path):
    return path in self.entries

  def apply(self, action_group):
    """Updates this spec in place according to the given ActionGroup."""
    self.timestamp = action_group.timestamp
    self.name = '(%s)' % self.timestamp
    for action in action_group.actions:
      if isinstance(action, GitAddRepo):
        self.entries[action.path] = PathSpec(action.path, action.repo_url,
                                             action.rev)
        continue
      if isinstance(action, GitCheckoutCommit):
        self.entries[action.path].at = action.rev
        continue
      if isinstance(action, GitRemoveRepo):
        del self.entries[action.path]
        continue
      assert 0, 'unknown action: %s' % action.__class__.__name__

  def dump(self):
    """Prints the content of this spec; for debugging."""
    print(self.name, self.path, self.timestamp)
    print('size', len(self.entries))
    for path in sorted(self.entries):
      print(path, self.entries[path].at)

  def diff(self, rhs):
    """Logs the differences between this spec and `rhs`."""
    logger.info('diff between %s and %s', self.name, rhs.name)
    expect = set(self.entries)
    actual = set(rhs.entries)

    for path in sorted(expect - actual):
      logger.info('-%s', path)
    for path in sorted(actual - expect):
      logger.info('+%s', path)

    common_count = 0
    for path in sorted(expect & actual):
      ours, other = self[path], rhs[path]
      if ours == other:
        common_count += 1
        continue
      if ours.at != other.at:
        logger.info(' %s: at %s vs %s', path, ours.at, other.at)
      if ours.repo_url != other.repo_url:
        logger.info(' %s: repo_url %s vs %s', path, ours.repo_url,
                    other.repo_url)
    logger.info('and common=%s', common_count)
Kuang-che Wu3eb6b502018-06-06 16:15:18 +0800255
256
class Action:
  """Actions describe changes from one Spec to another.

  Two actions are equal only if they are of the same concrete class and all
  their attributes are equal. Comparison with a non-Action object is simply
  "not equal".

  Attributes:
    timestamp: action time
    path: action path, which is relative to project root
  """

  def __init__(self, timestamp, path):
    self.timestamp = timestamp
    self.path = path

  def apply(self, _code_storage, _root_dir):
    """Performs this action on disk; must be implemented by subclasses."""
    raise NotImplementedError

  def summary(self):
    """Describes this action; must be implemented by subclasses."""
    raise NotImplementedError

  def __eq__(self, rhs):
    if not isinstance(rhs, Action):
      return NotImplemented
    # Different kinds of action may carry identical attributes (e.g. adding a
    # repo vs. checking out a commit), so the class must match as well.
    return type(self) is type(rhs) and self.__dict__ == rhs.__dict__

  def serialize(self):
    """Returns (class name, attribute dict); see unserialize_action()."""
    return self.__class__.__name__, self.__dict__
280
281
def unserialize_action(data):
  """Rebuilds an action object from the output of Action.serialize().

  Args:
    data: (class name, dict of constructor keyword arguments)

  Returns:
    an instance of the named action class
  """
  class_name, values = data
  known_classes = {
      cls.__name__: cls
      for cls in (GitCheckoutCommit, GitAddRepo, GitRemoveRepo)
  }
  assert class_name in known_classes, 'unknown action class: %s' % class_name
  return known_classes[class_name](**values)
Kuang-che Wu3eb6b502018-06-06 16:15:18 +0800292
293
class ActionGroup:
  """A list of Action objects that take effect together.

  This models atomic actions, ex:
    - repo added/removed in the same manifest commit
    - commits appears at the same time due to repo add
    - gerrit topic
    - circular CQ-DEPEND (Cq-Depend)
  Otherwise, one ActionGroup usually consists only one Action object.
  """

  def __init__(self, timestamp, comment=None):
    self.timestamp = timestamp
    self.name = None
    self.actions = []
    self.comment = comment

  def add(self, action):
    """Appends one action to this group."""
    self.actions.append(action)

  def serialize(self):
    """Returns a dict representation; the inverse of unserialize()."""
    return {
        'timestamp': self.timestamp,
        'name': self.name,
        'comment': self.comment,
        'actions': [action.serialize() for action in self.actions],
    }

  def summary(self):
    """Returns a dict of action summaries, plus the comment if there is one."""
    summaries = [action.summary() for action in self.actions]
    if self.comment:
      return {'comment': self.comment, 'actions': summaries}
    return {'actions': summaries}

  @staticmethod
  def unserialize(data):
    """Rebuilds an ActionGroup from the dict made by serialize()."""
    group = ActionGroup(data['timestamp'])
    group.name, group.comment = data['name'], data['comment']
    for serialized_action in data['actions']:
      group.add(unserialize_action(serialized_action))
    return group

  def apply(self, code_storage, root_dir):
    """Applies all actions of this group, in order."""
    for member in self.actions:
      member.apply(code_storage, root_dir)
Kuang-che Wu3eb6b502018-06-06 16:15:18 +0800340
341
class GitCheckoutCommit(Action):
  """Action of checking out one commit in an existing git repo.

  Attributes:
    repo_url: the corresponding url of git repo
    rev: git commit to checkout
  """

  def __init__(self, timestamp, path, repo_url, rev):
    super().__init__(timestamp, path)
    self.repo_url = repo_url
    self.rev = rev

  def apply(self, code_storage, root_dir):
    """Checks out `rev` in the git repo at `path` under root_dir."""
    # code_storage is not needed; the repo already exists on disk.
    del code_storage
    repo_dir = os.path.join(root_dir, self.path)
    assert git_util.is_git_root(repo_dir)
    git_util.checkout_version(repo_dir, self.rev)

  def summary(self):
    """Returns a dict describing this checkout."""
    return {
        'timestamp': self.timestamp,
        'action_type': 'commit',
        'path': self.path,
        'repo_url': self.repo_url,
        'rev': self.rev,
        'text': 'commit %s %s' % (self.rev[:10], self.path),
    }
Kuang-che Wu3eb6b502018-06-06 16:15:18 +0800371
372
class GitAddRepo(Action):
  """Action of adding (cloning) a git repo into the source tree.

  Attributes:
    repo_url: the corresponding url of git repo to add
    rev: git commit to checkout
  """

  def __init__(self, timestamp, path, repo_url, rev):
    super().__init__(timestamp, path)
    self.repo_url = repo_url
    self.rev = rev

  def apply(self, code_storage, root_dir):
    """Clones the repo to `path` under root_dir and checks out `rev`.

    The clone uses the cached git root from code_storage as reference, and
    the new repo is registered to code_storage's project list afterwards.
    """
    repo_dir = os.path.join(root_dir, self.path)
    if os.path.exists(repo_dir):
      is_empty_dir = os.path.isdir(repo_dir) and not os.listdir(repo_dir)
      if not is_empty_dir:
        assert not os.path.exists(repo_dir), '%s already exists' % repo_dir
      else:
        # mimic gclient's behavior; don't panic
        logger.warning(
            'adding repo %s; there is already an empty directory; '
            'assume it is okay', repo_dir)

    mirror = code_storage.cached_git_root(self.repo_url)
    git_util.clone(repo_dir, self.repo_url, reference=mirror)
    git_util.checkout_version(repo_dir, self.rev)

    code_storage.add_to_project_list(root_dir, self.path, self.repo_url)

  def summary(self):
    """Returns a dict describing this repo addition."""
    return {
        'timestamp': self.timestamp,
        'action_type': 'add_repo',
        'path': self.path,
        'repo_url': self.repo_url,
        'rev': self.rev,
        'text': 'add repo %s from %s@%s' % (self.path, self.repo_url,
                                            self.rev[:10]),
    }
Kuang-che Wu3eb6b502018-06-06 16:15:18 +0800413
414
class GitRemoveRepo(Action):
  """Action of deleting a git repo from the source tree."""

  def apply(self, code_storage, root_dir):
    """Deletes the repo at `path` and parent directories left empty.

    The repo is also removed from code_storage's project list.
    """
    assert self.path
    root_dir = os.path.normpath(root_dir)
    repo_dir = os.path.join(root_dir, self.path)
    assert git_util.is_git_root(repo_dir), '%r should be a git repo' % repo_dir
    # TODO(kcwu): other projects may be sub-tree of `git_repo`.
    #             They should not be deleted. (crbug/930047)
    shutil.rmtree(repo_dir)

    # Walk upwards and delete directories which became empty, but never
    # `root_dir` itself nor anything outside of it.
    parent = os.path.dirname(repo_dir)
    while True:
      if parent == root_dir:
        break
      if os.path.commonpath([parent, root_dir]) != root_dir:
        break
      if os.listdir(parent):
        break
      os.rmdir(parent)
      parent = os.path.dirname(parent)

    code_storage.remove_from_project_list(root_dir, self.path)

  def summary(self):
    """Returns a dict describing this repo removal."""
    return {
        'timestamp': self.timestamp,
        'action_type': 'remove_repo',
        'path': self.path,
        'text': 'remove repo %s' % self.path,
    }
Kuang-che Wu3eb6b502018-06-06 16:15:18 +0800445
446
def apply_actions(code_storage, action_groups, root_dir):
  """Applies action groups, in order, onto the source tree at root_dir.

  Speed optimization: only apply the last one of consecutive commits per
  repo. It is possible to optimize further, but need to take care git repo
  add/remove within another repo.

  Args:
    code_storage: CodeStorage object, passed through to the actions
    action_groups: ActionGroup objects to apply
    root_dir: root path of project source tree
  """
  # path -> (group index, index within group, action): the latest deferred
  # checkout of each repo.
  pending = {}

  def flush_pending():
    ordered = sorted(pending.values(), key=lambda entry: entry[:2])
    for group_index, _, commit_action in ordered:
      logger.debug('[%d] applying "%r"', group_index, commit_action.summary())
      commit_action.apply(code_storage, root_dir)
    pending.clear()

  for i, action_group in enumerate(action_groups, 1):
    only_commits = all(
        isinstance(action, GitCheckoutCommit)
        for action in action_group.actions)
    if only_commits:
      # If all actions are commits, defer them for batch processing.
      for j, action in enumerate(action_group.actions):
        pending[action.path] = (i, j, action)
      continue

    # Anything else must see the tree with the deferred checkouts applied.
    flush_pending()
    logger.debug('[%d] applying "%r"', i, action_group.summary())
    action_group.apply(code_storage, root_dir)

  flush_pending()
474
475
class SpecManager:
  """Abstract interface of Spec related operations.

  Implementations enumerate Spec instances and switch the disk state to a
  given Spec.

  In other words, this class abstracts:
    - discovery of gclient's DEPS and repo's manifest
    - gclient sync and repo sync

  Every method here raises NotImplementedError and is meant to be overridden.
  """

  def collect_float_spec(self, old, new, fixed_specs=None):
    """Returns the float Specs between two versions.

    Implementations may access the network to fetch specs, but should leave
    the version state of the tree untouched.

    Args:
      old: old version
      new: new version
      fixed_specs: fixed specs from collect_fixed_spec(old, new) for Chrome OS
          or None for others
    """
    raise NotImplementedError

  def collect_fixed_spec(self, old, new):
    """Returns the fixed Specs between two versions.

    Implementations may access the network to fetch specs, but should leave
    the version state of the tree untouched.
    """
    raise NotImplementedError

  def parse_spec(self, spec):
    """Fills in the details of a Spec object.

    Args:
      spec: Spec object. It tells what to parse, and the parsed information
          is stored inside it.
    """
    raise NotImplementedError

  def sync_disk_state(self, rev):
    """Switches the source tree on disk to the given version."""
    raise NotImplementedError
520
521
class CodeStorage:
  """Answers questions about code history without touching the checkout.

  Because paths inside source tree may be deleted or map to different remote
  repo in different versions, we cannot query git information of one version
  but the tree state is at another version. In order to query information
  without changing tree state and fast, we need out of tree source code
  storage.

  This class assumes all git repos are mirrored somewhere on local disk.
  The query methods only need cached_git_root(), implemented by subclasses,
  to return that location.

  In other words, this class abstracts operations upon gclient's cache-dir
  and repo's mirror.
  """

  def cached_git_root(self, repo_url):
    """Returns where the given remote git repo is cached locally.

    Args:
      repo_url: URL of git remote repo

    Returns:
      path of cache folder
    """
    raise NotImplementedError

  def add_to_project_list(self, project_root, path, repo_url):
    """Registers a repo at `path`; must be implemented by subclasses."""
    raise NotImplementedError

  def remove_from_project_list(self, project_root, path):
    """Unregisters the repo at `path`; must be implemented by subclasses."""
    raise NotImplementedError

  def is_ancestor_commit(self, spec, path, old, new):
    """Tells whether one commit is an ancestor of another.

    Args:
      spec: Spec object
      path: local path relative to project root
      old: commit id
      new: commit id

    Returns:
      True if `old` is ancestor of `new`
    """
    mirror = self.cached_git_root(spec[path].repo_url)
    return git_util.is_ancestor_commit(mirror, old, new)

  def get_rev_by_time(self, spec, path, timestamp):
    """Looks up the commit hash of a path of the given spec by time.

    Args:
      spec: Spec object
      path: local path relative to project root
      timestamp: timestamp

    Returns:
      The commit hash of given time. If there are commits with the given
      timestamp, returns the last commit.
    """
    entry = spec[path]
    mirror = self.cached_git_root(entry.repo_url)
    # entry.at is remote reference name. Since the cached git root is a mirror
    # (not a local checkout), there is no need to convert the name.
    return git_util.get_rev_by_time(mirror, timestamp, entry.at)

  def get_actions_between_two_commit(self,
                                     spec,
                                     path,
                                     old,
                                     new,
                                     ignore_not_ancestor=False):
    """Lists the checkout actions leading from commit `old` to `new`.

    Args:
      spec: Spec object
      path: local path relative to project root
      old: commit id
      new: commit id
      ignore_not_ancestor: if True and `old` is not an ancestor of `new`,
          return a single checkout of `new` instead of enumerating commits

    Returns:
      list of GitCheckoutCommit objects
    """
    repo_url = spec[path].repo_url
    mirror = self.cached_git_root(repo_url)

    # not in the same branch, regard as an atomic operation
    # this situation happens when
    # 1. new is branched from old and
    # 2. commit timestamp is not reliable(i.e. commit time != merged time)
    # old and new might not have ancestor relation
    unrelated = (
        ignore_not_ancestor and old != new and
        not git_util.is_ancestor_commit(mirror, old, new))
    if unrelated:
      commit_time = git_util.get_commit_time(mirror, new)
      return [GitCheckoutCommit(commit_time, path, repo_url, new)]

    return [
        GitCheckoutCommit(commit_time, path, repo_url, git_rev)
        for commit_time, git_rev in git_util.list_commits_between_commits(
            mirror, old, new)
    ]

  def is_containing_commit(self, spec, path, rev):
    """Tells whether the cached repo of `path` contains commit `rev`."""
    mirror = self.cached_git_root(spec[path].repo_url)
    return git_util.is_containing_commit(mirror, rev)

  def are_spec_commits_available(self, spec):
    """Tells whether the commits of all static entries of `spec` are cached."""
    return all(
        self.is_containing_commit(spec, path, path_spec.at)
        for path, path_spec in spec.entries.items()
        if path_spec.is_static())
625
626
Kuang-che Wu23192ad2020-03-11 18:12:46 +0800627class CodeManager:
Kuang-che Wu3eb6b502018-06-06 16:15:18 +0800628 """Class to reconstruct historical source tree state.
629
630 This class can reconstruct all moments of source tree state and diffs between
631 them.
632
633 Attributes:
634 root_dir: root path of project source tree
635 spec_manager: SpecManager object
636 code_storage: CodeStorage object
637 """
638
639 def __init__(self, root_dir, spec_manager, code_storage):
640 self.root_dir = root_dir
641 self.spec_manager = spec_manager
642 self.code_storage = code_storage
643
  def generate_action_groups_between_specs(self, prev_float, next_float):
    """Generates actions between two float specs.

    Commits found between the two specs' timestamps each become an
    ActionGroup of their own. Everything that happens at
    next_float.timestamp (repo add/remove, checkouts to match next_float, and
    commits carrying exactly that timestamp) is collected into one final
    group.

    Args:
      prev_float: start of spec object (exclusive)
      next_float: end of spec object (inclusive)

    Returns:
      list of ActionGroup object (ordered). The per-commit groups are sorted
      by timestamp; the group for next_float.timestamp, if it has any action,
      is the last element.
    """
    groups = []
    # Group of all actions which take effect at next_float.timestamp.
    last_group = ActionGroup(next_float.timestamp)
    # Paths for which a GitRemoveRepo has already been emitted.
    is_removed = set()

    # `branch_between_float_specs` is currently a chromeos-only logic,
    # and branch behavior is not verified for android and chrome now.
    is_chromeos_branched = False
    if hasattr(self.spec_manager, 'branch_between_float_specs'
              ) and self.spec_manager.branch_between_float_specs(
                  prev_float, next_float):
      is_chromeos_branched = True

    # Sort alphabetically, so parent directories are handled before children
    # directories.
    for path in sorted(set(prev_float.entries) | set(next_float.entries)):
      # Add repo
      if path not in prev_float:
        if next_float[path].is_static():
          next_at = next_float[path].at
        else:
          next_at = self.code_storage.get_rev_by_time(next_float, path,
                                                      next_float.timestamp)
        last_group.add(
            GitAddRepo(next_float.timestamp, path, next_float[path].repo_url,
                       next_at))
        continue

      # Existing path is floating.
      if not prev_float[path].is_static():
        # Enumerates commits until next spec. Get `prev_at` and `till_at`
        # by prev_float and next_float's timestamp.
        #
        # 1. Non-branched case:
        #
        #                     prev_at                 till_at
        # prev branch ---> o --------> o --------> o --------> o --------> ...
        #                        ^                        ^
        #             prev_float.timestamp     next_float.timestamp
        #
        # building an image between prev_at and till_at should follow
        # prev_float's spec.
        #
        # 2. Branched case:
        #
        #                       till_at
        #             /------->o---------->
        #            /         ^ next_float.timestamp
        #           /  prev_at
        # ---------->o---------------------->
        #            ^prev_float.timestamp
        #
        # building an image between prev_at and till_at should follow
        # next_float's spec.
        #
        prev_at = self.code_storage.get_rev_by_time(prev_float, path,
                                                    prev_float.timestamp)
        if is_chromeos_branched:
          till_at = self.code_storage.get_rev_by_time(next_float, path,
                                                      next_float.timestamp)
        else:
          till_at = self.code_storage.get_rev_by_time(prev_float, path,
                                                      next_float.timestamp)
        actions = self.code_storage.get_actions_between_two_commit(
            prev_float, path, prev_at, till_at, ignore_not_ancestor=True)

        # Assume commits with the same timestamp as manifest/DEPS change are
        # atomic.
        if actions and actions[-1].timestamp == next_float.timestamp:
          last_group.add(actions.pop())

        # Every remaining commit forms a group of its own.
        for action in actions:
          group = ActionGroup(action.timestamp)
          group.add(action)
          groups.append(group)
      else:
        # Pinned path: there is nothing to enumerate before
        # next_float.timestamp.
        prev_at = till_at = prev_float[path].at

      # At next_float.timestamp.
      if path not in next_float:
        if path in is_removed:
          # Already removed as a sub repo of a path handled earlier.
          continue
        # remove repo
        next_at = None
        sub_repos = [p for p in prev_float.entries if p.startswith(path + '/')]
        # Remove deeper repo first
        for path2 in sorted(sub_repos, reverse=True):
          last_group.add(GitRemoveRepo(next_float.timestamp, path2))
          is_removed.add(path2)
        last_group.add(GitRemoveRepo(next_float.timestamp, path))
        is_removed.add(path)
        # Sub repos which still exist in next_float were removed above
        # together with their parent, so add them back (at the version given
        # by prev_float).
        for path2 in sorted(set(sub_repos) & set(next_float.entries)):
          last_group.add(
              GitAddRepo(next_float.timestamp, path2,
                         next_float[path2].repo_url, prev_float[path2].at))

      elif next_float[path].is_static():
        # pinned to certain commit on different branch
        next_at = next_float[path].at

      elif next_float[path].at == prev_float[path].at:
        # keep floating on the same branch
        next_at = till_at

      else:
        # switch to another branch
        #                     prev_at                 till_at
        # prev branch ---> o --------> o --------> o --------> o --------> ...
        #
        #                                        next_at
        # next branch ...... o ------> o --------> o -----> ...
        #                        ^                        ^
        #             prev_float.timestamp     next_float.timestamp
        next_at = self.code_storage.get_rev_by_time(next_float, path,
                                                    next_float.timestamp)

      # A checkout is needed only if the version at next_float.timestamp
      # differs from where the enumerated commits ended.
      if next_at and next_at != till_at:
        last_group.add(
            GitCheckoutCommit(next_float.timestamp, path,
                              next_float[path].repo_url, next_at))

    groups.sort(key=lambda x: x.timestamp)
    if last_group.actions:
      groups.append(last_group)
    return groups
Kuang-che Wu3eb6b502018-06-06 16:15:18 +0800778
779 def synthesize_fixed_spec(self, float_spec, timestamp):
780 """Synthesizes fixed spec from float spec of given time.
781
782 Args:
783 float_spec: the float spec
784 timestamp: snapshot time
785
786 Returns:
787 Spec object
788 """
789 result = {}
790 for path, path_spec in float_spec.entries.items():
791 if not path_spec.is_static():
792 at = self.code_storage.get_rev_by_time(float_spec, path, timestamp)
793 path_spec = PathSpec(path_spec.path, path_spec.repo_url, at)
794
795 result[path] = copy.deepcopy(path_spec)
796
797 name = '%s@%s' % (float_spec.path, timestamp)
798 return Spec(SPEC_FIXED, name, timestamp, float_spec.path, result)
799
Kuang-che Wu3eb6b502018-06-06 16:15:18 +0800800 def match_spec(self, target, specs, start_index=0):
801 threshold = 3600
802 # ideal_index is the index of last spec before target
803 # begin and end are the range of indexes within threshold (inclusive)
804 ideal_index = None
805 begin, end = None, None
806 for i, spec in enumerate(specs[start_index:], start_index):
807 if spec.timestamp <= target.timestamp:
808 ideal_index = i
809 if abs(spec.timestamp - target.timestamp) < threshold:
810 if begin is None:
811 begin = i
812 end = i
813
814 candidates = []
815 if ideal_index is not None:
816 candidates.append(ideal_index)
817 if begin is not None:
Kuang-che Wuae6824b2019-08-27 22:20:01 +0800818 candidates.extend(list(range(begin, end + 1)))
Kuang-che Wu3eb6b502018-06-06 16:15:18 +0800819 if not candidates:
820 logger.error('unable to match %s: all specs are after it', target.name)
821 return None
822
823 compatible_candidates = [
824 i for i in candidates if specs[i].is_subset(target)
825 ]
826 if not compatible_candidates:
827 logger.error('unable to match %s: no compatible specs', target.name)
828 spec = specs[candidates[0]]
829 target.diff(spec)
830 return None
831
832 scores = []
833 for i in compatible_candidates:
Kuang-che Wu8a28a9d2018-09-11 17:43:36 +0800834 # Tie-break: prefer earlier timestamp and smaller difference.
835 if specs[i].timestamp <= target.timestamp:
836 timediff = 0, target.timestamp - specs[i].timestamp
837 else:
838 timediff = 1, specs[i].timestamp - target.timestamp
839 scores.append((specs[i].similar_score(target), timediff, i))
Kuang-che Wu3eb6b502018-06-06 16:15:18 +0800840 scores.sort()
841
Kuang-che Wu8a28a9d2018-09-11 17:43:36 +0800842 score, _, index = scores[0]
Kuang-che Wu3eb6b502018-06-06 16:15:18 +0800843 if score != 0:
844 logger.warning('not exactly match (score=%s): %s', score, target.name)
845 target.diff(specs[index])
846
847 if index < ideal_index:
848 logger.warning(
849 '%s (%s) matched earlier spec at %s instead of %s, racing? offset %d',
850 target.name, target.timestamp, specs[index].timestamp,
851 specs[ideal_index].timestamp,
Kuang-che Wue4bae0b2018-07-19 12:10:14 +0800852 specs[index].timestamp - target.timestamp)
Kuang-che Wu3eb6b502018-06-06 16:15:18 +0800853 if index > ideal_index:
854 logger.warning(
855 'spec committed at %d matched later commit at %d. bad server clock?',
856 target.timestamp, specs[index].timestamp)
857
858 return index
859
860 def associate_fixed_and_synthesized_specs(self, fixed_specs,
861 synthesized_specs):
862 # All fixed specs are snapshot of float specs. Theoretically, they
863 # should be identical to one of the synthesized specs.
864 # However, it's not always true for some reasons --- maybe due to race
865 # condition, maybe due to bugs of this bisect-kit.
866 # To overcome this glitch, we try to match them by similarity instead of
867 # exact match.
868 result = []
869 last_index = 0
870 for i, fixed_spec in enumerate(fixed_specs):
871 matched_index = self.match_spec(fixed_spec, synthesized_specs, last_index)
872 if matched_index is None:
873 if i in (0, len(fixed_specs) - 1):
874 logger.error('essential spec mismatch, unable to continue')
Kuang-che Wufe1e88a2019-09-10 21:52:25 +0800875 raise ValueError('Commit history analyze failed. '
876 'Bisector cannot deal with this version range.')
Kuang-che Wuc0baf752020-06-29 11:32:26 +0800877 logger.warning('%s do not match, skip', fixed_spec.name)
Kuang-che Wu3eb6b502018-06-06 16:15:18 +0800878 continue
879 result.append((i, matched_index))
880 last_index = matched_index
881
882 return result
883
884 def _create_make_up_actions(self, fixed_spec, synthesized):
885 timestamp = synthesized.timestamp
886 make_up = ActionGroup(
887 timestamp, comment='make up glitch for %s' % fixed_spec.name)
888 for path in set(fixed_spec.entries) & set(synthesized.entries):
889 if fixed_spec[path].at == synthesized[path].at:
890 continue
891 action = GitCheckoutCommit(timestamp, path, synthesized[path].repo_url,
892 synthesized[path].at)
893 make_up.add(action)
894
895 if not make_up.actions:
896 return None
897 return make_up
898
Kuang-che Wu13acc7b2020-06-15 10:45:35 +0800899 def _batch_fill_action_commit_log(self, details):
900 group_by_repo = collections.defaultdict(list)
901 for detail in details.values():
902 for action in detail.get('actions', []):
903 if action['action_type'] == 'commit':
904 group_by_repo[action['repo_url']].append(action)
905
906 for repo_url, actions in group_by_repo.items():
907 git_root = self.code_storage.cached_git_root(repo_url)
908 revs = set(a['rev'] for a in actions)
909 metas = git_util.get_batch_commit_metadata(git_root, revs)
910 for action in actions:
911 meta = metas[action['rev']]
912 if meta is None:
913 commit_summary = '(unknown)'
914 else:
915 commit_summary = meta['message'].splitlines()[0]
916 action['commit_summary'] = commit_summary
917
Kuang-che Wu3eb6b502018-06-06 16:15:18 +0800918 def build_revlist(self, old, new):
919 """Build revlist.
920
921 Returns:
Kuang-che Wu13acc7b2020-06-15 10:45:35 +0800922 (revlist, details):
923 revlist: list of rev string
924 details: dict of rev to rev detail
Kuang-che Wu3eb6b502018-06-06 16:15:18 +0800925 """
Kuang-che Wu13acc7b2020-06-15 10:45:35 +0800926 logger.info('build_revlist: old=%s, new=%s', old, new)
Kuang-che Wu3eb6b502018-06-06 16:15:18 +0800927 revlist = []
Kuang-che Wu13acc7b2020-06-15 10:45:35 +0800928 details = {}
Kuang-che Wu3eb6b502018-06-06 16:15:18 +0800929
Kuang-che Wu020a1182020-09-08 17:17:22 +0800930 # Enable cache for repetitive git operations. The space complexity is
Kuang-che Wufcbcc502020-06-01 11:48:20 +0800931 # O(number of candidates).
932 git_util.get_commit_metadata.enable_cache()
933 git_util.get_file_from_revision.enable_cache()
Kuang-che Wu98d98462020-06-19 17:07:22 +0800934 git_util.is_containing_commit.enable_cache()
Zheng-Jie Changad174a42020-06-20 15:28:10 +0800935 git_util.is_ancestor_commit.enable_cache()
Kuang-che Wufcbcc502020-06-01 11:48:20 +0800936
Kuang-che Wu3eb6b502018-06-06 16:15:18 +0800937 # step 1, find all float and fixed specs in the given range.
938 fixed_specs = self.spec_manager.collect_fixed_spec(old, new)
Kuang-che Wue4bae0b2018-07-19 12:10:14 +0800939 assert fixed_specs
Zheng-Jie Changd968f552020-01-16 13:31:57 +0800940 for spec in fixed_specs:
941 self.spec_manager.parse_spec(spec)
942
943 float_specs = self.spec_manager.collect_float_spec(old, new, fixed_specs)
Kuang-che Wue4bae0b2018-07-19 12:10:14 +0800944 assert float_specs
Kuang-che Wu3eb6b502018-06-06 16:15:18 +0800945 while float_specs[-1].timestamp > fixed_specs[-1].timestamp:
946 float_specs.pop()
947 assert float_specs
Zheng-Jie Changd968f552020-01-16 13:31:57 +0800948 for spec in float_specs:
Kuang-che Wu3eb6b502018-06-06 16:15:18 +0800949 self.spec_manager.parse_spec(spec)
950
Kuang-che Wued1bb622020-05-30 23:06:23 +0800951 git_util.fast_lookup.optimize(
952 (float_specs[0].timestamp, float_specs[-1].timestamp))
Kuang-che Wu3eb6b502018-06-06 16:15:18 +0800953 # step 2, synthesize all fixed specs in the range from float specs.
954 specs = float_specs + [fixed_specs[-1]]
Kuang-che Wuae6847c2020-01-13 16:06:08 +0800955 action_groups = []
Kuang-che Wu3eb6b502018-06-06 16:15:18 +0800956 logger.debug('len(specs)=%d', len(specs))
957 for i in range(len(specs) - 1):
958 prev_float = specs[i]
959 next_float = specs[i + 1]
960 logger.debug('[%d], between %s (%s) and %s (%s)', i, prev_float.name,
961 prev_float.timestamp, next_float.name, next_float.timestamp)
Kuang-che Wuae6847c2020-01-13 16:06:08 +0800962 action_groups += self.generate_action_groups_between_specs(
963 prev_float, next_float)
Kuang-che Wu3eb6b502018-06-06 16:15:18 +0800964
965 spec = self.synthesize_fixed_spec(float_specs[0], fixed_specs[0].timestamp)
966 synthesized = [spec.copy()]
967 for action_group in action_groups:
968 spec.apply(action_group)
969 synthesized.append(spec.copy())
970
971 # step 3, associate fixed specs with synthesized specs.
972 associated_pairs = self.associate_fixed_and_synthesized_specs(
973 fixed_specs, synthesized)
974
975 # step 4, group actions and cache them
976 for i, (fixed_index, synthesized_index) in enumerate(associated_pairs[:-1]):
977 next_fixed_index, next_synthesized_index = associated_pairs[i + 1]
978 revlist.append(fixed_specs[fixed_index].name)
979 this_action_groups = []
980
981 # handle glitch
982 if fixed_specs[fixed_index].similar_score(
983 synthesized[synthesized_index]) != 0:
984 assert synthesized[synthesized_index].is_subset(
985 fixed_specs[fixed_index])
986 skipped = set(fixed_specs[fixed_index].entries) - set(
987 synthesized[synthesized_index].entries)
988 if skipped:
989 logger.warning(
990 'between %s and %s, '
991 'bisect-kit cannot analyze commit history of following paths:',
992 fixed_specs[fixed_index].name, fixed_specs[next_fixed_index].name)
993 for path in sorted(skipped):
994 logger.warning(' %s', path)
995
996 make_up = self._create_make_up_actions(fixed_specs[fixed_index],
997 synthesized[synthesized_index])
998 if make_up:
999 this_action_groups.append(make_up)
1000
1001 this_action_groups.extend(
1002 action_groups[synthesized_index:next_synthesized_index])
1003 for idx, ag in enumerate(this_action_groups, 1):
1004 rev = make_intra_rev(fixed_specs[fixed_index].name,
1005 fixed_specs[next_fixed_index].name, idx)
1006 ag.name = rev
1007 revlist.append(rev)
Kuang-che Wu13acc7b2020-06-15 10:45:35 +08001008 details[rev] = ag.summary()
Kuang-che Wu3eb6b502018-06-06 16:15:18 +08001009
1010 self.save_action_groups_between_releases(
1011 fixed_specs[fixed_index].name, fixed_specs[next_fixed_index].name,
1012 this_action_groups)
1013 revlist.append(fixed_specs[associated_pairs[-1][0]].name)
1014
Kuang-che Wu13acc7b2020-06-15 10:45:35 +08001015 self._batch_fill_action_commit_log(details)
1016
Kuang-che Wu98d98462020-06-19 17:07:22 +08001017 # Verify all repos in between are cached.
1018 for spec in reversed(float_specs):
1019 if self.code_storage.are_spec_commits_available(spec):
1020 continue
1021 raise errors.InternalError('Some commits in %s (%s) are unavailable' %
1022 (spec.name, spec.path))
1023
Kuang-che Wued1bb622020-05-30 23:06:23 +08001024 # Disable cache because there might be write or even destructive git
1025 # operations when switch git versions. Be conservative now. We can cache
1026 # more if we observed more slow git operations later.
1027 git_util.fast_lookup.disable()
Kuang-che Wufcbcc502020-06-01 11:48:20 +08001028 git_util.get_commit_metadata.disable_cache()
1029 git_util.get_file_from_revision.disable_cache()
Kuang-che Wu98d98462020-06-19 17:07:22 +08001030 git_util.is_containing_commit.disable_cache()
Zheng-Jie Changad174a42020-06-20 15:28:10 +08001031 git_util.is_ancestor_commit.disable_cache()
Kuang-che Wu13acc7b2020-06-15 10:45:35 +08001032
1033 return revlist, details
Kuang-che Wu3eb6b502018-06-06 16:15:18 +08001034
1035 def save_action_groups_between_releases(self, old, new, action_groups):
1036 data = [ag.serialize() for ag in action_groups]
1037
1038 cache_dir = os.path.join(self.root_dir, _DIFF_CACHE_DIR)
1039 if not os.path.exists(cache_dir):
1040 os.makedirs(cache_dir)
1041 cache_filename = os.path.join(cache_dir, '%s,%s.json' % (old, new))
Kuang-che Wuae6824b2019-08-27 22:20:01 +08001042 with open(cache_filename, 'w') as fp:
Kuang-che Wu3eb6b502018-06-06 16:15:18 +08001043 json.dump(data, fp, indent=4, sort_keys=True)
1044
1045 def load_action_groups_between_releases(self, old, new):
1046 cache_dir = os.path.join(self.root_dir, _DIFF_CACHE_DIR)
1047 cache_filename = os.path.join(cache_dir, '%s,%s.json' % (old, new))
1048 if not os.path.exists(cache_filename):
Kuang-che Wud1b74152020-05-20 08:46:46 +08001049 raise errors.InternalError('cached revlist not found: %s' %
1050 cache_filename)
Kuang-che Wu3eb6b502018-06-06 16:15:18 +08001051
1052 result = []
Kuang-che Wu74bcb642020-02-20 18:45:53 +08001053 with open(cache_filename) as f:
1054 for data in json.load(f):
1055 result.append(ActionGroup.unserialize(data))
Kuang-che Wu3eb6b502018-06-06 16:15:18 +08001056
1057 return result
1058
Kuang-che Wu3eb6b502018-06-06 16:15:18 +08001059 def switch(self, rev):
Zheng-Jie Chang0fc704b2019-12-09 18:43:38 +08001060 rev_old, action_groups = self.get_intra_and_diff(rev)
1061 self.spec_manager.sync_disk_state(rev_old)
1062 apply_actions(self.code_storage, action_groups, self.root_dir)
1063
1064 def get_intra_and_diff(self, rev):
Kuang-che Wu3eb6b502018-06-06 16:15:18 +08001065 # easy case
1066 if not re.match(_re_intra_rev, rev):
Zheng-Jie Chang0fc704b2019-12-09 18:43:38 +08001067 return rev, []
Kuang-che Wu3eb6b502018-06-06 16:15:18 +08001068
1069 rev_old, rev_new, idx = parse_intra_rev(rev)
1070 action_groups = self.load_action_groups_between_releases(rev_old, rev_new)
1071 assert 0 <= idx <= len(action_groups)
1072 action_groups = action_groups[:idx]
Zheng-Jie Chang0fc704b2019-12-09 18:43:38 +08001073 return rev_old, action_groups