blob: 94b9881a4829bd4b2341056b171f7ba8916ada39 [file] [log] [blame]
Mike Frysinger9f7e4ee2013-03-13 15:43:03 -04001#!/usr/bin/python
Mike Frysinger0a647fc2012-08-06 14:36:05 -04002# Copyright (c) 2012 The Chromium OS Authors. All rights reserved.
David Jamesfcb70ef2011-02-02 16:02:30 -08003# Use of this source code is governed by a BSD-style license that can be
4# found in the LICENSE file.
5
6"""Program to run emerge in parallel, for significant speedup.
7
8Usage:
David James386ccd12011-05-04 20:17:42 -07009 ./parallel_emerge [--board=BOARD] [--workon=PKGS]
David Jamesfcb70ef2011-02-02 16:02:30 -080010 [--force-remote-binary=PKGS] [emerge args] package
11
David James78b6cd92012-04-02 21:36:12 -070012This script runs multiple emerge processes in parallel, using appropriate
13Portage APIs. It is faster than standard emerge because it has a
14multiprocess model instead of an asynchronous model.
David Jamesfcb70ef2011-02-02 16:02:30 -080015"""
16
17import codecs
18import copy
19import errno
Brian Harring8294d652012-05-23 02:20:52 -070020import gc
David James8c7e5e32011-06-28 11:26:03 -070021import heapq
David Jamesfcb70ef2011-02-02 16:02:30 -080022import multiprocessing
23import os
Mike Frysinger1ae28092013-10-17 17:17:22 -040024try:
25 import Queue
26except ImportError:
27 # Python-3 renamed to "queue". We still use Queue to avoid collisions
28 # with naming variables as "queue". Maybe we'll transition at some point.
29 # pylint: disable=F0401
30 import queue as Queue
David Jamesfcb70ef2011-02-02 16:02:30 -080031import signal
32import sys
33import tempfile
Brian Harring8294d652012-05-23 02:20:52 -070034import threading
David Jamesfcb70ef2011-02-02 16:02:30 -080035import time
36import traceback
David Jamesfcb70ef2011-02-02 16:02:30 -080037
Thiago Goncalesf4acc422013-07-17 10:26:35 -070038from chromite.lib import cros_build_lib
David James6d47d8c2014-04-24 09:40:05 -070039from chromite.lib import osutils
Thiago Goncalesf4acc422013-07-17 10:26:35 -070040
# If PORTAGE_USERNAME isn't specified, scrape it from the $HOME variable. On
# Chromium OS, the default "portage" user doesn't have the necessary
# permissions. It'd be easier if we could default to $USERNAME, but $USERNAME
# is "root" here because we get called through sudo.
#
# We need to set this before importing any portage modules, because portage
# looks up "PORTAGE_USERNAME" at import time.
#
# NOTE: .bashrc sets PORTAGE_USERNAME = $USERNAME, so most people won't
# encounter this case unless they have an old chroot or blow away the
# environment by running sudo without the -E specifier.
if "PORTAGE_USERNAME" not in os.environ:
  homedir = os.environ.get("HOME")
  if homedir:
    # normpath() drops a trailing slash, so HOME=/home/user/ still yields
    # "user" instead of the empty string that basename() alone would return.
    _username = os.path.basename(os.path.normpath(homedir))
    # If no name can be derived at all (e.g. HOME=/), leave the variable
    # unset rather than exporting an empty PORTAGE_USERNAME.
    if _username:
      os.environ["PORTAGE_USERNAME"] = _username
56
57# Portage doesn't expose dependency trees in its public API, so we have to
58# make use of some private APIs here. These modules are found under
59# /usr/lib/portage/pym/.
60#
61# TODO(davidjames): Update Portage to expose public APIs for these features.
Don Garrett25f309a2014-03-19 14:02:12 -070062# pylint: disable=F0401
David Jamesfcb70ef2011-02-02 16:02:30 -080063from _emerge.actions import adjust_configs
64from _emerge.actions import load_emerge_config
65from _emerge.create_depgraph_params import create_depgraph_params
David James386ccd12011-05-04 20:17:42 -070066from _emerge.depgraph import backtrack_depgraph
Mike Frysinger901eaad2012-10-10 18:18:03 -040067try:
68 from _emerge.main import clean_logs
69except ImportError:
70 # Older portage versions did not provide clean_logs, so stub it.
71 # We need this if running in an older chroot that hasn't yet upgraded
72 # the portage version.
73 clean_logs = lambda x: None
David Jamesfcb70ef2011-02-02 16:02:30 -080074from _emerge.main import emerge_main
75from _emerge.main import parse_opts
76from _emerge.Package import Package
77from _emerge.Scheduler import Scheduler
David Jamesfcb70ef2011-02-02 16:02:30 -080078from _emerge.stdout_spinner import stdout_spinner
David James386ccd12011-05-04 20:17:42 -070079from portage._global_updates import _global_updates
David Jamesfcb70ef2011-02-02 16:02:30 -080080import portage
81import portage.debug
David James9becf572014-04-25 14:39:05 +000082from portage.versions import vercmp
Don Garrettf8bf7842014-03-20 17:03:42 -070083# pylint: enable=F0401
Mike Frysinger91d7da92013-02-19 15:53:46 -050084
David Jamesfcb70ef2011-02-02 16:02:30 -080085
def Usage():
  """Print usage.

  Writes the command synopsis, followed by a short explanation of the
  --workon and --rebuild options, to stdout.
  """
  lines = (
      "Usage:",
      " ./parallel_emerge [--board=BOARD] [--workon=PKGS]",
      " [--rebuild] [emerge args] package",
      "",
      "Packages specified as workon packages are always built from source.",
      "",
      "The --workon argument is mainly useful when you want to build and",
      "install packages that you are working on unconditionally, but do not",
      "want to have to rev the package to indicate you want to build it from",
      "source. The build_packages script will automatically supply the",
      "workon argument to emerge, ensuring that packages selected using",
      "cros-workon are rebuilt.",
      "",
      "The --rebuild option rebuilds packages whenever their dependencies",
      "are changed. This ensures that your build is correct.",
  )
  for line in lines:
    # A parenthesized single argument prints the same text whether print is
    # the Python 2 statement or the Python 3 function.
    print(line)
David Jamesfcb70ef2011-02-02 16:02:30 -0800103
104
# Global start time: the time.time() timestamp taken when this module is
# loaded.
GLOBAL_START = time.time()

# Whether process has been killed by a signal. This is a
# multiprocessing.Event -- presumably so that the flag can also be observed
# by worker processes; confirm against the code that sets and reads it.
KILLED = multiprocessing.Event()
110
David Jamesfcb70ef2011-02-02 16:02:30 -0800111
class EmergeData(object):
  """This simple struct holds various emerge variables.

  This struct helps us easily pass emerge variables around as a unit.
  These variables are used for calculating dependencies and installing
  packages. Every field starts out as None.

  Attributes:
    action: The action the user requested. If the user is installing
      packages, this is None. If the user is doing anything other than
      installing packages, this will contain the action name, which will map
      exactly to the long-form name of the associated emerge option.
      Example: If you call parallel_emerge --unmerge package, the action
      name will be "unmerge".
    cmdline_packages: The list of packages the user passed on the
      command-line.
    depgraph: The emerge dependency graph. It'll contain all the packages
      involved in this merge, along with their versions.
    favorites: The list of candidates to add to the world file.
    mtimedb: A dictionary used by portage to maintain global state. This
      state is loaded from disk when portage starts up, and saved to disk
      whenever we call mtimedb.commit(). This database contains information
      about global updates (i.e., what version of portage we have) and what
      we're currently doing. Portage saves what it is currently doing in
      this database so that it can be resumed when you call it with the
      --resume option. parallel_emerge does not save what it is currently
      doing in the mtimedb, so we do not support the --resume option.
    opts: A dict of the options passed to emerge. This dict has been cleaned
      up a bit by parse_opts, so that it's a bit easier for the emerge code
      to look at the options. Emerge takes a few shortcuts in its cleanup
      process to make parsing of the options dict easier. For example, if
      you pass in "--usepkg=n", the "--usepkg" flag is just left out of the
      dictionary altogether. Because --usepkg=n is the default, this makes
      parsing easier, because emerge can just assume that if "--usepkg" is
      in the dictionary, it's enabled. These cleanup processes aren't
      applied to all options. For example, the --with-bdeps flag is passed
      in as-is. For a full list of the cleanups applied by emerge, see the
      parse_opts function in the _emerge.main package.
    root_config: The portage configuration for our current root. This
      contains the portage settings and the three portage trees for our
      current root (see |settings| and |trees|).
    scheduler_graph: The scheduler graph is used by emerge to calculate what
      packages to install. We don't actually install any deps, so this isn't
      really used, but we pass it in to the Scheduler object anyway.
    settings: Portage settings for our current session. Most of these
      settings are set in make.conf inside our current install root.
    spinner: The spinner, which spews stuff to stdout to indicate that
      portage is doing something. We maintain our own spinner, so we set the
      portage spinner to "silent" mode.
    trees: The portage trees. There are separate portage trees for each
      root. To get the portage tree for the current root, you can look in
      self.trees[root], where root = self.settings["ROOT"]. In each root,
      there are three trees:
        - vartree: A database of the currently-installed packages.
        - porttree: A database of ebuilds, that can be used to build
          packages.
        - bintree: A database of binary packages.
  """

  __slots__ = ["action", "cmdline_packages", "depgraph", "favorites",
               "mtimedb", "opts", "root_config", "scheduler_graph",
               "settings", "spinner", "trees"]

  def __init__(self):
    # Nothing is known yet, so blank out every declared field.
    for field in EmergeData.__slots__:
      setattr(self, field, None)
202
203
204class DepGraphGenerator(object):
205 """Grab dependency information about packages from portage.
206
207 Typical usage:
208 deps = DepGraphGenerator()
209 deps.Initialize(sys.argv[1:])
210 deps_tree, deps_info = deps.GenDependencyTree()
211 deps_graph = deps.GenDependencyGraph(deps_tree, deps_info)
212 deps.PrintTree(deps_tree)
213 PrintDepsMap(deps_graph)
214 """
215
Thiago Goncalesf4acc422013-07-17 10:26:35 -0700216 __slots__ = ["board", "emerge", "package_db", "show_output", "unpack_only"]
David Jamesfcb70ef2011-02-02 16:02:30 -0800217
218 def __init__(self):
219 self.board = None
220 self.emerge = EmergeData()
David Jamesfcb70ef2011-02-02 16:02:30 -0800221 self.package_db = {}
David Jamesfcb70ef2011-02-02 16:02:30 -0800222 self.show_output = False
Thiago Goncalesf4acc422013-07-17 10:26:35 -0700223 self.unpack_only = False
David Jamesfcb70ef2011-02-02 16:02:30 -0800224
225 def ParseParallelEmergeArgs(self, argv):
226 """Read the parallel emerge arguments from the command-line.
227
228 We need to be compatible with emerge arg format. We scrape arguments that
229 are specific to parallel_emerge, and pass through the rest directly to
230 emerge.
Mike Frysinger1a736a82013-12-12 01:50:59 -0500231
David Jamesfcb70ef2011-02-02 16:02:30 -0800232 Args:
233 argv: arguments list
Mike Frysinger1a736a82013-12-12 01:50:59 -0500234
David Jamesfcb70ef2011-02-02 16:02:30 -0800235 Returns:
236 Arguments that don't belong to parallel_emerge
237 """
238 emerge_args = []
239 for arg in argv:
240 # Specifically match arguments that are specific to parallel_emerge, and
241 # pass through the rest.
242 if arg.startswith("--board="):
243 self.board = arg.replace("--board=", "")
244 elif arg.startswith("--workon="):
245 workon_str = arg.replace("--workon=", "")
David James7a1ea4b2011-10-13 15:06:41 -0700246 emerge_args.append("--reinstall-atoms=%s" % workon_str)
247 emerge_args.append("--usepkg-exclude=%s" % workon_str)
David Jamesfcb70ef2011-02-02 16:02:30 -0800248 elif arg.startswith("--force-remote-binary="):
249 force_remote_binary = arg.replace("--force-remote-binary=", "")
David James7a1ea4b2011-10-13 15:06:41 -0700250 emerge_args.append("--useoldpkg-atoms=%s" % force_remote_binary)
David Jamesfcb70ef2011-02-02 16:02:30 -0800251 elif arg == "--show-output":
252 self.show_output = True
David James386ccd12011-05-04 20:17:42 -0700253 elif arg == "--rebuild":
David James7a1ea4b2011-10-13 15:06:41 -0700254 emerge_args.append("--rebuild-if-unbuilt")
Thiago Goncalesf4acc422013-07-17 10:26:35 -0700255 elif arg == "--unpackonly":
256 emerge_args.append("--fetchonly")
257 self.unpack_only = True
David Jamesfcb70ef2011-02-02 16:02:30 -0800258 else:
259 # Not one of our options, so pass through to emerge.
260 emerge_args.append(arg)
261
David James386ccd12011-05-04 20:17:42 -0700262 # These packages take a really long time to build, so, for expediency, we
263 # are blacklisting them from automatic rebuilds because one of their
264 # dependencies needs to be recompiled.
Mike Frysinger5c2a9052014-04-15 15:52:04 -0400265 for pkg in ("chromeos-base/chromeos-chrome",):
David James7a1ea4b2011-10-13 15:06:41 -0700266 emerge_args.append("--rebuild-exclude=%s" % pkg)
David Jamesfcb70ef2011-02-02 16:02:30 -0800267
268 return emerge_args
269
270 def Initialize(self, args):
271 """Initializer. Parses arguments and sets up portage state."""
272
273 # Parse and strip out args that are just intended for parallel_emerge.
274 emerge_args = self.ParseParallelEmergeArgs(args)
275
276 # Setup various environment variables based on our current board. These
277 # variables are normally setup inside emerge-${BOARD}, but since we don't
278 # call that script, we have to set it up here. These variables serve to
279 # point our tools at /build/BOARD and to setup cross compiles to the
280 # appropriate board as configured in toolchain.conf.
281 if self.board:
Yu-Ju Hongdd9bb2b2014-01-03 17:08:26 -0800282 sysroot = cros_build_lib.GetSysroot(board=self.board)
283 os.environ["PORTAGE_CONFIGROOT"] = sysroot
284 os.environ["PORTAGE_SYSROOT"] = sysroot
285 os.environ["SYSROOT"] = sysroot
David Jamesfcb70ef2011-02-02 16:02:30 -0800286
287 # Although CHROMEOS_ROOT isn't specific to boards, it's normally setup
288 # inside emerge-${BOARD}, so we set it up here for compatibility. It
289 # will be going away soon as we migrate to CROS_WORKON_SRCROOT.
290 os.environ.setdefault("CHROMEOS_ROOT", os.environ["HOME"] + "/trunk")
291
292 # Turn off interactive delays
293 os.environ["EBEEP_IGNORE"] = "1"
294 os.environ["EPAUSE_IGNORE"] = "1"
Mike Frysinger0a647fc2012-08-06 14:36:05 -0400295 os.environ["CLEAN_DELAY"] = "0"
David Jamesfcb70ef2011-02-02 16:02:30 -0800296
297 # Parse the emerge options.
David Jamesea3ca332011-05-26 11:48:29 -0700298 action, opts, cmdline_packages = parse_opts(emerge_args, silent=True)
David Jamesfcb70ef2011-02-02 16:02:30 -0800299
300 # Set environment variables based on options. Portage normally sets these
301 # environment variables in emerge_main, but we can't use that function,
302 # because it also does a bunch of other stuff that we don't want.
303 # TODO(davidjames): Patch portage to move this logic into a function we can
304 # reuse here.
305 if "--debug" in opts:
306 os.environ["PORTAGE_DEBUG"] = "1"
307 if "--config-root" in opts:
308 os.environ["PORTAGE_CONFIGROOT"] = opts["--config-root"]
309 if "--root" in opts:
310 os.environ["ROOT"] = opts["--root"]
311 if "--accept-properties" in opts:
312 os.environ["ACCEPT_PROPERTIES"] = opts["--accept-properties"]
313
David James88d780c2014-02-05 13:03:29 -0800314 # If we're installing packages to the board, we can disable vardb locks.
315 # This is safe because we only run up to one instance of parallel_emerge in
316 # parallel.
317 # TODO(davidjames): Enable this for the host too.
318 if self.board:
David Jamesfcb70ef2011-02-02 16:02:30 -0800319 os.environ.setdefault("PORTAGE_LOCKS", "false")
David Jamesfcb70ef2011-02-02 16:02:30 -0800320
321 # Now that we've setup the necessary environment variables, we can load the
322 # emerge config from disk.
323 settings, trees, mtimedb = load_emerge_config()
324
David Jamesea3ca332011-05-26 11:48:29 -0700325 # Add in EMERGE_DEFAULT_OPTS, if specified.
326 tmpcmdline = []
327 if "--ignore-default-opts" not in opts:
328 tmpcmdline.extend(settings["EMERGE_DEFAULT_OPTS"].split())
329 tmpcmdline.extend(emerge_args)
330 action, opts, cmdline_packages = parse_opts(tmpcmdline)
331
332 # If we're installing to the board, we want the --root-deps option so that
333 # portage will install the build dependencies to that location as well.
334 if self.board:
335 opts.setdefault("--root-deps", True)
336
David Jamesfcb70ef2011-02-02 16:02:30 -0800337 # Check whether our portage tree is out of date. Typically, this happens
338 # when you're setting up a new portage tree, such as in setup_board and
339 # make_chroot. In that case, portage applies a bunch of global updates
340 # here. Once the updates are finished, we need to commit any changes
341 # that the global update made to our mtimedb, and reload the config.
342 #
343 # Portage normally handles this logic in emerge_main, but again, we can't
344 # use that function here.
345 if _global_updates(trees, mtimedb["updates"]):
346 mtimedb.commit()
347 settings, trees, mtimedb = load_emerge_config(trees=trees)
348
349 # Setup implied options. Portage normally handles this logic in
350 # emerge_main.
351 if "--buildpkgonly" in opts or "buildpkg" in settings.features:
352 opts.setdefault("--buildpkg", True)
353 if "--getbinpkgonly" in opts:
354 opts.setdefault("--usepkgonly", True)
355 opts.setdefault("--getbinpkg", True)
356 if "getbinpkg" in settings.features:
357 # Per emerge_main, FEATURES=getbinpkg overrides --getbinpkg=n
358 opts["--getbinpkg"] = True
359 if "--getbinpkg" in opts or "--usepkgonly" in opts:
360 opts.setdefault("--usepkg", True)
361 if "--fetch-all-uri" in opts:
362 opts.setdefault("--fetchonly", True)
363 if "--skipfirst" in opts:
364 opts.setdefault("--resume", True)
365 if "--buildpkgonly" in opts:
366 # --buildpkgonly will not merge anything, so it overrides all binary
367 # package options.
368 for opt in ("--getbinpkg", "--getbinpkgonly",
369 "--usepkg", "--usepkgonly"):
370 opts.pop(opt, None)
371 if (settings.get("PORTAGE_DEBUG", "") == "1" and
372 "python-trace" in settings.features):
373 portage.debug.set_trace(True)
374
375 # Complain about unsupported options
David James386ccd12011-05-04 20:17:42 -0700376 for opt in ("--ask", "--ask-enter-invalid", "--resume", "--skipfirst"):
David Jamesfcb70ef2011-02-02 16:02:30 -0800377 if opt in opts:
378 print "%s is not supported by parallel_emerge" % opt
379 sys.exit(1)
380
381 # Make emerge specific adjustments to the config (e.g. colors!)
382 adjust_configs(opts, trees)
383
384 # Save our configuration so far in the emerge object
385 emerge = self.emerge
386 emerge.action, emerge.opts = action, opts
387 emerge.settings, emerge.trees, emerge.mtimedb = settings, trees, mtimedb
388 emerge.cmdline_packages = cmdline_packages
389 root = settings["ROOT"]
390 emerge.root_config = trees[root]["root_config"]
391
David James386ccd12011-05-04 20:17:42 -0700392 if "--usepkg" in opts:
David Jamesfcb70ef2011-02-02 16:02:30 -0800393 emerge.trees[root]["bintree"].populate("--getbinpkg" in opts)
394
David Jamesfcb70ef2011-02-02 16:02:30 -0800395 def CreateDepgraph(self, emerge, packages):
396 """Create an emerge depgraph object."""
397 # Setup emerge options.
398 emerge_opts = emerge.opts.copy()
399
David James386ccd12011-05-04 20:17:42 -0700400 # Ask portage to build a dependency graph. with the options we specified
401 # above.
David Jamesfcb70ef2011-02-02 16:02:30 -0800402 params = create_depgraph_params(emerge_opts, emerge.action)
David Jamesbf1e3442011-05-28 07:44:20 -0700403 success, depgraph, favorites = backtrack_depgraph(
David James386ccd12011-05-04 20:17:42 -0700404 emerge.settings, emerge.trees, emerge_opts, params, emerge.action,
405 packages, emerge.spinner)
406 emerge.depgraph = depgraph
David Jamesfcb70ef2011-02-02 16:02:30 -0800407
David James386ccd12011-05-04 20:17:42 -0700408 # Is it impossible to honor the user's request? Bail!
409 if not success:
410 depgraph.display_problems()
411 sys.exit(1)
David Jamesfcb70ef2011-02-02 16:02:30 -0800412
413 emerge.depgraph = depgraph
David Jamesbf1e3442011-05-28 07:44:20 -0700414 emerge.favorites = favorites
David Jamesfcb70ef2011-02-02 16:02:30 -0800415
David Jamesdeebd692011-05-09 17:02:52 -0700416 # Prime and flush emerge caches.
417 root = emerge.settings["ROOT"]
418 vardb = emerge.trees[root]["vartree"].dbapi
David James0bdc5de2011-05-12 16:22:26 -0700419 if "--pretend" not in emerge.opts:
420 vardb.counter_tick()
David Jamesdeebd692011-05-09 17:02:52 -0700421 vardb.flush_cache()
422
David James386ccd12011-05-04 20:17:42 -0700423 def GenDependencyTree(self):
David Jamesfcb70ef2011-02-02 16:02:30 -0800424 """Get dependency tree info from emerge.
425
David Jamesfcb70ef2011-02-02 16:02:30 -0800426 Returns:
427 Dependency tree
428 """
429 start = time.time()
430
431 emerge = self.emerge
432
433 # Create a list of packages to merge
434 packages = set(emerge.cmdline_packages[:])
David Jamesfcb70ef2011-02-02 16:02:30 -0800435
436 # Tell emerge to be quiet. We print plenty of info ourselves so we don't
437 # need any extra output from portage.
438 portage.util.noiselimit = -1
439
440 # My favorite feature: The silent spinner. It doesn't spin. Ever.
441 # I'd disable the colors by default too, but they look kind of cool.
442 emerge.spinner = stdout_spinner()
443 emerge.spinner.update = emerge.spinner.update_quiet
444
445 if "--quiet" not in emerge.opts:
446 print "Calculating deps..."
447
448 self.CreateDepgraph(emerge, packages)
449 depgraph = emerge.depgraph
450
451 # Build our own tree from the emerge digraph.
452 deps_tree = {}
Don Garrett25f309a2014-03-19 14:02:12 -0700453 # pylint: disable=W0212
David Jamesfcb70ef2011-02-02 16:02:30 -0800454 digraph = depgraph._dynamic_config.digraph
David James3f778802011-08-25 19:31:45 -0700455 root = emerge.settings["ROOT"]
456 final_db = depgraph._dynamic_config.mydbapi[root]
David Jamesfcb70ef2011-02-02 16:02:30 -0800457 for node, node_deps in digraph.nodes.items():
458 # Calculate dependency packages that need to be installed first. Each
459 # child on the digraph is a dependency. The "operation" field specifies
460 # what we're doing (e.g. merge, uninstall, etc.). The "priorities" array
461 # contains the type of dependency (e.g. build, runtime, runtime_post,
462 # etc.)
463 #
David Jamesfcb70ef2011-02-02 16:02:30 -0800464 # Portage refers to the identifiers for packages as a CPV. This acronym
465 # stands for Component/Path/Version.
466 #
467 # Here's an example CPV: chromeos-base/power_manager-0.0.1-r1
468 # Split up, this CPV would be:
469 # C -- Component: chromeos-base
470 # P -- Path: power_manager
471 # V -- Version: 0.0.1-r1
472 #
473 # We just refer to CPVs as packages here because it's easier.
474 deps = {}
475 for child, priorities in node_deps[0].items():
David James3f778802011-08-25 19:31:45 -0700476 if isinstance(child, Package) and child.root == root:
477 cpv = str(child.cpv)
478 action = str(child.operation)
479
480 # If we're uninstalling a package, check whether Portage is
481 # installing a replacement. If so, just depend on the installation
482 # of the new package, because the old package will automatically
483 # be uninstalled at that time.
484 if action == "uninstall":
485 for pkg in final_db.match_pkgs(child.slot_atom):
486 cpv = str(pkg.cpv)
487 action = "merge"
488 break
489
490 deps[cpv] = dict(action=action,
491 deptypes=[str(x) for x in priorities],
492 deps={})
David Jamesfcb70ef2011-02-02 16:02:30 -0800493
494 # We've built our list of deps, so we can add our package to the tree.
David James3f778802011-08-25 19:31:45 -0700495 if isinstance(node, Package) and node.root == root:
David Jamesfcb70ef2011-02-02 16:02:30 -0800496 deps_tree[str(node.cpv)] = dict(action=str(node.operation),
497 deps=deps)
498
David Jamesfcb70ef2011-02-02 16:02:30 -0800499 # Ask portage for its install plan, so that we can only throw out
David James386ccd12011-05-04 20:17:42 -0700500 # dependencies that portage throws out.
David Jamesfcb70ef2011-02-02 16:02:30 -0800501 deps_info = {}
502 for pkg in depgraph.altlist():
503 if isinstance(pkg, Package):
David James3f778802011-08-25 19:31:45 -0700504 assert pkg.root == root
David Jamesfcb70ef2011-02-02 16:02:30 -0800505 self.package_db[pkg.cpv] = pkg
506
David Jamesfcb70ef2011-02-02 16:02:30 -0800507 # Save off info about the package
David James386ccd12011-05-04 20:17:42 -0700508 deps_info[str(pkg.cpv)] = {"idx": len(deps_info)}
David Jamesfcb70ef2011-02-02 16:02:30 -0800509
510 seconds = time.time() - start
511 if "--quiet" not in emerge.opts:
512 print "Deps calculated in %dm%.1fs" % (seconds / 60, seconds % 60)
513
514 return deps_tree, deps_info
515
516 def PrintTree(self, deps, depth=""):
517 """Print the deps we have seen in the emerge output.
518
519 Args:
520 deps: Dependency tree structure.
521 depth: Allows printing the tree recursively, with indentation.
522 """
523 for entry in sorted(deps):
524 action = deps[entry]["action"]
525 print "%s %s (%s)" % (depth, entry, action)
526 self.PrintTree(deps[entry]["deps"], depth=depth + " ")
527
David James386ccd12011-05-04 20:17:42 -0700528 def GenDependencyGraph(self, deps_tree, deps_info):
David Jamesfcb70ef2011-02-02 16:02:30 -0800529 """Generate a doubly linked dependency graph.
530
531 Args:
532 deps_tree: Dependency tree structure.
533 deps_info: More details on the dependencies.
Mike Frysinger1a736a82013-12-12 01:50:59 -0500534
David Jamesfcb70ef2011-02-02 16:02:30 -0800535 Returns:
536 Deps graph in the form of a dict of packages, with each package
537 specifying a "needs" list and "provides" list.
538 """
539 emerge = self.emerge
David Jamesfcb70ef2011-02-02 16:02:30 -0800540
David Jamesfcb70ef2011-02-02 16:02:30 -0800541 # deps_map is the actual dependency graph.
542 #
543 # Each package specifies a "needs" list and a "provides" list. The "needs"
544 # list indicates which packages we depend on. The "provides" list
545 # indicates the reverse dependencies -- what packages need us.
546 #
547 # We also provide some other information in the dependency graph:
548 # - action: What we're planning on doing with this package. Generally,
549 # "merge", "nomerge", or "uninstall"
David Jamesfcb70ef2011-02-02 16:02:30 -0800550 deps_map = {}
551
552 def ReverseTree(packages):
553 """Convert tree to digraph.
554
555 Take the tree of package -> requirements and reverse it to a digraph of
556 buildable packages -> packages they unblock.
Mike Frysinger1a736a82013-12-12 01:50:59 -0500557
David Jamesfcb70ef2011-02-02 16:02:30 -0800558 Args:
559 packages: Tree(s) of dependencies.
Mike Frysinger1a736a82013-12-12 01:50:59 -0500560
David Jamesfcb70ef2011-02-02 16:02:30 -0800561 Returns:
562 Unsanitized digraph.
563 """
David James8c7e5e32011-06-28 11:26:03 -0700564 binpkg_phases = set(["setup", "preinst", "postinst"])
David James3f778802011-08-25 19:31:45 -0700565 needed_dep_types = set(["blocker", "buildtime", "runtime"])
David Jamesfcb70ef2011-02-02 16:02:30 -0800566 for pkg in packages:
567
568 # Create an entry for the package
569 action = packages[pkg]["action"]
David James8c7e5e32011-06-28 11:26:03 -0700570 default_pkg = {"needs": {}, "provides": set(), "action": action,
571 "nodeps": False, "binary": False}
David Jamesfcb70ef2011-02-02 16:02:30 -0800572 this_pkg = deps_map.setdefault(pkg, default_pkg)
573
David James8c7e5e32011-06-28 11:26:03 -0700574 if pkg in deps_info:
575 this_pkg["idx"] = deps_info[pkg]["idx"]
576
577 # If a package doesn't have any defined phases that might use the
578 # dependent packages (i.e. pkg_setup, pkg_preinst, or pkg_postinst),
579 # we can install this package before its deps are ready.
580 emerge_pkg = self.package_db.get(pkg)
581 if emerge_pkg and emerge_pkg.type_name == "binary":
582 this_pkg["binary"] = True
David James9becf572014-04-25 14:39:05 +0000583 if 0 <= vercmp(portage.VERSION, "2.1.11.50"):
584 defined_phases = emerge_pkg.defined_phases
585 else:
586 defined_phases = emerge_pkg.metadata.defined_phases
David James8c7e5e32011-06-28 11:26:03 -0700587 defined_binpkg_phases = binpkg_phases.intersection(defined_phases)
588 if not defined_binpkg_phases:
589 this_pkg["nodeps"] = True
590
David Jamesfcb70ef2011-02-02 16:02:30 -0800591 # Create entries for dependencies of this package first.
592 ReverseTree(packages[pkg]["deps"])
593
594 # Add dependencies to this package.
595 for dep, dep_item in packages[pkg]["deps"].iteritems():
David James8c7e5e32011-06-28 11:26:03 -0700596 # We only need to enforce strict ordering of dependencies if the
David James3f778802011-08-25 19:31:45 -0700597 # dependency is a blocker, or is a buildtime or runtime dependency.
598 # (I.e., ignored, optional, and runtime_post dependencies don't
599 # depend on ordering.)
David James8c7e5e32011-06-28 11:26:03 -0700600 dep_types = dep_item["deptypes"]
601 if needed_dep_types.intersection(dep_types):
602 deps_map[dep]["provides"].add(pkg)
603 this_pkg["needs"][dep] = "/".join(dep_types)
David Jamesfcb70ef2011-02-02 16:02:30 -0800604
David James3f778802011-08-25 19:31:45 -0700605 # If there's a blocker, Portage may need to move files from one
606 # package to another, which requires editing the CONTENTS files of
607 # both packages. To avoid race conditions while editing this file,
608 # the two packages must not be installed in parallel, so we can't
609 # safely ignore dependencies. See http://crosbug.com/19328
610 if "blocker" in dep_types:
611 this_pkg["nodeps"] = False
612
David Jamesfcb70ef2011-02-02 16:02:30 -0800613 def FindCycles():
614 """Find cycles in the dependency tree.
615
616 Returns:
617 A dict mapping cyclic packages to a dict of the deps that cause
618 cycles. For each dep that causes cycles, it returns an example
619 traversal of the graph that shows the cycle.
620 """
621
622 def FindCyclesAtNode(pkg, cycles, unresolved, resolved):
623 """Find cycles in cyclic dependencies starting at specified package.
624
625 Args:
626 pkg: Package identifier.
627 cycles: A dict mapping cyclic packages to a dict of the deps that
628 cause cycles. For each dep that causes cycles, it returns an
629 example traversal of the graph that shows the cycle.
630 unresolved: Nodes that have been visited but are not fully processed.
631 resolved: Nodes that have been visited and are fully processed.
632 """
633 pkg_cycles = cycles.get(pkg)
634 if pkg in resolved and not pkg_cycles:
635 # If we already looked at this package, and found no cyclic
636 # dependencies, we can stop now.
637 return
638 unresolved.append(pkg)
639 for dep in deps_map[pkg]["needs"]:
640 if dep in unresolved:
641 idx = unresolved.index(dep)
642 mycycle = unresolved[idx:] + [dep]
David James321490a2012-12-17 12:05:56 -0800643 for i in xrange(len(mycycle) - 1):
David Jamesfcb70ef2011-02-02 16:02:30 -0800644 pkg1, pkg2 = mycycle[i], mycycle[i+1]
645 cycles.setdefault(pkg1, {}).setdefault(pkg2, mycycle)
646 elif not pkg_cycles or dep not in pkg_cycles:
647 # Looks like we haven't seen this edge before.
648 FindCyclesAtNode(dep, cycles, unresolved, resolved)
649 unresolved.pop()
650 resolved.add(pkg)
651
652 cycles, unresolved, resolved = {}, [], set()
653 for pkg in deps_map:
654 FindCyclesAtNode(pkg, cycles, unresolved, resolved)
655 return cycles
656
def RemoveUnusedPackages():
  """Remove packages that are not on the install list from deps_map.

  Every removed package is spliced out of the graph: whatever it provided
  is attached to the packages it needed, and whatever it needed is attached
  to the packages it provided, so dependency ordering is propagated.
  """
  # Anything in the graph that isn't on the install list gets removed.
  unwanted = set(deps_map) - set(deps_info)

  # Removing these simplifies the graph and makes cycles easier to crack.
  for pkg in sorted(unwanted):
    node = deps_map[pkg]
    upstream, downstream = node["needs"], node["provides"]

    for dep in upstream:
      rdeps = deps_map[dep]["provides"]
      rdeps.update(downstream)
      # Drop the removed package itself and any self-reference.
      rdeps.difference_update((pkg, dep))

    for target in downstream:
      fdeps = deps_map[target]["needs"]
      fdeps.update(upstream)
      # Drop the removed package itself and any self-reference.
      for stale in (pkg, target):
        fdeps.pop(stale, None)

    del deps_map[pkg]
679
def PrintCycleBreak(basedep, dep, mycycle):
  """Describe a dependency edge that is about to be removed.

  The edge being broken is "dep needs basedep". Nothing is printed when that
  edge is a blocker.

  Args:
    basedep: The package that dep currently needs.
    dep: The package whose dependency on basedep is being dropped.
    mycycle: An example cycle (list of packages) containing dep -> basedep.
  """
  edge_type = deps_map[dep]["needs"].get(basedep, "deleted")

  # It's OK to swap install order for blockers, as long as the two packages
  # aren't installed in parallel. If there is a cycle, the packages already
  # depend on each other, so the blocker can be dropped without a warning.
  if edge_type == "blocker":
    return

  # Notify the user that we're breaking a cycle.
  print("Breaking %s -> %s (%s)" % (dep, basedep, edge_type))

  # Show every edge of the example cycle, flagging the one being deleted.
  for src, dst in zip(mycycle, mycycle[1:]):
    label = deps_map[src]["needs"].get(dst, "deleted")
    if src == dep and dst == basedep:
      label = label + ", deleting"
    print(" %s -> %s (%s)" % (src, dst, label))
708
def SanitizeTree():
  """Break circular dependencies in deps_map.

  Every edge that takes part in a cycle and goes against the emerge ordering
  (the "idx" recorded in deps_info) is pruned, which guarantees that
  dependencies are merged in the same order that portage would use.

  No dependency is treated as "soft" unless a cycle kills it, so more
  dependencies are honoured while merging. That costs some performance but
  helps reliability.
  """
  verbose = "--quiet" not in emerge.opts
  began = time.time()

  cycles = FindCycles()
  while cycles:
    for dep, offenders in cycles.items():
      for basedep, example in offenders.items():
        if deps_info[basedep]["idx"] < deps_info[dep]["idx"]:
          # This edge agrees with the emerge ordering; keep it.
          continue
        if verbose:
          PrintCycleBreak(basedep, dep, example)
        del deps_map[dep]["needs"][basedep]
        deps_map[basedep]["provides"].remove(dep)
    # Recompute: pruning edges may have resolved or exposed other cycles.
    cycles = FindCycles()

  seconds = time.time() - began
  if verbose and seconds >= 0.1:
    print("Tree sanitized in %dm%.1fs" % (seconds / 60, seconds % 60))
734
def FindRecursiveProvides(pkg, seen):
  """Compute the transitive set of packages that require a package.

  Stores the result under the "tprovides" key of deps_map[pkg], and does the
  same for every package reachable through "provides".

  Assumes that the graph is acyclic.

  Args:
    pkg: Package identifier.
    seen: Set of packages that have been visited so far; updated in place.
  """
  if pkg in seen:
    return
  seen.add(pkg)

  node = deps_map[pkg]
  direct = node["provides"]
  # Start from the direct dependents, then fold in each one's closure.
  closure = node["tprovides"] = direct.copy()
  for dep in direct:
    FindRecursiveProvides(dep, seen)
    closure.update(deps_map[dep]["tprovides"])
752
David Jamesa22906f2011-05-04 19:53:26 -0700753 ReverseTree(deps_tree)
David Jamesa22906f2011-05-04 19:53:26 -0700754
David James386ccd12011-05-04 20:17:42 -0700755 # We need to remove unused packages so that we can use the dependency
756 # ordering of the install process to show us what cycles to crack.
757 RemoveUnusedPackages()
David Jamesfcb70ef2011-02-02 16:02:30 -0800758 SanitizeTree()
David James8c7e5e32011-06-28 11:26:03 -0700759 seen = set()
760 for pkg in deps_map:
761 FindRecursiveProvides(pkg, seen)
David Jamesfcb70ef2011-02-02 16:02:30 -0800762 return deps_map
763
def PrintInstallPlan(self, deps_map):
  """Print an emerge-style install plan.

  The plan lists the packages we are installing, in an order that respects
  the dependency graph. It works on a deep copy of deps_map, so the caller's
  graph is left untouched.

  If some packages can never be scheduled (the graph still contains
  cycles), the leftover graph is printed and the process exits with
  status 1.

  Args:
    deps_map: The dependency graph.
  """

  def InstallPlanAtNode(target, graph):
    """Return target followed by everything it unblocks, depth-first."""
    order = [target]
    for dep in graph[target]["provides"]:
      pending = graph[dep]["needs"]
      del pending[target]
      if not pending:
        # target was the last thing dep was waiting on.
        order += InstallPlanAtNode(dep, graph)
    return order

  graph = copy.deepcopy(deps_map)
  scheduled = set()
  install_plan = []
  for target, info in graph.items():
    if info["needs"] or target in scheduled:
      continue
    for item in InstallPlanAtNode(target, graph):
      scheduled.add(item)
      install_plan.append(self.package_db[item])

  for pkg in scheduled:
    del graph[pkg]

  # Whatever remains could not be ordered.
  if graph:
    print("Cyclic dependencies: %s" % " ".join(graph))
    PrintDepsMap(graph)
    sys.exit(1)

  self.emerge.depgraph.display(install_plan)
801
802
def PrintDepsMap(deps_map):
  """Print the dependency graph; for each package, list its prerequisites.

  Args:
    deps_map: Dict mapping each package to a dict with an "action" entry
      and a "needs" collection of prerequisite packages.
  """
  for pkg in sorted(deps_map):
    entry = deps_map[pkg]
    print("%s: (%s) needs" % (pkg, entry["action"]))
    prerequisites = entry["needs"]
    for needed in sorted(prerequisites):
      print(" %s" % (needed))
    if not prerequisites:
      print(" no dependencies")
812
813
class EmergeJobState(object):
  """Snapshot of one emerge job, as reported by a worker.

  Attributes:
    target: Full name of the target being built
      (e.g. virtual/target-os-1-r60).
    pkgname: Short name of the target (e.g. target-os-1-r60).
    done: True if the job is done; False otherwise.
    filename: Name of the file where the job's output is currently stored.
    start_timestamp: Timestamp when the job started.
    last_notify_timestamp: Last time the name of the log file was printed.
      It is printed at the beginning of the job, so this starts out equal
      to start_timestamp.
    last_output_seek: Byte offset of the end of the last complete line that
      was printed. Starts at zero; used to resume at the right place when
      output from the same ebuild is printed more than once.
    last_output_timestamp: Last time output was printed. Starts at zero
      because nothing has been printed yet.
    retcode: Return code of the job, if the job has actually finished.
    fetch_only: Whether this was just a fetch job.
    unpack_only: Whether the job only unpacks packages, without emerging.
  """

  __slots__ = [
      "done", "filename", "last_notify_timestamp", "last_output_seek",
      "last_output_timestamp", "pkgname", "retcode", "start_timestamp",
      "target", "fetch_only", "unpack_only",
  ]

  def __init__(self, target, pkgname, done, filename, start_timestamp,
               retcode=None, fetch_only=False, unpack_only=False):
    # Identity of the job.
    self.target = target
    self.pkgname = pkgname

    # What kind of job this is.
    self.fetch_only = fetch_only
    self.unpack_only = unpack_only

    # Progress and result.
    self.done = done
    self.retcode = retcode
    self.filename = filename

    # Timing and output bookkeeping. The log file name is announced when the
    # job begins, hence last_notify_timestamp starts at start_timestamp;
    # no output has been printed yet, hence the two zeros.
    self.start_timestamp = start_timestamp
    self.last_notify_timestamp = start_timestamp
    self.last_output_seek = 0
    self.last_output_timestamp = 0
862
David Jamesfcb70ef2011-02-02 16:02:30 -0800863
def KillHandler(_signum, _frame):
  """Signal handler that sends SIGKILL to our whole process group.

  Process group 0 means the caller's own group, so this kills the calling
  process together with all subprocesses that share its group.
  """
  own_group = 0
  os.killpg(own_group, signal.SIGKILL)
867
def SetupWorkerSignals():
  """Install SIGINT/SIGTERM handlers for a worker process.

  The first signal only sets the KILLED flag, so the worker can exit quietly
  and cleanly; by default, hitting CTRL-C would make every child process
  print details about a KeyboardInterrupt exception, which isn't very
  helpful. After that first signal, KillHandler takes over.
  """
  graceful_signals = (signal.SIGINT, signal.SIGTERM)

  def ExitHandler(_signum, _frame):
    # Set KILLED flag.
    KILLED.set()

    # Swap ourselves out so we don't get called recursively.
    for signum in graceful_signals:
      signal.signal(signum, KillHandler)

  for signum in graceful_signals:
    signal.signal(signum, ExitHandler)
883
def EmergeProcess(output, *args, **kwargs):
  """Merge a package in a forked subprocess.

  The child redirects its stdout and stderr to output, runs a portage
  Scheduler built from the remaining arguments, and always terminates
  through os._exit().

  Args:
    output: Temporary file to write output.
    *args: Arguments to pass to Scheduler constructor.
    **kwargs: Keyword arguments to pass to Scheduler constructor.

  Returns:
    The status value reported by os.waitpid() for the subprocess.
  """
  pid = os.fork()
  if pid != 0:
    # Parent: wait for the subprocess and hand back its status.
    return os.waitpid(pid, 0)[1]

  # Everything below runs in the child.
  try:
    # Sanity checks.
    if sys.stdout.fileno() != 1:
      raise Exception("sys.stdout.fileno() != 1")
    if sys.stderr.fileno() != 2:
      raise Exception("sys.stderr.fileno() != 2")

    # - Redirect 1 (stdout) and 2 (stderr) at our temporary file.
    # - Redirect 0 to point at sys.stdin. In this case, sys.stdin
    #   points at a file reading os.devnull, because multiprocessing mucks
    #   with sys.stdin.
    # - Leave the sys.stdin and output filehandles alone.
    stdin_fd = sys.stdin.fileno()
    output_fd = output.fileno()
    fd_pipes = {
        0: stdin_fd,
        1: output_fd,
        2: output_fd,
        stdin_fd: stdin_fd,
        output_fd: output_fd,
    }
    # pylint: disable=W0212
    if vercmp(portage.VERSION, "2.1.11.50") >= 0:
      portage.process._setup_pipes(fd_pipes, close_fds=False)
    else:
      portage.process._setup_pipes(fd_pipes)

    # Portage doesn't like when sys.stdin.fileno() != 0, so point sys.stdin
    # at the filehandle we just created in _setup_pipes.
    if sys.stdin.fileno() != 0:
      sys.__stdin__ = sys.stdin = os.fdopen(0, "r")

    scheduler = Scheduler(*args, **kwargs)

    # Enable blocker handling even though we're in --nodeps mode. This
    # allows us to unmerge the blocker after we've merged the replacement.
    scheduler._opts_ignore_blockers = frozenset()

    # Actually do the merge.
    retval = scheduler.merge()

  # We catch all exceptions here (including SystemExit, KeyboardInterrupt,
  # etc) so as to ensure that we don't confuse the multiprocessing module,
  # which expects that all forked children exit with os._exit().
  # pylint: disable=W0702
  except:
    traceback.print_exc(file=output)
    retval = 1

  for stream in (sys.stdout, sys.stderr, output):
    stream.flush()
  # pylint: disable=W0212
  os._exit(retval)
David Jamesfcb70ef2011-02-02 16:02:30 -0800950
Thiago Goncalesf4acc422013-07-17 10:26:35 -0700951
def UnpackPackage(pkg_state):
  """Unpack the binary package described by pkg_state.

  The package's .tbz2 file is decompressed to a pipe and the result is fed
  to "sudo tar" for extraction. Locations come from the PKGDIR and ROOT
  environment variables, falling back to values derived from SYSROOT
  (which must be set).

  Args:
    pkg_state: EmergeJobState object describing target.

  Returns:
    Exit code returned by subprocess: the decompressor's if it failed,
    otherwise tar's.
  """
  env = os.environ
  default_pkgdir = os.path.join(env["SYSROOT"], "packages")
  pkgdir = env.get("PKGDIR", default_pkgdir)
  root = env.get("ROOT", env["SYSROOT"])
  tarball = os.path.join(pkgdir, pkg_state.target + ".tbz2")

  compressor = cros_build_lib.FindCompressor(cros_build_lib.COMP_BZIP2)
  decompress = [compressor, "-dc"]
  if compressor.endswith("pbzip2"):
    decompress += ["--ignore-trailing-garbage=1"]
  decompress += [tarball]

  unpacked = cros_build_lib.RunCommand(decompress, cwd=root,
                                       stdout_to_pipe=True, print_cmd=False,
                                       error_code_ok=True)

  # If we were not successful, return now and don't attempt untar.
  if unpacked.returncode:
    return unpacked.returncode

  untar = ["sudo", "tar", "-xf", "-", "-C", root]
  extracted = cros_build_lib.RunCommand(untar, cwd=root,
                                        input=unpacked.output,
                                        print_cmd=False, error_code_ok=True)
  return extracted.returncode
983
984
def EmergeWorker(task_queue, job_queue, emerge, package_db, fetch_only=False,
                 unpack_only=False):
  """This worker emerges any packages given to it on the task_queue.

  Args:
    task_queue: The queue of tasks for this worker to do.
    job_queue: The queue of results from the worker.
    emerge: An EmergeData() object.
    package_db: A dict, mapping package ids to portage Package objects.
    fetch_only: A bool, indicating if we should just fetch the target.
    unpack_only: A bool, indicating if we should just unpack the target.

  It expects package state objects (with a "target" attribute) to be passed
  to it via task_queue; a None entry tells the worker to quit. For every
  task, an EmergeJobState with done=False is pushed to job_queue when the
  job starts and another with done=True and the return code when it
  finishes. The job's output is stored in the temporary file named by the
  EmergeJobState's filename.
  """

  SetupWorkerSignals()
  settings, trees, mtimedb = emerge.settings, emerge.trees, emerge.mtimedb

  # Disable flushing of caches to save on I/O.
  root = emerge.settings["ROOT"]
  vardb = emerge.trees[root]["vartree"].dbapi
  vardb._flush_cache_enabled = False
  bindb = emerge.trees[root]["bintree"].dbapi
  # Might be a set, might be a list, might be None; no clue, just use shallow
  # copy to ensure we can roll it back.
  # pylint: disable=W0212
  original_remotepkgs = copy.copy(bindb.bintree._remotepkgs)

  opts, spinner = emerge.opts, emerge.spinner
  opts["--nodeps"] = True
  if fetch_only:
    opts["--fetchonly"] = True

  while True:
    # Wait for a new item to show up on the queue. This is a blocking wait,
    # so if there's nothing to do, we just sit here.
    pkg_state = task_queue.get()
    if pkg_state is None:
      # If target is None, this means that the main thread wants us to quit.
      # The other workers need to exit too, so we'll push the message back on
      # to the queue so they'll get it too.
      task_queue.put(None)
      return
    if KILLED.is_set():
      return

    target = pkg_state.target

    db_pkg = package_db[target]

    if (db_pkg.type_name == "binary" and not fetch_only and
        pkg_state.fetched_successfully):
      # Ensure portage doesn't think our pkg is remote- else it'll force
      # a redownload of it (even if the on-disk file is fine). In-memory
      # caching basically, implemented dumbly.
      bindb.bintree._remotepkgs = None
    else:
      # Roll back to the value saved above. This used to assign to a
      # misspelled attribute (bintree_remotepkgs on bindb), so a None left
      # behind by an earlier package was never undone.
      bindb.bintree._remotepkgs = original_remotepkgs

    db_pkg.root_config = emerge.root_config
    install_list = [db_pkg]
    pkgname = db_pkg.pf
    output = tempfile.NamedTemporaryFile(prefix=pkgname + "-", delete=False)
    # The mode must be written in octal: rw-r--r--. (Decimal 644 is 0o1204.)
    os.chmod(output.name, 0o644)
    start_timestamp = time.time()
    job = EmergeJobState(target, pkgname, False, output.name, start_timestamp,
                         fetch_only=fetch_only, unpack_only=unpack_only)
    job_queue.put(job)
    if "--pretend" in opts:
      retcode = 0
    else:
      try:
        emerge.scheduler_graph.mergelist = install_list
        if unpack_only:
          retcode = UnpackPackage(pkg_state)
        else:
          retcode = EmergeProcess(output, settings, trees, mtimedb, opts,
                                  spinner, favorites=emerge.favorites,
                                  graph_config=emerge.scheduler_graph)
      except Exception:
        # Record the failure in the job's own log and report it as retcode 1.
        traceback.print_exc(file=output)
        retcode = 1
    output.close()

    if KILLED.is_set():
      return

    job = EmergeJobState(target, pkgname, True, output.name, start_timestamp,
                         retcode, fetch_only=fetch_only,
                         unpack_only=unpack_only)
    job_queue.put(job)
1079
1080
class LinePrinter(object):
  """Print job that writes one fixed line to stdout."""

  def __init__(self, line):
    """Remember the line to print."""
    self.line = line

  def Print(self, _seek_locations):
    """Print the stored line; the seek-location map is not used."""
    print(self.line)
1089
1090
1091class JobPrinter(object):
1092 """Helper object to print output of a job."""
1093
1094 def __init__(self, job, unlink=False):
1095 """Print output of job.
1096
Mike Frysinger02e1e072013-11-10 22:11:34 -05001097 If unlink is True, unlink the job output file when done.
1098 """
David Jamesfcb70ef2011-02-02 16:02:30 -08001099 self.current_time = time.time()
1100 self.job = job
1101 self.unlink = unlink
1102
1103 def Print(self, seek_locations):
1104
1105 job = self.job
1106
1107 # Calculate how long the job has been running.
1108 seconds = self.current_time - job.start_timestamp
1109
1110 # Note that we've printed out the job so far.
1111 job.last_output_timestamp = self.current_time
1112
1113 # Note that we're starting the job
1114 info = "job %s (%dm%.1fs)" % (job.pkgname, seconds / 60, seconds % 60)
1115 last_output_seek = seek_locations.get(job.filename, 0)
1116 if last_output_seek:
1117 print "=== Continue output for %s ===" % info
1118 else:
1119 print "=== Start output for %s ===" % info
1120
1121 # Print actual output from job
1122 f = codecs.open(job.filename, encoding='utf-8', errors='replace')
1123 f.seek(last_output_seek)
1124 prefix = job.pkgname + ":"
1125 for line in f:
1126
1127 # Save off our position in the file
1128 if line and line[-1] == "\n":
1129 last_output_seek = f.tell()
1130 line = line[:-1]
1131
1132 # Print our line
1133 print prefix, line.encode('utf-8', 'replace')
1134 f.close()
1135
1136 # Save our last spot in the file so that we don't print out the same
1137 # location twice.
1138 seek_locations[job.filename] = last_output_seek
1139
1140 # Note end of output section
1141 if job.done:
1142 print "=== Complete: %s ===" % info
1143 else:
1144 print "=== Still running: %s ===" % info
1145
1146 if self.unlink:
1147 os.unlink(job.filename)
1148
1149
def PrintWorker(queue):
  """A worker that prints stuff to the screen as requested.

  Takes print jobs (objects with a Print(seek_locations) method) from queue
  and runs them one at a time until a false value such as None arrives.

  Args:
    queue: Queue of print jobs.
  """
  watched_signals = (signal.SIGINT, signal.SIGTERM)

  def ExitHandler(_signum, _frame):
    # Set KILLED flag.
    KILLED.set()

    # Hand over to KillHandler so that we'll die after two signals.
    for signum in watched_signals:
      signal.signal(signum, KillHandler)

  # Don't exit on the first SIGINT / SIGTERM, because the parent worker will
  # handle it and tell us when we need to exit.
  for signum in watched_signals:
    signal.signal(signum, ExitHandler)

  # seek_locations is a map indicating the position we are at in each file.
  # It starts off empty, but is set by the various Print jobs as we go along
  # to indicate where we left off in each file.
  seek_locations = {}
  while True:
    try:
      job = queue.get()
      if not job:
        break
      job.Print(seek_locations)
      sys.stdout.flush()
    except IOError as ex:
      if ex.errno != errno.EINTR:
        raise
      # Looks like we received a signal. Keep printing.
1183
Brian Harring867e2362012-03-17 04:05:17 -07001184
class TargetState(object):
  """Structure describing the TargetState.

  Attributes:
    target: The package identifier.
    info: The dependency-graph entry for the target; update_score reads its
      "tprovides", "needs", "binary", "provides" and "idx" entries.
    score: Sort key computed by update_score; instances compare by it.
    prefetched: Starts out False.
    fetched_successfully: Starts out False.
  """

  __slots__ = ("target", "info", "score", "prefetched", "fetched_successfully")

  def __init__(self, target, info):
    self.target = target
    self.info = info
    self.prefetched = False
    self.fetched_successfully = False
    self.score = None
    self.update_score()

  def __cmp__(self, other):
    """Order instances by their score tuples."""
    return cmp(self.score, other.score)

  def update_score(self):
    """Recompute self.score from the current contents of self.info."""
    info = self.info
    transitive_dependents = len(info["tprovides"])
    outstanding_needs = len(info["needs"])
    direct_dependents = len(info["provides"])
    # Tuples compare element by element and smaller sorts first, so the
    # counts that should rank "more is better" are negated.
    self.score = (
        -transitive_dependents,
        outstanding_needs,
        not info["binary"],
        -direct_dependents,
        info["idx"],
        self.target,
    )
1209
1210
class ScoredHeap(object):
  """Min-heap of TargetState objects with fast membership tests by target.

  Attributes:
    heap: The list managed through heapq.
    _heap_set: Set holding the target of every item currently in heap.
  """

  __slots__ = ("heap", "_heap_set")

  def __init__(self, initial=()):
    """Create the heap, optionally filled from the iterable initial."""
    self.heap = []
    self._heap_set = set()
    if initial:
      self.multi_put(initial)

  def get(self):
    """Remove and return the smallest item."""
    smallest = heapq.heappop(self.heap)
    self._heap_set.remove(smallest.target)
    return smallest

  def put(self, item):
    """Add one TargetState; raises ValueError for anything else."""
    if not isinstance(item, TargetState):
      raise ValueError("Item %r isn't a TargetState" % (item,))
    heapq.heappush(self.heap, item)
    self._heap_set.add(item.target)

  def multi_put(self, sequence):
    """Add every item of sequence, then restore the heap ordering once."""
    items = list(sequence)
    self.heap += items
    for item in items:
      self._heap_set.add(item.target)
    self.sort()

  def sort(self):
    """Re-establish the heap invariant over the current contents."""
    heapq.heapify(self.heap)

  def __contains__(self, target):
    return target in self._heap_set

  def __nonzero__(self):
    return bool(self.heap)

  def __len__(self):
    return len(self.heap)
1250
1251
David Jamesfcb70ef2011-02-02 16:02:30 -08001252class EmergeQueue(object):
1253 """Class to schedule emerge jobs according to a dependency graph."""
1254
def __init__(self, deps_map, emerge, package_db, show_output, unpack_only):
  """Set up queues, worker pools and signal handling for a merge run.

  Exits the process with status 0 right away when "--pretend" is in
  emerge.opts. Removes "--jobs" and "--load-average" from emerge.opts.

  Args:
    deps_map: The dependency graph.
    emerge: Object providing opts and depgraph; handed to the workers.
    package_db: Package database handed to the workers.
    show_output: Stored as self._show_output.
    unpack_only: If true, an extra pool of unpack workers is started.
  """
  # Store the dependency graph.
  self._deps_map = deps_map
  self._state_map = {}

  # Nothing is running or ready yet.
  self._build_jobs, self._build_ready = {}, ScoredHeap()
  self._fetch_jobs, self._fetch_ready = {}, ScoredHeap()
  self._unpack_jobs, self._unpack_ready = {}, ScoredHeap()

  # Count of total package installs represented in deps_map.
  self._total_jobs = sum(
      1 for pkg in deps_map if deps_map[pkg]["action"] == "merge")
  self._show_output = show_output
  self._unpack_only = unpack_only

  if "--pretend" in emerge.opts:
    print("Skipping merge because of --pretend mode.")
    sys.exit(0)

  # Set up a session so we can easily terminate all children.
  self._SetupSession()

  # Setup scheduler graph object. This is used by the child processes
  # to help schedule jobs.
  emerge.scheduler_graph = emerge.depgraph.schedulerGraph()

  # Calculate how many jobs we can run in parallel. We don't want to pass
  # the --jobs flag over to emerge itself, because that'll tell emerge to
  # hide its output, and said output is quite useful for debugging hung
  # jobs.
  requested = emerge.opts.pop("--jobs", multiprocessing.cpu_count())
  procs = max(1, min(self._total_jobs, requested))
  self._build_procs = self._unpack_procs = self._fetch_procs = procs
  self._load_avg = emerge.opts.pop("--load-average", None)
  self._job_queue = multiprocessing.Queue()
  self._print_queue = multiprocessing.Queue()

  # Fetch workers run EmergeWorker with fetch_only=True.
  self._fetch_queue = multiprocessing.Queue()
  self._fetch_pool = multiprocessing.Pool(
      self._fetch_procs, EmergeWorker,
      (self._fetch_queue, self._job_queue, emerge, package_db, True))

  # Build workers run EmergeWorker with its defaults.
  self._build_queue = multiprocessing.Queue()
  self._build_pool = multiprocessing.Pool(
      self._build_procs, EmergeWorker,
      (self._build_queue, self._job_queue, emerge, package_db))

  if self._unpack_only:
    # Unpack pool only required on unpack_only jobs.
    self._unpack_queue = multiprocessing.Queue()
    self._unpack_pool = multiprocessing.Pool(
        self._unpack_procs, EmergeWorker,
        (self._unpack_queue, self._job_queue, emerge, package_db, False,
         True))

  self._print_worker = multiprocessing.Process(target=PrintWorker,
                                               args=[self._print_queue])
  self._print_worker.start()

  # Initialize the failed queue to empty.
  self._retry_queue = []
  self._failed = set()

  # Setup an exit handler so that we print nice messages if we are
  # terminated.
  self._SetupExitHandler()

  # Schedule our jobs: every package starts out in the fetch-ready heap.
  for pkg, data in deps_map.items():
    self._state_map[pkg] = TargetState(pkg, data)
  self._fetch_ready.multi_put(self._state_map.values())
David Jamesfcb70ef2011-02-02 16:02:30 -08001328
def _SetupSession(self):
  """Set up a session so we can easily terminate all children.

  Forks. The child calls os.setsid() and returns to the caller. The parent
  never returns: it forwards signals to the child and finally exits with
  the child's exit status.
  """
  # When we call os.setsid(), this sets up a session / process group for this
  # process and all children. These session groups are needed so that we can
  # easily kill all children (including processes launched by emerge) before
  # we exit.
  #
  # One unfortunate side effect of os.setsid() is that it blocks CTRL-C from
  # being received. To work around this, we only call os.setsid() in a forked
  # process, so that the parent can still watch for CTRL-C. The parent will
  # just sit around, watching for signals and propagating them to the child,
  # until the child exits.
  #
  # TODO(davidjames): It would be nice if we could replace this with cgroups.
  pid = os.fork()
  if pid == 0:
    os.setsid()
    return

  # Parent only from here on. In each handler below, ESRCH (no such
  # process) is ignored and any other OSError is re-raised.

  def PropagateToChildren(signum, _frame):
    # Just propagate the signals down to the child. We'll exit when the
    # child does.
    try:
      os.kill(pid, signum)
    except OSError as ex:
      if ex.errno != errno.ESRCH:
        raise

  for forwarded in (signal.SIGINT, signal.SIGTERM):
    signal.signal(forwarded, PropagateToChildren)

  def StopGroup(_signum, _frame):
    # When we get stopped, stop the children.
    try:
      os.killpg(pid, signal.SIGSTOP)
      os.kill(0, signal.SIGSTOP)
    except OSError as ex:
      if ex.errno != errno.ESRCH:
        raise

  signal.signal(signal.SIGTSTP, StopGroup)

  def ContinueGroup(_signum, _frame):
    # Launch the children again after being stopped.
    try:
      os.killpg(pid, signal.SIGCONT)
    except OSError as ex:
      if ex.errno != errno.ESRCH:
        raise

  signal.signal(signal.SIGCONT, ContinueGroup)

  # Loop until the children exit. We exit with os._exit to be sure we
  # don't run any finalizers (those will be run by the child process.)
  # pylint: disable=W0212
  while True:
    try:
      # Wait for the process to exit. When it does, exit with the return
      # value of the subprocess.
      status = os.waitpid(pid, 0)[1]
      os._exit(osutils.GetExitStatus(status))
    except OSError as ex:
      if ex.errno != errno.EINTR:
        traceback.print_exc()
        os._exit(1)
      # Interrupted by a signal: go around and wait again.
    except BaseException:
      traceback.print_exc()
      os._exit(1)
1393
David Jamesfcb70ef2011-02-02 16:02:30 -08001394 def _SetupExitHandler(self):
1395
David James321490a2012-12-17 12:05:56 -08001396 def ExitHandler(signum, _frame):
David James7358d032011-05-19 10:40:03 -07001397 # Set KILLED flag.
1398 KILLED.set()
David Jamesfcb70ef2011-02-02 16:02:30 -08001399
1400 # Kill our signal handlers so we don't get called recursively
David James7358d032011-05-19 10:40:03 -07001401 signal.signal(signal.SIGINT, KillHandler)
1402 signal.signal(signal.SIGTERM, KillHandler)
David Jamesfcb70ef2011-02-02 16:02:30 -08001403
1404 # Print our current job status
Brian Harring0be85c62012-03-17 19:52:12 -07001405 for job in self._build_jobs.itervalues():
David Jamesfcb70ef2011-02-02 16:02:30 -08001406 if job:
1407 self._print_queue.put(JobPrinter(job, unlink=True))
1408
1409 # Notify the user that we are exiting
1410 self._Print("Exiting on signal %s" % signum)
David James7358d032011-05-19 10:40:03 -07001411 self._print_queue.put(None)
1412 self._print_worker.join()
David Jamesfcb70ef2011-02-02 16:02:30 -08001413
1414 # Kill child threads, then exit.
David James7358d032011-05-19 10:40:03 -07001415 os.killpg(0, signal.SIGKILL)
David Jamesfcb70ef2011-02-02 16:02:30 -08001416 sys.exit(1)
1417
1418 # Print out job status when we are killed
1419 signal.signal(signal.SIGINT, ExitHandler)
1420 signal.signal(signal.SIGTERM, ExitHandler)
1421
Thiago Goncalesf4acc422013-07-17 10:26:35 -07001422 def _ScheduleUnpack(self, pkg_state):
1423 self._unpack_jobs[pkg_state.target] = None
1424 self._unpack_queue.put(pkg_state)
1425
Brian Harring0be85c62012-03-17 19:52:12 -07001426 def _Schedule(self, pkg_state):
David Jamesfcb70ef2011-02-02 16:02:30 -08001427 # We maintain a tree of all deps, if this doesn't need
David James8c7e5e32011-06-28 11:26:03 -07001428 # to be installed just free up its children and continue.
David Jamesfcb70ef2011-02-02 16:02:30 -08001429 # It is possible to reinstall deps of deps, without reinstalling
1430 # first level deps, like so:
Mike Frysingerfd969312014-04-02 22:16:42 -04001431 # virtual/target-os (merge) -> eselect (nomerge) -> python (merge)
Brian Harring0be85c62012-03-17 19:52:12 -07001432 this_pkg = pkg_state.info
1433 target = pkg_state.target
1434 if pkg_state.info is not None:
1435 if this_pkg["action"] == "nomerge":
1436 self._Finish(target)
1437 elif target not in self._build_jobs:
1438 # Kick off the build if it's marked to be built.
1439 self._build_jobs[target] = None
1440 self._build_queue.put(pkg_state)
1441 return True
David Jamesfcb70ef2011-02-02 16:02:30 -08001442
Thiago Goncalesf4acc422013-07-17 10:26:35 -07001443 def _ScheduleLoop(self, unpack_only=False):
1444 if unpack_only:
1445 ready_queue = self._unpack_ready
1446 jobs_queue = self._unpack_jobs
1447 procs = self._unpack_procs
1448 else:
1449 ready_queue = self._build_ready
1450 jobs_queue = self._build_jobs
1451 procs = self._build_procs
1452
David James8c7e5e32011-06-28 11:26:03 -07001453 # If the current load exceeds our desired load average, don't schedule
1454 # more than one job.
1455 if self._load_avg and os.getloadavg()[0] > self._load_avg:
1456 needed_jobs = 1
1457 else:
Thiago Goncalesf4acc422013-07-17 10:26:35 -07001458 needed_jobs = procs
David James8c7e5e32011-06-28 11:26:03 -07001459
1460 # Schedule more jobs.
Thiago Goncalesf4acc422013-07-17 10:26:35 -07001461 while ready_queue and len(jobs_queue) < needed_jobs:
1462 state = ready_queue.get()
1463 if unpack_only:
1464 self._ScheduleUnpack(state)
1465 else:
1466 if state.target not in self._failed:
1467 self._Schedule(state)
David Jamesfcb70ef2011-02-02 16:02:30 -08001468
def _Print(self, line):
  """Queue a single line of text on the print queue.

  Args:
    line: The text to print; it is wrapped in a LinePrinter.
  """
  printer = LinePrinter(line)
  self._print_queue.put(printer)
1472
1473 def _Status(self):
1474 """Print status."""
1475 current_time = time.time()
1476 no_output = True
1477
1478 # Print interim output every minute if --show-output is used. Otherwise,
1479 # print notifications about running packages every 2 minutes, and print
1480 # full output for jobs that have been running for 60 minutes or more.
1481 if self._show_output:
1482 interval = 60
1483 notify_interval = 0
1484 else:
1485 interval = 60 * 60
1486 notify_interval = 60 * 2
David James321490a2012-12-17 12:05:56 -08001487 for job in self._build_jobs.itervalues():
David Jamesfcb70ef2011-02-02 16:02:30 -08001488 if job:
1489 last_timestamp = max(job.start_timestamp, job.last_output_timestamp)
1490 if last_timestamp + interval < current_time:
1491 self._print_queue.put(JobPrinter(job))
1492 job.last_output_timestamp = current_time
1493 no_output = False
1494 elif (notify_interval and
1495 job.last_notify_timestamp + notify_interval < current_time):
1496 job_seconds = current_time - job.start_timestamp
1497 args = (job.pkgname, job_seconds / 60, job_seconds % 60, job.filename)
1498 info = "Still building %s (%dm%.1fs). Logs in %s" % args
1499 job.last_notify_timestamp = current_time
1500 self._Print(info)
1501 no_output = False
1502
1503 # If we haven't printed any messages yet, print a general status message
1504 # here.
1505 if no_output:
1506 seconds = current_time - GLOBAL_START
Brian Harring0be85c62012-03-17 19:52:12 -07001507 fjobs, fready = len(self._fetch_jobs), len(self._fetch_ready)
Thiago Goncalesf4acc422013-07-17 10:26:35 -07001508 ujobs, uready = len(self._unpack_jobs), len(self._unpack_ready)
Brian Harring0be85c62012-03-17 19:52:12 -07001509 bjobs, bready = len(self._build_jobs), len(self._build_ready)
1510 retries = len(self._retry_queue)
1511 pending = max(0, len(self._deps_map) - fjobs - bjobs)
1512 line = "Pending %s/%s, " % (pending, self._total_jobs)
1513 if fjobs or fready:
1514 line += "Fetching %s/%s, " % (fjobs, fready + fjobs)
Thiago Goncalesf4acc422013-07-17 10:26:35 -07001515 if ujobs or uready:
1516 line += "Unpacking %s/%s, " % (ujobs, uready + ujobs)
Brian Harring0be85c62012-03-17 19:52:12 -07001517 if bjobs or bready or retries:
1518 line += "Building %s/%s, " % (bjobs, bready + bjobs)
1519 if retries:
1520 line += "Retrying %s, " % (retries,)
David James8c7e5e32011-06-28 11:26:03 -07001521 load = " ".join(str(x) for x in os.getloadavg())
Brian Harring0be85c62012-03-17 19:52:12 -07001522 line += ("[Time %dm%.1fs Load %s]" % (seconds/60, seconds %60, load))
1523 self._Print(line)
David Jamesfcb70ef2011-02-02 16:02:30 -08001524
1525 def _Finish(self, target):
David James8c7e5e32011-06-28 11:26:03 -07001526 """Mark a target as completed and unblock dependencies."""
1527 this_pkg = self._deps_map[target]
1528 if this_pkg["needs"] and this_pkg["nodeps"]:
1529 # We got installed, but our deps have not been installed yet. Dependent
1530 # packages should only be installed when our needs have been fully met.
1531 this_pkg["action"] = "nomerge"
1532 else:
David James8c7e5e32011-06-28 11:26:03 -07001533 for dep in this_pkg["provides"]:
1534 dep_pkg = self._deps_map[dep]
Brian Harring0be85c62012-03-17 19:52:12 -07001535 state = self._state_map[dep]
David James8c7e5e32011-06-28 11:26:03 -07001536 del dep_pkg["needs"][target]
Brian Harring0be85c62012-03-17 19:52:12 -07001537 state.update_score()
1538 if not state.prefetched:
1539 if dep in self._fetch_ready:
1540 # If it's not currently being fetched, update the prioritization
1541 self._fetch_ready.sort()
1542 elif not dep_pkg["needs"]:
David James8c7e5e32011-06-28 11:26:03 -07001543 if dep_pkg["nodeps"] and dep_pkg["action"] == "nomerge":
1544 self._Finish(dep)
1545 else:
Brian Harring0be85c62012-03-17 19:52:12 -07001546 self._build_ready.put(self._state_map[dep])
David James8c7e5e32011-06-28 11:26:03 -07001547 self._deps_map.pop(target)
David Jamesfcb70ef2011-02-02 16:02:30 -08001548
1549 def _Retry(self):
David James8c7e5e32011-06-28 11:26:03 -07001550 while self._retry_queue:
Brian Harring0be85c62012-03-17 19:52:12 -07001551 state = self._retry_queue.pop(0)
1552 if self._Schedule(state):
1553 self._Print("Retrying emerge of %s." % state.target)
David James8c7e5e32011-06-28 11:26:03 -07001554 break
David Jamesfcb70ef2011-02-02 16:02:30 -08001555
Brian Harringa43f5952012-04-12 01:19:34 -07001556 def _Shutdown(self):
David Jamesfcb70ef2011-02-02 16:02:30 -08001557 # Tell emerge workers to exit. They all exit when 'None' is pushed
1558 # to the queue.
Brian Harring0be85c62012-03-17 19:52:12 -07001559
Brian Harringa43f5952012-04-12 01:19:34 -07001560 # Shutdown the workers first; then jobs (which is how they feed things back)
1561 # then finally the print queue.
Brian Harring0be85c62012-03-17 19:52:12 -07001562
Brian Harringa43f5952012-04-12 01:19:34 -07001563 def _stop(queue, pool):
1564 if pool is None:
1565 return
1566 try:
1567 queue.put(None)
1568 pool.close()
1569 pool.join()
1570 finally:
1571 pool.terminate()
Brian Harring0be85c62012-03-17 19:52:12 -07001572
Brian Harringa43f5952012-04-12 01:19:34 -07001573 _stop(self._fetch_queue, self._fetch_pool)
1574 self._fetch_queue = self._fetch_pool = None
Brian Harring0be85c62012-03-17 19:52:12 -07001575
Brian Harringa43f5952012-04-12 01:19:34 -07001576 _stop(self._build_queue, self._build_pool)
1577 self._build_queue = self._build_pool = None
1578
Thiago Goncalesf4acc422013-07-17 10:26:35 -07001579 if self._unpack_only:
1580 _stop(self._unpack_queue, self._unpack_pool)
1581 self._unpack_queue = self._unpack_pool = None
1582
Brian Harringa43f5952012-04-12 01:19:34 -07001583 if self._job_queue is not None:
1584 self._job_queue.close()
1585 self._job_queue = None
David Jamesfcb70ef2011-02-02 16:02:30 -08001586
1587 # Now that our workers are finished, we can kill the print queue.
Brian Harringa43f5952012-04-12 01:19:34 -07001588 if self._print_worker is not None:
1589 try:
1590 self._print_queue.put(None)
1591 self._print_queue.close()
1592 self._print_worker.join()
1593 finally:
1594 self._print_worker.terminate()
1595 self._print_queue = self._print_worker = None
David Jamesfcb70ef2011-02-02 16:02:30 -08001596
def Run(self):
  """Run through the scheduled ebuilds.

  Keep running so long as we have uninstalled packages in the
  dependency graph to merge.

  Job objects arrive on the job queue; each one is either a fetch job, an
  unpack job or a build job, and is either a "started" notification
  (job.done is false) or a completion. A package whose build fails is
  retried once; a second failure leaves it in the deps map, so the stall
  check below eventually reports it and exits.

  Raises:
    SystemExit: With status 1 when nothing is running or ready but packages
      remain (failed packages or circular dependencies).
  """
  if not self._deps_map:
    return

  # Start the fetchers.
  for _ in range(min(self._fetch_procs, len(self._fetch_ready))):
    state = self._fetch_ready.get()
    self._fetch_jobs[state.target] = None
    self._fetch_queue.put(state)

  # Print an update, then get going.
  self._Status()

  # Targets whose first build attempt failed.
  retried = set()
  while self._deps_map:
    # Check here that we are actually waiting for something.
    if (self._build_queue.empty() and
        self._job_queue.empty() and
        not self._fetch_jobs and
        not self._fetch_ready and
        not self._unpack_jobs and
        not self._unpack_ready and
        not self._build_jobs and
        not self._build_ready and
        self._deps_map):
      # If we have failed on a package, retry it now.
      if self._retry_queue:
        self._Retry()
      else:
        # Tell the user why we're exiting. The failed set is sorted so the
        # report is the same from run to run.
        if self._failed:
          print('Packages failed:\n\t%s' % '\n\t'.join(sorted(self._failed)))
          status_file = os.environ.get("PARALLEL_EMERGE_STATUS_FILE")
          if status_file:
            failed_pkgs = sorted(set(portage.versions.cpv_getkey(x)
                                     for x in self._failed))
            with open(status_file, "a") as f:
              f.write("%s\n" % " ".join(failed_pkgs))
        else:
          print("Deadlock! Circular dependencies!")
        sys.exit(1)

    # Wait up to 12 * 5 = 60 seconds for a job update, trying to schedule
    # more work every time the wait times out.
    for _ in range(12):
      try:
        job = self._job_queue.get(timeout=5)
        break
      except Queue.Empty:
        # Check if any more jobs can be scheduled.
        self._ScheduleLoop()
    else:
      # Print an update every 60 seconds.
      self._Status()
      continue

    target = job.target

    if job.fetch_only:
      if not job.done:
        self._fetch_jobs[job.target] = job
      else:
        state = self._state_map[job.target]
        state.prefetched = True
        state.fetched_successfully = (job.retcode == 0)
        del self._fetch_jobs[job.target]
        self._Print("Fetched %s in %2.2fs"
                    % (target, time.time() - job.start_timestamp))

        # Show the log when asked to or on failure; otherwise delete it.
        if self._show_output or job.retcode != 0:
          self._print_queue.put(JobPrinter(job, unlink=True))
        else:
          os.unlink(job.filename)
        # Failure or not, let build work with it next.
        if not self._deps_map[job.target]["needs"]:
          self._build_ready.put(state)
          self._ScheduleLoop()

        if self._unpack_only and job.retcode == 0:
          self._unpack_ready.put(state)
          self._ScheduleLoop(unpack_only=True)

        if self._fetch_ready:
          state = self._fetch_ready.get()
          self._fetch_queue.put(state)
          self._fetch_jobs[state.target] = None
        else:
          # Minor optimization; shut down fetchers early since we know
          # the queue is empty.
          self._fetch_queue.put(None)
      continue

    if job.unpack_only:
      if not job.done:
        self._unpack_jobs[target] = job
      else:
        del self._unpack_jobs[target]
        self._Print("Unpacked %s in %2.2fs"
                    % (target, time.time() - job.start_timestamp))
        if self._show_output or job.retcode != 0:
          self._print_queue.put(JobPrinter(job, unlink=True))
        else:
          os.unlink(job.filename)
        # Hand the next ready package to the unpack queue.
        if self._unpack_ready:
          state = self._unpack_ready.get()
          self._unpack_queue.put(state)
          self._unpack_jobs[state.target] = None
      continue

    # Everything below handles build jobs.
    if not job.done:
      self._build_jobs[target] = job
      self._Print("Started %s (logged in %s)" % (target, job.filename))
      continue

    # Print output of job
    if self._show_output or job.retcode != 0:
      self._print_queue.put(JobPrinter(job, unlink=True))
    else:
      os.unlink(job.filename)
    del self._build_jobs[target]

    seconds = time.time() - job.start_timestamp
    details = "%s (in %dm%.1fs)" % (target, seconds / 60, seconds % 60)
    previously_failed = target in self._failed

    # Complain if necessary.
    if job.retcode != 0:
      # Handle job failure.
      if previously_failed:
        # If this job has failed previously, give up.
        self._Print("Failed %s. Your build has failed." % details)
      else:
        # Queue up this build to try again after a long while.
        retried.add(target)
        self._retry_queue.append(self._state_map[target])
        self._failed.add(target)
        self._Print("Failed %s, retrying later." % details)
    else:
      if previously_failed:
        # Remove target from list of failed packages.
        self._failed.remove(target)

      self._Print("Completed %s" % details)

      # Mark as completed and unblock waiting ebuilds.
      self._Finish(target)

      if previously_failed and self._retry_queue:
        # If we have successfully retried a failed package, and there
        # are more failed packages, try the next one. We will only have
        # one retrying package actively running at a time.
        self._Retry()

    # Schedule pending jobs and print an update.
    self._ScheduleLoop()
    self._Status()

  # If packages were retried, output a warning.
  if retried:
    self._Print("")
    self._Print("WARNING: The following packages failed the first time,")
    self._Print("but succeeded upon retry. This might indicate incorrect")
    self._Print("dependencies.")
    for pkg in retried:
      self._Print(" %s" % pkg)
    self._Print("@@@STEP_WARNINGS@@@")
    self._Print("")

  # Tell child threads to exit.
  self._Print("Merge complete")
David Jamesfcb70ef2011-02-02 16:02:30 -08001771
1772
def main(argv):
  """Run real_main, then reap multiprocessing's leftover feeder threads.

  Args:
    argv: Command line arguments, passed through to real_main unchanged.

  Returns:
    Whatever real_main returns.
  """
  try:
    return real_main(argv)
  finally:
    # Work around multiprocessing sucking and not cleaning up after itself.
    # http://bugs.python.org/issue4106;
    # Step one; ensure GC is ran *prior* to the VM starting shutdown.
    gc.collect()
    # Step two; go looking for those threads and try to manually reap
    # them if we can.
    for thread in threading.enumerate():
      if thread.name != 'QueueFeederThread':
        continue
      # If ident is None, the thread wasn't started.
      if thread.ident is None:
        continue
      thread.join(1)
David Jamesfcb70ef2011-02-02 16:02:30 -08001788
Brian Harring8294d652012-05-23 02:20:52 -07001789
def real_main(argv):
  """Compute the dependency graph for the request and merge it in parallel.

  If an emerge action was requested, the call is handed straight to
  emerge_main. If sys-apps/portage itself is part of the merge on the "/"
  root, portage is upgraded first and parallel_emerge is then re-executed
  through sudo for the remaining packages.

  Args:
    argv: Command line arguments.

  Returns:
    The exit status: 0 on success, 1 on usage or permission errors, or the
    status returned by emerge_main. Does not return when the process is
    re-executed after a portage upgrade.
  """
  parallel_emerge_args = argv[:]
  deps = DepGraphGenerator()
  deps.Initialize(parallel_emerge_args)
  emerge = deps.emerge

  if emerge.action is not None:
    argv = deps.ParseParallelEmergeArgs(argv)
    return emerge_main(argv)
  elif not emerge.cmdline_packages:
    Usage()
    return 1

  # Unless we're in pretend mode, there's not much point running without
  # root access. We need to be able to install packages.
  #
  # NOTE: Even if you're running --pretend, it's a good idea to run
  #       parallel_emerge with root access so that portage can write to the
  #       dependency cache. This is important for performance.
  if "--pretend" not in emerge.opts and portage.data.secpass < 2:
    print("parallel_emerge: superuser access is required.")
    return 1

  if "--quiet" not in emerge.opts:
    cmdline_packages = " ".join(emerge.cmdline_packages)
    print("Starting fast-emerge.")
    print(" Building package %s on %s" % (cmdline_packages,
                                          deps.board or "root"))

  deps_tree, deps_info = deps.GenDependencyTree()

  # You want me to be verbose? I'll give you two trees! Twice as much value.
  if "--tree" in emerge.opts and "--verbose" in emerge.opts:
    deps.PrintTree(deps_tree)

  deps_graph = deps.GenDependencyGraph(deps_tree, deps_info)

  # OK, time to print out our progress so far.
  deps.PrintInstallPlan(deps_graph)
  if "--tree" in emerge.opts:
    PrintDepsMap(deps_graph)

  # Are we upgrading portage? If so, and there are more packages to merge,
  # schedule a restart of parallel_emerge to merge the rest. This ensures that
  # we pick up all updates to portage settings before merging any more
  # packages.
  portage_upgrade = False
  root = emerge.settings["ROOT"]
  # pylint: disable=W0212
  final_db = emerge.depgraph._dynamic_config.mydbapi[root]
  if root == "/":
    for db_pkg in final_db.match_pkgs("sys-apps/portage"):
      portage_pkg = deps_graph.get(db_pkg.cpv)
      if portage_pkg:
        portage_upgrade = True
        if "--quiet" not in emerge.opts:
          print("Upgrading portage first, then restarting...")

  # Upgrade Portage first, then the rest of the packages.
  #
  # In order to grant the child permission to run setsid, we need to run sudo
  # again. We preserve SUDO_USER here in case an ebuild depends on it.
  if portage_upgrade:
    # Calculate what arguments to use when re-invoking.
    args = ["sudo", "-E", "SUDO_USER=%s" % os.environ.get("SUDO_USER", "")]
    args += [os.path.abspath(sys.argv[0])] + parallel_emerge_args
    args += ["--exclude=sys-apps/portage"]

    # First upgrade Portage.
    passthrough_args = ("--quiet", "--pretend", "--verbose")
    emerge_args = [k for k in emerge.opts if k in passthrough_args]
    ret = emerge_main(emerge_args + ["portage"])
    if ret != 0:
      return ret

    # Now upgrade the rest. exec replaces this process without flushing
    # Python's file buffers, so flush explicitly or anything printed above
    # can be lost when stdout is not a terminal.
    sys.stdout.flush()
    sys.stderr.flush()
    os.execvp(args[0], args)

  # Run the queued emerges.
  scheduler = EmergeQueue(deps_graph, emerge, deps.package_db, deps.show_output,
                          deps.unpack_only)
  try:
    scheduler.Run()
  finally:
    # Always stop the workers, even if Run raised or called sys.exit.
    # pylint: disable=W0212
    scheduler._Shutdown()
  scheduler = None

  clean_logs(emerge.settings)

  print("Done")
  return 0