blob: 811c6cc8577b7d929940c7b69e582cc8c01bede0 [file] [log] [blame]
Mike Frysinger9f7e4ee2013-03-13 15:43:03 -04001#!/usr/bin/python
Mike Frysinger0a647fc2012-08-06 14:36:05 -04002# Copyright (c) 2012 The Chromium OS Authors. All rights reserved.
David Jamesfcb70ef2011-02-02 16:02:30 -08003# Use of this source code is governed by a BSD-style license that can be
4# found in the LICENSE file.
5
6"""Program to run emerge in parallel, for significant speedup.
7
8Usage:
David James386ccd12011-05-04 20:17:42 -07009 ./parallel_emerge [--board=BOARD] [--workon=PKGS]
David Jamesfcb70ef2011-02-02 16:02:30 -080010 [--force-remote-binary=PKGS] [emerge args] package
11
David James78b6cd92012-04-02 21:36:12 -070012This script runs multiple emerge processes in parallel, using appropriate
13Portage APIs. It is faster than standard emerge because it has a
14multiprocess model instead of an asynchronous model.
David Jamesfcb70ef2011-02-02 16:02:30 -080015"""
16
17import codecs
18import copy
19import errno
Brian Harring8294d652012-05-23 02:20:52 -070020import gc
David James8c7e5e32011-06-28 11:26:03 -070021import heapq
David Jamesfcb70ef2011-02-02 16:02:30 -080022import multiprocessing
23import os
Mike Frysinger1ae28092013-10-17 17:17:22 -040024try:
25 import Queue
26except ImportError:
27 # Python-3 renamed to "queue". We still use Queue to avoid collisions
28 # with naming variables as "queue". Maybe we'll transition at some point.
29 # pylint: disable=F0401
30 import queue as Queue
David Jamesfcb70ef2011-02-02 16:02:30 -080031import signal
32import sys
33import tempfile
Brian Harring8294d652012-05-23 02:20:52 -070034import threading
David Jamesfcb70ef2011-02-02 16:02:30 -080035import time
36import traceback
David Jamesfcb70ef2011-02-02 16:02:30 -080037
Thiago Goncalesf4acc422013-07-17 10:26:35 -070038from chromite.lib import cros_build_lib
David James6d47d8c2014-04-24 09:40:05 -070039from chromite.lib import osutils
Thiago Goncalesf4acc422013-07-17 10:26:35 -070040
David Jamesfcb70ef2011-02-02 16:02:30 -080041# If PORTAGE_USERNAME isn't specified, scrape it from the $HOME variable. On
42# Chromium OS, the default "portage" user doesn't have the necessary
43# permissions. It'd be easier if we could default to $USERNAME, but $USERNAME
44# is "root" here because we get called through sudo.
45#
46# We need to set this before importing any portage modules, because portage
47# looks up "PORTAGE_USERNAME" at import time.
48#
49# NOTE: .bashrc sets PORTAGE_USERNAME = $USERNAME, so most people won't
50# encounter this case unless they have an old chroot or blow away the
51# environment by running sudo without the -E specifier.
if "PORTAGE_USERNAME" not in os.environ:
  homedir = os.environ.get("HOME")
  if homedir:
    # Strip trailing slashes before taking the basename: for a HOME such as
    # "/home/user/", os.path.basename() returns "", which would export an
    # empty PORTAGE_USERNAME. Leave the variable unset if no name is found.
    username = os.path.basename(homedir.rstrip("/"))
    if username:
      os.environ["PORTAGE_USERNAME"] = username
56
57# Portage doesn't expose dependency trees in its public API, so we have to
58# make use of some private APIs here. These modules are found under
59# /usr/lib/portage/pym/.
60#
61# TODO(davidjames): Update Portage to expose public APIs for these features.
Don Garrett25f309a2014-03-19 14:02:12 -070062# pylint: disable=F0401
David Jamesfcb70ef2011-02-02 16:02:30 -080063from _emerge.actions import adjust_configs
64from _emerge.actions import load_emerge_config
65from _emerge.create_depgraph_params import create_depgraph_params
David James386ccd12011-05-04 20:17:42 -070066from _emerge.depgraph import backtrack_depgraph
Mike Frysinger901eaad2012-10-10 18:18:03 -040067try:
68 from _emerge.main import clean_logs
69except ImportError:
70 # Older portage versions did not provide clean_logs, so stub it.
71 # We need this if running in an older chroot that hasn't yet upgraded
72 # the portage version.
73 clean_logs = lambda x: None
David Jamesfcb70ef2011-02-02 16:02:30 -080074from _emerge.main import emerge_main
75from _emerge.main import parse_opts
76from _emerge.Package import Package
77from _emerge.Scheduler import Scheduler
David Jamesfcb70ef2011-02-02 16:02:30 -080078from _emerge.stdout_spinner import stdout_spinner
David James386ccd12011-05-04 20:17:42 -070079from portage._global_updates import _global_updates
David Jamesfcb70ef2011-02-02 16:02:30 -080080import portage
81import portage.debug
Don Garrettf8bf7842014-03-20 17:03:42 -070082# pylint: enable=F0401
Mike Frysinger91d7da92013-02-19 15:53:46 -050083
David Jamesfcb70ef2011-02-02 16:02:30 -080084
def Usage():
  """Print the parallel_emerge usage summary to stdout."""
  # One entry per output line; "" produces a blank separator line. Each line
  # is emitted with print(<single string>), which behaves identically as a
  # Python 2 print statement and as the Python 3 print function.
  lines = (
      "Usage:",
      " ./parallel_emerge [--board=BOARD] [--workon=PKGS]",
      " [--rebuild] [emerge args] package",
      "",
      "Packages specified as workon packages are always built from source.",
      "",
      "The --workon argument is mainly useful when you want to build and",
      "install packages that you are working on unconditionally, but do not",
      "want to have to rev the package to indicate you want to build it from",
      "source. The build_packages script will automatically supply the",
      "workon argument to emerge, ensuring that packages selected using",
      "cros-workon are rebuilt.",
      "",
      "The --rebuild option rebuilds packages whenever their dependencies",
      "are changed. This ensures that your build is correct.",
  )
  for line in lines:
    print(line)
David Jamesfcb70ef2011-02-02 16:02:30 -0800102
103
# Global start time: the time.time() value captured when this module is
# loaded.
GLOBAL_START = time.time()

# Whether process has been killed by a signal. This is a multiprocessing
# Event rather than a plain boolean (presumably so that worker processes can
# observe it too -- confirm against the code that sets it).
KILLED = multiprocessing.Event()
109
David Jamesfcb70ef2011-02-02 16:02:30 -0800110
class EmergeData(object):
  """Plain container bundling the emerge state we pass around as a unit.

  The fields are used for calculating dependencies and installing packages.
  Every field starts out as None and is filled in by the caller.

  Attributes:
    action: The action the user requested. None when the user is installing
      packages; otherwise the action name, which maps exactly to the
      long-form name of the associated emerge option. Example: for
      "parallel_emerge --unmerge package" the action name is "unmerge".
    cmdline_packages: The list of packages the user passed on the
      command-line.
    depgraph: The emerge dependency graph. It contains all the packages
      involved in this merge, along with their versions.
    favorites: The list of candidates to add to the world file.
    mtimedb: A dictionary used by portage to maintain global state. It is
      loaded from disk when portage starts up and saved to disk whenever
      mtimedb.commit() is called. It holds information about global updates
      (i.e., what version of portage we have) and what portage is currently
      doing, which is what lets plain emerge support --resume.
      parallel_emerge does not record what it is doing in the mtimedb, so
      --resume is not supported here.
    opts: A dict of the options passed to emerge, as cleaned up by
      parse_opts so the emerge code can inspect it more easily. Emerge takes
      a few shortcuts in that cleanup: for example, "--usepkg=n" (the
      default) is simply left out of the dict, so the presence of "--usepkg"
      means it is enabled. Not every option is cleaned up this way (e.g.
      --with-bdeps is passed in as-is); see parse_opts in _emerge.main for
      the full list.
    root_config: The portage configuration for our current root. It contains
      the portage settings and the three portage trees for that root (see
      "settings" and "trees").
    scheduler_graph: The graph emerge uses to calculate what packages to
      install. We don't actually install any deps, so it isn't really used,
      but it is passed to the Scheduler object anyway.
    settings: Portage settings for our current session. Most of these are
      set in make.conf inside our current install root.
    spinner: The spinner, which spews stuff to stdout to indicate that
      portage is doing something. We maintain our own spinner, so the
      portage spinner is put in "silent" mode.
    trees: The portage trees; there is a separate set for each root. The
      trees for the current root are self.trees[root], where
      root = self.settings["ROOT"]. Each root has three trees:
        - vartree: A database of the currently-installed packages.
        - porttree: A database of ebuilds, that can be used to build
          packages.
        - bintree: A database of binary packages.
  """

  __slots__ = ["action", "cmdline_packages", "depgraph", "favorites",
               "mtimedb", "opts", "root_config", "scheduler_graph",
               "settings", "spinner", "trees"]

  def __init__(self):
    # Every slot starts out unset; see the class docstring for what each one
    # holds once populated.
    for slot in self.__slots__:
      setattr(self, slot, None)
201
202
203class DepGraphGenerator(object):
204 """Grab dependency information about packages from portage.
205
206 Typical usage:
207 deps = DepGraphGenerator()
208 deps.Initialize(sys.argv[1:])
209 deps_tree, deps_info = deps.GenDependencyTree()
210 deps_graph = deps.GenDependencyGraph(deps_tree, deps_info)
211 deps.PrintTree(deps_tree)
212 PrintDepsMap(deps_graph)
213 """
214
Thiago Goncalesf4acc422013-07-17 10:26:35 -0700215 __slots__ = ["board", "emerge", "package_db", "show_output", "unpack_only"]
David Jamesfcb70ef2011-02-02 16:02:30 -0800216
217 def __init__(self):
218 self.board = None
219 self.emerge = EmergeData()
David Jamesfcb70ef2011-02-02 16:02:30 -0800220 self.package_db = {}
David Jamesfcb70ef2011-02-02 16:02:30 -0800221 self.show_output = False
Thiago Goncalesf4acc422013-07-17 10:26:35 -0700222 self.unpack_only = False
David Jamesfcb70ef2011-02-02 16:02:30 -0800223
224 def ParseParallelEmergeArgs(self, argv):
225 """Read the parallel emerge arguments from the command-line.
226
227 We need to be compatible with emerge arg format. We scrape arguments that
228 are specific to parallel_emerge, and pass through the rest directly to
229 emerge.
Mike Frysinger1a736a82013-12-12 01:50:59 -0500230
David Jamesfcb70ef2011-02-02 16:02:30 -0800231 Args:
232 argv: arguments list
Mike Frysinger1a736a82013-12-12 01:50:59 -0500233
David Jamesfcb70ef2011-02-02 16:02:30 -0800234 Returns:
235 Arguments that don't belong to parallel_emerge
236 """
237 emerge_args = []
238 for arg in argv:
239 # Specifically match arguments that are specific to parallel_emerge, and
240 # pass through the rest.
241 if arg.startswith("--board="):
242 self.board = arg.replace("--board=", "")
243 elif arg.startswith("--workon="):
244 workon_str = arg.replace("--workon=", "")
David James7a1ea4b2011-10-13 15:06:41 -0700245 emerge_args.append("--reinstall-atoms=%s" % workon_str)
246 emerge_args.append("--usepkg-exclude=%s" % workon_str)
David Jamesfcb70ef2011-02-02 16:02:30 -0800247 elif arg.startswith("--force-remote-binary="):
248 force_remote_binary = arg.replace("--force-remote-binary=", "")
David James7a1ea4b2011-10-13 15:06:41 -0700249 emerge_args.append("--useoldpkg-atoms=%s" % force_remote_binary)
David Jamesfcb70ef2011-02-02 16:02:30 -0800250 elif arg == "--show-output":
251 self.show_output = True
David James386ccd12011-05-04 20:17:42 -0700252 elif arg == "--rebuild":
David James7a1ea4b2011-10-13 15:06:41 -0700253 emerge_args.append("--rebuild-if-unbuilt")
Thiago Goncalesf4acc422013-07-17 10:26:35 -0700254 elif arg == "--unpackonly":
255 emerge_args.append("--fetchonly")
256 self.unpack_only = True
David Jamesfcb70ef2011-02-02 16:02:30 -0800257 else:
258 # Not one of our options, so pass through to emerge.
259 emerge_args.append(arg)
260
David James386ccd12011-05-04 20:17:42 -0700261 # These packages take a really long time to build, so, for expediency, we
262 # are blacklisting them from automatic rebuilds because one of their
263 # dependencies needs to be recompiled.
Mike Frysinger5c2a9052014-04-15 15:52:04 -0400264 for pkg in ("chromeos-base/chromeos-chrome",):
David James7a1ea4b2011-10-13 15:06:41 -0700265 emerge_args.append("--rebuild-exclude=%s" % pkg)
David Jamesfcb70ef2011-02-02 16:02:30 -0800266
267 return emerge_args
268
269 def Initialize(self, args):
270 """Initializer. Parses arguments and sets up portage state."""
271
272 # Parse and strip out args that are just intended for parallel_emerge.
273 emerge_args = self.ParseParallelEmergeArgs(args)
274
275 # Setup various environment variables based on our current board. These
276 # variables are normally setup inside emerge-${BOARD}, but since we don't
277 # call that script, we have to set it up here. These variables serve to
278 # point our tools at /build/BOARD and to setup cross compiles to the
279 # appropriate board as configured in toolchain.conf.
280 if self.board:
Yu-Ju Hongdd9bb2b2014-01-03 17:08:26 -0800281 sysroot = cros_build_lib.GetSysroot(board=self.board)
282 os.environ["PORTAGE_CONFIGROOT"] = sysroot
283 os.environ["PORTAGE_SYSROOT"] = sysroot
284 os.environ["SYSROOT"] = sysroot
David Jamesfcb70ef2011-02-02 16:02:30 -0800285
286 # Although CHROMEOS_ROOT isn't specific to boards, it's normally setup
287 # inside emerge-${BOARD}, so we set it up here for compatibility. It
288 # will be going away soon as we migrate to CROS_WORKON_SRCROOT.
289 os.environ.setdefault("CHROMEOS_ROOT", os.environ["HOME"] + "/trunk")
290
291 # Turn off interactive delays
292 os.environ["EBEEP_IGNORE"] = "1"
293 os.environ["EPAUSE_IGNORE"] = "1"
Mike Frysinger0a647fc2012-08-06 14:36:05 -0400294 os.environ["CLEAN_DELAY"] = "0"
David Jamesfcb70ef2011-02-02 16:02:30 -0800295
296 # Parse the emerge options.
David Jamesea3ca332011-05-26 11:48:29 -0700297 action, opts, cmdline_packages = parse_opts(emerge_args, silent=True)
David Jamesfcb70ef2011-02-02 16:02:30 -0800298
299 # Set environment variables based on options. Portage normally sets these
300 # environment variables in emerge_main, but we can't use that function,
301 # because it also does a bunch of other stuff that we don't want.
302 # TODO(davidjames): Patch portage to move this logic into a function we can
303 # reuse here.
304 if "--debug" in opts:
305 os.environ["PORTAGE_DEBUG"] = "1"
306 if "--config-root" in opts:
307 os.environ["PORTAGE_CONFIGROOT"] = opts["--config-root"]
308 if "--root" in opts:
309 os.environ["ROOT"] = opts["--root"]
310 if "--accept-properties" in opts:
311 os.environ["ACCEPT_PROPERTIES"] = opts["--accept-properties"]
312
David James88d780c2014-02-05 13:03:29 -0800313 # If we're installing packages to the board, we can disable vardb locks.
314 # This is safe because we only run up to one instance of parallel_emerge in
315 # parallel.
316 # TODO(davidjames): Enable this for the host too.
317 if self.board:
David Jamesfcb70ef2011-02-02 16:02:30 -0800318 os.environ.setdefault("PORTAGE_LOCKS", "false")
David Jamesfcb70ef2011-02-02 16:02:30 -0800319
320 # Now that we've setup the necessary environment variables, we can load the
321 # emerge config from disk.
322 settings, trees, mtimedb = load_emerge_config()
323
David Jamesea3ca332011-05-26 11:48:29 -0700324 # Add in EMERGE_DEFAULT_OPTS, if specified.
325 tmpcmdline = []
326 if "--ignore-default-opts" not in opts:
327 tmpcmdline.extend(settings["EMERGE_DEFAULT_OPTS"].split())
328 tmpcmdline.extend(emerge_args)
329 action, opts, cmdline_packages = parse_opts(tmpcmdline)
330
331 # If we're installing to the board, we want the --root-deps option so that
332 # portage will install the build dependencies to that location as well.
333 if self.board:
334 opts.setdefault("--root-deps", True)
335
David Jamesfcb70ef2011-02-02 16:02:30 -0800336 # Check whether our portage tree is out of date. Typically, this happens
337 # when you're setting up a new portage tree, such as in setup_board and
338 # make_chroot. In that case, portage applies a bunch of global updates
339 # here. Once the updates are finished, we need to commit any changes
340 # that the global update made to our mtimedb, and reload the config.
341 #
342 # Portage normally handles this logic in emerge_main, but again, we can't
343 # use that function here.
344 if _global_updates(trees, mtimedb["updates"]):
345 mtimedb.commit()
346 settings, trees, mtimedb = load_emerge_config(trees=trees)
347
348 # Setup implied options. Portage normally handles this logic in
349 # emerge_main.
350 if "--buildpkgonly" in opts or "buildpkg" in settings.features:
351 opts.setdefault("--buildpkg", True)
352 if "--getbinpkgonly" in opts:
353 opts.setdefault("--usepkgonly", True)
354 opts.setdefault("--getbinpkg", True)
355 if "getbinpkg" in settings.features:
356 # Per emerge_main, FEATURES=getbinpkg overrides --getbinpkg=n
357 opts["--getbinpkg"] = True
358 if "--getbinpkg" in opts or "--usepkgonly" in opts:
359 opts.setdefault("--usepkg", True)
360 if "--fetch-all-uri" in opts:
361 opts.setdefault("--fetchonly", True)
362 if "--skipfirst" in opts:
363 opts.setdefault("--resume", True)
364 if "--buildpkgonly" in opts:
365 # --buildpkgonly will not merge anything, so it overrides all binary
366 # package options.
367 for opt in ("--getbinpkg", "--getbinpkgonly",
368 "--usepkg", "--usepkgonly"):
369 opts.pop(opt, None)
370 if (settings.get("PORTAGE_DEBUG", "") == "1" and
371 "python-trace" in settings.features):
372 portage.debug.set_trace(True)
373
374 # Complain about unsupported options
David James386ccd12011-05-04 20:17:42 -0700375 for opt in ("--ask", "--ask-enter-invalid", "--resume", "--skipfirst"):
David Jamesfcb70ef2011-02-02 16:02:30 -0800376 if opt in opts:
377 print "%s is not supported by parallel_emerge" % opt
378 sys.exit(1)
379
380 # Make emerge specific adjustments to the config (e.g. colors!)
381 adjust_configs(opts, trees)
382
383 # Save our configuration so far in the emerge object
384 emerge = self.emerge
385 emerge.action, emerge.opts = action, opts
386 emerge.settings, emerge.trees, emerge.mtimedb = settings, trees, mtimedb
387 emerge.cmdline_packages = cmdline_packages
388 root = settings["ROOT"]
389 emerge.root_config = trees[root]["root_config"]
390
David James386ccd12011-05-04 20:17:42 -0700391 if "--usepkg" in opts:
David Jamesfcb70ef2011-02-02 16:02:30 -0800392 emerge.trees[root]["bintree"].populate("--getbinpkg" in opts)
393
David Jamesfcb70ef2011-02-02 16:02:30 -0800394 def CreateDepgraph(self, emerge, packages):
395 """Create an emerge depgraph object."""
396 # Setup emerge options.
397 emerge_opts = emerge.opts.copy()
398
David James386ccd12011-05-04 20:17:42 -0700399 # Ask portage to build a dependency graph. with the options we specified
400 # above.
David Jamesfcb70ef2011-02-02 16:02:30 -0800401 params = create_depgraph_params(emerge_opts, emerge.action)
David Jamesbf1e3442011-05-28 07:44:20 -0700402 success, depgraph, favorites = backtrack_depgraph(
David James386ccd12011-05-04 20:17:42 -0700403 emerge.settings, emerge.trees, emerge_opts, params, emerge.action,
404 packages, emerge.spinner)
405 emerge.depgraph = depgraph
David Jamesfcb70ef2011-02-02 16:02:30 -0800406
David James386ccd12011-05-04 20:17:42 -0700407 # Is it impossible to honor the user's request? Bail!
408 if not success:
409 depgraph.display_problems()
410 sys.exit(1)
David Jamesfcb70ef2011-02-02 16:02:30 -0800411
412 emerge.depgraph = depgraph
David Jamesbf1e3442011-05-28 07:44:20 -0700413 emerge.favorites = favorites
David Jamesfcb70ef2011-02-02 16:02:30 -0800414
David Jamesdeebd692011-05-09 17:02:52 -0700415 # Prime and flush emerge caches.
416 root = emerge.settings["ROOT"]
417 vardb = emerge.trees[root]["vartree"].dbapi
David James0bdc5de2011-05-12 16:22:26 -0700418 if "--pretend" not in emerge.opts:
419 vardb.counter_tick()
David Jamesdeebd692011-05-09 17:02:52 -0700420 vardb.flush_cache()
421
David James386ccd12011-05-04 20:17:42 -0700422 def GenDependencyTree(self):
David Jamesfcb70ef2011-02-02 16:02:30 -0800423 """Get dependency tree info from emerge.
424
David Jamesfcb70ef2011-02-02 16:02:30 -0800425 Returns:
426 Dependency tree
427 """
428 start = time.time()
429
430 emerge = self.emerge
431
432 # Create a list of packages to merge
433 packages = set(emerge.cmdline_packages[:])
David Jamesfcb70ef2011-02-02 16:02:30 -0800434
435 # Tell emerge to be quiet. We print plenty of info ourselves so we don't
436 # need any extra output from portage.
437 portage.util.noiselimit = -1
438
439 # My favorite feature: The silent spinner. It doesn't spin. Ever.
440 # I'd disable the colors by default too, but they look kind of cool.
441 emerge.spinner = stdout_spinner()
442 emerge.spinner.update = emerge.spinner.update_quiet
443
444 if "--quiet" not in emerge.opts:
445 print "Calculating deps..."
446
447 self.CreateDepgraph(emerge, packages)
448 depgraph = emerge.depgraph
449
450 # Build our own tree from the emerge digraph.
451 deps_tree = {}
Don Garrett25f309a2014-03-19 14:02:12 -0700452 # pylint: disable=W0212
David Jamesfcb70ef2011-02-02 16:02:30 -0800453 digraph = depgraph._dynamic_config.digraph
David James3f778802011-08-25 19:31:45 -0700454 root = emerge.settings["ROOT"]
455 final_db = depgraph._dynamic_config.mydbapi[root]
David Jamesfcb70ef2011-02-02 16:02:30 -0800456 for node, node_deps in digraph.nodes.items():
457 # Calculate dependency packages that need to be installed first. Each
458 # child on the digraph is a dependency. The "operation" field specifies
459 # what we're doing (e.g. merge, uninstall, etc.). The "priorities" array
460 # contains the type of dependency (e.g. build, runtime, runtime_post,
461 # etc.)
462 #
David Jamesfcb70ef2011-02-02 16:02:30 -0800463 # Portage refers to the identifiers for packages as a CPV. This acronym
464 # stands for Component/Path/Version.
465 #
466 # Here's an example CPV: chromeos-base/power_manager-0.0.1-r1
467 # Split up, this CPV would be:
468 # C -- Component: chromeos-base
469 # P -- Path: power_manager
470 # V -- Version: 0.0.1-r1
471 #
472 # We just refer to CPVs as packages here because it's easier.
473 deps = {}
474 for child, priorities in node_deps[0].items():
David James3f778802011-08-25 19:31:45 -0700475 if isinstance(child, Package) and child.root == root:
476 cpv = str(child.cpv)
477 action = str(child.operation)
478
479 # If we're uninstalling a package, check whether Portage is
480 # installing a replacement. If so, just depend on the installation
481 # of the new package, because the old package will automatically
482 # be uninstalled at that time.
483 if action == "uninstall":
484 for pkg in final_db.match_pkgs(child.slot_atom):
485 cpv = str(pkg.cpv)
486 action = "merge"
487 break
488
489 deps[cpv] = dict(action=action,
490 deptypes=[str(x) for x in priorities],
491 deps={})
David Jamesfcb70ef2011-02-02 16:02:30 -0800492
493 # We've built our list of deps, so we can add our package to the tree.
David James3f778802011-08-25 19:31:45 -0700494 if isinstance(node, Package) and node.root == root:
David Jamesfcb70ef2011-02-02 16:02:30 -0800495 deps_tree[str(node.cpv)] = dict(action=str(node.operation),
496 deps=deps)
497
David Jamesfcb70ef2011-02-02 16:02:30 -0800498 # Ask portage for its install plan, so that we can only throw out
David James386ccd12011-05-04 20:17:42 -0700499 # dependencies that portage throws out.
David Jamesfcb70ef2011-02-02 16:02:30 -0800500 deps_info = {}
501 for pkg in depgraph.altlist():
502 if isinstance(pkg, Package):
David James3f778802011-08-25 19:31:45 -0700503 assert pkg.root == root
David Jamesfcb70ef2011-02-02 16:02:30 -0800504 self.package_db[pkg.cpv] = pkg
505
David Jamesfcb70ef2011-02-02 16:02:30 -0800506 # Save off info about the package
David James386ccd12011-05-04 20:17:42 -0700507 deps_info[str(pkg.cpv)] = {"idx": len(deps_info)}
David Jamesfcb70ef2011-02-02 16:02:30 -0800508
509 seconds = time.time() - start
510 if "--quiet" not in emerge.opts:
511 print "Deps calculated in %dm%.1fs" % (seconds / 60, seconds % 60)
512
513 return deps_tree, deps_info
514
515 def PrintTree(self, deps, depth=""):
516 """Print the deps we have seen in the emerge output.
517
518 Args:
519 deps: Dependency tree structure.
520 depth: Allows printing the tree recursively, with indentation.
521 """
522 for entry in sorted(deps):
523 action = deps[entry]["action"]
524 print "%s %s (%s)" % (depth, entry, action)
525 self.PrintTree(deps[entry]["deps"], depth=depth + " ")
526
David James386ccd12011-05-04 20:17:42 -0700527 def GenDependencyGraph(self, deps_tree, deps_info):
David Jamesfcb70ef2011-02-02 16:02:30 -0800528 """Generate a doubly linked dependency graph.
529
530 Args:
531 deps_tree: Dependency tree structure.
532 deps_info: More details on the dependencies.
Mike Frysinger1a736a82013-12-12 01:50:59 -0500533
David Jamesfcb70ef2011-02-02 16:02:30 -0800534 Returns:
535 Deps graph in the form of a dict of packages, with each package
536 specifying a "needs" list and "provides" list.
537 """
538 emerge = self.emerge
David Jamesfcb70ef2011-02-02 16:02:30 -0800539
David Jamesfcb70ef2011-02-02 16:02:30 -0800540 # deps_map is the actual dependency graph.
541 #
542 # Each package specifies a "needs" list and a "provides" list. The "needs"
543 # list indicates which packages we depend on. The "provides" list
544 # indicates the reverse dependencies -- what packages need us.
545 #
546 # We also provide some other information in the dependency graph:
547 # - action: What we're planning on doing with this package. Generally,
548 # "merge", "nomerge", or "uninstall"
David Jamesfcb70ef2011-02-02 16:02:30 -0800549 deps_map = {}
550
551 def ReverseTree(packages):
552 """Convert tree to digraph.
553
554 Take the tree of package -> requirements and reverse it to a digraph of
555 buildable packages -> packages they unblock.
Mike Frysinger1a736a82013-12-12 01:50:59 -0500556
David Jamesfcb70ef2011-02-02 16:02:30 -0800557 Args:
558 packages: Tree(s) of dependencies.
Mike Frysinger1a736a82013-12-12 01:50:59 -0500559
David Jamesfcb70ef2011-02-02 16:02:30 -0800560 Returns:
561 Unsanitized digraph.
562 """
David James8c7e5e32011-06-28 11:26:03 -0700563 binpkg_phases = set(["setup", "preinst", "postinst"])
David James3f778802011-08-25 19:31:45 -0700564 needed_dep_types = set(["blocker", "buildtime", "runtime"])
David Jamesfcb70ef2011-02-02 16:02:30 -0800565 for pkg in packages:
566
567 # Create an entry for the package
568 action = packages[pkg]["action"]
David James8c7e5e32011-06-28 11:26:03 -0700569 default_pkg = {"needs": {}, "provides": set(), "action": action,
570 "nodeps": False, "binary": False}
David Jamesfcb70ef2011-02-02 16:02:30 -0800571 this_pkg = deps_map.setdefault(pkg, default_pkg)
572
David James8c7e5e32011-06-28 11:26:03 -0700573 if pkg in deps_info:
574 this_pkg["idx"] = deps_info[pkg]["idx"]
575
576 # If a package doesn't have any defined phases that might use the
577 # dependent packages (i.e. pkg_setup, pkg_preinst, or pkg_postinst),
578 # we can install this package before its deps are ready.
579 emerge_pkg = self.package_db.get(pkg)
580 if emerge_pkg and emerge_pkg.type_name == "binary":
581 this_pkg["binary"] = True
Mike Frysingerfea6cfe2014-04-24 11:42:25 -0400582 defined_phases = emerge_pkg.metadata.defined_phases
David James8c7e5e32011-06-28 11:26:03 -0700583 defined_binpkg_phases = binpkg_phases.intersection(defined_phases)
584 if not defined_binpkg_phases:
585 this_pkg["nodeps"] = True
586
David Jamesfcb70ef2011-02-02 16:02:30 -0800587 # Create entries for dependencies of this package first.
588 ReverseTree(packages[pkg]["deps"])
589
590 # Add dependencies to this package.
591 for dep, dep_item in packages[pkg]["deps"].iteritems():
David James8c7e5e32011-06-28 11:26:03 -0700592 # We only need to enforce strict ordering of dependencies if the
David James3f778802011-08-25 19:31:45 -0700593 # dependency is a blocker, or is a buildtime or runtime dependency.
594 # (I.e., ignored, optional, and runtime_post dependencies don't
595 # depend on ordering.)
David James8c7e5e32011-06-28 11:26:03 -0700596 dep_types = dep_item["deptypes"]
597 if needed_dep_types.intersection(dep_types):
598 deps_map[dep]["provides"].add(pkg)
599 this_pkg["needs"][dep] = "/".join(dep_types)
David Jamesfcb70ef2011-02-02 16:02:30 -0800600
David James3f778802011-08-25 19:31:45 -0700601 # If there's a blocker, Portage may need to move files from one
602 # package to another, which requires editing the CONTENTS files of
603 # both packages. To avoid race conditions while editing this file,
604 # the two packages must not be installed in parallel, so we can't
605 # safely ignore dependencies. See http://crosbug.com/19328
606 if "blocker" in dep_types:
607 this_pkg["nodeps"] = False
608
David Jamesfcb70ef2011-02-02 16:02:30 -0800609 def FindCycles():
610 """Find cycles in the dependency tree.
611
612 Returns:
613 A dict mapping cyclic packages to a dict of the deps that cause
614 cycles. For each dep that causes cycles, it returns an example
615 traversal of the graph that shows the cycle.
616 """
617
618 def FindCyclesAtNode(pkg, cycles, unresolved, resolved):
619 """Find cycles in cyclic dependencies starting at specified package.
620
621 Args:
622 pkg: Package identifier.
623 cycles: A dict mapping cyclic packages to a dict of the deps that
624 cause cycles. For each dep that causes cycles, it returns an
625 example traversal of the graph that shows the cycle.
626 unresolved: Nodes that have been visited but are not fully processed.
627 resolved: Nodes that have been visited and are fully processed.
628 """
629 pkg_cycles = cycles.get(pkg)
630 if pkg in resolved and not pkg_cycles:
631 # If we already looked at this package, and found no cyclic
632 # dependencies, we can stop now.
633 return
634 unresolved.append(pkg)
635 for dep in deps_map[pkg]["needs"]:
636 if dep in unresolved:
637 idx = unresolved.index(dep)
638 mycycle = unresolved[idx:] + [dep]
David James321490a2012-12-17 12:05:56 -0800639 for i in xrange(len(mycycle) - 1):
David Jamesfcb70ef2011-02-02 16:02:30 -0800640 pkg1, pkg2 = mycycle[i], mycycle[i+1]
641 cycles.setdefault(pkg1, {}).setdefault(pkg2, mycycle)
642 elif not pkg_cycles or dep not in pkg_cycles:
643 # Looks like we haven't seen this edge before.
644 FindCyclesAtNode(dep, cycles, unresolved, resolved)
645 unresolved.pop()
646 resolved.add(pkg)
647
648 cycles, unresolved, resolved = {}, [], set()
649 for pkg in deps_map:
650 FindCyclesAtNode(pkg, cycles, unresolved, resolved)
651 return cycles
652
def RemoveUnusedPackages():
  """Drop packages that are not on the install list, rewiring their edges.

  Every package that is in deps_map but not in deps_info is deleted. Before
  a package goes away, each package it needs inherits its "provides"
  entries and each package it provides inherits its "needs" entries.
  """
  # Anything in the graph that is not on the install list gets removed.
  unwanted = set(deps_map) - set(deps_info)

  # Removing the packages we don't want simplifies the graph and makes it
  # easier for us to crack cycles.
  for doomed in sorted(unwanted):
    node = deps_map[doomed]
    upstream = node["needs"]
    downstream = node["provides"]

    # Each prerequisite now provides whatever the doomed package provided,
    # minus the doomed package itself and minus any self-edge.
    for prereq in upstream:
      prereq_provides = deps_map[prereq]["provides"]
      prereq_provides.update(downstream)
      prereq_provides.discard(doomed)
      prereq_provides.discard(prereq)

    # Each dependent now needs whatever the doomed package needed, again
    # minus the doomed package itself and minus any self-edge.
    for dependent in downstream:
      dependent_needs = deps_map[dependent]["needs"]
      dependent_needs.update(upstream)
      dependent_needs.pop(doomed, None)
      dependent_needs.pop(dependent, None)

    del deps_map[doomed]
675
def PrintCycleBreak(basedep, dep, mycycle):
  """Print details about a cycle edge that is about to be broken.

  The edge being broken is "dep needs basedep".

  Args:
    basedep: Package that dep currently needs.
    dep: Package whose dependency on basedep is being dropped.
    mycycle: Example cycle (a list of packages) containing dep -> basedep.
  """
  edge_kind = deps_map[dep]["needs"].get(basedep, "deleted")

  # It's OK to swap install order for blockers, as long as the two packages
  # aren't installed in parallel. If there is a cycle, then we know the
  # packages depend on each other already, so the blocker can be dropped
  # safely without printing a warning.
  if edge_kind == "blocker":
    return

  # Notify the user that we're breaking a cycle.
  print("Breaking %s -> %s (%s)" % (dep, basedep, edge_kind))

  # Show every edge of the example cycle, flagging the one being removed.
  for src, dst in zip(mycycle, mycycle[1:]):
    label = deps_map[src]["needs"].get(dst, "deleted")
    if src == dep and dst == basedep:
      label = label + ", deleting"
    print(" %s -> %s (%s)" % (src, dst, label))
704
def SanitizeTree():
  """Remove circular dependencies.

  Every dependency that takes part in a cycle and goes against the emerge
  ordering (as recorded by the "idx" values in deps_info) is pruned. This
  has a nice property: we're guaranteed to merge dependencies in the same
  order that portage does.

  Because no dependency is treated as "soft" unless it is killed by a cycle,
  a larger number of dependencies is honoured when merging. This hurts
  performance a bit, but helps reliability.
  """
  began = time.time()
  quiet = "--quiet" in emerge.opts

  # Breaking one batch of edges can leave other cycles behind, so keep
  # recomputing until none are reported.
  cycles = FindCycles()
  while cycles:
    for dep, by_basedep in cycles.iteritems():
      for basedep, example in by_basedep.iteritems():
        if deps_info[basedep]["idx"] >= deps_info[dep]["idx"]:
          if not quiet:
            PrintCycleBreak(basedep, dep, example)
          del deps_map[dep]["needs"][basedep]
          deps_map[basedep]["provides"].remove(dep)
    cycles = FindCycles()

  elapsed = time.time() - began
  if not quiet and elapsed >= 0.1:
    print("Tree sanitized in %dm%.1fs" % (elapsed / 60, elapsed % 60))
730
def FindRecursiveProvides(pkg, seen):
  """Compute the "tprovides" set (all nodes that require pkg) for a package.

  The result is stored in deps_map[pkg]["tprovides"]; it holds the direct
  "provides" of pkg plus the "tprovides" of each of them.

  Assumes that graph is acyclic.

  Args:
    pkg: Package identifier.
    seen: Set of nodes that have been visited so far; updated in place.
  """
  if pkg in seen:
    return
  seen.add(pkg)

  node = deps_map[pkg]
  direct = node["provides"]
  closure = direct.copy()
  node["tprovides"] = closure
  for child in direct:
    # Make sure the child's own closure exists before folding it in.
    FindRecursiveProvides(child, seen)
    closure.update(deps_map[child]["tprovides"])
748
David Jamesa22906f2011-05-04 19:53:26 -0700749 ReverseTree(deps_tree)
David Jamesa22906f2011-05-04 19:53:26 -0700750
David James386ccd12011-05-04 20:17:42 -0700751 # We need to remove unused packages so that we can use the dependency
752 # ordering of the install process to show us what cycles to crack.
753 RemoveUnusedPackages()
David Jamesfcb70ef2011-02-02 16:02:30 -0800754 SanitizeTree()
David James8c7e5e32011-06-28 11:26:03 -0700755 seen = set()
756 for pkg in deps_map:
757 FindRecursiveProvides(pkg, seen)
David Jamesfcb70ef2011-02-02 16:02:30 -0800758 return deps_map
759
def PrintInstallPlan(self, deps_map):
  """Print an emerge-style install plan.

  The install plan lists what packages we're installing, in order.
  It's useful for understanding what parallel_emerge is doing.

  If some packages can never have all of their prerequisites satisfied,
  they are reported as cyclic dependencies and the process exits with
  status 1.

  Args:
    deps_map: The dependency graph. It is deep-copied, not modified.
  """

  def CollectReady(root, graph):
    """Return root followed by every package it unblocks, depth first."""
    ordered = [root]
    for dependent in graph[root]["provides"]:
      remaining = graph[dependent]["needs"]
      del remaining[root]
      if not remaining:
        ordered.extend(CollectReady(dependent, graph))
    return ordered

  # Work on a private copy, since edges are deleted as packages are placed.
  deps_map = copy.deepcopy(deps_map)
  install_plan = []
  placed = set()
  for target, info in deps_map.items():
    if info["needs"] or target in placed:
      continue
    for name in CollectReady(target, deps_map):
      placed.add(name)
      install_plan.append(self.package_db[name])

  for name in placed:
    del deps_map[name]

  if deps_map:
    # Whatever is left never had its prerequisites satisfied.
    print(" ".join(["Cyclic dependencies:"] + list(deps_map)))
    PrintDepsMap(deps_map)
    sys.exit(1)

  self.emerge.depgraph.display(install_plan)
797
798
def PrintDepsMap(deps_map):
  """Print the dependency graph, listing each package's prerequisites.

  Args:
    deps_map: Dict mapping each package to a dict with "action" and "needs".
  """
  for pkg in sorted(deps_map):
    entry = deps_map[pkg]
    print("%s: (%s) needs" % (pkg, entry["action"]))
    prereqs = sorted(entry["needs"])
    if prereqs:
      for prereq in prereqs:
        print(" %s" % (prereq))
    else:
      print(" no dependencies")
808
809
class EmergeJobState(object):
  """Record describing one emerge job at a point in time.

  Workers create these records when a job starts and again when it
  finishes; the printing code updates the output bookkeeping fields.
  """

  __slots__ = [
      "done", "filename", "last_notify_timestamp", "last_output_seek",
      "last_output_timestamp", "pkgname", "retcode", "start_timestamp",
      "target", "fetch_only", "unpack_only",
  ]

  def __init__(self, target, pkgname, done, filename, start_timestamp,
               retcode=None, fetch_only=False, unpack_only=False):
    """Initialize the record.

    Args:
      target: Full name of the target we're building
        (e.g. virtual/target-os-1-r60).
      pkgname: Short name of the target (e.g. target-os-1-r60).
      done: True if the job is done; False otherwise.
      filename: The filename where output is currently stored.
      start_timestamp: The timestamp when the job started.
      retcode: The return code of the job, if it is actually finished.
      fetch_only: Was this just a fetch job?
      unpack_only: No emerge, only unpack packages.
    """
    # What is being built and how.
    self.target = target
    self.pkgname = pkgname
    self.fetch_only = fetch_only
    self.unpack_only = unpack_only

    # Progress and result.
    self.done = done
    self.retcode = retcode
    self.start_timestamp = start_timestamp

    # Output bookkeeping.
    self.filename = filename

    # Last time the name of the log file was printed. It is printed at the
    # beginning of the job, so this starts at start_timestamp.
    self.last_notify_timestamp = start_timestamp

    # Location (in bytes) of the end of the last complete line we printed.
    # Starts at zero; used to jump to the right place when output from the
    # same ebuild is printed multiple times.
    self.last_output_seek = 0

    # Last time output was printed. Nothing has been printed yet, so this
    # starts at zero.
    self.last_output_timestamp = 0
858
David Jamesfcb70ef2011-02-02 16:02:30 -0800859
def KillHandler(_signum, _frame):
  """Signal handler that kills this process and all of its subprocesses.

  Args:
    _signum: Signal number (unused).
    _frame: Interrupted stack frame (unused).
  """
  # Group 0 addresses our own process group, so this takes us down as well.
  own_group = 0
  os.killpg(own_group, signal.SIGKILL)
863
def SetupWorkerSignals():
  """Install SIGINT/SIGTERM handlers suited to a worker process.

  The first signal only sets the KILLED flag, so that we exit quietly and
  cleanly if possible. By default, when the user hits CTRL-C, all of the
  child processes would print details about KeyboardInterrupt exceptions,
  which isn't very helpful. A second signal is handled by KillHandler.
  """
  watched = (signal.SIGINT, signal.SIGTERM)

  def ExitHandler(_signum, _frame):
    # Set KILLED flag.
    KILLED.set()

    # Swap in KillHandler so this handler doesn't get called recursively.
    for signum in watched:
      signal.signal(signum, KillHandler)

  for signum in watched:
    signal.signal(signum, ExitHandler)
879
def EmergeProcess(output, *args, **kwargs):
  """Merge a package in a subprocess.

  Args:
    output: Temporary file to write output.
    *args: Arguments to pass to Scheduler constructor.
    **kwargs: Keyword arguments to pass to Scheduler constructor.

  Returns:
    The wait status of the subprocess as reported by os.waitpid(). It is
    zero when the child exited successfully and non-zero otherwise.
  """
  pid = os.fork()
  if pid != 0:
    # Parent: wait for the child and hand back its status.
    return os.waitpid(pid, 0)[1]

  # Child. Assume failure until the merge reports otherwise.
  retval = 1
  try:
    try:
      # Sanity checks.
      if sys.stdout.fileno() != 1:
        raise Exception("sys.stdout.fileno() != 1")
      if sys.stderr.fileno() != 2:
        raise Exception("sys.stderr.fileno() != 2")

      # - Redirect 1 (stdout) and 2 (stderr) at our temporary file.
      # - Redirect 0 to point at sys.stdin. In this case, sys.stdin
      #   points at a file reading os.devnull, because multiprocessing mucks
      #   with sys.stdin.
      # - Leave the sys.stdin and output filehandles alone.
      fd_pipes = {0: sys.stdin.fileno(),
                  1: output.fileno(),
                  2: output.fileno(),
                  sys.stdin.fileno(): sys.stdin.fileno(),
                  output.fileno(): output.fileno()}
      portage.process._setup_pipes(fd_pipes)  # pylint: disable=W0212

      # Portage doesn't like when sys.stdin.fileno() != 0, so point sys.stdin
      # at the filehandle we just created in _setup_pipes.
      if sys.stdin.fileno() != 0:
        sys.__stdin__ = sys.stdin = os.fdopen(0, "r")

      scheduler = Scheduler(*args, **kwargs)

      # Enable blocker handling even though we're in --nodeps mode. This
      # allows us to unmerge the blocker after we've merged the replacement.
      # pylint: disable=W0212
      scheduler._opts_ignore_blockers = frozenset()

      # Actually do the merge.
      retval = scheduler.merge()

    # We catch all exceptions here (including SystemExit, KeyboardInterrupt,
    # etc) so as to ensure that we don't confuse the multiprocessing module,
    # which expects that all forked children exit with os._exit().
    # pylint: disable=W0702
    except:
      traceback.print_exc(file=output)
      retval = 1
    sys.stdout.flush()
    sys.stderr.flush()
    output.flush()
  finally:
    # Always leave through os._exit(), even if reporting or flushing failed;
    # otherwise the forked child would return into the caller's code and
    # carry on running as a second copy of the worker.
    # pylint: disable=W0212
    os._exit(retval)
David Jamesfcb70ef2011-02-02 16:02:30 -0800941
Thiago Goncalesf4acc422013-07-17 10:26:35 -0700942
def UnpackPackage(pkg_state):
  """Unpacks package described by pkg_state.

  The binary package is <PKGDIR>/<target>.tbz2 and is extracted into ROOT.
  PKGDIR defaults to $SYSROOT/packages and ROOT defaults to $SYSROOT.

  Args:
    pkg_state: EmergeJobState object describing target.

  Returns:
    Exit code returned by subprocess.

  Raises:
    KeyError: If SYSROOT is needed as a fallback but is not set.
  """
  env = os.environ

  # Only consult SYSROOT when it is really needed, so that an environment
  # which sets both PKGDIR and ROOT works without it.
  pkgdir = env.get("PKGDIR")
  if pkgdir is None:
    pkgdir = os.path.join(env["SYSROOT"], "packages")
  root = env.get("ROOT")
  if root is None:
    root = env["SYSROOT"]

  path = os.path.join(pkgdir, pkg_state.target + ".tbz2")
  comp = cros_build_lib.FindCompressor(cros_build_lib.COMP_BZIP2)
  cmd = [comp, "-dc"]
  if comp.endswith("pbzip2"):
    cmd.append("--ignore-trailing-garbage=1")
  cmd.append(path)

  # Step 1: decompress the package, capturing the tar stream.
  result = cros_build_lib.RunCommand(cmd, cwd=root, stdout_to_pipe=True,
                                     print_cmd=False, error_code_ok=True)

  # If we were not successful, return now and don't attempt untar.
  if result.returncode:
    return result.returncode

  # Step 2: feed the tar stream to tar, extracting into root.
  cmd = ["sudo", "tar", "-xf", "-", "-C", root]
  result = cros_build_lib.RunCommand(cmd, cwd=root, input=result.output,
                                     print_cmd=False, error_code_ok=True)

  return result.returncode
974
975
def EmergeWorker(task_queue, job_queue, emerge, package_db, fetch_only=False,
                 unpack_only=False):
  """This worker emerges any packages given to it on the task_queue.

  Package states are read from task_queue. For each one, an EmergeJobState
  is pushed to job_queue when the job starts and another one, carrying the
  return code, when it finishes. The job's output is stored in the temporary
  file named by the filename field of those objects. A None task tells the
  worker to quit.

  Args:
    task_queue: The queue of tasks for this worker to do.
    job_queue: The queue of results from the worker.
    emerge: An EmergeData() object.
    package_db: A dict, mapping package ids to portage Package objects.
    fetch_only: A bool, indicating if we should just fetch the target.
    unpack_only: A bool, indicating if we should just unpack the target.
  """

  SetupWorkerSignals()
  settings, trees, mtimedb = emerge.settings, emerge.trees, emerge.mtimedb

  # Disable flushing of caches to save on I/O.
  root = emerge.settings["ROOT"]
  vardb = emerge.trees[root]["vartree"].dbapi
  vardb._flush_cache_enabled = False
  bindb = emerge.trees[root]["bintree"].dbapi
  # Might be a set, might be a list, might be None; no clue, just use shallow
  # copy to ensure we can roll it back.
  # pylint: disable=W0212
  original_remotepkgs = copy.copy(bindb.bintree._remotepkgs)

  opts, spinner = emerge.opts, emerge.spinner
  opts["--nodeps"] = True
  if fetch_only:
    opts["--fetchonly"] = True

  while True:
    # Wait for a new item to show up on the queue. This is a blocking wait,
    # so if there's nothing to do, we just sit here.
    pkg_state = task_queue.get()
    if pkg_state is None:
      # If target is None, this means that the main thread wants us to quit.
      # The other workers need to exit too, so we'll push the message back on
      # to the queue so they'll get it too.
      task_queue.put(None)
      return
    if KILLED.is_set():
      return

    target = pkg_state.target

    db_pkg = package_db[target]

    if db_pkg.type_name == "binary":
      if not fetch_only and pkg_state.fetched_successfully:
        # Ensure portage doesn't think our pkg is remote- else it'll force
        # a redownload of it (even if the on-disk file is fine). In-memory
        # caching basically, implemented dumbly.
        bindb.bintree._remotepkgs = None
      else:
        # Roll back to the saved value. This must assign the same attribute
        # that was cleared above, otherwise a None left behind by an earlier
        # package would stay in effect.
        bindb.bintree._remotepkgs = original_remotepkgs

    db_pkg.root_config = emerge.root_config
    install_list = [db_pkg]
    pkgname = db_pkg.pf
    output = tempfile.NamedTemporaryFile(prefix=pkgname + "-", delete=False)
    # The mode has to be written in octal to mean rw-r--r--.
    os.chmod(output.name, 0o644)
    start_timestamp = time.time()
    job = EmergeJobState(target, pkgname, False, output.name, start_timestamp,
                         fetch_only=fetch_only, unpack_only=unpack_only)
    job_queue.put(job)
    if "--pretend" in opts:
      retcode = 0
    else:
      try:
        emerge.scheduler_graph.mergelist = install_list
        if unpack_only:
          retcode = UnpackPackage(pkg_state)
        else:
          retcode = EmergeProcess(output, settings, trees, mtimedb, opts,
                                  spinner, favorites=emerge.favorites,
                                  graph_config=emerge.scheduler_graph)
      except Exception:
        traceback.print_exc(file=output)
        retcode = 1
    # The log stays on disk (delete=False); we only release our handle, on
    # every path.
    output.close()

    if KILLED.is_set():
      return

    job = EmergeJobState(target, pkgname, True, output.name, start_timestamp,
                         retcode, fetch_only=fetch_only,
                         unpack_only=unpack_only)
    job_queue.put(job)
1070
1071
class LinePrinter(object):
  """Print job that writes one fixed line of text."""

  def __init__(self, line):
    """Remember the line to be printed.

    Args:
      line: The object to print.
    """
    self.line = line

  def Print(self, _seek_locations):
    """Print the stored line.

    Args:
      _seek_locations: Unused; accepted so that all print jobs can be called
        the same way.
    """
    text = self.line
    print(text)
1080
1081
1082class JobPrinter(object):
1083 """Helper object to print output of a job."""
1084
1085 def __init__(self, job, unlink=False):
1086 """Print output of job.
1087
Mike Frysinger02e1e072013-11-10 22:11:34 -05001088 If unlink is True, unlink the job output file when done.
1089 """
David Jamesfcb70ef2011-02-02 16:02:30 -08001090 self.current_time = time.time()
1091 self.job = job
1092 self.unlink = unlink
1093
1094 def Print(self, seek_locations):
1095
1096 job = self.job
1097
1098 # Calculate how long the job has been running.
1099 seconds = self.current_time - job.start_timestamp
1100
1101 # Note that we've printed out the job so far.
1102 job.last_output_timestamp = self.current_time
1103
1104 # Note that we're starting the job
1105 info = "job %s (%dm%.1fs)" % (job.pkgname, seconds / 60, seconds % 60)
1106 last_output_seek = seek_locations.get(job.filename, 0)
1107 if last_output_seek:
1108 print "=== Continue output for %s ===" % info
1109 else:
1110 print "=== Start output for %s ===" % info
1111
1112 # Print actual output from job
1113 f = codecs.open(job.filename, encoding='utf-8', errors='replace')
1114 f.seek(last_output_seek)
1115 prefix = job.pkgname + ":"
1116 for line in f:
1117
1118 # Save off our position in the file
1119 if line and line[-1] == "\n":
1120 last_output_seek = f.tell()
1121 line = line[:-1]
1122
1123 # Print our line
1124 print prefix, line.encode('utf-8', 'replace')
1125 f.close()
1126
1127 # Save our last spot in the file so that we don't print out the same
1128 # location twice.
1129 seek_locations[job.filename] = last_output_seek
1130
1131 # Note end of output section
1132 if job.done:
1133 print "=== Complete: %s ===" % info
1134 else:
1135 print "=== Still running: %s ===" % info
1136
1137 if self.unlink:
1138 os.unlink(job.filename)
1139
1140
def PrintWorker(queue):
  """A worker that prints stuff to the screen as requested.

  Print jobs are read from queue until a false value (such as None) is
  received. Each job's Print() method is called with a dict that remembers
  the position reached in each output file.

  Args:
    queue: Queue of print jobs.
  """
  handled = (signal.SIGINT, signal.SIGTERM)

  def ExitHandler(_signum, _frame):
    # Set KILLED flag.
    KILLED.set()

    # Hand the signals over to KillHandler so that we'll die after two
    # signals.
    for signum in handled:
      signal.signal(signum, KillHandler)

  # Don't exit on the first SIGINT / SIGTERM, because the parent worker will
  # handle it and tell us when we need to exit.
  for signum in handled:
    signal.signal(signum, ExitHandler)

  # seek_locations is a map indicating the position we are at in each file.
  # It starts off empty, but is set by the various Print jobs as we go along
  # to indicate where we left off in each file.
  seek_locations = {}
  while True:
    try:
      job = queue.get()
      if not job:
        break
      job.Print(seek_locations)
      sys.stdout.flush()
    except IOError as ex:
      if ex.errno != errno.EINTR:
        raise
      # Looks like we received a signal. Keep printing.
1173 raise
1174
Brian Harring867e2362012-03-17 04:05:17 -07001175
class TargetState(object):
  """Structure describing the TargetState.

  Instances are ordered by their score tuple, so the one with the smallest
  score comes first in a heap or a sorted list.
  """

  __slots__ = ("target", "info", "score", "prefetched", "fetched_successfully")

  def __init__(self, target, info):
    """Initialize the state and compute its initial score.

    Args:
      target: Package identifier.
      info: Dict for the package; update_score() reads its "tprovides",
        "needs", "binary", "provides" and "idx" entries.
    """
    self.target, self.info = target, info
    self.fetched_successfully = False
    self.prefetched = False
    self.score = None
    self.update_score()

  def __cmp__(self, other):
    """Three-way comparison by score (only consulted by Python 2)."""
    return cmp(self.score, other.score)

  def __lt__(self, other):
    """Order by score.

    Python 3 ignores __cmp__, and heapq and sorted() only need "<", so
    providing it keeps the ordering working there. It agrees with __cmp__.
    """
    return self.score < other.score

  def update_score(self):
    """Recompute the score from the current contents of info."""
    self.score = (
        -len(self.info["tprovides"]),
        len(self.info["needs"]),
        not self.info["binary"],
        -len(self.info["provides"]),
        self.info["idx"],
        self.target,
    )
1199 )
1200
1201
class ScoredHeap(object):
  """Min-heap of scored items that also tracks which targets it holds.

  The heap itself lives in self.heap; self._heap_set mirrors the "target"
  attribute of every queued item so that membership tests are cheap.
  """

  __slots__ = ("heap", "_heap_set")

  def __init__(self, initial=()):
    """Create the heap, optionally filled from an iterable of items."""
    self.heap = []
    self._heap_set = set()
    if initial:
      self.multi_put(initial)

  def get(self):
    """Remove and return the smallest item."""
    lowest = heapq.heappop(self.heap)
    self._heap_set.remove(lowest.target)
    return lowest

  def put(self, item):
    """Add a single TargetState.

    Raises:
      ValueError: If item is not a TargetState.
    """
    if not isinstance(item, TargetState):
      raise ValueError("Item %r isn't a TargetState" % (item,))
    heapq.heappush(self.heap, item)
    self._heap_set.add(item.target)

  def multi_put(self, sequence):
    """Add many items at once, then restore the heap invariant."""
    items = list(sequence)
    self.heap += items
    for item in items:
      self._heap_set.add(item.target)
    self.sort()

  def sort(self):
    """Re-establish the heap invariant, e.g. after scores have changed."""
    heapq.heapify(self.heap)

  def __contains__(self, target):
    """Return True if an item with this target name is queued."""
    return target in self._heap_set

  def __nonzero__(self):
    """Return True if the heap holds at least one item."""
    return len(self.heap) > 0

  def __len__(self):
    """Return the number of queued items."""
    return len(self.heap)
1241
1242
David Jamesfcb70ef2011-02-02 16:02:30 -08001243class EmergeQueue(object):
1244 """Class to schedule emerge jobs according to a dependency graph."""
1245
def __init__(self, deps_map, emerge, package_db, show_output, unpack_only):
  """Set up worker pools and queue every package for fetching.

  In --pretend mode this prints a message and exits the process instead.

  Args:
    deps_map: The dependency graph; each value has at least an "action"
      entry.
    emerge: Object providing opts and depgraph; its scheduler_graph
      attribute is set here.
    package_db: Passed through to the EmergeWorker processes.
    show_output: Stored for later use.
    unpack_only: If true, an extra pool of unpack workers is created.
  """
  # Store the dependency graph.
  self._deps_map = deps_map
  self._state_map = {}

  # Nothing is running or ready yet.
  self._build_jobs = {}
  self._build_ready = ScoredHeap()
  self._fetch_jobs = {}
  self._fetch_ready = ScoredHeap()
  self._unpack_jobs = {}
  self._unpack_ready = ScoredHeap()

  # Number of package installs represented in deps_map.
  self._total_jobs = len(
      [pkg for pkg in deps_map if deps_map[pkg]["action"] == "merge"])
  self._show_output = show_output
  self._unpack_only = unpack_only

  if "--pretend" in emerge.opts:
    print("Skipping merge because of --pretend mode.")
    sys.exit(0)

  # Set up a session so we can easily terminate all children.
  self._SetupSession()

  # Setup scheduler graph object. This is used by the child processes
  # to help schedule jobs.
  emerge.scheduler_graph = emerge.depgraph.schedulerGraph()

  # Calculate how many jobs we can run in parallel. We don't want to pass
  # the --jobs flag over to emerge itself, because that'll tell emerge to
  # hide its output, and said output is quite useful for debugging hung
  # jobs.
  default_jobs = multiprocessing.cpu_count()
  requested_jobs = emerge.opts.pop("--jobs", default_jobs)
  worker_count = max(1, min(self._total_jobs, requested_jobs))
  self._fetch_procs = worker_count
  self._unpack_procs = worker_count
  self._build_procs = worker_count
  self._load_avg = emerge.opts.pop("--load-average", None)
  self._job_queue = multiprocessing.Queue()
  self._print_queue = multiprocessing.Queue()

  # Fetch workers: EmergeWorker with fetch_only=True.
  self._fetch_queue = multiprocessing.Queue()
  fetch_args = (self._fetch_queue, self._job_queue, emerge, package_db, True)
  self._fetch_pool = multiprocessing.Pool(self._fetch_procs, EmergeWorker,
                                          fetch_args)

  # Build workers: EmergeWorker with its default flags.
  self._build_queue = multiprocessing.Queue()
  build_args = (self._build_queue, self._job_queue, emerge, package_db)
  self._build_pool = multiprocessing.Pool(self._build_procs, EmergeWorker,
                                          build_args)

  if self._unpack_only:
    # Unpack pool only required on unpack_only jobs.
    self._unpack_queue = multiprocessing.Queue()
    unpack_args = (self._unpack_queue, self._job_queue, emerge, package_db,
                   False, True)
    self._unpack_pool = multiprocessing.Pool(self._unpack_procs,
                                             EmergeWorker, unpack_args)

  self._print_worker = multiprocessing.Process(target=PrintWorker,
                                               args=[self._print_queue])
  self._print_worker.start()

  # Initialize the failed queue to empty.
  self._retry_queue = []
  self._failed = set()

  # Setup an exit handler so that we print nice messages if we are
  # terminated.
  self._SetupExitHandler()

  # Schedule our jobs: every package starts out as ready to fetch.
  for pkg, data in deps_map.iteritems():
    self._state_map[pkg] = TargetState(pkg, data)
  self._fetch_ready.multi_put(self._state_map.itervalues())
David Jamesfcb70ef2011-02-02 16:02:30 -08001319
def _SetupSession(self):
  """Set up a session so we can easily terminate all children.

  The process forks. The child calls os.setsid() and returns to the caller.
  The parent never returns: it relays signals to the child and exits with
  the child's exit status.
  """
  # When we call os.setsid(), this sets up a session / process group for this
  # process and all children. These session groups are needed so that we can
  # easily kill all children (including processes launched by emerge) before
  # we exit.
  #
  # One unfortunate side effect of os.setsid() is that it blocks CTRL-C from
  # being received. To work around this, we only call os.setsid() in a forked
  # process, so that the parent can still watch for CTRL-C. The parent will
  # just sit around, watching for signals and propagating them to the child,
  # until the child exits.
  #
  # TODO(davidjames): It would be nice if we could replace this with cgroups.
  pid = os.fork()
  if pid == 0:
    os.setsid()
    return

  # Everything below runs in the parent only.

  def PropagateToChildren(signum, _frame):
    # Just propagate the signals down to the child. We'll exit when the
    # child does.
    try:
      os.kill(pid, signum)
    except OSError as err:
      if err.errno != errno.ESRCH:
        raise

  def StopGroup(_signum, _frame):
    # When we get stopped, stop the children.
    try:
      os.killpg(pid, signal.SIGSTOP)
      os.kill(0, signal.SIGSTOP)
    except OSError as err:
      if err.errno != errno.ESRCH:
        raise

  def ContinueGroup(_signum, _frame):
    # Launch the children again after being stopped.
    try:
      os.killpg(pid, signal.SIGCONT)
    except OSError as err:
      if err.errno != errno.ESRCH:
        raise

  signal.signal(signal.SIGINT, PropagateToChildren)
  signal.signal(signal.SIGTERM, PropagateToChildren)
  signal.signal(signal.SIGTSTP, StopGroup)
  signal.signal(signal.SIGCONT, ContinueGroup)

  # Loop until the children exit. We exit with os._exit to be sure we
  # don't run any finalizers (those will be run by the child process.)
  # pylint: disable=W0212
  while True:
    try:
      # Wait for the process to exit. When it does, exit with the return
      # value of the subprocess.
      status = os.waitpid(pid, 0)[1]
      os._exit(osutils.GetExitStatus(status))
    except OSError as err:
      if err.errno == errno.EINTR:
        # The wait was interrupted by a signal; go back to waiting.
        continue
      traceback.print_exc()
      os._exit(1)
    except BaseException:
      traceback.print_exc()
      os._exit(1)
1384
def _SetupExitHandler(self):
  """Install SIGINT/SIGTERM handlers that report job status, then exit."""
  watched = (signal.SIGINT, signal.SIGTERM)

  def ExitHandler(signum, _frame):
    # Set KILLED flag.
    KILLED.set()

    # Hand the signals over to KillHandler so we don't get called
    # recursively.
    for sig in watched:
      signal.signal(sig, KillHandler)

    # Print our current job status
    for job in self._build_jobs.itervalues():
      if not job:
        continue
      self._print_queue.put(JobPrinter(job, unlink=True))

    # Notify the user that we are exiting, then let the print worker drain
    # its queue and stop.
    self._Print("Exiting on signal %s" % signum)
    self._print_queue.put(None)
    self._print_worker.join()

    # Kill child threads, then exit.
    os.killpg(0, signal.SIGKILL)
    sys.exit(1)

  # Print out job status when we are killed
  for sig in watched:
    signal.signal(sig, ExitHandler)
1412
Thiago Goncalesf4acc422013-07-17 10:26:35 -07001413 def _ScheduleUnpack(self, pkg_state):
1414 self._unpack_jobs[pkg_state.target] = None
1415 self._unpack_queue.put(pkg_state)
1416
Brian Harring0be85c62012-03-17 19:52:12 -07001417 def _Schedule(self, pkg_state):
David Jamesfcb70ef2011-02-02 16:02:30 -08001418 # We maintain a tree of all deps, if this doesn't need
David James8c7e5e32011-06-28 11:26:03 -07001419 # to be installed just free up its children and continue.
David Jamesfcb70ef2011-02-02 16:02:30 -08001420 # It is possible to reinstall deps of deps, without reinstalling
1421 # first level deps, like so:
Mike Frysingerfd969312014-04-02 22:16:42 -04001422 # virtual/target-os (merge) -> eselect (nomerge) -> python (merge)
Brian Harring0be85c62012-03-17 19:52:12 -07001423 this_pkg = pkg_state.info
1424 target = pkg_state.target
1425 if pkg_state.info is not None:
1426 if this_pkg["action"] == "nomerge":
1427 self._Finish(target)
1428 elif target not in self._build_jobs:
1429 # Kick off the build if it's marked to be built.
1430 self._build_jobs[target] = None
1431 self._build_queue.put(pkg_state)
1432 return True
David Jamesfcb70ef2011-02-02 16:02:30 -08001433
Thiago Goncalesf4acc422013-07-17 10:26:35 -07001434 def _ScheduleLoop(self, unpack_only=False):
1435 if unpack_only:
1436 ready_queue = self._unpack_ready
1437 jobs_queue = self._unpack_jobs
1438 procs = self._unpack_procs
1439 else:
1440 ready_queue = self._build_ready
1441 jobs_queue = self._build_jobs
1442 procs = self._build_procs
1443
David James8c7e5e32011-06-28 11:26:03 -07001444 # If the current load exceeds our desired load average, don't schedule
1445 # more than one job.
1446 if self._load_avg and os.getloadavg()[0] > self._load_avg:
1447 needed_jobs = 1
1448 else:
Thiago Goncalesf4acc422013-07-17 10:26:35 -07001449 needed_jobs = procs
David James8c7e5e32011-06-28 11:26:03 -07001450
1451 # Schedule more jobs.
Thiago Goncalesf4acc422013-07-17 10:26:35 -07001452 while ready_queue and len(jobs_queue) < needed_jobs:
1453 state = ready_queue.get()
1454 if unpack_only:
1455 self._ScheduleUnpack(state)
1456 else:
1457 if state.target not in self._failed:
1458 self._Schedule(state)
David Jamesfcb70ef2011-02-02 16:02:30 -08001459
1460 def _Print(self, line):
1461 """Print a single line."""
1462 self._print_queue.put(LinePrinter(line))
1463
1464 def _Status(self):
1465 """Print status."""
1466 current_time = time.time()
1467 no_output = True
1468
1469 # Print interim output every minute if --show-output is used. Otherwise,
1470 # print notifications about running packages every 2 minutes, and print
1471 # full output for jobs that have been running for 60 minutes or more.
1472 if self._show_output:
1473 interval = 60
1474 notify_interval = 0
1475 else:
1476 interval = 60 * 60
1477 notify_interval = 60 * 2
David James321490a2012-12-17 12:05:56 -08001478 for job in self._build_jobs.itervalues():
David Jamesfcb70ef2011-02-02 16:02:30 -08001479 if job:
1480 last_timestamp = max(job.start_timestamp, job.last_output_timestamp)
1481 if last_timestamp + interval < current_time:
1482 self._print_queue.put(JobPrinter(job))
1483 job.last_output_timestamp = current_time
1484 no_output = False
1485 elif (notify_interval and
1486 job.last_notify_timestamp + notify_interval < current_time):
1487 job_seconds = current_time - job.start_timestamp
1488 args = (job.pkgname, job_seconds / 60, job_seconds % 60, job.filename)
1489 info = "Still building %s (%dm%.1fs). Logs in %s" % args
1490 job.last_notify_timestamp = current_time
1491 self._Print(info)
1492 no_output = False
1493
1494 # If we haven't printed any messages yet, print a general status message
1495 # here.
1496 if no_output:
1497 seconds = current_time - GLOBAL_START
Brian Harring0be85c62012-03-17 19:52:12 -07001498 fjobs, fready = len(self._fetch_jobs), len(self._fetch_ready)
Thiago Goncalesf4acc422013-07-17 10:26:35 -07001499 ujobs, uready = len(self._unpack_jobs), len(self._unpack_ready)
Brian Harring0be85c62012-03-17 19:52:12 -07001500 bjobs, bready = len(self._build_jobs), len(self._build_ready)
1501 retries = len(self._retry_queue)
1502 pending = max(0, len(self._deps_map) - fjobs - bjobs)
1503 line = "Pending %s/%s, " % (pending, self._total_jobs)
1504 if fjobs or fready:
1505 line += "Fetching %s/%s, " % (fjobs, fready + fjobs)
Thiago Goncalesf4acc422013-07-17 10:26:35 -07001506 if ujobs or uready:
1507 line += "Unpacking %s/%s, " % (ujobs, uready + ujobs)
Brian Harring0be85c62012-03-17 19:52:12 -07001508 if bjobs or bready or retries:
1509 line += "Building %s/%s, " % (bjobs, bready + bjobs)
1510 if retries:
1511 line += "Retrying %s, " % (retries,)
David James8c7e5e32011-06-28 11:26:03 -07001512 load = " ".join(str(x) for x in os.getloadavg())
Brian Harring0be85c62012-03-17 19:52:12 -07001513 line += ("[Time %dm%.1fs Load %s]" % (seconds/60, seconds %60, load))
1514 self._Print(line)
David Jamesfcb70ef2011-02-02 16:02:30 -08001515
1516 def _Finish(self, target):
David James8c7e5e32011-06-28 11:26:03 -07001517 """Mark a target as completed and unblock dependencies."""
1518 this_pkg = self._deps_map[target]
1519 if this_pkg["needs"] and this_pkg["nodeps"]:
1520 # We got installed, but our deps have not been installed yet. Dependent
1521 # packages should only be installed when our needs have been fully met.
1522 this_pkg["action"] = "nomerge"
1523 else:
David James8c7e5e32011-06-28 11:26:03 -07001524 for dep in this_pkg["provides"]:
1525 dep_pkg = self._deps_map[dep]
Brian Harring0be85c62012-03-17 19:52:12 -07001526 state = self._state_map[dep]
David James8c7e5e32011-06-28 11:26:03 -07001527 del dep_pkg["needs"][target]
Brian Harring0be85c62012-03-17 19:52:12 -07001528 state.update_score()
1529 if not state.prefetched:
1530 if dep in self._fetch_ready:
1531 # If it's not currently being fetched, update the prioritization
1532 self._fetch_ready.sort()
1533 elif not dep_pkg["needs"]:
David James8c7e5e32011-06-28 11:26:03 -07001534 if dep_pkg["nodeps"] and dep_pkg["action"] == "nomerge":
1535 self._Finish(dep)
1536 else:
Brian Harring0be85c62012-03-17 19:52:12 -07001537 self._build_ready.put(self._state_map[dep])
David James8c7e5e32011-06-28 11:26:03 -07001538 self._deps_map.pop(target)
David Jamesfcb70ef2011-02-02 16:02:30 -08001539
1540 def _Retry(self):
David James8c7e5e32011-06-28 11:26:03 -07001541 while self._retry_queue:
Brian Harring0be85c62012-03-17 19:52:12 -07001542 state = self._retry_queue.pop(0)
1543 if self._Schedule(state):
1544 self._Print("Retrying emerge of %s." % state.target)
David James8c7e5e32011-06-28 11:26:03 -07001545 break
David Jamesfcb70ef2011-02-02 16:02:30 -08001546
Brian Harringa43f5952012-04-12 01:19:34 -07001547 def _Shutdown(self):
David Jamesfcb70ef2011-02-02 16:02:30 -08001548 # Tell emerge workers to exit. They all exit when 'None' is pushed
1549 # to the queue.
Brian Harring0be85c62012-03-17 19:52:12 -07001550
Brian Harringa43f5952012-04-12 01:19:34 -07001551 # Shutdown the workers first; then jobs (which is how they feed things back)
1552 # then finally the print queue.
Brian Harring0be85c62012-03-17 19:52:12 -07001553
Brian Harringa43f5952012-04-12 01:19:34 -07001554 def _stop(queue, pool):
1555 if pool is None:
1556 return
1557 try:
1558 queue.put(None)
1559 pool.close()
1560 pool.join()
1561 finally:
1562 pool.terminate()
Brian Harring0be85c62012-03-17 19:52:12 -07001563
Brian Harringa43f5952012-04-12 01:19:34 -07001564 _stop(self._fetch_queue, self._fetch_pool)
1565 self._fetch_queue = self._fetch_pool = None
Brian Harring0be85c62012-03-17 19:52:12 -07001566
Brian Harringa43f5952012-04-12 01:19:34 -07001567 _stop(self._build_queue, self._build_pool)
1568 self._build_queue = self._build_pool = None
1569
Thiago Goncalesf4acc422013-07-17 10:26:35 -07001570 if self._unpack_only:
1571 _stop(self._unpack_queue, self._unpack_pool)
1572 self._unpack_queue = self._unpack_pool = None
1573
Brian Harringa43f5952012-04-12 01:19:34 -07001574 if self._job_queue is not None:
1575 self._job_queue.close()
1576 self._job_queue = None
David Jamesfcb70ef2011-02-02 16:02:30 -08001577
1578 # Now that our workers are finished, we can kill the print queue.
Brian Harringa43f5952012-04-12 01:19:34 -07001579 if self._print_worker is not None:
1580 try:
1581 self._print_queue.put(None)
1582 self._print_queue.close()
1583 self._print_worker.join()
1584 finally:
1585 self._print_worker.terminate()
1586 self._print_queue = self._print_worker = None
David Jamesfcb70ef2011-02-02 16:02:30 -08001587
  def Run(self):
    """Run through the scheduled ebuilds.

    Keep running so long as we have uninstalled packages in the
    dependency graph to merge.

    Each pass of the main loop waits for one job update on self._job_queue
    and dispatches on its kind: fetch jobs (job.fetch_only), unpack jobs
    (job.unpack_only) and build jobs (everything else). A build that fails
    for the first time is put on the retry queue; a build that fails again
    is reported and not finished.

    Raises:
      SystemExit: (status 1) when nothing is queued or running but
        self._deps_map is still non-empty and there is nothing left to
        retry -- either packages failed or there is a dependency cycle.
    """
    # Nothing to merge.
    if not self._deps_map:
      return

    # Start the fetchers.
    for _ in xrange(min(self._fetch_procs, len(self._fetch_ready))):
      state = self._fetch_ready.get()
      self._fetch_jobs[state.target] = None
      self._fetch_queue.put(state)

    # Print an update, then get going.
    self._Status()

    # Targets whose first build attempt failed; reported after the loop.
    retried = set()
    while self._deps_map:
      # Check here that we are actually waiting for something.
      if (self._build_queue.empty() and
          self._job_queue.empty() and
          not self._fetch_jobs and
          not self._fetch_ready and
          not self._unpack_jobs and
          not self._unpack_ready and
          not self._build_jobs and
          not self._build_ready and
          self._deps_map):
        # If we have failed on a package, retry it now.
        if self._retry_queue:
          self._Retry()
        else:
          # Tell the user why we're exiting.
          if self._failed:
            print 'Packages failed:\n\t%s' % '\n\t'.join(self._failed)
            # Optionally append the failed package keys (as returned by
            # portage.versions.cpv_getkey) to the file named by
            # $PARALLEL_EMERGE_STATUS_FILE.
            status_file = os.environ.get("PARALLEL_EMERGE_STATUS_FILE")
            if status_file:
              failed_pkgs = set(portage.versions.cpv_getkey(x)
                                for x in self._failed)
              with open(status_file, "a") as f:
                f.write("%s\n" % " ".join(failed_pkgs))
          else:
            print "Deadlock! Circular dependencies!"
          sys.exit(1)

      # Wait for a job update: up to 12 attempts of 5 seconds each. The
      # for/else branch runs only if no attempt produced a job.
      for _ in xrange(12):
        try:
          job = self._job_queue.get(timeout=5)
          break
        except Queue.Empty:
          # Check if any more jobs can be scheduled.
          self._ScheduleLoop()
      else:
        # Print an update every 60 seconds.
        self._Status()
        continue

      target = job.target

      # --- Fetch job updates ---
      if job.fetch_only:
        if not job.done:
          # Job has started; remember the job object.
          self._fetch_jobs[job.target] = job
        else:
          state = self._state_map[job.target]
          state.prefetched = True
          state.fetched_successfully = (job.retcode == 0)
          del self._fetch_jobs[job.target]
          self._Print("Fetched %s in %2.2fs"
                      % (target, time.time() - job.start_timestamp))

          # Show the log on request or on failure; otherwise delete it.
          if self._show_output or job.retcode != 0:
            self._print_queue.put(JobPrinter(job, unlink=True))
          else:
            os.unlink(job.filename)
          # Failure or not, let build work with it next.
          if not self._deps_map[job.target]["needs"]:
            self._build_ready.put(state)
            self._ScheduleLoop()

          # Only successfully fetched packages are queued for unpacking.
          if self._unpack_only and job.retcode == 0:
            self._unpack_ready.put(state)
            self._ScheduleLoop(unpack_only=True)

          # Start the next fetch, if any is waiting.
          if self._fetch_ready:
            state = self._fetch_ready.get()
            self._fetch_queue.put(state)
            self._fetch_jobs[state.target] = None
          else:
            # Minor optimization; shut down fetchers early since we know
            # the queue is empty.
            self._fetch_queue.put(None)
        continue

      # --- Unpack job updates ---
      if job.unpack_only:
        if not job.done:
          # Job has started; remember the job object.
          self._unpack_jobs[target] = job
        else:
          del self._unpack_jobs[target]
          self._Print("Unpacked %s in %2.2fs"
                      % (target, time.time() - job.start_timestamp))
          if self._show_output or job.retcode != 0:
            self._print_queue.put(JobPrinter(job, unlink=True))
          else:
            os.unlink(job.filename)
          # Start the next unpack, if any is waiting.
          if self._unpack_ready:
            state = self._unpack_ready.get()
            self._unpack_queue.put(state)
            self._unpack_jobs[state.target] = None
        continue

      # --- Build job updates ---
      if not job.done:
        self._build_jobs[target] = job
        self._Print("Started %s (logged in %s)" % (target, job.filename))
        continue

      # Print output of job
      if self._show_output or job.retcode != 0:
        self._print_queue.put(JobPrinter(job, unlink=True))
      else:
        os.unlink(job.filename)
      del self._build_jobs[target]

      seconds = time.time() - job.start_timestamp
      details = "%s (in %dm%.1fs)" % (target, seconds / 60, seconds % 60)
      previously_failed = target in self._failed

      # Complain if necessary.
      if job.retcode != 0:
        # Handle job failure.
        if previously_failed:
          # If this job has failed previously, give up.
          self._Print("Failed %s. Your build has failed." % details)
        else:
          # Queue up this build to try again after a long while.
          retried.add(target)
          self._retry_queue.append(self._state_map[target])
          self._failed.add(target)
          self._Print("Failed %s, retrying later." % details)
      else:
        if previously_failed:
          # Remove target from list of failed packages.
          self._failed.remove(target)

        self._Print("Completed %s" % details)

        # Mark as completed and unblock waiting ebuilds.
        self._Finish(target)

        if previously_failed and self._retry_queue:
          # If we have successfully retried a failed package, and there
          # are more failed packages, try the next one. We will only have
          # one retrying package actively running at a time.
          self._Retry()


      # Schedule pending jobs and print an update.
      self._ScheduleLoop()
      self._Status()

    # If packages were retried, output a warning.
    if retried:
      self._Print("")
      self._Print("WARNING: The following packages failed the first time,")
      self._Print("but succeeded upon retry. This might indicate incorrect")
      self._Print("dependencies.")
      for pkg in retried:
        self._Print(" %s" % pkg)
      self._Print("@@@STEP_WARNINGS@@@")
      self._Print("")

    # Tell child threads to exit.
    self._Print("Merge complete")
David Jamesfcb70ef2011-02-02 16:02:30 -08001762
1763
def main(argv):
  """Run real_main() and then reap multiprocessing's leftover threads.

  Args:
    argv: Command-line arguments, passed through to real_main().

  Returns:
    Whatever real_main() returns.
  """
  try:
    return real_main(argv)
  finally:
    # Work around multiprocessing sucking and not cleaning up after itself.
    # http://bugs.python.org/issue4106;
    # Step one; ensure GC is run *prior* to the VM starting shutdown.
    gc.collect()
    # Step two; go looking for those threads and try to manually reap
    # them if we can. Filter on the name and ident; if ident is None, the
    # thread wasn't started.
    feeders = [thread for thread in threading.enumerate()
               if thread.name == 'QueueFeederThread'
               and thread.ident is not None]
    for thread in feeders:
      thread.join(1)
David Jamesfcb70ef2011-02-02 16:02:30 -08001779
Brian Harring8294d652012-05-23 02:20:52 -07001780
def real_main(argv):
  """Plan the requested merge and run it through an EmergeQueue.

  Args:
    argv: List of command-line arguments. A copy is handed to
      DepGraphGenerator.Initialize().

  Returns:
    The result of emerge_main() when the work is delegated to it (an emerge
    action was given, or the preliminary Portage upgrade failed), 1 on a
    usage or permission error, and 0 once the queued merges have run.
  """
  parallel_emerge_args = argv[:]
  deps = DepGraphGenerator()
  deps.Initialize(parallel_emerge_args)
  emerge = deps.emerge

  # emerge.action is set: hand the arguments, filtered through
  # ParseParallelEmergeArgs(), straight to emerge_main().
  if emerge.action is not None:
    return emerge_main(deps.ParseParallelEmergeArgs(argv))

  if not emerge.cmdline_packages:
    Usage()
    return 1

  # Unless we're in pretend mode, there's not much point running without
  # root access. We need to be able to install packages.
  #
  # NOTE: Even if you're running --pretend, it's a good idea to run
  #       parallel_emerge with root access so that portage can write to the
  #       dependency cache. This is important for performance.
  if "--pretend" not in emerge.opts and portage.data.secpass < 2:
    print("parallel_emerge: superuser access is required.")
    return 1

  if "--quiet" not in emerge.opts:
    cmdline_packages = " ".join(emerge.cmdline_packages)
    print("Starting fast-emerge.")
    print(" Building package %s on %s" % (cmdline_packages,
                                          deps.board or "root"))

  deps_tree, deps_info = deps.GenDependencyTree()

  # You want me to be verbose? I'll give you two trees! Twice as much value.
  if "--tree" in emerge.opts and "--verbose" in emerge.opts:
    deps.PrintTree(deps_tree)

  deps_graph = deps.GenDependencyGraph(deps_tree, deps_info)

  # OK, time to print out our progress so far.
  deps.PrintInstallPlan(deps_graph)
  if "--tree" in emerge.opts:
    PrintDepsMap(deps_graph)

  # Are we upgrading portage? If so, and there are more packages to merge,
  # schedule a restart of parallel_emerge to merge the rest. This ensures that
  # we pick up all updates to portage settings before merging any more
  # packages.
  portage_upgrade = False
  root = emerge.settings["ROOT"]
  # pylint: disable=W0212
  final_db = emerge.depgraph._dynamic_config.mydbapi[root]
  if root == "/":
    for db_pkg in final_db.match_pkgs("sys-apps/portage"):
      if not deps_graph.get(db_pkg.cpv):
        continue
      portage_upgrade = True
      if "--quiet" not in emerge.opts:
        print("Upgrading portage first, then restarting...")

  # Upgrade Portage first, then the rest of the packages.
  #
  # In order to grant the child permission to run setsid, we need to run sudo
  # again. We preserve SUDO_USER here in case an ebuild depends on it.
  if portage_upgrade:
    # Calculate what arguments to use when re-invoking.
    sudo_user = "SUDO_USER=%s" % os.environ.get("SUDO_USER", "")
    script = os.path.abspath(sys.argv[0])
    args = (["sudo", "-E", sudo_user, script] + parallel_emerge_args +
            ["--exclude=sys-apps/portage"])

    # First upgrade Portage.
    passthrough_args = ("--quiet", "--pretend", "--verbose")
    emerge_args = [k for k in emerge.opts if k in passthrough_args]
    ret = emerge_main(emerge_args + ["portage"])
    if ret != 0:
      return ret

    # Now upgrade the rest by re-invoking ourselves with the arguments
    # computed above.
    os.execvp(args[0], args)

  # Run the queued emerges.
  scheduler = EmergeQueue(deps_graph, emerge, deps.package_db,
                          deps.show_output, deps.unpack_only)
  try:
    scheduler.Run()
  finally:
    # pylint: disable=W0212
    scheduler._Shutdown()
  scheduler = None

  clean_logs(emerge.settings)

  print("Done")
  return 0