blob: 402246771360a5693281006bd29dd1c126bf6d24 [file] [log] [blame]
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001#!/usr/bin/env python
maruelea586f32016-04-05 11:11:33 -07002# Copyright 2012 The LUCI Authors. All rights reserved.
maruelf1f5e2a2016-05-25 17:10:39 -07003# Use of this source code is governed under the Apache License, Version 2.0
4# that can be found in the LICENSE file.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00005
"""Runs a command with optional isolated input/output.

run_isolated takes care of setting up a temporary environment, running a
command, and tearing it down.

It handles downloading and uploading isolated files, mapping CIPD packages and
reusing stateful named caches.

The isolated files, CIPD packages and named caches are kept as a global LRU
cache.

Any ${EXECUTABLE_SUFFIX} on the command line or the environment variables passed
with the --env option will be replaced with ".exe" string on Windows and "" on
other platforms.

Any ${ISOLATED_OUTDIR} on the command line or the environment variables passed
with the --env option will be replaced by the location of a temporary directory
upon execution of the command specified in the .isolated file. All content
written to this directory will be uploaded upon termination and the .isolated
file describing this directory will be printed to stdout.

Any ${SWARMING_BOT_FILE} on the command line or the environment variables passed
with the --env option will be replaced by the value of the --bot-file parameter.
This file is used by a swarming bot to communicate state of the host to tasks.
It is written to by the swarming bot's on_before_task() hook in the swarming
server's custom bot_config.py.

See
https://chromium.googlesource.com/infra/luci/luci-py.git/+/master/appengine/swarming/doc/Magic-Values.md
for all the variables.

See
https://chromium.googlesource.com/infra/luci/luci-py.git/+/master/appengine/swarming/swarming_bot/config/bot_config.py
for more information about bot_config.py.
"""
41
Marc-Antoine Rueleed2f3a2019-03-14 00:00:40 +000042__version__ = '1.0.0'
maruel@chromium.orgdedbf492013-09-12 20:42:11 +000043
aludwin7556e0c2016-10-26 08:46:10 -070044import argparse
maruel064c0a32016-04-05 11:47:15 -070045import base64
iannucci96fcccc2016-08-30 15:52:22 -070046import collections
vadimsh232f5a82017-01-20 19:23:44 -080047import contextlib
Sadaf Matinkhoo10743a62018-03-29 16:28:58 -040048import errno
aludwin7556e0c2016-10-26 08:46:10 -070049import json
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000050import logging
51import optparse
52import os
Marc-Antoine Ruel8b11dbd2018-05-18 14:31:22 -040053import re
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000054import sys
55import tempfile
maruel064c0a32016-04-05 11:47:15 -070056import time
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000057
Marc-Antoine Ruel016c7602019-04-02 18:31:13 +000058from utils import tools
59tools.force_local_third_party()
vadimsh@chromium.orga4326472013-08-24 02:05:41 +000060
Marc-Antoine Ruel016c7602019-04-02 18:31:13 +000061# third_party/
62from depot_tools import fix_encoding
63
64# pylint: disable=ungrouped-imports
65import auth
66import cipd
67import isolate_storage
68import isolateserver
69import local_caching
70from libs import luci_context
Vadim Shtayura6b555c12014-07-23 16:22:18 -070071from utils import file_path
maruel12e30012015-10-09 11:55:35 -070072from utils import fs
maruel064c0a32016-04-05 11:47:15 -070073from utils import large
Marc-Antoine Ruelf74cffe2015-07-15 15:21:34 -040074from utils import logging_utils
Marc-Antoine Ruelcfb60852014-07-02 15:22:00 -040075from utils import on_error
Marc-Antoine Ruelc44f5722015-01-08 16:10:01 -050076from utils import subprocess42
maruel@chromium.orgdedbf492013-09-12 20:42:11 +000077
vadimsh@chromium.orga4326472013-08-24 02:05:41 +000078
# Magic variables that can be found in the isolate task command line.
ISOLATED_OUTDIR_PARAMETER = '${ISOLATED_OUTDIR}'
EXECUTABLE_SUFFIX_PARAMETER = '${EXECUTABLE_SUFFIX}'
SWARMING_BOT_FILE_PARAMETER = '${SWARMING_BOT_FILE}'


# The name of the log file to use.
RUN_ISOLATED_LOG_FILE = 'run_isolated.log'


# The name of the log to use for the run_test_cases.py command.
RUN_TEST_CASES_LOG = 'run_test_cases.log'


# Use short names for temporary directories. This is driven by Windows, which
# imposes a relatively short maximum path length of 260 characters, often
# referred to as MAX_PATH. It is relatively easy to create files with longer
# path length. A use case is with recursive dependency trees like npm packages.
#
# It is recommended to start the script with a `root_dir` as short as
# possible.
# - ir stands for isolated_run
# - io stands for isolated_out
# - it stands for isolated_tmp
ISOLATED_RUN_DIR = u'ir'
ISOLATED_OUT_DIR = u'io'
ISOLATED_TMP_DIR = u'it'


# Keep synced with task_request.py
CACHE_NAME_RE = re.compile(ur'^[a-z0-9_]{1,4096}$')
110
111
marueld928c862017-06-08 08:20:04 -0700112OUTLIVING_ZOMBIE_MSG = """\
113*** Swarming tried multiple times to delete the %s directory and failed ***
114*** Hard failing the task ***
115
116Swarming detected that your testing script ran an executable, which may have
117started a child executable, and the main script returned early, leaving the
118children executables playing around unguided.
119
120You don't want to leave children processes outliving the task on the Swarming
121bot, do you? The Swarming bot doesn't.
122
123How to fix?
124- For any process that starts children processes, make sure all children
125 processes terminated properly before each parent process exits. This is
126 especially important in very deep process trees.
127 - This must be done properly both in normal successful task and in case of
128 task failure. Cleanup is very important.
129- The Swarming bot sends a SIGTERM in case of timeout.
130 - You have %s seconds to comply after the signal was sent to the process
131 before the process is forcibly killed.
132- To achieve not leaking children processes in case of signals on timeout, you
133 MUST handle signals in each executable / python script and propagate them to
134 children processes.
135 - When your test script (python or binary) receives a signal like SIGTERM or
136 CTRL_BREAK_EVENT on Windows), send it to all children processes and wait for
137 them to terminate before quitting.
138
139See
Marc-Antoine Ruelc7243592018-05-24 17:04:04 -0400140https://chromium.googlesource.com/infra/luci/luci-py.git/+/master/appengine/swarming/doc/Bot.md#Graceful-termination_aka-the-SIGTERM-and-SIGKILL-dance
marueld928c862017-06-08 08:20:04 -0700141for more information.
142
143*** May the SIGKILL force be with you ***
144"""
145
146
# Currently hardcoded. Eventually could be exposed as a flag once there's value.
# 3 weeks, expressed in seconds.
MAX_AGE_SECS = 21*24*60*60
150
151
# Immutable bundle of everything needed to run one task. Field order matters
# for positional construction; keep it stable.
TaskData = collections.namedtuple(
    'TaskData',
    (
      # Command line to use (list of strings), independent of what was
      # specified in the isolated file.
      'command',
      # Directory, relative to the run directory, to start the command into.
      'relative_cwd',
      # Arguments (list of strings) to add to the command specified in the
      # isolated file.
      'extra_args',
      # Hash of the .isolated file that must be retrieved to recreate the
      # tree of files to run the target executable. The command specified in
      # the .isolated is executed. Mutually exclusive with command argument.
      'isolated_hash',
      # isolateserver.Storage instance to retrieve remote objects. This
      # object has a reference to an isolateserver.StorageApi, which does the
      # actual I/O.
      'storage',
      # isolateserver.LocalCache instance used to avoid retrieving the same
      # objects constantly by caching the objects retrieved. Can be on-disk
      # or in-memory.
      'isolate_cache',
      # Paths (list), relative to root_dir, to put into the output isolated
      # bundle upon task completion (see link_outputs_to_outdir).
      'outputs',
      # Function (run_dir) => context manager that installs named caches
      # into |run_dir|.
      'install_named_caches',
      # When True, the temporary directory is deliberately leaked for later
      # examination.
      'leak_temp_dir',
      # Path to the directory to use to create the temporary directory. If
      # not specified, a random temporary directory is created.
      'root_dir',
      # Kills the process if it lasts more than this amount of seconds.
      'hard_timeout',
      # Number of seconds to wait between SIGTERM and SIGKILL.
      'grace_period',
      # Path to a file with bot state, used in place of ${SWARMING_BOT_FILE}
      # task command line argument.
      'bot_file',
      # Logical account to switch LUCI_CONTEXT into.
      'switch_to_account',
      # Context manager dir => CipdInfo, see install_client_and_packages.
      'install_packages_fn',
      # Create tree with symlinks instead of hardlinks.
      'use_symlinks',
      # Environment variables to set.
      'env',
      # Environment variables to mutate with relative directories.
      # Example: {"ENV_KEY": ['relative', 'paths', 'to', 'prepend']}
      'env_prefix',
    ))
204
205
Marc-Antoine Ruelee6ca622017-11-29 11:19:16 -0500206def _to_str(s):
207 """Downgrades a unicode instance to str. Pass str through as-is."""
208 if isinstance(s, str):
209 return s
210 # This is technically incorrect, especially on Windows. In theory
211 # sys.getfilesystemencoding() should be used to use the right 'ANSI code
212 # page' on Windows, but that causes other problems, as the character set
213 # is very limited.
214 return s.encode('utf-8')
215
216
Marc-Antoine Ruel7a68f712017-12-01 18:45:18 -0500217def _to_unicode(s):
218 """Upgrades a str instance to unicode. Pass unicode through as-is."""
219 if isinstance(s, unicode) or s is None:
220 return s
221 return s.decode('utf-8')
222
223
def make_temp_dir(prefix, root_dir):
  """Creates a new unique temporary directory and returns its path.

  The directory is created by tempfile.mkdtemp() with the given |prefix|
  inside |root_dir|; the resulting path is returned as a unicode string.
  """
  created = tempfile.mkdtemp(prefix=prefix, dir=root_dir)
  return unicode(created)
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +0000227
228
def change_tree_read_only(rootdir, read_only):
  """Applies the read-only policy selected by |read_only| to the tree.

  Accepted values for |read_only|:
    2: files and directories (except on Windows) are marked read only. This
       inhibits modifying, creating or deleting files in the test directory,
       except on Windows where creating and deleting files is still possible.
    1: files are marked read only but not the directories. This inhibits
       modifying files but creating or deleting files is still possible.
    0 or None: anything can be modified.

  Raises:
    ValueError if |read_only| is any other value.
  """
  if read_only == 2:
    file_path.make_tree_read_only(rootdir)
    return
  if read_only == 1:
    file_path.make_tree_files_read_only(rootdir)
    return
  if read_only in (0, None):
    # TODO(maruel): This is currently dangerous as long as
    # DiskContentAddressedCache.touch() is not yet changed to verify the hash
    # of the content of the files it is looking at, so that if a test modifies
    # an input file, the file must be deleted.
    file_path.make_tree_writeable(rootdir)
    return
  raise ValueError(
      'change_tree_read_only(%s, %s): Unknown flag %s' %
      (rootdir, read_only, read_only))
255
256
@contextlib.contextmanager
def set_luci_context_account(account, tmp_dir):
  """Context manager that makes |account| the task's LUCI_CONTEXT account.

  Nothing is changed in any of these cases:
  - |account| is None or ''. This happens when run_isolated.py is called
    without '--switch-to-account' flag. If run_isolated.py is itself running
    in some LUCI_CONTEXT environment, the task just inherits whatever account
    is already set. This may happen if users invoke run_isolated.py explicitly
    from their code.
  - LUCI_CONTEXT-based auth is not in use (no 'local_auth' section).
  - The requested account is already the default one.

  Otherwise a new LUCI_CONTEXT is written for the duration of the context. If
  the requested account is not defined in the context, it switches to
  non-authenticated access. This happens for Swarming tasks that don't use
  'task' service accounts.
  """
  # Only consult LUCI_CONTEXT when a switch was actually requested.
  local_auth = luci_context.read('local_auth') if account else None

  # See LUCI_CONTEXT.md for the format of 'local_auth'.
  if not local_auth or local_auth.get('default_account_id') == account:
    # Not switching, not using LUCI_CONTEXT auth at all, or already set.
    yield
    return

  known_ids = {a['id'] for a in local_auth.get('accounts') or []}
  if account not in known_ids:
    logging.warning(
        'Requested LUCI_CONTEXT account %r is not available (have only %r), '
        'disabling authentication', account, sorted(known_ids))
    local_auth.pop('default_account_id', None)
  else:
    logging.info('Switching default LUCI_CONTEXT account to %r', account)
    local_auth['default_account_id'] = account

  with luci_context.write(_tmpdir=tmp_dir, local_auth=local_auth):
    yield
303
304
def process_command(command, out_dir, bot_file):
  """Returns a copy of |command| with parameters replaced in every argument.

  Each argument is passed through replace_parameters().

  Raises:
    ValueError if a parameter is requested in |command| but its value is not
      provided.
  """
  processed = []
  for arg in command:
    processed.append(replace_parameters(arg, out_dir, bot_file))
  return processed
313
314
def replace_parameters(arg, out_dir, bot_file):
  """Substitutes the magic parameter tokens found in the string |arg|.

  - ${EXECUTABLE_SUFFIX} is always replaced by cipd.EXECUTABLE_SUFFIX.
  - ${ISOLATED_OUTDIR} is replaced by |out_dir|.
  - ${SWARMING_BOT_FILE} is replaced by |bot_file| when one is given; otherwise
    a warning is logged and the token is left as-is.

  Raises:
    ValueError if ${ISOLATED_OUTDIR} is requested in |arg| but |out_dir| is not
      provided.
  """
  result = arg.replace(EXECUTABLE_SUFFIX_PARAMETER, cipd.EXECUTABLE_SUFFIX)
  path_substituted = False

  if ISOLATED_OUTDIR_PARAMETER in result:
    if not out_dir:
      raise ValueError(
          'output directory is requested in command or env var, but not '
          'provided; please specify one')
    result = result.replace(ISOLATED_OUTDIR_PARAMETER, out_dir)
    path_substituted = True

  if SWARMING_BOT_FILE_PARAMETER in result:
    if not bot_file:
      logging.warning('SWARMING_BOT_FILE_PARAMETER found in command or env '
                      'var, but no bot_file specified. Leaving parameter '
                      'unchanged.')
    else:
      result = result.replace(SWARMING_BOT_FILE_PARAMETER, bot_file)
      path_substituted = True

  if not path_substituted:
    return result
  # Slashes are converted only when a path parameter was substituted, because
  # of arguments like '${ISOLATED_OUTDIR}/foo/bar'.
  return result.replace('/', os.sep)
maruela9cfd6f2015-09-15 11:03:15 -0700344
345
Roberto Carrillo71ade6d2018-10-08 22:30:24 +0000346
def get_command_env(tmp_dir, cipd_info, run_dir, env, env_prefixes, out_dir,
                    bot_file):
  """Returns full OS environment to run a command in.

  Starts from a copy of os.environ, applies |env|, puts the directory with the
  cipd binary in front of PATH, exposes CIPD_CACHE_DIR env var, installs all
  env_prefixes and finally points the temp directory variables to |tmp_dir|.

  Args:
    tmp_dir: temp directory.
    cipd_info: CipdInfo object if cipd client is used, None if not.
    run_dir: The root directory the isolated tree is mapped in.
    env: environment variables to use. A variable with an empty value is
        removed from the resulting environment.
    env_prefixes: {"ENV_KEY": ['cwd', 'relative', 'paths', 'to', 'prepend']}
    out_dir: Isolated output directory. Required to be != None if any of the
        env vars contain ISOLATED_OUTDIR_PARAMETER.
    bot_file: Required to be != None if any of the env vars contain
        SWARMING_BOT_FILE_PARAMETER.

  Returns:
    dict mapping environment variable names to their values.

  Raises:
    ValueError if an env var requests ISOLATED_OUTDIR_PARAMETER but |out_dir|
      is not provided (raised by replace_parameters).
  """
  out = os.environ.copy()
  for k, v in env.iteritems():
    if not v:
      out.pop(k, None)
    else:
      out[k] = replace_parameters(v, out_dir, bot_file)

  if cipd_info:
    bin_dir = os.path.dirname(cipd_info.client.binary_path)
    # PATH can be missing, either because the parent environment has none or
    # because |env| removed it above with an empty value. Do not crash with a
    # KeyError in that case; the cipd directory becomes the only entry.
    cur_path = out.get('PATH')
    if cur_path is None:
      out['PATH'] = _to_str(bin_dir)
    else:
      out['PATH'] = '%s%s%s' % (_to_str(bin_dir), os.pathsep, cur_path)
    out['CIPD_CACHE_DIR'] = _to_str(cipd_info.cache_dir)

  for key, paths in env_prefixes.iteritems():
    assert isinstance(paths, list), paths
    paths = [os.path.normpath(os.path.join(run_dir, p)) for p in paths]
    cur = out.get(key)
    if cur:
      # Keep the pre-existing value after the prepended paths.
      paths.append(cur)
    out[key] = _to_str(os.pathsep.join(paths))

  tmp_dir = _to_str(tmp_dir)
  # pylint: disable=line-too-long
  # * python respects $TMPDIR, $TEMP, and $TMP in this order, regardless of
  #   platform. So $TMPDIR must be set on all platforms.
  #   https://github.com/python/cpython/blob/2.7/Lib/tempfile.py#L155
  out['TMPDIR'] = tmp_dir
  if sys.platform == 'win32':
    # * chromium's base utils uses GetTempPath().
    #    https://cs.chromium.org/chromium/src/base/files/file_util_win.cc?q=GetTempPath
    # * Go uses GetTempPath().
    # * GetTempDir() uses %TMP%, then %TEMP%, then other stuff. So %TMP% must be
    #   set.
    #   https://docs.microsoft.com/en-us/windows/desktop/api/fileapi/nf-fileapi-gettemppathw
    out['TMP'] = tmp_dir
    # https://blogs.msdn.microsoft.com/oldnewthing/20150417-00/?p=44213
    out['TEMP'] = tmp_dir
  elif sys.platform == 'darwin':
    # * Chromium uses an hack on macOS before calling into
    #   NSTemporaryDirectory().
    #   https://cs.chromium.org/chromium/src/base/files/file_util_mac.mm?q=GetTempDir
    #   https://developer.apple.com/documentation/foundation/1409211-nstemporarydirectory
    out['MAC_CHROMIUM_TMPDIR'] = tmp_dir
  else:
    # TMPDIR is specified as the POSIX standard envvar for the temp directory.
    #   http://pubs.opengroup.org/onlinepubs/9699919799/basedefs/V1_chap08.html
    # * mktemp on linux respects $TMPDIR.
    # * Chromium respects $TMPDIR on linux.
    #   https://cs.chromium.org/chromium/src/base/files/file_util_posix.cc?q=GetTempDir
    # * Go uses $TMPDIR.
    #   https://go.googlesource.com/go/+/go1.10.3/src/os/file_unix.go#307
    pass
  return out
vadimsh232f5a82017-01-20 19:23:44 -0800417
418
def run_command(command, cwd, env, hard_timeout, grace_period):
  """Runs the command.

  The process is started with subprocess42.Popen() and waited for. When the
  wait times out or a stop signal is received, the process is terminated, then
  killed if it is still running once the grace period is over.

  Args:
    command: command line handed to subprocess42.Popen().
    cwd: working directory handed to subprocess42.Popen().
    env: environment handed to subprocess42.Popen().
    hard_timeout: number of seconds given to the first proc.wait() call. A
        falsy value is passed as None (presumably meaning no timeout; confirm
        against subprocess42).
    grace_period: number of seconds given to the process between terminate()
        and kill(). A falsy value is passed to proc.wait() as None.

  Returns:
    tuple(process exit code, bool if had a hard timeout)

    The exit code is 1 when an OSError is raised while starting or waiting for
    the process.
  """
  logging.info('run_command(%s, %s)' % (command, cwd))

  exit_code = None
  had_hard_timeout = False
  with tools.Profiler('RunTest'):
    proc = None
    # A list is used so the nested handler can record that a signal was
    # received without rebinding a name in this scope.
    had_signal = []
    try:
      # TODO(maruel): This code is imperfect. It doesn't handle well signals
      # during the download phase and there's short windows where things can go
      # wrong.
      def handler(signum, _frame):
        # Only the first signal received once the process exists is converted
        # into a TimeoutExpired, which interrupts the wait below.
        if proc and not had_signal:
          logging.info('Received signal %d', signum)
          had_signal.append(True)
          raise subprocess42.TimeoutExpired(command, None)

      proc = subprocess42.Popen(
          command, cwd=cwd, env=env, detached=True, close_fds=True)
      with subprocess42.set_signal_handler(subprocess42.STOP_SIGNALS, handler):
        try:
          exit_code = proc.wait(hard_timeout or None)
        except subprocess42.TimeoutExpired:
          # Either the hard timeout expired or the handler above raised.
          if not had_signal:
            logging.warning('Hard timeout')
            had_hard_timeout = True
          logging.warning('Sending SIGTERM')
          proc.terminate()

      # Ignore signals in grace period. Forcibly give the grace period to the
      # child process.
      if exit_code is None:
        ignore = lambda *_: None
        with subprocess42.set_signal_handler(subprocess42.STOP_SIGNALS, ignore):
          try:
            exit_code = proc.wait(grace_period or None)
          except subprocess42.TimeoutExpired:
            # Now kill for real. The user can distinguish between the
            # following states:
            # - signal but process exited within grace period,
            #   hard_timed_out will be set but the process exit code will be
            #   script provided.
            # - processed exited late, exit code will be -9 on posix.
            logging.warning('Grace exhausted; sending SIGKILL')
            proc.kill()
      logging.info('Waiting for process exit')
      exit_code = proc.wait()
    except OSError:
      # This is not considered to be an internal error. The executable simply
      # does not exist.
      sys.stderr.write(
          '<The executable does not exist or a dependent library is missing>\n'
          '<Check for missing .so/.dll in the .isolate or GN file>\n'
          '<Command: %s>\n' % command)
      if os.environ.get('SWARMING_TASK_ID'):
        # Give an additional hint when running as a swarming task.
        sys.stderr.write(
            '<See the task\'s page for commands to help diagnose this issue '
            'by reproducing the task locally>\n')
      exit_code = 1
  # The mask shows a negative exit code as its unsigned 32 bits value.
  logging.info(
      'Command finished with exit code %d (%s)',
      exit_code, hex(0xffffffff & exit_code))
  return exit_code, had_hard_timeout
maruela9cfd6f2015-09-15 11:03:15 -0700489
490
def fetch_and_map(isolated_hash, storage, cache, outdir, use_symlinks):
  """Fetches an isolated tree into |outdir| and returns (bundle, stats).

  |stats| is a dict with:
  - 'duration': seconds spent in isolateserver.fetch_isolated().
  - 'items_cold': base64 of large.pack() of the sorted items in cache.added.
  - 'items_hot': base64 of large.pack() of the sorted items that are in
    cache.used but not in cache.added.
  """
  started = time.time()
  bundle = isolateserver.fetch_isolated(
      isolated_hash=isolated_hash,
      storage=storage,
      cache=cache,
      outdir=outdir,
      use_symlinks=use_symlinks)
  # Measure before packing the item lists so packing time is not included.
  duration = time.time() - started
  cold = sorted(cache.added)
  hot = sorted(set(cache.used) - set(cache.added))
  stats = {
    'duration': duration,
    'items_cold': base64.b64encode(large.pack(cold)),
    'items_hot': base64.b64encode(large.pack(hot)),
  }
  return bundle, stats
506
507
def link_outputs_to_outdir(run_dir, out_dir, outputs):
  """Makes every named output available in |out_dir| so it can be uploaded.

  Does nothing when |outputs| is empty. Otherwise the needed directories are
  created in |out_dir| and each output, a path relative to |run_dir|, is
  transferred with copy_recursively().

  NOTE(review): the previous docstring stated that an error is raised if the
  file already exists in |out_dir|; this depends on the helpers called here,
  confirm before relying on it.
  """
  if outputs:
    isolateserver.create_directories(out_dir, outputs)
    for rel_path in outputs:
      source = os.path.join(run_dir, rel_path)
      destination = os.path.join(out_dir, rel_path)
      copy_recursively(source, destination)
518
519
def copy_recursively(src, dst):
  """Efficiently copies a file or directory from src to dst.

  `src` may be a file, directory, or a symlink to a file or directory.
  All symlinks are replaced with their targets, so the resulting
  directory structure in dst will never have any symlinks.

  To increase speed, copy_recursively hardlinks individual files into the
  (newly created) directory structure if possible, unlike Python's
  shutil.copytree().

  Errors are never propagated: an OSError is logged and the item is skipped.
  A chain of symlinks that is too long to resolve, which includes symlinks
  forming a cycle, is logged and skipped as well.
  """
  # Upper bound on the number of symlinks followed to resolve |src|. Without
  # it, symlinks forming a cycle would be followed forever. 40 is the limit
  # used by Linux path resolution.
  max_symlink_hops = 40
  orig_src = src
  try:
    # Replace symlinks with their final target.
    hops = 0
    while fs.islink(src):
      if hops >= max_symlink_hops:
        logging.warning(
            'Too many levels of symbolic links while resolving %s; skipping',
            orig_src)
        return
      hops += 1
      res = fs.readlink(src)
      # A relative target is relative to the directory holding the link; an
      # absolute target replaces the path altogether.
      src = os.path.join(os.path.dirname(src), res)

    # If src does not exist, the resulting OSError (ENOENT) is logged as a
    # warning by the handler below.
    if fs.isfile(src):
      file_path.link_file(dst, src, file_path.HARDLINK_WITH_FALLBACK)
      return

    if not fs.exists(dst):
      os.makedirs(dst)

    # NOTE(review): a directory symlink pointing to one of its ancestors is
    # not detected here and makes this recursion keep going deeper.
    for child in fs.listdir(src):
      copy_recursively(os.path.join(src, child), os.path.join(dst, child))

  except OSError as e:
    if e.errno == errno.ENOENT:
      logging.warning('Path %s does not exist or %s is a broken symlink',
                      src, orig_src)
    else:
      logging.info("Couldn't collect output file %s: %s", src, e)
aludwin0a8e17d2016-10-27 15:57:39 -0700557
558
def delete_and_upload(storage, out_dir, leak_temp_dir):
  """Uploads the content of |out_dir| back, then deletes the directory.

  The upload, which generates a .isolated file out of the directory, is only
  done if files were written in it. The directory is kept when |leak_temp_dir|
  is set.

  Returns:
    tuple(outputs_ref, success, stats)
    - outputs_ref: a dict referring to the results archived back to the isolated
      server, if applicable.
    - success: False if something occurred that means that the task must
      forcibly be considered a failure, e.g. zombie processes were left
      behind.
    - stats: uploading stats.

  Raises:
    isolateserver.Aborted if the upload was aborted.
  """
  outputs_ref = None
  cold_sizes = []
  hot_sizes = []
  started = time.time()

  if fs.isdir(out_dir) and fs.listdir(out_dir):
    with tools.Profiler('ArchiveOutput'):
      try:
        results, f_cold, f_hot = isolateserver.archive_files_to_storage(
            storage, [out_dir], None)
        outputs_ref = {
          'isolated': results.values()[0],
          'isolatedserver': storage.server_ref.url,
          'namespace': storage.server_ref.namespace,
        }
        cold_sizes = [i.size for i in f_cold]
        cold_sizes.sort()
        hot_sizes = [i.size for i in f_hot]
        hot_sizes.sort()
      except isolateserver.Aborted:
        # This happens when a signal SIGTERM was received while uploading data.
        # There is 2 causes:
        # - The task was too slow and was about to be killed anyway due to
        #   exceeding the hard timeout.
        # - The amount of data uploaded back is very large and took too much
        #   time to archive.
        sys.stderr.write('Received SIGTERM while uploading')
        # Re-raise, so it will be treated as an internal failure.
        raise

  success = False
  try:
    # Nothing has to be removed when the directory is leaked on purpose or is
    # not there; otherwise the outcome is the one reported by rmtree().
    if leak_temp_dir or not fs.isdir(out_dir) or file_path.rmtree(out_dir):
      success = True
    else:
      logging.error('Had difficulties removing out_dir %s', out_dir)
  except OSError as e:
    # When this happens, it means there's a process error.
    logging.exception('Had difficulties removing out_dir %s: %s', out_dir, e)

  duration = time.time() - started
  stats = {
    'duration': duration,
    'items_cold': base64.b64encode(large.pack(cold_sizes)),
    'items_hot': base64.b64encode(large.pack(hot_sizes)),
  }
  return outputs_ref, success, stats
maruela9cfd6f2015-09-15 11:03:15 -0700617
618
def map_and_run(data, constant_run_path):
  """Runs a command with optional isolated input/output.

  Creates the run, output and temporary directories, installs the CIPD
  packages, maps the isolated tree when data.isolated_hash is set, installs the
  named caches and runs the command. Whatever happens, the directories are then
  cleaned up (unless data.leak_temp_dir is set) and the outputs are uploaded
  when an output directory was created.

  Arguments:
  - data: TaskData instance.
  - constant_run_path: if true and a root directory is known, the run directory
        is the fixed path <root_dir>/ISOLATED_RUN_DIR, wiped first if it
        already exists, instead of a directory from make_temp_dir().

  Returns metadata about the result, as a dict. 'exit_code' is the task exit
  code (forced to 1 on task level failures detected here) and
  'internal_failure' is None unless run_isolated itself failed, in which case
  it is a string describing the failure.
  """
  result = {
    'duration': None,
    'exit_code': None,
    'had_hard_timeout': False,
    # Pessimistic default: it is reset to None only once the outcome is known
    # not to be caused by run_isolated itself.
    'internal_failure': 'run_isolated did not complete properly',
    'stats': {
      # Set only when CIPD packages were installed:
      #'cipd': {
      #  'duration': 0.,
      #  'get_client_duration': 0.,
      #},
      'isolated': {
        'download': {
          #'duration': 0.,
          'initial_number_items': len(data.isolate_cache),
          'initial_size': data.isolate_cache.total_size,
          #'items_cold': '<large.pack()>',
          #'items_hot': '<large.pack()>',
        },
        #'upload': {
        #  'duration': 0.,
        #  'items_cold': '<large.pack()>',
        #  'items_hot': '<large.pack()>',
        #},
      },
    },
    #'cipd_pins': {
    #  'packages': [
    #    {'package_name': ..., 'version': ..., 'path': ...},
    #    ...
    #  ],
    #  'client_package': {'package_name': ..., 'version': ...},
    #},
    'outputs_ref': None,
    'version': 5,
  }

  if data.root_dir:
    file_path.ensure_tree(data.root_dir, 0o700)
  elif data.isolate_cache.cache_dir:
    data = data._replace(
        root_dir=os.path.dirname(data.isolate_cache.cache_dir))
  # See comment for these constants.
  # If root_dir is not specified, it is not constant.
  # TODO(maruel): This is not obvious. Change this to become an error once we
  # make the constant_run_path an exposed flag.
  if constant_run_path and data.root_dir:
    run_dir = os.path.join(data.root_dir, ISOLATED_RUN_DIR)
    if os.path.isdir(run_dir):
      file_path.rmtree(run_dir)
    os.mkdir(run_dir, 0o700)
  else:
    run_dir = make_temp_dir(ISOLATED_RUN_DIR, data.root_dir)
  # storage should be normally set but don't crash if it is not. This can happen
  # as Swarming task can run without an isolate server.
  out_dir = make_temp_dir(
      ISOLATED_OUT_DIR, data.root_dir) if data.storage else None
  tmp_dir = make_temp_dir(ISOLATED_TMP_DIR, data.root_dir)
  cwd = run_dir
  if data.relative_cwd:
    cwd = os.path.normpath(os.path.join(cwd, data.relative_cwd))
  command = data.command
  try:
    with data.install_packages_fn(run_dir) as cipd_info:
      if cipd_info:
        result['stats']['cipd'] = cipd_info.stats
        result['cipd_pins'] = cipd_info.pins

      if data.isolated_hash:
        isolated_stats = result['stats'].setdefault('isolated', {})
        bundle, stats = fetch_and_map(
            isolated_hash=data.isolated_hash,
            storage=data.storage,
            cache=data.isolate_cache,
            outdir=run_dir,
            use_symlinks=data.use_symlinks)
        isolated_stats['download'].update(stats)
        change_tree_read_only(run_dir, bundle.read_only)
        # Inject the command
        if not command and bundle.command:
          command = bundle.command + data.extra_args
          # Only set the relative directory if the isolated file specified a
          # command, and no raw command was specified.
          if bundle.relative_cwd:
            cwd = os.path.normpath(os.path.join(cwd, bundle.relative_cwd))

      if not command:
        # Handle this as a task failure, not an internal failure.
        sys.stderr.write(
            '<No command was specified!>\n'
            '<Please secify a command when triggering your Swarming task>\n')
        result['exit_code'] = 1
        # Clear the pessimistic default, otherwise this would be reported as
        # an internal failure after all.
        result['internal_failure'] = None
        return result

      # A bare string prefix test would accept a sibling directory whose name
      # merely starts with the run directory name (e.g. 'ir_evil' for 'ir'),
      # so require either the run directory itself or a path below it.
      if cwd != run_dir and not cwd.startswith(run_dir + os.path.sep):
        # Handle this as a task failure, not an internal failure. This is a
        # 'last chance' way to gate against directory escape.
        sys.stderr.write('<Relative CWD is outside of run directory!>\n')
        result['exit_code'] = 1
        result['internal_failure'] = None
        return result

      if not os.path.isdir(cwd):
        # Accepts relative_cwd that does not exist.
        os.makedirs(cwd, 0o700)

      # If we have an explicit list of files to return, make sure their
      # directories exist now.
      if data.storage and data.outputs:
        isolateserver.create_directories(run_dir, data.outputs)

      with data.install_named_caches(run_dir):
        sys.stdout.flush()
        start = time.time()
        try:
          # Need to switch the default account before 'get_command_env' call,
          # so it can grab correct value of LUCI_CONTEXT env var.
          with set_luci_context_account(data.switch_to_account, tmp_dir):
            env = get_command_env(
                tmp_dir, cipd_info, run_dir, data.env, data.env_prefix, out_dir,
                data.bot_file)
            command = tools.fix_python_cmd(command, env)
            command = process_command(command, out_dir, data.bot_file)
            file_path.ensure_command_has_abs_path(command, cwd)

            result['exit_code'], result['had_hard_timeout'] = run_command(
                command, cwd, env, data.hard_timeout, data.grace_period)
        finally:
          # Record the duration even when running the command raised.
          result['duration'] = max(time.time() - start, 0)

    # We successfully ran the command, set internal_failure back to
    # None (even if the command failed, it's not an internal error).
    result['internal_failure'] = None
  except Exception as e:
    # An internal error occurred. Report accordingly so the swarming task will
    # be retried automatically.
    logging.exception('internal failure: %s', e)
    result['internal_failure'] = str(e)
    on_error.report(None)

  # Clean up
  finally:
    try:
      # Try to link files to the output directory, if specified.
      if out_dir:
        link_outputs_to_outdir(run_dir, out_dir, data.outputs)

      success = False
      if data.leak_temp_dir:
        success = True
        logging.warning(
            'Deliberately leaking %s for later examination', run_dir)
      else:
        # On Windows rmtree(run_dir) call above has a synchronization effect: it
        # finishes only when all task child processes terminate (since a running
        # process locks *.exe file). Examine out_dir only after that call
        # completes (since child processes may write to out_dir too and we need
        # to wait for them to finish).
        if fs.isdir(run_dir):
          try:
            success = file_path.rmtree(run_dir)
          except OSError as e:
            logging.error('rmtree(%r) failed: %s', run_dir, e)
            success = False
          if not success:
            sys.stderr.write(OUTLIVING_ZOMBIE_MSG % ('run', data.grace_period))
            if result['exit_code'] == 0:
              result['exit_code'] = 1
        if fs.isdir(tmp_dir):
          try:
            success = file_path.rmtree(tmp_dir)
          except OSError as e:
            logging.error('rmtree(%r) failed: %s', tmp_dir, e)
            success = False
          if not success:
            sys.stderr.write(OUTLIVING_ZOMBIE_MSG % ('temp', data.grace_period))
            if result['exit_code'] == 0:
              result['exit_code'] = 1

      # This deletes out_dir if leak_temp_dir is not set.
      if out_dir:
        isolated_stats = result['stats'].setdefault('isolated', {})
        result['outputs_ref'], success, isolated_stats['upload'] = (
            delete_and_upload(data.storage, out_dir, data.leak_temp_dir))
      if not success and result['exit_code'] == 0:
        result['exit_code'] = 1
    except Exception as e:
      # Swallow any exception in the main finally clause.
      if out_dir:
        logging.exception('Leaking out_dir %s: %s', out_dir, e)
      result['internal_failure'] = str(e)
  return result
Marc-Antoine Ruel2283ad12014-02-09 11:14:57 -0500818
819
def run_tha_test(data, result_json):
  """Runs an executable and records execution metadata.

  The actual work is delegated to map_and_run(), always with a constant run
  path. When an isolated hash is specified, the dependencies are downloaded in
  the cache, mapped into a temporary directory and the command specified in the
  .isolated is run.

  A temporary directory is created to hold the output files. The content inside
  this directory will be uploaded back to |storage| packaged as a .isolated
  file.

  Arguments:
  - data: TaskData instance.
  - result_json: File path to dump result metadata into. If set, the process
        exit code is always 0 unless an internal error occurred.

  Returns:
    Process exit code that should be used.
  """
  if result_json:
    # Leave a pessimistic result on disk right away, in case the process gets
    # killed before the real one can be written.
    tools.write_json(
        result_json,
        {
          'exit_code': None,
          'had_hard_timeout': False,
          'internal_failure': 'Was terminated before completion',
          'outputs_ref': None,
          'version': 5,
        },
        dense=True)

  result = map_and_run(data, True)
  logging.info('Result:\n%s', tools.format_json(result, dense=True))

  # 1 if run_isolated itself failed, 0 otherwise.
  internal_error = int(bool(result['internal_failure']))

  if not result_json:
    # No json file requested: marshall into old-style inline output and
    # propagate the task exit code.
    outputs_ref = result['outputs_ref']
    if outputs_ref:
      legacy_ref = {
        'hash': outputs_ref['isolated'],
        'namespace': outputs_ref['namespace'],
        'storage': outputs_ref['isolatedserver'],
      }
      sys.stdout.flush()
      print(
          '[run_isolated_out_hack]%s[/run_isolated_out_hack]' %
          tools.format_json(legacy_ref, dense=True))
      sys.stdout.flush()
    return result['exit_code'] or internal_error

  # We've found tests to delete 'work' when quitting, causing an exception
  # here. Try to recreate the directory if necessary.
  file_path.ensure_tree(os.path.dirname(result_json))
  tools.write_json(result_json, result, dense=True)
  # The task exit code lives in the json file; only report internal errors.
  return internal_error
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +0000875
876
# Value yielded by the 'install_client_and_packages' context manager. Fields:
# - client: cipd.CipdClient object.
# - cache_dir: absolute path to bot-global cipd tag and instance cache.
# - stats: dict with stats to return to the server.
# - pins: dict with installed cipd pins to return to the server.
CipdInfo = collections.namedtuple(
    'CipdInfo', ('client', 'cache_dir', 'stats', 'pins'))
884
885
@contextlib.contextmanager
def noop_install_packages(_run_dir):
  """Stand-in for 'install_client_and_packages' when cipd is disabled.

  Installs nothing and yields None where the real context manager yields a
  CipdInfo.
  """
  yield
890
891
iannuccib58d10d2017-03-18 02:00:25 -0700892def _install_packages(run_dir, cipd_cache_dir, client, packages, timeout):
893 """Calls 'cipd ensure' for packages.
894
895 Args:
896 run_dir (str): root of installation.
897 cipd_cache_dir (str): the directory to use for the cipd package cache.
898 client (CipdClient): the cipd client to use
899 packages: packages to install, list [(path, package_name, version), ...].
900 timeout: max duration in seconds that this function can take.
901
902 Returns: list of pinned packages. Looks like [
903 {
904 'path': 'subdirectory',
905 'package_name': 'resolved/package/name',
906 'version': 'deadbeef...',
907 },
908 ...
909 ]
910 """
911 package_pins = [None]*len(packages)
912 def insert_pin(path, name, version, idx):
913 package_pins[idx] = {
914 'package_name': name,
915 # swarming deals with 'root' as '.'
916 'path': path or '.',
917 'version': version,
918 }
919
920 by_path = collections.defaultdict(list)
921 for i, (path, name, version) in enumerate(packages):
922 # cipd deals with 'root' as ''
923 if path == '.':
924 path = ''
925 by_path[path].append((name, version, i))
926
927 pins = client.ensure(
928 run_dir,
929 {
930 subdir: [(name, vers) for name, vers, _ in pkgs]
931 for subdir, pkgs in by_path.iteritems()
932 },
933 cache_dir=cipd_cache_dir,
934 timeout=timeout,
935 )
936
937 for subdir, pin_list in sorted(pins.iteritems()):
938 this_subdir = by_path[subdir]
939 for i, (name, version) in enumerate(pin_list):
940 insert_pin(subdir, name, version, this_subdir[i][2])
941
Robert Iannucci461b30d2017-12-13 11:34:03 -0800942 assert None not in package_pins, (packages, pins, package_pins)
iannuccib58d10d2017-03-18 02:00:25 -0700943
944 return package_pins
945
946
@contextlib.contextmanager
def install_client_and_packages(
    run_dir, packages, service_url, client_package_name,
    client_version, cache_dir, timeout=None):
  """Bootstraps CIPD client and installs CIPD packages.

  Yields a single CipdInfo object carrying the CipdClient, the cipd cache
  directory, the stats and the pins.

  The package pins are in the form of:
    [
      {
        "path": path, "package_name": package_name, "version": version,
      },
      ...
    ]
  and the CIPD client info is a single dictionary with "package_name" and
  "version" instead of a list.

  The package pins correspond 1:1 to all input package arguments from the
  command line. These dictionaries make their way all the way back to swarming,
  where they become the arguments of CipdPackage.

  If 'packages' list is empty, will bootstrap CIPD client, but won't install
  any packages.

  The bootstrapped client (regardless whether 'packages' list is empty or not),
  will be made available to the task via $PATH.

  Args:
    run_dir (str): root of installation.
    packages: packages to install, list [(path, package_name, version), ...].
    service_url (str): CIPD server url, e.g.
      "https://chrome-infra-packages.appspot.com."
    client_package_name (str): CIPD package name of CIPD client.
    client_version (str): Version of CIPD client.
    cache_dir (str): where to keep cache of cipd clients, packages and tags.
    timeout: max duration in seconds that this function can take.
  """
  assert cache_dir

  # Called once per step below; presumably hands out what is left of the
  # overall timeout each time - see tools.sliding_timeout.
  timeoutfn = tools.sliding_timeout(timeout)
  start = time.time()

  cache_dir = os.path.abspath(cache_dir)
  run_dir = os.path.abspath(run_dir)
  # The tag and instance caches live in a subdirectory of the client cache.
  cipd_cache_dir = os.path.join(cache_dir, 'cache')

  get_client_start = time.time()
  with cipd.get_client(
      service_url, client_package_name, client_version, cache_dir,
      timeout=timeoutfn()) as client:
    get_client_duration = time.time() - get_client_start

    if packages:
      package_pins = _install_packages(
          run_dir, cipd_cache_dir, client, packages, timeoutfn())
    else:
      package_pins = []

    file_path.make_tree_files_read_only(run_dir)

    total_duration = time.time() - start
    logging.info(
        'Installing CIPD client and packages took %d seconds', total_duration)

    stats = {
      'duration': total_duration,
      'get_client_duration': get_client_duration,
    }
    pins = {
      'client_package': {
        'package_name': client.package_name,
        'version': client.instance_id,
      },
      'packages': package_pins,
    }
    yield CipdInfo(
        client=client, cache_dir=cipd_cache_dir, stats=stats, pins=pins)
nodirbe642ff2016-06-09 15:51:51 -07001027
1028
def create_option_parser():
  """Creates the option parser for the run_isolated command line.

  Besides the options declared here, the isolate server, cache, CIPD and
  authentication options are registered by their respective modules.

  Returns:
    The configured logging_utils.OptionParserWithLogging instance.
  """
  parser = logging_utils.OptionParserWithLogging(
      usage='%prog <options> [command to run or extra args]',
      version=__version__,
      log_file=RUN_ISOLATED_LOG_FILE)
  parser.add_option(
      '--clean', action='store_true',
      help='Cleans the cache, trimming it if necessary and removing corrupted '
           'items, and returns without executing anything; use with -v to '
           'know what was done')
  parser.add_option(
      '--use-symlinks', action='store_true',
      help='Use symlinks instead of hardlinks')
  parser.add_option(
      '--json',
      help='dump output metadata to json file. When used, run_isolated returns '
           'non-zero only on internal failure')
  parser.add_option(
      '--hard-timeout', type='float', help='Enforce hard timeout in execution')
  parser.add_option(
      '--grace-period', type='float',
      help='Grace period between SIGTERM and SIGKILL')
  parser.add_option(
      '--raw-cmd', action='store_true',
      help='Ignore the isolated command, use the one supplied at the command '
           'line')
  parser.add_option(
      '--relative-cwd',
      help='Ignore the isolated \'relative_cwd\' and use this one instead; '
           'requires --raw-cmd')
  parser.add_option(
      '--env', default=[], action='append',
      help='Environment variables to set for the child process')
  parser.add_option(
      '--env-prefix', default=[], action='append',
      help='Specify a VAR=./path/fragment to put in the environment variable '
           'before executing the command. The path fragment must be relative '
           'to the isolated run directory, and must not contain a `..` token. '
           'The path will be made absolute and prepended to the indicated '
           '$VAR using the OS\'s path separator. Multiple items for the same '
           '$VAR will be prepended in order.')
  parser.add_option(
      '--bot-file',
      help='Path to a file describing the state of the host. The content is '
           'defined by on_before_task() in bot_config.')
  parser.add_option(
      '--switch-to-account',
      help='If given, switches LUCI_CONTEXT to given logical service account '
           '(e.g. "task" or "system") before launching the isolated process.')
  parser.add_option(
      '--output', action='append',
      # The placeholder is spelled with curly braces, as everywhere else.
      help='Specifies an output to return. If no outputs are specified, all '
           'files located in ${ISOLATED_OUTDIR} will be returned; '
           'otherwise, outputs in both ${ISOLATED_OUTDIR} and those '
           'specified by --output option (there can be multiple) will be '
           'returned. Note that if a file in OUT_DIR has the same path '
           'as an --output option, the --output version will be returned.')
  parser.add_option(
      '-a', '--argsfile',
      # This is actually handled in parse_args; it's included here purely so it
      # can make it into the help text.
      help='Specify a file containing a JSON array of arguments to this '
           'script. If --argsfile is provided, no other argument may be '
           'provided on the command line.')

  data_group = optparse.OptionGroup(parser, 'Data source')
  data_group.add_option(
      '-s', '--isolated',
      help='Hash of the .isolated to grab from the isolate server.')
  isolateserver.add_isolate_server_options(data_group)
  parser.add_option_group(data_group)

  isolateserver.add_cache_options(parser)

  cipd.add_cipd_options(parser)

  group = optparse.OptionGroup(parser, 'Named caches')
  group.add_option(
      '--named-cache',
      dest='named_caches',
      action='append',
      nargs=3,
      default=[],
      help='A named cache to request. Accepts 3 arguments: name, path, hint. '
           'name identifies the cache, must match regex [a-z0-9_]{1,4096}. '
           'path is a path relative to the run dir where the cache directory '
           'must be put to. '
           'hint is the expected size in bytes of the cache, used to free up '
           'disk space when the cache is not present yet; it must be a '
           'number. '
           'This option can be specified more than once.')
  group.add_option(
      '--named-cache-root', default='named_caches',
      help='Cache root directory. Default=%default')
  parser.add_option_group(group)

  debug_group = optparse.OptionGroup(parser, 'Debugging')
  debug_group.add_option(
      '--leak-temp-dir',
      action='store_true',
      help='Deliberately leak isolate\'s temp dir for later examination. '
           'Default: %default')
  debug_group.add_option(
      '--root-dir', help='Use a directory instead of a random one')
  parser.add_option_group(debug_group)

  auth.add_auth_options(parser)

  parser.set_defaults(cache='cache', cipd_cache='cipd_cache')
  return parser
1135
1136
def process_named_cache_options(parser, options, time_fn=None):
  """Validates the named cache options and creates the named cache.

  parser.error() is called when --named-cache is used with an empty
  --named-cache-root, or when a cache name, path or hint is invalid.

  Arguments:
  - parser: option parser, used to report invalid options.
  - options: parsed options; named_caches, named_cache_root and min_free_space
        are read.
  - time_fn: passed through as is to local_caching.NamedCache.

  Returns:
    A local_caching.NamedCache rooted at the absolute --named-cache-root, or
    None when --named-cache-root is empty.
  """
  cache_root = options.named_cache_root
  if not cache_root and options.named_caches:
    parser.error('--named-cache is specified, but --named-cache-root is empty')

  for name, path, hint in options.named_caches:
    if not CACHE_NAME_RE.match(name):
      parser.error(
          'cache name %r does not match %r' % (name, CACHE_NAME_RE.pattern))
    if not path:
      parser.error('cache path cannot be empty')
    try:
      # Only checks that the hint parses; the value is consumed elsewhere.
      long(hint)
    except ValueError:
      parser.error('cache hint must be a number')

  if not cache_root:
    return None

  # Make these configurable later if there is use case but for now it's fairly
  # safe values.
  # In practice, a fair chunk of bots are already recycled on a daily schedule
  # so this code doesn't have any effect to them, unless they are preloaded
  # with a really old cache.
  one_tib = 1024*1024*1024*1024
  policies = local_caching.CachePolicies(
      max_cache_size=one_tib,
      min_free_space=options.min_free_space,
      max_items=50,
      max_age_secs=MAX_AGE_SECS)
  return local_caching.NamedCache(
      unicode(os.path.abspath(cache_root)), policies, time_fn=time_fn)
1166
1167
def parse_args(args):
  """Parses the command line, optionally reading it from an --argsfile.

  When -a/--argsfile is given, it must be the only argument; the actual
  arguments are then loaded from that file, which contains a JSON array.

  Arguments:
  - args: list of command line arguments, without the program name.

  Returns:
    Tuple (parser, options, args) where parser is the option parser that was
    used, options the parsed options and args the remaining positional
    arguments.
  """
  # Create a fake mini-parser just to get out the "-a" command. Note that
  # it's not documented here; instead, it's documented in create_option_parser
  # even though that parser will never actually get to parse it. This is
  # because --argsfile is exclusive with all other options and arguments.
  file_argparse = argparse.ArgumentParser(add_help=False)
  file_argparse.add_argument('-a', '--argsfile')
  (file_args, nonfile_args) = file_argparse.parse_known_args(args)
  if file_args.argsfile:
    if nonfile_args:
      file_argparse.error(
          'Can\'t specify --argsfile with any other arguments (%s)' %
          nonfile_args)
    try:
      with open(file_args.argsfile, 'r') as f:
        args = json.load(f)
    except (IOError, OSError, ValueError) as e:
      # We don't need to error out here. Report the problem and carry on with
      # an empty argument list, so the stale "-a <file>" pair is not parsed as
      # if it were the real command line; the regular validation then
      # complains about what is missing.
      sys.stderr.write('Couldn\'t read arguments: %s\n' % e)
      args = []

  # Even if we failed to read the args, just call the normal parser now since it
  # will print the correct help message.
  parser = create_option_parser()
  options, args = parser.parse_args(args)
  return (parser, options, args)
1194
1195
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001196def _calc_named_cache_hint(named_cache, named_caches):
1197 """Returns the expected size of the missing named caches."""
1198 present = named_cache.available
1199 size = 0
1200 for name, _, hint in named_caches:
1201 if name not in present:
1202 hint = long(hint)
1203 if hint > 0:
1204 size += hint
1205 return size
1206
1207
aludwin7556e0c2016-10-26 08:46:10 -07001208def main(args):
Marc-Antoine Ruelee6ca622017-11-29 11:19:16 -05001209 # Warning: when --argsfile is used, the strings are unicode instances, when
1210 # parsed normally, the strings are str instances.
aludwin7556e0c2016-10-26 08:46:10 -07001211 (parser, options, args) = parse_args(args)
maruel36a963d2016-04-08 17:15:49 -07001212
Marc-Antoine Ruel5028ba22017-08-25 17:37:51 -04001213 if not file_path.enable_symlink():
Marc-Antoine Ruel5a024272019-01-15 20:11:16 +00001214 logging.warning('Symlink support is not enabled')
Marc-Antoine Ruel5028ba22017-08-25 17:37:51 -04001215
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001216 named_cache = process_named_cache_options(parser, options)
Marc-Antoine Ruel0d8b0f62018-09-10 14:40:35 +00001217 # hint is 0 if there's no named cache.
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001218 hint = _calc_named_cache_hint(named_cache, options.named_caches)
1219 if hint:
1220 # Increase the --min-free-space value by the hint, and recreate the
1221 # NamedCache instance so it gets the updated CachePolicy.
1222 options.min_free_space += hint
1223 named_cache = process_named_cache_options(parser, options)
1224
Marc-Antoine Ruel7139d912018-06-15 20:04:42 +00001225 # TODO(maruel): CIPD caches should be defined at an higher level here too, so
1226 # they can be cleaned the same way.
nodirf33b8d62016-10-26 22:34:58 -07001227 isolate_cache = isolateserver.process_cache_options(options, trim=False)
Marc-Antoine Ruel7139d912018-06-15 20:04:42 +00001228 caches = []
1229 if isolate_cache:
1230 caches.append(isolate_cache)
1231 if named_cache:
1232 caches.append(named_cache)
1233 root = caches[0].cache_dir if caches else unicode(os.getcwd())
maruel36a963d2016-04-08 17:15:49 -07001234 if options.clean:
1235 if options.isolated:
1236 parser.error('Can\'t use --isolated with --clean.')
1237 if options.isolate_server:
1238 parser.error('Can\'t use --isolate-server with --clean.')
1239 if options.json:
1240 parser.error('Can\'t use --json with --clean.')
nodirf33b8d62016-10-26 22:34:58 -07001241 if options.named_caches:
1242 parser.error('Can\t use --named-cache with --clean.')
Marc-Antoine Ruel7139d912018-06-15 20:04:42 +00001243 # Trim first, then clean.
1244 local_caching.trim_caches(
1245 caches,
1246 root,
1247 min_free_space=options.min_free_space,
1248 max_age_secs=MAX_AGE_SECS)
1249 for c in caches:
Marc-Antoine Ruel87fc2222018-06-18 13:09:24 +00001250 c.cleanup()
maruel36a963d2016-04-08 17:15:49 -07001251 return 0
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001252
1253 # Trim must still be done for the following case:
1254 # - named-cache was used
1255 # - some entries, with a large hint, where missing
1256 # - --min-free-space was increased accordingly, thus trimming is needed
1257 # Otherwise, this will have no effect, as bot_main calls run_isolated with
1258 # --clean after each task.
1259 if hint:
1260 logging.info('Additional trimming of %d bytes', hint)
Marc-Antoine Ruel0d8b0f62018-09-10 14:40:35 +00001261 local_caching.trim_caches(
1262 caches,
1263 root,
1264 min_free_space=options.min_free_space,
1265 max_age_secs=MAX_AGE_SECS)
maruel36a963d2016-04-08 17:15:49 -07001266
nodir55be77b2016-05-03 09:39:57 -07001267 if not options.isolated and not args:
1268 parser.error('--isolated or command to run is required.')
1269
Vadim Shtayura5d1efce2014-02-04 10:55:43 -08001270 auth.process_auth_options(parser, options)
nodir55be77b2016-05-03 09:39:57 -07001271
1272 isolateserver.process_isolate_server_options(
Marc-Antoine Ruel5028ba22017-08-25 17:37:51 -04001273 parser, options, True, False)
nodir55be77b2016-05-03 09:39:57 -07001274 if not options.isolate_server:
1275 if options.isolated:
1276 parser.error('--isolated requires --isolate-server')
1277 if ISOLATED_OUTDIR_PARAMETER in args:
1278 parser.error(
1279 '%s in args requires --isolate-server' % ISOLATED_OUTDIR_PARAMETER)
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001280
nodir90bc8dc2016-06-15 13:35:21 -07001281 if options.root_dir:
1282 options.root_dir = unicode(os.path.abspath(options.root_dir))
maruel12e30012015-10-09 11:55:35 -07001283 if options.json:
1284 options.json = unicode(os.path.abspath(options.json))
nodir55be77b2016-05-03 09:39:57 -07001285
Marc-Antoine Ruel19dd8872017-11-28 18:33:39 -05001286 if any('=' not in i for i in options.env):
1287 parser.error(
1288 '--env required key=value form. value can be skipped to delete '
1289 'the variable')
Marc-Antoine Ruel7a68f712017-12-01 18:45:18 -05001290 options.env = dict(i.split('=', 1) for i in options.env)
Marc-Antoine Ruel19dd8872017-11-28 18:33:39 -05001291
1292 prefixes = {}
1293 cwd = os.path.realpath(os.getcwd())
1294 for item in options.env_prefix:
1295 if '=' not in item:
1296 parser.error(
1297 '--env-prefix %r is malformed, must be in the form `VAR=./path`'
1298 % item)
Marc-Antoine Ruel7a68f712017-12-01 18:45:18 -05001299 key, opath = item.split('=', 1)
Marc-Antoine Ruel19dd8872017-11-28 18:33:39 -05001300 if os.path.isabs(opath):
1301 parser.error('--env-prefix %r path is bad, must be relative.' % opath)
1302 opath = os.path.normpath(opath)
1303 if not os.path.realpath(os.path.join(cwd, opath)).startswith(cwd):
1304 parser.error(
1305 '--env-prefix %r path is bad, must be relative and not contain `..`.'
1306 % opath)
1307 prefixes.setdefault(key, []).append(opath)
1308 options.env_prefix = prefixes
Robert Iannuccibf5f84c2017-11-22 12:56:50 -08001309
nodirbe642ff2016-06-09 15:51:51 -07001310 cipd.validate_cipd_options(parser, options)
1311
vadimsh232f5a82017-01-20 19:23:44 -08001312 install_packages_fn = noop_install_packages
vadimsh902948e2017-01-20 15:57:32 -08001313 if options.cipd_enabled:
iannuccib58d10d2017-03-18 02:00:25 -07001314 install_packages_fn = lambda run_dir: install_client_and_packages(
vadimsh902948e2017-01-20 15:57:32 -08001315 run_dir, cipd.parse_package_args(options.cipd_packages),
1316 options.cipd_server, options.cipd_client_package,
1317 options.cipd_client_version, cache_dir=options.cipd_cache)
nodirbe642ff2016-06-09 15:51:51 -07001318
@contextlib.contextmanager
def install_named_caches(run_dir):
  """Installs the requested named caches under run_dir while the context is open.

  On entry, each (name, relpath, _) entry of options.named_caches is installed
  at os.path.join(run_dir, relpath). On exit, including when the body raises,
  the caches are uninstalled in the reverse order of installation.

  WARNING: this function depends on the "options" and "named_cache" variables
  defined in the outer function.

  Arguments:
    run_dir: absolute path of the directory the caches are mapped into.
  """
  # NOTE(review): unicode(run_dir) is only a truthiness check; an
  # isinstance(run_dir, unicode) check may have been intended. Left as-is to
  # avoid changing behavior for existing callers.
  assert unicode(run_dir), repr(run_dir)
  assert os.path.isabs(run_dir), run_dir
  named_caches = [
    (os.path.join(run_dir, unicode(relpath)), name)
    for name, relpath, _ in options.named_caches
  ]
  for path, name in named_caches:
    named_cache.install(path, name)
  try:
    yield
  finally:
    # Uninstall each named cache, returning it to the cache pool. If an
    # uninstall fails for a given cache, it will remain in the task's
    # temporary space, get cleaned up by the Swarming bot, and be lost.
    #
    # If the Swarming bot cannot clean up the cache, it will handle it like
    # any other bot file that could not be removed.
    for path, name in reversed(named_caches):
      try:
        # uninstall() doesn't trim but does call save() implicitly. Trimming
        # *must* be done manually via periodic 'run_isolated.py --clean'.
        named_cache.uninstall(path, name)
      except local_caching.NamedCacheError:
        # The message reads "named cache <name> at <path>", so the arguments
        # must be passed in that order.
        logging.exception(
            'Error while removing named cache %r at %r. '
            'The cache will be lost.', name, path)
nodirf33b8d62016-10-26 22:34:58 -07001348
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -05001349 extra_args = []
1350 command = []
1351 if options.raw_cmd:
1352 command = args
Marc-Antoine Ruel95068cf2017-12-07 21:35:05 -05001353 if options.relative_cwd:
1354 a = os.path.normpath(os.path.abspath(options.relative_cwd))
1355 if not a.startswith(os.getcwd()):
1356 parser.error(
1357 '--relative-cwd must not try to escape the working directory')
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -05001358 else:
Marc-Antoine Ruel95068cf2017-12-07 21:35:05 -05001359 if options.relative_cwd:
1360 parser.error('--relative-cwd requires --raw-cmd')
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -05001361 extra_args = args
1362
1363 data = TaskData(
1364 command=command,
Marc-Antoine Ruel95068cf2017-12-07 21:35:05 -05001365 relative_cwd=options.relative_cwd,
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -05001366 extra_args=extra_args,
1367 isolated_hash=options.isolated,
1368 storage=None,
1369 isolate_cache=isolate_cache,
1370 outputs=options.output,
1371 install_named_caches=install_named_caches,
1372 leak_temp_dir=options.leak_temp_dir,
1373 root_dir=_to_unicode(options.root_dir),
1374 hard_timeout=options.hard_timeout,
1375 grace_period=options.grace_period,
1376 bot_file=options.bot_file,
1377 switch_to_account=options.switch_to_account,
1378 install_packages_fn=install_packages_fn,
1379 use_symlinks=options.use_symlinks,
1380 env=options.env,
1381 env_prefix=options.env_prefix)
nodirbe642ff2016-06-09 15:51:51 -07001382 try:
nodir90bc8dc2016-06-15 13:35:21 -07001383 if options.isolate_server:
Marc-Antoine Ruelb8513132018-11-20 19:48:53 +00001384 server_ref = isolate_storage.ServerRef(
nodir90bc8dc2016-06-15 13:35:21 -07001385 options.isolate_server, options.namespace)
Marc-Antoine Ruelb8513132018-11-20 19:48:53 +00001386 storage = isolateserver.get_storage(server_ref)
nodir90bc8dc2016-06-15 13:35:21 -07001387 with storage:
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -05001388 data = data._replace(storage=storage)
nodirf33b8d62016-10-26 22:34:58 -07001389 # Hashing schemes used by |storage| and |isolate_cache| MUST match.
Marc-Antoine Ruelb8513132018-11-20 19:48:53 +00001390 assert storage.server_ref.hash_algo == server_ref.hash_algo
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -05001391 return run_tha_test(data, options.json)
1392 return run_tha_test(data, options.json)
Marc-Antoine Ruel8b11dbd2018-05-18 14:31:22 -04001393 except (
1394 cipd.Error,
1395 local_caching.NamedCacheError,
Marc-Antoine Ruelb6e9e232018-11-20 00:12:33 +00001396 local_caching.NoMoreSpace) as ex:
nodirbe642ff2016-06-09 15:51:51 -07001397 print >> sys.stderr, ex.message
1398 return 1
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001399
1400
if __name__ == '__main__':
  # Script entry point: set up the process, run main() on the command line
  # arguments (program name excluded) and exit with the code it returns.
  subprocess42.inhibit_os_error_reporting()
  # Fix up the encoding before main() runs so the whole run uses the correct
  # one.
  fix_encoding.fix_encoding()
  exit_code = main(sys.argv[1:])
  sys.exit(exit_code)
Marc-Antoine Ruel90c98162013-12-18 15:11:57 -05001405 sys.exit(main(sys.argv[1:]))