blob: 0ba51d767625cde33bf17467e5179376be037f72 [file] [log] [blame]
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001#!/usr/bin/env python
maruelea586f32016-04-05 11:11:33 -07002# Copyright 2012 The LUCI Authors. All rights reserved.
maruelf1f5e2a2016-05-25 17:10:39 -07003# Use of this source code is governed under the Apache License, Version 2.0
4# that can be found in the LICENSE file.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00005
nodir55be77b2016-05-03 09:39:57 -07006"""Runs a command with optional isolated input/output.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00007
Marc-Antoine Rueleed2f3a2019-03-14 00:00:40 +00008run_isolated takes care of setting up a temporary environment, running a
9command, and tearing it down.
nodir55be77b2016-05-03 09:39:57 -070010
Marc-Antoine Rueleed2f3a2019-03-14 00:00:40 +000011It handles downloading and uploading isolated files, mapping CIPD packages and
12reusing stateful named caches.
13
14The isolated files, CIPD packages and named caches are kept as a global LRU
15cache.
Marc-Antoine Ruel2283ad12014-02-09 11:14:57 -050016
Roberto Carrillo71ade6d2018-10-08 22:30:24 +000017Any ${EXECUTABLE_SUFFIX} on the command line or the environment variables passed
18with the --env option will be replaced with ".exe" string on Windows and "" on
19other platforms.
nodirbe642ff2016-06-09 15:51:51 -070020
Roberto Carrillo71ade6d2018-10-08 22:30:24 +000021Any ${ISOLATED_OUTDIR} on the command line or the environment variables passed
22with the --env option will be replaced by the location of a temporary directory
23upon execution of the command specified in the .isolated file. All content
24written to this directory will be uploaded upon termination and the .isolated
25file describing this directory will be printed to stdout.
bpastene447c1992016-06-20 15:21:47 -070026
Marc-Antoine Rueleed2f3a2019-03-14 00:00:40 +000027Any ${SWARMING_BOT_FILE} on the command line or the environment variables passed
28with the --env option will be replaced by the value of the --bot-file parameter.
29This file is used by a swarming bot to communicate state of the host to tasks.
30It is written to by the swarming bot's on_before_task() hook in the swarming
31server's custom bot_config.py.
32
33See
34https://chromium.googlesource.com/infra/luci/luci-py.git/+/master/appengine/swarming/doc/Magic-Values.md
35for all the variables.
36
37See
38https://chromium.googlesource.com/infra/luci/luci-py.git/+/master/appengine/swarming/swarming_bot/config/bot_config.py
39for more information about bot_config.py.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000040"""
41
Marc-Antoine Rueleed2f3a2019-03-14 00:00:40 +000042__version__ = '1.0.0'
maruel@chromium.orgdedbf492013-09-12 20:42:11 +000043
aludwin7556e0c2016-10-26 08:46:10 -070044import argparse
maruel064c0a32016-04-05 11:47:15 -070045import base64
iannucci96fcccc2016-08-30 15:52:22 -070046import collections
vadimsh232f5a82017-01-20 19:23:44 -080047import contextlib
Sadaf Matinkhoo10743a62018-03-29 16:28:58 -040048import errno
aludwin7556e0c2016-10-26 08:46:10 -070049import json
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000050import logging
51import optparse
52import os
Marc-Antoine Ruel8b11dbd2018-05-18 14:31:22 -040053import re
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000054import sys
55import tempfile
maruel064c0a32016-04-05 11:47:15 -070056import time
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000057
vadimsh@chromium.orga4326472013-08-24 02:05:41 +000058from third_party.depot_tools import fix_encoding
59
Vadim Shtayura6b555c12014-07-23 16:22:18 -070060from utils import file_path
maruel12e30012015-10-09 11:55:35 -070061from utils import fs
maruel064c0a32016-04-05 11:47:15 -070062from utils import large
Marc-Antoine Ruelf74cffe2015-07-15 15:21:34 -040063from utils import logging_utils
Marc-Antoine Ruelcfb60852014-07-02 15:22:00 -040064from utils import on_error
Marc-Antoine Ruelc44f5722015-01-08 16:10:01 -050065from utils import subprocess42
vadimsh@chromium.orga4326472013-08-24 02:05:41 +000066from utils import tools
vadimsh@chromium.org8b9d56b2013-08-21 22:24:35 +000067
vadimsh9c54b2c2017-07-25 14:08:29 -070068from libs import luci_context
69
Vadim Shtayurae34e13a2014-02-02 11:23:26 -080070import auth
nodirbe642ff2016-06-09 15:51:51 -070071import cipd
maruel@chromium.orgdedbf492013-09-12 20:42:11 +000072import isolateserver
Marc-Antoine Ruelb8513132018-11-20 19:48:53 +000073import isolate_storage
Marc-Antoine Ruel8b11dbd2018-05-18 14:31:22 -040074import local_caching
maruel@chromium.orgdedbf492013-09-12 20:42:11 +000075
vadimsh@chromium.orga4326472013-08-24 02:05:41 +000076
maruele2f2cb82016-07-13 14:41:03 -070077# Magic variables that can be found in the isolate task command line.
78ISOLATED_OUTDIR_PARAMETER = '${ISOLATED_OUTDIR}'
79EXECUTABLE_SUFFIX_PARAMETER = '${EXECUTABLE_SUFFIX}'
80SWARMING_BOT_FILE_PARAMETER = '${SWARMING_BOT_FILE}'
81
82
csharp@chromium.orgff2a4662012-11-21 20:49:32 +000083# The name of the log file to use.
84RUN_ISOLATED_LOG_FILE = 'run_isolated.log'
85
maruele2f2cb82016-07-13 14:41:03 -070086
csharp@chromium.orge217f302012-11-22 16:51:53 +000087# The name of the log to use for the run_test_cases.py command
vadimsh@chromium.org8b9d56b2013-08-21 22:24:35 +000088RUN_TEST_CASES_LOG = 'run_test_cases.log'
csharp@chromium.orge217f302012-11-22 16:51:53 +000089
vadimsh@chromium.org87d63262013-04-04 19:34:21 +000090
maruele2f2cb82016-07-13 14:41:03 -070091# Use short names for temporary directories. This is driven by Windows, which
92# imposes a relatively short maximum path length of 260 characters, often
93# referred to as MAX_PATH. It is relatively easy to create files with longer
94# path length. A use case is with recursive dependency trees, like npm packages.
95#
96# It is recommended to start the script with a `root_dir` as short as
97# possible.
98# - ir stands for isolated_run
99# - io stands for isolated_out
100# - it stands for isolated_tmp
101ISOLATED_RUN_DIR = u'ir'
102ISOLATED_OUT_DIR = u'io'
103ISOLATED_TMP_DIR = u'it'
104
105
Marc-Antoine Ruel8b11dbd2018-05-18 14:31:22 -0400106# Keep synced with task_request.py
107CACHE_NAME_RE = re.compile(ur'^[a-z0-9_]{1,4096}$')
108
109
marueld928c862017-06-08 08:20:04 -0700110OUTLIVING_ZOMBIE_MSG = """\
111*** Swarming tried multiple times to delete the %s directory and failed ***
112*** Hard failing the task ***
113
114Swarming detected that your testing script ran an executable, which may have
115started a child executable, and the main script returned early, leaving the
116children executables playing around unguided.
117
118You don't want to leave children processes outliving the task on the Swarming
119bot, do you? The Swarming bot doesn't.
120
121How to fix?
122- For any process that starts children processes, make sure all children
123 processes terminated properly before each parent process exits. This is
124 especially important in very deep process trees.
125 - This must be done properly both in normal successful task and in case of
126 task failure. Cleanup is very important.
127- The Swarming bot sends a SIGTERM in case of timeout.
128 - You have %s seconds to comply after the signal was sent to the process
129 before the process is forcibly killed.
130- To achieve not leaking children processes in case of signals on timeout, you
131 MUST handle signals in each executable / python script and propagate them to
132 children processes.
133 - When your test script (python or binary) receives a signal like SIGTERM or
134 CTRL_BREAK_EVENT on Windows), send it to all children processes and wait for
135 them to terminate before quitting.
136
137See
Marc-Antoine Ruelc7243592018-05-24 17:04:04 -0400138https://chromium.googlesource.com/infra/luci/luci-py.git/+/master/appengine/swarming/doc/Bot.md#Graceful-termination_aka-the-SIGTERM-and-SIGKILL-dance
marueld928c862017-06-08 08:20:04 -0700139for more information.
140
141*** May the SIGKILL force be with you ***
142"""
143
144
Marc-Antoine Ruel5d7606b2018-06-15 19:06:12 +0000145# Currently hardcoded. Eventually could be exposed as a flag once there's value.
146# 3 weeks
147MAX_AGE_SECS = 21*24*60*60
148
149
# Immutable bundle of every parameter describing a single task run. An instance
# is what map_and_run() receives as its |data| argument.
TaskData = collections.namedtuple(
    'TaskData', [
      # List of strings; the command line to use, independent of what was
      # specified in the isolated file.
      'command',
      # Relative directory to start command into.
      'relative_cwd',
      # List of strings; the arguments to add to the command specified in the
      # isolated file.
      'extra_args',
      # Hash of the .isolated file that must be retrieved to recreate the tree
      # of files to run the target executable. The command specified in the
      # .isolated is executed. Mutually exclusive with command argument.
      'isolated_hash',
      # isolateserver.Storage instance to retrieve remote objects. This object
      # has a reference to an isolateserver.StorageApi, which does the actual
      # I/O.
      'storage',
      # isolateserver.LocalCache instance to keep from retrieving the same
      # objects constantly by caching the objects retrieved. Can be on-disk or
      # in-memory.
      'isolate_cache',
      # List of paths relative to root_dir to put into the output isolated
      # bundle upon task completion (see link_outputs_to_outdir).
      'outputs',
      # Function (run_dir) => context manager that installs named caches into
      # |run_dir|.
      'install_named_caches',
      # If True, the temporary directory will be deliberately leaked for later
      # examination.
      'leak_temp_dir',
      # Path to the directory to use to create the temporary directory. If not
      # specified, a random temporary directory is created.
      'root_dir',
      # Kills the process if it lasts more than this amount of seconds.
      'hard_timeout',
      # Number of seconds to wait between SIGTERM and SIGKILL.
      'grace_period',
      # Path to a file with bot state, used in place of ${SWARMING_BOT_FILE}
      # task command line argument.
      'bot_file',
      # Logical account to switch LUCI_CONTEXT into.
      'switch_to_account',
      # Context manager dir => CipdInfo, see install_client_and_packages.
      'install_packages_fn',
      # Create tree with symlinks instead of hardlinks.
      'use_symlinks',
      # Environment variables to set.
      'env',
      # Environment variables to mutate with relative directories.
      # Example: {"ENV_KEY": ['relative', 'paths', 'to', 'prepend']}
      'env_prefix'])
202
203
Marc-Antoine Ruelee6ca622017-11-29 11:19:16 -0500204def _to_str(s):
205 """Downgrades a unicode instance to str. Pass str through as-is."""
206 if isinstance(s, str):
207 return s
208 # This is technically incorrect, especially on Windows. In theory
209 # sys.getfilesystemencoding() should be used to use the right 'ANSI code
210 # page' on Windows, but that causes other problems, as the character set
211 # is very limited.
212 return s.encode('utf-8')
213
214
Marc-Antoine Ruel7a68f712017-12-01 18:45:18 -0500215def _to_unicode(s):
216 """Upgrades a str instance to unicode. Pass unicode through as-is."""
217 if isinstance(s, unicode) or s is None:
218 return s
219 return s.decode('utf-8')
220
221
def make_temp_dir(prefix, root_dir):
  """Creates a new unique temporary directory and returns its path as unicode.

  Arguments:
  - prefix: prefix of the directory name to create.
  - root_dir: directory to create the new directory into; passed as |dir| to
    tempfile.mkdtemp().
  """
  created = tempfile.mkdtemp(prefix=prefix, dir=root_dir)
  return unicode(created)
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +0000225
226
def change_tree_read_only(rootdir, read_only):
  """Applies the |read_only| policy to the whole tree rooted at |rootdir|.

  Arguments:
  - rootdir: root of the tree to modify.
  - read_only: 0 or None (everything writeable), 1 (files read only) or
    2 (files and directories read only).

  Raises:
    ValueError if |read_only| is not one of the values above.
  """
  if read_only == 2:
    # Files and directories (except on Windows) are marked read only. This
    # inhibits modifying, creating or deleting files in the test directory,
    # except on Windows where creating and deleting files is still possible.
    file_path.make_tree_read_only(rootdir)
    return

  if read_only == 1:
    # Files are marked read only but not the directories. This inhibits
    # modifying files but creating or deleting files is still possible.
    file_path.make_tree_files_read_only(rootdir)
    return

  if read_only not in (0, None):
    raise ValueError(
        'change_tree_read_only(%s, %s): Unknown flag %s' %
        (rootdir, read_only, read_only))

  # Anything can be modified.
  # TODO(maruel): This is currently dangerous as long as
  # DiskContentAddressedCache.touch() is not yet changed to verify the hash of
  # the content of the files it is looking at, so that if a test modifies an
  # input file, the file must be deleted.
  file_path.make_tree_writeable(rootdir)
253
254
@contextlib.contextmanager
def set_luci_context_account(account, tmp_dir):
  """Context manager that makes |account| the default LUCI_CONTEXT account.

  Nothing is changed in any of these cases:
  - |account| is None or ''. This happens when run_isolated.py is called
    without '--switch-to-account' flag; if run_isolated.py is running in some
    LUCI_CONTEXT environment, the task just inherits whatever account is
    already set. This may happen if users invoke run_isolated.py explicitly
    from their code.
  - LUCI_CONTEXT-based auth is not in use (no 'local_auth' section).
  - |account| is already the default account.

  If the requested account is not defined in the context, switches to
  non-authenticated access. This happens for Swarming tasks that don't use
  'task' service accounts.

  Arguments:
  - account: logical account name to switch to.
  - tmp_dir: directory handed to luci_context.write() as |_tmpdir|.
  """
  # 'local_auth' is only read when a switch was actually requested.
  local_auth = luci_context.read('local_auth') if account else None

  # See LUCI_CONTEXT.md for the format of 'local_auth'.
  if not local_auth or local_auth.get('default_account_id') == account:
    # Not switching, not using LUCI_CONTEXT auth at all, or already set.
    yield
    return

  known_ids = {a['id'] for a in local_auth.get('accounts') or []}
  if account not in known_ids:
    logging.warning(
        'Requested LUCI_CONTEXT account %r is not available (have only %r), '
        'disabling authentication', account, sorted(known_ids))
    local_auth.pop('default_account_id', None)
  else:
    logging.info('Switching default LUCI_CONTEXT account to %r', account)
    local_auth['default_account_id'] = account

  with luci_context.write(_tmpdir=tmp_dir, local_auth=local_auth):
    yield
300 yield
301
302
def process_command(command, out_dir, bot_file):
  """Returns a copy of |command| with parameters replaced in each argument.

  Each argument is processed independently by replace_parameters().

  Raises:
    ValueError if a parameter is requested in |command| but its value is not
    provided.
  """
  processed = []
  for token in command:
    processed.append(replace_parameters(token, out_dir, bot_file))
  return processed
311
312
def replace_parameters(arg, out_dir, bot_file):
  """Substitutes the magic parameter tokens found in the string |arg|.

  Arguments:
  - arg: string to process.
  - out_dir: value for ISOLATED_OUTDIR_PARAMETER.
  - bot_file: value for SWARMING_BOT_FILE_PARAMETER; when not set, the token
    is left as-is and a warning is logged.

  Raises:
    ValueError if ISOLATED_OUTDIR_PARAMETER is requested in |arg| but
    |out_dir| is not provided.
  """
  arg = arg.replace(EXECUTABLE_SUFFIX_PARAMETER, cipd.EXECUTABLE_SUFFIX)
  substituted_path = False

  if ISOLATED_OUTDIR_PARAMETER in arg:
    if not out_dir:
      raise ValueError(
          'output directory is requested in command or env var, but not '
          'provided; please specify one')
    arg = arg.replace(ISOLATED_OUTDIR_PARAMETER, out_dir)
    substituted_path = True

  if SWARMING_BOT_FILE_PARAMETER in arg:
    if not bot_file:
      logging.warning('SWARMING_BOT_FILE_PARAMETER found in command or env '
                      'var, but no bot_file specified. Leaving parameter '
                      'unchanged.')
    else:
      arg = arg.replace(SWARMING_BOT_FILE_PARAMETER, bot_file)
      substituted_path = True

  # Replace slashes only if parameters are present
  # because of arguments like '${ISOLATED_OUTDIR}/foo/bar'
  return arg.replace('/', os.sep) if substituted_path else arg
maruela9cfd6f2015-09-15 11:03:15 -0700342
343
Roberto Carrillo71ade6d2018-10-08 22:30:24 +0000344
def get_command_env(tmp_dir, cipd_info, run_dir, env, env_prefixes, out_dir,
                    bot_file):
  """Returns full OS environment to run a command in.

  Starts from a copy of os.environ, applies |env|, puts directory with cipd
  binary in front of PATH, exposes CIPD_CACHE_DIR env var, installs all
  env_prefixes and points the temporary directory variables to |tmp_dir|.

  Args:
    tmp_dir: temp directory.
    cipd_info: CipdInfo object if cipd client is used, None if not.
    run_dir: The root directory the isolated tree is mapped in.
    env: environment variables to use. A variable with an empty value is
        removed from the resulting environment.
    env_prefixes: {"ENV_KEY": ['relative', 'paths', 'to', 'prepend']}; the
        paths are relative to |run_dir|.
    out_dir: Isolated output directory. Required to be != None if any of the
        env vars contain ISOLATED_OUTDIR_PARAMETER.
    bot_file: Value for SWARMING_BOT_FILE_PARAMETER found in the env vars. If
        not set, the parameter is left unchanged (replace_parameters() logs a
        warning).

  Raises:
    ValueError if an env var requests ISOLATED_OUTDIR_PARAMETER but |out_dir|
    is not provided.
  """
  out = os.environ.copy()
  for k, v in env.iteritems():
    if not v:
      out.pop(k, None)
    else:
      out[k] = replace_parameters(v, out_dir, bot_file)

  if cipd_info:
    bin_dir = _to_str(os.path.dirname(cipd_info.client.binary_path))
    # PATH may legitimately be absent here: either it was not inherited or it
    # was removed just above via an empty value in |env|. Handle it the same
    # way as env_prefixes below instead of raising KeyError.
    cur_path = out.get('PATH')
    if cur_path:
      out['PATH'] = '%s%s%s' % (bin_dir, os.pathsep, cur_path)
    else:
      out['PATH'] = bin_dir
    out['CIPD_CACHE_DIR'] = _to_str(cipd_info.cache_dir)

  for key, paths in env_prefixes.iteritems():
    assert isinstance(paths, list), paths
    paths = [os.path.normpath(os.path.join(run_dir, p)) for p in paths]
    cur = out.get(key)
    if cur:
      # Prefixes go first; the pre-existing value is kept at the end.
      paths.append(cur)
    out[key] = _to_str(os.pathsep.join(paths))

  tmp_dir = _to_str(tmp_dir)
  # pylint: disable=line-too-long
  # * python respects $TMPDIR, $TEMP, and $TMP in this order, regardless of
  #   platform. So $TMPDIR must be set on all platforms.
  #   https://github.com/python/cpython/blob/2.7/Lib/tempfile.py#L155
  out['TMPDIR'] = tmp_dir
  if sys.platform == 'win32':
    # * chromium's base utils uses GetTempPath().
    #   https://cs.chromium.org/chromium/src/base/files/file_util_win.cc?q=GetTempPath
    # * Go uses GetTempPath().
    # * GetTempDir() uses %TMP%, then %TEMP%, then other stuff. So %TMP% must be
    #   set.
    #   https://docs.microsoft.com/en-us/windows/desktop/api/fileapi/nf-fileapi-gettemppathw
    out['TMP'] = tmp_dir
    # https://blogs.msdn.microsoft.com/oldnewthing/20150417-00/?p=44213
    out['TEMP'] = tmp_dir
  elif sys.platform == 'darwin':
    # * Chromium uses an hack on macOS before calling into
    #   NSTemporaryDirectory().
    #   https://cs.chromium.org/chromium/src/base/files/file_util_mac.mm?q=GetTempDir
    #   https://developer.apple.com/documentation/foundation/1409211-nstemporarydirectory
    out['MAC_CHROMIUM_TMPDIR'] = tmp_dir
  else:
    # TMPDIR is specified as the POSIX standard envvar for the temp directory.
    #   http://pubs.opengroup.org/onlinepubs/9699919799/basedefs/V1_chap08.html
    # * mktemp on linux respects $TMPDIR.
    # * Chromium respects $TMPDIR on linux.
    #   https://cs.chromium.org/chromium/src/base/files/file_util_posix.cc?q=GetTempDir
    # * Go uses $TMPDIR.
    #   https://go.googlesource.com/go/+/go1.10.3/src/os/file_unix.go#307
    pass
  return out
vadimsh232f5a82017-01-20 19:23:44 -0800415
416
def run_command(command, cwd, env, hard_timeout, grace_period):
  """Runs the command and waits for it, enforcing the timeouts.

  The child is started detached. If it is still running after |hard_timeout|
  seconds, or if a stop signal is received while waiting, it is terminated,
  given |grace_period| seconds to exit, then killed.

  Arguments:
  - command: command line to run, as passed to subprocess42.Popen().
  - cwd: directory to start the command in.
  - env: environment variables for the child process.
  - hard_timeout: number of seconds before terminating the process; a falsy
    value means waiting without timeout.
  - grace_period: number of seconds to wait between terminate() and kill(); a
    falsy value means waiting without timeout.

  Returns:
    tuple(process exit code, bool if had a hard timeout)
  """
  logging.info('run_command(%s, %s)' % (command, cwd))

  exit_code = None
  had_hard_timeout = False
  with tools.Profiler('RunTest'):
    proc = None
    # A list so that handler() can record the signal without rebinding a name
    # of the enclosing scope.
    had_signal = []
    try:
      # TODO(maruel): This code is imperfect. It doesn't handle well signals
      # during the download phase and there are short windows where things can
      # go wrong.
      def handler(signum, _frame):
        # Only the first signal received once the process exists is acted
        # upon; it interrupts proc.wait() below the same way a timeout does.
        if proc and not had_signal:
          logging.info('Received signal %d', signum)
          had_signal.append(True)
          raise subprocess42.TimeoutExpired(command, None)

      proc = subprocess42.Popen(
          command, cwd=cwd, env=env, detached=True, close_fds=True)
      with subprocess42.set_signal_handler(subprocess42.STOP_SIGNALS, handler):
        try:
          exit_code = proc.wait(hard_timeout or None)
        except subprocess42.TimeoutExpired:
          # Either a real timeout or the exception raised by handler().
          if not had_signal:
            logging.warning('Hard timeout')
            had_hard_timeout = True
          logging.warning('Sending SIGTERM')
          proc.terminate()

      # Ignore signals in grace period. Forcibly give the grace period to the
      # child process.
      if exit_code is None:
        ignore = lambda *_: None
        with subprocess42.set_signal_handler(subprocess42.STOP_SIGNALS, ignore):
          try:
            exit_code = proc.wait(grace_period or None)
          except subprocess42.TimeoutExpired:
            # Now kill for real. The user can distinguish between the
            # following states:
            # - signal but process exited within grace period,
            #   hard_timed_out will be set but the process exit code will be
            #   script provided.
            # - processed exited late, exit code will be -9 on posix.
            logging.warning('Grace exhausted; sending SIGKILL')
            proc.kill()
        logging.info('Waiting for process exit')
        exit_code = proc.wait()
    except OSError:
      # This is not considered to be an internal error. The executable simply
      # does not exist.
      sys.stderr.write(
          '<The executable does not exist or a dependent library is missing>\n'
          '<Check for missing .so/.dll in the .isolate or GN file>\n'
          '<Command: %s>\n' % command)
      if os.environ.get('SWARMING_TASK_ID'):
        # Give an additional hint when running as a swarming task.
        sys.stderr.write(
            '<See the task\'s page for commands to help diagnose this issue '
            'by reproducing the task locally>\n')
      exit_code = 1
  # The mask prints negative exit codes as their unsigned 32 bits hex value.
  logging.info(
      'Command finished with exit code %d (%s)',
      exit_code, hex(0xffffffff & exit_code))
  return exit_code, had_hard_timeout
maruela9cfd6f2015-09-15 11:03:15 -0700487
488
def fetch_and_map(isolated_hash, storage, cache, outdir, use_symlinks):
  """Fetches an isolated tree into |outdir| and returns (bundle, stats).

  All the arguments are forwarded as-is to isolateserver.fetch_isolated().

  Returns:
    tuple(bundle, stats)
    - bundle: what isolateserver.fetch_isolated() returned.
    - stats: dict with the 'duration' of the fetch in seconds and the packed,
      base64 encoded 'items_cold' (cache.added) and 'items_hot' (cache.used
      minus cache.added).
  """
  began = time.time()
  bundle = isolateserver.fetch_isolated(
      isolated_hash=isolated_hash,
      storage=storage,
      cache=cache,
      outdir=outdir,
      use_symlinks=use_symlinks)
  elapsed = time.time() - began

  cold = sorted(cache.added)
  hot = sorted(set(cache.used) - set(cache.added))
  stats = {
    'duration': elapsed,
    'items_cold': base64.b64encode(large.pack(cold)),
    'items_hot': base64.b64encode(large.pack(hot)),
  }
  return bundle, stats
504
505
def link_outputs_to_outdir(run_dir, out_dir, outputs):
  """Copies or links every named output into out_dir so it can be uploaded.

  Arguments:
  - run_dir: directory the entries of |outputs| are relative to.
  - out_dir: directory to recreate the outputs into.
  - outputs: list of relative paths; nothing is done when it is empty or None.
  """
  if outputs:
    isolateserver.create_directories(out_dir, outputs)
    for rel_path in outputs:
      origin = os.path.join(run_dir, rel_path)
      target = os.path.join(out_dir, rel_path)
      copy_recursively(origin, target)
Sadaf Matinkhoo10743a62018-03-29 16:28:58 -0400515 copy_recursively(os.path.join(run_dir, o), os.path.join(out_dir, o))
516
517
518def copy_recursively(src, dst):
519 """Efficiently copies a file or directory from src_dir to dst_dir.
520
521 `item` may be a file, directory, or a symlink to a file or directory.
522 All symlinks are replaced with their targets, so the resulting
523 directory structure in dst_dir will never have any symlinks.
524
525 To increase speed, copy_recursively hardlinks individual files into the
526 (newly created) directory structure if possible, unlike Python's
527 shutil.copytree().
528 """
529 orig_src = src
530 try:
531 # Replace symlinks with their final target.
532 while fs.islink(src):
533 res = fs.readlink(src)
534 src = os.path.join(os.path.dirname(src), res)
535 # TODO(sadafm): Explicitly handle cyclic symlinks.
536
537 # Note that fs.isfile (which is a wrapper around os.path.isfile) throws
538 # an exception if src does not exist. A warning will be logged in that case.
539 if fs.isfile(src):
540 file_path.link_file(dst, src, file_path.HARDLINK_WITH_FALLBACK)
541 return
542
543 if not fs.exists(dst):
544 os.makedirs(dst)
545
546 for child in fs.listdir(src):
547 copy_recursively(os.path.join(src, child), os.path.join(dst, child))
548
549 except OSError as e:
550 if e.errno == errno.ENOENT:
551 logging.warning('Path %s does not exist or %s is a broken symlink',
552 src, orig_src)
553 else:
554 logging.info("Couldn't collect output file %s: %s", src, e)
aludwin0a8e17d2016-10-27 15:57:39 -0700555
556
def delete_and_upload(storage, out_dir, leak_temp_dir):
  """Archives the content of out_dir to |storage|, then deletes out_dir.

  Arguments:
  - storage: object used to archive the files and to fill outputs_ref with its
    server_ref url and namespace.
  - out_dir: directory holding the task outputs.
  - leak_temp_dir: if True, out_dir is not deleted.

  Returns:
    tuple(outputs_ref, success, stats)
    - outputs_ref: a dict referring to the results archived back to the isolated
      server, if applicable.
    - success: False if something occurred that means that the task must
      forcibly be considered a failure, e.g. zombie processes were left
      behind.
    - stats: uploading stats.

  Raises:
    isolateserver.Aborted if the upload was interrupted.
  """
  outputs_ref = None
  cold_sizes = []
  hot_sizes = []
  began = time.time()

  # Upload out_dir and generate a .isolated file out of this directory. It is
  # only done if files were written in the directory.
  has_outputs = fs.isdir(out_dir) and fs.listdir(out_dir)
  if has_outputs:
    with tools.Profiler('ArchiveOutput'):
      try:
        results, f_cold, f_hot = isolateserver.archive_files_to_storage(
            storage, [out_dir], None)
        outputs_ref = {
          'isolated': results.values()[0],
          'isolatedserver': storage.server_ref.url,
          'namespace': storage.server_ref.namespace,
        }
        cold_sizes = sorted(item.size for item in f_cold)
        hot_sizes = sorted(item.size for item in f_hot)
      except isolateserver.Aborted:
        # This happens when a signal SIGTERM was received while uploading data.
        # There is 2 causes:
        # - The task was too slow and was about to be killed anyway due to
        #   exceeding the hard timeout.
        # - The amount of data uploaded back is very large and took too much
        #   time to archive.
        sys.stderr.write('Received SIGTERM while uploading')
        # Re-raise, so it will be treated as an internal failure.
        raise

  success = False
  try:
    must_delete = not leak_temp_dir and fs.isdir(out_dir)
    if must_delete and not file_path.rmtree(out_dir):
      logging.error('Had difficulties removing out_dir %s', out_dir)
    else:
      success = True
  except OSError as e:
    # When this happens, it means there's a process error.
    logging.exception('Had difficulties removing out_dir %s: %s', out_dir, e)

  elapsed = time.time() - began
  stats = {
    'duration': elapsed,
    'items_cold': base64.b64encode(large.pack(cold_sizes)),
    'items_hot': base64.b64encode(large.pack(hot_sizes)),
  }
  return outputs_ref, success, stats
maruela9cfd6f2015-09-15 11:03:15 -0700615
616
def map_and_run(data, constant_run_path):
  """Runs a command with optional isolated input/output.

  Sets up the run, output and temp directories, installs CIPD packages, maps
  the isolated tree (if any), installs named caches, runs the command, then
  tears everything down and uploads the outputs.

  Arguments:
  - data: TaskData instance.
  - constant_run_path: if true and a root directory is known, the run directory
        is created at the fixed location <root_dir>/ISOLATED_RUN_DIR (any
        leftover directory there is deleted first); otherwise a fresh temporary
        run directory is created.

  Returns metadata about the result, as a dict with the keys 'duration',
  'exit_code', 'had_hard_timeout', 'internal_failure', 'stats', 'outputs_ref',
  'version' and, when CIPD was used, 'cipd_pins'.
  """
  result = {
    'duration': None,
    'exit_code': None,
    'had_hard_timeout': False,
    # Pessimistic default; it is reset to None once the run is known not to be
    # an internal failure.
    'internal_failure': 'run_isolated did not complete properly',
    'stats': {
      'isolated': {
        #'cipd': {
        #  'duration': 0.,
        #  'get_client_duration': 0.,
        #},
        'download': {
          #'duration': 0.,
          'initial_number_items': len(data.isolate_cache),
          'initial_size': data.isolate_cache.total_size,
          #'items_cold': '<large.pack()>',
          #'items_hot': '<large.pack()>',
        },
        #'upload': {
        #  'duration': 0.,
        #  'items_cold': '<large.pack()>',
        #  'items_hot': '<large.pack()>',
        #},
      },
    },
    #'cipd_pins': {
    #  'packages': [
    #    {'package_name': ..., 'version': ..., 'path': ...},
    #    ...
    #  ],
    #  'client_package': {'package_name': ..., 'version': ...},
    #},
    'outputs_ref': None,
    'version': 5,
  }

  if data.root_dir:
    file_path.ensure_tree(data.root_dir, 0o700)
  elif data.isolate_cache.cache_dir:
    data = data._replace(
        root_dir=os.path.dirname(data.isolate_cache.cache_dir))
  # See comment for these constants.
  # If root_dir is not specified, it is not constant.
  # TODO(maruel): This is not obvious. Change this to become an error once we
  # make the constant_run_path an exposed flag.
  if constant_run_path and data.root_dir:
    run_dir = os.path.join(data.root_dir, ISOLATED_RUN_DIR)
    if os.path.isdir(run_dir):
      file_path.rmtree(run_dir)
    os.mkdir(run_dir, 0o700)
  else:
    run_dir = make_temp_dir(ISOLATED_RUN_DIR, data.root_dir)
  # storage should be normally set but don't crash if it is not. This can happen
  # as Swarming task can run without an isolate server.
  out_dir = make_temp_dir(
      ISOLATED_OUT_DIR, data.root_dir) if data.storage else None
  tmp_dir = make_temp_dir(ISOLATED_TMP_DIR, data.root_dir)
  cwd = run_dir
  if data.relative_cwd:
    cwd = os.path.normpath(os.path.join(cwd, data.relative_cwd))
  command = data.command
  try:
    with data.install_packages_fn(run_dir) as cipd_info:
      if cipd_info:
        result['stats']['cipd'] = cipd_info.stats
        result['cipd_pins'] = cipd_info.pins

      if data.isolated_hash:
        isolated_stats = result['stats'].setdefault('isolated', {})
        bundle, stats = fetch_and_map(
            isolated_hash=data.isolated_hash,
            storage=data.storage,
            cache=data.isolate_cache,
            outdir=run_dir,
            use_symlinks=data.use_symlinks)
        isolated_stats['download'].update(stats)
        change_tree_read_only(run_dir, bundle.read_only)
        # Inject the command
        if not command and bundle.command:
          command = bundle.command + data.extra_args
          # Only set the relative directory if the isolated file specified a
          # command, and no raw command was specified.
          if bundle.relative_cwd:
            cwd = os.path.normpath(os.path.join(cwd, bundle.relative_cwd))

      if not command:
        # Handle this as a task failure, not an internal failure.
        sys.stderr.write(
            '<No command was specified!>\n'
            '<Please specify a command when triggering your Swarming task>\n')
        result['exit_code'] = 1
        # Clear the pessimistic default, otherwise this is still reported as
        # an internal failure.
        result['internal_failure'] = None
        return result

      # Compare whole path components: a plain startswith(run_dir) would also
      # accept a sibling directory such as '<run_dir>2'.
      norm_run_dir = os.path.normpath(run_dir)
      norm_cwd = os.path.normpath(cwd)
      if (norm_cwd != norm_run_dir and
          not norm_cwd.startswith(os.path.join(norm_run_dir, ''))):
        # Handle this as a task failure, not an internal failure. This is a
        # 'last chance' way to gate against directory escape.
        sys.stderr.write('<Relative CWD is outside of run directory!>\n')
        result['exit_code'] = 1
        result['internal_failure'] = None
        return result

      if not os.path.isdir(cwd):
        # Accepts relative_cwd that does not exist.
        os.makedirs(cwd, 0o700)

      # If we have an explicit list of files to return, make sure their
      # directories exist now.
      if data.storage and data.outputs:
        isolateserver.create_directories(run_dir, data.outputs)

      with data.install_named_caches(run_dir):
        sys.stdout.flush()
        start = time.time()
        try:
          # Need to switch the default account before 'get_command_env' call,
          # so it can grab correct value of LUCI_CONTEXT env var.
          with set_luci_context_account(data.switch_to_account, tmp_dir):
            env = get_command_env(
                tmp_dir, cipd_info, run_dir, data.env, data.env_prefix, out_dir,
                data.bot_file)
            command = tools.fix_python_cmd(command, env)
            command = process_command(command, out_dir, data.bot_file)
            file_path.ensure_command_has_abs_path(command, cwd)

            result['exit_code'], result['had_hard_timeout'] = run_command(
                command, cwd, env, data.hard_timeout, data.grace_period)
        finally:
          # Recorded even when the command could not be started.
          result['duration'] = max(time.time() - start, 0)

    # We successfully ran the command, set internal_failure back to
    # None (even if the command failed, it's not an internal error).
    result['internal_failure'] = None
  except Exception as e:
    # An internal error occurred. Report accordingly so the swarming task will
    # be retried automatically.
    logging.exception('internal failure: %s', e)
    result['internal_failure'] = str(e)
    on_error.report(None)

  # Clean up
  finally:
    try:
      # Try to link files to the output directory, if specified.
      if out_dir:
        link_outputs_to_outdir(run_dir, out_dir, data.outputs)

      success = False
      if data.leak_temp_dir:
        success = True
        logging.warning(
            'Deliberately leaking %s for later examination', run_dir)
      else:
        # On Windows the rmtree(run_dir) call below has a synchronization
        # effect: it finishes only when all task child processes terminate
        # (since a running process locks *.exe file). Examine out_dir only
        # after that call completes (since child processes may write to
        # out_dir too and we need to wait for them to finish).
        if fs.isdir(run_dir):
          try:
            success = file_path.rmtree(run_dir)
          except OSError as e:
            logging.error('rmtree(%r) failed: %s', run_dir, e)
            success = False
          if not success:
            sys.stderr.write(OUTLIVING_ZOMBIE_MSG % ('run', data.grace_period))
            if result['exit_code'] == 0:
              result['exit_code'] = 1
        if fs.isdir(tmp_dir):
          try:
            success = file_path.rmtree(tmp_dir)
          except OSError as e:
            logging.error('rmtree(%r) failed: %s', tmp_dir, e)
            success = False
          if not success:
            sys.stderr.write(OUTLIVING_ZOMBIE_MSG % ('temp', data.grace_period))
            if result['exit_code'] == 0:
              result['exit_code'] = 1

      # This deletes out_dir if leak_temp_dir is not set.
      if out_dir:
        isolated_stats = result['stats'].setdefault('isolated', {})
        result['outputs_ref'], success, isolated_stats['upload'] = (
            delete_and_upload(data.storage, out_dir, data.leak_temp_dir))
      if not success and result['exit_code'] == 0:
        result['exit_code'] = 1
    except Exception as e:
      # Swallow any exception in the main finally clause.
      if out_dir:
        logging.exception('Leaking out_dir %s: %s', out_dir, e)
      result['internal_failure'] = str(e)
  return result
Marc-Antoine Ruel2283ad12014-02-09 11:14:57 -0500816
817
def run_tha_test(data, result_json):
  """Runs the task described by |data| and reports how it went.

  The heavy lifting is delegated to map_and_run(), which is always called with
  a constant run path. This function only deals with reporting: either through
  a JSON file or through the legacy inline marker printed on stdout.

  Arguments:
  - data: TaskData instance.
  - result_json: File path to dump result metadata into. If set, the process
        exit code is always 0 unless an internal error occurred.

  Returns:
    Process exit code that should be used.
  """
  if result_json:
    # Leave a placeholder on disk immediately, so that something is there to
    # read if this process gets killed half way through.
    tools.write_json(
        result_json,
        {
          'exit_code': None,
          'had_hard_timeout': False,
          'internal_failure': 'Was terminated before completion',
          'outputs_ref': None,
          'version': 5,
        },
        dense=True)

  result = map_and_run(data, True)
  logging.info('Result:\n%s', tools.format_json(result, dense=True))

  # 1 when an internal failure was recorded, 0 otherwise.
  internal_error_code = 1 if result['internal_failure'] else 0

  if result_json:
    # Some tasks delete the 'work' directory when quitting, which would make
    # the write below fail; recreate the parent directory if necessary.
    file_path.ensure_tree(os.path.dirname(result_json))
    tools.write_json(result_json, result, dense=True)
    # With a JSON file, only internal errors are signaled via the exit code.
    return internal_error_code

  # No JSON file: marshall the outputs reference into the old-style inline
  # output.
  outputs_ref = result['outputs_ref']
  if outputs_ref:
    inline = {
      'hash': outputs_ref['isolated'],
      'namespace': outputs_ref['namespace'],
      'storage': outputs_ref['isolatedserver'],
    }
    sys.stdout.flush()
    print(
        '[run_isolated_out_hack]%s[/run_isolated_out_hack]' %
        tools.format_json(inline, dense=True))
    sys.stdout.flush()
  return result['exit_code'] or internal_error_code
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +0000873
874
# Value yielded by the 'install_client_and_packages' context manager.
CipdInfo = collections.namedtuple(
    'CipdInfo',
    (
      # cipd.CipdClient object.
      'client',
      # Absolute path to bot-global cipd tag and instance cache.
      'cache_dir',
      # Dict with stats to return to the server.
      'stats',
      # Dict with installed cipd pins to return to the server.
      'pins',
    ))
882
883
@contextlib.contextmanager
def noop_install_packages(_run_dir):
  """Stand-in for 'install_client_and_packages' when cipd is disabled.

  Installs nothing and yields None in place of a CipdInfo.
  """
  # The run directory is deliberately ignored: there is nothing to install.
  yield None
888
889
def _install_packages(run_dir, cipd_cache_dir, client, packages, timeout):
  """Installs |packages| via 'cipd ensure' and reports what got pinned.

  Args:
    run_dir (str): root of installation.
    cipd_cache_dir (str): the directory to use for the cipd package cache.
    client (CipdClient): the cipd client to use
    packages: packages to install, list [(path, package_name, version), ...].
    timeout: max duration in seconds that this function can take.

  Returns: list of pinned packages, in the same order as |packages|. Looks
  like [
    {
      'path': 'subdirectory',
      'package_name': 'resolved/package/name',
      'version': 'deadbeef...',
    },
    ...
  ]
  """
  # Group the requests per install subdirectory, remembering the position of
  # each one in |packages| so the resulting pins can be reported in that order.
  requested = collections.defaultdict(list)
  for index, (path, name, version) in enumerate(packages):
    # cipd deals with 'root' as ''
    subdir = '' if path == '.' else path
    requested[subdir].append((name, version, index))

  ensure_spec = {}
  for subdir, pkgs in requested.items():
    ensure_spec[subdir] = [(name, vers) for name, vers, _ in pkgs]

  pins = client.ensure(
      run_dir, ensure_spec, cache_dir=cipd_cache_dir, timeout=timeout)

  package_pins = [None] * len(packages)
  for subdir, pin_list in sorted(pins.items()):
    wanted = requested[subdir]
    # The n-th pin of a subdirectory is matched with the n-th package that was
    # requested for it.
    for position, (name, version) in enumerate(pin_list):
      package_pins[wanted[position][2]] = {
        'package_name': name,
        # swarming deals with 'root' as '.'
        'path': subdir or '.',
        'version': version,
      }

  assert None not in package_pins, (packages, pins, package_pins)

  return package_pins
943
944
@contextlib.contextmanager
def install_client_and_packages(
    run_dir, packages, service_url, client_package_name,
    client_version, cache_dir, timeout=None):
  """Bootstraps the CIPD client, then installs the requested CIPD packages.

  Yields a single CipdInfo object holding the CipdClient, the cipd cache
  directory, the stats and the pins.

  Pins and the CIPD client info are in the form of:
    [
      {
        "path": path, "package_name": package_name, "version": version,
      },
      ...
    ]
  (the CIPD client info is a single dictionary instead of a list)

  such that they correspond 1:1 to all input package arguments from the command
  line. These dictionaries make their way all the way back to swarming, where
  they become the arguments of CipdPackage.

  If 'packages' list is empty, will bootstrap CIPD client, but won't install
  any packages.

  The bootstrapped client (regardless whether 'packages' list is empty or not),
  will be made available to the task via $PATH.

  Args:
    run_dir (str): root of installation.
    packages: packages to install, list [(path, package_name, version), ...].
    service_url (str): CIPD server url, e.g.
        "https://chrome-infra-packages.appspot.com."
    client_package_name (str): CIPD package name of CIPD client.
    client_version (str): Version of CIPD client.
    cache_dir (str): where to keep cache of cipd clients, packages and tags.
    timeout: max duration in seconds that this function can take.
  """
  assert cache_dir

  # The time budget is shared between fetching the client and installing the
  # packages.
  remaining = tools.sliding_timeout(timeout)
  began = time.time()

  cache_dir = os.path.abspath(cache_dir)
  # Tag and instance caches.
  cipd_cache_dir = os.path.join(cache_dir, 'cache')
  run_dir = os.path.abspath(run_dir)
  if not packages:
    packages = []

  client_began = time.time()
  with cipd.get_client(
      service_url, client_package_name, client_version, cache_dir,
      timeout=remaining()) as client:
    get_client_duration = time.time() - client_began

    if packages:
      package_pins = _install_packages(
          run_dir, cipd_cache_dir, client, packages, remaining())
    else:
      package_pins = []

    file_path.make_tree_files_read_only(run_dir)

    total_duration = time.time() - began
    logging.info(
        'Installing CIPD client and packages took %d seconds', total_duration)

    stats = {
      'duration': total_duration,
      'get_client_duration': get_client_duration,
    }
    pins = {
      'client_package': {
        'package_name': client.package_name,
        'version': client.instance_id,
      },
      'packages': package_pins,
    }
    yield CipdInfo(
        client=client, cache_dir=cipd_cache_dir, stats=stats, pins=pins)
nodirbe642ff2016-06-09 15:51:51 -07001025
1026
def create_option_parser():
  """Returns the option parser describing every run_isolated flag.

  The parser logs to RUN_ISOLATED_LOG_FILE. On top of the options declared
  here, the isolate server, cache, CIPD and authentication options are added by
  their respective modules. Defaults: --cache is 'cache' and --cipd-cache is
  'cipd_cache'.
  """
  parser = logging_utils.OptionParserWithLogging(
      usage='%prog <options> [command to run or extra args]',
      version=__version__,
      log_file=RUN_ISOLATED_LOG_FILE)
  parser.add_option(
      '--clean', action='store_true',
      help='Cleans the cache, trimming it if necessary and removing corrupted '
           'items, and returns without executing anything; use with -v to '
           'know what was done')
  parser.add_option(
      '--use-symlinks', action='store_true',
      help='Use symlinks instead of hardlinks')
  parser.add_option(
      '--json',
      help='dump output metadata to json file. When used, run_isolated returns '
           'non-zero only on internal failure')
  parser.add_option(
      '--hard-timeout', type='float', help='Enforce hard timeout in execution')
  parser.add_option(
      '--grace-period', type='float',
      help='Grace period between SIGTERM and SIGKILL')
  parser.add_option(
      '--raw-cmd', action='store_true',
      help='Ignore the isolated command, use the one supplied at the command '
           'line')
  parser.add_option(
      '--relative-cwd',
      help='Ignore the isolated \'relative_cwd\' and use this one instead; '
           'requires --raw-cmd')
  parser.add_option(
      '--env', default=[], action='append',
      help='Environment variables to set for the child process')
  parser.add_option(
      '--env-prefix', default=[], action='append',
      help='Specify a VAR=./path/fragment to put in the environment variable '
           'before executing the command. The path fragment must be relative '
           'to the isolated run directory, and must not contain a `..` token. '
           'The path will be made absolute and prepended to the indicated '
           '$VAR using the OS\'s path separator. Multiple items for the same '
           '$VAR will be prepended in order.')
  parser.add_option(
      '--bot-file',
      help='Path to a file describing the state of the host. The content is '
           'defined by on_before_task() in bot_config.')
  parser.add_option(
      '--switch-to-account',
      help='If given, switches LUCI_CONTEXT to given logical service account '
           '(e.g. "task" or "system") before launching the isolated process.')
  parser.add_option(
      '--output', action='append',
      help='Specifies an output to return. If no outputs are specified, all '
           'files located in ${ISOLATED_OUTDIR} will be returned; '
           'otherwise, outputs in both ${ISOLATED_OUTDIR} and those '
           'specified by --output option (there can be multiple) will be '
           'returned. Note that if a file in ${ISOLATED_OUTDIR} has the same '
           'path as an --output option, the --output version will be '
           'returned.')
  parser.add_option(
      '-a', '--argsfile',
      # This is actually handled in parse_args; it's included here purely so it
      # can make it into the help text.
      help='Specify a file containing a JSON array of arguments to this '
           'script. If --argsfile is provided, no other argument may be '
           'provided on the command line.')

  data_group = optparse.OptionGroup(parser, 'Data source')
  data_group.add_option(
      '-s', '--isolated',
      help='Hash of the .isolated to grab from the isolate server.')
  isolateserver.add_isolate_server_options(data_group)
  parser.add_option_group(data_group)

  isolateserver.add_cache_options(parser)

  cipd.add_cipd_options(parser)

  group = optparse.OptionGroup(parser, 'Named caches')
  group.add_option(
      '--named-cache',
      dest='named_caches',
      action='append',
      nargs=3,
      default=[],
      help='A named cache to request. Accepts 3 arguments: name, path, hint. '
           'name identifies the cache, must match regex [a-z0-9_]{1,4096}. '
           'path is a path relative to the run dir where the cache directory '
           'must be put to. '
           'hint is a number, the expected size in bytes of the cache when it '
           'is not present yet; values that are not positive are ignored. '
           'This option can be specified more than once.')
  group.add_option(
      '--named-cache-root', default='named_caches',
      help='Cache root directory. Default=%default')
  parser.add_option_group(group)

  debug_group = optparse.OptionGroup(parser, 'Debugging')
  debug_group.add_option(
      '--leak-temp-dir',
      action='store_true',
      help='Deliberately leak isolate\'s temp dir for later examination. '
           'Default: %default')
  debug_group.add_option(
      '--root-dir', help='Use a directory instead of a random one')
  parser.add_option_group(debug_group)

  auth.add_auth_options(parser)

  parser.set_defaults(cache='cache', cipd_cache='cipd_cache')
  return parser
1133
1134
def process_named_cache_options(parser, options, time_fn=None):
  """Validates the named cache options and creates the named cache.

  Arguments:
  - parser: option parser; its error() method is called on invalid options.
  - options: parsed options; named_caches, named_cache_root and min_free_space
        are read.
  - time_fn: forwarded as is to local_caching.NamedCache.

  Returns:
    A local_caching.NamedCache instance rooted at --named-cache-root, or None
    when --named-cache-root is empty.
  """
  cache_root = options.named_cache_root
  if options.named_caches and not cache_root:
    parser.error('--named-cache is specified, but --named-cache-root is empty')

  for name, path, hint in options.named_caches:
    if not CACHE_NAME_RE.match(name):
      parser.error(
          'cache name %r does not match %r' % (name, CACHE_NAME_RE.pattern))
    if not path:
      parser.error('cache path cannot be empty')
    try:
      # Only checks that the hint can be converted; the value is not kept.
      long(hint)
    except ValueError:
      parser.error('cache hint must be a number')

  if not cache_root:
    return None

  # Make these configurable later if there is use case but for now it's fairly
  # safe values.
  # In practice, a fair chunk of bots are already recycled on a daily schedule
  # so this code doesn't have any effect to them, unless they are preloaded
  # with a really old cache.
  one_tib = 1024*1024*1024*1024
  policies = local_caching.CachePolicies(
      max_cache_size=one_tib,
      min_free_space=options.min_free_space,
      max_items=50,
      max_age_secs=MAX_AGE_SECS)
  return local_caching.NamedCache(
      unicode(os.path.abspath(cache_root)), policies, time_fn=time_fn)
1164
1165
def parse_args(args):
  """Parses the command line, expanding --argsfile if it is used.

  Arguments:
  - args: list of command line arguments, without the program name.

  Returns:
    Tuple (parser, options, args) where parser is the full option parser,
    options the parsed options and args the remaining positional arguments.

  Exits the process through the parser's error() when --argsfile is mixed with
  any other argument.
  """
  # Create a fake mini-parser just to get out the "-a" command. Note that
  # it's not documented here; instead, it's documented in create_option_parser
  # even though that parser will never actually get to parse it. This is
  # because --argsfile is exclusive with all other options and arguments.
  file_argparse = argparse.ArgumentParser(add_help=False)
  file_argparse.add_argument('-a', '--argsfile')
  (file_args, nonfile_args) = file_argparse.parse_known_args(args)
  if file_args.argsfile:
    if nonfile_args:
      file_argparse.error(
          'Can\'t specify --argsfile with any other arguments (%s)' %
          nonfile_args)
    try:
      with open(file_args.argsfile, 'r') as f:
        args = json.load(f)
    except (IOError, OSError, ValueError) as e:
      # We don't need to error out here - "args" still only holds the
      # --argsfile flag, so the normal parser below is left with no command
      # to run and the caller reports the problem.
      sys.stderr.write('Couldn\'t read arguments: %s\n' % e)

  # Even if we failed to read the args, just call the normal parser now since
  # it knows about every option.
  parser = create_option_parser()
  options, args = parser.parse_args(args)
  return (parser, options, args)
1192
1193
def _calc_named_cache_hint(named_cache, named_caches):
  """Returns the expected size of the missing named caches.

  Arguments:
  - named_cache: object whose 'available' attribute holds the names of the
        caches already present, or None when named caches are disabled.
  - named_caches: list of (name, path, hint) as given to --named-cache; hint is
        a number, possibly in string form.

  Returns:
    Sum of the positive hints of the requested caches that are not present; 0
    if there is none.
  """
  # process_named_cache_options() returns None when --named-cache-root is
  # empty; nothing is present in that case.
  present = named_cache.available if named_cache is not None else ()
  size = 0
  for name, _, hint in named_caches:
    if name in present:
      continue
    hint = int(hint)
    # Hints that are not positive are ignored.
    if hint > 0:
      size += hint
  return size
1204
1205
aludwin7556e0c2016-10-26 08:46:10 -07001206def main(args):
Marc-Antoine Ruelee6ca622017-11-29 11:19:16 -05001207 # Warning: when --argsfile is used, the strings are unicode instances, when
1208 # parsed normally, the strings are str instances.
aludwin7556e0c2016-10-26 08:46:10 -07001209 (parser, options, args) = parse_args(args)
maruel36a963d2016-04-08 17:15:49 -07001210
Marc-Antoine Ruel5028ba22017-08-25 17:37:51 -04001211 if not file_path.enable_symlink():
Marc-Antoine Ruel5a024272019-01-15 20:11:16 +00001212 logging.warning('Symlink support is not enabled')
Marc-Antoine Ruel5028ba22017-08-25 17:37:51 -04001213
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001214 named_cache = process_named_cache_options(parser, options)
Marc-Antoine Ruel0d8b0f62018-09-10 14:40:35 +00001215 # hint is 0 if there's no named cache.
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001216 hint = _calc_named_cache_hint(named_cache, options.named_caches)
1217 if hint:
1218 # Increase the --min-free-space value by the hint, and recreate the
1219 # NamedCache instance so it gets the updated CachePolicy.
1220 options.min_free_space += hint
1221 named_cache = process_named_cache_options(parser, options)
1222
Marc-Antoine Ruel7139d912018-06-15 20:04:42 +00001223 # TODO(maruel): CIPD caches should be defined at an higher level here too, so
1224 # they can be cleaned the same way.
nodirf33b8d62016-10-26 22:34:58 -07001225 isolate_cache = isolateserver.process_cache_options(options, trim=False)
Marc-Antoine Ruel7139d912018-06-15 20:04:42 +00001226 caches = []
1227 if isolate_cache:
1228 caches.append(isolate_cache)
1229 if named_cache:
1230 caches.append(named_cache)
1231 root = caches[0].cache_dir if caches else unicode(os.getcwd())
maruel36a963d2016-04-08 17:15:49 -07001232 if options.clean:
1233 if options.isolated:
1234 parser.error('Can\'t use --isolated with --clean.')
1235 if options.isolate_server:
1236 parser.error('Can\'t use --isolate-server with --clean.')
1237 if options.json:
1238 parser.error('Can\'t use --json with --clean.')
nodirf33b8d62016-10-26 22:34:58 -07001239 if options.named_caches:
1240 parser.error('Can\t use --named-cache with --clean.')
Marc-Antoine Ruel7139d912018-06-15 20:04:42 +00001241 # Trim first, then clean.
1242 local_caching.trim_caches(
1243 caches,
1244 root,
1245 min_free_space=options.min_free_space,
1246 max_age_secs=MAX_AGE_SECS)
1247 for c in caches:
Marc-Antoine Ruel87fc2222018-06-18 13:09:24 +00001248 c.cleanup()
maruel36a963d2016-04-08 17:15:49 -07001249 return 0
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001250
1251 # Trim must still be done for the following case:
1252 # - named-cache was used
1253 # - some entries, with a large hint, where missing
1254 # - --min-free-space was increased accordingly, thus trimming is needed
1255 # Otherwise, this will have no effect, as bot_main calls run_isolated with
1256 # --clean after each task.
1257 if hint:
1258 logging.info('Additional trimming of %d bytes', hint)
Marc-Antoine Ruel0d8b0f62018-09-10 14:40:35 +00001259 local_caching.trim_caches(
1260 caches,
1261 root,
1262 min_free_space=options.min_free_space,
1263 max_age_secs=MAX_AGE_SECS)
maruel36a963d2016-04-08 17:15:49 -07001264
nodir55be77b2016-05-03 09:39:57 -07001265 if not options.isolated and not args:
1266 parser.error('--isolated or command to run is required.')
1267
Vadim Shtayura5d1efce2014-02-04 10:55:43 -08001268 auth.process_auth_options(parser, options)
nodir55be77b2016-05-03 09:39:57 -07001269
1270 isolateserver.process_isolate_server_options(
Marc-Antoine Ruel5028ba22017-08-25 17:37:51 -04001271 parser, options, True, False)
nodir55be77b2016-05-03 09:39:57 -07001272 if not options.isolate_server:
1273 if options.isolated:
1274 parser.error('--isolated requires --isolate-server')
1275 if ISOLATED_OUTDIR_PARAMETER in args:
1276 parser.error(
1277 '%s in args requires --isolate-server' % ISOLATED_OUTDIR_PARAMETER)
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001278
nodir90bc8dc2016-06-15 13:35:21 -07001279 if options.root_dir:
1280 options.root_dir = unicode(os.path.abspath(options.root_dir))
maruel12e30012015-10-09 11:55:35 -07001281 if options.json:
1282 options.json = unicode(os.path.abspath(options.json))
nodir55be77b2016-05-03 09:39:57 -07001283
Marc-Antoine Ruel19dd8872017-11-28 18:33:39 -05001284 if any('=' not in i for i in options.env):
1285 parser.error(
1286 '--env required key=value form. value can be skipped to delete '
1287 'the variable')
Marc-Antoine Ruel7a68f712017-12-01 18:45:18 -05001288 options.env = dict(i.split('=', 1) for i in options.env)
Marc-Antoine Ruel19dd8872017-11-28 18:33:39 -05001289
1290 prefixes = {}
1291 cwd = os.path.realpath(os.getcwd())
1292 for item in options.env_prefix:
1293 if '=' not in item:
1294 parser.error(
1295 '--env-prefix %r is malformed, must be in the form `VAR=./path`'
1296 % item)
Marc-Antoine Ruel7a68f712017-12-01 18:45:18 -05001297 key, opath = item.split('=', 1)
Marc-Antoine Ruel19dd8872017-11-28 18:33:39 -05001298 if os.path.isabs(opath):
1299 parser.error('--env-prefix %r path is bad, must be relative.' % opath)
1300 opath = os.path.normpath(opath)
1301 if not os.path.realpath(os.path.join(cwd, opath)).startswith(cwd):
1302 parser.error(
1303 '--env-prefix %r path is bad, must be relative and not contain `..`.'
1304 % opath)
1305 prefixes.setdefault(key, []).append(opath)
1306 options.env_prefix = prefixes
Robert Iannuccibf5f84c2017-11-22 12:56:50 -08001307
nodirbe642ff2016-06-09 15:51:51 -07001308 cipd.validate_cipd_options(parser, options)
1309
vadimsh232f5a82017-01-20 19:23:44 -08001310 install_packages_fn = noop_install_packages
vadimsh902948e2017-01-20 15:57:32 -08001311 if options.cipd_enabled:
iannuccib58d10d2017-03-18 02:00:25 -07001312 install_packages_fn = lambda run_dir: install_client_and_packages(
vadimsh902948e2017-01-20 15:57:32 -08001313 run_dir, cipd.parse_package_args(options.cipd_packages),
1314 options.cipd_server, options.cipd_client_package,
1315 options.cipd_client_version, cache_dir=options.cipd_cache)
nodirbe642ff2016-06-09 15:51:51 -07001316
@contextlib.contextmanager
def install_named_caches(run_dir):
  """Installs the requested named caches under run_dir for a `with` block.

  On entry, every (name, relpath, _) entry of options.named_caches is
  installed at os.path.join(run_dir, relpath). On exit, the caches are
  uninstalled in the reverse order of their installation.

  WARNING: this function depends on the "options" and "named_cache" variables
  defined in the outer function.

  Args:
    run_dir: absolute path of the directory the caches are installed into.
  """
  # NOTE(review): this only checks that unicode(run_dir) is non-empty (and
  # convertible); it looks like an isinstance() check may have been intended.
  # Left as-is since callers may rely on the current leniency -- confirm.
  assert unicode(run_dir), repr(run_dir)
  assert os.path.isabs(run_dir), run_dir
  named_caches = [
    (os.path.join(run_dir, unicode(relpath)), name)
    for name, relpath, _ in options.named_caches
  ]
  for path, name in named_caches:
    named_cache.install(path, name)
  try:
    yield
  finally:
    # Uninstall each named cache, returning it to the cache pool. If an
    # uninstall fails for a given cache, it will remain in the task's
    # temporary space, get cleaned up by the Swarming bot, and be lost.
    #
    # If the Swarming bot cannot clean up the cache, it will handle it like
    # any other bot file that could not be removed.
    for path, name in reversed(named_caches):
      try:
        # uninstall() doesn't trim but does call save() implicitly. Trimming
        # *must* be done manually via periodic 'run_isolated.py --clean'.
        named_cache.uninstall(path, name)
      except local_caching.NamedCacheError:
        # The message reads "named cache <name> at <path>", so the arguments
        # must be passed in (name, path) order.
        logging.exception(
            'Error while removing named cache %r at %r. '
            'The cache will be lost.', name, path)
nodirf33b8d62016-10-26 22:34:58 -07001346
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -05001347 extra_args = []
1348 command = []
1349 if options.raw_cmd:
1350 command = args
Marc-Antoine Ruel95068cf2017-12-07 21:35:05 -05001351 if options.relative_cwd:
1352 a = os.path.normpath(os.path.abspath(options.relative_cwd))
1353 if not a.startswith(os.getcwd()):
1354 parser.error(
1355 '--relative-cwd must not try to escape the working directory')
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -05001356 else:
Marc-Antoine Ruel95068cf2017-12-07 21:35:05 -05001357 if options.relative_cwd:
1358 parser.error('--relative-cwd requires --raw-cmd')
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -05001359 extra_args = args
1360
1361 data = TaskData(
1362 command=command,
Marc-Antoine Ruel95068cf2017-12-07 21:35:05 -05001363 relative_cwd=options.relative_cwd,
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -05001364 extra_args=extra_args,
1365 isolated_hash=options.isolated,
1366 storage=None,
1367 isolate_cache=isolate_cache,
1368 outputs=options.output,
1369 install_named_caches=install_named_caches,
1370 leak_temp_dir=options.leak_temp_dir,
1371 root_dir=_to_unicode(options.root_dir),
1372 hard_timeout=options.hard_timeout,
1373 grace_period=options.grace_period,
1374 bot_file=options.bot_file,
1375 switch_to_account=options.switch_to_account,
1376 install_packages_fn=install_packages_fn,
1377 use_symlinks=options.use_symlinks,
1378 env=options.env,
1379 env_prefix=options.env_prefix)
nodirbe642ff2016-06-09 15:51:51 -07001380 try:
nodir90bc8dc2016-06-15 13:35:21 -07001381 if options.isolate_server:
Marc-Antoine Ruelb8513132018-11-20 19:48:53 +00001382 server_ref = isolate_storage.ServerRef(
nodir90bc8dc2016-06-15 13:35:21 -07001383 options.isolate_server, options.namespace)
Marc-Antoine Ruelb8513132018-11-20 19:48:53 +00001384 storage = isolateserver.get_storage(server_ref)
nodir90bc8dc2016-06-15 13:35:21 -07001385 with storage:
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -05001386 data = data._replace(storage=storage)
nodirf33b8d62016-10-26 22:34:58 -07001387 # Hashing schemes used by |storage| and |isolate_cache| MUST match.
Marc-Antoine Ruelb8513132018-11-20 19:48:53 +00001388 assert storage.server_ref.hash_algo == server_ref.hash_algo
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -05001389 return run_tha_test(data, options.json)
1390 return run_tha_test(data, options.json)
Marc-Antoine Ruel8b11dbd2018-05-18 14:31:22 -04001391 except (
1392 cipd.Error,
1393 local_caching.NamedCacheError,
Marc-Antoine Ruelb6e9e232018-11-20 00:12:33 +00001394 local_caching.NoMoreSpace) as ex:
nodirbe642ff2016-06-09 15:51:51 -07001395 print >> sys.stderr, ex.message
1396 return 1
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001397
1398
if __name__ == '__main__':
  # Script entry point: set up the process, then hand the command line
  # (minus the program name) to main() and exit with its return value.
  subprocess42.inhibit_os_error_reporting()
  # The encoding must be fixed up so we always run with the correct one.
  fix_encoding.fix_encoding()
  exit_code = main(sys.argv[1:])
  sys.exit(exit_code)