blob: 84e9d19aabb3264473974435b9b35632e1d238e4 [file] [log] [blame]
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001#!/usr/bin/env python
maruelea586f32016-04-05 11:11:33 -07002# Copyright 2012 The LUCI Authors. All rights reserved.
maruelf1f5e2a2016-05-25 17:10:39 -07003# Use of this source code is governed under the Apache License, Version 2.0
4# that can be found in the LICENSE file.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00005
nodir55be77b2016-05-03 09:39:57 -07006"""Runs a command with optional isolated input/output.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00007
run_isolated takes care of setting up a temporary environment, running a
command, and tearing it down.
nodir55be77b2016-05-03 09:39:57 -070010
Marc-Antoine Rueleed2f3a2019-03-14 00:00:40 +000011It handles downloading and uploading isolated files, mapping CIPD packages and
12reusing stateful named caches.
13
14The isolated files, CIPD packages and named caches are kept as a global LRU
15cache.
Marc-Antoine Ruel2283ad12014-02-09 11:14:57 -050016
Roberto Carrillo71ade6d2018-10-08 22:30:24 +000017Any ${EXECUTABLE_SUFFIX} on the command line or the environment variables passed
18with the --env option will be replaced with ".exe" string on Windows and "" on
19other platforms.
nodirbe642ff2016-06-09 15:51:51 -070020
Roberto Carrillo71ade6d2018-10-08 22:30:24 +000021Any ${ISOLATED_OUTDIR} on the command line or the environment variables passed
22with the --env option will be replaced by the location of a temporary directory
23upon execution of the command specified in the .isolated file. All content
24written to this directory will be uploaded upon termination and the .isolated
25file describing this directory will be printed to stdout.
bpastene447c1992016-06-20 15:21:47 -070026
Marc-Antoine Rueleed2f3a2019-03-14 00:00:40 +000027Any ${SWARMING_BOT_FILE} on the command line or the environment variables passed
28with the --env option will be replaced by the value of the --bot-file parameter.
29This file is used by a swarming bot to communicate state of the host to tasks.
30It is written to by the swarming bot's on_before_task() hook in the swarming
31server's custom bot_config.py.
32
33See
34https://chromium.googlesource.com/infra/luci/luci-py.git/+/master/appengine/swarming/doc/Magic-Values.md
35for all the variables.
36
37See
38https://chromium.googlesource.com/infra/luci/luci-py.git/+/master/appengine/swarming/swarming_bot/config/bot_config.py
39for more information about bot_config.py.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000040"""
41
Marc-Antoine Rueleed2f3a2019-03-14 00:00:40 +000042__version__ = '1.0.0'
maruel@chromium.orgdedbf492013-09-12 20:42:11 +000043
aludwin7556e0c2016-10-26 08:46:10 -070044import argparse
maruel064c0a32016-04-05 11:47:15 -070045import base64
iannucci96fcccc2016-08-30 15:52:22 -070046import collections
vadimsh232f5a82017-01-20 19:23:44 -080047import contextlib
Sadaf Matinkhoo10743a62018-03-29 16:28:58 -040048import errno
aludwin7556e0c2016-10-26 08:46:10 -070049import json
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000050import logging
51import optparse
52import os
Marc-Antoine Ruel8b11dbd2018-05-18 14:31:22 -040053import re
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000054import sys
55import tempfile
maruel064c0a32016-04-05 11:47:15 -070056import time
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000057
Marc-Antoine Ruel016c7602019-04-02 18:31:13 +000058from utils import tools
59tools.force_local_third_party()
vadimsh@chromium.orga4326472013-08-24 02:05:41 +000060
Marc-Antoine Ruel016c7602019-04-02 18:31:13 +000061# third_party/
62from depot_tools import fix_encoding
63
64# pylint: disable=ungrouped-imports
65import auth
66import cipd
67import isolate_storage
68import isolateserver
69import local_caching
70from libs import luci_context
Vadim Shtayura6b555c12014-07-23 16:22:18 -070071from utils import file_path
maruel12e30012015-10-09 11:55:35 -070072from utils import fs
maruel064c0a32016-04-05 11:47:15 -070073from utils import large
Marc-Antoine Ruelf74cffe2015-07-15 15:21:34 -040074from utils import logging_utils
Marc-Antoine Ruelcfb60852014-07-02 15:22:00 -040075from utils import on_error
Marc-Antoine Ruelc44f5722015-01-08 16:10:01 -050076from utils import subprocess42
maruel@chromium.orgdedbf492013-09-12 20:42:11 +000077
vadimsh@chromium.orga4326472013-08-24 02:05:41 +000078
# Magic variables that can be found in the isolate task command line. They are
# also recognized in the environment variables passed with the --env option.
# Each token is substituted before the command is started.
ISOLATED_OUTDIR_PARAMETER = '${ISOLATED_OUTDIR}'
EXECUTABLE_SUFFIX_PARAMETER = '${EXECUTABLE_SUFFIX}'
SWARMING_BOT_FILE_PARAMETER = '${SWARMING_BOT_FILE}'


# The name of the log file to use.
RUN_ISOLATED_LOG_FILE = 'run_isolated.log'


# The name of the log to use for the run_test_cases.py command.
RUN_TEST_CASES_LOG = 'run_test_cases.log'


# Use short names for temporary directories. This is driven by Windows, which
# imposes a relatively short maximum path length of 260 characters, often
# referred to as MAX_PATH. It is relatively easy to create files with longer
# path length. A use case is with recursive dependency trees like npm packages.
#
# It is recommended to start the script with a `root_dir` as short as
# possible.
# - ir stands for isolated_run
# - io stands for isolated_out
# - it stands for isolated_tmp
ISOLATED_RUN_DIR = u'ir'
ISOLATED_OUT_DIR = u'io'
ISOLATED_TMP_DIR = u'it'
106
107
# Keep synced with task_request.py
#
# Valid names are 1 to 4096 characters long and made only of lowercase ASCII
# letters, digits and underscores. A plain raw string is used instead of the
# Python-2-only ur'' prefix: the pattern is pure ASCII so it matches the same
# inputs, and the module stays parseable by Python 3.
CACHE_NAME_RE = re.compile(r'^[a-z0-9_]{1,4096}$')
110
111
marueld928c862017-06-08 08:20:04 -0700112OUTLIVING_ZOMBIE_MSG = """\
113*** Swarming tried multiple times to delete the %s directory and failed ***
114*** Hard failing the task ***
115
116Swarming detected that your testing script ran an executable, which may have
117started a child executable, and the main script returned early, leaving the
118children executables playing around unguided.
119
120You don't want to leave children processes outliving the task on the Swarming
121bot, do you? The Swarming bot doesn't.
122
123How to fix?
124- For any process that starts children processes, make sure all children
125 processes terminated properly before each parent process exits. This is
126 especially important in very deep process trees.
127 - This must be done properly both in normal successful task and in case of
128 task failure. Cleanup is very important.
129- The Swarming bot sends a SIGTERM in case of timeout.
130 - You have %s seconds to comply after the signal was sent to the process
131 before the process is forcibly killed.
132- To achieve not leaking children processes in case of signals on timeout, you
133 MUST handle signals in each executable / python script and propagate them to
134 children processes.
135 - When your test script (python or binary) receives a signal like SIGTERM or
136 CTRL_BREAK_EVENT on Windows), send it to all children processes and wait for
137 them to terminate before quitting.
138
139See
Marc-Antoine Ruelc7243592018-05-24 17:04:04 -0400140https://chromium.googlesource.com/infra/luci/luci-py.git/+/master/appengine/swarming/doc/Bot.md#Graceful-termination_aka-the-SIGTERM-and-SIGKILL-dance
marueld928c862017-06-08 08:20:04 -0700141for more information.
142
143*** May the SIGKILL force be with you ***
144"""
145
146
# Currently hardcoded. Eventually could be exposed as a flag once there's value.
# 3 weeks, expressed in seconds (21 days * 24 hours * 60 minutes * 60 seconds).
MAX_AGE_SECS = 21*24*60*60
150
151
# Immutable bundle of everything needed to map and run one task.
TaskData = collections.namedtuple(
    'TaskData',
    (
      # Command line to run, as a list of strings. It is used regardless of
      # what the isolated file specifies.
      'command',
      # Directory, relative to the run directory, to start the command in.
      'relative_cwd',
      # Arguments, as a list of strings, appended to the command specified in
      # the isolated file.
      'extra_args',
      # Hash of the .isolated file to fetch in order to recreate the tree of
      # files needed by the target executable. The command specified in the
      # .isolated is executed. Mutually exclusive with the command argument.
      'isolated_hash',
      # isolateserver.Storage instance used to retrieve remote objects. It
      # holds a reference to an isolateserver.StorageApi, which does the
      # actual I/O.
      'storage',
      # isolateserver.LocalCache instance caching the retrieved objects so
      # they are not fetched over and over. Can be on-disk or in-memory.
      'isolate_cache',
      # Paths, relative to root_dir, to put into the output isolated bundle
      # upon task completion (see link_outputs_to_outdir).
      'outputs',
      # Function (run_dir) => context manager that installs named caches into
      # |run_dir|.
      'install_named_caches',
      # When True, the temporary directory is deliberately leaked for later
      # examination.
      'leak_temp_dir',
      # Directory in which the temporary directories are created. When not
      # specified, a random temporary directory is created.
      'root_dir',
      # The process is killed if it lasts more than this amount of seconds.
      'hard_timeout',
      # Number of seconds to wait between SIGTERM and SIGKILL.
      'grace_period',
      # Path to a file with bot state, used in place of ${SWARMING_BOT_FILE}
      # task command line argument.
      'bot_file',
      # Logical account to switch LUCI_CONTEXT into.
      'switch_to_account',
      # Context manager dir => CipdInfo, see install_client_and_packages.
      'install_packages_fn',
      # Create the tree with symlinks instead of hardlinks.
      'use_symlinks',
      # Environment variables to set.
      'env',
      # Environment variables to mutate with relative directories.
      # Example: {"ENV_KEY": ['relative', 'paths', 'to', 'prepend']}
      'env_prefix',
      # Lowers the task process priority.
      'lower_priority',
    ))
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -0500208
209
Marc-Antoine Ruelee6ca622017-11-29 11:19:16 -0500210def _to_str(s):
211 """Downgrades a unicode instance to str. Pass str through as-is."""
212 if isinstance(s, str):
213 return s
214 # This is technically incorrect, especially on Windows. In theory
215 # sys.getfilesystemencoding() should be used to use the right 'ANSI code
216 # page' on Windows, but that causes other problems, as the character set
217 # is very limited.
218 return s.encode('utf-8')
219
220
Marc-Antoine Ruel7a68f712017-12-01 18:45:18 -0500221def _to_unicode(s):
222 """Upgrades a str instance to unicode. Pass unicode through as-is."""
223 if isinstance(s, unicode) or s is None:
224 return s
225 return s.decode('utf-8')
226
227
def make_temp_dir(prefix, root_dir):
  """Creates a new unique temporary directory and returns its path as unicode.

  The directory is created inside |root_dir| and its name starts with |prefix|.
  """
  created = tempfile.mkdtemp(dir=root_dir, prefix=prefix)
  return unicode(created)
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +0000231
232
def change_tree_read_only(rootdir, read_only):
  """Applies the requested read-only policy to the tree rooted at |rootdir|.

  |read_only| can be 0 (or None), 1 or 2. The value controls whether files can
  be modified and whether files can be created or deleted.

  Raises:
    ValueError if |read_only| is not one of the supported values.
  """
  if read_only not in (2, 1, 0, None):
    raise ValueError(
        'change_tree_read_only(%s, %s): Unknown flag %s' %
        (rootdir, read_only, read_only))

  if read_only == 2:
    # Files and directories (except on Windows) are marked read only. This
    # inhibits modifying, creating or deleting files in the test directory,
    # except on Windows where creating and deleting files is still possible.
    file_path.make_tree_read_only(rootdir)
    return

  if read_only == 1:
    # Files are marked read only but not the directories. This inhibits
    # modifying files but creating or deleting files is still possible.
    file_path.make_tree_files_read_only(rootdir)
    return

  # 0 or None: anything can be modified.
  # TODO(maruel): This is currently dangerous as long as
  # DiskContentAddressedCache.touch() is not yet changed to verify the hash of
  # the content of the files it is looking at, so that if a test modifies an
  # input file, the file must be deleted.
  file_path.make_tree_writeable(rootdir)
259
260
@contextlib.contextmanager
def set_luci_context_account(account, tmp_dir):
  """Context manager that makes |account| the default LUCI_CONTEXT account.

  Nothing is changed in any of these cases:
  - |account| is None or ''. This happens when run_isolated.py is called
    without the '--switch-to-account' flag. If run_isolated.py is itself
    running in some LUCI_CONTEXT environment, the task just inherits whatever
    account is already set. This may happen if users invoke run_isolated.py
    explicitly from their code.
  - LUCI_CONTEXT-based auth is not in use.
  - The task already runs as the requested account.

  If the requested account is not defined in the context, switches to
  non-authenticated access. This happens for Swarming tasks that don't use
  'task' service accounts.
  """
  # 'local_auth' is only read when a switch was actually requested. See
  # LUCI_CONTEXT.md for the format of 'local_auth'.
  local_auth = luci_context.read('local_auth') if account else None
  if not local_auth or local_auth.get('default_account_id') == account:
    # Not switching, not using LUCI_CONTEXT auth, or already set.
    yield
    return

  known_ids = set(a['id'] for a in (local_auth.get('accounts') or []))
  if account not in known_ids:
    logging.warning(
        'Requested LUCI_CONTEXT account %r is not available (have only %r), '
        'disabling authentication', account, sorted(known_ids))
    local_auth.pop('default_account_id', None)
  else:
    logging.info('Switching default LUCI_CONTEXT account to %r', account)
    local_auth['default_account_id'] = account

  with luci_context.write(_tmpdir=tmp_dir, local_auth=local_auth):
    yield
307
308
def process_command(command, out_dir, bot_file):
  """Returns a copy of |command| with the parameters replaced in each argument.

  Raises:
    ValueError if a parameter is requested in |command| but its value is not
      provided.
  """
  processed = []
  for arg in command:
    processed.append(replace_parameters(arg, out_dir, bot_file))
  return processed
317
318
def replace_parameters(arg, out_dir, bot_file):
  """Substitutes the magic parameter tokens found in the string |arg|.

  ${EXECUTABLE_SUFFIX} is always substituted. ${ISOLATED_OUTDIR} requires
  |out_dir|. ${SWARMING_BOT_FILE} is left untouched, with a warning, when
  |bot_file| is not provided.

  Raises:
    ValueError if a parameter is requested in |arg| but its value is not
      provided.
  """
  arg = arg.replace(EXECUTABLE_SUFFIX_PARAMETER, cipd.EXECUTABLE_SUFFIX)
  path_substituted = False

  if ISOLATED_OUTDIR_PARAMETER in arg:
    if not out_dir:
      raise ValueError(
          'output directory is requested in command or env var, but not '
          'provided; please specify one')
    arg = arg.replace(ISOLATED_OUTDIR_PARAMETER, out_dir)
    path_substituted = True

  if SWARMING_BOT_FILE_PARAMETER in arg:
    if not bot_file:
      logging.warning('SWARMING_BOT_FILE_PARAMETER found in command or env '
                      'var, but no bot_file specified. Leaving parameter '
                      'unchanged.')
    else:
      arg = arg.replace(SWARMING_BOT_FILE_PARAMETER, bot_file)
      path_substituted = True

  if not path_substituted:
    return arg
  # Slashes are converted only when a path parameter was substituted, because
  # of arguments like '${ISOLATED_OUTDIR}/foo/bar'.
  return arg.replace('/', os.sep)
maruela9cfd6f2015-09-15 11:03:15 -0700348
349
Roberto Carrillo71ade6d2018-10-08 22:30:24 +0000350
def get_command_env(tmp_dir, cipd_info, run_dir, env, env_prefixes, out_dir,
                    bot_file):
  """Returns full OS environment to run a command in.

  Sets up TEMP, puts directory with cipd binary in front of PATH, exposes
  CIPD_CACHE_DIR env var, and installs all env_prefixes.

  Args:
    tmp_dir: temp directory.
    cipd_info: CipdInfo object if cipd client is used, None if not.
    run_dir: The root directory the isolated tree is mapped in.
    env: environment variables to use. A variable with an empty value is
        removed from the resulting environment.
    env_prefixes: {"ENV_KEY": ['cwd', 'relative', 'paths', 'to', 'prepend']}
    out_dir: Isolated output directory. Required to be != None if any of the
        env vars contain ISOLATED_OUTDIR_PARAMETER.
    bot_file: Required to be != None if any of the env vars contain
        SWARMING_BOT_FILE_PARAMETER.

  Returns:
    dict of environment variables, based on a copy of os.environ.

  Raises:
    ValueError if an env var requests ISOLATED_OUTDIR_PARAMETER and |out_dir|
      is not provided.
  """
  out = os.environ.copy()
  for k, v in env.iteritems():
    if not v:
      out.pop(k, None)
    else:
      out[k] = replace_parameters(v, out_dir, bot_file)

  if cipd_info:
    bin_dir = _to_str(os.path.dirname(cipd_info.client.binary_path))
    # PATH can be missing, either because the host environment does not define
    # it or because |env| just removed it with an empty value. In that case the
    # cipd binary directory becomes the whole PATH instead of raising KeyError.
    if 'PATH' in out:
      out['PATH'] = '%s%s%s' % (bin_dir, os.pathsep, out['PATH'])
    else:
      out['PATH'] = bin_dir
    out['CIPD_CACHE_DIR'] = _to_str(cipd_info.cache_dir)

  for key, paths in env_prefixes.iteritems():
    assert isinstance(paths, list), paths
    paths = [os.path.normpath(os.path.join(run_dir, p)) for p in paths]
    cur = out.get(key)
    if cur:
      # The prefixes go in front of the pre-existing value.
      paths.append(cur)
    out[key] = _to_str(os.path.pathsep.join(paths))

  tmp_dir = _to_str(tmp_dir)
  # pylint: disable=line-too-long
  # * python respects $TMPDIR, $TEMP, and $TMP in this order, regardless of
  #   platform. So $TMPDIR must be set on all platforms.
  #   https://github.com/python/cpython/blob/2.7/Lib/tempfile.py#L155
  out['TMPDIR'] = tmp_dir
  if sys.platform == 'win32':
    # * chromium's base utils uses GetTempPath().
    #    https://cs.chromium.org/chromium/src/base/files/file_util_win.cc?q=GetTempPath
    # * Go uses GetTempPath().
    # * GetTempDir() uses %TMP%, then %TEMP%, then other stuff. So %TMP% must be
    #   set.
    #   https://docs.microsoft.com/en-us/windows/desktop/api/fileapi/nf-fileapi-gettemppathw
    out['TMP'] = tmp_dir
    # https://blogs.msdn.microsoft.com/oldnewthing/20150417-00/?p=44213
    out['TEMP'] = tmp_dir
  elif sys.platform == 'darwin':
    # * Chromium uses an hack on macOS before calling into
    #   NSTemporaryDirectory().
    #   https://cs.chromium.org/chromium/src/base/files/file_util_mac.mm?q=GetTempDir
    #   https://developer.apple.com/documentation/foundation/1409211-nstemporarydirectory
    out['MAC_CHROMIUM_TMPDIR'] = tmp_dir
  else:
    # TMPDIR is specified as the POSIX standard envvar for the temp directory.
    #   http://pubs.opengroup.org/onlinepubs/9699919799/basedefs/V1_chap08.html
    # * mktemp on linux respects $TMPDIR.
    # * Chromium respects $TMPDIR on linux.
    #   https://cs.chromium.org/chromium/src/base/files/file_util_posix.cc?q=GetTempDir
    # * Go uses $TMPDIR.
    #   https://go.googlesource.com/go/+/go1.10.3/src/os/file_unix.go#307
    pass
  return out
vadimsh232f5a82017-01-20 19:23:44 -0800421
422
def run_command(command, cwd, env, hard_timeout, grace_period, lower_priority):
  """Runs the command.

  The child process is started detached. If it does not exit within
  |hard_timeout|, or if a stop signal is received while it runs, it is sent
  SIGTERM, given |grace_period| to exit, and then killed.

  Args:
    command: command line to start, passed as-is to subprocess42.Popen.
    cwd: directory to start the command in.
    env: environment variables for the child process.
    hard_timeout: number of seconds to wait for the process before terminating
        it; a falsy value means to wait without a timeout.
    grace_period: number of seconds to wait after terminating the process
        before killing it; a falsy value means to wait without a timeout.
    lower_priority: forwarded to subprocess42.Popen.

  Returns:
    tuple(process exit code, bool if had a hard timeout)
  """
  logging.info(
      'run_command(%s, %s, %s, %s, %s)',
      command, cwd, hard_timeout, grace_period, lower_priority)

  exit_code = None
  had_hard_timeout = False
  with tools.Profiler('RunTest'):
    proc = None
    # A list is used so the nested handler can record the signal by mutating
    # it.
    had_signal = []
    try:
      # TODO(maruel): This code is imperfect. It doesn't handle well signals
      # during the download phase and there's short windows where things can go
      # wrong.
      def handler(signum, _frame):
        # Only the first signal received after the process was started is
        # acted upon. It is reported as a TimeoutExpired so it takes the same
        # termination path as a hard timeout.
        if proc and not had_signal:
          logging.info('Received signal %d', signum)
          had_signal.append(True)
          raise subprocess42.TimeoutExpired(command, None)

      proc = subprocess42.Popen(
          command, cwd=cwd, env=env, detached=True, close_fds=True,
          lower_priority=lower_priority)
      with subprocess42.set_signal_handler(subprocess42.STOP_SIGNALS, handler):
        try:
          exit_code = proc.wait(hard_timeout or None)
        except subprocess42.TimeoutExpired:
          # It is a real hard timeout only when no signal was received.
          if not had_signal:
            logging.warning('Hard timeout')
            had_hard_timeout = True
          logging.warning('Sending SIGTERM')
          proc.terminate()

      # Ignore signals in grace period. Forcibly give the grace period to the
      # child process.
      if exit_code is None:
        ignore = lambda *_: None
        with subprocess42.set_signal_handler(subprocess42.STOP_SIGNALS, ignore):
          try:
            exit_code = proc.wait(grace_period or None)
          except subprocess42.TimeoutExpired:
            # Now kill for real. The user can distinguish between the
            # following states:
            # - signal but process exited within grace period,
            #   hard_timed_out will be set but the process exit code will be
            #   script provided.
            # - processed exited late, exit code will be -9 on posix.
            logging.warning('Grace exhausted; sending SIGKILL')
            proc.kill()
      logging.info('Waiting for process exit')
      exit_code = proc.wait()
    except OSError:
      # This is not considered to be an internal error. The executable simply
      # does not exist.
      sys.stderr.write(
          '<The executable does not exist or a dependent library is missing>\n'
          '<Check for missing .so/.dll in the .isolate or GN file>\n'
          '<Command: %s>\n' % command)
      if os.environ.get('SWARMING_TASK_ID'):
        # Give an additional hint when running as a swarming task.
        sys.stderr.write(
            '<See the task\'s page for commands to help diagnose this issue '
            'by reproducing the task locally>\n')
      exit_code = 1
  # The exit code is also logged in hex, masked to 32 bits.
  logging.info(
      'Command finished with exit code %d (%s)',
      exit_code, hex(0xffffffff & exit_code))
  return exit_code, had_hard_timeout
maruela9cfd6f2015-09-15 11:03:15 -0700496
497
def fetch_and_map(isolated_hash, storage, cache, outdir, use_symlinks):
  """Fetches an isolated tree into |outdir| and returns (bundle, stats).

  stats is a dict with the fetch duration in seconds and the packed, base64
  encoded 'items_cold' and 'items_hot' lists computed from |cache|.
  """
  began = time.time()
  bundle = isolateserver.fetch_isolated(
      isolated_hash=isolated_hash,
      storage=storage,
      cache=cache,
      outdir=outdir,
      use_symlinks=use_symlinks)
  duration = time.time() - began
  # Cold items were added to the cache; hot items were used but not added.
  cold = sorted(cache.added)
  hot = sorted(set(cache.used) - set(cache.added))
  stats = {
    'duration': duration,
    'items_cold': base64.b64encode(large.pack(cold)),
    'items_hot': base64.b64encode(large.pack(hot)),
  }
  return bundle, stats
513
514
def link_outputs_to_outdir(run_dir, out_dir, outputs):
  """Makes each named output of |run_dir| available in |out_dir| for upload.

  Does nothing when |outputs| is empty. Otherwise the needed directories are
  created in |out_dir|, then each output is copied with copy_recursively().
  """
  if outputs:
    isolateserver.create_directories(out_dir, outputs)
    for rel_path in outputs:
      source = os.path.join(run_dir, rel_path)
      destination = os.path.join(out_dir, rel_path)
      copy_recursively(source, destination)
525
526
def copy_recursively(src, dst):
  """Efficiently copies a file or directory from |src| to |dst|.

  |src| may be a file, directory, or a symlink to a file or directory.
  All symlinks are replaced with their targets, so the resulting
  directory structure in |dst| will never have any symlinks.

  To increase speed, copy_recursively hardlinks individual files into the
  (newly created) directory structure if possible, unlike Python's
  shutil.copytree().

  Errors are logged and not raised: a missing path, a broken symlink or a
  symlink cycle results in the item being skipped.
  """
  # Upper bound on the number of symlinks followed for one item, so that a
  # symlink cycle (a -> b -> a) cannot loop forever. 40 is the limit used by
  # Linux path resolution.
  max_symlink_hops = 40

  orig_src = src
  try:
    # Replace symlinks with their final target.
    hops = 0
    while fs.islink(src):
      hops += 1
      if hops > max_symlink_hops:
        logging.warning(
            'Too many levels of symbolic links while resolving %s; skipping',
            orig_src)
        return
      res = fs.readlink(src)
      # A relative target is relative to the directory holding the symlink.
      src = os.path.join(os.path.dirname(src), res)

    # Note that fs.isfile (which is a wrapper around os.path.isfile) throws
    # an exception if src does not exist. A warning will be logged in that case.
    if fs.isfile(src):
      file_path.link_file(dst, src, file_path.HARDLINK_WITH_FALLBACK)
      return

    if not fs.exists(dst):
      os.makedirs(dst)

    for child in fs.listdir(src):
      copy_recursively(os.path.join(src, child), os.path.join(dst, child))

  except OSError as e:
    if e.errno == errno.ENOENT:
      logging.warning('Path %s does not exist or %s is a broken symlink',
                      src, orig_src)
    else:
      logging.info("Couldn't collect output file %s: %s", src, e)
aludwin0a8e17d2016-10-27 15:57:39 -0700564
565
def delete_and_upload(storage, out_dir, leak_temp_dir):
  """Uploads the content of |out_dir|, then deletes the directory.

  Returns:
    tuple(outputs_ref, success, stats)
    - outputs_ref: a dict referring to the results archived back to the isolated
        server, if applicable.
    - success: False if something occurred that means that the task must
        forcibly be considered a failure, e.g. zombie processes were left
        behind.
    - stats: uploading stats.
  """
  began = time.time()
  outputs_ref = None
  cold_sizes = []
  hot_sizes = []

  # Upload out_dir and generate a .isolated file out of this directory. It is
  # only done if files were written in the directory.
  has_outputs = fs.isdir(out_dir) and fs.listdir(out_dir)
  if has_outputs:
    with tools.Profiler('ArchiveOutput'):
      try:
        archived, cold_items, hot_items = (
            isolateserver.archive_files_to_storage(storage, [out_dir], None))
        server_ref = storage.server_ref
        outputs_ref = {
          'isolated': archived.values()[0],
          'isolatedserver': server_ref.url,
          'namespace': server_ref.namespace,
        }
        cold_sizes = [item.size for item in cold_items]
        cold_sizes.sort()
        hot_sizes = [item.size for item in hot_items]
        hot_sizes.sort()
      except isolateserver.Aborted:
        # This happens when a signal SIGTERM was received while uploading data.
        # There is 2 causes:
        # - The task was too slow and was about to be killed anyway due to
        #   exceeding the hard timeout.
        # - The amount of data uploaded back is very large and took too much
        #   time to archive.
        sys.stderr.write('Received SIGTERM while uploading')
        # Re-raise, so it will be treated as an internal failure.
        raise

  success = False
  try:
    must_delete = not leak_temp_dir and fs.isdir(out_dir)
    if must_delete and not file_path.rmtree(out_dir):
      logging.error('Had difficulties removing out_dir %s', out_dir)
    else:
      success = True
  except OSError as e:
    # When this happens, it means there's a process error.
    logging.exception('Had difficulties removing out_dir %s: %s', out_dir, e)

  stats = {
    'duration': time.time() - began,
    'items_cold': base64.b64encode(large.pack(cold_sizes)),
    'items_hot': base64.b64encode(large.pack(hot_sizes)),
  }
  return outputs_ref, success, stats
maruela9cfd6f2015-09-15 11:03:15 -0700624
625
def map_and_run(data, constant_run_path):
  """Runs a command with optional isolated input/output.

  Sets up the run, output and temporary directories, installs CIPD packages,
  maps the isolated tree when data.isolated_hash is set, installs the named
  caches, runs the command, then cleans up and uploads the outputs.

  Arguments:
  - data: TaskData instance.
  - constant_run_path: if true and a root directory is known, the command runs
    in the fixed directory <root_dir>/ISOLATED_RUN_DIR, which is wiped and
    recreated first; otherwise a fresh temporary run directory is created.

  Returns:
    dict with metadata about the result. 'internal_failure' is None unless
    run_isolated itself failed; a failure of the task (including a missing
    command or an invalid relative cwd) is reported through 'exit_code'.
  """
  result = {
    'duration': None,
    'exit_code': None,
    'had_hard_timeout': False,
    # Stays set until the command ran or a task-level failure is detected, so
    # that being killed midway is reported as an internal failure.
    'internal_failure': 'run_isolated did not complete properly',
    'stats': {
      # Added once the CIPD packages are installed:
      #'cipd': {
      #  'duration': 0.,
      #  'get_client_duration': 0.,
      #},
      'isolated': {
        'download': {
          #'duration': 0.,
          'initial_number_items': len(data.isolate_cache),
          'initial_size': data.isolate_cache.total_size,
          #'items_cold': '<large.pack()>',
          #'items_hot': '<large.pack()>',
        },
        #'upload': {
        #  'duration': 0.,
        #  'items_cold': '<large.pack()>',
        #  'items_hot': '<large.pack()>',
        #},
      },
    },
    #'cipd_pins': {
    #  'packages': [
    #    {'package_name': ..., 'version': ..., 'path': ...},
    #    ...
    #  ],
    #  'client_package': {'package_name': ..., 'version': ...},
    #},
    'outputs_ref': None,
    'version': 5,
  }

  if data.root_dir:
    file_path.ensure_tree(data.root_dir, 0o700)
  elif data.isolate_cache.cache_dir:
    data = data._replace(
        root_dir=os.path.dirname(data.isolate_cache.cache_dir))
  # See comment for these constants.
  # If root_dir is not specified, it is not constant.
  # TODO(maruel): This is not obvious. Change this to become an error once we
  # make the constant_run_path an exposed flag.
  if constant_run_path and data.root_dir:
    run_dir = os.path.join(data.root_dir, ISOLATED_RUN_DIR)
    if os.path.isdir(run_dir):
      file_path.rmtree(run_dir)
    os.mkdir(run_dir, 0o700)
  else:
    run_dir = make_temp_dir(ISOLATED_RUN_DIR, data.root_dir)
  # storage should be normally set but don't crash if it is not. This can happen
  # as Swarming task can run without an isolate server.
  out_dir = make_temp_dir(
      ISOLATED_OUT_DIR, data.root_dir) if data.storage else None
  tmp_dir = make_temp_dir(ISOLATED_TMP_DIR, data.root_dir)
  cwd = run_dir
  if data.relative_cwd:
    cwd = os.path.normpath(os.path.join(cwd, data.relative_cwd))
  command = data.command
  try:
    with data.install_packages_fn(run_dir) as cipd_info:
      if cipd_info:
        result['stats']['cipd'] = cipd_info.stats
        result['cipd_pins'] = cipd_info.pins

      if data.isolated_hash:
        isolated_stats = result['stats'].setdefault('isolated', {})
        bundle, stats = fetch_and_map(
            isolated_hash=data.isolated_hash,
            storage=data.storage,
            cache=data.isolate_cache,
            outdir=run_dir,
            use_symlinks=data.use_symlinks)
        isolated_stats['download'].update(stats)
        change_tree_read_only(run_dir, bundle.read_only)
        # Inject the command
        if not command and bundle.command:
          command = bundle.command + data.extra_args
          # Only set the relative directory if the isolated file specified a
          # command, and no raw command was specified.
          if bundle.relative_cwd:
            cwd = os.path.normpath(os.path.join(cwd, bundle.relative_cwd))

      if not command:
        # Handle this as a task failure, not an internal failure.
        sys.stderr.write(
            '<No command was specified!>\n'
            '<Please secify a command when triggering your Swarming task>\n')
        result['exit_code'] = 1
        # Clear the default value, otherwise this early return is still
        # reported as an internal failure.
        result['internal_failure'] = None
        return result

      # Compare on a path component boundary: a bare prefix test would accept
      # a sibling directory like '<run_dir>2'.
      if cwd != run_dir and not cwd.startswith(os.path.join(run_dir, '')):
        # Handle this as a task failure, not an internal failure. This is a
        # 'last chance' way to gate against directory escape.
        sys.stderr.write('<Relative CWD is outside of run directory!>\n')
        result['exit_code'] = 1
        result['internal_failure'] = None
        return result

      if not os.path.isdir(cwd):
        # Accepts relative_cwd that does not exist.
        os.makedirs(cwd, 0o700)

      # If we have an explicit list of files to return, make sure their
      # directories exist now.
      if data.storage and data.outputs:
        isolateserver.create_directories(run_dir, data.outputs)

      with data.install_named_caches(run_dir):
        sys.stdout.flush()
        start = time.time()
        try:
          # Need to switch the default account before 'get_command_env' call,
          # so it can grab correct value of LUCI_CONTEXT env var.
          with set_luci_context_account(data.switch_to_account, tmp_dir):
            env = get_command_env(
                tmp_dir, cipd_info, run_dir, data.env, data.env_prefix, out_dir,
                data.bot_file)
            command = tools.fix_python_cmd(command, env)
            command = process_command(command, out_dir, data.bot_file)
            file_path.ensure_command_has_abs_path(command, cwd)

            result['exit_code'], result['had_hard_timeout'] = run_command(
                command, cwd, env, data.hard_timeout, data.grace_period,
                data.lower_priority)
        finally:
          # Recorded even when the command could not be started.
          result['duration'] = max(time.time() - start, 0)

    # We successfully ran the command, set internal_failure back to
    # None (even if the command failed, it's not an internal error).
    result['internal_failure'] = None
  except Exception as e:
    # An internal error occurred. Report accordingly so the swarming task will
    # be retried automatically.
    logging.exception('internal failure: %s', e)
    result['internal_failure'] = str(e)
    on_error.report(None)

  # Clean up
  finally:
    try:
      # Try to link files to the output directory, if specified.
      if out_dir:
        link_outputs_to_outdir(run_dir, out_dir, data.outputs)

      success = False
      if data.leak_temp_dir:
        success = True
        logging.warning(
            'Deliberately leaking %s for later examination', run_dir)
      else:
        # On Windows rmtree(run_dir) call below has a synchronization effect: it
        # finishes only when all task child processes terminate (since a running
        # process locks *.exe file). Examine out_dir only after that call
        # completes (since child processes may write to out_dir too and we need
        # to wait for them to finish).
        if fs.isdir(run_dir):
          try:
            success = file_path.rmtree(run_dir)
          except OSError as e:
            logging.error('rmtree(%r) failed: %s', run_dir, e)
            success = False
          if not success:
            sys.stderr.write(OUTLIVING_ZOMBIE_MSG % ('run', data.grace_period))
            if result['exit_code'] == 0:
              result['exit_code'] = 1
        if fs.isdir(tmp_dir):
          try:
            success = file_path.rmtree(tmp_dir)
          except OSError as e:
            logging.error('rmtree(%r) failed: %s', tmp_dir, e)
            success = False
          if not success:
            sys.stderr.write(OUTLIVING_ZOMBIE_MSG % ('temp', data.grace_period))
            if result['exit_code'] == 0:
              result['exit_code'] = 1

      # This deletes out_dir if leak_temp_dir is not set.
      if out_dir:
        isolated_stats = result['stats'].setdefault('isolated', {})
        result['outputs_ref'], success, isolated_stats['upload'] = (
            delete_and_upload(data.storage, out_dir, data.leak_temp_dir))
      # A task that exited with 0 is still failed when cleaning up or uploading
      # did not succeed.
      if not success and result['exit_code'] == 0:
        result['exit_code'] = 1
    except Exception as e:
      # Swallow any exception in the main finally clause.
      if out_dir:
        logging.exception('Leaking out_dir %s: %s', out_dir, e)
      result['internal_failure'] = str(e)
  return result
Marc-Antoine Ruel2283ad12014-02-09 11:14:57 -0500826
827
def run_tha_test(data, result_json):
  """Runs an executable and records execution metadata.

  When an isolated hash is given, the dependencies are fetched into the cache
  and mapped into a temporary directory, then the command found in the
  .isolated file is run.

  The files written in the temporary output directory are uploaded back to
  |storage| as a .isolated file.

  Arguments:
  - data: TaskData instance.
  - result_json: File path to dump result metadata into. If set, the process
                 exit code is always 0 unless an internal error occurred.

  Returns:
    Process exit code that should be used.
  """
  if result_json:
    # Leave a pessimistic result on disk first, so there is something to read
    # if this process gets killed before completing.
    placeholder = {
      'exit_code': None,
      'had_hard_timeout': False,
      'internal_failure': 'Was terminated before completion',
      'outputs_ref': None,
      'version': 5,
    }
    tools.write_json(result_json, placeholder, dense=True)

  # The exit code of run_isolated depends on whether result_json is used.
  result = map_and_run(data, True)
  logging.info('Result:\n%s', tools.format_json(result, dense=True))

  if result_json:
    # Tests were found to delete 'work' when quitting, which would make the
    # write fail. Recreate the directory if necessary.
    file_path.ensure_tree(os.path.dirname(result_json))
    tools.write_json(result_json, result, dense=True)
    # The task exit code is in the file; only an internal error returns 1.
    return int(bool(result['internal_failure']))

  # No json file: marshall into old-style inline output.
  outputs_ref = result['outputs_ref']
  if outputs_ref:
    # pylint: disable=unsubscriptable-object
    legacy = {
      'hash': outputs_ref['isolated'],
      'namespace': outputs_ref['namespace'],
      'storage': outputs_ref['isolatedserver'],
    }
    sys.stdout.flush()
    print(
        '[run_isolated_out_hack]%s[/run_isolated_out_hack]' %
        tools.format_json(legacy, dense=True))
    sys.stdout.flush()
  return result['exit_code'] or int(bool(result['internal_failure']))
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +0000884
885
# Value yielded by 'install_client_and_packages'. Fields:
# - client: cipd.CipdClient object.
# - cache_dir: absolute path to bot-global cipd tag and instance cache.
# - stats: dict with stats to return to the server.
# - pins: dict with installed cipd pins to return to the server.
CipdInfo = collections.namedtuple(
    'CipdInfo', ('client', 'cache_dir', 'stats', 'pins'))
893
894
@contextlib.contextmanager
def noop_install_packages(_run_dir):
  """Stand-in for 'install_client_and_packages' if cipd is disabled.

  Installs nothing and yields None instead of a CipdInfo.
  """
  yield
899
900
iannuccib58d10d2017-03-18 02:00:25 -0700901def _install_packages(run_dir, cipd_cache_dir, client, packages, timeout):
902 """Calls 'cipd ensure' for packages.
903
904 Args:
905 run_dir (str): root of installation.
906 cipd_cache_dir (str): the directory to use for the cipd package cache.
907 client (CipdClient): the cipd client to use
908 packages: packages to install, list [(path, package_name, version), ...].
909 timeout: max duration in seconds that this function can take.
910
911 Returns: list of pinned packages. Looks like [
912 {
913 'path': 'subdirectory',
914 'package_name': 'resolved/package/name',
915 'version': 'deadbeef...',
916 },
917 ...
918 ]
919 """
920 package_pins = [None]*len(packages)
921 def insert_pin(path, name, version, idx):
922 package_pins[idx] = {
923 'package_name': name,
924 # swarming deals with 'root' as '.'
925 'path': path or '.',
926 'version': version,
927 }
928
929 by_path = collections.defaultdict(list)
930 for i, (path, name, version) in enumerate(packages):
931 # cipd deals with 'root' as ''
932 if path == '.':
933 path = ''
934 by_path[path].append((name, version, i))
935
936 pins = client.ensure(
937 run_dir,
938 {
939 subdir: [(name, vers) for name, vers, _ in pkgs]
940 for subdir, pkgs in by_path.iteritems()
941 },
942 cache_dir=cipd_cache_dir,
943 timeout=timeout,
944 )
945
946 for subdir, pin_list in sorted(pins.iteritems()):
947 this_subdir = by_path[subdir]
948 for i, (name, version) in enumerate(pin_list):
949 insert_pin(subdir, name, version, this_subdir[i][2])
950
Robert Iannucci461b30d2017-12-13 11:34:03 -0800951 assert None not in package_pins, (packages, pins, package_pins)
iannuccib58d10d2017-03-18 02:00:25 -0700952
953 return package_pins
954
955
@contextlib.contextmanager
def install_client_and_packages(
    run_dir, packages, service_url, client_package_name,
    client_version, cache_dir, timeout=None):
  """Bootstraps CIPD client and installs CIPD packages.

  Yields a single CipdInfo object holding the CipdClient, the cipd cache
  directory, the stats and the pins.

  The package pins are in the form of:
    [
      {
        "path": path, "package_name": package_name, "version": version,
      },
      ...
    ]
  and correspond 1:1 to the input |packages|. The CIPD client info is a single
  dictionary with "package_name" and "version". These dictionaries make their
  way all the way back to swarming, where they become the arguments of
  CipdPackage.

  If 'packages' list is empty, will bootstrap CIPD client, but won't install
  any packages.

  The bootstrapped client (regardless whether 'packages' list is empty or not),
  will be made available to the task via $PATH.

  Args:
    run_dir (str): root of installation.
    packages: packages to install, list [(path, package_name, version), ...].
    service_url (str): CIPD server url, e.g.
      "https://chrome-infra-packages.appspot.com."
    client_package_name (str): CIPD package name of CIPD client.
    client_version (str): Version of CIPD client.
    cache_dir (str): where to keep cache of cipd clients, packages and tags.
    timeout: max duration in seconds that this function can take.
  """
  assert cache_dir

  # Each call returns the time left out of |timeout|, so fetching the client
  # and installing the packages share a single budget.
  remaining = tools.sliding_timeout(timeout)
  began_at = time.time()

  cache_dir = os.path.abspath(cache_dir)
  # Tag and instance caches.
  cipd_cache_dir = os.path.join(cache_dir, 'cache')
  run_dir = os.path.abspath(run_dir)
  packages = packages or []

  client_began_at = time.time()
  client_manager = cipd.get_client(
      service_url, client_package_name, client_version, cache_dir,
      timeout=remaining())

  with client_manager as client:
    get_client_duration = time.time() - client_began_at

    package_pins = _install_packages(
        run_dir, cipd_cache_dir, client, packages,
        remaining()) if packages else []

    file_path.make_tree_files_read_only(run_dir)

    total_duration = time.time() - began_at
    logging.info(
        'Installing CIPD client and packages took %d seconds', total_duration)

    stats = {
      'duration': total_duration,
      'get_client_duration': get_client_duration,
    }
    pins = {
      'client_package': {
        'package_name': client.package_name,
        'version': client.instance_id,
      },
      'packages': package_pins,
    }
    # The client stays open for as long as the caller is inside the context.
    yield CipdInfo(
        client=client, cache_dir=cipd_cache_dir, stats=stats, pins=pins)
nodirbe642ff2016-06-09 15:51:51 -07001036
1037
def create_option_parser():
  """Creates the option parser for the run_isolated command line.

  Registers the general flags, then the 'Data source' group, the cache and
  CIPD flags, the 'Named caches' and 'Debugging' groups and the authentication
  flags.

  Returns:
    The configured logging_utils.OptionParserWithLogging instance.
  """
  parser = logging_utils.OptionParserWithLogging(
      usage='%prog <options> [command to run or extra args]',
      version=__version__,
      log_file=RUN_ISOLATED_LOG_FILE)
  parser.add_option(
      '--clean', action='store_true',
      help='Cleans the cache, trimming it if necessary and removing corrupted '
           'items, and returns without executing anything; use with -v to '
           'know what was done')
  parser.add_option(
      '--use-symlinks', action='store_true',
      help='Use symlinks instead of hardlinks')
  parser.add_option(
      '--json',
      help='dump output metadata to json file. When used, run_isolated returns '
           'non-zero only on internal failure')
  parser.add_option(
      '--hard-timeout', type='float', help='Enforce hard timeout in execution')
  parser.add_option(
      '--grace-period', type='float',
      help='Grace period between SIGTERM and SIGKILL')
  parser.add_option(
      '--raw-cmd', action='store_true',
      help='Ignore the isolated command, use the one supplied at the command '
           'line')
  parser.add_option(
      '--relative-cwd',
      help='Ignore the isolated \'relative_cwd\' and use this one instead; '
           'requires --raw-cmd')
  parser.add_option(
      '--env', default=[], action='append',
      help='Environment variables to set for the child process')
  parser.add_option(
      '--env-prefix', default=[], action='append',
      help='Specify a VAR=./path/fragment to put in the environment variable '
           'before executing the command. The path fragment must be relative '
           'to the isolated run directory, and must not contain a `..` token. '
           'The path will be made absolute and prepended to the indicated '
           '$VAR using the OS\'s path separator. Multiple items for the same '
           '$VAR will be prepended in order.')
  parser.add_option(
      '--lower-priority', action='store_true',
      help='Lowers the child process priority')
  parser.add_option(
      '--bot-file',
      help='Path to a file describing the state of the host. The content is '
           'defined by on_before_task() in bot_config.')
  parser.add_option(
      '--switch-to-account',
      help='If given, switches LUCI_CONTEXT to given logical service account '
           '(e.g. "task" or "system") before launching the isolated process.')
  parser.add_option(
      '--output', action='append',
      help='Specifies an output to return. If no outputs are specified, all '
           'files located in ${ISOLATED_OUTDIR} will be returned; '
           'otherwise, outputs in both ${ISOLATED_OUTDIR} and those '
           'specified by --output option (there can be multiple) will be '
           'returned. Note that if a file in OUT_DIR has the same path '
           'as an --output option, the --output version will be returned.')
  parser.add_option(
      '-a', '--argsfile',
      # This is actually handled in parse_args; it's included here purely so it
      # can make it into the help text.
      help='Specify a file containing a JSON array of arguments to this '
           'script. If --argsfile is provided, no other argument may be '
           'provided on the command line.')
  data_group = optparse.OptionGroup(parser, 'Data source')
  data_group.add_option(
      '-s', '--isolated',
      help='Hash of the .isolated to grab from the isolate server.')
  isolateserver.add_isolate_server_options(data_group)
  parser.add_option_group(data_group)

  isolateserver.add_cache_options(parser)

  cipd.add_cipd_options(parser)

  group = optparse.OptionGroup(parser, 'Named caches')
  group.add_option(
      '--named-cache',
      dest='named_caches',
      action='append',
      nargs=3,
      default=[],
      help='A named cache to request. Accepts 3 arguments: name, path, hint. '
           'name identifies the cache, must match regex [a-z0-9_]{1,4096}. '
           'path is a path relative to the run dir where the cache directory '
           'must be put to. '
           'hint is the expected size in bytes of the cache, used to free up '
           'additional disk space when the cache is not present yet; use 0 '
           'when unknown. '
           'This option can be specified more than once.')
  group.add_option(
      '--named-cache-root', default='named_caches',
      help='Cache root directory. Default=%default')
  parser.add_option_group(group)

  debug_group = optparse.OptionGroup(parser, 'Debugging')
  debug_group.add_option(
      '--leak-temp-dir',
      action='store_true',
      help='Deliberately leak isolate\'s temp dir for later examination. '
           'Default: %default')
  debug_group.add_option(
      '--root-dir', help='Use a directory instead of a random one')
  parser.add_option_group(debug_group)

  auth.add_auth_options(parser)

  # Relative default locations for the isolate and CIPD caches.
  parser.set_defaults(cache='cache', cipd_cache='cipd_cache')
  return parser
1147
1148
def process_named_cache_options(parser, options, time_fn=None):
  """Validates named cache options and returns a CacheManager.

  Arguments:
  - parser: option parser, used to report invalid values via parser.error().
  - options: parsed options; reads named_caches, named_cache_root and
    min_free_space.
  - time_fn: forwarded as is to local_caching.NamedCache.

  Returns:
    A local_caching.NamedCache rooted at --named-cache-root, or None when
    --named-cache-root is empty.
  """
  cache_root = options.named_cache_root
  requested = options.named_caches
  if requested and not cache_root:
    parser.error('--named-cache is specified, but --named-cache-root is empty')
  for name, path, hint in requested:
    if not CACHE_NAME_RE.match(name):
      parser.error(
          'cache name %r does not match %r' % (name, CACHE_NAME_RE.pattern))
    if not path:
      parser.error('cache path cannot be empty')
    try:
      # Only checks that the hint parses; the value itself is not used here.
      long(hint)
    except ValueError:
      parser.error('cache hint must be a number')

  if not cache_root:
    return None

  # Make these configurable later if there is use case but for now it's fairly
  # safe values.
  # In practice, a fair chunk of bots are already recycled on a daily schedule
  # so this code doesn't have any effect to them, unless they are preloaded
  # with a really old cache.
  one_tib = 1024*1024*1024*1024
  policies = local_caching.CachePolicies(
      max_cache_size=one_tib,
      min_free_space=options.min_free_space,
      max_items=50,
      max_age_secs=MAX_AGE_SECS)
  return local_caching.NamedCache(
      unicode(os.path.abspath(cache_root)), policies, time_fn=time_fn)
1178
1179
def parse_args(args):
  """Parses the command line, reading it from --argsfile when specified.

  Arguments:
  - args: list of command line arguments, without the program name.

  Returns:
    Tuple (parser, options, args) where parser is the option parser created by
    create_option_parser(), and options and args are what it parsed.

  Exits via argparse's error() when --argsfile is mixed with other arguments.
  """
  # Create a fake mini-parser just to get out the "-a" command. Note that
  # it's not documented here; instead, it's documented in create_option_parser
  # even though that parser will never actually get to parse it. This is
  # because --argsfile is exclusive with all other options and arguments.
  file_argparse = argparse.ArgumentParser(add_help=False)
  file_argparse.add_argument('-a', '--argsfile')
  file_args, nonfile_args = file_argparse.parse_known_args(args)
  if file_args.argsfile:
    if nonfile_args:
      file_argparse.error(
          'Can\'t specify --argsfile with any other arguments (%s)' %
          nonfile_args)
    try:
      with open(file_args.argsfile, 'r') as f:
        args = json.load(f)
    except (IOError, OSError, ValueError) as e:
      # We don't need to error out here: "args" keeps its original value, which
      # only holds the --argsfile flag, so the regular parser below runs on a
      # command line without anything to execute.
      sys.stderr.write('Couldn\'t read arguments: %s\n' % e)

  # Even if we failed to read the args, just call the normal parser now since it
  # knows how to report what is missing.
  parser = create_option_parser()
  options, args = parser.parse_args(args)
  return (parser, options, args)
1206
1207
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001208def _calc_named_cache_hint(named_cache, named_caches):
1209 """Returns the expected size of the missing named caches."""
1210 present = named_cache.available
1211 size = 0
1212 for name, _, hint in named_caches:
1213 if name not in present:
1214 hint = long(hint)
1215 if hint > 0:
1216 size += hint
1217 return size
1218
1219
aludwin7556e0c2016-10-26 08:46:10 -07001220def main(args):
Marc-Antoine Ruelee6ca622017-11-29 11:19:16 -05001221 # Warning: when --argsfile is used, the strings are unicode instances, when
1222 # parsed normally, the strings are str instances.
aludwin7556e0c2016-10-26 08:46:10 -07001223 (parser, options, args) = parse_args(args)
maruel36a963d2016-04-08 17:15:49 -07001224
Marc-Antoine Ruel5028ba22017-08-25 17:37:51 -04001225 if not file_path.enable_symlink():
Marc-Antoine Ruel5a024272019-01-15 20:11:16 +00001226 logging.warning('Symlink support is not enabled')
Marc-Antoine Ruel5028ba22017-08-25 17:37:51 -04001227
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001228 named_cache = process_named_cache_options(parser, options)
Marc-Antoine Ruel0d8b0f62018-09-10 14:40:35 +00001229 # hint is 0 if there's no named cache.
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001230 hint = _calc_named_cache_hint(named_cache, options.named_caches)
1231 if hint:
1232 # Increase the --min-free-space value by the hint, and recreate the
1233 # NamedCache instance so it gets the updated CachePolicy.
1234 options.min_free_space += hint
1235 named_cache = process_named_cache_options(parser, options)
1236
Marc-Antoine Ruel7139d912018-06-15 20:04:42 +00001237 # TODO(maruel): CIPD caches should be defined at an higher level here too, so
1238 # they can be cleaned the same way.
nodirf33b8d62016-10-26 22:34:58 -07001239 isolate_cache = isolateserver.process_cache_options(options, trim=False)
Marc-Antoine Ruel7139d912018-06-15 20:04:42 +00001240 caches = []
1241 if isolate_cache:
1242 caches.append(isolate_cache)
1243 if named_cache:
1244 caches.append(named_cache)
1245 root = caches[0].cache_dir if caches else unicode(os.getcwd())
maruel36a963d2016-04-08 17:15:49 -07001246 if options.clean:
1247 if options.isolated:
1248 parser.error('Can\'t use --isolated with --clean.')
1249 if options.isolate_server:
1250 parser.error('Can\'t use --isolate-server with --clean.')
1251 if options.json:
1252 parser.error('Can\'t use --json with --clean.')
nodirf33b8d62016-10-26 22:34:58 -07001253 if options.named_caches:
1254 parser.error('Can\t use --named-cache with --clean.')
Marc-Antoine Ruel7139d912018-06-15 20:04:42 +00001255 # Trim first, then clean.
1256 local_caching.trim_caches(
1257 caches,
1258 root,
1259 min_free_space=options.min_free_space,
1260 max_age_secs=MAX_AGE_SECS)
1261 for c in caches:
Marc-Antoine Ruel87fc2222018-06-18 13:09:24 +00001262 c.cleanup()
maruel36a963d2016-04-08 17:15:49 -07001263 return 0
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001264
1265 # Trim must still be done for the following case:
1266 # - named-cache was used
1267 # - some entries, with a large hint, were missing
1268 # - --min-free-space was increased accordingly, thus trimming is needed
1269 # Otherwise, this will have no effect, as bot_main calls run_isolated with
1270 # --clean after each task.
1271 if hint:
1272 logging.info('Additional trimming of %d bytes', hint)
Marc-Antoine Ruel0d8b0f62018-09-10 14:40:35 +00001273 local_caching.trim_caches(
1274 caches,
1275 root,
1276 min_free_space=options.min_free_space,
1277 max_age_secs=MAX_AGE_SECS)
maruel36a963d2016-04-08 17:15:49 -07001278
nodir55be77b2016-05-03 09:39:57 -07001279 if not options.isolated and not args:
1280 parser.error('--isolated or command to run is required.')
1281
Vadim Shtayura5d1efce2014-02-04 10:55:43 -08001282 auth.process_auth_options(parser, options)
nodir55be77b2016-05-03 09:39:57 -07001283
1284 isolateserver.process_isolate_server_options(
Marc-Antoine Ruel5028ba22017-08-25 17:37:51 -04001285 parser, options, True, False)
nodir55be77b2016-05-03 09:39:57 -07001286 if not options.isolate_server:
1287 if options.isolated:
1288 parser.error('--isolated requires --isolate-server')
1289 if ISOLATED_OUTDIR_PARAMETER in args:
1290 parser.error(
1291 '%s in args requires --isolate-server' % ISOLATED_OUTDIR_PARAMETER)
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001292
nodir90bc8dc2016-06-15 13:35:21 -07001293 if options.root_dir:
1294 options.root_dir = unicode(os.path.abspath(options.root_dir))
maruel12e30012015-10-09 11:55:35 -07001295 if options.json:
1296 options.json = unicode(os.path.abspath(options.json))
nodir55be77b2016-05-03 09:39:57 -07001297
Marc-Antoine Ruel19dd8872017-11-28 18:33:39 -05001298 if any('=' not in i for i in options.env):
1299 parser.error(
1300 '--env required key=value form. value can be skipped to delete '
1301 'the variable')
Marc-Antoine Ruel7a68f712017-12-01 18:45:18 -05001302 options.env = dict(i.split('=', 1) for i in options.env)
Marc-Antoine Ruel19dd8872017-11-28 18:33:39 -05001303
1304 prefixes = {}
1305 cwd = os.path.realpath(os.getcwd())
1306 for item in options.env_prefix:
1307 if '=' not in item:
1308 parser.error(
1309 '--env-prefix %r is malformed, must be in the form `VAR=./path`'
1310 % item)
Marc-Antoine Ruel7a68f712017-12-01 18:45:18 -05001311 key, opath = item.split('=', 1)
Marc-Antoine Ruel19dd8872017-11-28 18:33:39 -05001312 if os.path.isabs(opath):
1313 parser.error('--env-prefix %r path is bad, must be relative.' % opath)
1314 opath = os.path.normpath(opath)
1315 if not os.path.realpath(os.path.join(cwd, opath)).startswith(cwd):
1316 parser.error(
1317 '--env-prefix %r path is bad, must be relative and not contain `..`.'
1318 % opath)
1319 prefixes.setdefault(key, []).append(opath)
1320 options.env_prefix = prefixes
Robert Iannuccibf5f84c2017-11-22 12:56:50 -08001321
nodirbe642ff2016-06-09 15:51:51 -07001322 cipd.validate_cipd_options(parser, options)
1323
vadimsh232f5a82017-01-20 19:23:44 -08001324 install_packages_fn = noop_install_packages
vadimsh902948e2017-01-20 15:57:32 -08001325 if options.cipd_enabled:
iannuccib58d10d2017-03-18 02:00:25 -07001326 install_packages_fn = lambda run_dir: install_client_and_packages(
vadimsh902948e2017-01-20 15:57:32 -08001327 run_dir, cipd.parse_package_args(options.cipd_packages),
1328 options.cipd_server, options.cipd_client_package,
1329 options.cipd_client_version, cache_dir=options.cipd_cache)
nodirbe642ff2016-06-09 15:51:51 -07001330
@contextlib.contextmanager
def install_named_caches(run_dir):
  """Installs the requested named caches under run_dir while a task runs.

  WARNING: this function depends on the "options" and "named_cache" variables
  defined in the outer function.

  Each (name, relpath, _) entry of options.named_caches is installed at
  os.path.join(run_dir, relpath) before yielding. On exit, whether normal or
  via an exception, the caches are uninstalled in reverse installation order.

  Arguments:
    run_dir: absolute path of the directory the relative cache paths are
        joined to.

  Yields:
    Nothing; the caches stay installed for the duration of the with-block.
  """
  # NOTE(review): unicode(run_dir) only asserts that the converted value is
  # non-empty; isinstance(run_dir, unicode) may have been intended -- confirm
  # against callers before tightening.
  assert unicode(run_dir), repr(run_dir)
  assert os.path.isabs(run_dir), run_dir
  named_caches = [
    (os.path.join(run_dir, unicode(relpath)), name)
    for name, relpath, _ in options.named_caches
  ]
  for path, name in named_caches:
    named_cache.install(path, name)
  try:
    yield
  finally:
    # Uninstall each named cache, returning it to the cache pool. If an
    # uninstall fails for a given cache, it will remain in the task's
    # temporary space, get cleaned up by the Swarming bot, and be lost.
    #
    # If the Swarming bot cannot clean up the cache, it will handle it like
    # any other bot file that could not be removed.
    for path, name in reversed(named_caches):
      try:
        # uninstall() doesn't trim but does call save() implicitly. Trimming
        # *must* be done manually via periodic 'run_isolated.py --clean'.
        named_cache.uninstall(path, name)
      except local_caching.NamedCacheError:
        # The message reads "named cache <name> at <path>", so the arguments
        # must be passed in that order.
        logging.exception(
            'Error while removing named cache %r at %r. '
            'The cache will be lost.', name, path)
nodirf33b8d62016-10-26 22:34:58 -07001360
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -05001361 extra_args = []
1362 command = []
1363 if options.raw_cmd:
1364 command = args
Marc-Antoine Ruel95068cf2017-12-07 21:35:05 -05001365 if options.relative_cwd:
1366 a = os.path.normpath(os.path.abspath(options.relative_cwd))
1367 if not a.startswith(os.getcwd()):
1368 parser.error(
1369 '--relative-cwd must not try to escape the working directory')
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -05001370 else:
Marc-Antoine Ruel95068cf2017-12-07 21:35:05 -05001371 if options.relative_cwd:
1372 parser.error('--relative-cwd requires --raw-cmd')
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -05001373 extra_args = args
1374
1375 data = TaskData(
1376 command=command,
Marc-Antoine Ruel95068cf2017-12-07 21:35:05 -05001377 relative_cwd=options.relative_cwd,
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -05001378 extra_args=extra_args,
1379 isolated_hash=options.isolated,
1380 storage=None,
1381 isolate_cache=isolate_cache,
1382 outputs=options.output,
1383 install_named_caches=install_named_caches,
1384 leak_temp_dir=options.leak_temp_dir,
1385 root_dir=_to_unicode(options.root_dir),
1386 hard_timeout=options.hard_timeout,
1387 grace_period=options.grace_period,
1388 bot_file=options.bot_file,
1389 switch_to_account=options.switch_to_account,
1390 install_packages_fn=install_packages_fn,
Marc-Antoine Ruel03c6fd12019-04-30 12:12:55 +00001391 use_symlinks=bool(options.use_symlinks),
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -05001392 env=options.env,
Marc-Antoine Ruel03c6fd12019-04-30 12:12:55 +00001393 env_prefix=options.env_prefix,
1394 lower_priority=bool(options.lower_priority))
nodirbe642ff2016-06-09 15:51:51 -07001395 try:
nodir90bc8dc2016-06-15 13:35:21 -07001396 if options.isolate_server:
Marc-Antoine Ruelb8513132018-11-20 19:48:53 +00001397 server_ref = isolate_storage.ServerRef(
nodir90bc8dc2016-06-15 13:35:21 -07001398 options.isolate_server, options.namespace)
Marc-Antoine Ruelb8513132018-11-20 19:48:53 +00001399 storage = isolateserver.get_storage(server_ref)
nodir90bc8dc2016-06-15 13:35:21 -07001400 with storage:
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -05001401 data = data._replace(storage=storage)
nodirf33b8d62016-10-26 22:34:58 -07001402 # Hashing schemes used by |storage| and |isolate_cache| MUST match.
Marc-Antoine Ruelb8513132018-11-20 19:48:53 +00001403 assert storage.server_ref.hash_algo == server_ref.hash_algo
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -05001404 return run_tha_test(data, options.json)
1405 return run_tha_test(data, options.json)
Marc-Antoine Ruel8b11dbd2018-05-18 14:31:22 -04001406 except (
1407 cipd.Error,
1408 local_caching.NamedCacheError,
Marc-Antoine Ruelb6e9e232018-11-20 00:12:33 +00001409 local_caching.NoMoreSpace) as ex:
nodirbe642ff2016-06-09 15:51:51 -07001410 print >> sys.stderr, ex.message
1411 return 1
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001412
1413
if __name__ == '__main__':
  # Script entry point: prepare the process, run main() on the command-line
  # arguments and exit with the code it returns.
  subprocess42.inhibit_os_error_reporting()
  # Ensure that we are always running with the correct encoding.
  fix_encoding.fix_encoding()
  exit_code = main(sys.argv[1:])
  sys.exit(exit_code)
Marc-Antoine Ruel90c98162013-12-18 15:11:57 -05001418 sys.exit(main(sys.argv[1:]))