blob: d8655ceeddc959c94e5713855b5f761f00ae9bf1 [file] [log] [blame]
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001#!/usr/bin/env python
maruelea586f32016-04-05 11:11:33 -07002# Copyright 2012 The LUCI Authors. All rights reserved.
maruelf1f5e2a2016-05-25 17:10:39 -07003# Use of this source code is governed under the Apache License, Version 2.0
4# that can be found in the LICENSE file.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00005
nodir55be77b2016-05-03 09:39:57 -07006"""Runs a command with optional isolated input/output.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00007
run_isolated takes care of setting up a temporary environment, running a
command, and tearing it down.
nodir55be77b2016-05-03 09:39:57 -070010
Marc-Antoine Rueleed2f3a2019-03-14 00:00:40 +000011It handles downloading and uploading isolated files, mapping CIPD packages and
12reusing stateful named caches.
13
14The isolated files, CIPD packages and named caches are kept as a global LRU
15cache.
Marc-Antoine Ruel2283ad12014-02-09 11:14:57 -050016
Roberto Carrillo71ade6d2018-10-08 22:30:24 +000017Any ${EXECUTABLE_SUFFIX} on the command line or the environment variables passed
18with the --env option will be replaced with ".exe" string on Windows and "" on
19other platforms.
nodirbe642ff2016-06-09 15:51:51 -070020
Roberto Carrillo71ade6d2018-10-08 22:30:24 +000021Any ${ISOLATED_OUTDIR} on the command line or the environment variables passed
22with the --env option will be replaced by the location of a temporary directory
23upon execution of the command specified in the .isolated file. All content
24written to this directory will be uploaded upon termination and the .isolated
25file describing this directory will be printed to stdout.
bpastene447c1992016-06-20 15:21:47 -070026
Marc-Antoine Rueleed2f3a2019-03-14 00:00:40 +000027Any ${SWARMING_BOT_FILE} on the command line or the environment variables passed
28with the --env option will be replaced by the value of the --bot-file parameter.
29This file is used by a swarming bot to communicate state of the host to tasks.
30It is written to by the swarming bot's on_before_task() hook in the swarming
31server's custom bot_config.py.
32
33See
34https://chromium.googlesource.com/infra/luci/luci-py.git/+/master/appengine/swarming/doc/Magic-Values.md
35for all the variables.
36
37See
38https://chromium.googlesource.com/infra/luci/luci-py.git/+/master/appengine/swarming/swarming_bot/config/bot_config.py
39for more information about bot_config.py.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000040"""
41
Marc-Antoine Ruelf899c482019-10-10 23:32:06 +000042from __future__ import print_function
43
44__version__ = '1.0.1'
maruel@chromium.orgdedbf492013-09-12 20:42:11 +000045
aludwin7556e0c2016-10-26 08:46:10 -070046import argparse
maruel064c0a32016-04-05 11:47:15 -070047import base64
iannucci96fcccc2016-08-30 15:52:22 -070048import collections
vadimsh232f5a82017-01-20 19:23:44 -080049import contextlib
Sadaf Matinkhoo10743a62018-03-29 16:28:58 -040050import errno
aludwin7556e0c2016-10-26 08:46:10 -070051import json
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000052import logging
53import optparse
54import os
Marc-Antoine Ruel8b11dbd2018-05-18 14:31:22 -040055import re
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000056import sys
57import tempfile
maruel064c0a32016-04-05 11:47:15 -070058import time
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000059
Marc-Antoine Ruel016c7602019-04-02 18:31:13 +000060from utils import tools
61tools.force_local_third_party()
vadimsh@chromium.orga4326472013-08-24 02:05:41 +000062
Marc-Antoine Ruel016c7602019-04-02 18:31:13 +000063# third_party/
64from depot_tools import fix_encoding
65
66# pylint: disable=ungrouped-imports
67import auth
68import cipd
69import isolate_storage
70import isolateserver
71import local_caching
72from libs import luci_context
Vadim Shtayura6b555c12014-07-23 16:22:18 -070073from utils import file_path
maruel12e30012015-10-09 11:55:35 -070074from utils import fs
maruel064c0a32016-04-05 11:47:15 -070075from utils import large
Marc-Antoine Ruelf74cffe2015-07-15 15:21:34 -040076from utils import logging_utils
Marc-Antoine Ruelcfb60852014-07-02 15:22:00 -040077from utils import on_error
Marc-Antoine Ruelc44f5722015-01-08 16:10:01 -050078from utils import subprocess42
maruel@chromium.orgdedbf492013-09-12 20:42:11 +000079
vadimsh@chromium.orga4326472013-08-24 02:05:41 +000080
# Placeholder tokens that may appear in the task command line (or in --env
# values); they are substituted before the command is started.
ISOLATED_OUTDIR_PARAMETER = '${ISOLATED_OUTDIR}'
EXECUTABLE_SUFFIX_PARAMETER = '${EXECUTABLE_SUFFIX}'
SWARMING_BOT_FILE_PARAMETER = '${SWARMING_BOT_FILE}'


# File name of run_isolated's own log.
RUN_ISOLATED_LOG_FILE = 'run_isolated.log'


# File name of the log used for the run_test_cases.py command.
RUN_TEST_CASES_LOG = 'run_test_cases.log'


# Temporary directory names are deliberately kept to two characters. Windows
# limits paths to 260 characters (MAX_PATH), and deep trees such as recursive
# npm dependencies reach that limit easily.
#
# For the same reason the script should be started with a `root_dir` that is
# as short as possible.
# - ir: isolated_run
# - io: isolated_out
# - it: isolated_tmp
ISOLATED_RUN_DIR = u'ir'
ISOLATED_OUT_DIR = u'io'
ISOLATED_TMP_DIR = u'it'


# Valid named cache names. Must be kept in sync with task_request.py.
CACHE_NAME_RE = re.compile(r'^[a-z0-9_]{1,4096}$')
Marc-Antoine Ruel8b11dbd2018-05-18 14:31:22 -0400112
113
# Message template explaining that a directory could not be deleted, most
# likely because child processes outlived the task. It takes two %s
# arguments, in order: the directory that could not be deleted, and the number
# of seconds granted after the termination signal before the process is
# forcibly killed.
OUTLIVING_ZOMBIE_MSG = """\
*** Swarming tried multiple times to delete the %s directory and failed ***
*** Hard failing the task ***

Swarming detected that your testing script ran an executable, which may have
started a child executable, and the main script returned early, leaving the
children executables playing around unguided.

You don't want to leave children processes outliving the task on the Swarming
bot, do you? The Swarming bot doesn't.

How to fix?
- For any process that starts children processes, make sure all children
 processes terminated properly before each parent process exits. This is
 especially important in very deep process trees.
 - This must be done properly both in normal successful task and in case of
 task failure. Cleanup is very important.
- The Swarming bot sends a SIGTERM in case of timeout.
 - You have %s seconds to comply after the signal was sent to the process
 before the process is forcibly killed.
- To achieve not leaking children processes in case of signals on timeout, you
 MUST handle signals in each executable / python script and propagate them to
 children processes.
 - When your test script (python or binary) receives a signal like SIGTERM or
 CTRL_BREAK_EVENT on Windows), send it to all children processes and wait for
 them to terminate before quitting.

See
https://chromium.googlesource.com/infra/luci/luci-py.git/+/master/appengine/swarming/doc/Bot.md#Graceful-termination_aka-the-SIGTERM-and-SIGKILL-dance
for more information.

*** May the SIGKILL force be with you ***
"""
147
148
# Three weeks, expressed in seconds. Hardcoded for now; it could become a
# command line flag once there is a need for it.
MAX_AGE_SECS = 3 * 7 * 24 * 60 * 60
152
153
# Immutable bundle of everything needed to run one task. The field order is
# part of the interface: instances may be built positionally.
TaskData = collections.namedtuple(
    'TaskData',
    (
        # Command line to run, as a list of strings. Used independently of
        # whatever command the isolated file specifies.
        'command',
        # Directory, relative to the run directory, to start the command in.
        'relative_cwd',
        # List of strings appended to the command found in the isolated file.
        'extra_args',
        # Hash of the .isolated file describing the tree of files needed to
        # run the target executable; the command it specifies is the one
        # executed. Mutually exclusive with |command|.
        'isolated_hash',
        # isolateserver.Storage instance used to fetch remote objects. It
        # holds a reference to an isolateserver.StorageApi which performs the
        # actual I/O.
        'storage',
        # isolateserver.LocalCache instance that caches retrieved objects so
        # they are not fetched over and over. May be on-disk or in-memory.
        'isolate_cache',
        # Paths, relative to root_dir, to include in the output isolated
        # bundle once the task completes (see link_outputs_to_outdir).
        'outputs',
        # Function (run_dir) => context manager that installs the named
        # caches into |run_dir|.
        'install_named_caches',
        # When True, the temporary directory is intentionally left behind so
        # it can be inspected afterwards.
        'leak_temp_dir',
        # Directory in which the temporary directory is created. A random
        # temporary directory is created when unspecified.
        'root_dir',
        # The process is killed when it runs for more than this many seconds.
        'hard_timeout',
        # Seconds to wait between SIGTERM and SIGKILL.
        'grace_period',
        # Path to a file holding the bot state; substituted for
        # ${SWARMING_BOT_FILE} in the task command line.
        'bot_file',
        # Logical account LUCI_CONTEXT is switched to.
        'switch_to_account',
        # Context manager dir => CipdInfo, see install_client_and_packages.
        'install_packages_fn',
        # Build the tree with symlinks rather than hardlinks.
        'use_symlinks',
        # Environment variables to set.
        'env',
        # Environment variables to extend with relative directories.
        # Example: {"ENV_KEY": ['relative', 'paths', 'to', 'prepend']}
        'env_prefix',
        # Lowers the priority of the task process.
        'lower_priority',
        # subprocess42.Containment instance, or None.
        'containment',
    ))
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -0500212
213
Marc-Antoine Ruelee6ca622017-11-29 11:19:16 -0500214def _to_str(s):
215 """Downgrades a unicode instance to str. Pass str through as-is."""
216 if isinstance(s, str):
217 return s
218 # This is technically incorrect, especially on Windows. In theory
219 # sys.getfilesystemencoding() should be used to use the right 'ANSI code
220 # page' on Windows, but that causes other problems, as the character set
221 # is very limited.
222 return s.encode('utf-8')
223
224
Marc-Antoine Ruel7a68f712017-12-01 18:45:18 -0500225def _to_unicode(s):
226 """Upgrades a str instance to unicode. Pass unicode through as-is."""
227 if isinstance(s, unicode) or s is None:
228 return s
229 return s.decode('utf-8')
230
231
def make_temp_dir(prefix, root_dir):
  """Creates a new unique temporary directory and returns its path as text.

  Args:
    prefix: prefix of the name of the directory to create.
    root_dir: directory to create the temporary directory in; passed as the
        `dir` argument of tempfile.mkdtemp().

  Returns:
    Path of the newly created directory, as unicode text.
  """
  path = tempfile.mkdtemp(prefix=prefix, dir=root_dir)
  if isinstance(path, bytes):
    # mkdtemp() returned a byte string (always the case on Python 2). Decode
    # it with the file system encoding instead of the implicit ASCII
    # conversion, which fails on any non-ASCII path. The `unicode` builtin is
    # avoided since it does not exist on Python 3.
    path = path.decode(sys.getfilesystemencoding() or 'utf-8')
  return path
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +0000235
236
def change_tree_read_only(rootdir, read_only):
  """Applies the |read_only| policy to the tree rooted at |rootdir|.

  |read_only| is one of 0 (or None), 1 or 2; it controls whether files can be
  modified and whether files can be created or deleted.

  Raises:
    ValueError if |read_only| is not a known flag.
  """
  if read_only == 2:
    # Both files and directories are made read only (directories are not on
    # Windows). Nothing can be modified, created or deleted in the test
    # directory, except on Windows where creating and deleting files still
    # works.
    file_path.make_tree_read_only(rootdir)
    return

  if read_only == 1:
    # Only files are made read only, directories are left alone. Existing
    # files cannot be modified but files can still be created or deleted.
    file_path.make_tree_files_read_only(rootdir)
    return

  if read_only in (0, None):
    # Everything is writeable.
    # TODO(maruel): This is currently dangerous as long as
    # DiskContentAddressedCache.touch() is not yet changed to verify the hash
    # of the content of the files it is looking at, so that if a test
    # modifies an input file, the file must be deleted.
    file_path.make_tree_writeable(rootdir)
    return

  message = 'change_tree_read_only(%s, %s): Unknown flag %s' % (
      rootdir, read_only, read_only)
  raise ValueError(message)
263
264
@contextlib.contextmanager
def set_luci_context_account(account, tmp_dir):
  """Context manager selecting the LUCI_CONTEXT account used by the task.

  Nothing is changed in any of these cases:
  - |account| is None or ''. This is what happens when run_isolated.py is
    called without the '--switch-to-account' flag: if run_isolated.py runs in
    some LUCI_CONTEXT environment, the task simply inherits whatever account
    is already set. Users invoking run_isolated.py explicitly from their code
    may hit this.
  - LUCI_CONTEXT-based auth is not in use.
  - The requested account is already the default one.

  When the requested account is not defined in the context, the default
  account is removed, which switches to non-authenticated access. This is
  what happens for Swarming tasks that don't use 'task' service accounts.
  """
  # LUCI_CONTEXT is only consulted when a switch was actually requested.
  local_auth = luci_context.read('local_auth') if account else None

  # See LUCI_CONTEXT.md for the format of 'local_auth'.
  if not local_auth or local_auth.get('default_account_id') == account:
    # Not switching, not using LUCI_CONTEXT auth, or already set.
    yield
    return

  known_ids = set()
  for entry in local_auth.get('accounts') or []:
    known_ids.add(entry['id'])

  if account not in known_ids:
    logging.warning(
        'Requested LUCI_CONTEXT account %r is not available (have only %r), '
        'disabling authentication', account, sorted(known_ids))
    local_auth.pop('default_account_id', None)
  else:
    logging.info('Switching default LUCI_CONTEXT account to %r', account)
    local_auth['default_account_id'] = account

  with luci_context.write(_tmpdir=tmp_dir, local_auth=local_auth):
    yield
311
312
def process_command(command, out_dir, bot_file):
  """Returns |command| with the parameter tokens of every argument replaced.

  Each argument is passed through replace_parameters().

  Raises:
    ValueError if a parameter is requested in |command| but its value is not
    provided.
  """
  expanded = []
  for token in command:
    expanded.append(replace_parameters(token, out_dir, bot_file))
  return expanded
321
322
def replace_parameters(arg, out_dir, bot_file):
  """Returns |arg| with the parameter tokens substituted by their values.

  ${EXECUTABLE_SUFFIX} is always substituted. ${ISOLATED_OUTDIR} requires
  |out_dir|. ${SWARMING_BOT_FILE} is left untouched, with a warning, when
  |bot_file| is not provided.

  Raises:
    ValueError if a parameter is requested in |arg| but its value is not
    provided.
  """
  arg = arg.replace(EXECUTABLE_SUFFIX_PARAMETER, cipd.EXECUTABLE_SUFFIX)
  substituted_path = False

  if ISOLATED_OUTDIR_PARAMETER in arg:
    if not out_dir:
      raise ValueError(
          'output directory is requested in command or env var, but not '
          'provided; please specify one')
    arg = arg.replace(ISOLATED_OUTDIR_PARAMETER, out_dir)
    substituted_path = True

  if SWARMING_BOT_FILE_PARAMETER in arg:
    if not bot_file:
      logging.warning('SWARMING_BOT_FILE_PARAMETER found in command or env '
                      'var, but no bot_file specified. Leaving parameter '
                      'unchanged.')
    else:
      arg = arg.replace(SWARMING_BOT_FILE_PARAMETER, bot_file)
      substituted_path = True

  if not substituted_path:
    return arg
  # Slashes are converted only when a path parameter was substituted, to
  # support arguments like '${ISOLATED_OUTDIR}/foo/bar'.
  return arg.replace('/', os.sep)
maruela9cfd6f2015-09-15 11:03:15 -0700352
353
Roberto Carrillo71ade6d2018-10-08 22:30:24 +0000354
def get_command_env(tmp_dir, cipd_info, run_dir, env, env_prefixes, out_dir,
                    bot_file):
  """Returns full OS environment to run a command in.

  Starts from a copy of os.environ, applies |env|, puts the directory with the
  cipd binary in front of PATH, exposes the CIPD_CACHE_DIR env var, installs
  all |env_prefixes| and points the temp directory variables to |tmp_dir|.

  Args:
    tmp_dir: temp directory.
    cipd_info: CipdInfo object if cipd client is used, None if not.
    run_dir: The root directory the isolated tree is mapped in.
    env: environment variables to use. A variable with an empty value is
        removed from the environment; other values go through
        replace_parameters().
    env_prefixes: {"ENV_KEY": ['cwd', 'relative', 'paths', 'to', 'prepend']}
    out_dir: Isolated output directory. Required to be != None if any of the
        env vars contain ISOLATED_OUTDIR_PARAMETER.
    bot_file: Required to be != None if any of the env vars contain
        SWARMING_BOT_FILE_PARAMETER.

  Returns:
    dict mapping environment variable names to their values.
  """
  out = os.environ.copy()
  for k, v in env.items():
    if not v:
      out.pop(k, None)
    else:
      out[k] = replace_parameters(v, out_dir, bot_file)

  if cipd_info:
    bin_dir = os.path.dirname(cipd_info.client.binary_path)
    # PATH may legitimately be missing, e.g. when it was removed just above
    # through an empty value in |env|. In that case the cipd directory becomes
    # the only entry instead of raising KeyError.
    path_entries = [_to_str(bin_dir)]
    cur_path = out.get('PATH')
    if cur_path:
      path_entries.append(cur_path)
    out['PATH'] = os.pathsep.join(path_entries)
    out['CIPD_CACHE_DIR'] = _to_str(cipd_info.cache_dir)

  for key, paths in env_prefixes.items():
    assert isinstance(paths, list), paths
    paths = [os.path.normpath(os.path.join(run_dir, p)) for p in paths]
    cur = out.get(key)
    if cur:
      # Keep the pre-existing value, after the prepended paths.
      paths.append(cur)
    out[key] = _to_str(os.path.pathsep.join(paths))

  tmp_dir = _to_str(tmp_dir)
  # pylint: disable=line-too-long
  # * python respects $TMPDIR, $TEMP, and $TMP in this order, regardless of
  #   platform. So $TMPDIR must be set on all platforms.
  #   https://github.com/python/cpython/blob/2.7/Lib/tempfile.py#L155
  out['TMPDIR'] = tmp_dir
  if sys.platform == 'win32':
    # * chromium's base utils uses GetTempPath().
    #    https://cs.chromium.org/chromium/src/base/files/file_util_win.cc?q=GetTempPath
    # * Go uses GetTempPath().
    # * GetTempDir() uses %TMP%, then %TEMP%, then other stuff. So %TMP% must
    #   be set.
    #   https://docs.microsoft.com/en-us/windows/desktop/api/fileapi/nf-fileapi-gettemppathw
    out['TMP'] = tmp_dir
    # https://blogs.msdn.microsoft.com/oldnewthing/20150417-00/?p=44213
    out['TEMP'] = tmp_dir
  elif sys.platform == 'darwin':
    # * Chromium uses a hack on macOS before calling into
    #   NSTemporaryDirectory().
    #   https://cs.chromium.org/chromium/src/base/files/file_util_mac.mm?q=GetTempDir
    #   https://developer.apple.com/documentation/foundation/1409211-nstemporarydirectory
    out['MAC_CHROMIUM_TMPDIR'] = tmp_dir
  else:
    # TMPDIR is specified as the POSIX standard envvar for the temp directory.
    #   http://pubs.opengroup.org/onlinepubs/9699919799/basedefs/V1_chap08.html
    # * mktemp on linux respects $TMPDIR.
    # * Chromium respects $TMPDIR on linux.
    #   https://cs.chromium.org/chromium/src/base/files/file_util_posix.cc?q=GetTempDir
    # * Go uses $TMPDIR.
    #   https://go.googlesource.com/go/+/go1.10.3/src/os/file_unix.go#307
    pass
  return out
vadimsh232f5a82017-01-20 19:23:44 -0800425
426
def run_command(
    command, cwd, env, hard_timeout, grace_period, lower_priority, containment):
  """Runs the command.

  The process is started detached. If it is still running once |hard_timeout|
  expires, or when a stop signal is received, it is sent a termination
  request, then given |grace_period| to exit before being killed.

  Args:
    command: command line to run; passed as-is to subprocess42.Popen().
    cwd: directory to start the process in.
    env: environment of the process. It is not logged.
    hard_timeout: timeout passed to the first wait on the process. A falsy
        value is converted to None (presumably "no timeout"; confirm against
        subprocess42).
    grace_period: timeout passed to the wait that follows the termination
        request. A falsy value is converted to None.
    lower_priority: forwarded to subprocess42.Popen().
    containment: forwarded to subprocess42.Popen().

  Returns:
    tuple(process exit code, bool if had a hard timeout)
  """
  logging.info(
      'run_command(%s, %s, %s, %s, %s, %s)',
      command, cwd, hard_timeout, grace_period, lower_priority, containment)

  exit_code = None
  had_hard_timeout = False
  with tools.Profiler('RunTest'):
    proc = None
    # Used as a mutable flag shared with the nested signal handler: it is
    # non-empty once a stop signal was handled.
    had_signal = []
    try:
      # TODO(maruel): This code is imperfect. It doesn't handle signals well
      # during the download phase and there are short windows where things can
      # go wrong.
      def handler(signum, _frame):
        # Only the first signal received once the process exists is acted
        # upon. It is converted into TimeoutExpired so that it goes through
        # the same termination path as a hard timeout.
        if proc and not had_signal:
          logging.info('Received signal %d', signum)
          had_signal.append(True)
          raise subprocess42.TimeoutExpired(command, None)

      proc = subprocess42.Popen(
          command, cwd=cwd, env=env, detached=True, close_fds=True,
          lower_priority=lower_priority, containment=containment)
      with subprocess42.set_signal_handler(subprocess42.STOP_SIGNALS, handler):
        try:
          exit_code = proc.wait(hard_timeout or None)
        except subprocess42.TimeoutExpired:
          # Either a genuine timeout or the exception raised by handler().
          # It is reported as a hard timeout only when no signal was seen.
          if not had_signal:
            logging.warning('Hard timeout')
            had_hard_timeout = True
          logging.warning('Sending SIGTERM')
          proc.terminate()

      # Ignore signals in grace period. Forcibly give the grace period to the
      # child process.
      if exit_code is None:
        ignore = lambda *_: None
        with subprocess42.set_signal_handler(subprocess42.STOP_SIGNALS, ignore):
          try:
            exit_code = proc.wait(grace_period or None)
          except subprocess42.TimeoutExpired:
            # Now kill for real. The user can distinguish between the
            # following states:
            # - signal but process exited within grace period,
            #   hard_timed_out will be set but the process exit code will be
            #   script provided.
            # - processed exited late, exit code will be -9 on posix.
            logging.warning('Grace exhausted; sending SIGKILL')
            proc.kill()
        logging.info('Waiting for process exit')
        exit_code = proc.wait()
    except OSError:
      # This is not considered to be an internal error. The executable simply
      # does not exist.
      sys.stderr.write(
          '<The executable does not exist, a dependent library is missing or '
          'the command line is too long>\n'
          '<Check for missing .so/.dll in the .isolate or GN file or length of '
          'command line args>\n'
          '<Command: %s>\n' % command)
      if os.environ.get('SWARMING_TASK_ID'):
        # Give an additional hint when running as a swarming task.
        sys.stderr.write(
            '<See the task\'s page for commands to help diagnose this issue '
            'by reproducing the task locally>\n')
      exit_code = 1
  # The mask makes the hexadecimal form of a negative exit code print as an
  # unsigned 32 bits value.
  logging.info(
      'Command finished with exit code %d (%s)',
      exit_code, hex(0xffffffff & exit_code))
  return exit_code, had_hard_timeout
maruela9cfd6f2015-09-15 11:03:15 -0700503
504
def fetch_and_map(isolated_hash, storage, cache, outdir, use_symlinks):
  """Fetches an isolated tree and maps it into |outdir|.

  Returns:
    tuple(bundle, stats)
    - bundle: value returned by isolateserver.fetch_isolated().
    - stats: dict with the 'duration' of the fetch in seconds and the
      base64-encoded large.pack() of 'items_cold' (sorted cache.added) and
      'items_hot' (sorted entries of cache.used left once those of cache.added
      are subtracted).
  """
  started = time.time()
  bundle = isolateserver.fetch_isolated(
      isolated_hash=isolated_hash,
      storage=storage,
      cache=cache,
      outdir=outdir,
      use_symlinks=use_symlinks)

  # Multiset difference: each entry of cache.added cancels one occurrence of
  # the same entry in cache.used.
  used_counts = collections.Counter(cache.used)
  added_counts = collections.Counter(cache.added)
  hot_items = (used_counts - added_counts).elements()

  # The duration is taken before the items are packed.
  stats = {'duration': time.time() - started}
  stats['items_cold'] = base64.b64encode(large.pack(sorted(cache.added)))
  stats['items_hot'] = base64.b64encode(large.pack(sorted(hot_items)))
  return bundle, stats
521
522
def link_outputs_to_outdir(run_dir, out_dir, outputs):
  """Copies or links the named |outputs| into |out_dir| for upload.

  Each entry of |outputs| is a path relative to |run_dir|; it is placed at the
  same relative path under |out_dir|. Does nothing when |outputs| is empty.

  The original documentation states that an error is raised if the file
  already exists in that directory (not verifiable from this function alone).
  """
  if outputs:
    isolateserver.create_directories(out_dir, outputs)
    for rel_path in outputs:
      source = os.path.join(run_dir, rel_path)
      destination = os.path.join(out_dir, rel_path)
      copy_recursively(source, destination)
533
534
def copy_recursively(src, dst):
  """Efficiently copies a file or directory from |src| to |dst|.

  |src| may be a file, a directory, or a symlink to a file or directory.
  All symlinks are replaced with their targets, so the resulting
  directory structure in |dst| will never have any symlinks.

  To increase speed, copy_recursively hardlinks individual files into the
  (newly created) directory structure if possible, unlike Python's
  shutil.copytree().

  Errors are not propagated: an OSError is logged and the item is skipped. A
  chain of symlinks that is too long, which includes cyclic symlinks, is
  logged and skipped as well instead of being followed forever.
  """
  # Same bound as the one Linux applies when resolving a path (see
  # path_resolution(7)). Without a bound, cyclic symlinks would make the loop
  # below spin forever.
  max_symlink_hops = 40
  orig_src = src
  try:
    # Replace symlinks with their final target.
    hops = 0
    while fs.islink(src):
      hops += 1
      if hops > max_symlink_hops:
        logging.warning(
            'Too many levels of symbolic links while resolving %s; skipping',
            orig_src)
        return
      res = fs.readlink(src)
      # A relative link target is relative to the directory holding the link;
      # os.path.join() discards the first part when |res| is absolute.
      src = os.path.join(os.path.dirname(src), res)

    # A |src| that does not exist ends up in the OSError handler below with
    # ENOENT, where a warning is logged. The original comment attributes the
    # exception to fs.isfile() -- NOTE(review): confirm which call raises.
    if fs.isfile(src):
      file_path.link_file(dst, src, file_path.HARDLINK_WITH_FALLBACK)
      return

    if not fs.exists(dst):
      os.makedirs(dst)

    for child in fs.listdir(src):
      copy_recursively(os.path.join(src, child), os.path.join(dst, child))

  except OSError as e:
    if e.errno == errno.ENOENT:
      logging.warning('Path %s does not exist or %s is a broken symlink',
                      src, orig_src)
    else:
      logging.info("Couldn't collect output file %s: %s", src, e)
aludwin0a8e17d2016-10-27 15:57:39 -0700572
573
def upload_then_delete(storage, out_dir, leak_temp_dir):
  """Uploads the content of |out_dir| back, then deletes |out_dir|.

  Args:
    storage: storage the content of |out_dir| is archived to; passed to
        isolateserver.archive_files_to_storage().
    out_dir: directory holding the outputs of the task. It is archived only if
        it exists and is not empty.
    leak_temp_dir: if True, |out_dir| is not deleted.

  Returns:
    tuple(outputs_ref, success, stats)
    - outputs_ref: a dict referring to the results archived back to the
      isolated server, if applicable; None otherwise.
    - success: False if something occurred that means that the task must
      forcibly be considered a failure, e.g. zombie processes were left
      behind.
    - stats: uploading stats.

  Raises:
    isolateserver.Aborted if a SIGTERM was received while uploading.
  """
  # Upload out_dir and generate a .isolated file out of this directory. It is
  # only done if files were written in the directory.
  outputs_ref = None
  cold = []
  hot = []
  start = time.time()

  if fs.isdir(out_dir) and fs.listdir(out_dir):
    with tools.Profiler('ArchiveOutput'):
      try:
        results, f_cold, f_hot = isolateserver.archive_files_to_storage(
            storage, [out_dir], None)
        outputs_ref = {
            # A single directory was archived, so the first value is used.
            # next(iter()) is used because dict.values() cannot be indexed on
            # Python 3.
            'isolated': next(iter(results.values())),
            'isolatedserver': storage.server_ref.url,
            'namespace': storage.server_ref.namespace,
        }
        cold = sorted(i.size for i in f_cold)
        hot = sorted(i.size for i in f_hot)
      except isolateserver.Aborted:
        # This happens when a signal SIGTERM was received while uploading
        # data. There are 2 causes:
        # - The task was too slow and was about to be killed anyway due to
        #   exceeding the hard timeout.
        # - The amount of data uploaded back is very large and took too much
        #   time to archive.
        sys.stderr.write('Received SIGTERM while uploading')
        # Re-raise, so it will be treated as an internal failure.
        raise

  success = False
  try:
    if (not leak_temp_dir and fs.isdir(out_dir) and
        not file_path.rmtree(out_dir)):
      logging.error('Had difficulties removing out_dir %s', out_dir)
    else:
      success = True
  except OSError as e:
    # When this happens, it means there's a process error. |success| stays
    # False.
    logging.exception('Had difficulties removing out_dir %s: %s', out_dir, e)
  stats = {
      'duration': time.time() - start,
      'items_cold': base64.b64encode(large.pack(cold)),
      'items_hot': base64.b64encode(large.pack(hot)),
  }
  return outputs_ref, success, stats
maruela9cfd6f2015-09-15 11:03:15 -0700632
633
def map_and_run(data, constant_run_path):
  """Runs a command with optional isolated input/output.

  Sets up the run, output and temporary directories, installs CIPD packages,
  maps the isolated tree if any, runs the command, then cleans everything up
  and uploads the content of the output directory.

  Arguments:
  - data: TaskData instance.
  - constant_run_path: when true and a root directory is known (data.root_dir,
        or the parent of the isolate cache directory), the run directory is
        ISOLATED_RUN_DIR directly under that root and any pre-existing one is
        removed first. Otherwise the run directory is created with
        make_temp_dir().

  Returns metadata about the result, as a dict. 'internal_failure' is None
  unless run_isolated itself failed; a failure of the task (including a missing
  command or an invalid relative cwd) is reported through 'exit_code' only.
  """
  result = {
    'duration': None,
    'exit_code': None,
    'had_hard_timeout': False,
    'internal_failure': 'run_isolated did not complete properly',
    'stats': {
      #'cipd': {
      #  'duration': 0.,
      #  'get_client_duration': 0.,
      #},
      'isolated': {
        'download': {
          #'duration': 0.,
          'initial_number_items': len(data.isolate_cache),
          'initial_size': data.isolate_cache.total_size,
          #'items_cold': '<large.pack()>',
          #'items_hot': '<large.pack()>',
        },
        #'upload': {
        #  'duration': 0.,
        #  'items_cold': '<large.pack()>',
        #  'items_hot': '<large.pack()>',
        #},
      },
    },
    #'cipd_pins': {
    #  'packages': [
    #    {'package_name': ..., 'version': ..., 'path': ...},
    #    ...
    #  ],
    #  'client_package': {'package_name': ..., 'version': ...},
    #},
    'outputs_ref': None,
    'version': 5,
  }

  if data.root_dir:
    file_path.ensure_tree(data.root_dir, 0o700)
  elif data.isolate_cache.cache_dir:
    data = data._replace(
        root_dir=os.path.dirname(data.isolate_cache.cache_dir))
  # See comment for these constants.
  # If root_dir is not specified, it is not constant.
  # TODO(maruel): This is not obvious. Change this to become an error once we
  # make the constant_run_path an exposed flag.
  if constant_run_path and data.root_dir:
    run_dir = os.path.join(data.root_dir, ISOLATED_RUN_DIR)
    if os.path.isdir(run_dir):
      file_path.rmtree(run_dir)
    os.mkdir(run_dir, 0o700)
  else:
    run_dir = make_temp_dir(ISOLATED_RUN_DIR, data.root_dir)
  # storage should be normally set but don't crash if it is not. This can happen
  # as Swarming task can run without an isolate server.
  out_dir = make_temp_dir(
      ISOLATED_OUT_DIR, data.root_dir) if data.storage else None
  tmp_dir = make_temp_dir(ISOLATED_TMP_DIR, data.root_dir)
  cwd = run_dir
  if data.relative_cwd:
    cwd = os.path.normpath(os.path.join(cwd, data.relative_cwd))
  command = data.command
  try:
    with data.install_packages_fn(run_dir) as cipd_info:
      if cipd_info:
        result['stats']['cipd'] = cipd_info.stats
        result['cipd_pins'] = cipd_info.pins

      if data.isolated_hash:
        isolated_stats = result['stats'].setdefault('isolated', {})
        bundle, stats = fetch_and_map(
            isolated_hash=data.isolated_hash,
            storage=data.storage,
            cache=data.isolate_cache,
            outdir=run_dir,
            use_symlinks=data.use_symlinks)
        isolated_stats['download'].update(stats)
        change_tree_read_only(run_dir, bundle.read_only)
        # Inject the command
        if not command and bundle.command:
          command = bundle.command + data.extra_args
          # Only set the relative directory if the isolated file specified a
          # command, and no raw command was specified.
          if bundle.relative_cwd:
            cwd = os.path.normpath(os.path.join(cwd, bundle.relative_cwd))

      if not command:
        # Handle this as a task failure, not an internal failure. The default
        # 'internal_failure' message must be cleared explicitly since this
        # early return skips the reset done after a normal run.
        sys.stderr.write(
            '<No command was specified!>\n'
            '<Please secify a command when triggering your Swarming task>\n')
        result['exit_code'] = 1
        result['internal_failure'] = None
        return result

      # Compare against run_dir with a trailing separator: a plain prefix
      # check would accept a sibling directory whose name merely starts with
      # run_dir's name (e.g. relative_cwd='../<run dir name>2').
      if cwd != run_dir and not cwd.startswith(os.path.join(run_dir, '')):
        # Handle this as a task failure, not an internal failure. This is a
        # 'last chance' way to gate against directory escape.
        sys.stderr.write('<Relative CWD is outside of run directory!>\n')
        result['exit_code'] = 1
        result['internal_failure'] = None
        return result

      if not os.path.isdir(cwd):
        # Accepts relative_cwd that does not exist.
        os.makedirs(cwd, 0o700)

      # If we have an explicit list of files to return, make sure their
      # directories exist now.
      if data.storage and data.outputs:
        isolateserver.create_directories(run_dir, data.outputs)

      with data.install_named_caches(run_dir):
        sys.stdout.flush()
        start = time.time()
        try:
          # Need to switch the default account before 'get_command_env' call,
          # so it can grab correct value of LUCI_CONTEXT env var.
          with set_luci_context_account(data.switch_to_account, tmp_dir):
            env = get_command_env(
                tmp_dir, cipd_info, run_dir, data.env, data.env_prefix, out_dir,
                data.bot_file)
            command = tools.find_executable(command, env)
            command = process_command(command, out_dir, data.bot_file)
            file_path.ensure_command_has_abs_path(command, cwd)

            result['exit_code'], result['had_hard_timeout'] = run_command(
                command, cwd, env, data.hard_timeout, data.grace_period,
                data.lower_priority, data.containment)
        finally:
          result['duration'] = max(time.time() - start, 0)

    # We successfully ran the command, set internal_failure back to
    # None (even if the command failed, it's not an internal error).
    result['internal_failure'] = None
  except Exception as e:
    # An internal error occurred. Report accordingly so the swarming task will
    # be retried automatically.
    logging.exception('internal failure: %s', e)
    result['internal_failure'] = str(e)
    on_error.report(None)

  # Clean up
  finally:
    try:
      # Try to link files to the output directory, if specified.
      if out_dir:
        link_outputs_to_outdir(run_dir, out_dir, data.outputs)

      success = False
      if data.leak_temp_dir:
        success = True
        logging.warning(
            'Deliberately leaking %s for later examination', run_dir)
      else:
        # On Windows rmtree(run_dir) call below has a synchronization effect: it
        # finishes only when all task child processes terminate (since a running
        # process locks *.exe file). Examine out_dir only after that call
        # completes (since child processes may write to out_dir too and we need
        # to wait for them to finish).
        if fs.isdir(run_dir):
          try:
            success = file_path.rmtree(run_dir)
          except OSError as e:
            logging.error('rmtree(%r) failed: %s', run_dir, e)
            success = False
          if not success:
            sys.stderr.write(OUTLIVING_ZOMBIE_MSG % ('run', data.grace_period))
            if result['exit_code'] == 0:
              result['exit_code'] = 1
        if fs.isdir(tmp_dir):
          try:
            success = file_path.rmtree(tmp_dir)
          except OSError as e:
            logging.error('rmtree(%r) failed: %s', tmp_dir, e)
            success = False
          if not success:
            sys.stderr.write(OUTLIVING_ZOMBIE_MSG % ('temp', data.grace_period))
            if result['exit_code'] == 0:
              result['exit_code'] = 1

      # This deletes out_dir if leak_temp_dir is not set.
      if out_dir:
        isolated_stats = result['stats'].setdefault('isolated', {})
        result['outputs_ref'], success, isolated_stats['upload'] = (
            upload_then_delete(data.storage, out_dir, data.leak_temp_dir))
      if not success and result['exit_code'] == 0:
        result['exit_code'] = 1
    except Exception as e:
      # Swallow any exception in the main finally clause.
      if out_dir:
        logging.exception('Leaking out_dir %s: %s', out_dir, e)
      result['internal_failure'] = str(e)
  return result
Marc-Antoine Ruel2283ad12014-02-09 11:14:57 -0500834
835
def run_tha_test(data, result_json):
  """Runs an executable and records execution metadata.

  The actual work is delegated to map_and_run(); this function only takes care
  of reporting the outcome, either through a json file or through the legacy
  inline marker printed on stdout.

  Arguments:
  - data: TaskData instance.
  - result_json: File path to dump result metadata into. If set, the process
        exit code is always 0 unless an internal error occurred.

  Returns:
    Process exit code that should be used.
  """
  if result_json:
    # Leave a placeholder on disk immediately, so something meaningful exists
    # if this process is killed before the task completes.
    tools.write_json(
        result_json,
        {
          'exit_code': None,
          'had_hard_timeout': False,
          'internal_failure': 'Was terminated before completion',
          'outputs_ref': None,
          'version': 5,
        },
        dense=True)

  result = map_and_run(data, True)
  logging.info('Result:\n%s', tools.format_json(result, dense=True))

  if result_json:
    # We've found tests to delete 'work' when quitting, causing an exception
    # here. Try to recreate the directory if necessary.
    file_path.ensure_tree(os.path.dirname(result_json))
    tools.write_json(result_json, result, dense=True)
    # With a json file, only an internal error makes the exit code non-zero.
    return 1 if result['internal_failure'] else 0

  # No json file: marshall into old-style inline output.
  outputs_ref = result['outputs_ref']
  if outputs_ref:
    # pylint: disable=unsubscriptable-object
    legacy_ref = {
      'hash': outputs_ref['isolated'],
      'namespace': outputs_ref['namespace'],
      'storage': outputs_ref['isolatedserver'],
    }
    sys.stdout.flush()
    print(
        '[run_isolated_out_hack]%s[/run_isolated_out_hack]' %
        tools.format_json(legacy_ref, dense=True))
    sys.stdout.flush()
  return result['exit_code'] or (1 if result['internal_failure'] else 0)
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +0000892
893
# Value yielded by the 'install_client_and_packages' context manager.
CipdInfo = collections.namedtuple(
    'CipdInfo',
    (
      # cipd.CipdClient object.
      'client',
      # Absolute path to bot-global cipd tag and instance cache.
      'cache_dir',
      # Dict with stats to return to the server.
      'stats',
      # Dict with installed cipd pins to return to the server.
      'pins',
    ))
901
902
@contextlib.contextmanager
def noop_install_packages(_run_dir):
  """Stands in for 'install_client_and_packages' when cipd is disabled.

  Nothing is installed and the managed value is None instead of a CipdInfo.
  """
  yield
907
908
def _install_packages(run_dir, cipd_cache_dir, client, packages, timeout):
  """Calls 'cipd ensure' for packages.

  Args:
    run_dir (str): root of installation.
    cipd_cache_dir (str): the directory to use for the cipd package cache.
    client (CipdClient): the cipd client to use
    packages: packages to install, list [(path, package_name, version), ...].
    timeout: max duration in seconds that this function can take.

  Returns: list of pinned packages, in the same order as |packages|. Looks
  like [
    {
      'path': 'subdirectory',
      'package_name': 'resolved/package/name',
      'version': 'deadbeef...',
    },
    ...
  ]
  """
  # Group the requests per install subdirectory, remembering where each one
  # sat in |packages| so the pins can be reported back in the same order.
  requested = collections.defaultdict(list)
  for index, (path, name, version) in enumerate(packages):
    # cipd deals with 'root' as ''
    subdir = '' if path == '.' else path
    requested[subdir].append((name, version, index))

  ensure_spec = {}
  for subdir, entries in requested.items():
    ensure_spec[subdir] = [(name, version) for name, version, _ in entries]

  pins = client.ensure(
      run_dir, ensure_spec, cache_dir=cipd_cache_dir, timeout=timeout)

  package_pins = [None] * len(packages)
  for subdir in sorted(pins):
    entries = requested[subdir]
    # The n-th pin of a subdirectory belongs to the n-th package requested
    # for that subdirectory.
    for position, (name, version) in enumerate(pins[subdir]):
      package_pins[entries[position][2]] = {
        'package_name': name,
        # swarming deals with 'root' as '.'
        'path': subdir or '.',
        'version': version,
      }

  assert None not in package_pins, (packages, pins, package_pins)

  return package_pins
962
963
@contextlib.contextmanager
def install_client_and_packages(
    run_dir, packages, service_url, client_package_name,
    client_version, cache_dir, timeout=None):
  """Bootstraps CIPD client and installs CIPD packages.

  Yields a single CipdInfo object holding the CipdClient, the cipd cache
  directory, the stats and the pins.

  Pins and the CIPD client info are in the form of:
    [
      {
        "path": path, "package_name": package_name, "version": version,
      },
      ...
    ]
  (the CIPD client info is a single dictionary instead of a list)

  such that they correspond 1:1 to all input package arguments from the command
  line. These dictionaries make their way all the way back to swarming, where
  they become the arguments of CipdPackage.

  If 'packages' list is empty, will bootstrap CIPD client, but won't install
  any packages.

  The bootstrapped client (regardless whether 'packages' list is empty or not),
  will be made available to the task via $PATH.

  Args:
    run_dir (str): root of installation.
    packages: packages to install, list [(path, package_name, version), ...].
    service_url (str): CIPD server url, e.g.
      "https://chrome-infra-packages.appspot.com."
    client_package_name (str): CIPD package name of CIPD client.
    client_version (str): Version of CIPD client.
    cache_dir (str): where to keep cache of cipd clients, packages and tags.
    timeout: max duration in seconds that this function can take.
  """
  assert cache_dir

  # A single time budget is shared by the client bootstrap and the package
  # installation.
  remaining_time = tools.sliding_timeout(timeout)
  began = time.time()

  cache_dir = os.path.abspath(cache_dir)
  # Tag and instance caches.
  cipd_cache_dir = os.path.join(cache_dir, 'cache')
  run_dir = os.path.abspath(run_dir)

  client_began = time.time()
  with cipd.get_client(
      service_url, client_package_name, client_version, cache_dir,
      timeout=remaining_time()) as client:
    get_client_duration = time.time() - client_began

    if packages:
      package_pins = _install_packages(
          run_dir, cipd_cache_dir, client, packages, remaining_time())
    else:
      package_pins = []

    file_path.make_tree_files_read_only(run_dir)

    total_duration = time.time() - began
    logging.info(
        'Installing CIPD client and packages took %d seconds', total_duration)

    stats = {
      'duration': total_duration,
      'get_client_duration': get_client_duration,
    }
    pins = {
      'client_package': {
        'package_name': client.package_name,
        'version': client.instance_id,
      },
      'packages': package_pins,
    }
    yield CipdInfo(
        client=client, cache_dir=cipd_cache_dir, stats=stats, pins=pins)
nodirbe642ff2016-06-09 15:51:51 -07001044
1045
def create_option_parser():
  """Creates the option parser for the run_isolated command line.

  Besides the general options, the parser gets the 'Data source', 'Named
  caches', 'Process containment' and 'Debugging' option groups, plus the
  options registered by isolateserver (isolate server and cache), cipd and
  auth.

  Returns:
    The configured logging_utils.OptionParserWithLogging instance.
  """
  parser = logging_utils.OptionParserWithLogging(
      usage='%prog <options> [command to run or extra args]',
      version=__version__,
      log_file=RUN_ISOLATED_LOG_FILE)
  parser.add_option(
      '--clean', action='store_true',
      help='Cleans the cache, trimming it necessary and remove corrupted items '
           'and returns without executing anything; use with -v to know what '
           'was done')
  parser.add_option(
      '--use-symlinks', action='store_true',
      help='Use symlinks instead of hardlinks')
  parser.add_option(
      '--json',
      help='dump output metadata to json file. When used, run_isolated returns '
           'non-zero only on internal failure')
  parser.add_option(
      '--hard-timeout', type='float', help='Enforce hard timeout in execution')
  parser.add_option(
      '--grace-period', type='float',
      help='Grace period between SIGTERM and SIGKILL')
  parser.add_option(
      '--raw-cmd', action='store_true',
      help='Ignore the isolated command, use the one supplied at the command '
           'line')
  parser.add_option(
      '--relative-cwd',
      help='Ignore the isolated \'relative_cwd\' and use this one instead; '
           'requires --raw-cmd')
  parser.add_option(
      '--env', default=[], action='append',
      help='Environment variables to set for the child process')
  parser.add_option(
      '--env-prefix', default=[], action='append',
      help='Specify a VAR=./path/fragment to put in the environment variable '
           'before executing the command. The path fragment must be relative '
           'to the isolated run directory, and must not contain a `..` token. '
           'The path will be made absolute and prepended to the indicated '
           '$VAR using the OS\'s path separator. Multiple items for the same '
           '$VAR will be prepended in order.')
  parser.add_option(
      '--bot-file',
      help='Path to a file describing the state of the host. The content is '
           'defined by on_before_task() in bot_config.')
  parser.add_option(
      '--switch-to-account',
      help='If given, switches LUCI_CONTEXT to given logical service account '
           '(e.g. "task" or "system") before launching the isolated process.')
  parser.add_option(
      '--output', action='append',
      help='Specifies an output to return. If no outputs are specified, all '
           'files located in $(ISOLATED_OUTDIR) will be returned; '
           'otherwise, outputs in both $(ISOLATED_OUTDIR) and those '
           'specified by --output option (there can be multiple) will be '
           'returned. Note that if a file in OUT_DIR has the same path '
           'as an --output option, the --output version will be returned.')
  parser.add_option(
      '-a', '--argsfile',
      # This is actually handled in parse_args; it's included here purely so it
      # can make it into the help text.
      help='Specify a file containing a JSON array of arguments to this '
           'script. If --argsfile is provided, no other argument may be '
           'provided on the command line.')

  group = optparse.OptionGroup(parser, 'Data source')
  group.add_option(
      '-s', '--isolated',
      help='Hash of the .isolated to grab from the isolate server.')
  isolateserver.add_isolate_server_options(group)
  parser.add_option_group(group)

  isolateserver.add_cache_options(parser)

  cipd.add_cipd_options(parser)

  group = optparse.OptionGroup(parser, 'Named caches')
  group.add_option(
      '--named-cache',
      dest='named_caches',
      action='append',
      nargs=3,
      default=[],
      help='A named cache to request. Accepts 3 arguments: name, path, hint. '
           'name identifies the cache, must match regex [a-z0-9_]{1,4096}. '
           'path is a path relative to the run dir where the cache directory '
           'must be put to. '
           'This option can be specified more than once.')
  group.add_option(
      '--named-cache-root', default='named_caches',
      help='Cache root directory. Default=%default')
  parser.add_option_group(group)

  # These options must be registered on the group itself, not on the parser,
  # otherwise the 'Process containment' section of the help text is empty.
  group = optparse.OptionGroup(parser, 'Process containment')
  group.add_option(
      '--lower-priority', action='store_true',
      help='Lowers the child process priority')
  group.add_option(
      '--containment-type', choices=('NONE', 'AUTO', 'JOB_OBJECT'),
      default='NONE',
      help='Type of container to use')
  group.add_option(
      '--limit-processes', type='int', default=0,
      help='Maximum number of active processes in the containment')
  group.add_option(
      '--limit-total-committed-memory', type='int', default=0,
      help='Maximum sum of committed memory in the containment')
  parser.add_option_group(group)

  group = optparse.OptionGroup(parser, 'Debugging')
  group.add_option(
      '--leak-temp-dir',
      action='store_true',
      help='Deliberately leak isolate\'s temp dir for later examination. '
           'Default: %default')
  group.add_option(
      '--root-dir', help='Use a directory instead of a random one')
  parser.add_option_group(group)

  auth.add_auth_options(parser)

  parser.set_defaults(cache='cache', cipd_cache='cipd_cache')
  return parser
1169
1170
def process_named_cache_options(parser, options, time_fn=None):
  """Validates named cache options and creates the matching NamedCache.

  Arguments:
  - parser: option parser, used to report invalid options via parser.error().
  - options: parsed options; named_caches, named_cache_root and min_free_space
        are read.
  - time_fn: forwarded as is to local_caching.NamedCache.

  Returns:
    A local_caching.NamedCache instance rooted at --named-cache-root, or None
    when no named cache root is set.
  """
  cache_root = options.named_cache_root
  if options.named_caches and not cache_root:
    parser.error('--named-cache is specified, but --named-cache-root is empty')

  for name, path, hint in options.named_caches:
    if not CACHE_NAME_RE.match(name):
      parser.error(
          'cache name %r does not match %r' % (name, CACHE_NAME_RE.pattern))
    if not path:
      parser.error('cache path cannot be empty')
    try:
      long(hint)
    except ValueError:
      parser.error('cache hint must be a number')

  if not cache_root:
    return None

  # Make these configurable later if there is use case but for now it's fairly
  # safe values.
  # In practice, a fair chunk of bots are already recycled on a daily schedule
  # so this code doesn't have any effect to them, unless they are preloaded
  # with a really old cache.
  one_tib = 1024*1024*1024*1024
  policies = local_caching.CachePolicies(
      max_cache_size=one_tib,
      min_free_space=options.min_free_space,
      max_items=50,
      max_age_secs=MAX_AGE_SECS)
  root_dir = unicode(os.path.abspath(cache_root))
  return local_caching.NamedCache(root_dir, policies, time_fn=time_fn)
1200
1201
def parse_args(args):
  """Parses the command line, expanding --argsfile when it is used.

  Arguments:
  - args: list of command line arguments, without the program name.

  Returns:
    Tuple (parser, options, args): the option parser that was used, the parsed
    options and the remaining positional arguments.
  """
  # Create a fake mini-parser just to get out the "-a" command. Note that
  # it's not documented here; instead, it's documented in create_option_parser
  # even though that parser will never actually get to parse it. This is
  # because --argsfile is exclusive with all other options and arguments.
  file_argparse = argparse.ArgumentParser(add_help=False)
  file_argparse.add_argument('-a', '--argsfile')
  (file_args, nonfile_args) = file_argparse.parse_known_args(args)
  if file_args.argsfile:
    if nonfile_args:
      # Keep the trailing space: the two literals are concatenated as is.
      file_argparse.error('Can\'t specify --argsfile with '
                          'any other arguments (%s)' % nonfile_args)
    try:
      with open(file_args.argsfile, 'r') as f:
        args = json.load(f)
    except (IOError, OSError, ValueError) as e:
      # Deliberately do not error out here: "args" is left untouched (it still
      # holds the original command line) and is handed to the normal parser
      # below.
      print('Couldn\'t read arguments: %s' % e, file=sys.stderr)

  # Even if we failed to read the args, just call the normal parser now so it
  # handles whatever arguments are left in its usual way.
  parser = create_option_parser()
  options, args = parser.parse_args(args)
  return (parser, options, args)
1228
1229
def _calc_named_cache_hint(named_cache, named_caches):
  """Returns the expected size of the missing named caches.

  Arguments:
  - named_cache: object whose 'available' attribute holds the names of the
        caches already present, or None when named caches are not in use.
  - named_caches: list of (name, path, hint) as given via --named-cache.

  Returns:
    The sum of the strictly positive hints of the requested caches that are
    not already present; 0 if there is none.
  """
  # process_named_cache_options() returns None when there is no named cache
  # root; treat that as "nothing is present" instead of crashing.
  present = named_cache.available if named_cache is not None else ()
  size = 0
  for name, _, hint in named_caches:
    if name not in present:
      hint = long(hint)
      # Zero and negative hints do not add to the expected size.
      if hint > 0:
        size += hint
  return size
1240
1241
def main(args):
  """Parses the command line, prepares the caches and runs the task.

  The steps are, in order:
  - parse `args` via parse_args();
  - create the named cache and isolate cache objects, growing
    --min-free-space by the size hint of the missing named caches;
  - with --clean: trim and clean up the caches, then return;
  - otherwise validate and normalize the remaining options, build a TaskData
    and hand it over to run_tha_test().

  Arguments:
    args: list of command line arguments, without the program name.

  Returns:
    0 once --clean completed, 1 if cipd.Error, local_caching.NamedCacheError
    or local_caching.NoMoreSpace was raised while running the task, otherwise
    whatever run_tha_test() returns.

  Invalid option combinations are reported through parser.error().
  """
  # Warning: when --argsfile is used, the strings are unicode instances, when
  # parsed normally, the strings are str instances.
  (parser, options, args) = parse_args(args)

  if not file_path.enable_symlink():
    logging.warning('Symlink support is not enabled')

  named_cache = process_named_cache_options(parser, options)
  # hint is 0 if there's no named cache.
  hint = _calc_named_cache_hint(named_cache, options.named_caches)
  if hint:
    # Increase the --min-free-space value by the hint, and recreate the
    # NamedCache instance so it gets the updated CachePolicy.
    options.min_free_space += hint
    named_cache = process_named_cache_options(parser, options)

  # TODO(maruel): CIPD caches should be defined at a higher level here too, so
  # they can be cleaned the same way.
  isolate_cache = isolateserver.process_cache_options(options, trim=False)
  caches = []
  if isolate_cache:
    caches.append(isolate_cache)
  if named_cache:
    caches.append(named_cache)
  # The first cache's directory is the root passed to trim_caches(); fall back
  # to the current directory when no cache is configured.
  root = caches[0].cache_dir if caches else unicode(os.getcwd())
  if options.clean:
    if options.isolated:
      parser.error('Can\'t use --isolated with --clean.')
    if options.isolate_server:
      parser.error('Can\'t use --isolate-server with --clean.')
    if options.json:
      parser.error('Can\'t use --json with --clean.')
    if options.named_caches:
      parser.error('Can\'t use --named-cache with --clean.')
    # Trim first, then clean.
    local_caching.trim_caches(
        caches,
        root,
        min_free_space=options.min_free_space,
        max_age_secs=MAX_AGE_SECS)
    for c in caches:
      c.cleanup()
    return 0

  # Trim must still be done for the following case:
  # - named-cache was used
  # - some entries, with a large hint, were missing
  # - --min-free-space was increased accordingly, thus trimming is needed
  # Otherwise, this will have no effect, as bot_main calls run_isolated with
  # --clean after each task.
  if hint:
    logging.info('Additional trimming of %d bytes', hint)
    local_caching.trim_caches(
        caches,
        root,
        min_free_space=options.min_free_space,
        max_age_secs=MAX_AGE_SECS)

  if not options.isolated and not args:
    parser.error('--isolated or command to run is required.')

  auth.process_auth_options(parser, options)

  isolateserver.process_isolate_server_options(
      parser, options, True, False)
  if not options.isolate_server:
    if options.isolated:
      parser.error('--isolated requires --isolate-server')
    if ISOLATED_OUTDIR_PARAMETER in args:
      parser.error(
          '%s in args requires --isolate-server' % ISOLATED_OUTDIR_PARAMETER)

  if options.root_dir:
    options.root_dir = unicode(os.path.abspath(options.root_dir))
  if options.json:
    options.json = unicode(os.path.abspath(options.json))

  # Convert the list of 'KEY=VALUE' strings into a dict.
  if any('=' not in i for i in options.env):
    parser.error(
        '--env required key=value form. value can be skipped to delete '
        'the variable')
  options.env = dict(i.split('=', 1) for i in options.env)

  # Convert the list of 'VAR=./path' strings into a dict of VAR -> [paths],
  # refusing absolute paths and paths resolving outside the current directory.
  prefixes = {}
  cwd = os.path.realpath(os.getcwd())
  for item in options.env_prefix:
    if '=' not in item:
      parser.error(
          '--env-prefix %r is malformed, must be in the form `VAR=./path`'
          % item)
    key, opath = item.split('=', 1)
    if os.path.isabs(opath):
      parser.error('--env-prefix %r path is bad, must be relative.' % opath)
    opath = os.path.normpath(opath)
    # NOTE(review): this is a plain string prefix comparison; a sibling
    # directory whose name merely starts with cwd's name would be accepted.
    if not os.path.realpath(os.path.join(cwd, opath)).startswith(cwd):
      parser.error(
          '--env-prefix %r path is bad, must be relative and not contain `..`.'
          % opath)
    prefixes.setdefault(key, []).append(opath)
  options.env_prefix = prefixes

  cipd.validate_cipd_options(parser, options)

  install_packages_fn = noop_install_packages
  if options.cipd_enabled:
    install_packages_fn = lambda run_dir: install_client_and_packages(
        run_dir, cipd.parse_package_args(options.cipd_packages),
        options.cipd_server, options.cipd_client_package,
        options.cipd_client_version, cache_dir=options.cipd_cache)

  @contextlib.contextmanager
  def install_named_caches(run_dir):
    """Installs the named caches under run_dir, uninstalls them on exit."""
    # WARNING: this function depends on "options" variable defined in the outer
    # function.
    assert unicode(run_dir), repr(run_dir)
    assert os.path.isabs(run_dir), run_dir
    named_caches = [
        (os.path.join(run_dir, unicode(relpath)), name)
        for name, relpath, _ in options.named_caches
    ]
    for path, name in named_caches:
      named_cache.install(path, name)
    try:
      yield
    finally:
      # Uninstall each named cache, returning it to the cache pool. If an
      # uninstall fails for a given cache, it will remain in the task's
      # temporary space, get cleaned up by the Swarming bot, and be lost.
      #
      # If the Swarming bot cannot clean up the cache, it will handle it like
      # any other bot file that could not be removed.
      for path, name in reversed(named_caches):
        try:
          # uninstall() doesn't trim but does call save() implicitly. Trimming
          # *must* be done manually via periodic 'run_isolated.py --clean'.
          named_cache.uninstall(path, name)
        except local_caching.NamedCacheError:
          # The message reads "named cache <name> at <path>".
          logging.exception('Error while removing named cache %r at %r. '
                            'The cache will be lost.', name, path)

  # With --raw-cmd the positional arguments are the command itself, otherwise
  # they are extra arguments for the command found in the .isolated file.
  extra_args = []
  command = []
  if options.raw_cmd:
    command = args
    if options.relative_cwd:
      a = os.path.normpath(os.path.abspath(options.relative_cwd))
      # NOTE(review): plain string prefix comparison, same caveat as for
      # --env-prefix above.
      if not a.startswith(os.getcwd()):
        parser.error(
            '--relative-cwd must not try to escape the working directory')
  else:
    if options.relative_cwd:
      parser.error('--relative-cwd requires --raw-cmd')
    extra_args = args

  # Any value other than 'AUTO' or 'JOB_OBJECT' maps to no containment.
  containment_type = subprocess42.Containment.NONE
  if options.containment_type == 'AUTO':
    containment_type = subprocess42.Containment.AUTO
  if options.containment_type == 'JOB_OBJECT':
    containment_type = subprocess42.Containment.JOB_OBJECT
  containment = subprocess42.Containment(
      containment_type=containment_type,
      limit_processes=options.limit_processes,
      limit_total_committed_memory=options.limit_total_committed_memory)

  data = TaskData(
      command=command,
      relative_cwd=options.relative_cwd,
      extra_args=extra_args,
      isolated_hash=options.isolated,
      storage=None,
      isolate_cache=isolate_cache,
      outputs=options.output,
      install_named_caches=install_named_caches,
      leak_temp_dir=options.leak_temp_dir,
      root_dir=_to_unicode(options.root_dir),
      hard_timeout=options.hard_timeout,
      grace_period=options.grace_period,
      bot_file=options.bot_file,
      switch_to_account=options.switch_to_account,
      install_packages_fn=install_packages_fn,
      use_symlinks=bool(options.use_symlinks),
      env=options.env,
      env_prefix=options.env_prefix,
      lower_priority=bool(options.lower_priority),
      containment=containment)
  try:
    if options.isolate_server:
      server_ref = isolate_storage.ServerRef(
          options.isolate_server, options.namespace)
      storage = isolateserver.get_storage(server_ref)
      with storage:
        # The storage is only known now; TaskData was built with storage=None.
        data = data._replace(storage=storage)
        # Hashing schemes used by |storage| and |isolate_cache| MUST match.
        assert storage.server_ref.hash_algo == server_ref.hash_algo
        return run_tha_test(data, options.json)
    return run_tha_test(data, options.json)
  except (
      cipd.Error,
      local_caching.NamedCacheError,
      local_caching.NoMoreSpace) as ex:
    print(ex.message, file=sys.stderr)
    return 1
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001445
1446
if __name__ == '__main__':
  # Script entry point: the process exits with the value returned by main().
  subprocess42.inhibit_os_error_reporting()
  # Make sure the process always runs with the correct encoding; this is done
  # before sys.argv is read.
  fix_encoding.fix_encoding()
  exit_code = main(sys.argv[1:])
  sys.exit(exit_code)
Marc-Antoine Ruel90c98162013-12-18 15:11:57 -05001451 sys.exit(main(sys.argv[1:]))