blob: 316d03227c1e80cce121bb24baa2e12b9cc95908 [file] [log] [blame]
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001#!/usr/bin/env python
maruelea586f32016-04-05 11:11:33 -07002# Copyright 2012 The LUCI Authors. All rights reserved.
maruelf1f5e2a2016-05-25 17:10:39 -07003# Use of this source code is governed under the Apache License, Version 2.0
4# that can be found in the LICENSE file.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00005
nodir55be77b2016-05-03 09:39:57 -07006"""Runs a command with optional isolated input/output.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00007
run_isolated takes care of setting up a temporary environment, running a
command, and tearing it down.
nodir55be77b2016-05-03 09:39:57 -070010
Marc-Antoine Rueleed2f3a2019-03-14 00:00:40 +000011It handles downloading and uploading isolated files, mapping CIPD packages and
12reusing stateful named caches.
13
14The isolated files, CIPD packages and named caches are kept as a global LRU
15cache.
Marc-Antoine Ruel2283ad12014-02-09 11:14:57 -050016
Roberto Carrillo71ade6d2018-10-08 22:30:24 +000017Any ${EXECUTABLE_SUFFIX} on the command line or the environment variables passed
18with the --env option will be replaced with ".exe" string on Windows and "" on
19other platforms.
nodirbe642ff2016-06-09 15:51:51 -070020
Roberto Carrillo71ade6d2018-10-08 22:30:24 +000021Any ${ISOLATED_OUTDIR} on the command line or the environment variables passed
22with the --env option will be replaced by the location of a temporary directory
23upon execution of the command specified in the .isolated file. All content
24written to this directory will be uploaded upon termination and the .isolated
25file describing this directory will be printed to stdout.
bpastene447c1992016-06-20 15:21:47 -070026
Marc-Antoine Rueleed2f3a2019-03-14 00:00:40 +000027Any ${SWARMING_BOT_FILE} on the command line or the environment variables passed
28with the --env option will be replaced by the value of the --bot-file parameter.
29This file is used by a swarming bot to communicate state of the host to tasks.
30It is written to by the swarming bot's on_before_task() hook in the swarming
31server's custom bot_config.py.
32
Joanna Wang4cec0e42021-08-26 00:48:37 +000033Any ${SWARMING_TASK_ID} on the command line will be replaced by the
34SWARMING_TASK_ID value passed with the --env option.
35
Marc-Antoine Rueleed2f3a2019-03-14 00:00:40 +000036See
37https://chromium.googlesource.com/infra/luci/luci-py.git/+/master/appengine/swarming/doc/Magic-Values.md
38for all the variables.
39
40See
41https://chromium.googlesource.com/infra/luci/luci-py.git/+/master/appengine/swarming/swarming_bot/config/bot_config.py
42for more information about bot_config.py.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000043"""
44
Marc-Antoine Ruelf899c482019-10-10 23:32:06 +000045from __future__ import print_function
46
47__version__ = '1.0.1'
maruel@chromium.orgdedbf492013-09-12 20:42:11 +000048
aludwin7556e0c2016-10-26 08:46:10 -070049import argparse
maruel064c0a32016-04-05 11:47:15 -070050import base64
iannucci96fcccc2016-08-30 15:52:22 -070051import collections
vadimsh232f5a82017-01-20 19:23:44 -080052import contextlib
Ye Kuangfff1e502020-07-13 13:21:57 +000053import distutils
Sadaf Matinkhoo10743a62018-03-29 16:28:58 -040054import errno
aludwin7556e0c2016-10-26 08:46:10 -070055import json
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000056import logging
57import optparse
58import os
Takuto Ikuta5c59a842020-01-24 03:05:24 +000059import platform
Marc-Antoine Ruel8b11dbd2018-05-18 14:31:22 -040060import re
Junji Watanabedc2f89e2021-11-08 08:44:30 +000061import shutil
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000062import sys
63import tempfile
maruel064c0a32016-04-05 11:47:15 -070064import time
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000065
Marc-Antoine Ruel016c7602019-04-02 18:31:13 +000066from utils import tools
67tools.force_local_third_party()
vadimsh@chromium.orga4326472013-08-24 02:05:41 +000068
Marc-Antoine Ruel016c7602019-04-02 18:31:13 +000069# third_party/
70from depot_tools import fix_encoding
71
72# pylint: disable=ungrouped-imports
Takuto Ikutad53d7bd2021-07-16 03:09:33 +000073import DEPS
Marc-Antoine Ruel016c7602019-04-02 18:31:13 +000074import auth
75import cipd
Marc-Antoine Ruel016c7602019-04-02 18:31:13 +000076import local_caching
77from libs import luci_context
Vadim Shtayura6b555c12014-07-23 16:22:18 -070078from utils import file_path
maruel12e30012015-10-09 11:55:35 -070079from utils import fs
Marc-Antoine Ruelf74cffe2015-07-15 15:21:34 -040080from utils import logging_utils
Ye Kuang2dd17442020-04-22 08:45:52 +000081from utils import net
Marc-Antoine Ruelcfb60852014-07-02 15:22:00 -040082from utils import on_error
Marc-Antoine Ruelc44f5722015-01-08 16:10:01 -050083from utils import subprocess42
maruel@chromium.orgdedbf492013-09-12 20:42:11 +000084
vadimsh@chromium.orga4326472013-08-24 02:05:41 +000085
# Magic variables that can be found in the isolate task command line.
# replace_parameters() substitutes each of these tokens when it appears in an
# argument or environment variable value.
ISOLATED_OUTDIR_PARAMETER = '${ISOLATED_OUTDIR}'
EXECUTABLE_SUFFIX_PARAMETER = '${EXECUTABLE_SUFFIX}'
SWARMING_BOT_FILE_PARAMETER = '${SWARMING_BOT_FILE}'
SWARMING_TASK_ID_PARAMETER = '${SWARMING_TASK_ID}'


# The name of the log file to use.
RUN_ISOLATED_LOG_FILE = 'run_isolated.log'


# Use short names for temporary directories. This is driven by Windows, which
# imposes a relatively short maximum path length of 260 characters, often
# referred to as MAX_PATH. It is relatively easy to create files with longer
# path length. A use case is with recursive dependency trees like npm packages.
#
# It is recommended to start the script with a `root_dir` as short as
# possible.
# - ir stands for isolated_run
# - io stands for isolated_out
# - it stands for isolated_tmp
# - ic stands for isolated_client
# - cc stands for cas_client
# - ns stands for nsjail
ISOLATED_RUN_DIR = 'ir'
ISOLATED_OUT_DIR = 'io'
ISOLATED_TMP_DIR = 'it'
ISOLATED_CLIENT_DIR = 'ic'
_CAS_CLIENT_DIR = 'cc'
_NSJAIL_DIR = 'ns'

# TODO(tikuta): take these parameter from luci-config?
# Package paths (presumably CIPD packages, given the ${platform} placeholder)
# and the versions read from the first 'packages' entry of the matching DEPS
# dependency.
_CAS_PACKAGE = 'infra/tools/luci/cas/${platform}'
_LUCI_GO_REVISION = DEPS.deps['luci-go']['packages'][0]['version']
_NSJAIL_PACKAGE = 'infra/3pp/tools/nsjail/${platform}'
_NSJAIL_VERSION = DEPS.deps['nsjail']['packages'][0]['version']

# Keep synced with task_request.py
# Matches names made of 1 to 4096 lowercase letters, digits or underscores.
CACHE_NAME_RE = re.compile(r'^[a-z0-9_]{1,4096}$')

# 2 * 1024**3, i.e. 2 GiB if the value is a byte count (NOTE(review): the unit
# is not visible here; confirm against the code that uses it).
_FREE_SPACE_BUFFER_FOR_CIPD_PACKAGES = 2 * 1024 * 1024 * 1024
Marc-Antoine Ruel8b11dbd2018-05-18 14:31:22 -0400126
marueld928c862017-06-08 08:20:04 -0700127OUTLIVING_ZOMBIE_MSG = """\
128*** Swarming tried multiple times to delete the %s directory and failed ***
129*** Hard failing the task ***
130
131Swarming detected that your testing script ran an executable, which may have
132started a child executable, and the main script returned early, leaving the
133children executables playing around unguided.
134
135You don't want to leave children processes outliving the task on the Swarming
136bot, do you? The Swarming bot doesn't.
137
138How to fix?
139- For any process that starts children processes, make sure all children
140 processes terminated properly before each parent process exits. This is
141 especially important in very deep process trees.
142 - This must be done properly both in normal successful task and in case of
143 task failure. Cleanup is very important.
144- The Swarming bot sends a SIGTERM in case of timeout.
145 - You have %s seconds to comply after the signal was sent to the process
146 before the process is forcibly killed.
147- To achieve not leaking children processes in case of signals on timeout, you
148 MUST handle signals in each executable / python script and propagate them to
149 children processes.
150 - When your test script (python or binary) receives a signal like SIGTERM or
151 CTRL_BREAK_EVENT on Windows), send it to all children processes and wait for
152 them to terminate before quitting.
153
154See
Marc-Antoine Ruelc7243592018-05-24 17:04:04 -0400155https://chromium.googlesource.com/infra/luci/luci-py.git/+/master/appengine/swarming/doc/Bot.md#Graceful-termination_aka-the-SIGTERM-and-SIGKILL-dance
marueld928c862017-06-08 08:20:04 -0700156for more information.
157
158*** May the SIGKILL force be with you ***
159"""
160
161
# Currently hardcoded. Eventually could be exposed as a flag once there's value.
# 3 weeks, expressed in seconds.
MAX_AGE_SECS = 21*24*60*60

# Size threshold related to the `cas` kvs cache, judging by the name; how it
# is applied is not visible in this part of the file.
_CAS_KVS_CACHE_THRESHOLD = 5 * 1024 * 1024 * 1024 # 5 GiB
167
# Immutable record (namedtuple) bundling the settings that describe one task
# run. Each field is documented right above its name.
TaskData = collections.namedtuple(
    'TaskData',
    [
        # List of strings; the command line to use, independent of what was
        # specified in the isolated file.
        'command',
        # Relative directory to start command into.
        'relative_cwd',
        # Digest of the input root on RBE-CAS.
        'cas_digest',
        # Full CAS instance name.
        'cas_instance',
        # List of paths relative to root_dir to put into the output isolated
        # bundle upon task completion (see link_outputs_to_outdir).
        'outputs',
        # Function (run_dir) => context manager that installs named caches into
        # |run_dir|.
        'install_named_caches',
        # If True, the temporary directory will be deliberately leaked for later
        # examination.
        'leak_temp_dir',
        # Path to the directory to use to create the temporary directory. If not
        # specified, a random temporary directory is created.
        'root_dir',
        # Kills the process if it lasts more than this amount of seconds.
        'hard_timeout',
        # Number of seconds to wait between SIGTERM and SIGKILL.
        'grace_period',
        # Path to a file with bot state, used in place of ${SWARMING_BOT_FILE}
        # task command line argument.
        'bot_file',
        # Logical account to switch LUCI_CONTEXT into.
        'switch_to_account',
        # Context manager dir => CipdInfo, see install_client_and_packages.
        'install_packages_fn',
        # Cache directory for `cas` client.
        'cas_cache_dir',
        # Parameters passed to `cas` client.
        'cas_cache_policies',
        # Parameters for kvs file used by `cas` client.
        'cas_kvs',
        # Environment variables to set.
        'env',
        # Environment variables to mutate with relative directories.
        # Example: {"ENV_KEY": ['relative', 'paths', 'to', 'prepend']}
        'env_prefix',
        # Lowers the task process priority.
        'lower_priority',
        # subprocess42.Containment instance. Can be None.
        'containment',
        # Function to trim caches before installing cipd packages and
        # downloading isolated files.
        'trim_caches_fn',
    ])
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -0500222
223
def make_temp_dir(prefix, root_dir):
  """Creates a fresh, uniquely named directory and returns its path.

  The directory is created by tempfile.mkdtemp() inside |root_dir| and its
  name starts with |prefix|.
  """
  new_dir = tempfile.mkdtemp(dir=root_dir, prefix=prefix)
  return new_dir
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +0000227
228
@contextlib.contextmanager
def set_luci_context_account(account, tmp_dir):
  """Context manager that makes |account| the default LUCI_CONTEXT account.

  Nothing is changed in any of these cases:
    - |account| is None or '' (run_isolated.py was called without the
      '--switch-to-account' flag); the task then simply inherits whatever
      account is already set in the surrounding LUCI_CONTEXT, if any.
    - LUCI_CONTEXT-based auth is not in use (no 'local_auth' section).
    - |account| is already the default account.

  Otherwise a new LUCI_CONTEXT is written (using |tmp_dir| for the file) for
  the duration of the block. If the requested account is not among the
  accounts defined in the context, the default account is removed, which
  switches to non-authenticated access. This happens for Swarming tasks that
  don't use 'task' service accounts.
  """
  # Only consult LUCI_CONTEXT when a switch was actually requested.
  local_auth = luci_context.read('local_auth') if account else None

  # See LUCI_CONTEXT.md for the format of 'local_auth'.
  if not local_auth or local_auth.get('default_account_id') == account:
    # Not switching, not using LUCI_CONTEXT auth, or already set.
    yield
    return

  known_ids = set()
  for entry in local_auth.get('accounts') or []:
    known_ids.add(entry['id'])

  if account not in known_ids:
    logging.warning(
        'Requested LUCI_CONTEXT account %r is not available (have only %r), '
        'disabling authentication', account, sorted(known_ids))
    local_auth.pop('default_account_id', None)
  else:
    logging.info('Switching default LUCI_CONTEXT account to %r', account)
    local_auth['default_account_id'] = account

  with luci_context.write(_tmpdir=tmp_dir, local_auth=local_auth):
    yield
275
276
def process_command(command, out_dir, bot_file):
  """Expands the magic parameters in every argument of a command line.

  Each argument is passed through replace_parameters().

  Returns:
    A new list with the expanded arguments, in the same order.

  Raises:
    ValueError if a parameter is requested in |command| but its value is not
    provided.
  """
  expanded = []
  for token in command:
    expanded.append(replace_parameters(token, out_dir, bot_file))
  return expanded
285
286
def replace_parameters(arg, out_dir, bot_file):
  """Expands the magic parameter tokens found in a single string.

  - ${EXECUTABLE_SUFFIX} is always replaced with cipd.EXECUTABLE_SUFFIX.
  - ${ISOLATED_OUTDIR} is replaced with |out_dir|.
  - ${SWARMING_BOT_FILE} is replaced with |bot_file| when one is given;
    otherwise a warning is logged and the token is left as is.
  - ${SWARMING_TASK_ID} is replaced with the SWARMING_TASK_ID environment
    variable of this process when it is set and non-empty.

  Raises:
    ValueError if a parameter is requested in |arg| but its value is not
    provided.
  """
  result = arg.replace(EXECUTABLE_SUFFIX_PARAMETER, cipd.EXECUTABLE_SUFFIX)
  substituted_path = False

  if ISOLATED_OUTDIR_PARAMETER in result:
    if not out_dir:
      raise ValueError(
          'output directory is requested in command or env var, but not '
          'provided; please specify one')
    result = result.replace(ISOLATED_OUTDIR_PARAMETER, out_dir)
    substituted_path = True

  if SWARMING_BOT_FILE_PARAMETER in result:
    if not bot_file:
      logging.warning('SWARMING_BOT_FILE_PARAMETER found in command or env '
                      'var, but no bot_file specified. Leaving parameter '
                      'unchanged.')
    else:
      result = result.replace(SWARMING_BOT_FILE_PARAMETER, bot_file)
      substituted_path = True

  if SWARMING_TASK_ID_PARAMETER in result:
    task_id = os.environ.get('SWARMING_TASK_ID')
    if task_id:
      result = result.replace(SWARMING_TASK_ID_PARAMETER, task_id)

  if not substituted_path:
    return result
  # Slashes are converted only when a path parameter was expanded, because of
  # arguments like '${ISOLATED_OUTDIR}/foo/bar'.
  return result.replace('/', os.sep)
maruela9cfd6f2015-09-15 11:03:15 -0700320
321
def set_temp_dir(env, tmp_dir):
  """Points the temp-directory variables in the |env| dict at |tmp_dir|.

  |env| is modified in place; nothing is returned.
  """
  # pylint: disable=line-too-long
  # * python respects $TMPDIR, $TEMP, and $TMP in this order, regardless of
  #   platform. So $TMPDIR must be set on all platforms.
  #   https://github.com/python/cpython/blob/2.7/Lib/tempfile.py#L155
  # * TMPDIR is also the POSIX standard envvar for the temp directory, which is
  #   all that is needed on platforms other than Windows and macOS.
  #   http://pubs.opengroup.org/onlinepubs/9699919799/basedefs/V1_chap08.html
  #   * mktemp on linux respects $TMPDIR.
  #   * Chromium respects $TMPDIR on linux.
  #     https://cs.chromium.org/chromium/src/base/files/file_util_posix.cc?q=GetTempDir
  #   * Go uses $TMPDIR.
  #     https://go.googlesource.com/go/+/go1.10.3/src/os/file_unix.go#307
  env['TMPDIR'] = tmp_dir

  extra_vars_by_platform = {
      # * chromium's base utils uses GetTempPath().
      #   https://cs.chromium.org/chromium/src/base/files/file_util_win.cc?q=GetTempPath
      # * Go uses GetTempPath().
      # * GetTempDir() uses %TMP%, then %TEMP%, then other stuff. So %TMP% must
      #   be set.
      #   https://docs.microsoft.com/en-us/windows/desktop/api/fileapi/nf-fileapi-gettemppathw
      #   https://blogs.msdn.microsoft.com/oldnewthing/20150417-00/?p=44213
      'win32': ('TMP', 'TEMP'),
      # * Chromium uses an hack on macOS before calling into
      #   NSTemporaryDirectory().
      #   https://cs.chromium.org/chromium/src/base/files/file_util_mac.mm?q=GetTempDir
      #   https://developer.apple.com/documentation/foundation/1409211-nstemporarydirectory
      'darwin': ('MAC_CHROMIUM_TMPDIR',),
  }
  for name in extra_vars_by_platform.get(sys.platform, ()):
    env[name] = tmp_dir
354
Roberto Carrillo71ade6d2018-10-08 22:30:24 +0000355
def get_command_env(tmp_dir, cipd_info, run_dir, env, env_prefixes, out_dir,
                    bot_file):
  """Returns full OS environment to run a command in.

  Sets up TEMP, puts directory with cipd binary in front of PATH, exposes
  CIPD_CACHE_DIR env var, and installs all env_prefixes.

  The result starts as a copy of os.environ. When |cipd_info| is given, the
  resolved package pins are also dumped as JSON to 'cipd_info.json' inside
  |tmp_dir| and that path is exported as
  ISOLATED_RESOLVED_PACKAGE_VERSIONS_FILE.

  Args:
    tmp_dir: temp directory.
    cipd_info: CipdInfo object if cipd client is used, None if not.
    run_dir: The root directory the isolated tree is mapped in.
    env: environment variables to use. A variable with an empty value is
         removed from the resulting environment.
    env_prefixes: {"ENV_KEY": ['cwd', 'relative', 'paths', 'to', 'prepend']}
    out_dir: Isolated output directory. Required to be != None if any of the
        env vars contain ISOLATED_OUTDIR_PARAMETER.
    bot_file: Required to be != None if any of the env vars contain
        SWARMING_BOT_FILE_PARAMETER.

  Returns:
    dict mapping environment variable names to values.
  """
  out = os.environ.copy()
  for k, v in env.items():
    if not v:
      out.pop(k, None)
    else:
      out[k] = replace_parameters(v, out_dir, bot_file)

  if cipd_info:
    bin_dir = os.path.dirname(cipd_info.client.binary_path)
    # PATH may be missing (not inherited, or removed just above through an
    # empty value in |env|). Do not fail in that case, and do not leave a
    # trailing separator behind, which would add an empty PATH entry.
    cur_path = out.get('PATH')
    if cur_path:
      out['PATH'] = '%s%s%s' % (bin_dir, os.pathsep, cur_path)
    else:
      out['PATH'] = bin_dir
    out['CIPD_CACHE_DIR'] = cipd_info.cache_dir
    cipd_info_path = os.path.join(tmp_dir, 'cipd_info.json')
    with open(cipd_info_path, 'w') as f:
      json.dump(cipd_info.pins, f)
    out['ISOLATED_RESOLVED_PACKAGE_VERSIONS_FILE'] = cipd_info_path

  for key, paths in env_prefixes.items():
    assert isinstance(paths, list), paths
    # Prefixes are relative to |run_dir|; the existing value, if any, is kept
    # at the end.
    paths = [os.path.normpath(os.path.join(run_dir, p)) for p in paths]
    cur = out.get(key)
    if cur:
      paths.append(cur)
    out[key] = os.path.pathsep.join(paths)

  set_temp_dir(out, tmp_dir)
  return out
vadimsh232f5a82017-01-20 19:23:44 -0800400
401
def run_command(
    command, cwd, env, hard_timeout, grace_period, lower_priority, containment):
  """Runs the command.

  The command is started through subprocess42.Popen() and waited on for up to
  |hard_timeout|. On timeout, or when one of subprocess42.STOP_SIGNALS is
  received, the process is sent terminate() and given |grace_period| to exit
  before kill() is called.

  Args:
    command: command line to run, passed as is to subprocess42.Popen().
    cwd: working directory to start the command in.
    env: environment for the child process.
    hard_timeout: timeout passed to the first wait(); a falsy value is
        converted to None (presumably meaning "no timeout").
    grace_period: timeout passed to the wait() that follows terminate(); a
        falsy value is converted to None.
    lower_priority: forwarded to subprocess42.Popen().
    containment: forwarded to subprocess42.Popen().

  Returns:
    tuple(process exit code, bool if had a hard timeout)
    The exit code is 1 when an OSError is caught while starting or waiting
    for the process.
  """
  logging.info(
      'run_command(%s, %s, %s, %s, %s, %s)',
      command, cwd, hard_timeout, grace_period, lower_priority, containment)

  exit_code = None
  had_hard_timeout = False
  with tools.Profiler('RunTest'):
    proc = None
    # Used as a mutable flag shared with handler() below; non-empty once a
    # stop signal has been handled.
    had_signal = []
    try:
      # TODO(maruel): This code is imperfect. It doesn't handle well signals
      # during the download phase and there's short windows where things can go
      # wrong.
      def handler(signum, _frame):
        # Only the first signal received after the process was started is
        # acted upon; it is reported as a timeout so the wait() below is
        # interrupted and the termination sequence starts.
        if proc and not had_signal:
          logging.info('Received signal %d', signum)
          had_signal.append(True)
          raise subprocess42.TimeoutExpired(command, None)

      proc = subprocess42.Popen(
          command, cwd=cwd, env=env, detached=True, close_fds=True,
          lower_priority=lower_priority, containment=containment)
      logging.info('Subprocess for command started')
      with subprocess42.set_signal_handler(subprocess42.STOP_SIGNALS, handler):
        try:
          exit_code = proc.wait(hard_timeout or None)
          logging.info("finished with exit code %d after hard_timeout %s",
                       exit_code, hard_timeout)
        except subprocess42.TimeoutExpired:
          # Either a real timeout or a signal (see handler()); only the former
          # is reported as a hard timeout.
          if not had_signal:
            logging.warning('Hard timeout')
            had_hard_timeout = True
          logging.warning('Sending SIGTERM')
          proc.terminate()

      kill_sent = False
      # Ignore signals in grace period. Forcibly give the grace period to the
      # child process.
      if exit_code is None:
        ignore = lambda *_: None
        with subprocess42.set_signal_handler(subprocess42.STOP_SIGNALS, ignore):
          try:
            exit_code = proc.wait(grace_period or None)
            logging.info("finished with exit code %d after grace_period %s",
                         exit_code, grace_period)
          except subprocess42.TimeoutExpired:
            # Now kill for real. The user can distinguish between the
            # following states:
            # - signal but process exited within grace period,
            #   hard_timed_out will be set but the process exit code will be
            #   script provided.
            # - processed exited late, exit code will be -9 on posix.
            logging.warning('Grace exhausted; sending SIGKILL')
            proc.kill()
            kill_sent = True
      logging.info('Waiting for process exit')
      exit_code = proc.wait()

      # the process group / job object may be dangling so if we didn't kill
      # it already, give it a poke now.
      if not kill_sent:
        proc.kill()
    except OSError as e:
      # This is not considered to be an internal error. The executable simply
      # does not exist.
      sys.stderr.write(
          '<The executable does not exist, a dependent library is missing or '
          'the command line is too long>\n'
          '<Check for missing .so/.dll in the .isolate or GN file or length of '
          'command line args>\n'
          '<Command: %s>\n'
          '<Exception: %s>\n' % (command, e))
      if os.environ.get('SWARMING_TASK_ID'):
        # Give an additional hint when running as a swarming task.
        sys.stderr.write(
            '<See the task\'s page for commands to help diagnose this issue '
            'by reproducing the task locally>\n')
      exit_code = 1
  # The exit code is also logged as an unsigned 32 bit hex value.
  logging.info(
      'Command finished with exit code %d (%s)',
      exit_code, hex(0xffffffff & exit_code))
  return exit_code, had_hard_timeout
maruela9cfd6f2015-09-15 11:03:15 -0700491
492
def _run_go_cmd_and_wait(cmd, tmp_dir):
  """
  Starts an external Go command, `isolated` or `cas`, and blocks until it ends.

  This is a generic subprocess launcher, but the waiting and logging logic is
  tailored to Go `isolated` and `cas`: the process is polled every 30 seconds,
  up to 100 times, and a progress line is printed after each poll that times
  out. The child runs with a copy of os.environ whose temp directory variables
  point at |tmp_dir|.

  Returns:
    The subprocess object

  Raises:
    subprocess42.CalledProcessError if the command exits with a non-zero code.
    ValueError if the command is still running after all the polls; it is
    terminated (then killed if needed) before raising.
  """
  printable_cmd = ' '.join(cmd)
  poll_period_sec = 30
  # max timeout = max_polls * poll_period_sec = 50 minutes
  max_polls = 100
  try:
    child_env = os.environ.copy()
    set_temp_dir(child_env, tmp_dir)
    proc = subprocess42.Popen(cmd, env=child_env)

    for attempt in range(1, max_polls + 1):
      # Polling with progress output is to prevent I/O timeout error during
      # setup.
      try:
        retcode = proc.wait(poll_period_sec)
      except subprocess42.TimeoutExpired:
        print('still running (after %d seconds)' % (attempt * poll_period_sec))
        continue
      if retcode != 0:
        raise subprocess42.CalledProcessError(retcode, cmd=printable_cmd)
      return proc

    # Every poll timed out: stop the process, gently first.
    proc.terminate()
    try:
      proc.wait(poll_period_sec)
    except subprocess42.TimeoutExpired:
      logging.exception(
          "failed to terminate? timeout happened after %d seconds",
          poll_period_sec)
      proc.kill()
      proc.wait()
    # Raise unconditionally, because |proc| was forcefully terminated.
    raise ValueError("timedout after %d seconds (cmd=%s)" %
                     (poll_period_sec * max_polls, printable_cmd))
  except Exception:
    logging.exception('Failed to run Go cmd %s', printable_cmd)
    raise
Ye Kuangc0cf9ca2020-07-16 08:56:51 +0000542
543
def _fetch_and_map(cas_client, digest, instance, output_dir, cache_dir,
                   policies, kvs_dir, tmp_dir):
  """
  Downloads a CAS tree into |output_dir| with the cas client and returns
  download stats.

  Runs `<cas_client> download` through _run_go_cmd_and_wait(). When the command
  fails with CalledProcessError and |kvs_dir| is set, |kvs_dir| and
  |output_dir| are deleted and the command is run a second time.

  Returns:
    dict with 'duration' (seconds spent in this function so far) plus
    'items_cold' and 'items_hot', both copied from the stats JSON file dumped
    by the client.
  """
  started_at = time.time()
  stats_fd, stats_path = tempfile.mkstemp(
      prefix='fetch-and-map-result-', suffix='.json')
  os.close(stats_fd)
  scratch_dir = tempfile.mkdtemp(dir=tmp_dir)

  try:
    cmd = [cas_client, 'download', '-digest', digest]
    # flags for cache.
    cmd += [
        '-cache-dir', cache_dir,
        '-cache-max-size', str(policies.max_cache_size),
        '-cache-min-free-space', str(policies.min_free_space),
    ]
    # flags for output.
    cmd += [
        '-dir', output_dir,
        '-dump-stats-json', stats_path,
        '-log-level', 'info',
    ]

    # When RUN_ISOLATED_CAS_ADDRESS is set in test mode,
    # Use it and ignore CAS instance option.
    cas_addr = os.environ.get('RUN_ISOLATED_CAS_ADDRESS')
    cmd += ['-cas-addr', cas_addr] if cas_addr else ['-cas-instance', instance]

    if kvs_dir:
      cmd += ['-kvs-dir', kvs_dir]

    try:
      _run_go_cmd_and_wait(cmd, tmp_dir)
    except subprocess42.CalledProcessError as ex:
      if not kvs_dir:
        raise
      logging.exception('Failed to run cas, removing kvs cache dir and retry.')
      on_error.report("Failed to run cas %s" % ex)
      file_path.rmtree(kvs_dir)
      file_path.rmtree(output_dir)
      _run_go_cmd_and_wait(cmd, tmp_dir)

    with open(stats_path) as stats_file:
      stats = json.load(stats_file)

    elapsed = time.time() - started_at
    return {
        'duration': elapsed,
        'items_cold': stats['items_cold'],
        'items_hot': stats['items_hot'],
    }
  finally:
    # Always drop the temporary stats file and scratch directory.
    fs.remove(stats_path)
    file_path.rmtree(scratch_dir)
Junji Watanabe4b890ef2020-09-16 01:43:27 +0000618
619
def link_outputs_to_outdir(run_dir, out_dir, outputs):
  """Makes every named output available under out_dir so it can be uploaded.

  Each entry of |outputs| is a path relative to |run_dir|; it is copied (or
  linked, see copy_recursively) to the same relative path under |out_dir|.
  Does nothing when |outputs| is empty.

  NOTE(review): the previous docstring stated that an error is raised if the
  file already exists in that directory; that depends on
  file_path.link_file() and copy_recursively() logs OSError instead of
  raising it, so confirm before relying on it.
  """
  if outputs:
    file_path.create_directories(out_dir, outputs)
    for rel_path in outputs:
      source = os.path.join(run_dir, rel_path)
      target = os.path.join(out_dir, rel_path)
      copy_recursively(source, target)
630
631
def copy_recursively(src, dst):
  """Efficiently copies a file or directory from src to dst.

  `src` may be a file, directory, or a symlink to a file or directory.
  All symlinks are replaced with their targets, so the resulting
  directory structure in dst will never have any symlinks.

  To increase speed, copy_recursively hardlinks individual files into the
  (newly created) directory structure if possible, unlike Python's
  shutil.copytree().

  Problems are logged rather than raised: a missing path, a broken symlink or
  a symlink cycle is skipped with a warning, and any other OSError is logged
  at info level.
  """
  orig_src = src
  try:
    # Replace symlinks with their final target. os.path.realpath() gives back
    # a path that is still a symlink when the links form a cycle, so remember
    # every link already followed and give up instead of looping forever.
    followed = set()
    while fs.islink(src):
      if src in followed:
        logging.warning('Symlink cycle detected at %s while resolving %s', src,
                        orig_src)
        return
      followed.add(src)
      res = fs.readlink(src)
      src = os.path.realpath(os.path.join(os.path.dirname(src), res))

    if not fs.exists(src):
      logging.warning('Path %s does not exist or %s is a broken symlink', src,
                      orig_src)
      return

    if fs.isfile(src):
      file_path.link_file(dst, src, file_path.HARDLINK_WITH_FALLBACK)
      return

    # |src| is a directory: mirror it, then recurse into each entry.
    if not fs.exists(dst):
      os.makedirs(dst)

    for child in fs.listdir(src):
      copy_recursively(os.path.join(src, child), os.path.join(dst, child))

  except OSError as e:
    if e.errno == errno.ENOENT:
      logging.warning('Path %s does not exist or %s is a broken symlink',
                      src, orig_src)
    else:
      logging.info("Couldn't collect output file %s: %s", src, e)
aludwin0a8e17d2016-10-27 15:57:39 -0700672
673
def upload_outdir(cas_client, cas_instance, outdir, tmp_dir):
  """Archives the content of |outdir| with `cas archive`, if there is any.

  Arguments:
  - cas_client: first element of the command line, i.e. the cas executable.
  - cas_instance: value passed as -cas-instance, and recorded in the returned
    root. The flag is replaced by -cas-addr when the RUN_ISOLATED_CAS_ADDRESS
    environment variable is set.
  - outdir: directory to archive.
  - tmp_dir: forwarded to _run_go_cmd_and_wait().

  Returns:
    tuple(cas_output_root, stats), or (None, None) when |outdir| is empty.
    - cas_output_root: dict holding 'cas_instance' and the root 'digest'
      ('hash' and 'size_bytes').
    - stats: content of the stats json dumped by the client, plus 'duration'.
  """
  if not fs.listdir(outdir):
    return None, None

  def reserve_temp_file(prefix, suffix):
    # Only the path is needed; the cas client writes the file itself.
    handle, path = tempfile.mkstemp(prefix=prefix, suffix=suffix)
    os.close(handle)
    return path

  digest_path = reserve_temp_file('cas-digest', '.txt')
  stats_json_path = reserve_temp_file('upload-stats', '.json')

  try:
    cmd = [
        cas_client,
        'archive',
        '-paths',
        # Format: <working directory>:<relative path to dir>
        outdir + ':',
        # output
        '-dump-digest',
        digest_path,
        '-dump-stats-json',
        stats_json_path,
    ]

    # When RUN_ISOLATED_CAS_ADDRESS is set in test mode, use it and ignore the
    # CAS instance option.
    cas_addr = os.environ.get('RUN_ISOLATED_CAS_ADDRESS')
    cmd += (['-cas-addr', cas_addr]
            if cas_addr else ['-cas-instance', cas_instance])

    if sys.platform == 'linux':
      # TODO(crbug.com/1243194): remove this after investigation.
      cmd += ['-log-level', 'debug']

    started_at = time.time()
    _run_go_cmd_and_wait(cmd, tmp_dir)

    # The digest file holds `{hash}/{size_bytes}`.
    with open(digest_path) as digest_file:
      digest_hash, digest_size = digest_file.read().split('/')
    cas_output_root = {
        'cas_instance': cas_instance,
        'digest': {
            'hash': digest_hash,
            'size_bytes': int(digest_size)
        }
    }

    with open(stats_json_path) as stats_file:
      stats = json.load(stats_file)
    stats['duration'] = time.time() - started_at

    return cas_output_root, stats
  finally:
    fs.remove(digest_path)
    fs.remove(stats_json_path)
746
747
def map_and_run(data, constant_run_path):
  """Runs a command with optional CAS input/output.

  The function sets up the run, output, temporary and cas client directories
  under data.root_dir, installs packages, optionally downloads the CAS input
  root, runs the command, uploads the output directory and finally removes the
  directories it created (unless data.leak_temp_dir is set).

  Arguments:
  - data: TaskData instance.
  - constant_run_path: when true (and data.root_dir is set), the run directory
    is always <root_dir>/ISOLATED_RUN_DIR and any previous one is wiped;
    otherwise a fresh temporary directory is created.

  Returns metadata about the result, as a dict. 'internal_failure' is None
  only when the whole sequence up to and including the upload completed.
  """

  # TODO(tikuta): take stats from state.json in this case too.
  download_stats = {
      # 'duration': 0.,
      # 'initial_number_items': len(data.cas_cache),
      # 'initial_size': data.cas_cache.total_size,
      # 'items_cold': '<large.pack()>',
      # 'items_hot': '<large.pack()>',
  }

  result = {
      'duration': None,
      'exit_code': None,
      'had_hard_timeout': False,
      'internal_failure': 'run_isolated did not complete properly',
      'stats': {
          'trim_caches': {
              'duration': 0,
          },
          #'cipd': {
          #  'duration': 0.,
          #  'get_client_duration': 0.,
          #},
          'isolated': {
              'download': download_stats,
              #'upload': {
              #  'duration': 0.,
              #  'items_cold': '<large.pack()>',
              #  'items_hot': '<large.pack()>',
              #},
          },
          'named_caches': {
              'install': {
                  'duration': 0,
              },
              'uninstall': {
                  'duration': 0,
              },
          },
          'cleanup': {
              'duration': 0,
          }
      },
      #'cipd_pins': {
      #  'packages': [
      #    {'package_name': ..., 'version': ..., 'path': ...},
      #    ...
      #  ],
      #  'client_package': {'package_name': ..., 'version': ...},
      #},
      'outputs_ref': None,
      'cas_output_root': None,
      'version': 5,
  }

  assert os.path.isabs(data.root_dir), ("data.root_dir is not abs path: %s" %
                                        data.root_dir)
  file_path.ensure_tree(data.root_dir, 0o700)

  # See comment for these constants.
  # TODO(maruel): This is not obvious. Change this to become an error once we
  # make the constant_run_path an exposed flag.
  if constant_run_path and data.root_dir:
    run_dir = os.path.join(data.root_dir, ISOLATED_RUN_DIR)
    if os.path.isdir(run_dir):
      file_path.rmtree(run_dir)
    os.mkdir(run_dir, 0o700)
  else:
    run_dir = make_temp_dir(ISOLATED_RUN_DIR, data.root_dir)

  # out_dir is what gets uploaded after the run; tmp_dir is handed to the
  # helpers that need scratch space.
  out_dir = make_temp_dir(ISOLATED_OUT_DIR, data.root_dir)
  tmp_dir = make_temp_dir(ISOLATED_TMP_DIR, data.root_dir)
  cwd = run_dir
  if data.relative_cwd:
    cwd = os.path.normpath(os.path.join(cwd, data.relative_cwd))
  command = data.command

  cas_client_dir = make_temp_dir(_CAS_CLIENT_DIR, data.root_dir)
  cas_client = os.path.join(cas_client_dir, 'cas' + cipd.EXECUTABLE_SUFFIX)

  data.trim_caches_fn(result['stats']['trim_caches'])

  nsjail_dir = None
  if (sys.platform == "linux" and cipd.get_platform() == "amd64" and
      data.containment.containment_type == subprocess42.Containment.NSJAIL):
    nsjail_dir = make_temp_dir(_NSJAIL_DIR, data.root_dir)

  try:
    with data.install_packages_fn(run_dir, cas_client_dir,
                                  nsjail_dir) as cipd_info:
      if cipd_info:
        result['stats']['cipd'] = cipd_info.stats
        result['cipd_pins'] = cipd_info.pins

      isolated_stats = result['stats'].setdefault('isolated', {})

      if data.cas_digest:
        stats = _fetch_and_map(
            cas_client=cas_client,
            digest=data.cas_digest,
            instance=data.cas_instance,
            output_dir=run_dir,
            cache_dir=data.cas_cache_dir,
            policies=data.cas_cache_policies,
            kvs_dir=data.cas_kvs,
            tmp_dir=tmp_dir)
        isolated_stats['download'].update(stats)

      # NOTE(review): the two early returns below leave
      # result['internal_failure'] at its initial non-None value, although
      # their comments call them task failures - confirm this is intended.
      if not command:
        # Handle this as a task failure, not an internal failure.
        sys.stderr.write(
            '<No command was specified!>\n'
            '<Please secify a command when triggering your Swarming task>\n')
        result['exit_code'] = 1
        return result

      # Compare on a path component boundary: a plain startswith(run_dir)
      # would also accept a sibling directory such as "<run_dir>_other".
      run_root = os.path.normpath(run_dir)
      resolved_cwd = os.path.normpath(cwd)
      if (resolved_cwd != run_root and
          not resolved_cwd.startswith(run_root + os.sep)):
        # Handle this as a task failure, not an internal failure. This is a
        # 'last chance' way to gate against directory escape.
        sys.stderr.write('<Relative CWD is outside of run directory!>\n')
        result['exit_code'] = 1
        return result

      if not os.path.isdir(cwd):
        # Accepts relative_cwd that does not exist.
        os.makedirs(cwd, 0o700)

      # If we have an explicit list of files to return, make sure their
      # directories exist now.
      if data.outputs:
        file_path.create_directories(run_dir, data.outputs)

      with data.install_named_caches(run_dir, result['stats']['named_caches']):
        sys.stdout.flush()
        start = time.time()
        try:
          # Need to switch the default account before 'get_command_env' call,
          # so it can grab correct value of LUCI_CONTEXT env var.
          with set_luci_context_account(data.switch_to_account, tmp_dir):
            env = get_command_env(
                tmp_dir, cipd_info, run_dir, data.env, data.env_prefix, out_dir,
                data.bot_file)
            command = tools.find_executable(command, env)
            command = process_command(command, out_dir, data.bot_file)
            file_path.ensure_command_has_abs_path(command, cwd)

            result['exit_code'], result['had_hard_timeout'] = run_command(
                command, cwd, env, data.hard_timeout, data.grace_period,
                data.lower_priority, data.containment)
        finally:
          # Recorded even when running the command raised.
          result['duration'] = max(time.time() - start, 0)

    # Try to link files to the output directory, if specified.
    link_outputs_to_outdir(run_dir, out_dir, data.outputs)
    isolated_stats = result['stats'].setdefault('isolated', {})
    result['cas_output_root'], upload_stats = upload_outdir(
        cas_client, data.cas_instance, out_dir, tmp_dir)
    if upload_stats:
      isolated_stats['upload'] = upload_stats

    # We successfully ran the command, set internal_failure back to
    # None (even if the command failed, it's not an internal error).
    result['internal_failure'] = None
  except Exception as e:
    # An internal error occurred. Report accordingly so the swarming task will
    # be retried automatically.
    logging.exception('internal failure: %s', e)
    result['internal_failure'] = str(e)
    on_error.report(None)

  # Clean up
  finally:
    try:
      cleanup_start = time.time()
      success = True
      if data.leak_temp_dir:
        logging.warning(
            'Deliberately leaking %s for later examination', run_dir)
      else:
        # On Windows rmtree(run_dir) call above has a synchronization effect: it
        # finishes only when all task child processes terminate (since a running
        # process locks *.exe file). Examine out_dir only after that call
        # completes (since child processes may write to out_dir too and we need
        # to wait for them to finish).
        dirs_to_remove = [run_dir, tmp_dir, cas_client_dir]
        if out_dir:
          dirs_to_remove.append(out_dir)
        for directory in dirs_to_remove:
          if not fs.isdir(directory):
            continue
          start = time.time()
          try:
            file_path.rmtree(directory)
          except OSError as e:
            logging.error('rmtree(%r) failed: %s', directory, e)
            success = False
          finally:
            logging.info('Cleanup: rmtree(%r) took %d seconds', directory,
                         time.time() - start)
          if not success:
            # A directory could not be removed: dump the process list to
            # stderr and make sure the task is not reported as successful.
            sys.stderr.write(
                OUTLIVING_ZOMBIE_MSG % (directory, data.grace_period))
            if sys.platform == 'win32':
              subprocess42.check_call(['tasklist.exe', '/V'], stdout=sys.stderr)
            else:
              subprocess42.check_call(['ps', 'axu'], stdout=sys.stderr)
            if result['exit_code'] == 0:
              result['exit_code'] = 1

      if not success and result['exit_code'] == 0:
        result['exit_code'] = 1
    except Exception as e:
      # Swallow any exception in the main finally clause.
      if out_dir:
        logging.exception('Leaking out_dir %s: %s', out_dir, e)
      result['internal_failure'] = str(e)
      on_error.report(None)
    finally:
      cleanup_duration = time.time() - cleanup_start
      result['stats']['cleanup']['duration'] = cleanup_duration
      logging.info('Cleanup: removing directories took %d seconds',
                   cleanup_duration)
  return result
Marc-Antoine Ruel2283ad12014-02-09 11:14:57 -0500983
984
def run_tha_test(data, result_json):
  """Runs the task described by |data| and reports its execution metadata.

  The actual work is delegated to map_and_run(data, True). When |result_json|
  is set, a placeholder result is written to it before the run starts and the
  real result replaces it afterwards.

  Arguments:
  - data: TaskData instance.
  - result_json: File path to dump result metadata into. If set, the process
                 exit code is always 0 unless an internal error occurred.

  Returns:
    Process exit code that should be used.
  """
  if result_json:
    # Write a json output file right away in case we get killed.
    placeholder = {
        'exit_code': None,
        'had_hard_timeout': False,
        'internal_failure': 'Was terminated before completion',
        'outputs_ref': None,
        'cas_output_root': None,
        'version': 5,
    }
    tools.write_json(result_json, placeholder, dense=True)

  # run_isolated exit code. Depends on if result_json is used or not.
  result = map_and_run(data, True)
  logging.info('Result:\n%s', tools.format_json(result, dense=True))

  if result_json:
    # We've found tests to delete 'work' when quitting, causing an exception
    # here. Try to recreate the directory if necessary.
    file_path.ensure_tree(os.path.dirname(result_json))
    tools.write_json(result_json, result, dense=True)
    # Only return 1 if there was an internal error.
    return int(bool(result['internal_failure']))

  # Marshall into old-style inline output.
  outputs_ref = result['outputs_ref']
  if outputs_ref:
    # pylint: disable=unsubscriptable-object
    inline_output = {
        'hash': outputs_ref['isolated'],
        'namespace': outputs_ref['namespace'],
        'storage': outputs_ref['isolatedserver'],
    }
    sys.stdout.flush()
    print('[run_isolated_out_hack]%s[/run_isolated_out_hack]' %
          tools.format_json(inline_output, dense=True))
    sys.stdout.flush()
  return result['exit_code'] or int(bool(result['internal_failure']))
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001041
1042
# Yielded by 'install_client_and_packages'.
CipdInfo = collections.namedtuple(
    'CipdInfo',
    (
        # cipd.CipdClient object
        'client',
        # absolute path to bot-global cipd tag and instance cache
        'cache_dir',
        # dict with stats to return to the server
        'stats',
        # dict with installed cipd pins to return to the server
        'pins',
    ))
1050
1051
@contextlib.contextmanager
def copy_local_packages(_run_dir, cas_dir, _nsjail_dir):
  """Copies the cas client from $LUCI_GO_CLIENT_DIR into |cas_dir|.

  Takes the same positional arguments that map_and_run() passes to
  data.install_packages_fn; |_run_dir| and |_nsjail_dir| are ignored. Yields
  None.
  """
  go_client_dir = os.environ.get('LUCI_GO_CLIENT_DIR')
  assert go_client_dir, ('Please set LUCI_GO_CLIENT_DIR env var to install CIPD'
                         ' packages locally.')
  local_cas = os.path.join(go_client_dir, 'cas' + cipd.EXECUTABLE_SUFFIX)
  installed_cas = os.path.join(cas_dir, 'cas' + cipd.EXECUTABLE_SUFFIX)
  shutil.copy2(local_cas, installed_cas)
  yield None
1061
1062
Takuto Ikuta2efc7792019-11-27 14:33:34 +00001063def _install_packages(run_dir, cipd_cache_dir, client, packages):
iannuccib58d10d2017-03-18 02:00:25 -07001064 """Calls 'cipd ensure' for packages.
1065
1066 Args:
1067 run_dir (str): root of installation.
1068 cipd_cache_dir (str): the directory to use for the cipd package cache.
1069 client (CipdClient): the cipd client to use
1070 packages: packages to install, list [(path, package_name, version), ...].
iannuccib58d10d2017-03-18 02:00:25 -07001071
1072 Returns: list of pinned packages. Looks like [
1073 {
1074 'path': 'subdirectory',
1075 'package_name': 'resolved/package/name',
1076 'version': 'deadbeef...',
1077 },
1078 ...
1079 ]
1080 """
1081 package_pins = [None]*len(packages)
1082 def insert_pin(path, name, version, idx):
1083 package_pins[idx] = {
1084 'package_name': name,
1085 # swarming deals with 'root' as '.'
1086 'path': path or '.',
1087 'version': version,
1088 }
1089
1090 by_path = collections.defaultdict(list)
1091 for i, (path, name, version) in enumerate(packages):
1092 # cipd deals with 'root' as ''
1093 if path == '.':
1094 path = ''
1095 by_path[path].append((name, version, i))
1096
1097 pins = client.ensure(
Takuto Ikuta2efc7792019-11-27 14:33:34 +00001098 run_dir,
1099 {
1100 subdir: [(name, vers) for name, vers, _ in pkgs
1101 ] for subdir, pkgs in by_path.items()
1102 },
1103 cache_dir=cipd_cache_dir,
iannuccib58d10d2017-03-18 02:00:25 -07001104 )
1105
Marc-Antoine Ruel04903a32019-10-09 21:09:25 +00001106 for subdir, pin_list in sorted(pins.items()):
iannuccib58d10d2017-03-18 02:00:25 -07001107 this_subdir = by_path[subdir]
1108 for i, (name, version) in enumerate(pin_list):
1109 insert_pin(subdir, name, version, this_subdir[i][2])
1110
Robert Iannucci461b30d2017-12-13 11:34:03 -08001111 assert None not in package_pins, (packages, pins, package_pins)
iannuccib58d10d2017-03-18 02:00:25 -07001112
1113 return package_pins
1114
1115
@contextlib.contextmanager
def install_client_and_packages(run_dir, packages, service_url,
                                client_package_name, client_version, cache_dir,
                                cas_dir, nsjail_dir):
  """Bootstraps CIPD client and installs CIPD packages.

  Yields CipdClient, stats, client info and pins (as single CipdInfo object).

  Pins and the CIPD client info are in the form of:
    [
      {
        "path": path, "package_name": package_name, "version": version,
      },
      ...
    ]
  (the CIPD client info is a single dictionary instead of a list)

  such that they correspond 1:1 to all input package arguments from the command
  line. These dictionaries make their way all the way back to swarming, where
  they become the arguments of CipdPackage.

  If 'packages' list is empty, will bootstrap CIPD client, but won't install
  any packages.

  The bootstrapped client (regardless whether 'packages' list is empty or not),
  will be made available to the task via $PATH.

  The cas client is always installed into |cas_dir|; nsjail is installed into
  |nsjail_dir| only when that argument is not None.

  Args:
    run_dir (str): root of installation.
    packages: packages to install, list [(path, package_name, version), ...].
    service_url (str): CIPD server url, e.g.
      "https://chrome-infra-packages.appspot.com."
    client_package_name (str): CIPD package name of CIPD client.
    client_version (str): Version of CIPD client.
    cache_dir (str): where to keep cache of cipd clients, packages and tags.
    cas_dir (str): where to download cas client.
    nsjail_dir (str): where to download nsjail. If set to None, nsjail is not
      downloaded.
  """
  assert cache_dir

  started_at = time.time()

  cache_dir = os.path.abspath(cache_dir)
  # tag and instance caches
  cipd_cache_dir = os.path.join(cache_dir, 'cache')
  run_dir = os.path.abspath(run_dir)
  if not packages:
    packages = []

  client_started_at = time.time()
  client_manager = cipd.get_client(cache_dir, service_url, client_package_name,
                                   client_version)

  with client_manager as client:
    get_client_duration = time.time() - client_started_at

    if packages:
      package_pins = _install_packages(run_dir, cipd_cache_dir, client,
                                       packages)
    else:
      package_pins = []

    # Install cas client to |cas_dir|.
    cas_request = [('', _CAS_PACKAGE, _LUCI_GO_REVISION)]
    _install_packages(cas_dir, cipd_cache_dir, client, cas_request)

    # Install nsjail to |nsjail_dir|.
    if nsjail_dir is not None:
      nsjail_request = [('', _NSJAIL_PACKAGE, _NSJAIL_VERSION)]
      _install_packages(nsjail_dir, cipd_cache_dir, client, nsjail_request)

    file_path.make_tree_files_read_only(run_dir)

    total_duration = time.time() - started_at
    logging.info('Installing CIPD client and packages took %d seconds',
                 total_duration)

    stats = {
        'duration': total_duration,
        'get_client_duration': get_client_duration,
    }
    pins = {
        'client_package': {
            'package_name': client.package_name,
            'version': client.instance_id,
        },
        'packages': package_pins,
    }
    yield CipdInfo(
        client=client, cache_dir=cipd_cache_dir, stats=stats, pins=pins)
nodirbe642ff2016-06-09 15:51:51 -07001205
1206
1207def create_option_parser():
Marc-Antoine Ruelf74cffe2015-07-15 15:21:34 -04001208 parser = logging_utils.OptionParserWithLogging(
nodir55be77b2016-05-03 09:39:57 -07001209 usage='%prog <options> [command to run or extra args]',
maruel@chromium.orgdedbf492013-09-12 20:42:11 +00001210 version=__version__,
1211 log_file=RUN_ISOLATED_LOG_FILE)
maruela9cfd6f2015-09-15 11:03:15 -07001212 parser.add_option(
Junji Watanabe38b28b02020-04-23 10:23:30 +00001213 '--clean',
1214 action='store_true',
maruel36a963d2016-04-08 17:15:49 -07001215 help='Cleans the cache, trimming it necessary and remove corrupted items '
Junji Watanabe38b28b02020-04-23 10:23:30 +00001216 'and returns without executing anything; use with -v to know what '
1217 'was done')
maruel36a963d2016-04-08 17:15:49 -07001218 parser.add_option(
maruela9cfd6f2015-09-15 11:03:15 -07001219 '--json',
1220 help='dump output metadata to json file. When used, run_isolated returns '
Junji Watanabe38b28b02020-04-23 10:23:30 +00001221 'non-zero only on internal failure')
maruel6be7f9e2015-10-01 12:25:30 -07001222 parser.add_option(
maruel5c9e47b2015-12-18 13:02:30 -08001223 '--hard-timeout', type='float', help='Enforce hard timeout in execution')
maruel6be7f9e2015-10-01 12:25:30 -07001224 parser.add_option(
Junji Watanabe38b28b02020-04-23 10:23:30 +00001225 '--grace-period',
1226 type='float',
maruel6be7f9e2015-10-01 12:25:30 -07001227 help='Grace period between SIGTERM and SIGKILL')
bpastene3ae09522016-06-10 17:12:59 -07001228 parser.add_option(
Marc-Antoine Ruel95068cf2017-12-07 21:35:05 -05001229 '--relative-cwd',
Takuto Ikuta18ca29a2020-12-04 07:34:20 +00001230 help='Ignore the isolated \'relative_cwd\' and use this one instead')
Marc-Antoine Ruel95068cf2017-12-07 21:35:05 -05001231 parser.add_option(
Junji Watanabe38b28b02020-04-23 10:23:30 +00001232 '--env',
1233 default=[],
1234 action='append',
Marc-Antoine Ruel19dd8872017-11-28 18:33:39 -05001235 help='Environment variables to set for the child process')
1236 parser.add_option(
Junji Watanabe38b28b02020-04-23 10:23:30 +00001237 '--env-prefix',
1238 default=[],
1239 action='append',
Robert Iannuccibf5f84c2017-11-22 12:56:50 -08001240 help='Specify a VAR=./path/fragment to put in the environment variable '
Junji Watanabe38b28b02020-04-23 10:23:30 +00001241 'before executing the command. The path fragment must be relative '
1242 'to the isolated run directory, and must not contain a `..` token. '
1243 'The path will be made absolute and prepended to the indicated '
1244 '$VAR using the OS\'s path separator. Multiple items for the same '
1245 '$VAR will be prepended in order.')
Robert Iannuccibf5f84c2017-11-22 12:56:50 -08001246 parser.add_option(
bpastene3ae09522016-06-10 17:12:59 -07001247 '--bot-file',
1248 help='Path to a file describing the state of the host. The content is '
Junji Watanabe38b28b02020-04-23 10:23:30 +00001249 'defined by on_before_task() in bot_config.')
aludwin7556e0c2016-10-26 08:46:10 -07001250 parser.add_option(
vadimsh9c54b2c2017-07-25 14:08:29 -07001251 '--switch-to-account',
1252 help='If given, switches LUCI_CONTEXT to given logical service account '
Junji Watanabe38b28b02020-04-23 10:23:30 +00001253 '(e.g. "task" or "system") before launching the isolated process.')
vadimsh9c54b2c2017-07-25 14:08:29 -07001254 parser.add_option(
Junji Watanabe38b28b02020-04-23 10:23:30 +00001255 '--output',
1256 action='append',
aludwin0a8e17d2016-10-27 15:57:39 -07001257 help='Specifies an output to return. If no outputs are specified, all '
Junji Watanabe38b28b02020-04-23 10:23:30 +00001258 'files located in $(ISOLATED_OUTDIR) will be returned; '
1259 'otherwise, outputs in both $(ISOLATED_OUTDIR) and those '
1260 'specified by --output option (there can be multiple) will be '
1261 'returned. Note that if a file in OUT_DIR has the same path '
1262 'as an --output option, the --output version will be returned.')
aludwin0a8e17d2016-10-27 15:57:39 -07001263 parser.add_option(
Junji Watanabe38b28b02020-04-23 10:23:30 +00001264 '-a',
1265 '--argsfile',
aludwin7556e0c2016-10-26 08:46:10 -07001266 # This is actually handled in parse_args; it's included here purely so it
1267 # can make it into the help text.
1268 help='Specify a file containing a JSON array of arguments to this '
Junji Watanabe38b28b02020-04-23 10:23:30 +00001269 'script. If --argsfile is provided, no other argument may be '
1270 'provided on the command line.')
Takuto Ikutad4be2f12020-05-12 02:15:25 +00001271 parser.add_option(
1272 '--report-on-exception',
1273 action='store_true',
1274 help='Whether report exception during execution to isolate server. '
1275 'This flag should only be used in swarming bot.')
Marc-Antoine Ruel1b65f4e2019-05-02 21:56:58 +00001276
Junji Watanabe4b890ef2020-09-16 01:43:27 +00001277 group = optparse.OptionGroup(parser,
1278 'Data source - Content Addressed Storage')
Junji Watanabe54925c32020-09-08 00:56:18 +00001279 group.add_option(
1280 '--cas-instance', help='Full CAS instance name for input/output files.')
1281 group.add_option(
1282 '--cas-digest',
1283 help='Digest of the input root on RBE-CAS. The format is '
1284 '`{hash}/{size_bytes}`.')
Marc-Antoine Ruel1b65f4e2019-05-02 21:56:58 +00001285 parser.add_option_group(group)
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001286
Junji Watanabeb03450b2020-09-25 05:09:27 +00001287 # Cache options.
Junji Watanabeb03450b2020-09-25 05:09:27 +00001288 add_cas_cache_options(parser)
nodirbe642ff2016-06-09 15:51:51 -07001289
1290 cipd.add_cipd_options(parser)
Marc-Antoine Ruel8b11dbd2018-05-18 14:31:22 -04001291
1292 group = optparse.OptionGroup(parser, 'Named caches')
1293 group.add_option(
1294 '--named-cache',
1295 dest='named_caches',
1296 action='append',
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001297 nargs=3,
Marc-Antoine Ruel8b11dbd2018-05-18 14:31:22 -04001298 default=[],
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001299 help='A named cache to request. Accepts 3 arguments: name, path, hint. '
Junji Watanabe38b28b02020-04-23 10:23:30 +00001300 'name identifies the cache, must match regex [a-z0-9_]{1,4096}. '
1301 'path is a path relative to the run dir where the cache directory '
1302 'must be put to. '
1303 'This option can be specified more than once.')
Marc-Antoine Ruel8b11dbd2018-05-18 14:31:22 -04001304 group.add_option(
Junji Watanabe38b28b02020-04-23 10:23:30 +00001305 '--named-cache-root',
1306 default='named_caches',
Marc-Antoine Ruel8b11dbd2018-05-18 14:31:22 -04001307 help='Cache root directory. Default=%default')
1308 parser.add_option_group(group)
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001309
Marc-Antoine Ruel1b65f4e2019-05-02 21:56:58 +00001310 group = optparse.OptionGroup(parser, 'Process containment')
1311 parser.add_option(
1312 '--lower-priority', action='store_true',
1313 help='Lowers the child process priority')
1314 parser.add_option(
Junji Watanabe38b28b02020-04-23 10:23:30 +00001315 '--containment-type',
Anirudh Mathukumilli92d57b62021-08-04 23:21:57 +00001316 choices=('NONE', 'AUTO', 'JOB_OBJECT', 'NSJAIL'),
Marc-Antoine Ruel1b65f4e2019-05-02 21:56:58 +00001317 default='NONE',
1318 help='Type of container to use')
1319 parser.add_option(
Junji Watanabe38b28b02020-04-23 10:23:30 +00001320 '--limit-processes',
1321 type='int',
1322 default=0,
Marc-Antoine Ruel1b65f4e2019-05-02 21:56:58 +00001323 help='Maximum number of active processes in the containment')
1324 parser.add_option(
Junji Watanabe38b28b02020-04-23 10:23:30 +00001325 '--limit-total-committed-memory',
1326 type='int',
1327 default=0,
Marc-Antoine Ruel1b65f4e2019-05-02 21:56:58 +00001328 help='Maximum sum of committed memory in the containment')
1329 parser.add_option_group(group)
1330
1331 group = optparse.OptionGroup(parser, 'Debugging')
1332 group.add_option(
Kenneth Russell61d42352014-09-15 11:41:16 -07001333 '--leak-temp-dir',
1334 action='store_true',
nodirbe642ff2016-06-09 15:51:51 -07001335 help='Deliberately leak isolate\'s temp dir for later examination. '
Junji Watanabe38b28b02020-04-23 10:23:30 +00001336 'Default: %default')
1337 group.add_option('--root-dir', help='Use a directory instead of a random one')
Marc-Antoine Ruel1b65f4e2019-05-02 21:56:58 +00001338 parser.add_option_group(group)
Kenneth Russell61d42352014-09-15 11:41:16 -07001339
Vadim Shtayurae34e13a2014-02-02 11:23:26 -08001340 auth.add_auth_options(parser)
nodirbe642ff2016-06-09 15:51:51 -07001341
Ye Kuang1d096cb2020-06-26 08:38:21 +00001342 parser.set_defaults(cache='cache')
nodirbe642ff2016-06-09 15:51:51 -07001343 return parser
1344
1345
def add_cas_cache_options(parser):
  """Adds the 'CAS cache management' option group to |parser|.

  The group carries --cas-cache, --kvs-dir, --max-cache-size and
  --min-free-space, registered in that order.
  """
  gib = 1024 * 1024 * 1024
  # (flag, keyword arguments) pairs, in the order they show up in --help.
  option_specs = (
      ('--cas-cache', {
          'metavar': 'DIR',
          'default': 'cas-cache',
          'help': ('Directory to keep a local cache of the files. '
                   'Accelerates download by reusing already downloaded '
                   'files. Default=%default'),
      }),
      ('--kvs-dir', {
          'default': '',
          'help': 'CAS cache dir using kvs for small files. Default=%default',
      }),
      ('--max-cache-size', {
          'type': 'int',
          'metavar': 'NNN',
          'default': 50 * gib,
          'help': ('Trim if the cache gets larger than this value, '
                   'default=%default'),
      }),
      ('--min-free-space', {
          'type': 'int',
          'metavar': 'NNN',
          'default': 2 * gib,
          'help': ('Trim if disk free space becomes lower than this value, '
                   'default=%default'),
      }),
  )
  cas_group = optparse.OptionGroup(parser, 'CAS cache management')
  for flag, kwargs in option_specs:
    cas_group.add_option(flag, **kwargs)
  parser.add_option_group(cas_group)
1372
1373
def process_cas_cache_options(options):
  """Builds the content addressed cache described by |options|.

  Returns:
    A local_caching.DiskContentAddressedCache rooted at the absolute path of
    --cas-cache (created with trim=False), or a
    local_caching.MemoryContentAddressedCache when --cas-cache is empty.
  """
  if not options.cas_cache:
    return local_caching.MemoryContentAddressedCache()

  cache_policies = local_caching.CachePolicies(
      max_cache_size=options.max_cache_size,
      min_free_space=options.min_free_space,
      # max_items isn't used for CAS cache for now.
      max_items=None,
      max_age_secs=MAX_AGE_SECS)
  cache_dir = os.path.abspath(options.cas_cache)
  return local_caching.DiskContentAddressedCache(
      cache_dir, cache_policies, trim=False)
1388
1389
def process_named_cache_options(parser, options, time_fn=None):
  """Checks the --named-cache* options and builds the matching NamedCache.

  parser.error() is called when caches are requested without a root, or when
  a requested cache has a name not matching CACHE_NAME_RE, an empty path, or a
  hint that int() rejects.

  Returns:
    A local_caching.NamedCache rooted at the absolute --named-cache-root with
    the requested cache names already touched, or None when
    --named-cache-root is empty.
  """
  requested = options.named_caches
  if requested and not options.named_cache_root:
    parser.error('--named-cache is specified, but --named-cache-root is empty')

  for cache_name, rel_path, size_hint in requested:
    if not CACHE_NAME_RE.match(cache_name):
      parser.error(
          'cache name %r does not match %r' %
          (cache_name, CACHE_NAME_RE.pattern))
    if not rel_path:
      parser.error('cache path cannot be empty')
    try:
      int(size_hint)
    except ValueError:
      parser.error('cache hint must be a number')

  if not options.named_cache_root:
    return None

  # Make these configurable later if there is use case but for now it's fairly
  # safe values.
  # In practice, a fair chunk of bots are already recycled on a daily schedule
  # so this code doesn't have any effect to them, unless they are preloaded
  # with a really old cache.
  one_tib = 1024 * 1024 * 1024 * 1024
  cache_policies = local_caching.CachePolicies(
      max_cache_size=one_tib,
      min_free_space=options.min_free_space,
      max_items=50,
      max_age_secs=MAX_AGE_SECS)
  named_cache = local_caching.NamedCache(
      os.path.abspath(options.named_cache_root),
      cache_policies,
      time_fn=time_fn)
  # Touch any named caches we're going to use to minimize thrashing
  # between tasks that request some (but not all) of the same named caches.
  requested_names = [entry_name for entry_name, _, _ in options.named_caches]
  named_cache.touch(*requested_names)
  return named_cache
1423
1424
def parse_args(args):
  """Parses the command line, honoring -a/--argsfile.

  When --argsfile is given it must be the only argument; the file is expected
  to hold a JSON array that replaces |args| before the real parsing happens.

  Args:
    args: list of command line arguments, without the program name.

  Returns:
    A (parser, options, args) tuple where |parser| is the optparse parser from
    create_option_parser(), |options| the parsed values and |args| the
    remaining positional arguments.
  """
  # Create a fake mini-parser just to get out the "-a" command. Note that
  # it's not documented here; instead, it's documented in create_option_parser
  # even though that parser will never actually get to parse it. This is
  # because --argsfile is exclusive with all other options and arguments.
  file_argparse = argparse.ArgumentParser(add_help=False)
  file_argparse.add_argument('-a', '--argsfile')
  (file_args, nonfile_args) = file_argparse.parse_known_args(args)
  if file_args.argsfile:
    if nonfile_args:
      # The trailing space matters: adjacent literals are concatenated as-is.
      file_argparse.error('Can\'t specify --argsfile with '
                          'any other arguments (%s)' % nonfile_args)
    try:
      with open(file_args.argsfile, 'r') as f:
        args = json.load(f)
    except (IOError, OSError, ValueError) as e:
      # We don't error out here: |args| is left as it was passed in (the
      # assignment above never happened) and is handed to the normal parser
      # below.
      print('Couldn\'t read arguments: %s' % e, file=sys.stderr)

  # Even if we failed to read the args, just call the normal parser now.
  parser = create_option_parser()
  options, args = parser.parse_args(args)
  # Normalize a textual --cipd-enabled value (e.g. 'true') into a boolean-like
  # value.
  if not isinstance(options.cipd_enabled, (bool, int)):
    options.cipd_enabled = distutils.util.strtobool(options.cipd_enabled)
  return (parser, options, args)
1453
1454
def _calc_named_cache_hint(named_cache, named_caches):
  """Returns the expected size of the missing named caches.

  Args:
    named_cache: object exposing the currently available cache names through
      its |available| attribute, or None when no named cache is configured.
    named_caches: iterable of (name, path, hint) triples as requested on the
      command line; |hint| is anything int() accepts.

  Returns:
    The sum of the positive hints of the requested caches that are not in
    named_cache.available; 0 when |named_cache| is None.
  """
  if named_cache is None:
    # process_named_cache_options() returns None when --named-cache-root is
    # empty; there is nothing to size in that case.
    return 0
  present = named_cache.available
  size = 0
  logging.info('available named cache %s', present)
  for name, _, hint in named_caches:
    if name not in present:
      hint = int(hint)
      # Zero or negative hints do not contribute to the total.
      if hint > 0:
        logging.info("named cache hint: %s, %d", name, hint)
        size += hint
  logging.info("total size of named cache hint: %d", size)
  return size
1468
1469
def _clean_cmd(parser, options, caches, root):
  """Cleanup cache dirs/files.

  Args:
    parser: option parser, used to report incompatible flags via error().
    options: parsed options; reads json, named_caches, cas_instance,
      cas_digest, kvs_dir and min_free_space.
    caches: list of cache objects to trim and then cleanup().
    root: directory whose free space is logged and handed to trim_caches().
  """
  # --clean is a standalone maintenance mode; reject flags that only make
  # sense when running a task.
  if options.json:
    parser.error('Can\'t use --json with --clean.')
  if options.named_caches:
    parser.error('Can\'t use --named-cache with --clean.')
  if options.cas_instance or options.cas_digest:
    parser.error('Can\'t use --cas-instance, --cas-digest with --clean.')

  logging.info("initial free space: %d", file_path.get_free_space(root))

  if options.kvs_dir and fs.isdir(options.kvs_dir):
    # Remove kvs file if its size exceeds fixed threshold.
    kvs_dir = options.kvs_dir
    size = file_path.get_recursive_size(kvs_dir)
    if size >= _CAS_KVS_CACHE_THRESHOLD:
      logging.info("remove kvs dir with size: %d", size)
      file_path.rmtree(kvs_dir)

  # Trim first, then clean.
  local_caching.trim_caches(
      caches,
      root,
      min_free_space=options.min_free_space,
      max_age_secs=MAX_AGE_SECS)
  logging.info("free space after trim: %d", file_path.get_free_space(root))
  for c in caches:
    c.cleanup()
  logging.info("free space after cleanup: %d", file_path.get_free_space(root))
1499
1500
def _is_within_dir(base, path):
  """Returns True if |path| is |base| itself or is located underneath it."""
  # os.path.join(base, '') appends exactly one trailing separator (and none to
  # a filesystem root), so '/a/bc' is not mistaken for a child of '/a/b'.
  return path == base or path.startswith(os.path.join(base, ''))


def main(args):
  """Parses |args|, prepares the caches and runs the requested command.

  Args:
    args: list of command line arguments, without the program name.

  Returns:
    0 after a --clean run; otherwise the value returned by run_tha_test(), or
    1 when a cipd.Error, local_caching.NamedCacheError or
    local_caching.NoMoreSpace is raised while running.
  """
  # Warning: when --argsfile is used, the strings are unicode instances, when
  # parsed normally, the strings are str instances.
  (parser, options, args) = parse_args(args)

  # Must be logged after parse_args(), which eventually calls
  # logging_utils.prepare_logging() which expects no logs before its call.
  logging.info('Starting run_isolated script')

  SWARMING_SERVER = os.environ.get('SWARMING_SERVER')
  SWARMING_TASK_ID = os.environ.get('SWARMING_TASK_ID')
  if options.report_on_exception and SWARMING_SERVER:
    task_url = None
    if SWARMING_TASK_ID:
      task_url = '%s/task?id=%s' % (SWARMING_SERVER, SWARMING_TASK_ID)
    on_error.report_on_exception_exit(SWARMING_SERVER, source=task_url)

  if not file_path.enable_symlink():
    logging.warning('Symlink support is not enabled')

  named_cache = process_named_cache_options(parser, options)
  # hint is 0 if there's no named cache.
  hint = _calc_named_cache_hint(named_cache, options.named_caches)
  if hint:
    # Increase the --min-free-space value by the hint, and recreate the
    # NamedCache instance so it gets the updated CachePolicy.
    options.min_free_space += hint
    named_cache = process_named_cache_options(parser, options)

  # TODO(maruel): CIPD caches should be defined at an higher level here too, so
  # they can be cleaned the same way.

  cas_cache = process_cas_cache_options(options)

  caches = []
  if cas_cache:
    caches.append(cas_cache)
  if named_cache:
    caches.append(named_cache)
  root = caches[0].cache_dir if caches else os.getcwd()
  if options.clean:
    _clean_cmd(parser, options, caches, root)
    return 0

  # Trim must still be done for the following case:
  # - named-cache was used
  # - some entries, with a large hint, where missing
  # - --min-free-space was increased accordingly, thus trimming is needed
  # Otherwise, this will have no effect, as bot_main calls run_isolated with
  # --clean after each task.
  additional_buffer = _FREE_SPACE_BUFFER_FOR_CIPD_PACKAGES
  if options.kvs_dir:
    additional_buffer += _CAS_KVS_CACHE_THRESHOLD
  # Add some buffer for Go CLI.
  min_free_space = options.min_free_space + additional_buffer

  def trim_caches_fn(stats):
    # Trims |caches| and records how long it took in stats['duration'].
    start = time.time()
    local_caching.trim_caches(
        caches, root, min_free_space=min_free_space, max_age_secs=MAX_AGE_SECS)
    duration = time.time() - start
    stats['duration'] = duration
    logging.info('trim_caches: took %d seconds', duration)

  # Save state of cas cache not to overwrite state from go client.
  if cas_cache:
    cas_cache.save()
    cas_cache = None

  if not args:
    parser.error('command to run is required.')

  auth.process_auth_options(parser, options)

  if ISOLATED_OUTDIR_PARAMETER in args and not options.cas_instance:
    parser.error('%s in args requires --cas-instance' %
                 ISOLATED_OUTDIR_PARAMETER)

  if options.root_dir:
    options.root_dir = os.path.abspath(options.root_dir)
  else:
    options.root_dir = tempfile.mkdtemp(prefix='root')
  if options.json:
    options.json = os.path.abspath(options.json)

  if any('=' not in i for i in options.env):
    parser.error(
        '--env required key=value form. value can be skipped to delete '
        'the variable')
  options.env = dict(i.split('=', 1) for i in options.env)

  # Group the --env-prefix fragments per variable, keeping command line order.
  prefixes = {}
  cwd = os.path.realpath(os.getcwd())
  for item in options.env_prefix:
    if '=' not in item:
      parser.error(
          '--env-prefix %r is malformed, must be in the form `VAR=./path`'
          % item)
    key, opath = item.split('=', 1)
    if os.path.isabs(opath):
      parser.error('--env-prefix %r path is bad, must be relative.' % opath)
    opath = os.path.normpath(opath)
    # Compare on a directory boundary; a bare startswith(cwd) would accept a
    # sibling such as '../<cwd-name>-suffix'.
    if not _is_within_dir(cwd, os.path.realpath(os.path.join(cwd, opath))):
      parser.error(
          '--env-prefix %r path is bad, must be relative and not contain `..`.'
          % opath)
    prefixes.setdefault(key, []).append(opath)
  options.env_prefix = prefixes

  cipd.validate_cipd_options(parser, options)

  install_packages_fn = copy_local_packages
  tmp_cipd_cache_dir = None
  if options.cipd_enabled:
    cache_dir = options.cipd_cache
    if not cache_dir:
      # No --cipd-cache given: use a throwaway directory, removed in the
      # finally clause at the end of this function.
      tmp_cipd_cache_dir = tempfile.mkdtemp()
      cache_dir = tmp_cipd_cache_dir
    install_packages_fn = (
        lambda run_dir, cas_dir, nsjail_dir: install_client_and_packages(
            run_dir,
            cipd.parse_package_args(options.cipd_packages),
            options.cipd_server,
            options.cipd_client_package,
            options.cipd_client_version,
            cache_dir=cache_dir,
            cas_dir=cas_dir,
            nsjail_dir=nsjail_dir,
        ))

  @contextlib.contextmanager
  def install_named_caches(run_dir, stats):
    # WARNING: this function depends on "options" variable defined in the outer
    # function.
    assert str(run_dir), repr(run_dir)
    assert os.path.isabs(run_dir), run_dir
    named_caches = [(os.path.join(run_dir, str(relpath)), name)
                    for name, relpath, _ in options.named_caches]
    install_start = time.time()
    for path, name in named_caches:
      named_cache.install(path, name)
    install_duration = time.time() - install_start
    stats['install']['duration'] = install_duration
    logging.info('named_caches: install took %d seconds', install_duration)
    try:
      yield
    finally:
      # Uninstall each named cache, returning it to the cache pool. If an
      # uninstall fails for a given cache, it will remain in the task's
      # temporary space, get cleaned up by the Swarming bot, and be lost.
      #
      # If the Swarming bot cannot clean up the cache, it will handle it like
      # any other bot file that could not be removed.
      uninstall_start = time.time()
      for path, name in reversed(named_caches):
        try:
          # uninstall() doesn't trim but does call save() implicitly. Trimming
          # *must* be done manually via periodic 'run_isolated.py --clean'.
          named_cache.uninstall(path, name)
        except local_caching.NamedCacheError:
          if sys.platform == 'win32':
            # Show running processes.
            sys.stderr.write("running process\n")
            subprocess42.check_call(['tasklist.exe', '/V'], stdout=sys.stderr)

          # The message reads "named cache <name> at <path>"; pass the values
          # in that order.
          error = (
              'Error while removing named cache %r at %r. The cache will be'
              ' lost.' % (name, path))
          logging.exception(error)
          on_error.report(error)
      uninstall_duration = time.time() - uninstall_start
      stats['uninstall']['duration'] = uninstall_duration
      logging.info('named_caches: uninstall took %d seconds',
                   uninstall_duration)

  command = args
  if options.relative_cwd:
    a = os.path.normpath(os.path.abspath(options.relative_cwd))
    # Same directory-boundary check as for --env-prefix above.
    if not _is_within_dir(os.getcwd(), a):
      parser.error(
          '--relative-cwd must not try to escape the working directory')

  containment_type = subprocess42.Containment.NONE
  if options.containment_type == 'AUTO':
    containment_type = subprocess42.Containment.AUTO
  if options.containment_type == 'JOB_OBJECT':
    containment_type = subprocess42.Containment.JOB_OBJECT
  if options.containment_type == 'NSJAIL':
    containment_type = subprocess42.Containment.NSJAIL
  # TODO(https://crbug.com/1227833): This object should eventually contain the
  # path to the nsjail binary and the nsjail configuration file.
  containment = subprocess42.Containment(
      containment_type=containment_type,
      limit_processes=options.limit_processes,
      limit_total_committed_memory=options.limit_total_committed_memory)

  data = TaskData(command=command,
                  relative_cwd=options.relative_cwd,
                  cas_instance=options.cas_instance,
                  cas_digest=options.cas_digest,
                  outputs=options.output,
                  install_named_caches=install_named_caches,
                  leak_temp_dir=options.leak_temp_dir,
                  root_dir=options.root_dir,
                  hard_timeout=options.hard_timeout,
                  grace_period=options.grace_period,
                  bot_file=options.bot_file,
                  switch_to_account=options.switch_to_account,
                  install_packages_fn=install_packages_fn,
                  cas_cache_dir=options.cas_cache,
                  cas_cache_policies=local_caching.CachePolicies(
                      max_cache_size=options.max_cache_size,
                      min_free_space=options.min_free_space,
                      max_items=None,
                      max_age_secs=None,
                  ),
                  cas_kvs=options.kvs_dir,
                  env=options.env,
                  env_prefix=options.env_prefix,
                  lower_priority=bool(options.lower_priority),
                  containment=containment,
                  trim_caches_fn=trim_caches_fn)
  try:
    return run_tha_test(data, options.json)
  except (cipd.Error, local_caching.NamedCacheError,
          local_caching.NoMoreSpace) as ex:
    # NOTE(review): plain Python 3 exceptions have no |message| attribute;
    # fall back to str(ex) unless these classes define one - confirm.
    print(getattr(ex, 'message', None) or str(ex), file=sys.stderr)
    on_error.report(None)
    return 1
  finally:
    if tmp_cipd_cache_dir is not None:
      try:
        file_path.rmtree(tmp_cipd_cache_dir)
      except OSError:
        logging.exception('Remove tmp_cipd_cache_dir=%s failed',
                          tmp_cipd_cache_dir)
        # Best effort clean up. Failed to do so doesn't affect the outcome.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001738
1739
if __name__ == '__main__':
  # Script entry point. The setup calls below run in this exact order before
  # main() gets the command line.
  subprocess42.inhibit_os_error_reporting()
  # Ensure that we are always running with the correct encoding.
  fix_encoding.fix_encoding()
  user_agent = 'run_isolated.py/' + __version__
  net.set_user_agent(user_agent)
  # Read sys.argv only now, after the setup above, as the original did.
  exit_code = main(sys.argv[1:])
  sys.exit(exit_code)
Marc-Antoine Ruel90c98162013-12-18 15:11:57 -05001745 sys.exit(main(sys.argv[1:]))