blob: 5924db334caf61d53894186a7428f5a0eeb4c256 [file] [log] [blame]
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001#!/usr/bin/env python
maruelea586f32016-04-05 11:11:33 -07002# Copyright 2012 The LUCI Authors. All rights reserved.
maruelf1f5e2a2016-05-25 17:10:39 -07003# Use of this source code is governed under the Apache License, Version 2.0
4# that can be found in the LICENSE file.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00005
nodir55be77b2016-05-03 09:39:57 -07006"""Runs a command with optional isolated input/output.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00007
run_isolated takes care of setting up a temporary environment, running a
command, and tearing it down.
nodir55be77b2016-05-03 09:39:57 -070010
Marc-Antoine Rueleed2f3a2019-03-14 00:00:40 +000011It handles downloading and uploading isolated files, mapping CIPD packages and
12reusing stateful named caches.
13
14The isolated files, CIPD packages and named caches are kept as a global LRU
15cache.
Marc-Antoine Ruel2283ad12014-02-09 11:14:57 -050016
Roberto Carrillo71ade6d2018-10-08 22:30:24 +000017Any ${EXECUTABLE_SUFFIX} on the command line or the environment variables passed
18with the --env option will be replaced with ".exe" string on Windows and "" on
19other platforms.
nodirbe642ff2016-06-09 15:51:51 -070020
Roberto Carrillo71ade6d2018-10-08 22:30:24 +000021Any ${ISOLATED_OUTDIR} on the command line or the environment variables passed
22with the --env option will be replaced by the location of a temporary directory
23upon execution of the command specified in the .isolated file. All content
24written to this directory will be uploaded upon termination and the .isolated
25file describing this directory will be printed to stdout.
bpastene447c1992016-06-20 15:21:47 -070026
Marc-Antoine Rueleed2f3a2019-03-14 00:00:40 +000027Any ${SWARMING_BOT_FILE} on the command line or the environment variables passed
28with the --env option will be replaced by the value of the --bot-file parameter.
29This file is used by a swarming bot to communicate state of the host to tasks.
30It is written to by the swarming bot's on_before_task() hook in the swarming
31server's custom bot_config.py.
32
Joanna Wang4cec0e42021-08-26 00:48:37 +000033Any ${SWARMING_TASK_ID} on the command line will be replaced by the
34SWARMING_TASK_ID value passed with the --env option.
35
Marc-Antoine Rueleed2f3a2019-03-14 00:00:40 +000036See
37https://chromium.googlesource.com/infra/luci/luci-py.git/+/master/appengine/swarming/doc/Magic-Values.md
38for all the variables.
39
40See
41https://chromium.googlesource.com/infra/luci/luci-py.git/+/master/appengine/swarming/swarming_bot/config/bot_config.py
42for more information about bot_config.py.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000043"""
44
Marc-Antoine Ruelf899c482019-10-10 23:32:06 +000045from __future__ import print_function
46
47__version__ = '1.0.1'
maruel@chromium.orgdedbf492013-09-12 20:42:11 +000048
aludwin7556e0c2016-10-26 08:46:10 -070049import argparse
maruel064c0a32016-04-05 11:47:15 -070050import base64
iannucci96fcccc2016-08-30 15:52:22 -070051import collections
vadimsh232f5a82017-01-20 19:23:44 -080052import contextlib
Ye Kuangfff1e502020-07-13 13:21:57 +000053import distutils
Sadaf Matinkhoo10743a62018-03-29 16:28:58 -040054import errno
aludwin7556e0c2016-10-26 08:46:10 -070055import json
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000056import logging
57import optparse
58import os
Takuto Ikuta5c59a842020-01-24 03:05:24 +000059import platform
Marc-Antoine Ruel8b11dbd2018-05-18 14:31:22 -040060import re
Junji Watanabedc2f89e2021-11-08 08:44:30 +000061import shutil
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000062import sys
63import tempfile
maruel064c0a32016-04-05 11:47:15 -070064import time
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000065
Marc-Antoine Ruel016c7602019-04-02 18:31:13 +000066from utils import tools
67tools.force_local_third_party()
vadimsh@chromium.orga4326472013-08-24 02:05:41 +000068
Marc-Antoine Ruel016c7602019-04-02 18:31:13 +000069# third_party/
70from depot_tools import fix_encoding
71
72# pylint: disable=ungrouped-imports
73import auth
74import cipd
Justin Luong97eda6f2022-08-23 01:29:16 +000075import errors
Marc-Antoine Ruel016c7602019-04-02 18:31:13 +000076import local_caching
77from libs import luci_context
Vadim Shtayura6b555c12014-07-23 16:22:18 -070078from utils import file_path
maruel12e30012015-10-09 11:55:35 -070079from utils import fs
Marc-Antoine Ruelf74cffe2015-07-15 15:21:34 -040080from utils import logging_utils
Ye Kuang2dd17442020-04-22 08:45:52 +000081from utils import net
Marc-Antoine Ruelcfb60852014-07-02 15:22:00 -040082from utils import on_error
Marc-Antoine Ruelc44f5722015-01-08 16:10:01 -050083from utils import subprocess42
maruel@chromium.orgdedbf492013-09-12 20:42:11 +000084
vadimsh@chromium.orga4326472013-08-24 02:05:41 +000085
# Magic variables that can be found in the task command line or in the
# environment variable values passed to the task; they are expanded by
# replace_parameters().
ISOLATED_OUTDIR_PARAMETER = '${ISOLATED_OUTDIR}'
EXECUTABLE_SUFFIX_PARAMETER = '${EXECUTABLE_SUFFIX}'
SWARMING_BOT_FILE_PARAMETER = '${SWARMING_BOT_FILE}'
SWARMING_TASK_ID_PARAMETER = '${SWARMING_TASK_ID}'


# The name of the log file to use.
RUN_ISOLATED_LOG_FILE = 'run_isolated.log'


# Use short names for temporary directories. This is driven by Windows, which
# imposes a relatively short maximum path length of 260 characters, often
# referred to as MAX_PATH. It is relatively easy to create files with a longer
# path length. A use case is recursive dependency trees like npm packages.
#
# It is recommended to start the script with a `root_dir` as short as
# possible.
# - ir stands for isolated_run
# - io stands for isolated_out
# - it stands for isolated_tmp
# - ic stands for isolated_client
# - cc presumably stands for cas_client (see _CAS_CLIENT_DIR)
# - ns stands for nsjail
ISOLATED_RUN_DIR = 'ir'
ISOLATED_OUT_DIR = 'io'
ISOLATED_TMP_DIR = 'it'
ISOLATED_CLIENT_DIR = 'ic'
_CAS_CLIENT_DIR = 'cc'
_NSJAIL_DIR = 'ns'

# TODO(tikuta): take these parameters from luci-config?
_CAS_PACKAGE = 'infra/tools/luci/cas/${platform}'
_LUCI_GO_REVISION = 'git_revision:f529671465f28c457995930305dbfa049e5551f7'
_NSJAIL_PACKAGE = 'infra/3pp/tools/nsjail/${platform}'
_NSJAIL_VERSION = 'version:2@3.0.chromium.1'

# Keep synced with task_request.py
CACHE_NAME_RE = re.compile(r'^[a-z0-9_]{1,4096}$')

# 2 GiB, expressed in bytes.
_FREE_SPACE_BUFFER_FOR_CIPD_PACKAGES = 2 * 1024 * 1024 * 1024
Marc-Antoine Ruel8b11dbd2018-05-18 14:31:22 -0400126
marueld928c862017-06-08 08:20:04 -0700127OUTLIVING_ZOMBIE_MSG = """\
128*** Swarming tried multiple times to delete the %s directory and failed ***
129*** Hard failing the task ***
130
131Swarming detected that your testing script ran an executable, which may have
132started a child executable, and the main script returned early, leaving the
133children executables playing around unguided.
134
135You don't want to leave children processes outliving the task on the Swarming
136bot, do you? The Swarming bot doesn't.
137
138How to fix?
139- For any process that starts children processes, make sure all children
140 processes terminated properly before each parent process exits. This is
141 especially important in very deep process trees.
142 - This must be done properly both in normal successful task and in case of
143 task failure. Cleanup is very important.
144- The Swarming bot sends a SIGTERM in case of timeout.
145 - You have %s seconds to comply after the signal was sent to the process
146 before the process is forcibly killed.
147- To achieve not leaking children processes in case of signals on timeout, you
148 MUST handle signals in each executable / python script and propagate them to
149 children processes.
150 - When your test script (python or binary) receives a signal like SIGTERM or
151 CTRL_BREAK_EVENT on Windows), send it to all children processes and wait for
152 them to terminate before quitting.
153
154See
Marc-Antoine Ruelc7243592018-05-24 17:04:04 -0400155https://chromium.googlesource.com/infra/luci/luci-py.git/+/master/appengine/swarming/doc/Bot.md#Graceful-termination_aka-the-SIGTERM-and-SIGKILL-dance
marueld928c862017-06-08 08:20:04 -0700156for more information.
157
158*** May the SIGKILL force be with you ***
159"""
160
161
# Currently hardcoded. Eventually could be exposed as a flag once there's value.
# 3 weeks, expressed in seconds.
MAX_AGE_SECS = 21*24*60*60

# Size threshold, in bytes.
_CAS_KVS_CACHE_THRESHOLD = 5 * 1024 * 1024 * 1024 # 5 GiB
167
# Names of the TaskData fields, in positional order.
_TASK_DATA_FIELDS = (
    # Command line to run, as a list of strings; used independently of
    # whatever the isolated file specified.
    'command',
    # Directory, relative, in which the command is started.
    'relative_cwd',
    # RBE-CAS digest of the input root.
    'cas_digest',
    # Fully qualified CAS instance name.
    'cas_instance',
    # Paths, relative to root_dir, that go into the output isolated bundle
    # once the task completes (see link_outputs_to_outdir).
    'outputs',
    # Callable taking run_dir and returning a context manager that installs
    # the named caches into |run_dir|.
    'install_named_caches',
    # When True the temporary directory is intentionally left behind so it
    # can be inspected afterwards.
    'leak_temp_dir',
    # Directory under which the temporary directory is created. A random
    # temporary directory is created when this is not specified.
    'root_dir',
    # The process is killed if it runs longer than this many seconds.
    'hard_timeout',
    # Seconds to wait between SIGTERM and SIGKILL.
    'grace_period',
    # Path to the bot state file substituted for ${SWARMING_BOT_FILE} in the
    # task command line.
    'bot_file',
    # Logical account LUCI_CONTEXT is switched to.
    'switch_to_account',
    # Context manager dir => CipdInfo, see install_client_and_packages.
    'install_packages_fn',
    # Cache directory used by the `cas` client.
    'cas_cache_dir',
    # Cache parameters handed to the `cas` client.
    'cas_cache_policies',
    # Parameters for the kvs file used by the `cas` client.
    'cas_kvs',
    # Environment variables to set.
    'env',
    # Environment variables to mutate with relative directories.
    # Example: {"ENV_KEY": ['relative', 'paths', 'to', 'prepend']}
    'env_prefix',
    # Lowers the priority of the task process.
    'lower_priority',
    # A subprocess42.Containment instance, or None.
    'containment',
    # Callable that trims caches before cipd packages are installed and
    # isolated files are downloaded.
    'trim_caches_fn',
)

TaskData = collections.namedtuple('TaskData', _TASK_DATA_FIELDS)
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -0500222
def make_temp_dir(prefix, root_dir):
  """Creates a fresh, uniquely named temporary directory.

  Args:
    prefix: string the new directory's name starts with.
    root_dir: directory to create it in; forwarded as `dir` to
        tempfile.mkdtemp().

  Returns:
    Path of the newly created directory.
  """
  new_dir = tempfile.mkdtemp(dir=root_dir, prefix=prefix)
  return new_dir
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +0000226
227
@contextlib.contextmanager
def set_luci_context_account(account, tmp_dir):
  """Context manager that makes |account| the default LUCI_CONTEXT account.

  Nothing is changed in any of these cases:
  - |account| is None or '' (run_isolated.py was called without
    '--switch-to-account'); the task then simply inherits whatever account the
    surrounding LUCI_CONTEXT, if any, already has. This may happen when users
    invoke run_isolated.py explicitly from their code.
  - LUCI_CONTEXT-based auth is not in use ('local_auth' section is missing).
  - |account| already is the default account.

  Otherwise a new LUCI_CONTEXT is written (using |tmp_dir|) for the duration
  of the `with` body. If the requested account is not defined in the context,
  the default account is dropped, i.e. the task switches to non-authenticated
  access. This happens for Swarming tasks that don't use 'task' service
  accounts.
  """
  # Only consult LUCI_CONTEXT when a switch was actually requested.
  local_auth = luci_context.read('local_auth') if account else None

  # See LUCI_CONTEXT.md for the format of 'local_auth'.
  if not local_auth or local_auth.get('default_account_id') == account:
    # Not switching, not using LUCI_CONTEXT auth, or already set.
    yield
    return

  known_ids = set()
  for entry in local_auth.get('accounts') or []:
    known_ids.add(entry['id'])

  if account not in known_ids:
    logging.warning(
        'Requested LUCI_CONTEXT account %r is not available (have only %r), '
        'disabling authentication', account, sorted(known_ids))
    local_auth.pop('default_account_id', None)
  else:
    logging.info('Switching default LUCI_CONTEXT account to %r', account)
    local_auth['default_account_id'] = account

  with luci_context.write(_tmpdir=tmp_dir, local_auth=local_auth):
    yield
274
275
def process_command(command, out_dir, bot_file):
  """Expands the magic parameters in every argument of a command line.

  Args:
    command: iterable of argument strings.
    out_dir: value substituted for the output directory parameter.
    bot_file: value substituted for the bot file parameter.

  Returns:
    A new list with each argument run through replace_parameters().

  Raises:
    ValueError if a parameter is requested in |command| but its value is not
    provided.
  """
  expanded = []
  for token in command:
    expanded.append(replace_parameters(token, out_dir, bot_file))
  return expanded
284
285
def replace_parameters(arg, out_dir, bot_file):
  """Expands the magic parameter tokens found in a single string.

  Args:
    arg: string that may contain parameter tokens.
    out_dir: replacement for ISOLATED_OUTDIR_PARAMETER.
    bot_file: replacement for SWARMING_BOT_FILE_PARAMETER; when falsy the
        token is left as is and a warning is logged.

  Returns:
    The string with the tokens expanded. The SWARMING_TASK_ID token is
    expanded from the SWARMING_TASK_ID environment variable of the current
    process, if it is set and non-empty.

  Raises:
    ValueError if a parameter is requested in |arg| but its value is not
    provided.
  """
  result = arg.replace(EXECUTABLE_SUFFIX_PARAMETER, cipd.EXECUTABLE_SUFFIX)
  # Becomes True once a path-like value has been substituted in.
  touched_path = False

  if ISOLATED_OUTDIR_PARAMETER in result:
    if not out_dir:
      raise ValueError(
          'output directory is requested in command or env var, but not '
          'provided; please specify one')
    result = result.replace(ISOLATED_OUTDIR_PARAMETER, out_dir)
    touched_path = True

  if SWARMING_BOT_FILE_PARAMETER in result:
    if not bot_file:
      logging.warning('SWARMING_BOT_FILE_PARAMETER found in command or env '
                      'var, but no bot_file specified. Leaving parameter '
                      'unchanged.')
    else:
      result = result.replace(SWARMING_BOT_FILE_PARAMETER, bot_file)
      touched_path = True

  if SWARMING_TASK_ID_PARAMETER in result:
    task_id = os.environ.get('SWARMING_TASK_ID')
    if task_id:
      result = result.replace(SWARMING_TASK_ID_PARAMETER, task_id)

  # Slashes are converted only when a path parameter was expanded, to cope
  # with arguments like '${ISOLATED_OUTDIR}/foo/bar'.
  return result.replace('/', os.sep) if touched_path else result
maruela9cfd6f2015-09-15 11:03:15 -0700319
320
def set_temp_dir(env, tmp_dir):
  """Points the temp-directory variables of the |env| dict at |tmp_dir|.

  Args:
    env: dict of environment variables; modified in place.
    tmp_dir: path stored in the temp directory variables.
  """
  # pylint: disable=line-too-long
  # Variables needed on top of $TMPDIR, per platform.
  platform_keys = {
      # * chromium's base utils uses GetTempPath().
      #   https://cs.chromium.org/chromium/src/base/files/file_util_win.cc?q=GetTempPath
      # * Go uses GetTempPath().
      # * GetTempDir() uses %TMP%, then %TEMP%, then other stuff. So %TMP%
      #   must be set.
      #   https://docs.microsoft.com/en-us/windows/desktop/api/fileapi/nf-fileapi-gettemppathw
      # * For %TEMP%, see
      #   https://blogs.msdn.microsoft.com/oldnewthing/20150417-00/?p=44213
      'win32': ('TMP', 'TEMP'),
      # * Chromium uses a hack on macOS before calling into
      #   NSTemporaryDirectory().
      #   https://cs.chromium.org/chromium/src/base/files/file_util_mac.mm?q=GetTempDir
      #   https://developer.apple.com/documentation/foundation/1409211-nstemporarydirectory
      'darwin': ('MAC_CHROMIUM_TMPDIR',),
  }
  # * python respects $TMPDIR, $TEMP, and $TMP in this order, regardless of
  #   platform. So $TMPDIR must be set on all platforms.
  #   https://github.com/python/cpython/blob/2.7/Lib/tempfile.py#L155
  # * TMPDIR is also the POSIX standard envvar for the temp directory, so
  #   nothing more is needed on other platforms.
  #   http://pubs.opengroup.org/onlinepubs/9699919799/basedefs/V1_chap08.html
  #   * mktemp on linux respects $TMPDIR.
  #   * Chromium respects $TMPDIR on linux.
  #     https://cs.chromium.org/chromium/src/base/files/file_util_posix.cc?q=GetTempDir
  #   * Go uses $TMPDIR.
  #     https://go.googlesource.com/go/+/go1.10.3/src/os/file_unix.go#307
  for key in ('TMPDIR',) + platform_keys.get(sys.platform, ()):
    env[key] = tmp_dir
353
Roberto Carrillo71ade6d2018-10-08 22:30:24 +0000354
def get_command_env(tmp_dir, cipd_info, run_dir, env, env_prefixes, out_dir,
                    bot_file):
  """Returns full OS environment to run a command in.

  Starts from a copy of os.environ, applies |env|, sets up the temp directory
  variables, puts the directory with the cipd binary in front of PATH, exposes
  the CIPD_CACHE_DIR env var, and installs all env_prefixes.

  When |cipd_info| is set, the resolved package pins are also written as JSON
  to 'cipd_info.json' inside |tmp_dir|, and the path of that file is exposed
  as ISOLATED_RESOLVED_PACKAGE_VERSIONS_FILE.

  Args:
    tmp_dir: temp directory.
    cipd_info: CipdInfo object if cipd client is used, None if not.
    run_dir: The root directory the isolated tree is mapped in.
    env: environment variables to use. A key with an empty value is removed
        from the resulting environment; other values go through
        replace_parameters().
    env_prefixes: {"ENV_KEY": ['cwd', 'relative', 'paths', 'to', 'prepend']}
    out_dir: Isolated output directory. Required to be != None if any of the
        env vars contain ISOLATED_OUTDIR_PARAMETER.
    bot_file: Required to be != None if any of the env vars contain
        SWARMING_BOT_FILE_PARAMETER.

  Returns:
    dict mapping environment variable names to values.

  Raises:
    ValueError if an |env| value requests a parameter whose value is not
    provided.
  """
  out = os.environ.copy()
  for k, v in env.items():
    if not v:
      out.pop(k, None)
    else:
      out[k] = replace_parameters(v, out_dir, bot_file)

  if cipd_info:
    bin_dir = os.path.dirname(cipd_info.client.binary_path)
    # PATH can legitimately be missing here (not set in the parent process,
    # or removed just above through an empty |env| value), so do not index it
    # blindly. Same handling as for env_prefixes below: an unset or empty
    # value adds no extra (empty) entry.
    cur_path = out.get('PATH')
    if cur_path:
      out['PATH'] = '%s%s%s' % (bin_dir, os.pathsep, cur_path)
    else:
      out['PATH'] = bin_dir
    out['CIPD_CACHE_DIR'] = cipd_info.cache_dir
    cipd_info_path = os.path.join(tmp_dir, 'cipd_info.json')
    with open(cipd_info_path, 'w') as f:
      json.dump(cipd_info.pins, f)
    out['ISOLATED_RESOLVED_PACKAGE_VERSIONS_FILE'] = cipd_info_path

  for key, paths in env_prefixes.items():
    assert isinstance(paths, list), paths
    # Prefixes are given relative to |run_dir|.
    paths = [os.path.normpath(os.path.join(run_dir, p)) for p in paths]
    cur = out.get(key)
    if cur:
      paths.append(cur)
    out[key] = os.path.pathsep.join(paths)

  set_temp_dir(out, tmp_dir)
  return out
vadimsh232f5a82017-01-20 19:23:44 -0800399
400
def run_command(
    command, cwd, env, hard_timeout, grace_period, lower_priority, containment):
  """Runs the command and waits for it, enforcing the timeouts.

  The child is first waited on for |hard_timeout|. If that expires, or one of
  subprocess42.STOP_SIGNALS is received meanwhile, the child is terminated and
  given |grace_period| to exit before being killed.

  Args:
    command: command line to start, forwarded to subprocess42.Popen.
    cwd: working directory for the child process.
    env: environment for the child process.
    hard_timeout: timeout for the first wait; a falsy value is passed on as
        None.
    grace_period: timeout for the wait that follows terminate(); a falsy value
        is passed on as None.
    lower_priority: forwarded to subprocess42.Popen.
    containment: forwarded to subprocess42.Popen.

  Returns:
    tuple(process exit code, bool if had a hard timeout)
  """
  logging_utils.user_logs('run_command(%s, %s, %s, %s, %s, %s)', command, cwd,
                          hard_timeout, grace_period, lower_priority,
                          containment)

  exit_code = None
  had_hard_timeout = False
  with tools.Profiler('RunTest'):
    proc = None
    # Used as a mutable flag shared with handler(): non-empty once a stop
    # signal was received.
    had_signal = []
    try:
      # TODO(maruel): This code is imperfect. It doesn't handle signals well
      # during the download phase and there are short windows where things can
      # go wrong.
      def handler(signum, _frame):
        # Only the first signal received after the process started is acted
        # upon. It is turned into TimeoutExpired so it goes through the same
        # code path as a hard timeout.
        if proc and not had_signal:
          logging.info('Received signal %d', signum)
          had_signal.append(True)
          raise subprocess42.TimeoutExpired(command, None)

      proc = subprocess42.Popen(
          command, cwd=cwd, env=env, detached=True, close_fds=True,
          lower_priority=lower_priority, containment=containment)
      logging.info('Subprocess for command started')
      with subprocess42.set_signal_handler(subprocess42.STOP_SIGNALS, handler):
        try:
          exit_code = proc.wait(hard_timeout or None)
          logging.info("finished with exit code %d after hard_timeout %s",
                       exit_code, hard_timeout)
        except subprocess42.TimeoutExpired:
          # Raised either by proc.wait() or by handler(); it counts as a hard
          # timeout only when no signal was recorded.
          if not had_signal:
            logging.warning('Hard timeout')
            had_hard_timeout = True
          logging.warning('Sending SIGTERM')
          proc.terminate()

      kill_sent = False
      # Ignore signals in grace period. Forcibly give the grace period to the
      # child process.
      if exit_code is None:
        ignore = lambda *_: None
        with subprocess42.set_signal_handler(subprocess42.STOP_SIGNALS, ignore):
          try:
            exit_code = proc.wait(grace_period or None)
            logging.info("finished with exit code %d after grace_period %s",
                         exit_code, grace_period)
          except subprocess42.TimeoutExpired:
            # Now kill for real. The user can distinguish between the
            # following states:
            # - signal but process exited within grace period,
            #   hard_timed_out will be set but the process exit code will be
            #   script provided.
            # - process exited late, exit code will be -9 on posix.
            logging.warning('Grace exhausted; sending SIGKILL')
            proc.kill()
            kill_sent = True
        logging.info('Waiting for process exit')
        exit_code = proc.wait()

      # The process group / job object may be dangling so if we didn't kill
      # it already, give it a poke now.
      if not kill_sent:
        proc.kill()
    except OSError as e:
      # This is not considered to be an internal error. The executable simply
      # does not exist.
      sys.stderr.write(
          '<The executable does not exist, a dependent library is missing or '
          'the command line is too long>\n'
          '<Check for missing .so/.dll in the .isolate or GN file or length of '
          'command line args>\n'
          '<Command: %s>\n'
          '<Exception: %s>\n' % (command, e))
      if os.environ.get('SWARMING_TASK_ID'):
        # Give an additional hint when running as a swarming task.
        sys.stderr.write(
            '<See the task\'s page for commands to help diagnose this issue '
            'by reproducing the task locally>\n')
      exit_code = 1
  # The mask makes a negative exit code print as an unsigned 32-bit hex value.
  logging.info(
      'Command finished with exit code %d (%s)',
      exit_code, hex(0xffffffff & exit_code))
  return exit_code, had_hard_timeout
maruela9cfd6f2015-09-15 11:03:15 -0700490
491
def _run_go_cmd_and_wait(cmd, tmp_dir):
  """
  Launches an external Go command, `isolated` or `cas`, and blocks until it is
  done.

  While this is a generic function to launch a subprocess, the waiting and
  logging logic is specific to Go `isolated` and `cas`.

  Args:
    cmd: command line as a list of strings.
    tmp_dir: temp directory the subprocess environment is pointed at.

  Returns:
    The subprocess object

  Raises:
    subprocess42.CalledProcessError if the command exits with a non-zero code.
    ValueError if the command had to be stopped after the maximum wait time.
  """
  cmd_str = ' '.join(cmd)
  poll_interval_sec = 30
  # max timeout = max_polls * poll_interval_sec = 50 minutes
  max_polls = 100
  try:
    go_env = os.environ.copy()
    set_temp_dir(go_env, tmp_dir)
    proc = subprocess42.Popen(cmd, env=go_env)

    for attempt in range(1, max_polls + 1):
      # Waiting in slices with periodic output is to prevent I/O timeout error
      # during setup.
      try:
        retcode = proc.wait(poll_interval_sec)
      except subprocess42.TimeoutExpired:
        print('still running (after %d seconds)' %
              (attempt * poll_interval_sec))
        continue
      if retcode != 0:
        raise subprocess42.CalledProcessError(retcode, cmd=cmd_str)
      return proc

    # Every poll timed out: stop the process, escalating to kill if needed.
    proc.terminate()
    try:
      proc.wait(poll_interval_sec)
    except subprocess42.TimeoutExpired:
      logging.exception(
          "failed to terminate? timeout happened after %d seconds",
          poll_interval_sec)
      proc.kill()
      proc.wait()
    # Raise unconditionally, because |proc| was forcefully terminated.
    raise ValueError("timedout after %d seconds (cmd=%s)" %
                     (poll_interval_sec * max_polls, cmd_str))
  except Exception:
    logging.exception('Failed to run Go cmd %s', cmd_str)
    raise
Ye Kuangc0cf9ca2020-07-16 08:56:51 +0000541
542
def _fetch_and_map(cas_client, digest, instance, output_dir, cache_dir,
                   policies, kvs_dir, tmp_dir):
  """
  Downloads a CAS tree into |output_dir| with the cas client and reports
  download stats.

  If the client fails and |kvs_dir| is set, |kvs_dir| and |output_dir| are
  removed and the download is attempted one more time.

  Args:
    cas_client: path to the `cas` executable.
    digest: digest of the tree to download.
    instance: CAS instance name; not used when the RUN_ISOLATED_CAS_ADDRESS
        environment variable is set.
    output_dir: directory the tree is created in.
    cache_dir: cache directory handed to the client.
    policies: object providing max_cache_size and min_free_space.
    kvs_dir: kvs directory handed to the client; may be falsy.
    tmp_dir: temp directory for the client process.

  Returns:
    dict with the 'duration', 'items_cold' and 'items_hot' keys.

  Raises:
    errors.NonRecoverableCasException if the client reported one of the
    'digest_invalid', 'authentication_error' or 'arguments_invalid' results.
  """
  start = time.time()
  json_fd, result_json_path = tempfile.mkstemp(
      prefix='fetch-and-map-result-', suffix='.json')
  os.close(json_fd)
  # NOTE(review): this directory is created and removed here but is not
  # referenced by the command line built below.
  profile_dir = tempfile.mkdtemp(dir=tmp_dir)

  def load_result(path, cleanup_dirs):
    """Parses the client's JSON dump; raises on non recoverable results."""
    fatal = False
    parsed = {}
    bad_digest = digest
    try:
      with open(path) as json_file:
        parsed = json.load(json_file)
      fatal = parsed.get('result') in ('digest_invalid',
                                       'authentication_error',
                                       'arguments_invalid')
      if fatal and parsed.get('error_details'):
        bad_digest = parsed['error_details'].get('digest', digest)
    except (IOError, ValueError):
      logging.error('Failed to read json file: %s', path)
      raise
    finally:
      if cleanup_dirs:
        file_path.rmtree(kvs_dir)
        file_path.rmtree(output_dir)
    if fatal:
      raise errors.NonRecoverableCasException(parsed['result'], bad_digest,
                                              instance)
    return parsed

  try:
    cmd = [cas_client, 'download', '-digest', digest]
    # flags for cache.
    cmd += [
        '-cache-dir', cache_dir,
        '-cache-max-size', str(policies.max_cache_size),
        '-cache-min-free-space', str(policies.min_free_space),
    ]
    # flags for output.
    cmd += [
        '-dir', output_dir,
        '-dump-json', result_json_path,
        '-log-level', 'info',
    ]

    # When RUN_ISOLATED_CAS_ADDRESS is set in test mode,
    # use it and ignore the CAS instance option.
    cas_addr = os.environ.get('RUN_ISOLATED_CAS_ADDRESS')
    cmd += ['-cas-addr', cas_addr] if cas_addr else ['-cas-instance', instance]

    if kvs_dir:
      cmd += ['-kvs-dir', kvs_dir]

    try:
      _run_go_cmd_and_wait(cmd, tmp_dir)
    except subprocess42.CalledProcessError as ex:
      # A retry is only attempted when there is a kvs cache to throw away.
      can_retry = bool(kvs_dir)
      load_result(result_json_path, can_retry)
      if not can_retry:
        raise
      logging.exception('Failed to run cas, removing kvs cache dir and retry.')
      on_error.report("Failed to run cas %s" % ex)
      _run_go_cmd_and_wait(cmd, tmp_dir)

    stats = load_result(result_json_path, False)

    return {
        'duration': time.time() - start,
        'items_cold': stats['items_cold'],
        'items_hot': stats['items_hot'],
    }
  finally:
    fs.remove(result_json_path)
    file_path.rmtree(profile_dir)
Junji Watanabe4b890ef2020-09-16 01:43:27 +0000641
642
def link_outputs_to_outdir(run_dir, out_dir, outputs):
  """Mirrors every named output from run_dir into out_dir for upload.

  Does nothing when |outputs| is empty. Otherwise |out_dir| is prepared with
  file_path.create_directories() and each entry is handed to
  copy_recursively(), which logs (rather than raises) OSError failures.

  Arguments:
  - run_dir: directory the output paths are relative to.
  - out_dir: directory the outputs are copied or linked into.
  - outputs: list of paths relative to |run_dir|.
  """
  if outputs:
    file_path.create_directories(out_dir, outputs)
    for rel_path in outputs:
      source = os.path.join(run_dir, rel_path)
      target = os.path.join(out_dir, rel_path)
      copy_recursively(source, target)
653
654
def copy_recursively(src, dst):
  """Efficiently copies a file or directory from src to dst.

  `src` may be a file, directory, or a symlink to a file or directory.
  All symlinks are replaced with their targets, so the resulting
  directory structure in dst will never have any symlinks.

  To increase speed, copy_recursively hardlinks individual files into the
  (newly created) directory structure if possible, unlike Python's
  shutil.copytree().

  OSError is never propagated: a missing path, a broken symlink or a cyclic
  symlink is logged as a warning and any other OSError is logged at info
  level, so a single bad output does not abort the collection of the others.

  Arguments:
  - src: path to copy from.
  - dst: path to create; missing directories are created on the way.
  """
  orig_src = src
  try:
    # Replace symlinks with their final target. os.path.realpath() leaves a
    # cyclic link unresolved instead of failing, so remember what was already
    # visited to avoid spinning forever on such a link.
    visited = set()
    while fs.islink(src):
      if src in visited:
        logging.warning('Path %s is a cyclic symlink (reached from %s)', src,
                        orig_src)
        return
      visited.add(src)
      res = fs.readlink(src)
      src = os.path.realpath(os.path.join(os.path.dirname(src), res))

    if not fs.exists(src):
      logging.warning('Path %s does not exist or %s is a broken symlink', src,
                      orig_src)
      return

    if fs.isfile(src):
      file_path.link_file(dst, src, file_path.HARDLINK_WITH_FALLBACK)
      return

    if not fs.exists(dst):
      os.makedirs(dst)

    for child in fs.listdir(src):
      copy_recursively(os.path.join(src, child), os.path.join(dst, child))

  except OSError as e:
    if e.errno == errno.ENOENT:
      logging.warning('Path %s does not exist or %s is a broken symlink',
                      src, orig_src)
    else:
      logging.info("Couldn't collect output file %s: %s", src, e)
aludwin0a8e17d2016-10-27 15:57:39 -0700695
696
def upload_outdir(cas_client, cas_instance, outdir, tmp_dir):
  """Archives |outdir| with the cas client and reports what was uploaded.

  Arguments:
  - cas_client: the cas executable, used as the first element of the command.
  - cas_instance: passed as -cas-instance unless RUN_ISOLATED_CAS_ADDRESS is
    set in the environment; always echoed back in the returned root.
  - outdir: directory whose content is archived.
  - tmp_dir: forwarded to _run_go_cmd_and_wait().

  Returns:
    tuple(cas_output_root, stats), or (None, None) when |outdir| is empty.
    - cas_output_root: dict with 'cas_instance' and 'digest' ('hash' and
      'size_bytes'), parsed from the '<hash>/<size>' digest file.
    - stats: content of the -dump-json file plus a 'duration' in seconds.
  """
  if not fs.listdir(outdir):
    return None, None

  # Only the paths are needed; the cas client writes the files itself.
  digest_fd, digest_path = tempfile.mkstemp(
      prefix='cas-digest', suffix='.txt')
  os.close(digest_fd)
  stats_fd, stats_path = tempfile.mkstemp(
      prefix='upload-stats', suffix='.json')
  os.close(stats_fd)

  try:
    # '-paths' format: <working directory>:<relative path to dir>
    cmd = [cas_client, 'archive', '-paths', outdir + ':']
    # output
    cmd += ['-dump-digest', digest_path, '-dump-json', stats_path]

    # When RUN_ISOLATED_CAS_ADDRESS is set in test mode, use it and ignore the
    # CAS instance option.
    cas_addr = os.environ.get('RUN_ISOLATED_CAS_ADDRESS')
    if cas_addr:
      cmd += ['-cas-addr', cas_addr]
    else:
      cmd += ['-cas-instance', cas_instance]

    if sys.platform == 'linux':
      # TODO(crbug.com/1243194): remove this after investigation.
      cmd += ['-log-level', 'debug']

    began = time.time()
    _run_go_cmd_and_wait(cmd, tmp_dir)

    with open(digest_path) as digest_file:
      digest_hash, digest_size = digest_file.read().split('/')
    root = {
        'cas_instance': cas_instance,
        'digest': {
            'hash': digest_hash,
            'size_bytes': int(digest_size),
        },
    }

    with open(stats_path) as stats_file:
      upload_stats = json.load(stats_file)
    upload_stats['duration'] = time.time() - began

    return root, upload_stats
  finally:
    fs.remove(digest_path)
    fs.remove(stats_path)
769
770
def map_and_run(data, constant_run_path):
  """Runs a command with optional isolated input/output.

  Creates the run, output, temporary and cas client directories under
  data.root_dir, installs packages, fetches the CAS input tree when
  data.cas_digest is set, runs the command, uploads the content of the output
  directory and finally removes the run, temporary, cas client and output
  directories unless data.leak_temp_dir is set.

  Exceptions raised while doing so are not propagated; they are logged,
  reported through on_error and recorded in the 'internal_failure' entry of
  the result.

  Arguments:
  - data: TaskData instance.
  - constant_run_path: when true (and data.root_dir is set), the run directory
    is the fixed path <root_dir>/ISOLATED_RUN_DIR, wiped and recreated;
    otherwise it is created with make_temp_dir().

  Returns metadata about the result: a dict with, among others, 'exit_code',
  'duration', 'had_hard_timeout', 'internal_failure', 'stats' and
  'cas_output_root'.
  """

  # TODO(tikuta): take stats from state.json in this case too.
  download_stats = {
      # 'duration': 0.,
      # 'initial_number_items': len(data.cas_cache),
      # 'initial_size': data.cas_cache.total_size,
      # 'items_cold': '<large.pack()>',
      # 'items_hot': '<large.pack()>',
  }

  result = {
      'duration': None,
      'exit_code': None,
      'had_hard_timeout': False,
      # Only reset to None once the whole run went through.
      'internal_failure': 'run_isolated did not complete properly',
      'stats': {
          'trim_caches': {
              'duration': 0,
          },
          #'cipd': {
          #  'duration': 0.,
          #  'get_client_duration': 0.,
          #},
          'isolated': {
              'download': download_stats,
              #'upload': {
              #  'duration': 0.,
              #  'items_cold': '<large.pack()>',
              #  'items_hot': '<large.pack()>',
              #},
          },
          'named_caches': {
              'install': {
                  'duration': 0,
              },
              'uninstall': {
                  'duration': 0,
              },
          },
          'cleanup': {
              'duration': 0,
          }
      },
      #'cipd_pins': {
      #  'packages': [
      #    {'package_name': ..., 'version': ..., 'path': ...},
      #    ...
      #  ],
      #  'client_package': {'package_name': ..., 'version': ...},
      #},
      'outputs_ref': None,
      'cas_output_root': None,
      'version': 5,
  }

  assert os.path.isabs(data.root_dir), ("data.root_dir is not abs path: %s" %
                                        data.root_dir)
  file_path.ensure_tree(data.root_dir, 0o700)

  # See comment for these constants.
  # TODO(maruel): This is not obvious. Change this to become an error once we
  # make the constant_run_path an exposed flag.
  if constant_run_path and data.root_dir:
    run_dir = os.path.join(data.root_dir, ISOLATED_RUN_DIR)
    if os.path.isdir(run_dir):
      file_path.rmtree(run_dir)
    os.mkdir(run_dir, 0o700)
  else:
    run_dir = make_temp_dir(ISOLATED_RUN_DIR, data.root_dir)

  # storage should be normally set but don't crash if it is not. This can happen
  # as Swarming task can run without an isolate server.
  out_dir = make_temp_dir(ISOLATED_OUT_DIR, data.root_dir)
  tmp_dir = make_temp_dir(ISOLATED_TMP_DIR, data.root_dir)
  cwd = run_dir
  if data.relative_cwd:
    cwd = os.path.normpath(os.path.join(cwd, data.relative_cwd))
  command = data.command

  cas_client_dir = make_temp_dir(_CAS_CLIENT_DIR, data.root_dir)
  cas_client = os.path.join(cas_client_dir, 'cas' + cipd.EXECUTABLE_SUFFIX)

  data.trim_caches_fn(result['stats']['trim_caches'])

  nsjail_dir = None
  if (sys.platform == "linux" and cipd.get_platform() == "amd64" and
      data.containment.containment_type == subprocess42.Containment.NSJAIL):
    nsjail_dir = make_temp_dir(_NSJAIL_DIR, data.root_dir)

  try:
    with data.install_packages_fn(run_dir, cas_client_dir,
                                  nsjail_dir) as cipd_info:
      if cipd_info:
        result['stats']['cipd'] = cipd_info.stats
        result['cipd_pins'] = cipd_info.pins

      isolated_stats = result['stats'].setdefault('isolated', {})

      if data.cas_digest:
        stats = _fetch_and_map(
            cas_client=cas_client,
            digest=data.cas_digest,
            instance=data.cas_instance,
            output_dir=run_dir,
            cache_dir=data.cas_cache_dir,
            policies=data.cas_cache_policies,
            kvs_dir=data.cas_kvs,
            tmp_dir=tmp_dir)
        isolated_stats['download'].update(stats)

      if not command:
        # Handle this as a task failure, not an internal failure.
        sys.stderr.write(
            '<No command was specified!>\n'
            '<Please secify a command when triggering your Swarming task>\n')
        result['exit_code'] = 1
        return result

      # Handle an escaping cwd as a task failure, not an internal failure. This
      # is a 'last chance' way to gate against directory escape.
      escaped = not cwd.startswith(run_dir)
      if not escaped:
        # A bare prefix match also accepts a sibling such as '<run_dir>foo',
        # so require the match to end on a path component boundary.
        remainder = cwd[len(run_dir):]
        escaped = bool(remainder) and not remainder.startswith(os.sep)
      if escaped:
        sys.stderr.write('<Relative CWD is outside of run directory!>\n')
        result['exit_code'] = 1
        return result

      if not os.path.isdir(cwd):
        # Accepts relative_cwd that does not exist.
        os.makedirs(cwd, 0o700)

      # If we have an explicit list of files to return, make sure their
      # directories exist now.
      if data.outputs:
        file_path.create_directories(run_dir, data.outputs)

      with data.install_named_caches(run_dir, result['stats']['named_caches']):
        sys.stdout.flush()
        start = time.time()
        try:
          # Need to switch the default account before 'get_command_env' call,
          # so it can grab correct value of LUCI_CONTEXT env var.
          with set_luci_context_account(data.switch_to_account, tmp_dir):
            env = get_command_env(
                tmp_dir, cipd_info, run_dir, data.env, data.env_prefix, out_dir,
                data.bot_file)
            command = tools.find_executable(command, env)
            command = process_command(command, out_dir, data.bot_file)
            file_path.ensure_command_has_abs_path(command, cwd)

            result['exit_code'], result['had_hard_timeout'] = run_command(
                command, cwd, env, data.hard_timeout, data.grace_period,
                data.lower_priority, data.containment)
        finally:
          # Recorded even when the command could not be started or raised.
          result['duration'] = max(time.time() - start, 0)

      # Try to link files to the output directory, if specified.
      link_outputs_to_outdir(run_dir, out_dir, data.outputs)
      isolated_stats = result['stats'].setdefault('isolated', {})
      result['cas_output_root'], upload_stats = upload_outdir(
          cas_client, data.cas_instance, out_dir, tmp_dir)
      if upload_stats:
        isolated_stats['upload'] = upload_stats

      # We successfully ran the command, set internal_failure back to
      # None (even if the command failed, it's not an internal error).
      result['internal_failure'] = None
  except errors.NonRecoverableCasException as e:
    # We could not find the CAS package. The swarming task should not
    # be retried automatically
    result['missing_cas'] = [e.to_dict()]
    logging.exception('internal failure: %s', e)
    result['internal_failure'] = str(e)
    on_error.report(None)

  except errors.NonRecoverableCipdException as e:
    # We could not find the CIPD package. The swarming task should not
    # be retried automatically
    result['missing_cipd'] = [e.to_dict()]
    logging.exception('internal failure: %s', e)
    result['internal_failure'] = str(e)
    on_error.report(None)
  except Exception as e:
    # An internal error occurred. Report accordingly so the swarming task will
    # be retried automatically.
    logging.exception('internal failure: %s', e)
    result['internal_failure'] = str(e)
    on_error.report(None)

  # Clean up
  finally:
    try:
      cleanup_start = time.time()
      success = True
      if data.leak_temp_dir:
        logging.warning(
            'Deliberately leaking %s for later examination', run_dir)
      else:
        # On Windows rmtree(run_dir) call above has a synchronization effect: it
        # finishes only when all task child processes terminate (since a running
        # process locks *.exe file). Examine out_dir only after that call
        # completes (since child processes may write to out_dir too and we need
        # to wait for them to finish).
        dirs_to_remove = [run_dir, tmp_dir, cas_client_dir]
        if out_dir:
          dirs_to_remove.append(out_dir)
        for directory in dirs_to_remove:
          if not fs.isdir(directory):
            continue
          start = time.time()
          try:
            file_path.rmtree(directory)
          except OSError as e:
            logging.error('rmtree(%r) failed: %s', directory, e)
            success = False
          finally:
            logging.info('Cleanup: rmtree(%r) took %d seconds', directory,
                         time.time() - start)
          if not success:
            # Dump the process list to help find what still holds files.
            sys.stderr.write(
                OUTLIVING_ZOMBIE_MSG % (directory, data.grace_period))
            if sys.platform == 'win32':
              subprocess42.check_call(['tasklist.exe', '/V'], stdout=sys.stderr)
            else:
              subprocess42.check_call(['ps', 'axu'], stdout=sys.stderr)
            if result['exit_code'] == 0:
              result['exit_code'] = 1

      if not success and result['exit_code'] == 0:
        result['exit_code'] = 1
    except Exception as e:
      # Swallow any exception in the main finally clause.
      if out_dir:
        logging.exception('Leaking out_dir %s: %s', out_dir, e)
      result['internal_failure'] = str(e)
      on_error.report(None)
    finally:
      cleanup_duration = time.time() - cleanup_start
      result['stats']['cleanup']['duration'] = cleanup_duration
      logging.info('Cleanup: removing directories took %d seconds',
                   cleanup_duration)
  return result
Marc-Antoine Ruel2283ad12014-02-09 11:14:57 -05001021
1022
def run_tha_test(data, result_json):
  """Runs the task through map_and_run() and reports its outcome.

  When |result_json| is given, a placeholder is written there before the run
  and replaced by the actual result metadata afterwards. Otherwise, if the
  result carries an 'outputs_ref', it is printed to stdout in the old-style
  inline '[run_isolated_out_hack]' format.

  Arguments:
  - data: TaskData instance.
  - result_json: File path to dump result metadata into. If set, the process
    exit code is always 0 unless an internal error occurred.

  Returns:
    Process exit code that should be used.
  """
  if result_json:
    # Leave a file behind right away in case we get killed mid-run.
    placeholder = {
        'exit_code': None,
        'had_hard_timeout': False,
        'internal_failure': 'Was terminated before completion',
        'outputs_ref': None,
        'cas_output_root': None,
        'version': 5,
    }
    tools.write_json(result_json, placeholder, dense=True)

  result = map_and_run(data, True)
  logging.info('Result:\n%s', tools.format_json(result, dense=True))

  # The exit code of run_isolated depends on whether result_json is used.
  if result_json:
    # We've found tests to delete 'work' when quitting, causing an exception
    # here. Try to recreate the directory if necessary.
    file_path.ensure_tree(os.path.dirname(result_json))
    tools.write_json(result_json, result, dense=True)
    # Only return 1 if there was an internal error.
    return int(bool(result['internal_failure']))

  # Marshall into old-style inline output.
  outputs_ref = result['outputs_ref']
  if outputs_ref:
    # pylint: disable=unsubscriptable-object
    inline = {
        'hash': outputs_ref['isolated'],
        'namespace': outputs_ref['namespace'],
        'storage': outputs_ref['isolatedserver'],
    }
    sys.stdout.flush()
    print('[run_isolated_out_hack]%s[/run_isolated_out_hack]' %
          tools.format_json(inline, dense=True))
    sys.stdout.flush()
  return result['exit_code'] or int(bool(result['internal_failure']))
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001079
1080
# Bundle yielded by 'install_client_and_packages'.
CipdInfo = collections.namedtuple(
    'CipdInfo',
    (
        # cipd.CipdClient object
        'client',
        # absolute path to bot-global cipd tag and instance cache
        'cache_dir',
        # dict with stats to return to the server
        'stats',
        # dict with installed cipd pins to return to the server
        'pins',
    ))
1088
1089
@contextlib.contextmanager
def copy_local_packages(_run_dir, cas_dir, _nsjail_dir):
  """Copies the locally built cas client instead of fetching it from CIPD.

  The binary is taken from the directory named by the LUCI_GO_CLIENT_DIR
  environment variable and copied into |cas_dir|. The run and nsjail
  directories are accepted but not used.

  Yields None, i.e. no CipdInfo.
  """
  go_client_dir = os.environ.get('LUCI_GO_CLIENT_DIR')
  assert go_client_dir, ('Please set LUCI_GO_CLIENT_DIR env var to install CIPD'
                         ' packages locally.')
  cas_binary = 'cas' + cipd.EXECUTABLE_SUFFIX
  source = os.path.join(go_client_dir, cas_binary)
  destination = os.path.join(cas_dir, cas_binary)
  shutil.copy2(source, destination)
  yield None
1099
1100
def _install_packages(run_dir, cipd_cache_dir, client, packages):
  """Calls 'cipd ensure' for packages.

  Packages are grouped per install subdirectory before being handed to
  client.ensure(); the pins it returns are then put back in the order of
  |packages|.

  Args:
    run_dir (str): root of installation.
    cipd_cache_dir (str): the directory to use for the cipd package cache.
    client (CipdClient): the cipd client to use
    packages: packages to install, list [(path, package_name, version), ...].

  Returns: list of pinned packages. Looks like [
    {
      'path': 'subdirectory',
      'package_name': 'resolved/package/name',
      'version': 'deadbeef...',
    },
    ...
  ]
  """
  # Remember the position of every request in |packages| next to it, so the
  # pins can be reported in the caller's order.
  requests_by_subdir = collections.defaultdict(list)
  for position, (path, name, version) in enumerate(packages):
    # cipd deals with 'root' as ''
    subdir = '' if path == '.' else path
    requests_by_subdir[subdir].append((name, version, position))

  ensure_spec = {}
  for subdir, requests in requests_by_subdir.items():
    ensure_spec[subdir] = [(name, version) for name, version, _ in requests]

  pins = client.ensure(run_dir, ensure_spec, cache_dir=cipd_cache_dir)

  package_pins = [None] * len(packages)
  for subdir, pin_list in sorted(pins.items()):
    requests = requests_by_subdir[subdir]
    # The n-th pin of a subdirectory answers its n-th request.
    for offset, (name, version) in enumerate(pin_list):
      package_pins[requests[offset][2]] = {
          'package_name': name,
          # swarming deals with 'root' as '.'
          'path': subdir or '.',
          'version': version,
      }

  assert None not in package_pins, (packages, pins, package_pins)

  return package_pins
1152
1153
@contextlib.contextmanager
def install_client_and_packages(run_dir, packages, service_url,
                                client_package_name, client_version, cache_dir,
                                cas_dir, nsjail_dir):
  """Bootstraps CIPD client and installs CIPD packages.

  Yields a single CipdInfo object holding the CipdClient, the cipd cache
  directory, timing stats and the pins.

  The pins are made of:
  - 'client_package': {"package_name": ..., "version": ...} of the client.
  - 'packages': one {"path": ..., "package_name": ..., "version": ...} dict
    per entry of |packages|, in the same order.

  If 'packages' list is empty, the CIPD client is still bootstrapped and the
  cas client (plus nsjail when requested) is still installed, but no other
  package is.

  Args:
    run_dir (str): root of installation.
    packages: packages to install, list [(path, package_name, version), ...].
    service_url (str): CIPD server url, e.g.
        "https://chrome-infra-packages.appspot.com."
    client_package_name (str): CIPD package name of CIPD client.
    client_version (str): Version of CIPD client.
    cache_dir (str): where to keep cache of cipd clients, packages and tags.
    cas_dir (str): where to download cas client.
    nsjail_dir (str): where to download nsjail. If set to None, nsjail is not
      downloaded.
  """
  assert cache_dir

  started = time.time()

  abs_cache_dir = os.path.abspath(cache_dir)
  # Tag and instance caches live in a subdirectory of the client cache.
  cipd_cache_dir = os.path.join(abs_cache_dir, 'cache')
  abs_run_dir = os.path.abspath(run_dir)

  client_started = time.time()
  with cipd.get_client(abs_cache_dir, service_url, client_package_name,
                       client_version) as client:
    get_client_duration = time.time() - client_started

    if packages:
      package_pins = _install_packages(abs_run_dir, cipd_cache_dir, client,
                                       packages)
    else:
      package_pins = []

    # The cas client always goes to |cas_dir|; nsjail goes to |nsjail_dir|
    # only when one was given.
    _install_packages(cas_dir, cipd_cache_dir, client,
                      [('', _CAS_PACKAGE, _LUCI_GO_REVISION)])
    if nsjail_dir is not None:
      _install_packages(nsjail_dir, cipd_cache_dir, client,
                        [('', _NSJAIL_PACKAGE, _NSJAIL_VERSION)])

    file_path.make_tree_files_read_only(abs_run_dir)

    total_duration = time.time() - started
    logging.info('Installing CIPD client and packages took %d seconds',
                 total_duration)

    stats = {
        'duration': total_duration,
        'get_client_duration': get_client_duration,
    }
    pins = {
        'client_package': {
            'package_name': client.package_name,
            'version': client.instance_id,
        },
        'packages': package_pins,
    }
    yield CipdInfo(
        client=client, cache_dir=cipd_cache_dir, stats=stats, pins=pins)
nodirbe642ff2016-06-09 15:51:51 -07001243
1244
def create_option_parser():
  """Builds the command line parser used by run_isolated.

  The parser is a logging_utils.OptionParserWithLogging that logs to
  RUN_ISOLATED_LOG_FILE. On top of the general options it registers the
  following option groups: CAS data source, CAS cache management (via
  add_cas_cache_options), CIPD (via cipd.add_cipd_options), named caches,
  process containment, debugging and authentication (via
  auth.add_auth_options).

  Returns:
    The fully configured parser. --argsfile is only registered so that it shows
    up in the help text; it is actually consumed by parse_args().
  """
  parser = logging_utils.OptionParserWithLogging(
      usage='%prog <options> [command to run or extra args]',
      version=__version__,
      log_file=RUN_ISOLATED_LOG_FILE)
  parser.add_option(
      '--clean',
      action='store_true',
      help='Cleans the cache, trimming it if necessary and remove corrupted '
      'items and returns without executing anything; use with -v to know '
      'what was done')
  parser.add_option(
      '--json',
      help='dump output metadata to json file. When used, run_isolated returns '
      'non-zero only on internal failure')
  parser.add_option(
      '--hard-timeout', type='float', help='Enforce hard timeout in execution')
  parser.add_option(
      '--grace-period',
      type='float',
      help='Grace period between SIGTERM and SIGKILL')
  parser.add_option(
      '--relative-cwd',
      help='Ignore the isolated \'relative_cwd\' and use this one instead')
  parser.add_option(
      '--env',
      default=[],
      action='append',
      help='Environment variables to set for the child process')
  parser.add_option(
      '--env-prefix',
      default=[],
      action='append',
      help='Specify a VAR=./path/fragment to put in the environment variable '
      'before executing the command. The path fragment must be relative '
      'to the isolated run directory, and must not contain a `..` token. '
      'The path will be made absolute and prepended to the indicated '
      '$VAR using the OS\'s path separator. Multiple items for the same '
      '$VAR will be prepended in order.')
  parser.add_option(
      '--bot-file',
      help='Path to a file describing the state of the host. The content is '
      'defined by on_before_task() in bot_config.')
  parser.add_option(
      '--switch-to-account',
      help='If given, switches LUCI_CONTEXT to given logical service account '
      '(e.g. "task" or "system") before launching the isolated process.')
  parser.add_option(
      '--output',
      action='append',
      help='Specifies an output to return. If no outputs are specified, all '
      'files located in $(ISOLATED_OUTDIR) will be returned; '
      'otherwise, outputs in both $(ISOLATED_OUTDIR) and those '
      'specified by --output option (there can be multiple) will be '
      'returned. Note that if a file in OUT_DIR has the same path '
      'as an --output option, the --output version will be returned.')
  parser.add_option(
      '-a',
      '--argsfile',
      # This is actually handled in parse_args; it's included here purely so it
      # can make it into the help text.
      help='Specify a file containing a JSON array of arguments to this '
      'script. If --argsfile is provided, no other argument may be '
      'provided on the command line.')
  parser.add_option(
      '--report-on-exception',
      action='store_true',
      help='Whether report exception during execution to isolate server. '
      'This flag should only be used in swarming bot.')

  group = optparse.OptionGroup(parser,
                               'Data source - Content Addressed Storage')
  group.add_option(
      '--cas-instance', help='Full CAS instance name for input/output files.')
  group.add_option(
      '--cas-digest',
      help='Digest of the input root on RBE-CAS. The format is '
      '`{hash}/{size_bytes}`.')
  parser.add_option_group(group)

  # Cache options.
  add_cas_cache_options(parser)

  cipd.add_cipd_options(parser)

  group = optparse.OptionGroup(parser, 'Named caches')
  group.add_option(
      '--named-cache',
      dest='named_caches',
      action='append',
      nargs=3,
      default=[],
      help='A named cache to request. Accepts 3 arguments: name, path, hint. '
      'name identifies the cache, must match regex [a-z0-9_]{1,4096}. '
      'path is a path relative to the run dir where the cache directory '
      'must be put to. '
      'This option can be specified more than once.')
  group.add_option(
      '--named-cache-root',
      default='named_caches',
      help='Cache root directory. Default=%default')
  parser.add_option_group(group)

  # The containment options must be registered on the group itself; adding them
  # to the parser leaves the 'Process containment' section of --help empty.
  group = optparse.OptionGroup(parser, 'Process containment')
  group.add_option(
      '--lower-priority',
      action='store_true',
      help='Lowers the child process priority')
  group.add_option(
      '--containment-type',
      choices=('NONE', 'AUTO', 'JOB_OBJECT', 'NSJAIL'),
      default='NONE',
      help='Type of container to use')
  group.add_option(
      '--limit-processes',
      type='int',
      default=0,
      help='Maximum number of active processes in the containment')
  group.add_option(
      '--limit-total-committed-memory',
      type='int',
      default=0,
      help='Maximum sum of committed memory in the containment')
  parser.add_option_group(group)

  group = optparse.OptionGroup(parser, 'Debugging')
  group.add_option(
      '--leak-temp-dir',
      action='store_true',
      help='Deliberately leak isolate\'s temp dir for later examination. '
      'Default: %default')
  group.add_option('--root-dir', help='Use a directory instead of a random one')
  parser.add_option_group(group)

  auth.add_auth_options(parser)

  parser.set_defaults(cache='cache')
  return parser
1382
1383
def add_cas_cache_options(parser):
  """Registers the 'CAS cache management' option group on |parser|.

  The group holds --cas-cache, --kvs-dir, --max-cache-size and
  --min-free-space.
  """
  gib = 1024 * 1024 * 1024
  # (flag, keyword arguments for add_option), in the order shown in --help.
  option_specs = (
      ('--cas-cache', {
          'metavar': 'DIR',
          'default': 'cas-cache',
          'help': 'Directory to keep a local cache of the files. Accelerates '
                  'download by reusing already downloaded files. '
                  'Default=%default',
      }),
      ('--kvs-dir', {
          'default': '',
          'help': 'CAS cache dir using kvs for small files. Default=%default',
      }),
      ('--max-cache-size', {
          'type': 'int',
          'metavar': 'NNN',
          'default': 50 * gib,
          'help': 'Trim if the cache gets larger than this value, '
                  'default=%default',
      }),
      ('--min-free-space', {
          'type': 'int',
          'metavar': 'NNN',
          'default': 2 * gib,
          'help': 'Trim if disk free space becomes lower than this value, '
                  'default=%default',
      }),
  )
  cas_group = optparse.OptionGroup(parser, 'CAS cache management')
  for flag, kwargs in option_specs:
    cas_group.add_option(flag, **kwargs)
  parser.add_option_group(cas_group)
1410
1411
def process_cas_cache_options(options):
  """Creates the content addressed cache described by |options|.

  Returns a DiskContentAddressedCache rooted at the absolute path of
  --cas-cache when that option is set, otherwise an in-memory cache. The disk
  cache is created with trim=False.
  """
  if not options.cas_cache:
    return local_caching.MemoryContentAddressedCache()

  cache_policies = local_caching.CachePolicies(
      max_cache_size=options.max_cache_size,
      min_free_space=options.min_free_space,
      # max_items isn't used for CAS cache for now.
      max_items=None,
      max_age_secs=MAX_AGE_SECS)
  cache_dir = os.path.abspath(options.cas_cache)
  return local_caching.DiskContentAddressedCache(
      cache_dir, cache_policies, trim=False)
1426
1427
def process_named_cache_options(parser, options, time_fn=None):
  """Validates the named cache options and builds the matching NamedCache.

  Every --named-cache triple (name, path, hint) is checked: the name must match
  CACHE_NAME_RE, the path must be non-empty and the hint must parse as an
  integer. Problems are reported through parser.error().

  Returns:
    A local_caching.NamedCache rooted at --named-cache-root, with the requested
    caches already touched, or None when --named-cache-root is empty.
  """
  requested = options.named_caches
  if requested and not options.named_cache_root:
    parser.error('--named-cache is specified, but --named-cache-root is empty')

  for cache_name, rel_path, size_hint in requested:
    if not CACHE_NAME_RE.match(cache_name):
      parser.error(
          'cache name %r does not match %r' %
          (cache_name, CACHE_NAME_RE.pattern))
    if not rel_path:
      parser.error('cache path cannot be empty')
    try:
      int(size_hint)
    except ValueError:
      parser.error('cache hint must be a number')

  if not options.named_cache_root:
    return None

  # Make these configurable later if there is use case but for now it's fairly
  # safe values.
  # In practice, a fair chunk of bots are already recycled on a daily schedule
  # so this code doesn't have any effect to them, unless they are preloaded
  # with a really old cache.
  one_tib = 1024 * 1024 * 1024 * 1024
  cache_policies = local_caching.CachePolicies(
      max_cache_size=one_tib,
      min_free_space=options.min_free_space,
      max_items=50,
      max_age_secs=MAX_AGE_SECS)
  named_cache = local_caching.NamedCache(
      os.path.abspath(options.named_cache_root),
      cache_policies,
      time_fn=time_fn)
  # Touch any named caches we're going to use to minimize thrashing
  # between tasks that request some (but not all) of the same named caches.
  wanted_names = [entry[0] for entry in requested]
  named_cache.touch(*wanted_names)
  return named_cache
1461
1462
def parse_args(args):
  """Parses the command line, expanding --argsfile when it is used.

  Args:
    args: list of command line arguments, without the program name.

  Returns:
    A (parser, options, args) tuple where parser is the parser built by
    create_option_parser(), options the parsed options and args the remaining
    positional arguments.
  """
  # Create a fake mini-parser just to get out the "-a" command. Note that
  # it's not documented here; instead, it's documented in create_option_parser
  # even though that parser will never actually get to parse it. This is
  # because --argsfile is exclusive with all other options and arguments.
  file_argparse = argparse.ArgumentParser(add_help=False)
  file_argparse.add_argument('-a', '--argsfile')
  (file_args, nonfile_args) = file_argparse.parse_known_args(args)
  if file_args.argsfile:
    if nonfile_args:
      file_argparse.error('Can\'t specify --argsfile with '
                          'any other arguments (%s)' % nonfile_args)
    try:
      with open(file_args.argsfile, 'r') as f:
        loaded_args = json.load(f)
    except (IOError, OSError, ValueError) as e:
      # We don't error out here: "args" still only holds the --argsfile flag,
      # which the regular parser below accepts, so no command gets parsed out
      # of it.
      print('Couldn\'t read arguments: %s' % e, file=sys.stderr)
    else:
      # Anything but a JSON array cannot be handed to the option parser.
      if not isinstance(loaded_args, list):
        file_argparse.error(
            '--argsfile must contain a JSON array of arguments')
      args = loaded_args

  # Even if we failed to read the args, just call the normal parser now.
  parser = create_option_parser()
  options, args = parser.parse_args(args)
  # The flag may come back as a string; normalize it to a truth value.
  if not isinstance(options.cipd_enabled, (bool, int)):
    options.cipd_enabled = distutils.util.strtobool(options.cipd_enabled)
  return (parser, options, args)
1491
1492
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001493def _calc_named_cache_hint(named_cache, named_caches):
1494 """Returns the expected size of the missing named caches."""
1495 present = named_cache.available
1496 size = 0
Takuto Ikutad169bfd2021-08-02 05:45:09 +00001497 logging.info('available named cache %s', present)
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001498 for name, _, hint in named_caches:
1499 if name not in present:
Takuto Ikuta630f99d2020-07-02 12:59:35 +00001500 hint = int(hint)
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001501 if hint > 0:
Takuto Ikuta74686842021-07-30 04:11:03 +00001502 logging.info("named cache hint: %s, %d", name, hint)
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001503 size += hint
Takuto Ikuta74686842021-07-30 04:11:03 +00001504 logging.info("total size of named cache hint: %d", size)
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001505 return size
1506
1507
Takuto Ikutaae391c52020-12-03 08:43:45 +00001508def _clean_cmd(parser, options, caches, root):
Takuto Ikuta7ff4b242020-12-03 08:07:06 +00001509 """Cleanup cache dirs/files."""
Takuto Ikuta7ff4b242020-12-03 08:07:06 +00001510 if options.json:
1511 parser.error('Can\'t use --json with --clean.')
1512 if options.named_caches:
1513 parser.error('Can\t use --named-cache with --clean.')
1514 if options.cas_instance or options.cas_digest:
1515 parser.error('Can\t use --cas-instance, --cas-digest with --clean.')
1516
1517 logging.info("initial free space: %d", file_path.get_free_space(root))
1518
Junji Watanabe7a631b02022-01-13 02:30:29 +00001519 if options.kvs_dir and fs.isdir(options.kvs_dir):
Takuto Ikuta7ff4b242020-12-03 08:07:06 +00001520 # Remove kvs file if its size exceeds fixed threshold.
Junji Watanabe7a631b02022-01-13 02:30:29 +00001521 kvs_dir = options.kvs_dir
Takuto Ikutab1b70062021-03-22 01:02:41 +00001522 size = file_path.get_recursive_size(kvs_dir)
Takuto Ikuta91cb5ca2021-03-17 07:19:30 +00001523 if size >= _CAS_KVS_CACHE_THRESHOLD:
1524 logging.info("remove kvs dir with size: %d", size)
Takuto Ikutab1b70062021-03-22 01:02:41 +00001525 file_path.rmtree(kvs_dir)
Takuto Ikuta7ff4b242020-12-03 08:07:06 +00001526
1527 # Trim first, then clean.
1528 local_caching.trim_caches(
1529 caches,
1530 root,
1531 min_free_space=options.min_free_space,
1532 max_age_secs=MAX_AGE_SECS)
1533 logging.info("free space after trim: %d", file_path.get_free_space(root))
1534 for c in caches:
1535 c.cleanup()
1536 logging.info("free space after cleanup: %d", file_path.get_free_space(root))
1537
1538
def _is_path_within(path, root):
  """Returns True if |path| is |root| itself or is located below |root|.

  Both paths are expected to be absolute and normalized. The comparison is done
  on whole path components, so '/a/bc' is not considered to be within '/a/b'.
  """
  if path == root:
    return True
  prefix = root if root.endswith(os.sep) else root + os.sep
  return path.startswith(prefix)


def main(args):
  """Entry point: parses |args|, prepares the caches and runs the command.

  Args:
    args: list of command line arguments, without the program name.

  Returns:
    The process exit code: 0 after --clean, 1 when a CIPD, named cache or
    out-of-space error is caught, otherwise the value returned by
    run_tha_test().
  """
  # Warning: when --argsfile is used, the strings are unicode instances, when
  # parsed normally, the strings are str instances.
  (parser, options, args) = parse_args(args)

  # adds another log level for logs which are directed to standard output
  # these logs will be uploaded to cloudstorage
  logging_utils.set_user_level_logging()

  # Must be logged after parse_args(), which eventually calls
  # logging_utils.prepare_logging() which expects no logs before its call.
  logging_utils.user_logs('Starting run_isolated script')

  SWARMING_SERVER = os.environ.get('SWARMING_SERVER')
  SWARMING_TASK_ID = os.environ.get('SWARMING_TASK_ID')
  if options.report_on_exception and SWARMING_SERVER:
    task_url = None
    if SWARMING_TASK_ID:
      task_url = '%s/task?id=%s' % (SWARMING_SERVER, SWARMING_TASK_ID)
    on_error.report_on_exception_exit(SWARMING_SERVER, source=task_url)

  if not file_path.enable_symlink():
    logging.warning('Symlink support is not enabled')

  named_cache = process_named_cache_options(parser, options)
  # hint is 0 if there's no named cache. process_named_cache_options() returns
  # None when --named-cache-root is empty, so don't query it in that case.
  hint = 0
  if named_cache is not None:
    hint = _calc_named_cache_hint(named_cache, options.named_caches)
  if hint:
    # Increase the --min-free-space value by the hint, and recreate the
    # NamedCache instance so it gets the updated CachePolicy.
    options.min_free_space += hint
    named_cache = process_named_cache_options(parser, options)

  # TODO(maruel): CIPD caches should be defined at an higher level here too, so
  # they can be cleaned the same way.

  cas_cache = process_cas_cache_options(options)

  caches = []
  if cas_cache:
    caches.append(cas_cache)
  if named_cache:
    caches.append(named_cache)
  root = caches[0].cache_dir if caches else os.getcwd()
  if options.clean:
    _clean_cmd(parser, options, caches, root)
    return 0

  # Trim must still be done for the following case:
  # - named-cache was used
  # - some entries, with a large hint, where missing
  # - --min-free-space was increased accordingly, thus trimming is needed
  # Otherwise, this will have no effect, as bot_main calls run_isolated with
  # --clean after each task.
  additional_buffer = _FREE_SPACE_BUFFER_FOR_CIPD_PACKAGES
  if options.kvs_dir:
    additional_buffer += _CAS_KVS_CACHE_THRESHOLD
  # Add some buffer for Go CLI.
  min_free_space = options.min_free_space + additional_buffer

  def trim_caches_fn(stats):
    start = time.time()
    local_caching.trim_caches(
        caches, root, min_free_space=min_free_space, max_age_secs=MAX_AGE_SECS)
    duration = time.time() - start
    stats['duration'] = duration
    logging_utils.user_logs('trim_caches: took %d seconds', duration)

  # Save state of cas cache not to overwrite state from go client.
  if cas_cache:
    cas_cache.save()
    cas_cache = None

  if not args:
    parser.error('command to run is required.')

  auth.process_auth_options(parser, options)

  if ISOLATED_OUTDIR_PARAMETER in args and not options.cas_instance:
    parser.error('%s in args requires --cas-instance' %
                 ISOLATED_OUTDIR_PARAMETER)

  if options.root_dir:
    options.root_dir = os.path.abspath(options.root_dir)
  else:
    options.root_dir = tempfile.mkdtemp(prefix='root')
  if options.json:
    options.json = os.path.abspath(options.json)

  if any('=' not in i for i in options.env):
    parser.error(
        '--env required key=value form. value can be skipped to delete '
        'the variable')
  options.env = dict(i.split('=', 1) for i in options.env)

  prefixes = {}
  cwd = os.path.realpath(os.getcwd())
  for item in options.env_prefix:
    if '=' not in item:
      parser.error(
          '--env-prefix %r is malformed, must be in the form `VAR=./path`'
          % item)
    key, opath = item.split('=', 1)
    if os.path.isabs(opath):
      parser.error('--env-prefix %r path is bad, must be relative.' % opath)
    opath = os.path.normpath(opath)
    # Compare whole path components: a bare startswith() would accept a
    # sibling directory that merely shares a name prefix with cwd.
    if not _is_path_within(os.path.realpath(os.path.join(cwd, opath)), cwd):
      parser.error(
          '--env-prefix %r path is bad, must be relative and not contain `..`.'
          % opath)
    prefixes.setdefault(key, []).append(opath)
  options.env_prefix = prefixes

  cipd.validate_cipd_options(parser, options)

  install_packages_fn = copy_local_packages
  if options.cipd_enabled:
    if options.cipd_cache:
      cipd_cache_dir = options.cipd_cache
    else:
      cipd_cache_dir = os.path.join(options.root_dir, 'cipd_cache')
    install_packages_fn = (
        lambda run_dir, cas_dir, nsjail_dir: install_client_and_packages(
            run_dir,
            cipd.parse_package_args(options.cipd_packages),
            options.cipd_server,
            options.cipd_client_package,
            options.cipd_client_version,
            cache_dir=cipd_cache_dir,
            cas_dir=cas_dir,
            nsjail_dir=nsjail_dir,
        ))

  @contextlib.contextmanager
  def install_named_caches(run_dir, stats):
    # WARNING: this function depends on "options" variable defined in the outer
    # function.
    assert str(run_dir), repr(run_dir)
    assert os.path.isabs(run_dir), run_dir
    named_caches = [(os.path.join(run_dir, str(relpath)), name)
                    for name, relpath, _ in options.named_caches]
    install_start = time.time()
    for path, name in named_caches:
      named_cache.install(path, name)
    install_duration = time.time() - install_start
    stats['install']['duration'] = install_duration
    logging.info('named_caches: install took %d seconds', install_duration)
    try:
      yield
    finally:
      # Uninstall each named cache, returning it to the cache pool. If an
      # uninstall fails for a given cache, it will remain in the task's
      # temporary space, get cleaned up by the Swarming bot, and be lost.
      #
      # If the Swarming bot cannot clean up the cache, it will handle it like
      # any other bot file that could not be removed.
      uninstall_start = time.time()
      for path, name in reversed(named_caches):
        try:
          # uninstall() doesn't trim but does call save() implicitly. Trimming
          # *must* be done manually via periodic 'run_isolated.py --clean'.
          named_cache.uninstall(path, name)
        except local_caching.NamedCacheError:
          if sys.platform == 'win32':
            # Show running processes.
            sys.stderr.write("running process\n")
            subprocess42.check_call(['tasklist.exe', '/V'], stdout=sys.stderr)

          # The message reads "named cache <name> at <path>".
          error = (
              'Error while removing named cache %r at %r. The cache will be'
              ' lost.' % (name, path))
          logging.exception(error)
          on_error.report(error)
      uninstall_duration = time.time() - uninstall_start
      stats['uninstall']['duration'] = uninstall_duration
      logging.info('named_caches: uninstall took %d seconds',
                   uninstall_duration)

  command = args
  if options.relative_cwd:
    a = os.path.normpath(os.path.abspath(options.relative_cwd))
    # Same component-wise containment check as for --env-prefix.
    if not _is_path_within(a, os.getcwd()):
      parser.error(
          '--relative-cwd must not try to escape the working directory')

  containment_type = subprocess42.Containment.NONE
  if options.containment_type == 'AUTO':
    containment_type = subprocess42.Containment.AUTO
  if options.containment_type == 'JOB_OBJECT':
    containment_type = subprocess42.Containment.JOB_OBJECT
  if options.containment_type == 'NSJAIL':
    containment_type = subprocess42.Containment.NSJAIL
  # TODO(https://crbug.com/1227833): This object should eventually contain the
  # path to the nsjail binary and the nsjail configuration file.
  containment = subprocess42.Containment(
      containment_type=containment_type,
      limit_processes=options.limit_processes,
      limit_total_committed_memory=options.limit_total_committed_memory)

  data = TaskData(command=command,
                  relative_cwd=options.relative_cwd,
                  cas_instance=options.cas_instance,
                  cas_digest=options.cas_digest,
                  outputs=options.output,
                  install_named_caches=install_named_caches,
                  leak_temp_dir=options.leak_temp_dir,
                  root_dir=options.root_dir,
                  hard_timeout=options.hard_timeout,
                  grace_period=options.grace_period,
                  bot_file=options.bot_file,
                  switch_to_account=options.switch_to_account,
                  install_packages_fn=install_packages_fn,
                  cas_cache_dir=options.cas_cache,
                  cas_cache_policies=local_caching.CachePolicies(
                      max_cache_size=options.max_cache_size,
                      min_free_space=options.min_free_space,
                      max_items=None,
                      max_age_secs=None,
                  ),
                  cas_kvs=options.kvs_dir,
                  env=options.env,
                  env_prefix=options.env_prefix,
                  lower_priority=bool(options.lower_priority),
                  containment=containment,
                  trim_caches_fn=trim_caches_fn)
  try:
    return run_tha_test(data, options.json)
  except (cipd.Error, local_caching.NamedCacheError,
          local_caching.NoMoreSpace) as ex:
    # Exceptions only carry a 'message' attribute when their class defines
    # one; fall back to str() so reporting the error cannot itself raise.
    print(getattr(ex, 'message', str(ex)), file=sys.stderr)
    on_error.report(None)
    return 1
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001771
if __name__ == '__main__':
  # Script entry point: set up the process, then exit with main()'s result.
  subprocess42.inhibit_os_error_reporting()
  # Ensure that we are always running with the correct encoding.
  fix_encoding.fix_encoding()
  user_agent = 'run_isolated.py/' + __version__
  net.set_user_agent(user_agent)
  exit_code = main(sys.argv[1:])
  sys.exit(exit_code)
Marc-Antoine Ruel90c98162013-12-18 15:11:57 -05001777 sys.exit(main(sys.argv[1:]))