blob: 4afaa8932dd538930c179d43fc90b6488308532d [file] [log] [blame]
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001#!/usr/bin/env python
maruelea586f32016-04-05 11:11:33 -07002# Copyright 2012 The LUCI Authors. All rights reserved.
maruelf1f5e2a2016-05-25 17:10:39 -07003# Use of this source code is governed under the Apache License, Version 2.0
4# that can be found in the LICENSE file.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00005
nodir55be77b2016-05-03 09:39:57 -07006"""Runs a command with optional isolated input/output.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00007
run_isolated takes care of setting up a temporary environment, running a
command, and tearing it down.
nodir55be77b2016-05-03 09:39:57 -070010
Marc-Antoine Rueleed2f3a2019-03-14 00:00:40 +000011It handles downloading and uploading isolated files, mapping CIPD packages and
12reusing stateful named caches.
13
14The isolated files, CIPD packages and named caches are kept as a global LRU
15cache.
Marc-Antoine Ruel2283ad12014-02-09 11:14:57 -050016
Roberto Carrillo71ade6d2018-10-08 22:30:24 +000017Any ${EXECUTABLE_SUFFIX} on the command line or the environment variables passed
18with the --env option will be replaced with ".exe" string on Windows and "" on
19other platforms.
nodirbe642ff2016-06-09 15:51:51 -070020
Roberto Carrillo71ade6d2018-10-08 22:30:24 +000021Any ${ISOLATED_OUTDIR} on the command line or the environment variables passed
22with the --env option will be replaced by the location of a temporary directory
23upon execution of the command specified in the .isolated file. All content
24written to this directory will be uploaded upon termination and the .isolated
25file describing this directory will be printed to stdout.
bpastene447c1992016-06-20 15:21:47 -070026
Marc-Antoine Rueleed2f3a2019-03-14 00:00:40 +000027Any ${SWARMING_BOT_FILE} on the command line or the environment variables passed
28with the --env option will be replaced by the value of the --bot-file parameter.
29This file is used by a swarming bot to communicate state of the host to tasks.
30It is written to by the swarming bot's on_before_task() hook in the swarming
31server's custom bot_config.py.
32
Joanna Wang4cec0e42021-08-26 00:48:37 +000033Any ${SWARMING_TASK_ID} on the command line will be replaced by the
34SWARMING_TASK_ID value passed with the --env option.
35
Marc-Antoine Rueleed2f3a2019-03-14 00:00:40 +000036See
37https://chromium.googlesource.com/infra/luci/luci-py.git/+/master/appengine/swarming/doc/Magic-Values.md
38for all the variables.
39
40See
41https://chromium.googlesource.com/infra/luci/luci-py.git/+/master/appengine/swarming/swarming_bot/config/bot_config.py
42for more information about bot_config.py.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000043"""
44
Marc-Antoine Ruelf899c482019-10-10 23:32:06 +000045from __future__ import print_function
46
47__version__ = '1.0.1'
maruel@chromium.orgdedbf492013-09-12 20:42:11 +000048
aludwin7556e0c2016-10-26 08:46:10 -070049import argparse
maruel064c0a32016-04-05 11:47:15 -070050import base64
iannucci96fcccc2016-08-30 15:52:22 -070051import collections
vadimsh232f5a82017-01-20 19:23:44 -080052import contextlib
Ye Kuangfff1e502020-07-13 13:21:57 +000053import distutils
Sadaf Matinkhoo10743a62018-03-29 16:28:58 -040054import errno
aludwin7556e0c2016-10-26 08:46:10 -070055import json
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000056import logging
57import optparse
58import os
Takuto Ikuta5c59a842020-01-24 03:05:24 +000059import platform
Marc-Antoine Ruel8b11dbd2018-05-18 14:31:22 -040060import re
Junji Watanabedc2f89e2021-11-08 08:44:30 +000061import shutil
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000062import sys
63import tempfile
maruel064c0a32016-04-05 11:47:15 -070064import time
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000065
Marc-Antoine Ruel016c7602019-04-02 18:31:13 +000066from utils import tools
67tools.force_local_third_party()
vadimsh@chromium.orga4326472013-08-24 02:05:41 +000068
Marc-Antoine Ruel016c7602019-04-02 18:31:13 +000069# third_party/
70from depot_tools import fix_encoding
Takuto Ikuta6e2ff962019-10-29 12:35:27 +000071import six
Marc-Antoine Ruel016c7602019-04-02 18:31:13 +000072
73# pylint: disable=ungrouped-imports
Takuto Ikutad53d7bd2021-07-16 03:09:33 +000074import DEPS
Marc-Antoine Ruel016c7602019-04-02 18:31:13 +000075import auth
76import cipd
Marc-Antoine Ruel016c7602019-04-02 18:31:13 +000077import local_caching
78from libs import luci_context
Vadim Shtayura6b555c12014-07-23 16:22:18 -070079from utils import file_path
maruel12e30012015-10-09 11:55:35 -070080from utils import fs
Marc-Antoine Ruelf74cffe2015-07-15 15:21:34 -040081from utils import logging_utils
Ye Kuang2dd17442020-04-22 08:45:52 +000082from utils import net
Marc-Antoine Ruelcfb60852014-07-02 15:22:00 -040083from utils import on_error
Marc-Antoine Ruelc44f5722015-01-08 16:10:01 -050084from utils import subprocess42
maruel@chromium.orgdedbf492013-09-12 20:42:11 +000085
vadimsh@chromium.orga4326472013-08-24 02:05:41 +000086
maruele2f2cb82016-07-13 14:41:03 -070087# Magic variables that can be found in the isolate task command line.
88ISOLATED_OUTDIR_PARAMETER = '${ISOLATED_OUTDIR}'
89EXECUTABLE_SUFFIX_PARAMETER = '${EXECUTABLE_SUFFIX}'
90SWARMING_BOT_FILE_PARAMETER = '${SWARMING_BOT_FILE}'
Joanna Wang4cec0e42021-08-26 00:48:37 +000091SWARMING_TASK_ID_PARAMETER = '${SWARMING_TASK_ID}'
maruele2f2cb82016-07-13 14:41:03 -070092
93
csharp@chromium.orgff2a4662012-11-21 20:49:32 +000094# The name of the log file to use.
95RUN_ISOLATED_LOG_FILE = 'run_isolated.log'
96
maruele2f2cb82016-07-13 14:41:03 -070097
maruele2f2cb82016-07-13 14:41:03 -070098# Use short names for temporary directories. This is driven by Windows, which
99# imposes a relatively short maximum path length of 260 characters, often
100# referred to as MAX_PATH. It is relatively easy to create files with longer
Marc-Antoine Ruel793bff32019-04-18 17:50:48 +0000101# path length. A use case is with recursive dependency trees like npm packages.
maruele2f2cb82016-07-13 14:41:03 -0700102#
103# It is recommended to start the script with a `root_dir` as short as
104# possible.
105# - ir stands for isolated_run
106# - io stands for isolated_out
107# - it stands for isolated_tmp
Takuto Ikutab7ce0e32019-11-27 23:26:18 +0000108# - ic stands for isolated_client
Anirudh Mathukumilli92d57b62021-08-04 23:21:57 +0000109# - ns stands for nsjail
maruele2f2cb82016-07-13 14:41:03 -0700110ISOLATED_RUN_DIR = u'ir'
111ISOLATED_OUT_DIR = u'io'
112ISOLATED_TMP_DIR = u'it'
Takuto Ikutab7ce0e32019-11-27 23:26:18 +0000113ISOLATED_CLIENT_DIR = u'ic'
Junji Watanabe4b890ef2020-09-16 01:43:27 +0000114_CAS_CLIENT_DIR = u'cc'
Anirudh Mathukumilli92d57b62021-08-04 23:21:57 +0000115_NSJAIL_DIR = u'ns'
maruele2f2cb82016-07-13 14:41:03 -0700116
# CIPD package names and the versions to install. The versions are read from
# the first package entry of the matching dependency in DEPS.
# TODO(tikuta): take these parameter from luci-config?
_CAS_PACKAGE = 'infra/tools/luci/cas/${platform}'
_LUCI_GO_REVISION = DEPS.deps['luci-go']['packages'][0]['version']
_NSJAIL_PACKAGE = 'infra/3pp/tools/nsjail/${platform}'
_NSJAIL_VERSION = DEPS.deps['nsjail']['packages'][0]['version']
maruele2f2cb82016-07-13 14:41:03 -0700122
Marc-Antoine Ruel8b11dbd2018-05-18 14:31:22 -0400123# Keep synced with task_request.py
Lei Leife202df2019-06-11 17:33:34 +0000124CACHE_NAME_RE = re.compile(r'^[a-z0-9_]{1,4096}$')
Marc-Antoine Ruel8b11dbd2018-05-18 14:31:22 -0400125
Takuto Ikutac9ddff22021-02-18 07:58:39 +0000126_FREE_SPACE_BUFFER_FOR_CIPD_PACKAGES = 2 * 1024 * 1024 * 1024
Marc-Antoine Ruel8b11dbd2018-05-18 14:31:22 -0400127
# Error message template. It takes two %s values, in order: the name of the
# directory that could not be deleted, and the number of seconds a process is
# given after the signal before it is forcibly killed.
marueld928c862017-06-08 08:20:04 -0700128OUTLIVING_ZOMBIE_MSG = """\
129*** Swarming tried multiple times to delete the %s directory and failed ***
130*** Hard failing the task ***
131
132Swarming detected that your testing script ran an executable, which may have
133started a child executable, and the main script returned early, leaving the
134children executables playing around unguided.
135
136You don't want to leave children processes outliving the task on the Swarming
137bot, do you? The Swarming bot doesn't.
138
139How to fix?
140- For any process that starts children processes, make sure all children
141 processes terminated properly before each parent process exits. This is
142 especially important in very deep process trees.
143 - This must be done properly both in normal successful task and in case of
144 task failure. Cleanup is very important.
145- The Swarming bot sends a SIGTERM in case of timeout.
146 - You have %s seconds to comply after the signal was sent to the process
147 before the process is forcibly killed.
148- To achieve not leaking children processes in case of signals on timeout, you
149 MUST handle signals in each executable / python script and propagate them to
150 children processes.
151 - When your test script (python or binary) receives a signal like SIGTERM or
152 CTRL_BREAK_EVENT on Windows), send it to all children processes and wait for
153 them to terminate before quitting.
154
155See
Marc-Antoine Ruelc7243592018-05-24 17:04:04 -0400156https://chromium.googlesource.com/infra/luci/luci-py.git/+/master/appengine/swarming/doc/Bot.md#Graceful-termination_aka-the-SIGTERM-and-SIGKILL-dance
marueld928c862017-06-08 08:20:04 -0700157for more information.
158
159*** May the SIGKILL force be with you ***
160"""
161
162
Marc-Antoine Ruel5d7606b2018-06-15 19:06:12 +0000163# Currently hardcoded. Eventually could be exposed as a flag once there's value.
164# 3 weeks
165MAX_AGE_SECS = 21*24*60*60
166
Takuto Ikuta7ff4b242020-12-03 08:07:06 +0000167_CAS_KVS_CACHE_THRESHOLD = 5 * 1024 * 1024 * 1024 # 5 GiB
168
# Immutable bundle of everything needed to run one task. Field order matters
# to positional callers; keep it stable.
TaskData = collections.namedtuple(
    'TaskData',
    (
        # Command line to run, as a list of strings. It is used regardless of
        # what the isolated file specified.
        'command',
        # Directory, relative, in which the command is started.
        'relative_cwd',
        # RBE-CAS digest of the input root.
        'cas_digest',
        # Full name of the CAS instance.
        'cas_instance',
        # Paths, relative to root_dir, that are added to the output isolated
        # bundle once the task completes (see link_outputs_to_outdir).
        'outputs',
        # Function (run_dir) => context manager installing the named caches
        # into |run_dir|.
        'install_named_caches',
        # When True, the temporary directory is intentionally left behind so
        # it can be examined later.
        'leak_temp_dir',
        # Directory under which the temporary directory is created. When not
        # specified, a random temporary directory is created.
        'root_dir',
        # The process is killed if it runs longer than this many seconds.
        'hard_timeout',
        # Seconds to wait between SIGTERM and SIGKILL.
        'grace_period',
        # Path to a file holding bot state; substituted for
        # ${SWARMING_BOT_FILE} in the task command line.
        'bot_file',
        # Logical account LUCI_CONTEXT is switched into.
        'switch_to_account',
        # Context manager dir => CipdInfo, see install_client_and_packages.
        'install_packages_fn',
        # Cache directory used by the `cas` client.
        'cas_cache_dir',
        # Parameters handed to the `cas` client.
        'cas_cache_policies',
        # Parameters for the kvs file used by the `cas` client.
        'cas_kvs',
        # Environment variables to set.
        'env',
        # Environment variables to mutate with relative directories.
        # Example: {"ENV_KEY": ['relative', 'paths', 'to', 'prepend']}
        'env_prefix',
        # Lowers the priority of the task process.
        'lower_priority',
        # subprocess42.Containment instance; may be None.
        'containment',
        # Function that trims caches before cipd packages are installed and
        # isolated files are downloaded.
        'trim_caches_fn',
    ))
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -0500223
224
Marc-Antoine Ruelee6ca622017-11-29 11:19:16 -0500225def _to_str(s):
226 """Downgrades a unicode instance to str. Pass str through as-is."""
227 if isinstance(s, str):
228 return s
229 # This is technically incorrect, especially on Windows. In theory
230 # sys.getfilesystemencoding() should be used to use the right 'ANSI code
231 # page' on Windows, but that causes other problems, as the character set
232 # is very limited.
233 return s.encode('utf-8')
234
235
def _to_unicode(s):
  """Returns |s| as unicode text.

  None and values that are already text are returned unchanged; anything else
  is decoded as UTF-8.
  """
  if s is None or isinstance(s, six.text_type):
    return s
  return s.decode('utf-8')
241
242
def make_temp_dir(prefix, root_dir):
  """Creates a new unique temporary directory and returns its path as text.

  Args:
    prefix: prefix for the directory name.
    root_dir: directory in which the new directory is created.
  """
  new_dir = tempfile.mkdtemp(prefix=prefix, dir=root_dir)
  return six.text_type(new_dir)
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +0000246
247
@contextlib.contextmanager
def set_luci_context_account(account, tmp_dir):
  """Context manager that selects the LUCI_CONTEXT account used by the task.

  Nothing is changed in any of these cases:
  - 'account' is None or ''. This is what happens when run_isolated.py is
    called without the '--switch-to-account' flag; if run_isolated.py itself
    runs inside a LUCI_CONTEXT environment, the task simply inherits whatever
    account is already set. Users invoking run_isolated.py explicitly from
    their own code may end up here.
  - LUCI_CONTEXT-based auth is not in use.
  - The requested account is already the default one.

  Otherwise, when the requested account is defined in the context it becomes
  the default account. When it is not defined, the default account is removed,
  which switches to non-authenticated access; this happens for Swarming tasks
  that don't use 'task' service accounts.

  Args:
    account: logical account to switch to, or None/'' to not switch.
    tmp_dir: passed to luci_context.write() as |_tmpdir|.
  """
  # Only consult LUCI_CONTEXT when a switch was actually requested.
  local_auth = luci_context.read('local_auth') if account else None

  # See LUCI_CONTEXT.md for the format of 'local_auth'.
  if not local_auth or local_auth.get('default_account_id') == account:
    # Not switching, not using LUCI_CONTEXT auth at all, or already set.
    yield
    return

  known_ids = set()
  for entry in local_auth.get('accounts') or []:
    known_ids.add(entry['id'])

  if account not in known_ids:
    logging.warning(
        'Requested LUCI_CONTEXT account %r is not available (have only %r), '
        'disabling authentication', account, sorted(known_ids))
    local_auth.pop('default_account_id', None)
  else:
    logging.info('Switching default LUCI_CONTEXT account to %r', account)
    local_auth['default_account_id'] = account

  with luci_context.write(_tmpdir=tmp_dir, local_auth=local_auth):
    yield
294
295
def process_command(command, out_dir, bot_file):
  """Returns a copy of |command| with parameters replaced in every argument.

  Each argument is passed through replace_parameters().

  Raises:
    ValueError if a parameter is requested in |command| but its value is not
    provided.
  """
  processed = []
  for arg in command:
    processed.append(replace_parameters(arg, out_dir, bot_file))
  return processed
304
305
def replace_parameters(arg, out_dir, bot_file):
  """Returns |arg| with parameter tokens replaced by their values.

  Substitutions, in order:
  - EXECUTABLE_SUFFIX_PARAMETER becomes cipd.EXECUTABLE_SUFFIX.
  - ISOLATED_OUTDIR_PARAMETER becomes |out_dir|.
  - SWARMING_BOT_FILE_PARAMETER becomes |bot_file|; when |bot_file| is not
    set, a warning is logged and the token is left as-is.
  - SWARMING_TASK_ID_PARAMETER becomes the SWARMING_TASK_ID environment
    variable, when that variable is set.

  Raises:
    ValueError if a parameter is requested in |arg| but its value is not
    provided.
  """
  arg = arg.replace(EXECUTABLE_SUFFIX_PARAMETER, cipd.EXECUTABLE_SUFFIX)
  has_path_substitution = False

  if ISOLATED_OUTDIR_PARAMETER in arg:
    if not out_dir:
      raise ValueError(
          'output directory is requested in command or env var, but not '
          'provided; please specify one')
    arg = arg.replace(ISOLATED_OUTDIR_PARAMETER, out_dir)
    has_path_substitution = True

  if SWARMING_BOT_FILE_PARAMETER in arg:
    if not bot_file:
      logging.warning('SWARMING_BOT_FILE_PARAMETER found in command or env '
                      'var, but no bot_file specified. Leaving parameter '
                      'unchanged.')
    else:
      arg = arg.replace(SWARMING_BOT_FILE_PARAMETER, bot_file)
      has_path_substitution = True

  if SWARMING_TASK_ID_PARAMETER in arg:
    task_id = os.environ.get('SWARMING_TASK_ID')
    if task_id:
      arg = arg.replace(SWARMING_TASK_ID_PARAMETER, task_id)

  if not has_path_substitution:
    return arg
  # Slashes are converted only when a path parameter was substituted, because
  # of arguments like '${ISOLATED_OUTDIR}/foo/bar'.
  return arg.replace('/', os.sep)
maruela9cfd6f2015-09-15 11:03:15 -0700339
340
def set_temp_dir(env, tmp_dir):
  """Points the temp directory variables in the |env| dict at |tmp_dir|.

  |env| is modified in place. TMPDIR is always set; further variables are set
  depending on sys.platform.
  """
  value = _to_str(tmp_dir)
  # pylint: disable=line-too-long
  platform_specific = {
      # * chromium's base utils uses GetTempPath().
      #   https://cs.chromium.org/chromium/src/base/files/file_util_win.cc?q=GetTempPath
      # * Go uses GetTempPath().
      # * GetTempDir() uses %TMP%, then %TEMP%, then other stuff. So %TMP%
      #   must be set.
      #   https://docs.microsoft.com/en-us/windows/desktop/api/fileapi/nf-fileapi-gettemppathw
      #   https://blogs.msdn.microsoft.com/oldnewthing/20150417-00/?p=44213
      'win32': ('TMP', 'TEMP'),
      # * Chromium uses an hack on macOS before calling into
      #   NSTemporaryDirectory().
      #   https://cs.chromium.org/chromium/src/base/files/file_util_mac.mm?q=GetTempDir
      #   https://developer.apple.com/documentation/foundation/1409211-nstemporarydirectory
      'darwin': ('MAC_CHROMIUM_TMPDIR',),
  }
  # Nothing more than TMPDIR is needed on other platforms. TMPDIR is specified
  # as the POSIX standard envvar for the temp directory.
  # http://pubs.opengroup.org/onlinepubs/9699919799/basedefs/V1_chap08.html
  # * mktemp on linux respects $TMPDIR.
  # * Chromium respects $TMPDIR on linux.
  #   https://cs.chromium.org/chromium/src/base/files/file_util_posix.cc?q=GetTempDir
  # * Go uses $TMPDIR.
  #   https://go.googlesource.com/go/+/go1.10.3/src/os/file_unix.go#307
  extra_names = platform_specific.get(sys.platform, ())

  # * python respects $TMPDIR, $TEMP, and $TMP in this order, regardless of
  #   platform. So $TMPDIR must be set on all platforms.
  #   https://github.com/python/cpython/blob/2.7/Lib/tempfile.py#L155
  for name in ('TMPDIR',) + extra_names:
    env[name] = value
374
Roberto Carrillo71ade6d2018-10-08 22:30:24 +0000375
def get_command_env(tmp_dir, cipd_info, run_dir, env, env_prefixes, out_dir,
                    bot_file):
  """Returns full OS environment to run a command in.

  Starts from a copy of os.environ, applies |env|, then sets up TEMP, puts the
  directory with the cipd binary in front of PATH, exposes the CIPD_CACHE_DIR
  env var, and installs all env_prefixes.

  Args:
    tmp_dir: temp directory.
    cipd_info: CipdInfo object if cipd client is used, None if not.
    run_dir: The root directory the isolated tree is mapped in.
    env: environment variables to use. A falsy value removes the variable;
        other values go through replace_parameters().
    env_prefixes: {"ENV_KEY": ['cwd', 'relative', 'paths', 'to', 'prepend']}
    out_dir: Isolated output directory. Required to be != None if any of the
        env vars contain ISOLATED_OUTDIR_PARAMETER.
    bot_file: Required to be != None if any of the env vars contain
        SWARMING_BOT_FILE_PARAMETER.

  Returns:
    dict of environment variables.
  """
  out = os.environ.copy()
  for k, v in env.items():
    if not v:
      out.pop(k, None)
    else:
      out[k] = replace_parameters(v, out_dir, bot_file)

  if cipd_info:
    bin_dir = _to_str(os.path.dirname(cipd_info.client.binary_path))
    # PATH can be missing, e.g. when |env| removed it with an empty value. Do
    # not fail with KeyError in that case; the cipd directory becomes the
    # whole PATH.
    cur_path = out.get('PATH')
    if cur_path is None:
      out['PATH'] = bin_dir
    else:
      out['PATH'] = '%s%s%s' % (bin_dir, os.pathsep, cur_path)
    out['CIPD_CACHE_DIR'] = _to_str(cipd_info.cache_dir)
    # Dump the package pins to a file and expose its location to the task.
    cipd_info_path = os.path.join(tmp_dir, 'cipd_info.json')
    with open(cipd_info_path, 'w') as f:
      json.dump(cipd_info.pins, f)
    out['ISOLATED_RESOLVED_PACKAGE_VERSIONS_FILE'] = cipd_info_path

  for key, paths in env_prefixes.items():
    assert isinstance(paths, list), paths
    paths = [os.path.normpath(os.path.join(run_dir, p)) for p in paths]
    # The prefixes go in front of the current value, if there is one.
    cur = out.get(key)
    if cur:
      paths.append(cur)
    out[key] = _to_str(os.path.pathsep.join(paths))

  set_temp_dir(out, tmp_dir)
  return out
vadimsh232f5a82017-01-20 19:23:44 -0800420
421
def run_command(
    command, cwd, env, hard_timeout, grace_period, lower_priority, containment):
  """Runs the command, enforcing the hard timeout and the grace period.

  Args:
    command: command line to run.
    cwd: directory to start the command in.
    env: environment passed to the child process.
    hard_timeout: seconds to wait before sending SIGTERM; a falsy value is
        passed to wait() as None.
    grace_period: seconds to wait after SIGTERM before sending SIGKILL; a
        falsy value is passed to wait() as None.
    lower_priority: forwarded to subprocess42.Popen.
    containment: forwarded to subprocess42.Popen.

  Returns:
    tuple(process exit code, bool if had a hard timeout)
  """
  logging.info(
      'run_command(%s, %s, %s, %s, %s, %s)',
      command, cwd, hard_timeout, grace_period, lower_priority, containment)

  exit_code = None
  had_hard_timeout = False
  with tools.Profiler('RunTest'):
    proc = None
    had_signal = []

    # TODO(maruel): This code is imperfect. It doesn't handle well signals
    # during the download phase and there's short windows where things can go
    # wrong.
    def handler(signum, _frame):
      # Only the first signal received once the process exists is turned into
      # a timeout.
      if proc and not had_signal:
        logging.info('Received signal %d', signum)
        had_signal.append(True)
        raise subprocess42.TimeoutExpired(command, None)

    def ignore(*_):
      return None

    try:
      proc = subprocess42.Popen(
          command,
          cwd=cwd,
          env=env,
          detached=True,
          close_fds=True,
          lower_priority=lower_priority,
          containment=containment)
      logging.info('Subprocess for command started')
      with subprocess42.set_signal_handler(subprocess42.STOP_SIGNALS, handler):
        try:
          exit_code = proc.wait(hard_timeout or None)
          logging.info("finished with exit code %d", exit_code)
        except subprocess42.TimeoutExpired:
          # Raised either by wait() or by handler() above; only the former is
          # a hard timeout.
          if not had_signal:
            logging.warning('Hard timeout')
            had_hard_timeout = True
          logging.warning('Sending SIGTERM')
          proc.terminate()

      kill_sent = False
      # Ignore signals in grace period. Forcibly give the grace period to the
      # child process.
      if exit_code is None:
        with subprocess42.set_signal_handler(subprocess42.STOP_SIGNALS, ignore):
          try:
            exit_code = proc.wait(grace_period or None)
            logging.info("finished with exit code %d", exit_code)
          except subprocess42.TimeoutExpired:
            # Now kill for real. The user can distinguish between the
            # following states:
            # - signal but process exited within grace period,
            #   hard_timed_out will be set but the process exit code will be
            #   script provided.
            # - processed exited late, exit code will be -9 on posix.
            logging.warning('Grace exhausted; sending SIGKILL')
            proc.kill()
            kill_sent = True
        logging.info('Waiting for process exit')
        exit_code = proc.wait()

      # the process group / job object may be dangling so if we didn't kill
      # it already, give it a poke now.
      if not kill_sent:
        proc.kill()
    except OSError as e:
      # This is not considered to be an internal error. The executable simply
      # does not exist.
      failure_text = (
          '<The executable does not exist, a dependent library is missing or '
          'the command line is too long>\n'
          '<Check for missing .so/.dll in the .isolate or GN file or length of '
          'command line args>\n'
          '<Command: %s>\n'
          '<Exception: %s>\n' % (command, e))
      sys.stderr.write(failure_text)
      if os.environ.get('SWARMING_TASK_ID'):
        # Give an additional hint when running as a swarming task.
        sys.stderr.write(
            "<See the task's page for commands to help diagnose this issue "
            'by reproducing the task locally>\n')
      exit_code = 1
  # The hex form shows the exit code masked to 32 bits.
  logging.info(
      'Command finished with exit code %d (%s)',
      exit_code, hex(0xffffffff & exit_code))
  return exit_code, had_hard_timeout
maruela9cfd6f2015-09-15 11:03:15 -0700509
510
def _run_go_cmd_and_wait(cmd, tmp_dir):
  """
  Runs an external Go command, `isolated` or `cas`, and wait for its completion.

  While this is a generic function to launch a subprocess, it has logic that
  is specific to Go `isolated` and `cas` for waiting and logging.

  The command runs with a copy of os.environ whose temp directory variables
  point at |tmp_dir|.

  Returns:
    The subprocess object

  Raises:
    subprocess42.CalledProcessError if the command exits with a non-zero code.
    ValueError if the command is still running after the maximum timeout.
  """
  cmd_str = ' '.join(cmd)
  check_period_sec = 30
  max_checks = 100
  try:
    env = os.environ.copy()
    set_temp_dir(env, tmp_dir)
    proc = subprocess42.Popen(cmd, env=env)

    # max timeout = max_checks * check_period_sec = 50 minutes
    for attempt in range(1, max_checks + 1):
      # Waiting in short periods and printing in between is to prevent I/O
      # timeout error during setup.
      try:
        retcode = proc.wait(check_period_sec)
      except subprocess42.TimeoutExpired:
        print('still running (after %d seconds)' % (attempt * check_period_sec))
        continue
      if retcode != 0:
        raise subprocess42.CalledProcessError(retcode, cmd=cmd_str)
      break
    else:
      # Every check timed out: stop the process, politely first.
      proc.terminate()
      try:
        proc.wait(check_period_sec)
      except subprocess42.TimeoutExpired:
        logging.exception(
            "failed to terminate? timeout happened after %d seconds",
            check_period_sec)
        proc.kill()
      proc.wait()
      # Raise unconditionally, because |proc| was forcefully terminated.
      raise ValueError("timedout after %d seconds (cmd=%s)" %
                       (check_period_sec * max_checks, cmd_str))

    return proc
  except Exception:
    logging.exception('Failed to run Go cmd %s', cmd_str)
    raise
Ye Kuangc0cf9ca2020-07-16 08:56:51 +0000560
561
def _fetch_and_map(cas_client, digest, instance, output_dir, cache_dir,
                   policies, kvs_dir, tmp_dir):
  """
  Fetches a CAS tree using cas client, create the tree and returns download
  stats.

  Args:
    cas_client: path of the `cas` client executable to run.
    digest: value passed to the client's -digest flag.
    instance: CAS instance name; ignored when the RUN_ISOLATED_CAS_ADDRESS
        environment variable is set.
    output_dir: directory the tree is downloaded into.
    cache_dir: value passed to the client's -cache-dir flag.
    policies: object whose max_cache_size and min_free_space attributes are
        passed to the client.
    kvs_dir: optional kvs directory for the client. When set and the client
        fails, |kvs_dir| and |output_dir| are removed and the download is
        retried once.
    tmp_dir: temp directory the client is run with.

  Returns:
    dict with 'duration' (seconds spent in this function), 'items_cold' and
    'items_hot' (both taken from the stats file written by the client).
  """
  start = time.time()
  # The client writes its stats into this file; only the path is needed here.
  result_json_handle, result_json_path = tempfile.mkstemp(
      prefix=u'fetch-and-map-result-', suffix=u'.json')
  os.close(result_json_handle)

  try:
    cmd = [
        cas_client,
        'download',
        '-digest',
        digest,
        # flags for cache.
        '-cache-dir',
        cache_dir,
        '-cache-max-size',
        str(policies.max_cache_size),
        '-cache-min-free-space',
        str(policies.min_free_space),
        # flags for output.
        '-dir',
        output_dir,
        '-dump-stats-json',
        result_json_path,
        '-log-level',
        'info',
    ]

    # When RUN_ISOLATED_CAS_ADDRESS is set in test mode,
    # Use it and ignore CAS instance option.
    cas_addr = os.environ.get('RUN_ISOLATED_CAS_ADDRESS')
    if cas_addr:
      cmd.extend(['-cas-addr', cas_addr])
    else:
      cmd.extend(['-cas-instance', instance])

    if kvs_dir:
      cmd.extend(['-kvs-dir', kvs_dir])

    try:
      _run_go_cmd_and_wait(cmd, tmp_dir)
    except subprocess42.CalledProcessError as ex:
      if not kvs_dir:
        raise
      logging.exception('Failed to run cas, removing kvs cache dir and retry.')
      on_error.report("Failed to run cas %s" % ex)
      # Start the retry from a clean state.
      file_path.rmtree(kvs_dir)
      file_path.rmtree(output_dir)
      _run_go_cmd_and_wait(cmd, tmp_dir)

    with open(result_json_path) as json_file:
      result_json = json.load(json_file)

    return {
        'duration': time.time() - start,
        'items_cold': result_json['items_cold'],
        'items_hot': result_json['items_hot'],
    }
  finally:
    fs.remove(result_json_path)
Junji Watanabe4b890ef2020-09-16 01:43:27 +0000636
637
def link_outputs_to_outdir(run_dir, out_dir, outputs):
  """Mirrors the named outputs from run_dir into out_dir for upload.

  Does nothing when |outputs| is empty or None. Otherwise the directories
  needed for |outputs| are created under |out_dir| and every entry is copied
  (or hardlinked) from |run_dir| to the same relative path under |out_dir|
  through copy_recursively().

  Arguments:
  - run_dir: directory the task ran in; |outputs| are relative to it.
  - out_dir: directory whose content gets uploaded.
  - outputs: iterable of relative paths to collect.
  """
  if outputs:
    file_path.create_directories(out_dir, outputs)
    for rel_path in outputs:
      source = os.path.join(run_dir, rel_path)
      destination = os.path.join(out_dir, rel_path)
      copy_recursively(source, destination)
648
649
def copy_recursively(src, dst):
  """Efficiently copies a file or directory from src to dst.

  `src` may be a file, directory, or a symlink to a file or directory.
  All symlinks are replaced with their targets, so the resulting
  directory structure under dst will never have any symlinks.

  To increase speed, copy_recursively links individual files into the
  (newly created) directory structure with
  file_path.HARDLINK_WITH_FALLBACK, unlike Python's shutil.copytree().

  This function is best effort: a missing source, a broken symlink, a symlink
  cycle or any other OSError is logged and the entry is skipped; nothing is
  raised to the caller for those cases.

  Arguments:
  - src: path to copy from.
  - dst: path to copy to.
  """
  orig_src = src
  try:
    # Replace symlinks with their final target. os.path.realpath() may return
    # a path that is still a symlink when the links form a cycle, so remember
    # every link already visited to guarantee that this loop terminates.
    seen_links = set()
    while fs.islink(src):
      if src in seen_links:
        logging.warning('Path %s is part of a symlink cycle reached from %s',
                        src, orig_src)
        return
      seen_links.add(src)
      res = fs.readlink(src)
      src = os.path.realpath(os.path.join(os.path.dirname(src), res))

    if not fs.exists(src):
      logging.warning('Path %s does not exist or %s is a broken symlink', src,
                      orig_src)
      return

    if fs.isfile(src):
      file_path.link_file(dst, src, file_path.HARDLINK_WITH_FALLBACK)
      return

    # |src| is a directory: mirror it and recurse into every child.
    if not fs.exists(dst):
      os.makedirs(dst)

    for child in fs.listdir(src):
      copy_recursively(os.path.join(src, child), os.path.join(dst, child))

  except OSError as e:
    if e.errno == errno.ENOENT:
      # The path vanished between the checks above and its use.
      logging.warning('Path %s does not exist or %s is a broken symlink',
                      src, orig_src)
    else:
      logging.info("Couldn't collect output file %s: %s", src, e)
aludwin0a8e17d2016-10-27 15:57:39 -0700690
691
def upload_outdir(cas_client, cas_instance, outdir, tmp_dir):
  """Archives the content of |outdir| to CAS, if there is any.

  Runs `<cas_client> archive` through _run_go_cmd_and_wait() and reads back
  the digest and stats files the client dumps.

  Arguments:
  - cas_client: path to the cas client executable.
  - cas_instance: CAS instance name; passed as -cas-instance unless the
        RUN_ISOLATED_CAS_ADDRESS environment variable is set.
  - outdir: directory to upload.
  - tmp_dir: forwarded to _run_go_cmd_and_wait().

  Returns:
    tuple(root_digest, stats)
    - root_digest: dict with 'cas_instance' and 'digest' ('hash' and
          'size_bytes') describing the uploaded directory.
    - stats: uploading stats loaded from the client's JSON dump, plus a
          'duration' entry.
    Both are None when |outdir| is empty.
  """
  if not fs.listdir(outdir):
    return None, None

  # The client writes its results into these two scratch files.
  handle, digest_path = tempfile.mkstemp(prefix=u'cas-digest', suffix=u'.txt')
  os.close(handle)
  handle, stats_json_path = tempfile.mkstemp(
      prefix=u'upload-stats', suffix=u'.json')
  os.close(handle)

  try:
    # -paths format: <working directory>:<relative path to dir>
    cmd = [cas_client, 'archive', '-paths', outdir + ':']
    # output
    cmd += ['-dump-digest', digest_path, '-dump-stats-json', stats_json_path]

    # When RUN_ISOLATED_CAS_ADDRESS is set in test mode,
    # Use it and ignore CAS instance option.
    cas_addr = os.environ.get('RUN_ISOLATED_CAS_ADDRESS')
    if not cas_addr:
      cmd += ['-cas-instance', cas_instance]
    else:
      cmd += ['-cas-addr', cas_addr]

    if sys.platform.startswith('linux'):
      # TODO(crbug.com/1243194): remove this after investigation.
      cmd += ['-log-level', 'debug']

    began = time.time()
    _run_go_cmd_and_wait(cmd, tmp_dir)

    # The digest file content is "<hash>/<size in bytes>".
    with open(digest_path) as digest_file:
      raw_digest = digest_file.read()
    digest_hash, digest_size = raw_digest.split('/')
    cas_output_root = {
        'cas_instance': cas_instance,
        'digest': {
            'hash': digest_hash,
            'size_bytes': int(digest_size),
        },
    }

    with open(stats_json_path) as stats_file:
      stats = json.load(stats_file)
    stats['duration'] = time.time() - began

    return cas_output_root, stats
  finally:
    fs.remove(digest_path)
    fs.remove(stats_json_path)
764
765
def map_and_run(data, constant_run_path):
  """Runs a command with optional isolated input/output.

  Creates the run, output, temporary and cas client directories under
  data.root_dir, installs packages, fetches the CAS input tree when
  data.cas_digest is set, runs the command inside the named caches, uploads
  the output directory and finally removes the directories it created (unless
  data.leak_temp_dir is set).

  Arguments:
  - data: TaskData instance.
  - constant_run_path: if true, the run directory is always
        <data.root_dir>/ISOLATED_RUN_DIR and is recreated from scratch;
        otherwise a new temporary directory is created under data.root_dir.

  Returns metadata about the result as a dict with the keys 'duration',
  'exit_code', 'had_hard_timeout', 'internal_failure', 'stats', 'outputs_ref',
  'cas_output_root' and 'version', plus 'cipd_pins' when the package installer
  yields CIPD information. Exceptions raised while running are caught and
  reported through 'internal_failure' instead of being propagated.
  """

  # TODO(tikuta): take stats from state.json in this case too.
  download_stats = {
      # 'duration': 0.,
      # 'initial_number_items': len(data.cas_cache),
      # 'initial_size': data.cas_cache.total_size,
      # 'items_cold': '<large.pack()>',
      # 'items_hot': '<large.pack()>',
  }

  result = {
      'duration': None,
      'exit_code': None,
      'had_hard_timeout': False,
      'internal_failure': 'run_isolated did not complete properly',
      'stats': {
          'trim_caches': {
              'duration': 0,
          },
          #'cipd': {
          #  'duration': 0.,
          #  'get_client_duration': 0.,
          #},
          'isolated': {
              'download': download_stats,
              #'upload': {
              #  'duration': 0.,
              #  'items_cold': '<large.pack()>',
              #  'items_hot': '<large.pack()>',
              #},
          },
          'named_caches': {
              'install': {
                  'duration': 0,
              },
              'uninstall': {
                  'duration': 0,
              },
          },
          'cleanup': {
              'duration': 0,
          }
      },
      #'cipd_pins': {
      #  'packages': [
      #    {'package_name': ..., 'version': ..., 'path': ...},
      #    ...
      #  ],
      #  'client_package': {'package_name': ..., 'version': ...},
      #},
      'outputs_ref': None,
      'cas_output_root': None,
      'version': 5,
  }

  assert os.path.isabs(data.root_dir), ("data.root_dir is not abs path: %s" %
                                        data.root_dir)
  file_path.ensure_tree(data.root_dir, 0o700)

  # See comment for these constants.
  # TODO(maruel): This is not obvious. Change this to become an error once we
  # make the constant_run_path an exposed flag.
  if constant_run_path and data.root_dir:
    run_dir = os.path.join(data.root_dir, ISOLATED_RUN_DIR)
    if os.path.isdir(run_dir):
      file_path.rmtree(run_dir)
    os.mkdir(run_dir, 0o700)
  else:
    run_dir = make_temp_dir(ISOLATED_RUN_DIR, data.root_dir)

  # True if CAS is used for download/upload files.
  use_cas = bool(data.cas_digest)

  # The output directory is only created when CAS is used; out_dir stays None
  # otherwise and nothing is uploaded.
  out_dir = None
  if use_cas:
    out_dir = make_temp_dir(ISOLATED_OUT_DIR, data.root_dir)
  tmp_dir = make_temp_dir(ISOLATED_TMP_DIR, data.root_dir)
  cwd = run_dir
  if data.relative_cwd:
    cwd = os.path.normpath(os.path.join(cwd, data.relative_cwd))
  command = data.command

  cas_client = None
  cas_client_dir = make_temp_dir(_CAS_CLIENT_DIR, data.root_dir)
  if use_cas:
    cas_client = os.path.join(cas_client_dir, 'cas' + cipd.EXECUTABLE_SUFFIX)

  data.trim_caches_fn(result['stats']['trim_caches'])

  nsjail_dir = None
  if (sys.platform == "linux" and cipd.get_platform() == "amd64" and
      data.containment.containment_type == subprocess42.Containment.NSJAIL):
    nsjail_dir = make_temp_dir(_NSJAIL_DIR, data.root_dir)

  try:
    with data.install_packages_fn(run_dir, cas_client_dir,
                                  nsjail_dir) as cipd_info:
      if cipd_info:
        result['stats']['cipd'] = cipd_info.stats
        result['cipd_pins'] = cipd_info.pins

      isolated_stats = result['stats'].setdefault('isolated', {})

      if data.cas_digest:
        stats = _fetch_and_map(
            cas_client=cas_client,
            digest=data.cas_digest,
            instance=data.cas_instance,
            output_dir=run_dir,
            cache_dir=data.cas_cache_dir,
            policies=data.cas_cache_policies,
            kvs_dir=data.cas_kvs,
            tmp_dir=tmp_dir)
        isolated_stats['download'].update(stats)

      if not command:
        # Handle this as a task failure, not an internal failure.
        # NOTE(review): result['internal_failure'] still holds its initial
        # placeholder on this early return; confirm that is intended.
        sys.stderr.write(
            '<No command was specified!>\n'
            '<Please secify a command when triggering your Swarming task>\n')
        result['exit_code'] = 1
        return result

      # Compare on a path component boundary: a bare string prefix test would
      # also accept a sibling directory such as '<run_dir>_other'.
      run_dir_prefix = os.path.join(run_dir, '')
      if cwd != run_dir and not cwd.startswith(run_dir_prefix):
        # Handle this as a task failure, not an internal failure. This is a
        # 'last chance' way to gate against directory escape.
        sys.stderr.write('<Relative CWD is outside of run directory!>\n')
        result['exit_code'] = 1
        return result

      if not os.path.isdir(cwd):
        # Accepts relative_cwd that does not exist.
        os.makedirs(cwd, 0o700)

      # If we have an explicit list of files to return, make sure their
      # directories exist now.
      if data.outputs:
        file_path.create_directories(run_dir, data.outputs)

      with data.install_named_caches(run_dir, result['stats']['named_caches']):
        sys.stdout.flush()
        start = time.time()
        try:
          # Need to switch the default account before 'get_command_env' call,
          # so it can grab correct value of LUCI_CONTEXT env var.
          with set_luci_context_account(data.switch_to_account, tmp_dir):
            env = get_command_env(
                tmp_dir, cipd_info, run_dir, data.env, data.env_prefix, out_dir,
                data.bot_file)
            command = tools.find_executable(command, env)
            command = process_command(command, out_dir, data.bot_file)
            file_path.ensure_command_has_abs_path(command, cwd)

            result['exit_code'], result['had_hard_timeout'] = run_command(
                command, cwd, env, data.hard_timeout, data.grace_period,
                data.lower_priority, data.containment)
        finally:
          # Recorded even when running the command raised.
          result['duration'] = max(time.time() - start, 0)

      if out_dir:
        # Try to link files to the output directory, if specified.
        link_outputs_to_outdir(run_dir, out_dir, data.outputs)
        if use_cas:
          result['cas_output_root'], isolated_stats['upload'] = (
              upload_outdir(cas_client, data.cas_instance, out_dir,
                            tmp_dir))

      # We successfully ran the command, set internal_failure back to
      # None (even if the command failed, it's not an internal error).
      result['internal_failure'] = None
  except Exception as e:
    # An internal error occurred. Report accordingly so the swarming task will
    # be retried automatically.
    logging.exception('internal failure: %s', e)
    result['internal_failure'] = str(e)
    on_error.report(None)

  # Clean up
  finally:
    try:
      cleanup_start = time.time()
      success = True
      if data.leak_temp_dir:
        logging.warning(
            'Deliberately leaking %s for later examination', run_dir)
      else:
        # run_dir is removed first. On Windows rmtree(run_dir) has a
        # synchronization effect: it finishes only when all task child
        # processes terminate (since a running process locks *.exe file).
        # out_dir is handled only after that call completes (since child
        # processes may write to out_dir too and we need to wait for them to
        # finish).
        # NOTE(review): nsjail_dir is not part of this list; confirm whether
        # leaving it behind is intended.
        dirs_to_remove = [run_dir, tmp_dir, cas_client_dir]
        if out_dir:
          dirs_to_remove.append(out_dir)
        for directory in dirs_to_remove:
          if not fs.isdir(directory):
            continue
          start = time.time()
          # Tracked per directory so that one failure does not make every
          # following directory look like it failed too.
          removed = True
          try:
            file_path.rmtree(directory)
          except OSError as e:
            logging.error('rmtree(%r) failed: %s', directory, e)
            removed = False
            success = False
          finally:
            logging.info('Cleanup: rmtree(%r) took %d seconds', directory,
                         time.time() - start)
          if not removed:
            sys.stderr.write(
                OUTLIVING_ZOMBIE_MSG % (directory, data.grace_period))
            # Dump the process list to help find what still holds the files.
            if sys.platform == 'win32':
              subprocess42.check_call(['tasklist.exe', '/V'], stdout=sys.stderr)
            else:
              subprocess42.check_call(['ps', 'axu'], stdout=sys.stderr)
            if result['exit_code'] == 0:
              result['exit_code'] = 1

      if not success and result['exit_code'] == 0:
        result['exit_code'] = 1
    except Exception as e:
      # Swallow any exception in the main finally clause.
      if out_dir:
        logging.exception('Leaking out_dir %s: %s', out_dir, e)
      result['internal_failure'] = str(e)
      on_error.report(None)
    finally:
      cleanup_duration = time.time() - cleanup_start
      result['stats']['cleanup']['duration'] = cleanup_duration
      logging.info('Cleanup: removing directories took %d seconds',
                   cleanup_duration)
  return result
Marc-Antoine Ruel2283ad12014-02-09 11:14:57 -05001009
1010
def run_tha_test(data, result_json):
  """Runs the task through map_and_run() and reports its metadata.

  When |result_json| is set, a placeholder result is written to it before the
  run starts, and the real result replaces it once map_and_run() returns.
  Otherwise, if the result carries an 'outputs_ref', it is printed on stdout
  wrapped in [run_isolated_out_hack] markers.

  Arguments:
  - data: TaskData instance.
  - result_json: File path to dump result metadata into. If set, the process
        exit code is always 0 unless an internal error occurred.

  Returns:
    Process exit code that should be used.
  """
  if result_json:
    # Write a json output file right away in case we get killed.
    tools.write_json(
        result_json,
        {
            'exit_code': None,
            'had_hard_timeout': False,
            'internal_failure': 'Was terminated before completion',
            'outputs_ref': None,
            'cas_output_root': None,
            'version': 5,
        },
        dense=True)

  # run_isolated exit code. Depends on if result_json is used or not.
  result = map_and_run(data, True)
  logging.info('Result:\n%s', tools.format_json(result, dense=True))

  if not result_json:
    # Marshall into old-style inline output.
    if result['outputs_ref']:
      # pylint: disable=unsubscriptable-object
      outputs_ref = result['outputs_ref']
      inline = {
          'hash': outputs_ref['isolated'],
          'namespace': outputs_ref['namespace'],
          'storage': outputs_ref['isolatedserver'],
      }
      sys.stdout.flush()
      print('[run_isolated_out_hack]%s[/run_isolated_out_hack]' %
            tools.format_json(inline, dense=True))
      sys.stdout.flush()
    return result['exit_code'] or int(bool(result['internal_failure']))

  # We've found tests to delete 'work' when quitting, causing an exception
  # here. Try to recreate the directory if necessary.
  file_path.ensure_tree(os.path.dirname(result_json))
  tools.write_json(result_json, result, dense=True)
  # Only return 1 if there was an internal error.
  return int(bool(result['internal_failure']))
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001067
1068
# Yielded by 'install_client_and_packages'. Fields, in order:
#   client: cipd.CipdClient object.
#   cache_dir: absolute path to bot-global cipd tag and instance cache.
#   stats: dict with stats to return to the server.
#   pins: dict with installed cipd pins to return to the server.
CipdInfo = collections.namedtuple(
    'CipdInfo', ('client', 'cache_dir', 'stats', 'pins'))
1076
1077
@contextlib.contextmanager
def copy_local_packages(_run_dir, cas_dir, _nsjail_dir):
  """Copies the cas client from a local luci-go build instead of using CIPD.

  The client is taken from the directory named by the LUCI_GO_CLIENT_DIR
  environment variable and copied into |cas_dir|. The other arguments are
  unused. Yields None, i.e. no CIPD information.
  """
  go_client_dir = os.environ.get('LUCI_GO_CLIENT_DIR')
  assert go_client_dir, ('Please set LUCI_GO_CLIENT_DIR env var to install CIPD'
                         ' packages locally.')
  cas_binary = 'cas' + cipd.EXECUTABLE_SUFFIX
  source = os.path.join(go_client_dir, cas_binary)
  destination = os.path.join(cas_dir, cas_binary)
  shutil.copy2(source, destination)
  yield None
1087
1088
def _install_packages(run_dir, cipd_cache_dir, client, packages):
  """Runs 'cipd ensure' for |packages| and returns the resolved pins.

  Args:
    run_dir (str): root of installation.
    cipd_cache_dir (str): the directory to use for the cipd package cache.
    client (CipdClient): the cipd client to use
    packages: packages to install, list [(path, package_name, version), ...].

  Returns: list of pinned packages, in the same order as |packages|. Looks
  like [
    {
      'path': 'subdirectory',
      'package_name': 'resolved/package/name',
      'version': 'deadbeef...',
    },
    ...
  ]
  """
  # Group the requests per subdirectory, remembering where each one sat in
  # |packages| so that its pin can be put back at the same position.
  grouped = collections.defaultdict(list)
  for index, (path, name, version) in enumerate(packages):
    # cipd deals with 'root' as ''
    subdir = '' if path == '.' else path
    grouped[subdir].append((name, version, index))

  requested = {}
  for subdir, entries in grouped.items():
    requested[subdir] = [(name, version) for name, version, _ in entries]

  pins = client.ensure(run_dir, requested, cache_dir=cipd_cache_dir)

  package_pins = [None] * len(packages)
  for subdir, pin_list in sorted(pins.items()):
    entries = grouped[subdir]
    for position, (name, version) in enumerate(pin_list):
      original_index = entries[position][2]
      package_pins[original_index] = {
          'package_name': name,
          # swarming deals with 'root' as '.'
          'path': subdir or '.',
          'version': version,
      }

  assert None not in package_pins, (packages, pins, package_pins)

  return package_pins
1140
1141
@contextlib.contextmanager
def install_client_and_packages(run_dir, packages, service_url,
                                client_package_name, client_version, cache_dir,
                                cas_dir, nsjail_dir):
  """Bootstraps the CIPD client and installs CIPD packages.

  Yields a single CipdInfo object holding the CIPD client, the cipd cache
  directory, timing stats and the pins.

  The pins are a dict with two entries:
    'packages': list with one item per entry of |packages|, in the same order:
      [
        {
          "path": path, "package_name": package_name, "version": version,
        },
        ...
      ]
    'client_package': a single dictionary with the package name and version
      of the CIPD client itself.

  If the 'packages' list is empty, the CIPD client is still bootstrapped and
  the cas client (and nsjail, when requested) is still installed, but no task
  packages are installed.

  Args:
    run_dir (str): root of installation.
    packages: packages to install, list [(path, package_name, version), ...].
    service_url (str): CIPD server url, e.g.
      "https://chrome-infra-packages.appspot.com."
    client_package_name (str): CIPD package name of CIPD client.
    client_version (str): Version of CIPD client.
    cache_dir (str): where to keep cache of cipd clients, packages and tags.
    cas_dir (str): where to download cas client.
    nsjail_dir (str): where to download nsjail. If set to None, nsjail is not
      downloaded.
  """
  assert cache_dir

  overall_start = time.time()

  cache_dir = os.path.abspath(cache_dir)
  # Tag and instance caches.
  cipd_cache_dir = os.path.join(cache_dir, 'cache')
  run_dir = os.path.abspath(run_dir)
  if not packages:
    packages = []

  client_start = time.time()
  client_manager = cipd.get_client(cache_dir, service_url, client_package_name,
                                   client_version)

  with client_manager as client:
    get_client_duration = time.time() - client_start

    if packages:
      package_pins = _install_packages(run_dir, cipd_cache_dir, client,
                                       packages)
    else:
      package_pins = []

    # Install cas client to |cas_dir|.
    cas_packages = [('', _CAS_PACKAGE, _LUCI_GO_REVISION)]
    _install_packages(cas_dir, cipd_cache_dir, client, cas_packages)

    # Install nsjail to |nsjail_dir|.
    if nsjail_dir is not None:
      nsjail_packages = [('', _NSJAIL_PACKAGE, _NSJAIL_VERSION)]
      _install_packages(nsjail_dir, cipd_cache_dir, client, nsjail_packages)

    file_path.make_tree_files_read_only(run_dir)

    total_duration = time.time() - overall_start
    logging.info('Installing CIPD client and packages took %d seconds',
                 total_duration)

    stats = {
        'duration': total_duration,
        'get_client_duration': get_client_duration,
    }
    pins = {
        'client_package': {
            'package_name': client.package_name,
            'version': client.instance_id,
        },
        'packages': package_pins,
    }
    yield CipdInfo(
        client=client, cache_dir=cipd_cache_dir, stats=stats, pins=pins)
nodirbe642ff2016-06-09 15:51:51 -07001231
1232
1233def create_option_parser():
Marc-Antoine Ruelf74cffe2015-07-15 15:21:34 -04001234 parser = logging_utils.OptionParserWithLogging(
nodir55be77b2016-05-03 09:39:57 -07001235 usage='%prog <options> [command to run or extra args]',
maruel@chromium.orgdedbf492013-09-12 20:42:11 +00001236 version=__version__,
1237 log_file=RUN_ISOLATED_LOG_FILE)
maruela9cfd6f2015-09-15 11:03:15 -07001238 parser.add_option(
Junji Watanabe38b28b02020-04-23 10:23:30 +00001239 '--clean',
1240 action='store_true',
maruel36a963d2016-04-08 17:15:49 -07001241 help='Cleans the cache, trimming it necessary and remove corrupted items '
Junji Watanabe38b28b02020-04-23 10:23:30 +00001242 'and returns without executing anything; use with -v to know what '
1243 'was done')
maruel36a963d2016-04-08 17:15:49 -07001244 parser.add_option(
maruela9cfd6f2015-09-15 11:03:15 -07001245 '--json',
1246 help='dump output metadata to json file. When used, run_isolated returns '
Junji Watanabe38b28b02020-04-23 10:23:30 +00001247 'non-zero only on internal failure')
maruel6be7f9e2015-10-01 12:25:30 -07001248 parser.add_option(
maruel5c9e47b2015-12-18 13:02:30 -08001249 '--hard-timeout', type='float', help='Enforce hard timeout in execution')
maruel6be7f9e2015-10-01 12:25:30 -07001250 parser.add_option(
Junji Watanabe38b28b02020-04-23 10:23:30 +00001251 '--grace-period',
1252 type='float',
maruel6be7f9e2015-10-01 12:25:30 -07001253 help='Grace period between SIGTERM and SIGKILL')
bpastene3ae09522016-06-10 17:12:59 -07001254 parser.add_option(
Marc-Antoine Ruel95068cf2017-12-07 21:35:05 -05001255 '--relative-cwd',
Takuto Ikuta18ca29a2020-12-04 07:34:20 +00001256 help='Ignore the isolated \'relative_cwd\' and use this one instead')
Marc-Antoine Ruel95068cf2017-12-07 21:35:05 -05001257 parser.add_option(
Junji Watanabe38b28b02020-04-23 10:23:30 +00001258 '--env',
1259 default=[],
1260 action='append',
Marc-Antoine Ruel19dd8872017-11-28 18:33:39 -05001261 help='Environment variables to set for the child process')
1262 parser.add_option(
Junji Watanabe38b28b02020-04-23 10:23:30 +00001263 '--env-prefix',
1264 default=[],
1265 action='append',
Robert Iannuccibf5f84c2017-11-22 12:56:50 -08001266 help='Specify a VAR=./path/fragment to put in the environment variable '
Junji Watanabe38b28b02020-04-23 10:23:30 +00001267 'before executing the command. The path fragment must be relative '
1268 'to the isolated run directory, and must not contain a `..` token. '
1269 'The path will be made absolute and prepended to the indicated '
1270 '$VAR using the OS\'s path separator. Multiple items for the same '
1271 '$VAR will be prepended in order.')
Robert Iannuccibf5f84c2017-11-22 12:56:50 -08001272 parser.add_option(
bpastene3ae09522016-06-10 17:12:59 -07001273 '--bot-file',
1274 help='Path to a file describing the state of the host. The content is '
Junji Watanabe38b28b02020-04-23 10:23:30 +00001275 'defined by on_before_task() in bot_config.')
aludwin7556e0c2016-10-26 08:46:10 -07001276 parser.add_option(
vadimsh9c54b2c2017-07-25 14:08:29 -07001277 '--switch-to-account',
1278 help='If given, switches LUCI_CONTEXT to given logical service account '
Junji Watanabe38b28b02020-04-23 10:23:30 +00001279 '(e.g. "task" or "system") before launching the isolated process.')
vadimsh9c54b2c2017-07-25 14:08:29 -07001280 parser.add_option(
Junji Watanabe38b28b02020-04-23 10:23:30 +00001281 '--output',
1282 action='append',
aludwin0a8e17d2016-10-27 15:57:39 -07001283 help='Specifies an output to return. If no outputs are specified, all '
Junji Watanabe38b28b02020-04-23 10:23:30 +00001284 'files located in $(ISOLATED_OUTDIR) will be returned; '
1285 'otherwise, outputs in both $(ISOLATED_OUTDIR) and those '
1286 'specified by --output option (there can be multiple) will be '
1287 'returned. Note that if a file in OUT_DIR has the same path '
1288 'as an --output option, the --output version will be returned.')
aludwin0a8e17d2016-10-27 15:57:39 -07001289 parser.add_option(
Junji Watanabe38b28b02020-04-23 10:23:30 +00001290 '-a',
1291 '--argsfile',
aludwin7556e0c2016-10-26 08:46:10 -07001292 # This is actually handled in parse_args; it's included here purely so it
1293 # can make it into the help text.
1294 help='Specify a file containing a JSON array of arguments to this '
Junji Watanabe38b28b02020-04-23 10:23:30 +00001295 'script. If --argsfile is provided, no other argument may be '
1296 'provided on the command line.')
Takuto Ikutad4be2f12020-05-12 02:15:25 +00001297 parser.add_option(
1298 '--report-on-exception',
1299 action='store_true',
1300 help='Whether report exception during execution to isolate server. '
1301 'This flag should only be used in swarming bot.')
Marc-Antoine Ruel1b65f4e2019-05-02 21:56:58 +00001302
Junji Watanabe4b890ef2020-09-16 01:43:27 +00001303 group = optparse.OptionGroup(parser,
1304 'Data source - Content Addressed Storage')
Junji Watanabe54925c32020-09-08 00:56:18 +00001305 group.add_option(
1306 '--cas-instance', help='Full CAS instance name for input/output files.')
1307 group.add_option(
1308 '--cas-digest',
1309 help='Digest of the input root on RBE-CAS. The format is '
1310 '`{hash}/{size_bytes}`.')
Marc-Antoine Ruel1b65f4e2019-05-02 21:56:58 +00001311 parser.add_option_group(group)
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001312
Junji Watanabeb03450b2020-09-25 05:09:27 +00001313 # Cache options.
Junji Watanabeb03450b2020-09-25 05:09:27 +00001314 add_cas_cache_options(parser)
nodirbe642ff2016-06-09 15:51:51 -07001315
1316 cipd.add_cipd_options(parser)
Marc-Antoine Ruel8b11dbd2018-05-18 14:31:22 -04001317
1318 group = optparse.OptionGroup(parser, 'Named caches')
1319 group.add_option(
1320 '--named-cache',
1321 dest='named_caches',
1322 action='append',
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001323 nargs=3,
Marc-Antoine Ruel8b11dbd2018-05-18 14:31:22 -04001324 default=[],
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001325 help='A named cache to request. Accepts 3 arguments: name, path, hint. '
Junji Watanabe38b28b02020-04-23 10:23:30 +00001326 'name identifies the cache, must match regex [a-z0-9_]{1,4096}. '
1327 'path is a path relative to the run dir where the cache directory '
1328 'must be put to. '
1329 'This option can be specified more than once.')
Marc-Antoine Ruel8b11dbd2018-05-18 14:31:22 -04001330 group.add_option(
Junji Watanabe38b28b02020-04-23 10:23:30 +00001331 '--named-cache-root',
1332 default='named_caches',
Marc-Antoine Ruel8b11dbd2018-05-18 14:31:22 -04001333 help='Cache root directory. Default=%default')
1334 parser.add_option_group(group)
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001335
Marc-Antoine Ruel1b65f4e2019-05-02 21:56:58 +00001336 group = optparse.OptionGroup(parser, 'Process containment')
1337 parser.add_option(
1338 '--lower-priority', action='store_true',
1339 help='Lowers the child process priority')
1340 parser.add_option(
Junji Watanabe38b28b02020-04-23 10:23:30 +00001341 '--containment-type',
Anirudh Mathukumilli92d57b62021-08-04 23:21:57 +00001342 choices=('NONE', 'AUTO', 'JOB_OBJECT', 'NSJAIL'),
Marc-Antoine Ruel1b65f4e2019-05-02 21:56:58 +00001343 default='NONE',
1344 help='Type of container to use')
1345 parser.add_option(
Junji Watanabe38b28b02020-04-23 10:23:30 +00001346 '--limit-processes',
1347 type='int',
1348 default=0,
Marc-Antoine Ruel1b65f4e2019-05-02 21:56:58 +00001349 help='Maximum number of active processes in the containment')
1350 parser.add_option(
Junji Watanabe38b28b02020-04-23 10:23:30 +00001351 '--limit-total-committed-memory',
1352 type='int',
1353 default=0,
Marc-Antoine Ruel1b65f4e2019-05-02 21:56:58 +00001354 help='Maximum sum of committed memory in the containment')
1355 parser.add_option_group(group)
1356
1357 group = optparse.OptionGroup(parser, 'Debugging')
1358 group.add_option(
Kenneth Russell61d42352014-09-15 11:41:16 -07001359 '--leak-temp-dir',
1360 action='store_true',
nodirbe642ff2016-06-09 15:51:51 -07001361 help='Deliberately leak isolate\'s temp dir for later examination. '
Junji Watanabe38b28b02020-04-23 10:23:30 +00001362 'Default: %default')
1363 group.add_option('--root-dir', help='Use a directory instead of a random one')
Marc-Antoine Ruel1b65f4e2019-05-02 21:56:58 +00001364 parser.add_option_group(group)
Kenneth Russell61d42352014-09-15 11:41:16 -07001365
Vadim Shtayurae34e13a2014-02-02 11:23:26 -08001366 auth.add_auth_options(parser)
nodirbe642ff2016-06-09 15:51:51 -07001367
Ye Kuang1d096cb2020-06-26 08:38:21 +00001368 parser.set_defaults(cache='cache')
nodirbe642ff2016-06-09 15:51:51 -07001369 return parser
1370
1371
def add_cas_cache_options(parser):
  """Registers the 'CAS cache management' option group on |parser|.

  The group carries, in this order: --cas-cache, --kvs-dir, --max-cache-size
  and --min-free-space.
  """
  gib = 1024 * 1024 * 1024
  # (flag, keyword arguments) pairs, kept in the order they are registered.
  option_specs = (
      ('--cas-cache', {
          'metavar': 'DIR',
          'default': 'cas-cache',
          'help': (
              'Directory to keep a local cache of the files. Accelerates download '
              'by reusing already downloaded files. Default=%default'),
      }),
      ('--kvs-dir', {
          'default': '',
          'help': 'CAS cache dir using kvs for small files. Default=%default',
      }),
      ('--max-cache-size', {
          'type': 'int',
          'metavar': 'NNN',
          'default': 50 * gib,
          'help': (
              'Trim if the cache gets larger than this value, default=%default'),
      }),
      ('--min-free-space', {
          'type': 'int',
          'metavar': 'NNN',
          'default': 2 * gib,
          'help': (
              'Trim if disk free space becomes lower than this value, '
              'default=%default'),
      }),
  )
  cas_group = optparse.OptionGroup(parser, 'CAS cache management')
  for flag, kwargs in option_specs:
    cas_group.add_option(flag, **kwargs)
  parser.add_option_group(cas_group)
1398
1399
def process_cas_cache_options(options):
  """Builds the content addressed cache described by |options|.

  Returns a local_caching.MemoryContentAddressedCache when --cas-cache is
  empty. Otherwise returns a local_caching.DiskContentAddressedCache located at
  the absolute path of --cas-cache, created with trim=False.
  """
  if not options.cas_cache:
    return local_caching.MemoryContentAddressedCache()

  cache_policies = local_caching.CachePolicies(
      max_cache_size=options.max_cache_size,
      min_free_space=options.min_free_space,
      # max_items isn't used for CAS cache for now.
      max_items=None,
      max_age_secs=MAX_AGE_SECS)
  cache_dir = six.text_type(os.path.abspath(options.cas_cache))
  return local_caching.DiskContentAddressedCache(
      cache_dir, cache_policies, trim=False)
1412
1413
def process_named_cache_options(parser, options, time_fn=None):
  """Checks the named cache flags and returns the matching NamedCache.

  parser.error() is called when --named-cache is given without
  --named-cache-root, when a cache name does not match CACHE_NAME_RE, when a
  cache path is empty or when a hint cannot be converted with int().

  Returns None when --named-cache-root is empty.
  """
  requested = options.named_caches
  cache_root = options.named_cache_root
  if requested and not cache_root:
    parser.error('--named-cache is specified, but --named-cache-root is empty')

  for cache_name, cache_path, cache_hint in requested:
    if CACHE_NAME_RE.match(cache_name) is None:
      parser.error(
          'cache name %r does not match %r' %
          (cache_name, CACHE_NAME_RE.pattern))
    if not cache_path:
      parser.error('cache path cannot be empty')
    try:
      int(cache_hint)
    except ValueError:
      parser.error('cache hint must be a number')

  if not cache_root:
    return None

  # Make these configurable later if there is use case but for now it's fairly
  # safe values.
  # In practice, a fair chunk of bots are already recycled on a daily schedule
  # so this code doesn't have any effect to them, unless they are preloaded
  # with a really old cache.
  one_tib = 1024*1024*1024*1024
  cache_policies = local_caching.CachePolicies(
      max_cache_size=one_tib,
      min_free_space=options.min_free_space,
      max_items=50,
      max_age_secs=MAX_AGE_SECS)
  abs_root = six.text_type(os.path.abspath(cache_root))
  named_cache = local_caching.NamedCache(
      abs_root, cache_policies, time_fn=time_fn)
  # Touch any named caches we're going to use to minimize thrashing
  # between tasks that request some (but not all) of the same named caches.
  names_in_use = [entry[0] for entry in requested]
  named_cache.touch(*names_in_use)
  return named_cache
1447
1448
def parse_args(args):
  """Parses the command line, expanding --argsfile when it is given.

  Args:
    args: list of command line arguments, without the program name.

  Returns:
    A (parser, options, args) tuple: the parser built by
    create_option_parser(), the parsed options and the remaining positional
    arguments.
  """
  # Create a fake mini-parser just to get out the "-a" command. Note that
  # it's not documented here; instead, it's documented in create_option_parser
  # even though that parser will never actually get to parse it. This is
  # because --argsfile is exclusive with all other options and arguments.
  file_argparse = argparse.ArgumentParser(add_help=False)
  file_argparse.add_argument('-a', '--argsfile')
  (file_args, nonfile_args) = file_argparse.parse_known_args(args)
  if file_args.argsfile:
    if nonfile_args:
      # The trailing space matters: the two literals are concatenated.
      file_argparse.error('Can\'t specify --argsfile with '
                          'any other arguments (%s)' % nonfile_args)
    try:
      with open(file_args.argsfile, 'r') as f:
        args = json.load(f)
    except (IOError, OSError, ValueError) as e:
      # We don't error out here: "args" keeps the value it was called with and
      # is handed to the normal parser below, which reports whatever is wrong
      # with it.
      print('Couldn\'t read arguments: %s' % e, file=sys.stderr)

  # Even if we failed to read the args, just call the normal parser now since it
  # will print the correct help message.
  parser = create_option_parser()
  options, args = parser.parse_args(args)
  # The value may come in as a string (e.g. 'true'/'false'); normalize it.
  if not isinstance(options.cipd_enabled, (bool, int)):
    options.cipd_enabled = distutils.util.strtobool(options.cipd_enabled)
  return (parser, options, args)
1477
1478
def _calc_named_cache_hint(named_cache, named_caches):
  """Returns the expected size of the missing named caches.

  Args:
    named_cache: object whose `available` attribute holds the names of the
      caches already present, or None when no named cache is configured
      (process_named_cache_options() returns None for an empty
      --named-cache-root).
    named_caches: iterable of (name, path, hint) tuples; hint is anything
      int() accepts.

  Returns:
    The sum of the strictly positive hints of the requested caches whose name
    is not in named_cache.available. 0 when named_cache is None.
  """
  if named_cache is None:
    # Nothing can be installed without a named cache, so there is nothing to
    # reserve space for; also avoids an AttributeError on None.
    return 0
  present = named_cache.available
  size = 0
  logging.info('available named cache %s', present)
  for name, _, hint in named_caches:
    if name not in present:
      hint = int(hint)
      if hint > 0:
        logging.info("named cache hint: %s, %d", name, hint)
        size += hint
  logging.info("total size of named cache hint: %d", size)
  return size
1492
1493
def _clean_cmd(parser, options, caches, root):
  """Cleanup cache dirs/files.

  Args:
    parser: option parser; parser.error() is called when --clean is combined
      with --json, --named-cache, --cas-instance or --cas-digest.
    options: parsed options; json, named_caches, cas_instance, cas_digest,
      kvs_dir and min_free_space are read.
    caches: list of cache objects, handed to local_caching.trim_caches() and
      then each one gets cleanup() called.
    root: path whose free space is logged and that is passed to
      local_caching.trim_caches().
  """
  if options.json:
    parser.error('Can\'t use --json with --clean.')
  if options.named_caches:
    parser.error('Can\'t use --named-cache with --clean.')
  if options.cas_instance or options.cas_digest:
    parser.error('Can\'t use --cas-instance, --cas-digest with --clean.')

  logging.info("initial free space: %d", file_path.get_free_space(root))

  if options.kvs_dir and fs.isdir(six.text_type(options.kvs_dir)):
    # Remove kvs file if its size exceeds fixed threshold.
    kvs_dir = six.text_type(options.kvs_dir)
    size = file_path.get_recursive_size(kvs_dir)
    if size >= _CAS_KVS_CACHE_THRESHOLD:
      logging.info("remove kvs dir with size: %d", size)
      file_path.rmtree(kvs_dir)

  # Trim first, then clean.
  local_caching.trim_caches(
      caches,
      root,
      min_free_space=options.min_free_space,
      max_age_secs=MAX_AGE_SECS)
  logging.info("free space after trim: %d", file_path.get_free_space(root))
  for c in caches:
    c.cleanup()
  logging.info("free space after cleanup: %d", file_path.get_free_space(root))
1523
1524
def main(args):
  """Parses |args|, prepares the caches and runs the requested command.

  Args:
    args: list of command line arguments, without the program name.

  Returns:
    The process exit code: 0 once --clean completed, 1 when a cipd.Error,
    local_caching.NamedCacheError or local_caching.NoMoreSpace is caught while
    running the task, otherwise the value returned by run_tha_test().
  """
  # Warning: when --argsfile is used, the strings are unicode instances, when
  # parsed normally, the strings are str instances.
  (parser, options, args) = parse_args(args)

  # Must be logged after parse_args(), which eventually calls
  # logging_utils.prepare_logging() which expects no logs before its call.
  logging.info('Starting run_isolated script')

  SWARMING_SERVER = os.environ.get('SWARMING_SERVER')
  SWARMING_TASK_ID = os.environ.get('SWARMING_TASK_ID')
  if options.report_on_exception and SWARMING_SERVER:
    task_url = None
    if SWARMING_TASK_ID:
      task_url = '%s/task?id=%s' % (SWARMING_SERVER, SWARMING_TASK_ID)
    on_error.report_on_exception_exit(SWARMING_SERVER, source=task_url)

  if not file_path.enable_symlink():
    logging.warning('Symlink support is not enabled')

  named_cache = process_named_cache_options(parser, options)
  # hint is 0 if there's no named cache.
  hint = _calc_named_cache_hint(named_cache, options.named_caches)
  if hint:
    # Increase the --min-free-space value by the hint, and recreate the
    # NamedCache instance so it gets the updated CachePolicy.
    options.min_free_space += hint
    named_cache = process_named_cache_options(parser, options)

  # TODO(maruel): CIPD caches should be defined at a higher level here too, so
  # they can be cleaned the same way.

  cas_cache = process_cas_cache_options(options)

  caches = []
  if cas_cache:
    caches.append(cas_cache)
  if named_cache:
    caches.append(named_cache)
  root = caches[0].cache_dir if caches else six.text_type(os.getcwd())
  if options.clean:
    _clean_cmd(parser, options, caches, root)
    return 0

  # Trim must still be done for the following case:
  # - named-cache was used
  # - some entries, with a large hint, were missing
  # - --min-free-space was increased accordingly, thus trimming is needed
  # Otherwise, this will have no effect, as bot_main calls run_isolated with
  # --clean after each task.
  additional_buffer = _FREE_SPACE_BUFFER_FOR_CIPD_PACKAGES
  if options.kvs_dir:
    additional_buffer += _CAS_KVS_CACHE_THRESHOLD
  # Add some buffer for Go CLI.
  min_free_space = options.min_free_space + additional_buffer

  def trim_caches_fn(stats):
    # Trims |caches| and records how long it took in stats['duration'].
    start = time.time()
    local_caching.trim_caches(
        caches, root, min_free_space=min_free_space, max_age_secs=MAX_AGE_SECS)
    duration = time.time() - start
    stats['duration'] = duration
    logging.info('trim_caches: took %d seconds', duration)

  # Save state of cas cache not to overwrite state from go client.
  if cas_cache:
    cas_cache.save()
    cas_cache = None

  if not args:
    parser.error('command to run is required.')

  auth.process_auth_options(parser, options)

  if ISOLATED_OUTDIR_PARAMETER in args and not options.cas_instance:
    parser.error('%s in args requires --cas-instance' %
                 ISOLATED_OUTDIR_PARAMETER)

  if options.root_dir:
    options.root_dir = six.text_type(os.path.abspath(options.root_dir))
  else:
    options.root_dir = six.text_type(tempfile.mkdtemp(prefix='root'))
  if options.json:
    options.json = six.text_type(os.path.abspath(options.json))

  if any('=' not in i for i in options.env):
    parser.error(
        '--env required key=value form. value can be skipped to delete '
        'the variable')
  options.env = dict(i.split('=', 1) for i in options.env)

  # Turn the list of VAR=path items into {VAR: [path, ...]}, keeping the order
  # in which the paths were given for each VAR.
  prefixes = {}
  cwd = os.path.realpath(os.getcwd())
  for item in options.env_prefix:
    if '=' not in item:
      parser.error(
          '--env-prefix %r is malformed, must be in the form `VAR=./path`'
          % item)
    key, opath = item.split('=', 1)
    if os.path.isabs(opath):
      parser.error('--env-prefix %r path is bad, must be relative.' % opath)
    opath = os.path.normpath(opath)
    if not os.path.realpath(os.path.join(cwd, opath)).startswith(cwd):
      parser.error(
          '--env-prefix %r path is bad, must be relative and not contain `..`.'
          % opath)
    prefixes.setdefault(key, []).append(opath)
  options.env_prefix = prefixes

  cipd.validate_cipd_options(parser, options)

  install_packages_fn = copy_local_packages
  tmp_cipd_cache_dir = None
  if options.cipd_enabled:
    cache_dir = options.cipd_cache
    if not cache_dir:
      # No CIPD cache was given: use a throwaway one, removed in the finally
      # clause at the end of this function.
      tmp_cipd_cache_dir = six.text_type(tempfile.mkdtemp())
      cache_dir = tmp_cipd_cache_dir
    install_packages_fn = (
        lambda run_dir, cas_dir, nsjail_dir: install_client_and_packages(
            run_dir,
            cipd.parse_package_args(options.cipd_packages),
            options.cipd_server,
            options.cipd_client_package,
            options.cipd_client_version,
            cache_dir=cache_dir,
            cas_dir=cas_dir,
            nsjail_dir=nsjail_dir,
        ))

  @contextlib.contextmanager
  def install_named_caches(run_dir, stats):
    # WARNING: this function depends on "options" variable defined in the outer
    # function.
    assert six.text_type(run_dir), repr(run_dir)
    assert os.path.isabs(run_dir), run_dir
    named_caches = [(os.path.join(run_dir, six.text_type(relpath)), name)
                    for name, relpath, _ in options.named_caches]
    install_start = time.time()
    for path, name in named_caches:
      named_cache.install(path, name)
    install_duration = time.time() - install_start
    stats['install']['duration'] = install_duration
    logging.info('named_caches: install took %d seconds', install_duration)
    try:
      yield
    finally:
      # Uninstall each named cache, returning it to the cache pool. If an
      # uninstall fails for a given cache, it will remain in the task's
      # temporary space, get cleaned up by the Swarming bot, and be lost.
      #
      # If the Swarming bot cannot clean up the cache, it will handle it like
      # any other bot file that could not be removed.
      uninstall_start = time.time()
      for path, name in reversed(named_caches):
        try:
          # uninstall() doesn't trim but does call save() implicitly. Trimming
          # *must* be done manually via periodic 'run_isolated.py --clean'.
          named_cache.uninstall(path, name)
        except local_caching.NamedCacheError:
          if sys.platform == 'win32':
            # Show running processes.
            sys.stderr.write("running process\n")
            subprocess42.check_call(['tasklist.exe', '/V'], stdout=sys.stderr)

          # The message reads "named cache <name> at <path>", so the name goes
          # first.
          error = (
              'Error while removing named cache %r at %r. The cache will be'
              ' lost.' % (name, path))
          logging.exception(error)
          on_error.report(error)
      uninstall_duration = time.time() - uninstall_start
      stats['uninstall']['duration'] = uninstall_duration
      logging.info('named_caches: uninstall took %d seconds',
                   uninstall_duration)

  command = args
  if options.relative_cwd:
    a = os.path.normpath(os.path.abspath(options.relative_cwd))
    # NOTE(review): this is a plain string prefix comparison, so a sibling
    # directory whose name merely starts with the cwd's name also passes.
    if not a.startswith(os.getcwd()):
      parser.error(
          '--relative-cwd must not try to escape the working directory')

  containment_type = subprocess42.Containment.NONE
  if options.containment_type == 'AUTO':
    containment_type = subprocess42.Containment.AUTO
  if options.containment_type == 'JOB_OBJECT':
    containment_type = subprocess42.Containment.JOB_OBJECT
  if options.containment_type == 'NSJAIL':
    containment_type = subprocess42.Containment.NSJAIL
  # TODO(https://crbug.com/1227833): This object should eventually contain the
  # path to the nsjail binary and the nsjail configuration file.
  containment = subprocess42.Containment(
      containment_type=containment_type,
      limit_processes=options.limit_processes,
      limit_total_committed_memory=options.limit_total_committed_memory)

  data = TaskData(
      command=command,
      relative_cwd=options.relative_cwd,
      cas_instance=options.cas_instance,
      cas_digest=options.cas_digest,
      outputs=options.output,
      install_named_caches=install_named_caches,
      leak_temp_dir=options.leak_temp_dir,
      root_dir=_to_unicode(options.root_dir),
      hard_timeout=options.hard_timeout,
      grace_period=options.grace_period,
      bot_file=options.bot_file,
      switch_to_account=options.switch_to_account,
      install_packages_fn=install_packages_fn,
      cas_cache_dir=options.cas_cache,
      cas_cache_policies=local_caching.CachePolicies(
          max_cache_size=options.max_cache_size,
          min_free_space=options.min_free_space,
          max_items=None,
          max_age_secs=None,
      ),
      cas_kvs=options.kvs_dir,
      env=options.env,
      env_prefix=options.env_prefix,
      lower_priority=bool(options.lower_priority),
      containment=containment,
      trim_caches_fn=trim_caches_fn)
  try:
    return run_tha_test(data, options.json)
  except (cipd.Error, local_caching.NamedCacheError,
          local_caching.NoMoreSpace) as ex:
    # Exceptions only carry a .message attribute on Python 2 (or when the class
    # defines one); fall back to str(ex) so this handler cannot itself raise.
    print(getattr(ex, 'message', None) or str(ex), file=sys.stderr)
    on_error.report(None)
    return 1
  finally:
    if tmp_cipd_cache_dir is not None:
      try:
        file_path.rmtree(tmp_cipd_cache_dir)
      except OSError:
        logging.exception('Remove tmp_cipd_cache_dir=%s failed',
                          tmp_cipd_cache_dir)
        # Best effort clean up. Failed to do so doesn't affect the outcome.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001763
1764
if __name__ == '__main__':
  # Script entry point: set up the process, then exit with main()'s result.
  subprocess42.inhibit_os_error_reporting()
  # Ensure that we are always running with the correct encoding.
  fix_encoding.fix_encoding()
  net.set_user_agent('run_isolated.py/' + __version__)
  exit_code = main(sys.argv[1:])
  sys.exit(exit_code)
Marc-Antoine Ruel90c98162013-12-18 15:11:57 -05001770 sys.exit(main(sys.argv[1:]))