blob: f8bf7d12982aa07cda05a42e62518b6b9243f3d4 [file] [log] [blame]
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001#!/usr/bin/env python
maruelea586f32016-04-05 11:11:33 -07002# Copyright 2012 The LUCI Authors. All rights reserved.
maruelf1f5e2a2016-05-25 17:10:39 -07003# Use of this source code is governed under the Apache License, Version 2.0
4# that can be found in the LICENSE file.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00005
nodir55be77b2016-05-03 09:39:57 -07006"""Runs a command with optional isolated input/output.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00007
run_isolated takes care of setting up a temporary environment, running a
command, and tearing it down.
nodir55be77b2016-05-03 09:39:57 -070010
Marc-Antoine Rueleed2f3a2019-03-14 00:00:40 +000011It handles downloading and uploading isolated files, mapping CIPD packages and
12reusing stateful named caches.
13
14The isolated files, CIPD packages and named caches are kept as a global LRU
15cache.
Marc-Antoine Ruel2283ad12014-02-09 11:14:57 -050016
Roberto Carrillo71ade6d2018-10-08 22:30:24 +000017Any ${EXECUTABLE_SUFFIX} on the command line or the environment variables passed
18with the --env option will be replaced with ".exe" string on Windows and "" on
19other platforms.
nodirbe642ff2016-06-09 15:51:51 -070020
Roberto Carrillo71ade6d2018-10-08 22:30:24 +000021Any ${ISOLATED_OUTDIR} on the command line or the environment variables passed
22with the --env option will be replaced by the location of a temporary directory
23upon execution of the command specified in the .isolated file. All content
24written to this directory will be uploaded upon termination and the .isolated
25file describing this directory will be printed to stdout.
bpastene447c1992016-06-20 15:21:47 -070026
Marc-Antoine Rueleed2f3a2019-03-14 00:00:40 +000027Any ${SWARMING_BOT_FILE} on the command line or the environment variables passed
28with the --env option will be replaced by the value of the --bot-file parameter.
29This file is used by a swarming bot to communicate state of the host to tasks.
30It is written to by the swarming bot's on_before_task() hook in the swarming
31server's custom bot_config.py.
32
Joanna Wang4cec0e42021-08-26 00:48:37 +000033Any ${SWARMING_TASK_ID} on the command line will be replaced by the
34SWARMING_TASK_ID value passed with the --env option.
35
Marc-Antoine Rueleed2f3a2019-03-14 00:00:40 +000036See
37https://chromium.googlesource.com/infra/luci/luci-py.git/+/master/appengine/swarming/doc/Magic-Values.md
38for all the variables.
39
40See
41https://chromium.googlesource.com/infra/luci/luci-py.git/+/master/appengine/swarming/swarming_bot/config/bot_config.py
42for more information about bot_config.py.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000043"""
44
Marc-Antoine Ruelf899c482019-10-10 23:32:06 +000045from __future__ import print_function
46
47__version__ = '1.0.1'
maruel@chromium.orgdedbf492013-09-12 20:42:11 +000048
aludwin7556e0c2016-10-26 08:46:10 -070049import argparse
maruel064c0a32016-04-05 11:47:15 -070050import base64
iannucci96fcccc2016-08-30 15:52:22 -070051import collections
vadimsh232f5a82017-01-20 19:23:44 -080052import contextlib
Ye Kuangfff1e502020-07-13 13:21:57 +000053import distutils
Sadaf Matinkhoo10743a62018-03-29 16:28:58 -040054import errno
aludwin7556e0c2016-10-26 08:46:10 -070055import json
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000056import logging
57import optparse
58import os
Takuto Ikuta5c59a842020-01-24 03:05:24 +000059import platform
Marc-Antoine Ruel8b11dbd2018-05-18 14:31:22 -040060import re
Junji Watanabedc2f89e2021-11-08 08:44:30 +000061import shutil
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000062import sys
63import tempfile
maruel064c0a32016-04-05 11:47:15 -070064import time
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000065
Marc-Antoine Ruel016c7602019-04-02 18:31:13 +000066from utils import tools
67tools.force_local_third_party()
vadimsh@chromium.orga4326472013-08-24 02:05:41 +000068
Marc-Antoine Ruel016c7602019-04-02 18:31:13 +000069# third_party/
70from depot_tools import fix_encoding
Takuto Ikuta6e2ff962019-10-29 12:35:27 +000071import six
Marc-Antoine Ruel016c7602019-04-02 18:31:13 +000072
73# pylint: disable=ungrouped-imports
Takuto Ikutad53d7bd2021-07-16 03:09:33 +000074import DEPS
Marc-Antoine Ruel016c7602019-04-02 18:31:13 +000075import auth
76import cipd
Marc-Antoine Ruel016c7602019-04-02 18:31:13 +000077import isolateserver
78import local_caching
79from libs import luci_context
Vadim Shtayura6b555c12014-07-23 16:22:18 -070080from utils import file_path
maruel12e30012015-10-09 11:55:35 -070081from utils import fs
Marc-Antoine Ruelf74cffe2015-07-15 15:21:34 -040082from utils import logging_utils
Ye Kuang2dd17442020-04-22 08:45:52 +000083from utils import net
Marc-Antoine Ruelcfb60852014-07-02 15:22:00 -040084from utils import on_error
Marc-Antoine Ruelc44f5722015-01-08 16:10:01 -050085from utils import subprocess42
maruel@chromium.orgdedbf492013-09-12 20:42:11 +000086
vadimsh@chromium.orga4326472013-08-24 02:05:41 +000087
maruele2f2cb82016-07-13 14:41:03 -070088# Magic variables that can be found in the isolate task command line.
89ISOLATED_OUTDIR_PARAMETER = '${ISOLATED_OUTDIR}'
90EXECUTABLE_SUFFIX_PARAMETER = '${EXECUTABLE_SUFFIX}'
91SWARMING_BOT_FILE_PARAMETER = '${SWARMING_BOT_FILE}'
Joanna Wang4cec0e42021-08-26 00:48:37 +000092SWARMING_TASK_ID_PARAMETER = '${SWARMING_TASK_ID}'
maruele2f2cb82016-07-13 14:41:03 -070093
94
csharp@chromium.orgff2a4662012-11-21 20:49:32 +000095# The name of the log file to use.
96RUN_ISOLATED_LOG_FILE = 'run_isolated.log'
97
maruele2f2cb82016-07-13 14:41:03 -070098
maruele2f2cb82016-07-13 14:41:03 -070099# Use short names for temporary directories. This is driven by Windows, which
100# imposes a relatively short maximum path length of 260 characters, often
101# referred to as MAX_PATH. It is relatively easy to create files with longer
Marc-Antoine Ruel793bff32019-04-18 17:50:48 +0000102# path length. A use case is with recursive dependency trees like npm packages.
maruele2f2cb82016-07-13 14:41:03 -0700103#
104# It is recommended to start the script with a `root_dir` as short as
105# possible.
106# - ir stands for isolated_run
107# - io stands for isolated_out
108# - it stands for isolated_tmp
Takuto Ikutab7ce0e32019-11-27 23:26:18 +0000109# - ic stands for isolated_client
Anirudh Mathukumilli92d57b62021-08-04 23:21:57 +0000110# - ns stands for nsjail
maruele2f2cb82016-07-13 14:41:03 -0700111ISOLATED_RUN_DIR = u'ir'
112ISOLATED_OUT_DIR = u'io'
113ISOLATED_TMP_DIR = u'it'
Takuto Ikutab7ce0e32019-11-27 23:26:18 +0000114ISOLATED_CLIENT_DIR = u'ic'
Junji Watanabe4b890ef2020-09-16 01:43:27 +0000115_CAS_CLIENT_DIR = u'cc'
Anirudh Mathukumilli92d57b62021-08-04 23:21:57 +0000116_NSJAIL_DIR = u'ns'
maruele2f2cb82016-07-13 14:41:03 -0700117
# TODO(tikuta): take these parameters from luci-config?
Junji Watanabe4b890ef2020-09-16 01:43:27 +0000119_CAS_PACKAGE = 'infra/tools/luci/cas/${platform}'
Takuto Ikutad53d7bd2021-07-16 03:09:33 +0000120_LUCI_GO_REVISION = DEPS.deps['luci-go']['packages'][0]['version']
Anirudh Mathukumilli92d57b62021-08-04 23:21:57 +0000121_NSJAIL_PACKAGE = 'infra/3pp/tools/nsjail/${platform}'
122_NSJAIL_VERSION = DEPS.deps['nsjail']['packages'][0]['version']
maruele2f2cb82016-07-13 14:41:03 -0700123
Marc-Antoine Ruel8b11dbd2018-05-18 14:31:22 -0400124# Keep synced with task_request.py
Lei Leife202df2019-06-11 17:33:34 +0000125CACHE_NAME_RE = re.compile(r'^[a-z0-9_]{1,4096}$')
Marc-Antoine Ruel8b11dbd2018-05-18 14:31:22 -0400126
Takuto Ikutac9ddff22021-02-18 07:58:39 +0000127_FREE_SPACE_BUFFER_FOR_CIPD_PACKAGES = 2 * 1024 * 1024 * 1024
Marc-Antoine Ruel8b11dbd2018-05-18 14:31:22 -0400128
marueld928c862017-06-08 08:20:04 -0700129OUTLIVING_ZOMBIE_MSG = """\
130*** Swarming tried multiple times to delete the %s directory and failed ***
131*** Hard failing the task ***
132
133Swarming detected that your testing script ran an executable, which may have
134started a child executable, and the main script returned early, leaving the
135children executables playing around unguided.
136
137You don't want to leave children processes outliving the task on the Swarming
138bot, do you? The Swarming bot doesn't.
139
140How to fix?
141- For any process that starts children processes, make sure all children
142 processes terminated properly before each parent process exits. This is
143 especially important in very deep process trees.
144 - This must be done properly both in normal successful task and in case of
145 task failure. Cleanup is very important.
146- The Swarming bot sends a SIGTERM in case of timeout.
147 - You have %s seconds to comply after the signal was sent to the process
148 before the process is forcibly killed.
149- To achieve not leaking children processes in case of signals on timeout, you
150 MUST handle signals in each executable / python script and propagate them to
151 children processes.
152 - When your test script (python or binary) receives a signal like SIGTERM or
153 CTRL_BREAK_EVENT on Windows), send it to all children processes and wait for
154 them to terminate before quitting.
155
156See
Marc-Antoine Ruelc7243592018-05-24 17:04:04 -0400157https://chromium.googlesource.com/infra/luci/luci-py.git/+/master/appengine/swarming/doc/Bot.md#Graceful-termination_aka-the-SIGTERM-and-SIGKILL-dance
marueld928c862017-06-08 08:20:04 -0700158for more information.
159
160*** May the SIGKILL force be with you ***
161"""
162
163
Marc-Antoine Ruel5d7606b2018-06-15 19:06:12 +0000164# Currently hardcoded. Eventually could be exposed as a flag once there's value.
165# 3 weeks
166MAX_AGE_SECS = 21*24*60*60
167
Takuto Ikuta7ff4b242020-12-03 08:07:06 +0000168_CAS_KVS_CACHE_THRESHOLD = 5 * 1024 * 1024 * 1024 # 5 GiB
169
# Immutable bundle of everything needed to run one task.
TaskData = collections.namedtuple(
    'TaskData',
    (
        # Command line to run, as a list of strings. Used regardless of what
        # the isolated file specifies.
        'command',
        # Directory, relative to the run directory, the command starts in.
        'relative_cwd',
        # Hash of the .isolated file to fetch in order to recreate the file
        # tree for the target executable; the command listed in the .isolated
        # is what gets executed. Mutually exclusive with the command argument.
        'isolated_hash',
        # isolateserver.Storage instance used to fetch remote objects. It
        # holds a reference to an isolateserver.StorageApi, which performs the
        # actual I/O.
        'storage',
        # isolateserver.LocalCache instance (on-disk or in-memory) that caches
        # fetched objects so they are not retrieved over and over.
        'isolate_cache',
        # Digest of the input root on RBE-CAS.
        'cas_digest',
        # Full CAS instance name.
        'cas_instance',
        # Paths, relative to root_dir, to include in the output isolated
        # bundle once the task completes (see link_outputs_to_outdir).
        'outputs',
        # Function (run_dir) => context manager installing named caches into
        # |run_dir|.
        'install_named_caches',
        # When True, the temporary directory is intentionally left behind so
        # it can be examined later.
        'leak_temp_dir',
        # Directory under which the temporary directory is created. A random
        # temporary directory is created when not specified.
        'root_dir',
        # The process is killed if it runs for more than this many seconds.
        'hard_timeout',
        # Seconds to wait between SIGTERM and SIGKILL.
        'grace_period',
        # Path to a file holding bot state; substituted for
        # ${SWARMING_BOT_FILE} in the task command line.
        'bot_file',
        # Logical account to switch LUCI_CONTEXT into.
        'switch_to_account',
        # Context manager dir => CipdInfo, see install_client_and_packages.
        'install_packages_fn',
        # Cache directory for the `cas` client.
        'cas_cache_dir',
        # Parameters passed to the `cas` client.
        'cas_cache_policies',
        # Parameters for the kvs file used by the `cas` client.
        'cas_kvs',
        # Environment variables to set.
        'env',
        # Environment variables to extend with relative directories.
        # Example: {"ENV_KEY": ['relative', 'paths', 'to', 'prepend']}
        'env_prefix',
        # Lowers the task process priority.
        'lower_priority',
        # subprocess42.Containment instance. Can be None.
        'containment',
        # Function that trims caches before cipd packages are installed and
        # isolated files are downloaded.
        'trim_caches_fn',
    ))
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -0500236
237
Marc-Antoine Ruelee6ca622017-11-29 11:19:16 -0500238def _to_str(s):
239 """Downgrades a unicode instance to str. Pass str through as-is."""
240 if isinstance(s, str):
241 return s
242 # This is technically incorrect, especially on Windows. In theory
243 # sys.getfilesystemencoding() should be used to use the right 'ANSI code
244 # page' on Windows, but that causes other problems, as the character set
245 # is very limited.
246 return s.encode('utf-8')
247
248
def _to_unicode(s):
  """Returns |s| as text, decoding it from UTF-8 when needed.

  None and values that are already six.text_type are returned unchanged.
  """
  already_text = s is None or isinstance(s, six.text_type)
  return s if already_text else s.decode('utf-8')
254
255
def make_temp_dir(prefix, root_dir):
  """Creates a fresh temporary directory under |root_dir|.

  Returns:
    The path of the new directory as six.text_type.
  """
  created = tempfile.mkdtemp(prefix=prefix, dir=root_dir)
  return six.text_type(created)
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +0000259
260
@contextlib.contextmanager
def set_luci_context_account(account, tmp_dir):
  """Context manager that makes |account| the default LUCI_CONTEXT account.

  Nothing is changed in any of these cases:
    - |account| is None or '' (run_isolated.py was called without
      '--switch-to-account'); a task running inside some LUCI_CONTEXT then
      simply inherits whatever account is already set, e.g. when users invoke
      run_isolated.py explicitly from their code.
    - There is no 'local_auth' section, i.e. LUCI_CONTEXT-based auth is not in
      use.
    - |account| is already the default account.

  Otherwise a new LUCI_CONTEXT is written under |tmp_dir| for the duration of
  the block. If |account| is not among the accounts defined in the context,
  the default account is removed instead, which switches to non-authenticated
  access. This happens for Swarming tasks that don't use 'task' service
  accounts.
  """
  # Only consult LUCI_CONTEXT when a switch was actually requested.
  local_auth = luci_context.read('local_auth') if account else None

  # See LUCI_CONTEXT.md for the format of 'local_auth'.
  if not local_auth or local_auth.get('default_account_id') == account:
    # Not switching, not using LUCI_CONTEXT auth, or already set.
    yield
    return

  known_ids = set(
      entry['id'] for entry in (local_auth.get('accounts') or []))
  if account not in known_ids:
    logging.warning(
        'Requested LUCI_CONTEXT account %r is not available (have only %r), '
        'disabling authentication', account, sorted(known_ids))
    local_auth.pop('default_account_id', None)
  else:
    logging.info('Switching default LUCI_CONTEXT account to %r', account)
    local_auth['default_account_id'] = account

  with luci_context.write(_tmpdir=tmp_dir, local_auth=local_auth):
    yield
307
308
def process_command(command, out_dir, bot_file):
  """Substitutes parameter tokens in every argument of a command line.

  Args:
    command: iterable of argument strings.
    out_dir: value substituted for the output directory token.
    bot_file: value substituted for the bot file token.

  Returns:
    A new list with each argument run through replace_parameters().

  Raises:
    ValueError if a parameter is requested in |command| but its value is not
    provided.
  """
  processed = []
  for arg in command:
    processed.append(replace_parameters(arg, out_dir, bot_file))
  return processed
317
318
def replace_parameters(arg, out_dir, bot_file):
  """Expands the magic parameter tokens found in a single string.

  Args:
    arg: string that may contain parameter tokens.
    out_dir: replacement for ISOLATED_OUTDIR_PARAMETER.
    bot_file: replacement for SWARMING_BOT_FILE_PARAMETER; when falsy the
        token is left in place and a warning is logged.

  Returns:
    The string with tokens replaced. When an output directory or bot file
    token was substituted, every '/' in the result is converted to os.sep.

  Raises:
    ValueError if ISOLATED_OUTDIR_PARAMETER is present in |arg| but |out_dir|
    is not provided.
  """
  result = arg.replace(EXECUTABLE_SUFFIX_PARAMETER, cipd.EXECUTABLE_SUFFIX)
  substituted_path = False

  if ISOLATED_OUTDIR_PARAMETER in result:
    if not out_dir:
      raise ValueError(
          'output directory is requested in command or env var, but not '
          'provided; please specify one')
    result = result.replace(ISOLATED_OUTDIR_PARAMETER, out_dir)
    substituted_path = True

  if SWARMING_BOT_FILE_PARAMETER in result:
    if not bot_file:
      logging.warning('SWARMING_BOT_FILE_PARAMETER found in command or env '
                      'var, but no bot_file specified. Leaving parameter '
                      'unchanged.')
    else:
      result = result.replace(SWARMING_BOT_FILE_PARAMETER, bot_file)
      substituted_path = True

  if SWARMING_TASK_ID_PARAMETER in result:
    # The task id is read from this process' own environment.
    task_id = os.environ.get('SWARMING_TASK_ID')
    if task_id:
      result = result.replace(SWARMING_TASK_ID_PARAMETER, task_id)

  # Slashes are converted only when a path parameter was substituted, because
  # of arguments like '${ISOLATED_OUTDIR}/foo/bar'.
  return result.replace('/', os.sep) if substituted_path else result
maruela9cfd6f2015-09-15 11:03:15 -0700352
353
def set_temp_dir(env, tmp_dir):
  """Points the temp-directory variables in the |env| dict at |tmp_dir|.

  |env| is modified in place; nothing is returned.
  """
  native_tmp = _to_str(tmp_dir)
  # pylint: disable=line-too-long
  # Extra variables needed per platform, on top of TMPDIR:
  # - win32:
  #   * chromium's base utils uses GetTempPath().
  #     https://cs.chromium.org/chromium/src/base/files/file_util_win.cc?q=GetTempPath
  #   * Go uses GetTempPath().
  #   * GetTempDir() uses %TMP%, then %TEMP%, then other stuff. So %TMP% must
  #     be set.
  #     https://docs.microsoft.com/en-us/windows/desktop/api/fileapi/nf-fileapi-gettemppathw
  #     https://blogs.msdn.microsoft.com/oldnewthing/20150417-00/?p=44213
  # - darwin:
  #   * Chromium uses a hack on macOS before calling into
  #     NSTemporaryDirectory().
  #     https://cs.chromium.org/chromium/src/base/files/file_util_mac.mm?q=GetTempDir
  #     https://developer.apple.com/documentation/foundation/1409211-nstemporarydirectory
  # - anything else: nothing extra. TMPDIR is specified as the POSIX standard
  #   envvar for the temp directory.
  #   http://pubs.opengroup.org/onlinepubs/9699919799/basedefs/V1_chap08.html
  #   * mktemp on linux respects $TMPDIR.
  #   * Chromium respects $TMPDIR on linux.
  #     https://cs.chromium.org/chromium/src/base/files/file_util_posix.cc?q=GetTempDir
  #   * Go uses $TMPDIR.
  #     https://go.googlesource.com/go/+/go1.10.3/src/os/file_unix.go#307
  platform_vars = {
      'win32': ('TMP', 'TEMP'),
      'darwin': ('MAC_CHROMIUM_TMPDIR',),
  }.get(sys.platform, ())

  # python respects $TMPDIR, $TEMP, and $TMP in this order, regardless of
  # platform. So $TMPDIR must be set on all platforms.
  # https://github.com/python/cpython/blob/2.7/Lib/tempfile.py#L155
  for name in ('TMPDIR',) + platform_vars:
    env[name] = native_tmp
387
Roberto Carrillo71ade6d2018-10-08 22:30:24 +0000388
def get_command_env(tmp_dir, cipd_info, run_dir, env, env_prefixes, out_dir,
                    bot_file):
  """Returns full OS environment to run a command in.

  Starts from a copy of os.environ, applies |env|, sets up the temp directory
  variables, puts the directory with the cipd binary in front of PATH, exposes
  CIPD_CACHE_DIR and installs all env_prefixes.

  Args:
    tmp_dir: temp directory. When |cipd_info| is set, a 'cipd_info.json' file
        holding the cipd pins is also written here.
    cipd_info: CipdInfo object if cipd client is used, None if not.
    run_dir: The root directory the isolated tree is mapped in.
    env: environment variables to use. A key with a falsy value removes that
        variable from the result.
    env_prefixes: {"ENV_KEY": ['cwd', 'relative', 'paths', 'to', 'prepend']}
    out_dir: Isolated output directory. Required to be != None if any of the
        env vars contain ISOLATED_OUTDIR_PARAMETER.
    bot_file: Required to be != None if any of the env vars contain
        SWARMING_BOT_FILE_PARAMETER.

  Returns:
    dict mapping environment variable names to values.

  Raises:
    ValueError if an env value requests the output directory but |out_dir| is
    not provided (raised by replace_parameters).
  """
  out = os.environ.copy()
  for k, v in env.items():
    if not v:
      out.pop(k, None)
    else:
      out[k] = replace_parameters(v, out_dir, bot_file)

  if cipd_info:
    bin_dir = _to_str(os.path.dirname(cipd_info.client.binary_path))
    # PATH can be missing here: the host may not define it, or |env| may have
    # just removed it above. Treat a missing or empty PATH the same way the
    # env_prefixes loop below treats a missing variable, instead of raising
    # KeyError.
    cur_path = out.get('PATH')
    if cur_path:
      out['PATH'] = '%s%s%s' % (bin_dir, os.pathsep, cur_path)
    else:
      out['PATH'] = bin_dir
    out['CIPD_CACHE_DIR'] = _to_str(cipd_info.cache_dir)
    # Dump the cipd pins to a file and tell the task where to find it.
    cipd_info_path = os.path.join(tmp_dir, 'cipd_info.json')
    with open(cipd_info_path, 'w') as f:
      json.dump(cipd_info.pins, f)
    out['ISOLATED_RESOLVED_PACKAGE_VERSIONS_FILE'] = cipd_info_path

  for key, paths in env_prefixes.items():
    assert isinstance(paths, list), paths
    # Prefixes are relative to run_dir; any existing value goes last.
    paths = [os.path.normpath(os.path.join(run_dir, p)) for p in paths]
    cur = out.get(key)
    if cur:
      paths.append(cur)
    out[key] = _to_str(os.path.pathsep.join(paths))

  set_temp_dir(out, tmp_dir)
  return out
vadimsh232f5a82017-01-20 19:23:44 -0800433
434
def run_command(
    command, cwd, env, hard_timeout, grace_period, lower_priority, containment):
  """Runs the command and waits for it, enforcing the hard timeout.

  The child is started detached. If it is still running after |hard_timeout|
  seconds, or if this process receives one of subprocess42.STOP_SIGNALS, the
  child is sent SIGTERM and given |grace_period| seconds to exit before it is
  sent SIGKILL.

  Args:
    command: command line passed to subprocess42.Popen.
    cwd: working directory for the child process.
    env: environment for the child process.
    hard_timeout: seconds to wait before terminating the child; a falsy value
        waits without a timeout.
    grace_period: seconds to wait after SIGTERM before killing the child; a
        falsy value waits without a timeout.
    lower_priority: forwarded to subprocess42.Popen.
    containment: forwarded to subprocess42.Popen.

  Returns:
    tuple(process exit code, bool if had a hard timeout)
    The exit code is 1 when an OSError is raised while starting or waiting on
    the process.
  """
  logging.info(
      'run_command(%s, %s, %s, %s, %s, %s)',
      command, cwd, hard_timeout, grace_period, lower_priority, containment)

  exit_code = None
  had_hard_timeout = False
  with tools.Profiler('RunTest'):
    proc = None
    # A list is used so that handler() can record the signal by mutating it.
    had_signal = []
    try:
      # TODO(maruel): This code is imperfect. It doesn't handle signals well
      # during the download phase and there are short windows where things can
      # go wrong.
      def handler(signum, _frame):
        # Only the first signal received after the process started is turned
        # into a TimeoutExpired, so that it is handled like a timeout below.
        if proc and not had_signal:
          logging.info('Received signal %d', signum)
          had_signal.append(True)
          raise subprocess42.TimeoutExpired(command, None)

      proc = subprocess42.Popen(
          command, cwd=cwd, env=env, detached=True, close_fds=True,
          lower_priority=lower_priority, containment=containment)
      logging.info('Subprocess for command started')
      with subprocess42.set_signal_handler(subprocess42.STOP_SIGNALS, handler):
        try:
          exit_code = proc.wait(hard_timeout or None)
          logging.info("finished with exit code %d", exit_code)
        except subprocess42.TimeoutExpired:
          # Raised either by the wait() timeout or by handler() above; only
          # the former counts as a hard timeout.
          if not had_signal:
            logging.warning('Hard timeout')
            had_hard_timeout = True
          logging.warning('Sending SIGTERM')
          proc.terminate()

      kill_sent = False
      # Ignore signals in grace period. Forcibly give the grace period to the
      # child process.
      if exit_code is None:
        ignore = lambda *_: None
        with subprocess42.set_signal_handler(subprocess42.STOP_SIGNALS, ignore):
          try:
            exit_code = proc.wait(grace_period or None)
            logging.info("finished with exit code %d", exit_code)
          except subprocess42.TimeoutExpired:
            # Now kill for real. The user can distinguish between the
            # following states:
            # - signal but process exited within grace period,
            #   hard_timed_out will be set but the process exit code will be
            #   script provided.
            # - process exited late, exit code will be -9 on posix.
            logging.warning('Grace exhausted; sending SIGKILL')
            proc.kill()
            kill_sent = True
      logging.info('Waiting for process exit')
      exit_code = proc.wait()

      # the process group / job object may be dangling so if we didn't kill
      # it already, give it a poke now.
      if not kill_sent:
        proc.kill()
    except OSError as e:
      # This is not considered to be an internal error. The executable simply
      # does not exist.
      sys.stderr.write(
          '<The executable does not exist, a dependent library is missing or '
          'the command line is too long>\n'
          '<Check for missing .so/.dll in the .isolate or GN file or length of '
          'command line args>\n'
          '<Command: %s>\n'
          '<Exception: %s>\n' % (command, e))
      if os.environ.get('SWARMING_TASK_ID'):
        # Give an additional hint when running as a swarming task.
        sys.stderr.write(
            '<See the task\'s page for commands to help diagnose this issue '
            'by reproducing the task locally>\n')
      exit_code = 1
  # The mask renders a negative exit code as an unsigned 32-bit hex value.
  logging.info(
      'Command finished with exit code %d (%s)',
      exit_code, hex(0xffffffff & exit_code))
  return exit_code, had_hard_timeout
maruela9cfd6f2015-09-15 11:03:15 -0700522
523
def _run_go_cmd_and_wait(cmd, tmp_dir):
  """Launches an external Go command, `isolated` or `cas`, and waits for it.

  This is a generic subprocess launcher, but its waiting and logging logic is
  specific to the Go `isolated` and `cas` clients.

  Args:
    cmd: command line, as a list of strings.
    tmp_dir: directory the child process is told to use as its temp directory.

  Returns:
    The subprocess object

  Raises:
    subprocess42.CalledProcessError if the command exits with a non-zero code.
    ValueError if the command is still running after the maximum wait time.
  """
  cmd_str = ' '.join(cmd)
  try:
    child_env = os.environ.copy()
    set_temp_dir(child_env, tmp_dir)
    proc = subprocess42.Popen(cmd, env=child_env)

    check_period_sec = 30
    max_checks = 100
    # max timeout = max_checks * check_period_sec = 50 minutes
    for i in range(max_checks):
      # Waiting in short periods and printing in between is to prevent I/O
      # timeout error during setup.
      try:
        retcode = proc.wait(check_period_sec)
      except subprocess42.TimeoutExpired:
        print('still running (after %d seconds)' % ((i + 1) * check_period_sec))
        continue
      if retcode != 0:
        raise subprocess42.CalledProcessError(retcode, cmd=cmd_str)
      break
    else:
      # Every check timed out: stop the process, gently first.
      proc.terminate()
      try:
        proc.wait(check_period_sec)
      except subprocess42.TimeoutExpired:
        logging.exception(
            "failed to terminate? timeout happened after %d seconds",
            check_period_sec)
        proc.kill()
      proc.wait()
      # Raise unconditionally, because |proc| was forcefully terminated.
      raise ValueError("timedout after %d seconds (cmd=%s)" %
                       (check_period_sec * max_checks, cmd_str))

    return proc
  except Exception:
    logging.exception('Failed to run Go cmd %s', cmd_str)
    raise
Ye Kuangc0cf9ca2020-07-16 08:56:51 +0000573
574
def _fetch_and_map(cas_client, digest, instance, output_dir, cache_dir,
                   policies, kvs_dir, tmp_dir):
  """Downloads a CAS tree into |output_dir| with the cas client.

  Args:
    cas_client: path to the `cas` executable.
    digest: value of the client's -digest flag.
    instance: value of the -cas-instance flag; ignored when the
        RUN_ISOLATED_CAS_ADDRESS environment variable is set.
    output_dir: directory the tree is created in.
    cache_dir: value of the -cache-dir flag.
    policies: object providing max_cache_size and min_free_space.
    kvs_dir: value of the -kvs-dir flag; the flag is omitted when falsy.
    tmp_dir: temp directory handed to the client process.

  Returns:
    dict with the download stats: 'duration', 'items_cold' and 'items_hot'.
  """
  start = time.time()
  stats_fd, stats_path = tempfile.mkstemp(
      prefix=u'fetch-and-map-result-', suffix=u'.json')
  # Only the path is needed; the client writes the file itself.
  os.close(stats_fd)
  # Scratch directory under tmp_dir, removed on exit. Nothing in this function
  # passes it to the client.
  profile_dir = tempfile.mkdtemp(dir=tmp_dir)

  try:
    cmd = [cas_client, 'download', '-digest', digest]
    # flags for cache.
    cmd += [
        '-cache-dir', cache_dir,
        '-cache-max-size', str(policies.max_cache_size),
        '-cache-min-free-space', str(policies.min_free_space),
    ]
    # flags for output.
    cmd += [
        '-dir', output_dir,
        '-dump-stats-json', stats_path,
        '-log-level', 'info',
    ]

    # When RUN_ISOLATED_CAS_ADDRESS is set in test mode,
    # use it and ignore the CAS instance option.
    cas_addr = os.environ.get('RUN_ISOLATED_CAS_ADDRESS')
    cmd += ['-cas-addr', cas_addr] if cas_addr else ['-cas-instance', instance]

    if kvs_dir:
      cmd += ['-kvs-dir', kvs_dir]

    try:
      _run_go_cmd_and_wait(cmd, tmp_dir)
    except subprocess42.CalledProcessError as ex:
      # Without a kvs cache there is nothing to reset before retrying.
      if not kvs_dir:
        raise
      logging.exception('Failed to run cas, removing kvs cache dir and retry.')
      on_error.report("Failed to run cas %s" % ex)
      file_path.rmtree(kvs_dir)
      file_path.rmtree(output_dir)
      _run_go_cmd_and_wait(cmd, tmp_dir)

    with open(stats_path) as stats_file:
      stats = json.load(stats_file)

    return {
        'duration': time.time() - start,
        'items_cold': stats['items_cold'],
        'items_hot': stats['items_hot'],
    }
  finally:
    fs.remove(stats_path)
    file_path.rmtree(profile_dir)
Junji Watanabe4b890ef2020-09-16 01:43:27 +0000649
650
def link_outputs_to_outdir(run_dir, out_dir, outputs):
  """Copies every named output from run_dir into out_dir for upload.

  Does nothing when |outputs| is empty. Otherwise the directories needed under
  |out_dir| are created with file_path.create_directories() and each entry of
  |outputs| (a path relative to |run_dir|) is handed to copy_recursively().
  """
  if outputs:
    file_path.create_directories(out_dir, outputs)
    for rel_path in outputs:
      source = os.path.join(run_dir, rel_path)
      destination = os.path.join(out_dir, rel_path)
      copy_recursively(source, destination)
661
662
def copy_recursively(src, dst):
  """Efficiently copies a file or directory from |src| to |dst|.

  |src| may be a file, directory, or a symlink to a file or directory.
  All symlinks are replaced with their targets, so the resulting
  directory structure under |dst| will never have any symlinks.

  To increase speed, copy_recursively hardlinks individual files into the
  (newly created) directory structure if possible, unlike Python's
  shutil.copytree().

  Nothing is raised for OSError: a missing path, a broken symlink or a symlink
  cycle is logged as a warning and skipped; any other OSError is logged at
  info level.
  """
  orig_src = src
  try:
    # Replace symlinks with their final target. Every link followed is
    # remembered so that a symlink cycle (where realpath() hands back a path
    # that is still a link) ends the loop instead of spinning forever.
    visited = set()
    while fs.islink(src):
      if src in visited:
        logging.warning('Path %s is part of a symlink cycle, skipping',
                        orig_src)
        return
      visited.add(src)
      res = fs.readlink(src)
      src = os.path.realpath(os.path.join(os.path.dirname(src), res))

    if not fs.exists(src):
      logging.warning('Path %s does not exist or %s is a broken symlink', src,
                      orig_src)
      return

    if fs.isfile(src):
      file_path.link_file(dst, src, file_path.HARDLINK_WITH_FALLBACK)
      return

    if not fs.exists(dst):
      os.makedirs(dst)

    for child in fs.listdir(src):
      copy_recursively(os.path.join(src, child), os.path.join(dst, child))

  except OSError as e:
    if e.errno == errno.ENOENT:
      logging.warning('Path %s does not exist or %s is a broken symlink',
                      src, orig_src)
    else:
      logging.info("Couldn't collect output file %s: %s", src, e)
aludwin0a8e17d2016-10-27 15:57:39 -0700703
704
def upload_outdir(cas_client, cas_instance, outdir, tmp_dir):
  """Archives the content of |outdir| with the cas client, if there is any.

  Arguments:
  - cas_client: path of the cas executable to invoke.
  - cas_instance: value passed to `-cas-instance` (unless the
      RUN_ISOLATED_CAS_ADDRESS environment variable is set) and echoed back
      in the returned root.
  - outdir: directory to archive.
  - tmp_dir: directory handed to _run_go_cmd_and_wait().

  Returns:
    tuple(cas_output_root, stats)
    - cas_output_root: dict with 'cas_instance' and a 'digest' dict holding
      'hash' and 'size_bytes', parsed from the "<hash>/<size>" text dumped
      by the cas client.
    - stats: the stats JSON dumped by the cas client, plus 'duration'.
    Both are None when |outdir| is empty.
  """
  if not fs.listdir(outdir):
    return None, None

  handle, digest_path = tempfile.mkstemp(prefix=u'cas-digest', suffix=u'.txt')
  os.close(handle)
  handle, stats_json_path = tempfile.mkstemp(
      prefix=u'upload-stats', suffix=u'.json')
  os.close(handle)

  try:
    cmd = [
        cas_client,
        'archive',
        # Format: <working directory>:<relative path to dir>
        '-paths', outdir + ':',
        # output
        '-dump-digest', digest_path,
        '-dump-stats-json', stats_json_path,
    ]

    # In test mode RUN_ISOLATED_CAS_ADDRESS takes precedence over the CAS
    # instance option.
    cas_addr = os.environ.get('RUN_ISOLATED_CAS_ADDRESS')
    if cas_addr:
      cmd += ['-cas-addr', cas_addr]
    else:
      cmd += ['-cas-instance', cas_instance]

    if sys.platform.startswith('linux'):
      # TODO(crbug.com/1243194): remove this after investigation.
      cmd += ['-log-level', 'debug']

    start = time.time()
    _run_go_cmd_and_wait(cmd, tmp_dir)

    with open(digest_path) as digest_file:
      digest_hash, digest_size = digest_file.read().split('/')
    cas_output_root = {
        'cas_instance': cas_instance,
        'digest': {
            'hash': digest_hash,
            'size_bytes': int(digest_size),
        },
    }

    with open(stats_json_path) as stats_file:
      stats = json.load(stats_file)
    stats['duration'] = time.time() - start

    return cas_output_root, stats
  finally:
    fs.remove(digest_path)
    fs.remove(stats_json_path)
777
778
def map_and_run(data, constant_run_path):
  """Runs a command with optional isolated input/output.

  Arguments:
  - data: TaskData instance.
  - constant_run_path: when true (and data.root_dir is set), the command runs
      in the fixed directory <root_dir>/ISOLATED_RUN_DIR, which is wiped and
      recreated first; otherwise a fresh directory is made with
      make_temp_dir().

  Returns metadata about the result: a dict with 'exit_code', 'duration',
  'had_hard_timeout', 'internal_failure', 'stats', 'outputs_ref',
  'cas_output_root' and 'version', plus 'cipd_pins' when packages were
  installed. 'internal_failure' is None only when the whole flow completed.
  """

  if data.isolate_cache:
    download_stats = {
        #'duration': 0.,
        'initial_number_items': len(data.isolate_cache),
        'initial_size': data.isolate_cache.total_size,
        #'items_cold': '<large.pack()>',
        #'items_hot': '<large.pack()>',
    }
  else:
    # TODO(tikuta): take stats from state.json in this case too.
    download_stats = {}

  result = {
      'duration': None,
      'exit_code': None,
      'had_hard_timeout': False,
      'internal_failure': 'run_isolated did not complete properly',
      'stats': {
          'trim_caches': {
              'duration': 0,
          },
          #'cipd': {
          #  'duration': 0.,
          #  'get_client_duration': 0.,
          #},
          'isolated': {
              'download': download_stats,
              #'upload': {
              #  'duration': 0.,
              #  'items_cold': '<large.pack()>',
              #  'items_hot': '<large.pack()>',
              #},
          },
          'named_caches': {
              'install': {
                  'duration': 0,
              },
              'uninstall': {
                  'duration': 0,
              },
          },
          'cleanup': {
              'duration': 0,
          }
      },
      #'cipd_pins': {
      #  'packages': [
      #    {'package_name': ..., 'version': ..., 'path': ...},
      #    ...
      #  ],
      #  'client_package': {'package_name': ..., 'version': ...},
      #},
      'outputs_ref': None,
      'cas_output_root': None,
      'version': 5,
  }

  assert os.path.isabs(data.root_dir), ("data.root_dir is not abs path: %s" %
                                        data.root_dir)
  file_path.ensure_tree(data.root_dir, 0o700)

  # See comment for these constants.
  # TODO(maruel): This is not obvious. Change this to become an error once we
  # make the constant_run_path an exposed flag.
  if constant_run_path and data.root_dir:
    run_dir = os.path.join(data.root_dir, ISOLATED_RUN_DIR)
    if os.path.isdir(run_dir):
      file_path.rmtree(run_dir)
    os.mkdir(run_dir, 0o700)
  else:
    run_dir = make_temp_dir(ISOLATED_RUN_DIR, data.root_dir)

  # True if CAS is used for download/upload files.
  use_cas = bool(data.cas_digest)

  # The output directory is only created when CAS is in use, since CAS is the
  # only upload path handled below.
  out_dir = None
  if use_cas:
    out_dir = make_temp_dir(ISOLATED_OUT_DIR, data.root_dir)
  tmp_dir = make_temp_dir(ISOLATED_TMP_DIR, data.root_dir)
  cwd = run_dir
  if data.relative_cwd:
    cwd = os.path.normpath(os.path.join(cwd, data.relative_cwd))
  command = data.command

  cas_client = None
  cas_client_dir = make_temp_dir(_CAS_CLIENT_DIR, data.root_dir)
  if use_cas:
    cas_client = os.path.join(cas_client_dir, 'cas' + cipd.EXECUTABLE_SUFFIX)

  data.trim_caches_fn(result['stats']['trim_caches'])

  nsjail_dir = None
  if (sys.platform == "linux" and cipd.get_platform() == "amd64" and
      data.containment.containment_type == subprocess42.Containment.NSJAIL):
    nsjail_dir = make_temp_dir(_NSJAIL_DIR, data.root_dir)

  try:
    with data.install_packages_fn(run_dir, cas_client_dir,
                                  nsjail_dir) as cipd_info:
      if cipd_info:
        result['stats']['cipd'] = cipd_info.stats
        result['cipd_pins'] = cipd_info.pins

      isolated_stats = result['stats'].setdefault('isolated', {})

      if data.cas_digest:
        stats = _fetch_and_map(
            cas_client=cas_client,
            digest=data.cas_digest,
            instance=data.cas_instance,
            output_dir=run_dir,
            cache_dir=data.cas_cache_dir,
            policies=data.cas_cache_policies,
            kvs_dir=data.cas_kvs,
            tmp_dir=tmp_dir)
        isolated_stats['download'].update(stats)

      if not command:
        # Handle this as a task failure, not an internal failure.
        sys.stderr.write(
            '<No command was specified!>\n'
            '<Please secify a command when triggering your Swarming task>\n')
        result['exit_code'] = 1
        return result

      # Handle this as a task failure, not an internal failure. This is a
      # 'last chance' way to gate against directory escape. The comparison is
      # done on a path-component boundary: a bare string-prefix test would
      # also accept a sibling directory such as '<run_dir>_other'.
      run_root = os.path.normpath(run_dir)
      norm_cwd = os.path.normpath(cwd)
      if (norm_cwd != run_root and
          not norm_cwd.startswith(os.path.join(run_root, ''))):
        sys.stderr.write('<Relative CWD is outside of run directory!>\n')
        result['exit_code'] = 1
        return result

      if not os.path.isdir(cwd):
        # Accepts relative_cwd that does not exist.
        os.makedirs(cwd, 0o700)

      # If we have an explicit list of files to return, make sure their
      # directories exist now.
      if data.outputs:
        file_path.create_directories(run_dir, data.outputs)

      with data.install_named_caches(run_dir, result['stats']['named_caches']):
        sys.stdout.flush()
        start = time.time()
        try:
          # Need to switch the default account before 'get_command_env' call,
          # so it can grab correct value of LUCI_CONTEXT env var.
          with set_luci_context_account(data.switch_to_account, tmp_dir):
            env = get_command_env(
                tmp_dir, cipd_info, run_dir, data.env, data.env_prefix, out_dir,
                data.bot_file)
            command = tools.find_executable(command, env)
            command = process_command(command, out_dir, data.bot_file)
            file_path.ensure_command_has_abs_path(command, cwd)

            result['exit_code'], result['had_hard_timeout'] = run_command(
                command, cwd, env, data.hard_timeout, data.grace_period,
                data.lower_priority, data.containment)
        finally:
          result['duration'] = max(time.time() - start, 0)

      if out_dir:
        # Try to link files to the output directory, if specified.
        link_outputs_to_outdir(run_dir, out_dir, data.outputs)
        isolated_stats = result['stats'].setdefault('isolated', {})
        if use_cas:
          result['cas_output_root'], isolated_stats['upload'] = (
              upload_outdir(cas_client, data.cas_instance, out_dir,
                            tmp_dir))

    # We successfully ran the command, set internal_failure back to
    # None (even if the command failed, it's not an internal error).
    result['internal_failure'] = None
  except Exception as e:
    # An internal error occurred. Report accordingly so the swarming task will
    # be retried automatically.
    logging.exception('internal failure: %s', e)
    result['internal_failure'] = str(e)
    on_error.report(None)

  # Clean up
  finally:
    try:
      cleanup_start = time.time()
      success = True
      if data.leak_temp_dir:
        logging.warning(
            'Deliberately leaking %s for later examination', run_dir)
      else:
        # On Windows rmtree(run_dir) has a synchronization effect: it
        # finishes only when all task child processes terminate (since a
        # running process locks *.exe file). run_dir is therefore removed
        # first, before out_dir (child processes may write to out_dir too and
        # we need to wait for them to finish).
        dirs_to_remove = [run_dir, tmp_dir, cas_client_dir]
        if out_dir:
          dirs_to_remove.append(out_dir)
        for directory in dirs_to_remove:
          if not fs.isdir(directory):
            continue
          start = time.time()
          try:
            file_path.rmtree(directory)
          except OSError as e:
            logging.error('rmtree(%r) failed: %s', directory, e)
            success = False
          finally:
            logging.info('Cleanup: rmtree(%r) took %d seconds', directory,
                         time.time() - start)
          if not success:
            # Dump the process table to help find whatever is still holding
            # on to the directory.
            sys.stderr.write(
                OUTLIVING_ZOMBIE_MSG % (directory, data.grace_period))
            if sys.platform == 'win32':
              subprocess42.check_call(['tasklist.exe', '/V'], stdout=sys.stderr)
            else:
              subprocess42.check_call(['ps', 'axu'], stdout=sys.stderr)
            if result['exit_code'] == 0:
              result['exit_code'] = 1

      if not success and result['exit_code'] == 0:
        result['exit_code'] = 1
    except Exception as e:
      # Swallow any exception in the main finally clause.
      if out_dir:
        logging.exception('Leaking out_dir %s: %s', out_dir, e)
      result['internal_failure'] = str(e)
      on_error.report(None)
    finally:
      cleanup_duration = time.time() - cleanup_start
      result['stats']['cleanup']['duration'] = cleanup_duration
      logging.info('Cleanup: removing directories took %d seconds',
                   cleanup_duration)
  return result
Marc-Antoine Ruel2283ad12014-02-09 11:14:57 -05001025
1026
def run_tha_test(data, result_json):
  """Runs the task through map_and_run() and reports its outcome.

  When |result_json| is set, a placeholder result is written there before the
  task starts (so something exists even if this process gets killed) and the
  real result replaces it afterwards. Otherwise, a result that carries an
  'outputs_ref' is printed to stdout in the legacy
  [run_isolated_out_hack] format.

  Arguments:
  - data: TaskData instance.
  - result_json: File path to dump result metadata into. If set, the process
      exit code is always 0 unless an internal error occurred.

  Returns:
    Process exit code that should be used.
  """
  if result_json:
    # Write a json output file right away in case we get killed.
    placeholder = {
        'exit_code': None,
        'had_hard_timeout': False,
        'internal_failure': 'Was terminated before completion',
        'outputs_ref': None,
        'cas_output_root': None,
        'version': 5,
    }
    tools.write_json(result_json, placeholder, dense=True)

  # run_isolated exit code. Depends on if result_json is used or not.
  result = map_and_run(data, True)
  logging.info('Result:\n%s', tools.format_json(result, dense=True))

  internal_error_code = int(bool(result['internal_failure']))

  if result_json:
    # We've found tests to delete 'work' when quitting, causing an exception
    # here. Try to recreate the directory if necessary.
    file_path.ensure_tree(os.path.dirname(result_json))
    tools.write_json(result_json, result, dense=True)
    # Only return 1 if there was an internal error.
    return internal_error_code

  # Marshall into old-style inline output.
  outputs_ref = result['outputs_ref']
  if outputs_ref:
    # pylint: disable=unsubscriptable-object
    inline_output = {
        'hash': outputs_ref['isolated'],
        'namespace': outputs_ref['namespace'],
        'storage': outputs_ref['isolatedserver'],
    }
    sys.stdout.flush()
    print('[run_isolated_out_hack]%s[/run_isolated_out_hack]' %
          tools.format_json(inline_output, dense=True))
    sys.stdout.flush()
  return result['exit_code'] or internal_error_code
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001083
1084
# Yielded by 'install_client_and_packages'. Fields:
# - client: cipd.CipdClient object.
# - cache_dir: absolute path to bot-global cipd tag and instance cache.
# - stats: dict with stats to return to the server.
# - pins: dict with installed cipd pins to return to the server.
CipdInfo = collections.namedtuple(
    'CipdInfo', ('client', 'cache_dir', 'stats', 'pins'))
1092
1093
@contextlib.contextmanager
def copy_local_packages(_run_dir, cas_dir, _nsjail_dir):
  """Copies the cas client from a local luci-go checkout instead of CIPD.

  The binary is read from the directory named by the LUCI_GO_CLIENT_DIR
  environment variable and copied into |cas_dir|. The other two arguments are
  unused. Yields None, i.e. there is no CipdInfo in this mode.
  """
  go_client_dir = os.environ.get('LUCI_GO_CLIENT_DIR')
  assert go_client_dir, ('Please set LUCI_GO_CLIENT_DIR env var to install CIPD'
                         ' packages locally.')
  cas_binary = 'cas' + cipd.EXECUTABLE_SUFFIX
  shutil.copy2(
      os.path.join(go_client_dir, cas_binary),
      os.path.join(cas_dir, cas_binary))
  yield None
1103
1104
Takuto Ikuta2efc7792019-11-27 14:33:34 +00001105def _install_packages(run_dir, cipd_cache_dir, client, packages):
iannuccib58d10d2017-03-18 02:00:25 -07001106 """Calls 'cipd ensure' for packages.
1107
1108 Args:
1109 run_dir (str): root of installation.
1110 cipd_cache_dir (str): the directory to use for the cipd package cache.
1111 client (CipdClient): the cipd client to use
1112 packages: packages to install, list [(path, package_name, version), ...].
iannuccib58d10d2017-03-18 02:00:25 -07001113
1114 Returns: list of pinned packages. Looks like [
1115 {
1116 'path': 'subdirectory',
1117 'package_name': 'resolved/package/name',
1118 'version': 'deadbeef...',
1119 },
1120 ...
1121 ]
1122 """
1123 package_pins = [None]*len(packages)
1124 def insert_pin(path, name, version, idx):
1125 package_pins[idx] = {
1126 'package_name': name,
1127 # swarming deals with 'root' as '.'
1128 'path': path or '.',
1129 'version': version,
1130 }
1131
1132 by_path = collections.defaultdict(list)
1133 for i, (path, name, version) in enumerate(packages):
1134 # cipd deals with 'root' as ''
1135 if path == '.':
1136 path = ''
1137 by_path[path].append((name, version, i))
1138
1139 pins = client.ensure(
Takuto Ikuta2efc7792019-11-27 14:33:34 +00001140 run_dir,
1141 {
1142 subdir: [(name, vers) for name, vers, _ in pkgs
1143 ] for subdir, pkgs in by_path.items()
1144 },
1145 cache_dir=cipd_cache_dir,
iannuccib58d10d2017-03-18 02:00:25 -07001146 )
1147
Marc-Antoine Ruel04903a32019-10-09 21:09:25 +00001148 for subdir, pin_list in sorted(pins.items()):
iannuccib58d10d2017-03-18 02:00:25 -07001149 this_subdir = by_path[subdir]
1150 for i, (name, version) in enumerate(pin_list):
1151 insert_pin(subdir, name, version, this_subdir[i][2])
1152
Robert Iannucci461b30d2017-12-13 11:34:03 -08001153 assert None not in package_pins, (packages, pins, package_pins)
iannuccib58d10d2017-03-18 02:00:25 -07001154
1155 return package_pins
1156
1157
@contextlib.contextmanager
def install_client_and_packages(run_dir, packages, service_url,
                                client_package_name, client_version, cache_dir,
                                cas_dir, nsjail_dir):
  """Bootstraps CIPD client and installs CIPD packages.

  Yields a single CipdInfo object carrying the CipdClient, the cipd cache
  directory, timing stats and the pins.

  Pins and the CIPD client info are in the form of:
    [
      {
        "path": path, "package_name": package_name, "version": version,
      },
      ...
    ]
  (the CIPD client info is a single dictionary instead of a list)

  such that they correspond 1:1 to all input package arguments from the command
  line. These dictionaries make their way all the way back to swarming, where
  they become the arguments of CipdPackage.

  If 'packages' list is empty, will bootstrap CIPD client, but won't install
  any packages. The cas client is always installed into |cas_dir|.

  The bootstrapped client (regardless whether 'packages' list is empty or not),
  will be made available to the task via $PATH.

  Args:
    run_dir (str): root of installation.
    packages: packages to install, list [(path, package_name, version), ...].
    service_url (str): CIPD server url, e.g.
      "https://chrome-infra-packages.appspot.com."
    client_package_name (str): CIPD package name of CIPD client.
    client_version (str): Version of CIPD client.
    cache_dir (str): where to keep cache of cipd clients, packages and tags.
    cas_dir (str): where to download cas client.
    nsjail_dir (str): where to download nsjail. If set to None, nsjail is not
      downloaded.
  """
  assert cache_dir

  start = time.time()

  cache_dir = os.path.abspath(cache_dir)
  # tag and instance caches
  cipd_cache_dir = os.path.join(cache_dir, 'cache')
  run_dir = os.path.abspath(run_dir)
  packages = packages or []

  get_client_start = time.time()
  client_manager = cipd.get_client(cache_dir, service_url, client_package_name,
                                   client_version)

  with client_manager as client:
    get_client_duration = time.time() - get_client_start

    if packages:
      package_pins = _install_packages(run_dir, cipd_cache_dir, client,
                                       packages)
    else:
      package_pins = []

    # Install cas client to |cas_dir|.
    cas_package = ('', _CAS_PACKAGE, _LUCI_GO_REVISION)
    _install_packages(cas_dir, cipd_cache_dir, client, [cas_package])

    # Install nsjail to |nsjail_dir|.
    if nsjail_dir is not None:
      nsjail_package = ('', _NSJAIL_PACKAGE, _NSJAIL_VERSION)
      _install_packages(nsjail_dir, cipd_cache_dir, client, [nsjail_package])

    file_path.make_tree_files_read_only(run_dir)

    total_duration = time.time() - start
    logging.info('Installing CIPD client and packages took %d seconds',
                 total_duration)

    stats = {
        'duration': total_duration,
        'get_client_duration': get_client_duration,
    }
    pins = {
        'client_package': {
            'package_name': client.package_name,
            'version': client.instance_id,
        },
        'packages': package_pins,
    }
    yield CipdInfo(
        client=client, cache_dir=cipd_cache_dir, stats=stats, pins=pins)
nodirbe642ff2016-06-09 15:51:51 -07001247
1248
def create_option_parser():
  """Builds the command line parser for run_isolated.

  Registers the general options, then one option group per concern (isolate
  server, RBE-CAS, named caches, process containment, debugging) and finally
  the cache, CIPD and auth options contributed by the helper modules.

  Returns:
    The configured logging_utils.OptionParserWithLogging instance, with the
    default of the 'cache' option set to 'cache'.
  """
  parser = logging_utils.OptionParserWithLogging(
      usage='%prog <options> [command to run or extra args]',
      version=__version__,
      log_file=RUN_ISOLATED_LOG_FILE)
  parser.add_option(
      '--clean',
      action='store_true',
      help='Cleans the cache, trimming it necessary and remove corrupted items '
      'and returns without executing anything; use with -v to know what '
      'was done')
  parser.add_option(
      '--json',
      help='dump output metadata to json file. When used, run_isolated returns '
      'non-zero only on internal failure')
  parser.add_option(
      '--hard-timeout', type='float', help='Enforce hard timeout in execution')
  parser.add_option(
      '--grace-period',
      type='float',
      help='Grace period between SIGTERM and SIGKILL')
  parser.add_option(
      '--relative-cwd',
      help='Ignore the isolated \'relative_cwd\' and use this one instead')
  parser.add_option(
      '--env',
      default=[],
      action='append',
      help='Environment variables to set for the child process')
  parser.add_option(
      '--env-prefix',
      default=[],
      action='append',
      help='Specify a VAR=./path/fragment to put in the environment variable '
      'before executing the command. The path fragment must be relative '
      'to the isolated run directory, and must not contain a `..` token. '
      'The path will be made absolute and prepended to the indicated '
      '$VAR using the OS\'s path separator. Multiple items for the same '
      '$VAR will be prepended in order.')
  parser.add_option(
      '--bot-file',
      help='Path to a file describing the state of the host. The content is '
      'defined by on_before_task() in bot_config.')
  parser.add_option(
      '--switch-to-account',
      help='If given, switches LUCI_CONTEXT to given logical service account '
      '(e.g. "task" or "system") before launching the isolated process.')
  parser.add_option(
      '--output',
      action='append',
      help='Specifies an output to return. If no outputs are specified, all '
      'files located in $(ISOLATED_OUTDIR) will be returned; '
      'otherwise, outputs in both $(ISOLATED_OUTDIR) and those '
      'specified by --output option (there can be multiple) will be '
      'returned. Note that if a file in OUT_DIR has the same path '
      'as an --output option, the --output version will be returned.')
  parser.add_option(
      '-a',
      '--argsfile',
      # This is actually handled in parse_args; it's included here purely so it
      # can make it into the help text.
      help='Specify a file containing a JSON array of arguments to this '
      'script. If --argsfile is provided, no other argument may be '
      'provided on the command line.')
  parser.add_option(
      '--report-on-exception',
      action='store_true',
      help='Whether report exception during execution to isolate server. '
      'This flag should only be used in swarming bot.')

  group = optparse.OptionGroup(parser, 'Data source - Isolate server')
  # Deprecated. Isolate server is being migrated to RBE-CAS.
  # Remove --isolated and isolate server options after migration.
  group.add_option(
      '-s', '--isolated',
      help='Hash of the .isolated to grab from the isolate server.')
  isolateserver.add_isolate_server_options(group)
  parser.add_option_group(group)

  group = optparse.OptionGroup(parser,
                               'Data source - Content Addressed Storage')
  group.add_option(
      '--cas-instance', help='Full CAS instance name for input/output files.')
  group.add_option(
      '--cas-digest',
      help='Digest of the input root on RBE-CAS. The format is '
      '`{hash}/{size_bytes}`.')
  parser.add_option_group(group)

  # Cache options.
  isolateserver.add_cache_options(parser)
  add_cas_cache_options(parser)

  cipd.add_cipd_options(parser)

  group = optparse.OptionGroup(parser, 'Named caches')
  group.add_option(
      '--named-cache',
      dest='named_caches',
      action='append',
      nargs=3,
      default=[],
      help='A named cache to request. Accepts 3 arguments: name, path, hint. '
      'name identifies the cache, must match regex [a-z0-9_]{1,4096}. '
      'path is a path relative to the run dir where the cache directory '
      'must be put to. '
      'This option can be specified more than once.')
  group.add_option(
      '--named-cache-root',
      default='named_caches',
      help='Cache root directory. Default=%default')
  parser.add_option_group(group)

  # These options are registered on the group (not directly on the parser) so
  # that they are listed under the 'Process containment' heading in --help.
  # Parsing is unaffected: grouped options share the parser's namespace.
  group = optparse.OptionGroup(parser, 'Process containment')
  group.add_option(
      '--lower-priority', action='store_true',
      help='Lowers the child process priority')
  group.add_option(
      '--containment-type',
      choices=('NONE', 'AUTO', 'JOB_OBJECT', 'NSJAIL'),
      default='NONE',
      help='Type of container to use')
  group.add_option(
      '--limit-processes',
      type='int',
      default=0,
      help='Maximum number of active processes in the containment')
  group.add_option(
      '--limit-total-committed-memory',
      type='int',
      default=0,
      help='Maximum sum of committed memory in the containment')
  parser.add_option_group(group)

  group = optparse.OptionGroup(parser, 'Debugging')
  group.add_option(
      '--leak-temp-dir',
      action='store_true',
      help='Deliberately leak isolate\'s temp dir for later examination. '
      'Default: %default')
  group.add_option('--root-dir', help='Use a directory instead of a random one')
  parser.add_option_group(group)

  auth.add_auth_options(parser)

  parser.set_defaults(cache='cache')
  return parser
1396
1397
def add_cas_cache_options(parser):
  """Registers the 'CAS cache management' option group on |parser|.

  Adds --cas-cache (default 'cas-cache') and --kvs-dir (default '').
  """
  cas_group = optparse.OptionGroup(parser, 'CAS cache management')
  # (flags, keyword arguments) for each option, in display order.
  option_specs = (
      (
          ('--cas-cache',),
          {
              'metavar': 'DIR',
              'default': 'cas-cache',
              'help': 'Directory to keep a local cache of the files. '
                      'Accelerates download '
                      'by reusing already downloaded files. Default=%default',
          },
      ),
      (
          ('--kvs-dir',),
          {
              'default': '',
              'help': 'CAS cache dir using kvs for small files. '
                      'Default=%default',
          },
      ),
  )
  for flags, kwargs in option_specs:
    cas_group.add_option(*flags, **kwargs)
  parser.add_option_group(cas_group)
1411
1412
def process_cas_cache_options(options):
  """Returns the content addressed cache selected by --cas-cache.

  When options.cas_cache is empty a MemoryContentAddressedCache is returned;
  otherwise a DiskContentAddressedCache rooted at the absolute form of that
  directory is created with trim=False.
  """
  if not options.cas_cache:
    return local_caching.MemoryContentAddressedCache()

  cache_policies = local_caching.CachePolicies(
      max_cache_size=options.max_cache_size,
      min_free_space=options.min_free_space,
      # max_items isn't used for CAS cache for now.
      max_items=None,
      max_age_secs=MAX_AGE_SECS)
  cache_dir = six.text_type(os.path.abspath(options.cas_cache))
  return local_caching.DiskContentAddressedCache(
      cache_dir, cache_policies, trim=False)
1425
1426
def process_named_cache_options(parser, options, time_fn=None):
  """Validates the named cache options and builds the named cache.

  Every (name, path, hint) triple in options.named_caches is checked; any
  violation is reported through parser.error().

  Returns:
    A local_caching.NamedCache rooted at options.named_cache_root, or None when
    no root directory is configured.
  """
  requested = options.named_caches
  if requested and not options.named_cache_root:
    parser.error('--named-cache is specified, but --named-cache-root is empty')

  for cache_name, cache_path, cache_hint in requested:
    if CACHE_NAME_RE.match(cache_name) is None:
      parser.error(
          'cache name %r does not match %r' % (cache_name,
                                               CACHE_NAME_RE.pattern))
    if not cache_path:
      parser.error('cache path cannot be empty')
    try:
      int(cache_hint)
    except ValueError:
      parser.error('cache hint must be a number')

  if not options.named_cache_root:
    return None

  # Make these configurable later if there is use case but for now it's fairly
  # safe values.
  # In practice, a fair chunk of bots are already recycled on a daily schedule
  # so this code doesn't have any effect to them, unless they are preloaded
  # with a really old cache.
  one_tib = 1024 * 1024 * 1024 * 1024
  policies = local_caching.CachePolicies(
      max_cache_size=one_tib,
      min_free_space=options.min_free_space,
      max_items=50,
      max_age_secs=MAX_AGE_SECS)
  root_dir = six.text_type(os.path.abspath(options.named_cache_root))
  named_cache = local_caching.NamedCache(root_dir, policies, time_fn=time_fn)
  # Touch any named caches we're going to use to minimize thrashing
  # between tasks that request some (but not all) of the same named caches.
  named_cache.touch(*[entry[0] for entry in options.named_caches])
  return named_cache
1460
1461
def parse_args(args):
  """Parses the command line, honoring --argsfile.

  When -a/--argsfile is given, it must be the only argument; the named file is
  loaded as JSON and its content replaces |args| before regular parsing.

  Args:
    args: list of command line arguments, without the program name.

  Returns:
    Tuple (parser, options, args) where parser is the object returned by
    create_option_parser(), and options/args are the result of its
    parse_args() call. options.cipd_enabled is converted with
    distutils.util.strtobool() when it is neither a bool nor an int.
  """
  # Create a fake mini-parser just to get out the "-a" command. Note that
  # it's not documented here; instead, it's documented in create_option_parser
  # even though that parser will never actually get to parse it. This is
  # because --argsfile is exclusive with all other options and arguments.
  file_argparse = argparse.ArgumentParser(add_help=False)
  file_argparse.add_argument('-a', '--argsfile')
  (file_args, nonfile_args) = file_argparse.parse_known_args(args)
  if file_args.argsfile:
    if nonfile_args:
      # The trailing space matters: the two literals are concatenated.
      file_argparse.error('Can\'t specify --argsfile with '
                          'any other arguments (%s)' % nonfile_args)
    try:
      with open(file_args.argsfile, 'r') as f:
        args = json.load(f)
    except (IOError, OSError, ValueError) as e:
      # We don't error out here: "args" keeps its original value (the
      # --argsfile flag itself) and is handed to the regular parser below.
      print('Couldn\'t read arguments: %s' % e, file=sys.stderr)

  # Even if we failed to read the args, just call the normal parser now so the
  # usual option handling and error reporting apply.
  parser = create_option_parser()
  options, args = parser.parse_args(args)
  if not isinstance(options.cipd_enabled, (bool, int)):
    options.cipd_enabled = distutils.util.strtobool(options.cipd_enabled)
  return (parser, options, args)
1490
1491
def _calc_named_cache_hint(named_cache, named_caches):
  """Returns the expected size of the missing named caches.

  Args:
    named_cache: object exposing the names of the caches already present
      through its 'available' attribute, or None when no named cache is
      configured.
    named_caches: iterable of (name, path, hint) triples; hint must be
      convertible with int().

  Returns:
    The sum of the positive hints of the requested caches whose name is not
    in named_cache.available; 0 when named_cache is None.
  """
  if named_cache is None:
    # No named cache root was configured, so there is nothing to reserve.
    return 0
  present = named_cache.available
  size = 0
  logging.info('available named cache %s', present)
  for name, _, hint in named_caches:
    if name not in present:
      hint = int(hint)
      # Non-positive hints carry no size information and are ignored.
      if hint > 0:
        logging.info("named cache hint: %s, %d", name, hint)
        size += hint
  logging.info("total size of named cache hint: %d", size)
  return size
1505
1506
def _clean_cmd(parser, options, caches, root):
  """Cleanup cache dirs/files.

  Rejects, through parser.error(), the options that make no sense together
  with --clean. Then removes the kvs directory when its recursive size reached
  _CAS_KVS_CACHE_THRESHOLD, trims |caches| and finally calls cleanup() on each
  of them. Free space of |root| is logged between the steps.

  Args:
    parser: option parser used to report invalid option combinations.
    options: parsed command line options.
    caches: list of cache objects to trim and clean up.
    root: directory whose free space is measured.
  """
  if options.isolated:
    parser.error('Can\'t use --isolated with --clean.')
  if options.isolate_server:
    parser.error('Can\'t use --isolate-server with --clean.')
  if options.json:
    parser.error('Can\'t use --json with --clean.')
  if options.named_caches:
    parser.error('Can\'t use --named-cache with --clean.')
  if options.cas_instance or options.cas_digest:
    parser.error('Can\'t use --cas-instance, --cas-digest with --clean.')

  logging.info("initial free space: %d", file_path.get_free_space(root))

  if options.kvs_dir and fs.isdir(six.text_type(options.kvs_dir)):
    # Remove kvs file if its size exceeds fixed threshold.
    kvs_dir = six.text_type(options.kvs_dir)
    size = file_path.get_recursive_size(kvs_dir)
    if size >= _CAS_KVS_CACHE_THRESHOLD:
      logging.info("remove kvs dir with size: %d", size)
      file_path.rmtree(kvs_dir)

  # Trim first, then clean.
  local_caching.trim_caches(
      caches,
      root,
      min_free_space=options.min_free_space,
      max_age_secs=MAX_AGE_SECS)
  logging.info("free space after trim: %d", file_path.get_free_space(root))
  for c in caches:
    c.cleanup()
  logging.info("free space after cleanup: %d", file_path.get_free_space(root))
1540
1541
def main(args):
  """Entry point: parses |args|, prepares the caches and runs the command.

  With --clean, the caches are trimmed/cleaned and nothing is executed.
  Otherwise the options are validated, a TaskData is assembled and handed to
  run_tha_test().

  Args:
    args: list of command line arguments, without the program name.

  Returns:
    0 after --clean; otherwise the value returned by run_tha_test(), or 1 when
    a cipd.Error, local_caching.NamedCacheError or local_caching.NoMoreSpace
    is caught.
  """
  # Warning: when --argsfile is used, the strings are unicode instances, when
  # parsed normally, the strings are str instances.
  (parser, options, args) = parse_args(args)

  # Must be logged after parse_args(), which eventually calls
  # logging_utils.prepare_logging() which expects no logs before its call.
  logging.info('Starting run_isolated script')

  SWARMING_SERVER = os.environ.get('SWARMING_SERVER')
  SWARMING_TASK_ID = os.environ.get('SWARMING_TASK_ID')
  if options.report_on_exception and SWARMING_SERVER:
    task_url = None
    if SWARMING_TASK_ID:
      task_url = '%s/task?id=%s' % (SWARMING_SERVER, SWARMING_TASK_ID)
    on_error.report_on_exception_exit(SWARMING_SERVER, source=task_url)

  if not file_path.enable_symlink():
    logging.warning('Symlink support is not enabled')

  named_cache = process_named_cache_options(parser, options)
  # hint is 0 if there's no named cache (process_named_cache_options returns
  # None when --named-cache-root is empty).
  hint = 0
  if named_cache is not None:
    hint = _calc_named_cache_hint(named_cache, options.named_caches)
  if hint:
    # Increase the --min-free-space value by the hint, and recreate the
    # NamedCache instance so it gets the updated CachePolicy.
    options.min_free_space += hint
    named_cache = process_named_cache_options(parser, options)

  # TODO(maruel): CIPD caches should be defined at an higher level here too, so
  # they can be cleaned the same way.

  isolate_cache = isolateserver.process_cache_options(options, trim=False)
  cas_cache = process_cas_cache_options(options)

  caches = []
  if isolate_cache:
    caches.append(isolate_cache)
  if cas_cache:
    caches.append(cas_cache)
  if named_cache:
    caches.append(named_cache)
  root = caches[0].cache_dir if caches else six.text_type(os.getcwd())
  if options.clean:
    _clean_cmd(parser, options, caches, root)
    return 0

  # Trim must still be done for the following case:
  # - named-cache was used
  # - some entries, with a large hint, were missing
  # - --min-free-space was increased accordingly, thus trimming is needed
  # Otherwise, this will have no effect, as bot_main calls run_isolated with
  # --clean after each task.
  additional_buffer = _FREE_SPACE_BUFFER_FOR_CIPD_PACKAGES
  if options.kvs_dir:
    additional_buffer += _CAS_KVS_CACHE_THRESHOLD
  # Add some buffer for Go CLI.
  min_free_space = options.min_free_space + additional_buffer

  def trim_caches_fn(stats):
    # Trims all caches and records how long it took in stats['duration'].
    start = time.time()
    local_caching.trim_caches(
        caches, root, min_free_space=min_free_space, max_age_secs=MAX_AGE_SECS)
    duration = time.time() - start
    stats['duration'] = duration
    logging.info('trim_caches: took %d seconds', duration)

  # Save state of cas cache not to overwrite state from go client.
  if cas_cache:
    cas_cache.save()
    cas_cache = None

  if not args:
    parser.error('command to run is required.')

  auth.process_auth_options(parser, options)

  isolateserver.process_isolate_server_options(parser, options, False)
  if ISOLATED_OUTDIR_PARAMETER in args and (not options.isolate_server and
                                            not options.cas_instance):
    parser.error('%s in args requires --isolate-server or --cas-instance' %
                 ISOLATED_OUTDIR_PARAMETER)

  if options.isolated and not options.isolate_server:
    parser.error('--isolated requires --isolate-server')

  if options.root_dir:
    options.root_dir = six.text_type(os.path.abspath(options.root_dir))
  else:
    options.root_dir = six.text_type(tempfile.mkdtemp(prefix='root'))
  if options.json:
    options.json = six.text_type(os.path.abspath(options.json))

  if any('=' not in i for i in options.env):
    parser.error(
        '--env required key=value form. value can be skipped to delete '
        'the variable')
  options.env = dict(i.split('=', 1) for i in options.env)

  # Group the --env-prefix paths per variable, preserving command line order.
  prefixes = {}
  cwd = os.path.realpath(os.getcwd())
  for item in options.env_prefix:
    if '=' not in item:
      parser.error(
          '--env-prefix %r is malformed, must be in the form `VAR=./path`'
          % item)
    key, opath = item.split('=', 1)
    if os.path.isabs(opath):
      parser.error('--env-prefix %r path is bad, must be relative.' % opath)
    opath = os.path.normpath(opath)
    if not os.path.realpath(os.path.join(cwd, opath)).startswith(cwd):
      parser.error(
          '--env-prefix %r path is bad, must be relative and not contain `..`.'
          % opath)
    prefixes.setdefault(key, []).append(opath)
  options.env_prefix = prefixes

  cipd.validate_cipd_options(parser, options)

  install_packages_fn = copy_local_packages
  tmp_cipd_cache_dir = None
  if options.cipd_enabled:
    cache_dir = options.cipd_cache
    if not cache_dir:
      # No CIPD cache configured: use a temporary one, removed in the
      # 'finally' clause at the end of this function.
      tmp_cipd_cache_dir = six.text_type(tempfile.mkdtemp())
      cache_dir = tmp_cipd_cache_dir
    install_packages_fn = (
        lambda run_dir, cas_dir, nsjail_dir: install_client_and_packages(
            run_dir,
            cipd.parse_package_args(options.cipd_packages),
            options.cipd_server,
            options.cipd_client_package,
            options.cipd_client_version,
            cache_dir=cache_dir,
            cas_dir=cas_dir,
            nsjail_dir=nsjail_dir,
        ))

  @contextlib.contextmanager
  def install_named_caches(run_dir, stats):
    # WARNING: this function depends on "options" variable defined in the outer
    # function.
    assert six.text_type(run_dir), repr(run_dir)
    assert os.path.isabs(run_dir), run_dir
    named_caches = [(os.path.join(run_dir, six.text_type(relpath)), name)
                    for name, relpath, _ in options.named_caches]
    install_start = time.time()
    for path, name in named_caches:
      named_cache.install(path, name)
    install_duration = time.time() - install_start
    stats['install']['duration'] = install_duration
    logging.info('named_caches: install took %d seconds', install_duration)
    try:
      yield
    finally:
      # Uninstall each named cache, returning it to the cache pool. If an
      # uninstall fails for a given cache, it will remain in the task's
      # temporary space, get cleaned up by the Swarming bot, and be lost.
      #
      # If the Swarming bot cannot clean up the cache, it will handle it like
      # any other bot file that could not be removed.
      uninstall_start = time.time()
      for path, name in reversed(named_caches):
        try:
          # uninstall() doesn't trim but does call save() implicitly. Trimming
          # *must* be done manually via periodic 'run_isolated.py --clean'.
          named_cache.uninstall(path, name)
        except local_caching.NamedCacheError:
          if sys.platform == 'win32':
            # Show running processes.
            sys.stderr.write("running process\n")
            subprocess42.check_call(['tasklist.exe', '/V'], stdout=sys.stderr)

          # The message reads "named cache <name> at <path>", so the values
          # must be passed in that order.
          error = (
              'Error while removing named cache %r at %r. The cache will be'
              ' lost.' % (name, path))
          logging.exception(error)
          on_error.report(error)
      uninstall_duration = time.time() - uninstall_start
      stats['uninstall']['duration'] = uninstall_duration
      logging.info('named_caches: uninstall took %d seconds',
                   uninstall_duration)

  command = args
  if options.relative_cwd:
    a = os.path.normpath(os.path.abspath(options.relative_cwd))
    if not a.startswith(os.getcwd()):
      parser.error(
          '--relative-cwd must not try to escape the working directory')

  containment_type = subprocess42.Containment.NONE
  if options.containment_type == 'AUTO':
    containment_type = subprocess42.Containment.AUTO
  if options.containment_type == 'JOB_OBJECT':
    containment_type = subprocess42.Containment.JOB_OBJECT
  if options.containment_type == 'NSJAIL':
    containment_type = subprocess42.Containment.NSJAIL
  # TODO(https://crbug.com/1227833): This object should eventually contain the
  # path to the nsjail binary and the nsjail configuration file.
  containment = subprocess42.Containment(
      containment_type=containment_type,
      limit_processes=options.limit_processes,
      limit_total_committed_memory=options.limit_total_committed_memory)

  data = TaskData(
      command=command,
      relative_cwd=options.relative_cwd,
      isolated_hash=options.isolated,
      storage=None,
      isolate_cache=isolate_cache,
      cas_instance=options.cas_instance,
      cas_digest=options.cas_digest,
      outputs=options.output,
      install_named_caches=install_named_caches,
      leak_temp_dir=options.leak_temp_dir,
      root_dir=_to_unicode(options.root_dir),
      hard_timeout=options.hard_timeout,
      grace_period=options.grace_period,
      bot_file=options.bot_file,
      switch_to_account=options.switch_to_account,
      install_packages_fn=install_packages_fn,
      cas_cache_dir=options.cas_cache,
      cas_cache_policies=local_caching.CachePolicies(
          max_cache_size=options.max_cache_size,
          min_free_space=options.min_free_space,
          max_items=None,
          max_age_secs=None,
      ),
      cas_kvs=options.kvs_dir,
      env=options.env,
      env_prefix=options.env_prefix,
      lower_priority=bool(options.lower_priority),
      containment=containment,
      trim_caches_fn=trim_caches_fn)
  try:
    return run_tha_test(data, options.json)
  except (cipd.Error, local_caching.NamedCacheError,
          local_caching.NoMoreSpace) as ex:
    # Exceptions have no 'message' attribute on Python 3 unless the class
    # defines one, so fall back to the text form of the exception.
    print(getattr(ex, 'message', None) or six.text_type(ex), file=sys.stderr)
    on_error.report(None)
    return 1
  finally:
    if tmp_cipd_cache_dir is not None:
      try:
        file_path.rmtree(tmp_cipd_cache_dir)
      except OSError:
        logging.exception('Remove tmp_cipd_cache_dir=%s failed',
                          tmp_cipd_cache_dir)
        # Best effort clean up. Failed to do so doesn't affect the outcome.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001791
1792
if __name__ == '__main__':
  # Script entry point: set up the process-wide state, then run main() with
  # the command line arguments and exit with its return value.
  subprocess42.inhibit_os_error_reporting()
  # Ensure that we are always running with the correct encoding.
  fix_encoding.fix_encoding()
  # Identify this script and its version in the user agent.
  net.set_user_agent('run_isolated.py/' + __version__)
  sys.exit(main(sys.argv[1:]))
Marc-Antoine Ruel90c98162013-12-18 15:11:57 -05001798 sys.exit(main(sys.argv[1:]))