blob: 13927c7466bd8f36f147c6e831c977884a5410b6 [file] [log] [blame]
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001#!/usr/bin/env python
maruelea586f32016-04-05 11:11:33 -07002# Copyright 2012 The LUCI Authors. All rights reserved.
maruelf1f5e2a2016-05-25 17:10:39 -07003# Use of this source code is governed under the Apache License, Version 2.0
4# that can be found in the LICENSE file.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00005
nodir55be77b2016-05-03 09:39:57 -07006"""Runs a command with optional isolated input/output.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00007
run_isolated takes care of setting up a temporary environment, running a
command, and tearing it down.
nodir55be77b2016-05-03 09:39:57 -070010
Marc-Antoine Rueleed2f3a2019-03-14 00:00:40 +000011It handles downloading and uploading isolated files, mapping CIPD packages and
12reusing stateful named caches.
13
14The isolated files, CIPD packages and named caches are kept as a global LRU
15cache.
Marc-Antoine Ruel2283ad12014-02-09 11:14:57 -050016
Roberto Carrillo71ade6d2018-10-08 22:30:24 +000017Any ${EXECUTABLE_SUFFIX} on the command line or the environment variables passed
18with the --env option will be replaced with ".exe" string on Windows and "" on
19other platforms.
nodirbe642ff2016-06-09 15:51:51 -070020
Roberto Carrillo71ade6d2018-10-08 22:30:24 +000021Any ${ISOLATED_OUTDIR} on the command line or the environment variables passed
22with the --env option will be replaced by the location of a temporary directory
23upon execution of the command specified in the .isolated file. All content
24written to this directory will be uploaded upon termination and the .isolated
25file describing this directory will be printed to stdout.
bpastene447c1992016-06-20 15:21:47 -070026
Marc-Antoine Rueleed2f3a2019-03-14 00:00:40 +000027Any ${SWARMING_BOT_FILE} on the command line or the environment variables passed
28with the --env option will be replaced by the value of the --bot-file parameter.
29This file is used by a swarming bot to communicate state of the host to tasks.
30It is written to by the swarming bot's on_before_task() hook in the swarming
31server's custom bot_config.py.
32
Joanna Wang4cec0e42021-08-26 00:48:37 +000033Any ${SWARMING_TASK_ID} on the command line will be replaced by the
34SWARMING_TASK_ID value passed with the --env option.
35
Marc-Antoine Rueleed2f3a2019-03-14 00:00:40 +000036See
37https://chromium.googlesource.com/infra/luci/luci-py.git/+/master/appengine/swarming/doc/Magic-Values.md
38for all the variables.
39
40See
41https://chromium.googlesource.com/infra/luci/luci-py.git/+/master/appengine/swarming/swarming_bot/config/bot_config.py
42for more information about bot_config.py.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000043"""
44
Marc-Antoine Ruelf899c482019-10-10 23:32:06 +000045from __future__ import print_function
46
47__version__ = '1.0.1'
maruel@chromium.orgdedbf492013-09-12 20:42:11 +000048
aludwin7556e0c2016-10-26 08:46:10 -070049import argparse
maruel064c0a32016-04-05 11:47:15 -070050import base64
iannucci96fcccc2016-08-30 15:52:22 -070051import collections
vadimsh232f5a82017-01-20 19:23:44 -080052import contextlib
Ye Kuangfff1e502020-07-13 13:21:57 +000053import distutils
Sadaf Matinkhoo10743a62018-03-29 16:28:58 -040054import errno
aludwin7556e0c2016-10-26 08:46:10 -070055import json
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000056import logging
57import optparse
58import os
Takuto Ikuta5c59a842020-01-24 03:05:24 +000059import platform
Marc-Antoine Ruel8b11dbd2018-05-18 14:31:22 -040060import re
Junji Watanabedc2f89e2021-11-08 08:44:30 +000061import shutil
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000062import sys
63import tempfile
maruel064c0a32016-04-05 11:47:15 -070064import time
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000065
Marc-Antoine Ruel016c7602019-04-02 18:31:13 +000066from utils import tools
67tools.force_local_third_party()
vadimsh@chromium.orga4326472013-08-24 02:05:41 +000068
Marc-Antoine Ruel016c7602019-04-02 18:31:13 +000069# third_party/
70from depot_tools import fix_encoding
Takuto Ikuta6e2ff962019-10-29 12:35:27 +000071import six
Marc-Antoine Ruel016c7602019-04-02 18:31:13 +000072
73# pylint: disable=ungrouped-imports
Takuto Ikutad53d7bd2021-07-16 03:09:33 +000074import DEPS
Marc-Antoine Ruel016c7602019-04-02 18:31:13 +000075import auth
76import cipd
77import isolate_storage
78import isolateserver
79import local_caching
80from libs import luci_context
Vadim Shtayura6b555c12014-07-23 16:22:18 -070081from utils import file_path
maruel12e30012015-10-09 11:55:35 -070082from utils import fs
maruel064c0a32016-04-05 11:47:15 -070083from utils import large
Marc-Antoine Ruelf74cffe2015-07-15 15:21:34 -040084from utils import logging_utils
Ye Kuang2dd17442020-04-22 08:45:52 +000085from utils import net
Marc-Antoine Ruelcfb60852014-07-02 15:22:00 -040086from utils import on_error
Marc-Antoine Ruelc44f5722015-01-08 16:10:01 -050087from utils import subprocess42
maruel@chromium.orgdedbf492013-09-12 20:42:11 +000088
vadimsh@chromium.orga4326472013-08-24 02:05:41 +000089
# Magic variables that can be found in the isolate task command line. They are
# substituted by replace_parameters() before the command is run.
# Replaced by the output directory.
ISOLATED_OUTDIR_PARAMETER = '${ISOLATED_OUTDIR}'
# Replaced by cipd.EXECUTABLE_SUFFIX.
EXECUTABLE_SUFFIX_PARAMETER = '${EXECUTABLE_SUFFIX}'
# Replaced by the bot file path, when one is provided.
SWARMING_BOT_FILE_PARAMETER = '${SWARMING_BOT_FILE}'
# Replaced by the SWARMING_TASK_ID environment variable, when it is set.
SWARMING_TASK_ID_PARAMETER = '${SWARMING_TASK_ID}'


# The name of the log file to use.
RUN_ISOLATED_LOG_FILE = 'run_isolated.log'
99
maruele2f2cb82016-07-13 14:41:03 -0700100
# Use short names for temporary directories. This is driven by Windows, which
# imposes a relatively short maximum path length of 260 characters, often
# referred to as MAX_PATH. It is relatively easy to create files with longer
# path length. A use case is with recursive dependency trees like npm packages.
#
# It is recommended to start the script with a `root_dir` as short as
# possible.
# - ir stands for isolated_run
# - io stands for isolated_out
# - it stands for isolated_tmp
# - ic stands for isolated_client
# - cc stands for cas_client
# - ns stands for nsjail
ISOLATED_RUN_DIR = u'ir'
ISOLATED_OUT_DIR = u'io'
ISOLATED_TMP_DIR = u'it'
ISOLATED_CLIENT_DIR = u'ic'
_CAS_CLIENT_DIR = u'cc'
_NSJAIL_DIR = u'ns'
maruele2f2cb82016-07-13 14:41:03 -0700119
# TODO(tikuta): take these parameter from luci-config?
# Package names; versions are read from the first package entry of the matching
# dependency in DEPS.
_CAS_PACKAGE = 'infra/tools/luci/cas/${platform}'
_LUCI_GO_REVISION = DEPS.deps['luci-go']['packages'][0]['version']
_NSJAIL_PACKAGE = 'infra/3pp/tools/nsjail/${platform}'
_NSJAIL_VERSION = DEPS.deps['nsjail']['packages'][0]['version']

# Keep synced with task_request.py
# Accepts 1 to 4096 characters out of lowercase letters, digits and underscore.
CACHE_NAME_RE = re.compile(r'^[a-z0-9_]{1,4096}$')

# 2 GiB, expressed in bytes.
# NOTE(review): presumably extra free disk space reserved for CIPD packages;
# the code using it is not visible here -- confirm.
_FREE_SPACE_BUFFER_FOR_CIPD_PACKAGES = 2 * 1024 * 1024 * 1024
Marc-Antoine Ruel8b11dbd2018-05-18 14:31:22 -0400130
# Message template with two %s placeholders, in this order: the directory that
# could not be deleted, and the number of seconds a process has to comply after
# the termination signal was sent.
OUTLIVING_ZOMBIE_MSG = """\
*** Swarming tried multiple times to delete the %s directory and failed ***
*** Hard failing the task ***

Swarming detected that your testing script ran an executable, which may have
started a child executable, and the main script returned early, leaving the
children executables playing around unguided.

You don't want to leave children processes outliving the task on the Swarming
bot, do you? The Swarming bot doesn't.

How to fix?
- For any process that starts children processes, make sure all children
 processes terminated properly before each parent process exits. This is
 especially important in very deep process trees.
 - This must be done properly both in normal successful task and in case of
 task failure. Cleanup is very important.
- The Swarming bot sends a SIGTERM in case of timeout.
 - You have %s seconds to comply after the signal was sent to the process
 before the process is forcibly killed.
- To achieve not leaking children processes in case of signals on timeout, you
 MUST handle signals in each executable / python script and propagate them to
 children processes.
 - When your test script (python or binary) receives a signal like SIGTERM or
 CTRL_BREAK_EVENT on Windows), send it to all children processes and wait for
 them to terminate before quitting.

See
https://chromium.googlesource.com/infra/luci/luci-py.git/+/master/appengine/swarming/doc/Bot.md#Graceful-termination_aka-the-SIGTERM-and-SIGKILL-dance
for more information.

*** May the SIGKILL force be with you ***
"""
164
165
# Currently hardcoded. Eventually could be exposed as a flag once there's value.
# 3 weeks, expressed in seconds.
MAX_AGE_SECS = 21*24*60*60

# Size threshold in bytes.
# NOTE(review): presumably applies to the kvs cache used by the `cas` client;
# the code using it is not visible here -- confirm.
_CAS_KVS_CACHE_THRESHOLD = 5 * 1024 * 1024 * 1024 # 5 GiB
171
# Immutable record bundling the parameters describing one task to run. Each
# field is documented inline below.
TaskData = collections.namedtuple(
    'TaskData',
    [
        # List of strings; the command line to use, independent of what was
        # specified in the isolated file.
        'command',
        # Relative directory to start command into.
        'relative_cwd',
        # Hash of the .isolated file that must be retrieved to recreate the tree
        # of files to run the target executable. The command specified in the
        # .isolated is executed. Mutually exclusive with command argument.
        'isolated_hash',
        # isolateserver.Storage instance to retrieve remote objects. This object
        # has a reference to an isolateserver.StorageApi, which does the actual
        # I/O.
        'storage',
        # isolateserver.LocalCache instance to keep from retrieving the same
        # objects constantly by caching the objects retrieved. Can be on-disk or
        # in-memory.
        'isolate_cache',
        # Digest of the input root on RBE-CAS.
        'cas_digest',
        # Full CAS instance name.
        'cas_instance',
        # List of paths relative to root_dir to put into the output isolated
        # bundle upon task completion (see link_outputs_to_outdir).
        'outputs',
        # Function (run_dir) => context manager that installs named caches into
        # |run_dir|.
        'install_named_caches',
        # If True, the temporary directory will be deliberately leaked for later
        # examination.
        'leak_temp_dir',
        # Path to the directory to use to create the temporary directory. If not
        # specified, a random temporary directory is created.
        'root_dir',
        # Kills the process if it lasts more than this amount of seconds.
        'hard_timeout',
        # Number of seconds to wait between SIGTERM and SIGKILL.
        'grace_period',
        # Path to a file with bot state, used in place of ${SWARMING_BOT_FILE}
        # task command line argument.
        'bot_file',
        # Logical account to switch LUCI_CONTEXT into.
        'switch_to_account',
        # Context manager dir => CipdInfo, see install_client_and_packages.
        'install_packages_fn',
        # Cache directory for `cas` client.
        'cas_cache_dir',
        # Parameters passed to `cas` client.
        'cas_cache_policies',
        # Parameters for kvs file used by `cas` client.
        'cas_kvs',
        # Environment variables to set.
        'env',
        # Environment variables to mutate with relative directories.
        # Example: {"ENV_KEY": ['relative', 'paths', 'to', 'prepend']}
        'env_prefix',
        # Lowers the task process priority.
        'lower_priority',
        # subprocess42.Containment instance. Can be None.
        'containment',
        # Function to trim caches before installing cipd packages and
        # downloading isolated files.
        'trim_caches_fn',
    ])
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -0500238
239
Marc-Antoine Ruelee6ca622017-11-29 11:19:16 -0500240def _to_str(s):
241 """Downgrades a unicode instance to str. Pass str through as-is."""
242 if isinstance(s, str):
243 return s
244 # This is technically incorrect, especially on Windows. In theory
245 # sys.getfilesystemencoding() should be used to use the right 'ANSI code
246 # page' on Windows, but that causes other problems, as the character set
247 # is very limited.
248 return s.encode('utf-8')
249
250
def _to_unicode(s):
  """Returns |s| as a text (unicode) object.

  Text instances and None are handed back untouched; any other value is decoded
  as UTF-8.
  """
  needs_decoding = not (isinstance(s, six.text_type) or s is None)
  if needs_decoding:
    return s.decode('utf-8')
  return s
256
257
def make_temp_dir(prefix, root_dir):
  """Creates a new unique temporary directory.

  Args:
    prefix: prefix of the directory name.
    root_dir: directory to create the new directory in.

  Returns:
    Path of the created directory, as a text (unicode) string.
  """
  created = tempfile.mkdtemp(dir=root_dir, prefix=prefix)
  return six.text_type(created)
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +0000261
262
@contextlib.contextmanager
def set_luci_context_account(account, tmp_dir):
  """Context manager that makes |account| the default LUCI_CONTEXT account.

  Nothing is changed in any of these cases:
  - |account| is None or '', i.e. run_isolated.py was called without the
    '--switch-to-account' flag. The task then inherits whatever account is
    already set in the surrounding LUCI_CONTEXT environment, if any. This may
    happen if users invoke run_isolated.py explicitly from their code.
  - LUCI_CONTEXT-based auth is not in use.
  - |account| is already the default account.

  When the requested account is not defined in the context, switches to
  non-authenticated access. This happens for Swarming tasks that don't use
  'task' service accounts.

  Args:
    account: logical account name to switch to; can be None or ''.
    tmp_dir: directory handed to luci_context.write() as _tmpdir.
  """
  # Only consult LUCI_CONTEXT when a switch was actually requested.
  local_auth = luci_context.read('local_auth') if account else None

  # See LUCI_CONTEXT.md for the format of 'local_auth'.
  if not local_auth or local_auth.get('default_account_id') == account:
    # Not switching, not using LUCI_CONTEXT auth at all, or already set.
    yield
    return

  known_ids = set(entry['id'] for entry in local_auth.get('accounts') or [])
  if account not in known_ids:
    logging.warning(
        'Requested LUCI_CONTEXT account %r is not available (have only %r), '
        'disabling authentication', account, sorted(known_ids))
    local_auth.pop('default_account_id', None)
  else:
    logging.info('Switching default LUCI_CONTEXT account to %r', account)
    local_auth['default_account_id'] = account

  with luci_context.write(_tmpdir=tmp_dir, local_auth=local_auth):
    yield
309
310
def process_command(command, out_dir, bot_file):
  """Substitutes the magic parameters in every argument of a command line.

  Args:
    command: list of command line arguments.
    out_dir: value substituted for ${ISOLATED_OUTDIR}.
    bot_file: value substituted for ${SWARMING_BOT_FILE}.

  Returns:
    A new list with the processed arguments, in the same order.

  Raises:
    ValueError if a parameter is requested in |command| but its value is not
    provided.
  """
  processed = []
  for argument in command:
    processed.append(replace_parameters(argument, out_dir, bot_file))
  return processed
Roberto Carrillo71ade6d2018-10-08 22:30:24 +0000318 return [replace_parameters(arg, out_dir, bot_file) for arg in command]
319
320
def replace_parameters(arg, out_dir, bot_file):
  """Expands the magic parameter tokens found in a single string.

  Args:
    arg: string that may contain parameter tokens.
    out_dir: value substituted for ${ISOLATED_OUTDIR}.
    bot_file: value substituted for ${SWARMING_BOT_FILE}; when falsy the token
        is left as-is and a warning is logged.

  Returns:
    The string with the tokens replaced.

  Raises:
    ValueError if a parameter is requested in |arg| but its value is not
    provided.
  """
  arg = arg.replace(EXECUTABLE_SUFFIX_PARAMETER, cipd.EXECUTABLE_SUFFIX)
  path_substituted = False

  if ISOLATED_OUTDIR_PARAMETER in arg:
    if not out_dir:
      raise ValueError(
          'output directory is requested in command or env var, but not '
          'provided; please specify one')
    arg = arg.replace(ISOLATED_OUTDIR_PARAMETER, out_dir)
    path_substituted = True

  if SWARMING_BOT_FILE_PARAMETER in arg:
    if not bot_file:
      logging.warning('SWARMING_BOT_FILE_PARAMETER found in command or env '
                      'var, but no bot_file specified. Leaving parameter '
                      'unchanged.')
    else:
      arg = arg.replace(SWARMING_BOT_FILE_PARAMETER, bot_file)
      path_substituted = True

  if SWARMING_TASK_ID_PARAMETER in arg:
    task_id = os.environ.get('SWARMING_TASK_ID')
    if task_id:
      arg = arg.replace(SWARMING_TASK_ID_PARAMETER, task_id)

  if not path_substituted:
    return arg
  # Slashes are converted only when a path parameter was expanded, because of
  # arguments like '${ISOLATED_OUTDIR}/foo/bar'.
  return arg.replace('/', os.sep)
353 return arg
maruela9cfd6f2015-09-15 11:03:15 -0700354
355
def set_temp_dir(env, tmp_dir):
  """Points the temp directory variables of |env| to |tmp_dir|.

  Args:
    env: dict of environment variables; modified in place.
    tmp_dir: path of the temporary directory.
  """
  tmp_dir = _to_str(tmp_dir)
  # pylint: disable=line-too-long
  # * python respects $TMPDIR, $TEMP, and $TMP in this order, regardless of
  #   platform. So $TMPDIR must be set on all platforms.
  #   https://github.com/python/cpython/blob/2.7/Lib/tempfile.py#L155
  # * TMPDIR is also specified as the POSIX standard envvar for the temp
  #   directory, so nothing else is needed on linux.
  #   http://pubs.opengroup.org/onlinepubs/9699919799/basedefs/V1_chap08.html
  #   * mktemp on linux respects $TMPDIR.
  #   * Chromium respects $TMPDIR on linux.
  #     https://cs.chromium.org/chromium/src/base/files/file_util_posix.cc?q=GetTempDir
  #   * Go uses $TMPDIR.
  #     https://go.googlesource.com/go/+/go1.10.3/src/os/file_unix.go#307
  names = ['TMPDIR']
  if sys.platform == 'win32':
    # * chromium's base utils uses GetTempPath().
    #   https://cs.chromium.org/chromium/src/base/files/file_util_win.cc?q=GetTempPath
    # * Go uses GetTempPath().
    # * GetTempDir() uses %TMP%, then %TEMP%, then other stuff. So %TMP% must be
    #   set.
    #   https://docs.microsoft.com/en-us/windows/desktop/api/fileapi/nf-fileapi-gettemppathw
    #   https://blogs.msdn.microsoft.com/oldnewthing/20150417-00/?p=44213
    names.extend(['TMP', 'TEMP'])
  elif sys.platform == 'darwin':
    # * Chromium uses an hack on macOS before calling into
    #   NSTemporaryDirectory().
    #   https://cs.chromium.org/chromium/src/base/files/file_util_mac.mm?q=GetTempDir
    #   https://developer.apple.com/documentation/foundation/1409211-nstemporarydirectory
    names.append('MAC_CHROMIUM_TMPDIR')

  for name in names:
    env[name] = tmp_dir
388 pass
389
Roberto Carrillo71ade6d2018-10-08 22:30:24 +0000390
def get_command_env(tmp_dir, cipd_info, run_dir, env, env_prefixes, out_dir,
                    bot_file):
  """Returns full OS environment to run a command in.

  Starts from a copy of os.environ, applies |env|, puts the directory holding
  the cipd binary in front of PATH, exposes CIPD_CACHE_DIR, installs all
  env_prefixes and finally sets up the temp directory variables.

  Args:
    tmp_dir: temp directory.
    cipd_info: CipdInfo object if cipd client is used, None if not.
    run_dir: The root directory the isolated tree is mapped in.
    env: environment variables to use; an empty value removes the variable.
    env_prefixes: {"ENV_KEY": ['cwd', 'relative', 'paths', 'to', 'prepend']}
    out_dir: Isolated output directory. Required to be != None if any of the
        env vars contain ISOLATED_OUTDIR_PARAMETER.
    bot_file: Required to be != None if any of the env vars contain
        SWARMING_BOT_FILE_PARAMETER.

  Returns:
    dict of environment variables.

  Raises:
    ValueError if an env var requests the output directory but |out_dir| is not
    provided.
  """
  out = os.environ.copy()
  for k, v in env.items():
    if not v:
      # An empty value is a request to drop the variable.
      out.pop(k, None)
    else:
      out[k] = replace_parameters(v, out_dir, bot_file)

  if cipd_info:
    bin_dir = os.path.dirname(cipd_info.client.binary_path)
    # PATH can be absent, either because the process environment has none or
    # because |env| removed it above; indexing out['PATH'] would raise KeyError.
    # An empty PATH is skipped too so no dangling separator is produced.
    path_entries = [_to_str(bin_dir)]
    inherited_path = out.get('PATH')
    if inherited_path:
      path_entries.append(inherited_path)
    out['PATH'] = os.pathsep.join(path_entries)
    out['CIPD_CACHE_DIR'] = _to_str(cipd_info.cache_dir)
    # Dump the resolved package pins to a file and expose its path to the task.
    cipd_info_path = os.path.join(tmp_dir, 'cipd_info.json')
    with open(cipd_info_path, 'w') as f:
      json.dump(cipd_info.pins, f)
    out['ISOLATED_RESOLVED_PACKAGE_VERSIONS_FILE'] = cipd_info_path

  for key, paths in env_prefixes.items():
    assert isinstance(paths, list), paths
    paths = [os.path.normpath(os.path.join(run_dir, p)) for p in paths]
    cur = out.get(key)
    if cur:
      # Keep the pre-existing value, after the prepended paths.
      paths.append(cur)
    out[key] = _to_str(os.path.pathsep.join(paths))

  set_temp_dir(out, tmp_dir)
  return out
Marc-Antoine Ruel19dd8872017-11-28 18:33:39 -0500434 return out
vadimsh232f5a82017-01-20 19:23:44 -0800435
436
def run_command(
    command, cwd, env, hard_timeout, grace_period, lower_priority, containment):
  """Runs the command and waits for it, enforcing timeout and grace period.

  The process is first waited on for |hard_timeout|. On timeout, or when a stop
  signal is received, it is terminated and given |grace_period| to exit before
  being killed.

  Args:
    command: list of strings; the command line to run.
    cwd: directory to start the command in.
    env: environment variables for the process.
    hard_timeout: seconds to wait before terminating the process; a falsy value
        means no timeout.
    grace_period: seconds to wait after termination before killing the process;
        a falsy value means wait without limit.
    lower_priority: passed as-is to subprocess42.Popen.
    containment: passed as-is to subprocess42.Popen.

  Returns:
    tuple(process exit code, bool if had a hard timeout)
  """
  logging.info(
      'run_command(%s, %s, %s, %s, %s, %s)',
      command, cwd, hard_timeout, grace_period, lower_priority, containment)

  exit_code = None
  had_hard_timeout = False
  with tools.Profiler('RunTest'):
    proc = None
    # A list so the nested handler can record the signal without rebinding.
    had_signal = []
    try:
      # TODO(maruel): This code is imperfect. It doesn't handle well signals
      # during the download phase and there's short windows where things can go
      # wrong.
      def handler(signum, _frame):
        # Only the first signal received after the process started is turned
        # into a TimeoutExpired, which is handled like a timeout below.
        if proc and not had_signal:
          logging.info('Received signal %d', signum)
          had_signal.append(True)
          raise subprocess42.TimeoutExpired(command, None)

      proc = subprocess42.Popen(
          command, cwd=cwd, env=env, detached=True, close_fds=True,
          lower_priority=lower_priority, containment=containment)
      logging.info('Subprocess for command started')
      with subprocess42.set_signal_handler(subprocess42.STOP_SIGNALS, handler):
        try:
          exit_code = proc.wait(hard_timeout or None)
          logging.info("finished with exit code %d", exit_code)
        except subprocess42.TimeoutExpired:
          # Raised either by the wait or by the signal handler; it is only a
          # hard timeout when no signal was recorded.
          if not had_signal:
            logging.warning('Hard timeout')
            had_hard_timeout = True
          logging.warning('Sending SIGTERM')
          proc.terminate()

      kill_sent = False
      # Ignore signals in grace period. Forcibly give the grace period to the
      # child process.
      if exit_code is None:
        ignore = lambda *_: None
        with subprocess42.set_signal_handler(subprocess42.STOP_SIGNALS, ignore):
          try:
            exit_code = proc.wait(grace_period or None)
            logging.info("finished with exit code %d", exit_code)
          except subprocess42.TimeoutExpired:
            # Now kill for real. The user can distinguish between the
            # following states:
            # - signal but process exited within grace period,
            #   hard_timed_out will be set but the process exit code will be
            #   script provided.
            # - processed exited late, exit code will be -9 on posix.
            logging.warning('Grace exhausted; sending SIGKILL')
            proc.kill()
            kill_sent = True
        logging.info('Waiting for process exit')
        exit_code = proc.wait()

      # the process group / job object may be dangling so if we didn't kill
      # it already, give it a poke now.
      if not kill_sent:
        proc.kill()
    except OSError as e:
      # This is not considered to be an internal error. The executable simply
      # does not exist.
      sys.stderr.write(
          '<The executable does not exist, a dependent library is missing or '
          'the command line is too long>\n'
          '<Check for missing .so/.dll in the .isolate or GN file or length of '
          'command line args>\n'
          '<Command: %s>\n'
          '<Exception: %s>\n' % (command, e))
      if os.environ.get('SWARMING_TASK_ID'):
        # Give an additional hint when running as a swarming task.
        sys.stderr.write(
            '<See the task\'s page for commands to help diagnose this issue '
            'by reproducing the task locally>\n')
      exit_code = 1
  # The mask renders a negative exit code as an unsigned 32 bits hex value.
  logging.info(
      'Command finished with exit code %d (%s)',
      exit_code, hex(0xffffffff & exit_code))
  return exit_code, had_hard_timeout
maruela9cfd6f2015-09-15 11:03:15 -0700524
525
def _run_go_cmd_and_wait(cmd, tmp_dir):
  """Launches an external Go command, `isolated` or `cas`, and waits for it.

  This is a generic subprocess launcher, but its waiting and logging logic is
  tailored to Go `isolated` and `cas`: the process is polled every 30 seconds,
  printing a progress line each time, for at most 50 minutes.

  Args:
    cmd: list of strings; the command line to run.
    tmp_dir: temp directory exposed to the command through its environment.

  Returns:
    The subprocess object

  Raises:
    subprocess42.CalledProcessError if the command exits with a non-zero code.
    ValueError if the command had to be stopped after the maximum timeout.
  """
  cmd_str = ' '.join(cmd)
  try:
    child_env = os.environ.copy()
    set_temp_dir(child_env, tmp_dir)
    proc = subprocess42.Popen(cmd, env=child_env)

    check_period_sec = 30
    max_checks = 100
    # max timeout = max_checks * check_period_sec = 50 minutes
    for attempt in range(1, max_checks + 1):
      # Waiting in short slices with regular output is to prevent I/O timeout
      # error during setup.
      try:
        retcode = proc.wait(check_period_sec)
      except subprocess42.TimeoutExpired:
        print('still running (after %d seconds)' % (attempt * check_period_sec))
        continue
      if retcode != 0:
        raise subprocess42.CalledProcessError(retcode, cmd=cmd_str)
      break
    else:
      # Every check timed out: stop the process, gently at first.
      proc.terminate()
      try:
        proc.wait(check_period_sec)
      except subprocess42.TimeoutExpired:
        logging.exception(
            "failed to terminate? timeout happened after %d seconds",
            check_period_sec)
        proc.kill()
        proc.wait()
      # Raise unconditionally, because |proc| was forcefully terminated.
      raise ValueError("timedout after %d seconds (cmd=%s)" %
                       (check_period_sec * max_checks, cmd_str))

    return proc
  except Exception:
    logging.exception('Failed to run Go cmd %s', cmd_str)
    raise
Ye Kuangc0cf9ca2020-07-16 08:56:51 +0000575
576
def _fetch_and_map_with_cas(cas_client, digest, instance, output_dir, cache_dir,
                            policies, kvs_dir, tmp_dir):
  """Fetches a CAS tree using cas client, creates the tree and returns stats.

  When the download fails and |kvs_dir| is set, the kvs directory and
  |output_dir| are removed and the download is attempted a second time.

  Args:
    cas_client: path to the `cas` client executable.
    digest: digest of the tree to download.
    instance: CAS instance name; ignored when the RUN_ISOLATED_CAS_ADDRESS
        environment variable is set.
    output_dir: directory the tree is created in.
    cache_dir: cache directory for the `cas` client.
    policies: object providing max_cache_size and min_free_space.
    kvs_dir: directory of the kvs cache; can be falsy to not use one.
    tmp_dir: temp directory used while running the client.

  Returns:
    dict with 'duration' (seconds), 'items_cold' and 'items_hot' as reported by
    the client.

  Raises:
    subprocess42.CalledProcessError if the client fails and there is no kvs
    cache to reset, or if the retry fails too.
  """
  start = time.time()
  # Both temporary paths are created inside the try block so that whatever was
  # created is cleaned up even when a later step fails.
  result_json_path = None
  profile_dir = None
  try:
    result_json_handle, result_json_path = tempfile.mkstemp(
        prefix=u'fetch-and-map-result-', suffix=u'.json')
    os.close(result_json_handle)
    # NOTE(review): profile_dir is created and removed but never passed to the
    # client in this function -- confirm whether it is still needed.
    profile_dir = tempfile.mkdtemp(dir=tmp_dir)

    cmd = [
        cas_client,
        'download',
        '-digest',
        digest,
        # flags for cache.
        '-cache-dir',
        cache_dir,
        '-cache-max-size',
        str(policies.max_cache_size),
        '-cache-min-free-space',
        str(policies.min_free_space),
        # flags for output.
        '-dir',
        output_dir,
        '-dump-stats-json',
        result_json_path,
        '-log-level',
        'info',
    ]

    # When RUN_ISOLATED_CAS_ADDRESS is set in test mode,
    # Use it and ignore CAS instance option.
    cas_addr = os.environ.get('RUN_ISOLATED_CAS_ADDRESS')
    if cas_addr:
      cmd.extend([
          '-cas-addr',
          cas_addr,
      ])
    else:
      cmd.extend([
          '-cas-instance',
          instance
      ])

    if kvs_dir:
      cmd.extend(['-kvs-dir', kvs_dir])

    try:
      _run_go_cmd_and_wait(cmd, tmp_dir)
    except subprocess42.CalledProcessError as ex:
      if not kvs_dir:
        raise
      logging.exception('Failed to run cas, removing kvs cache dir and retry.')
      on_error.report("Failed to run cas %s" % ex)
      # Start over from a clean state: no kvs cache, no partial output.
      file_path.rmtree(kvs_dir)
      file_path.rmtree(output_dir)
      _run_go_cmd_and_wait(cmd, tmp_dir)

    with open(result_json_path) as json_file:
      result_json = json.load(json_file)

    return {
        'duration': time.time() - start,
        'items_cold': result_json['items_cold'],
        'items_hot': result_json['items_hot'],
    }
  finally:
    # Nested so that a failure to remove the file does not leak the directory.
    try:
      if result_json_path is not None:
        fs.remove(result_json_path)
    finally:
      if profile_dir is not None:
        file_path.rmtree(profile_dir)
Junji Watanabe4b890ef2020-09-16 01:43:27 +0000651
652
# TODO(crbug.com/932396): remove this function.
def fetch_and_map(isolated_hash, storage, cache, outdir):
  """Fetches an isolated tree into |outdir| and returns download stats.

  Returns:
    dict with 'duration' (seconds) plus 'items_cold' and 'items_hot', each a
    base64 string of large.pack() applied to the sorted entries. Cold entries
    are cache.added; hot entries are cache.used minus cache.added, counted as
    multisets.
  """

  def _encode(entries):
    return base64.b64encode(large.pack(sorted(entries))).decode()

  began = time.time()
  isolateserver.fetch_isolated(
      isolated_hash=isolated_hash,
      storage=storage,
      cache=cache,
      outdir=outdir,
      use_symlinks=False)
  used_count = collections.Counter(cache.used)
  added_count = collections.Counter(cache.added)
  hot_entries = (used_count - added_count).elements()
  elapsed = time.time() - began
  return {
      'duration': elapsed,
      'items_cold': _encode(cache.added),
      'items_hot': _encode(hot_entries),
  }
670
671
def link_outputs_to_outdir(run_dir, out_dir, outputs):
  """Copies or links each named output from run_dir into out_dir for upload.

  Does nothing when |outputs| is empty or None. Otherwise the directories
  needed for |outputs| are created under |out_dir| first, then every entry is
  transferred with copy_recursively().
  """
  if outputs:
    file_path.create_directories(out_dir, outputs)
    for relpath in outputs:
      source = os.path.join(run_dir, relpath)
      target = os.path.join(out_dir, relpath)
      copy_recursively(source, target)
682
683
def copy_recursively(src, dst):
  """Copies the file or directory |src| to |dst|, hardlinking when possible.

  |src| may be a file, a directory, or a symlink to either. Symlinks are
  replaced with their targets before copying, and that applies to every child
  as well since each one goes through this same function.

  Files are linked with file_path.link_file() using HARDLINK_WITH_FALLBACK
  rather than copied byte by byte, unlike Python's shutil.copytree().

  A missing source or a broken symlink is logged as a warning and skipped. Any
  other OSError is logged at info level and swallowed.
  """
  requested = src
  try:
    # Follow symlinks until a real path is reached.
    while fs.islink(src):
      link_target = fs.readlink(src)
      src = os.path.realpath(os.path.join(os.path.dirname(src), link_target))
      # TODO(sadafm): Explicitly handle cyclic symlinks.

    if not fs.exists(src):
      logging.warning('Path %s does not exist or %s is a broken symlink', src,
                      requested)
    elif fs.isfile(src):
      file_path.link_file(dst, src, file_path.HARDLINK_WITH_FALLBACK)
    else:
      if not fs.exists(dst):
        os.makedirs(dst)
      for entry in fs.listdir(src):
        copy_recursively(os.path.join(src, entry), os.path.join(dst, entry))

  except OSError as err:
    if err.errno != errno.ENOENT:
      logging.info("Couldn't collect output file %s: %s", src, err)
    else:
      logging.warning('Path %s does not exist or %s is a broken symlink',
                      src, requested)
aludwin0a8e17d2016-10-27 15:57:39 -0700724
725
def _upload_with_py(storage, out_dir):
  """Archives |out_dir| to |storage| and returns (isolated, cold, hot).

  |isolated| is the first value of the results mapping returned by
  isolateserver.archive_files_to_storage(). |cold| and |hot| are base64
  strings of large.pack() applied to the sorted item sizes.

  isolateserver.Aborted is re-raised after a note is written to stderr.
  """

  def _pack_sizes(items):
    sizes = sorted(item.size for item in items)
    return base64.b64encode(large.pack(sizes)).decode()

  try:
    results, cold_items, hot_items = isolateserver.archive_files_to_storage(
        storage, [out_dir], None, verify_push=True)
    isolated = list(results.values())[0]
    return isolated, _pack_sizes(cold_items), _pack_sizes(hot_items)
  except isolateserver.Aborted:
    # A SIGTERM arrived while data was being uploaded. Two causes:
    # - The task was too slow and was about to be killed anyway for exceeding
    #   the hard timeout.
    # - The amount of data to upload is very large and archiving took too
    #   long.
    sys.stderr.write('Received SIGTERM while uploading')
    # Propagate so the caller treats this as an internal failure.
    raise
751
752
def upload_out_dir(storage, out_dir):
  """Uploads the content of |out_dir|, if any, and returns upload stats.

  The upload only happens when |out_dir| is an existing, non-empty directory.

  Returns:
    tuple(outputs_ref, stats)
    - outputs_ref: dict with 'isolated', 'isolatedserver' and 'namespace'
      describing the archived results, or None when nothing was uploaded.
    - stats: dict with 'duration', 'items_cold' and 'items_hot'; the two item
      entries are empty strings when nothing was uploaded.
  """
  began = time.time()
  outputs_ref = None
  cold, hot = '', ''

  has_files = fs.isdir(out_dir) and fs.listdir(out_dir)
  if has_files:
    with tools.Profiler('ArchiveOutput'):
      isolated, cold, hot = _upload_with_py(storage, out_dir)
      server_ref = storage.server_ref
      outputs_ref = {
          'isolated': isolated,
          'isolatedserver': server_ref.url,
          'namespace': server_ref.namespace,
      }

  return outputs_ref, {
      'duration': time.time() - began,
      'items_cold': cold,
      'items_hot': hot,
  }
maruela9cfd6f2015-09-15 11:03:15 -0700784
785
def upload_outdir_with_cas(cas_client, cas_instance, outdir, tmp_dir):
  """Archives |outdir| with `cas archive`, if it contains anything.

  Returns:
    tuple(cas_output_root, stats)
    - cas_output_root: dict with 'cas_instance' and a 'digest' dict holding
      'hash' and 'size_bytes', parsed from the "<hash>/<size>" text dumped by
      the cas client.
    - stats: the stats JSON dumped by the cas client, with 'duration' added.
    Both are None when |outdir| is empty.
  """
  if not fs.listdir(outdir):
    return None, None

  digest_fd, digest_path = tempfile.mkstemp(
      prefix=u'cas-digest', suffix=u'.txt')
  os.close(digest_fd)
  stats_fd, stats_path = tempfile.mkstemp(
      prefix=u'upload-stats', suffix=u'.json')
  os.close(stats_fd)

  try:
    cmd = [
        cas_client,
        'archive',
        '-paths',
        # Format: <working directory>:<relative path to dir>
        outdir + ':',
        # output
        '-dump-digest',
        digest_path,
        '-dump-stats-json',
        stats_path,
    ]

    # RUN_ISOLATED_CAS_ADDRESS (test mode) takes precedence over the CAS
    # instance option.
    cas_addr = os.environ.get('RUN_ISOLATED_CAS_ADDRESS')
    cmd += ['-cas-addr', cas_addr] if cas_addr else [
        '-cas-instance', cas_instance
    ]

    if sys.platform.startswith('linux'):
      # TODO(crbug.com/1243194): remove this after investigation.
      cmd += ['-log-level', 'debug']

    began = time.time()
    _run_go_cmd_and_wait(cmd, tmp_dir)

    with open(digest_path) as digest_file:
      raw_digest = digest_file.read()
    digest_hash, digest_size = raw_digest.split('/')
    cas_output_root = {
        'cas_instance': cas_instance,
        'digest': {
            'hash': digest_hash,
            'size_bytes': int(digest_size)
        }
    }

    with open(stats_path) as stats_file:
      stats = json.load(stats_file)
    stats['duration'] = time.time() - began

    return cas_output_root, stats
  finally:
    fs.remove(digest_path)
    fs.remove(stats_path)
858
859
def map_and_run(data, constant_run_path):
  """Runs a command with optional isolated input/output.

  Sets up the run, output, temp and cas client directories under
  data.root_dir, installs packages, fetches inputs, runs the command, uploads
  outputs and finally removes the directories it created.

  Arguments:
  - data: TaskData instance.
  - constant_run_path: when true (and data.root_dir is set), the run directory
      is the fixed path <root_dir>/ISOLATED_RUN_DIR, recreated empty;
      otherwise a fresh temporary directory is made under data.root_dir.

  Returns:
    dict with metadata about the result ('exit_code', 'duration', 'stats',
    'internal_failure', ...). 'internal_failure' is None only when the whole
    sequence completed; a failing command is reported through 'exit_code'.
  """

  if data.isolate_cache:
    download_stats = {
        #'duration': 0.,
        'initial_number_items': len(data.isolate_cache),
        'initial_size': data.isolate_cache.total_size,
        #'items_cold': '<large.pack()>',
        #'items_hot': '<large.pack()>',
    }
  else:
    # TODO(tikuta): take stats from state.json in this case too.
    download_stats = {}

  result = {
      'duration': None,
      'exit_code': None,
      'had_hard_timeout': False,
      'internal_failure': 'run_isolated did not complete properly',
      'stats': {
          'trim_caches': {
              'duration': 0,
          },
          #'cipd': {
          #  'duration': 0.,
          #  'get_client_duration': 0.,
          #},
          'isolated': {
              'download': download_stats,
              #'upload': {
              #  'duration': 0.,
              #  'items_cold': '<large.pack()>',
              #  'items_hot': '<large.pack()>',
              #},
          },
          'named_caches': {
              'install': {
                  'duration': 0,
              },
              'uninstall': {
                  'duration': 0,
              },
          },
          'cleanup': {
              'duration': 0,
          }
      },
      #'cipd_pins': {
      #  'packages': [
      #    {'package_name': ..., 'version': ..., 'path': ...},
      #    ...
      #  ],
      #  'client_package': {'package_name': ..., 'version': ...},
      #},
      'outputs_ref': None,
      'cas_output_root': None,
      'version': 5,
  }

  assert os.path.isabs(data.root_dir), ("data.root_dir is not abs path: %s" %
                                        data.root_dir)
  file_path.ensure_tree(data.root_dir, 0o700)

  # See comment for these constants.
  # TODO(maruel): This is not obvious. Change this to become an error once we
  # make the constant_run_path an exposed flag.
  if constant_run_path and data.root_dir:
    run_dir = os.path.join(data.root_dir, ISOLATED_RUN_DIR)
    if os.path.isdir(run_dir):
      file_path.rmtree(run_dir)
    os.mkdir(run_dir, 0o700)
  else:
    run_dir = make_temp_dir(ISOLATED_RUN_DIR, data.root_dir)

  # True if CAS is used for download/upload files.
  use_cas = bool(data.cas_digest)

  # storage should be normally set but don't crash if it is not. This can happen
  # as Swarming task can run without an isolate server.
  out_dir = None
  if data.storage or use_cas:
    out_dir = make_temp_dir(ISOLATED_OUT_DIR, data.root_dir)
  tmp_dir = make_temp_dir(ISOLATED_TMP_DIR, data.root_dir)
  cwd = run_dir
  if data.relative_cwd:
    cwd = os.path.normpath(os.path.join(cwd, data.relative_cwd))
  command = data.command

  cas_client = None
  cas_client_dir = make_temp_dir(_CAS_CLIENT_DIR, data.root_dir)
  if use_cas:
    cas_client = os.path.join(cas_client_dir, 'cas' + cipd.EXECUTABLE_SUFFIX)

  data.trim_caches_fn(result['stats']['trim_caches'])

  nsjail_dir = None
  if (sys.platform == "linux" and cipd.get_platform() == "amd64" and
      data.containment.containment_type == subprocess42.Containment.NSJAIL):
    nsjail_dir = make_temp_dir(_NSJAIL_DIR, data.root_dir)

  try:
    with data.install_packages_fn(run_dir, cas_client_dir,
                                  nsjail_dir) as cipd_info:
      if cipd_info:
        result['stats']['cipd'] = cipd_info.stats
        result['cipd_pins'] = cipd_info.pins

      isolated_stats = result['stats'].setdefault('isolated', {})
      if data.isolated_hash:
        stats = fetch_and_map(isolated_hash=data.isolated_hash,
                              storage=data.storage,
                              cache=data.isolate_cache,
                              outdir=run_dir)
        isolated_stats['download'].update(stats)

      elif data.cas_digest:
        stats = _fetch_and_map_with_cas(
            cas_client=cas_client,
            digest=data.cas_digest,
            instance=data.cas_instance,
            output_dir=run_dir,
            cache_dir=data.cas_cache_dir,
            policies=data.cas_cache_policies,
            kvs_dir=data.cas_kvs,
            tmp_dir=tmp_dir)
        isolated_stats['download'].update(stats)

      if not command:
        # Handle this as a task failure, not an internal failure.
        sys.stderr.write(
            '<No command was specified!>\n'
            '<Please secify a command when triggering your Swarming task>\n')
        result['exit_code'] = 1
        return result

      # A bare startswith(run_dir) would also accept a sibling directory whose
      # name merely begins with the run directory's name (e.g. '<run_dir>_x',
      # reachable through relative_cwd='../<name>_x'), so require an exact
      # match or a path separator right after the prefix.
      if cwd != run_dir and not cwd.startswith(run_dir + os.sep):
        # Handle this as a task failure, not an internal failure. This is a
        # 'last chance' way to gate against directory escape.
        sys.stderr.write('<Relative CWD is outside of run directory!>\n')
        result['exit_code'] = 1
        return result

      if not os.path.isdir(cwd):
        # Accepts relative_cwd that does not exist.
        os.makedirs(cwd, 0o700)

      # If we have an explicit list of files to return, make sure their
      # directories exist now.
      if data.storage and data.outputs:
        file_path.create_directories(run_dir, data.outputs)

      with data.install_named_caches(run_dir, result['stats']['named_caches']):
        sys.stdout.flush()
        start = time.time()
        try:
          # Need to switch the default account before 'get_command_env' call,
          # so it can grab correct value of LUCI_CONTEXT env var.
          with set_luci_context_account(data.switch_to_account, tmp_dir):
            env = get_command_env(
                tmp_dir, cipd_info, run_dir, data.env, data.env_prefix, out_dir,
                data.bot_file)
            command = tools.find_executable(command, env)
            command = process_command(command, out_dir, data.bot_file)
            file_path.ensure_command_has_abs_path(command, cwd)

            result['exit_code'], result['had_hard_timeout'] = run_command(
                command, cwd, env, data.hard_timeout, data.grace_period,
                data.lower_priority, data.containment)
        finally:
          result['duration'] = max(time.time() - start, 0)

      if out_dir:
        # Try to link files to the output directory, if specified.
        link_outputs_to_outdir(run_dir, out_dir, data.outputs)
        isolated_stats = result['stats'].setdefault('isolated', {})
        if use_cas:
          result['cas_output_root'], isolated_stats['upload'] = (
              upload_outdir_with_cas(cas_client, data.cas_instance, out_dir,
                                     tmp_dir))
        else:
          # This could use |go_isolated_client|, so make sure it runs when the
          # CIPD package still exists.
          result['outputs_ref'], isolated_stats['upload'] = (
              upload_out_dir(data.storage, out_dir))
      # We successfully ran the command, set internal_failure back to
      # None (even if the command failed, it's not an internal error).
      result['internal_failure'] = None
  except Exception as e:
    # An internal error occurred. Report accordingly so the swarming task will
    # be retried automatically.
    logging.exception('internal failure: %s', e)
    result['internal_failure'] = str(e)
    on_error.report(None)

  # Clean up
  finally:
    try:
      cleanup_start = time.time()
      success = True
      if data.leak_temp_dir:
        logging.warning(
            'Deliberately leaking %s for later examination', run_dir)
      else:
        # On Windows rmtree(run_dir) call above has a synchronization effect: it
        # finishes only when all task child processes terminate (since a running
        # process locks *.exe file). Examine out_dir only after that call
        # completes (since child processes may write to out_dir too and we need
        # to wait for them to finish).
        dirs_to_remove = [run_dir, tmp_dir, cas_client_dir]
        if out_dir:
          dirs_to_remove.append(out_dir)
        if nsjail_dir:
          # Created above with make_temp_dir(); remove it like the other
          # per-task directories so it does not pile up under root_dir.
          dirs_to_remove.append(nsjail_dir)
        for directory in dirs_to_remove:
          if not fs.isdir(directory):
            continue
          start = time.time()
          removed = True
          try:
            file_path.rmtree(directory)
          except OSError as e:
            logging.error('rmtree(%r) failed: %s', directory, e)
            removed = False
            success = False
          finally:
            logging.info('Cleanup: rmtree(%r) took %d seconds', directory,
                         time.time() - start)
          if not removed:
            # Report only the directory that actually failed to go away, not
            # every directory processed after an earlier failure.
            sys.stderr.write(
                OUTLIVING_ZOMBIE_MSG % (directory, data.grace_period))
            if sys.platform == 'win32':
              subprocess42.check_call(['tasklist.exe', '/V'], stdout=sys.stderr)
            else:
              subprocess42.check_call(['ps', 'axu'], stdout=sys.stderr)

      # A cleanup failure turns an otherwise successful task into a failure.
      if not success and result['exit_code'] == 0:
        result['exit_code'] = 1
    except Exception as e:
      # Swallow any exception in the main finally clause.
      if out_dir:
        logging.exception('Leaking out_dir %s: %s', out_dir, e)
      result['internal_failure'] = str(e)
      on_error.report(None)
    finally:
      cleanup_duration = time.time() - cleanup_start
      result['stats']['cleanup']['duration'] = cleanup_duration
      logging.info('Cleanup: removing directories took %d seconds',
                   cleanup_duration)
  return result
Marc-Antoine Ruel2283ad12014-02-09 11:14:57 -05001116
1117
def run_tha_test(data, result_json):
  """Runs the task through map_and_run() and reports its result.

  Arguments:
  - data: TaskData instance.
  - result_json: File path to dump result metadata into. If set, the process
      exit code is always 0 unless an internal error occurred.

  Without |result_json|, a non-empty 'outputs_ref' is printed to stdout
  between [run_isolated_out_hack] markers.

  Returns:
    Process exit code that should be used.
  """
  if result_json:
    # Leave a placeholder on disk right away in case we get killed before the
    # real result is known.
    tools.write_json(
        result_json,
        {
            'exit_code': None,
            'had_hard_timeout': False,
            'internal_failure': 'Was terminated before completion',
            'outputs_ref': None,
            'cas_output_root': None,
            'version': 5,
        },
        dense=True)

  result = map_and_run(data, True)
  logging.info('Result:\n%s', tools.format_json(result, dense=True))
  internal_failure_code = int(bool(result['internal_failure']))

  if result_json:
    # We've found tests to delete 'work' when quitting, causing an exception
    # here. Try to recreate the directory if necessary.
    file_path.ensure_tree(os.path.dirname(result_json))
    tools.write_json(result_json, result, dense=True)
    # Only return 1 if there was an internal error.
    return internal_failure_code

  # Marshall into old-style inline output.
  outputs_ref = result['outputs_ref']
  if outputs_ref:
    # pylint: disable=unsubscriptable-object
    legacy_ref = {
        'hash': outputs_ref['isolated'],
        'namespace': outputs_ref['namespace'],
        'storage': outputs_ref['isolatedserver'],
    }
    sys.stdout.flush()
    print('[run_isolated_out_hack]%s[/run_isolated_out_hack]' %
          tools.format_json(legacy_ref, dense=True))
    sys.stdout.flush()
  return result['exit_code'] or internal_failure_code
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001174
1175
# Value yielded by 'install_client_and_packages'. Fields, in order:
#   client:    cipd.CipdClient object
#   cache_dir: absolute path to bot-global cipd tag and instance cache
#   stats:     dict with stats to return to the server
#   pins:      dict with installed cipd pins to return to the server
CipdInfo = collections.namedtuple(
    'CipdInfo', ('client', 'cache_dir', 'stats', 'pins'))
1183
1184
@contextlib.contextmanager
def copy_local_packages(_run_dir, cas_dir, _nsjail_dir):
  """Copies the cas binary from $LUCI_GO_CLIENT_DIR into |cas_dir|.

  Context manager taking the place of a real CIPD installation; it yields
  None. |_run_dir| and |_nsjail_dir| are accepted but not used.
  """
  go_client_dir = os.environ.get('LUCI_GO_CLIENT_DIR')
  assert go_client_dir, ('Please set LUCI_GO_CLIENT_DIR env var to install CIPD'
                         ' packages locally.')
  cas_source = os.path.join(go_client_dir, 'cas' + cipd.EXECUTABLE_SUFFIX)
  cas_target = os.path.join(cas_dir, 'cas' + cipd.EXECUTABLE_SUFFIX)
  shutil.copy2(cas_source, cas_target)
  yield None
1194
1195
Takuto Ikuta2efc7792019-11-27 14:33:34 +00001196def _install_packages(run_dir, cipd_cache_dir, client, packages):
iannuccib58d10d2017-03-18 02:00:25 -07001197 """Calls 'cipd ensure' for packages.
1198
1199 Args:
1200 run_dir (str): root of installation.
1201 cipd_cache_dir (str): the directory to use for the cipd package cache.
1202 client (CipdClient): the cipd client to use
1203 packages: packages to install, list [(path, package_name, version), ...].
iannuccib58d10d2017-03-18 02:00:25 -07001204
1205 Returns: list of pinned packages. Looks like [
1206 {
1207 'path': 'subdirectory',
1208 'package_name': 'resolved/package/name',
1209 'version': 'deadbeef...',
1210 },
1211 ...
1212 ]
1213 """
1214 package_pins = [None]*len(packages)
1215 def insert_pin(path, name, version, idx):
1216 package_pins[idx] = {
1217 'package_name': name,
1218 # swarming deals with 'root' as '.'
1219 'path': path or '.',
1220 'version': version,
1221 }
1222
1223 by_path = collections.defaultdict(list)
1224 for i, (path, name, version) in enumerate(packages):
1225 # cipd deals with 'root' as ''
1226 if path == '.':
1227 path = ''
1228 by_path[path].append((name, version, i))
1229
1230 pins = client.ensure(
Takuto Ikuta2efc7792019-11-27 14:33:34 +00001231 run_dir,
1232 {
1233 subdir: [(name, vers) for name, vers, _ in pkgs
1234 ] for subdir, pkgs in by_path.items()
1235 },
1236 cache_dir=cipd_cache_dir,
iannuccib58d10d2017-03-18 02:00:25 -07001237 )
1238
Marc-Antoine Ruel04903a32019-10-09 21:09:25 +00001239 for subdir, pin_list in sorted(pins.items()):
iannuccib58d10d2017-03-18 02:00:25 -07001240 this_subdir = by_path[subdir]
1241 for i, (name, version) in enumerate(pin_list):
1242 insert_pin(subdir, name, version, this_subdir[i][2])
1243
Robert Iannucci461b30d2017-12-13 11:34:03 -08001244 assert None not in package_pins, (packages, pins, package_pins)
iannuccib58d10d2017-03-18 02:00:25 -07001245
1246 return package_pins
1247
1248
vadimsh232f5a82017-01-20 19:23:44 -08001249@contextlib.contextmanager
Takuto Ikuta2efc7792019-11-27 14:33:34 +00001250def install_client_and_packages(run_dir, packages, service_url,
Takuto Ikutab7ce0e32019-11-27 23:26:18 +00001251 client_package_name, client_version, cache_dir,
Takuto Ikuta1ce61362021-11-16 05:44:17 +00001252 cas_dir, nsjail_dir):
vadimsh902948e2017-01-20 15:57:32 -08001253 """Bootstraps CIPD client and installs CIPD packages.
iannucci96fcccc2016-08-30 15:52:22 -07001254
vadimsh232f5a82017-01-20 19:23:44 -08001255 Yields CipdClient, stats, client info and pins (as single CipdInfo object).
1256
1257 Pins and the CIPD client info are in the form of:
iannucci96fcccc2016-08-30 15:52:22 -07001258 [
1259 {
1260 "path": path, "package_name": package_name, "version": version,
1261 },
1262 ...
1263 ]
vadimsh902948e2017-01-20 15:57:32 -08001264 (the CIPD client info is a single dictionary instead of a list)
iannucci96fcccc2016-08-30 15:52:22 -07001265
1266 such that they correspond 1:1 to all input package arguments from the command
1267 line. These dictionaries make their all the way back to swarming, where they
1268 become the arguments of CipdPackage.
nodirbe642ff2016-06-09 15:51:51 -07001269
vadimsh902948e2017-01-20 15:57:32 -08001270 If 'packages' list is empty, will bootstrap CIPD client, but won't install
1271 any packages.
1272
1273 The bootstrapped client (regardless whether 'packages' list is empty or not),
vadimsh232f5a82017-01-20 19:23:44 -08001274 will be made available to the task via $PATH.
vadimsh902948e2017-01-20 15:57:32 -08001275
nodirbe642ff2016-06-09 15:51:51 -07001276 Args:
nodir90bc8dc2016-06-15 13:35:21 -07001277 run_dir (str): root of installation.
vadimsh902948e2017-01-20 15:57:32 -08001278 packages: packages to install, list [(path, package_name, version), ...].
nodirbe642ff2016-06-09 15:51:51 -07001279 service_url (str): CIPD server url, e.g.
1280 "https://chrome-infra-packages.appspot.com."
nodir90bc8dc2016-06-15 13:35:21 -07001281 client_package_name (str): CIPD package name of CIPD client.
1282 client_version (str): Version of CIPD client.
nodirbe642ff2016-06-09 15:51:51 -07001283 cache_dir (str): where to keep cache of cipd clients, packages and tags.
Junji Watanabe4b890ef2020-09-16 01:43:27 +00001284 cas_dir (str): where to download cas client.
Anirudh Mathukumilli92d57b62021-08-04 23:21:57 +00001285 nsjail_dir (str): where to download nsjail. If set to None, nsjail is not
1286 downloaded.
nodirbe642ff2016-06-09 15:51:51 -07001287 """
1288 assert cache_dir
nodir90bc8dc2016-06-15 13:35:21 -07001289
nodirbe642ff2016-06-09 15:51:51 -07001290 start = time.time()
nodirbe642ff2016-06-09 15:51:51 -07001291
vadimsh902948e2017-01-20 15:57:32 -08001292 cache_dir = os.path.abspath(cache_dir)
vadimsh232f5a82017-01-20 19:23:44 -08001293 cipd_cache_dir = os.path.join(cache_dir, 'cache') # tag and instance caches
nodir90bc8dc2016-06-15 13:35:21 -07001294 run_dir = os.path.abspath(run_dir)
vadimsh902948e2017-01-20 15:57:32 -08001295 packages = packages or []
nodir90bc8dc2016-06-15 13:35:21 -07001296
nodirbe642ff2016-06-09 15:51:51 -07001297 get_client_start = time.time()
Junji Watanabe4b890ef2020-09-16 01:43:27 +00001298 client_manager = cipd.get_client(cache_dir, service_url, client_package_name,
1299 client_version)
iannucci96fcccc2016-08-30 15:52:22 -07001300
nodirbe642ff2016-06-09 15:51:51 -07001301 with client_manager as client:
1302 get_client_duration = time.time() - get_client_start
nodir90bc8dc2016-06-15 13:35:21 -07001303
iannuccib58d10d2017-03-18 02:00:25 -07001304 package_pins = []
1305 if packages:
Takuto Ikuta2efc7792019-11-27 14:33:34 +00001306 package_pins = _install_packages(run_dir, cipd_cache_dir, client,
1307 packages)
iannuccib58d10d2017-03-18 02:00:25 -07001308
Junji Watanabe4b890ef2020-09-16 01:43:27 +00001309 # Install cas client to |cas_dir|.
1310 _install_packages(cas_dir, cipd_cache_dir, client,
Takuto Ikuta9c4eb1d2020-10-05 03:40:14 +00001311 [('', _CAS_PACKAGE, _LUCI_GO_REVISION)])
Junji Watanabe4b890ef2020-09-16 01:43:27 +00001312
Anirudh Mathukumilli92d57b62021-08-04 23:21:57 +00001313 # Install nsjail to |nsjail_dir|.
1314 if nsjail_dir is not None:
1315 _install_packages(nsjail_dir, cipd_cache_dir, client,
1316 [('', _NSJAIL_PACKAGE, _NSJAIL_VERSION)])
1317
iannuccib58d10d2017-03-18 02:00:25 -07001318 file_path.make_tree_files_read_only(run_dir)
nodir90bc8dc2016-06-15 13:35:21 -07001319
vadimsh232f5a82017-01-20 19:23:44 -08001320 total_duration = time.time() - start
Junji Watanabe38b28b02020-04-23 10:23:30 +00001321 logging.info('Installing CIPD client and packages took %d seconds',
1322 total_duration)
nodir90bc8dc2016-06-15 13:35:21 -07001323
vadimsh232f5a82017-01-20 19:23:44 -08001324 yield CipdInfo(
Junji Watanabe38b28b02020-04-23 10:23:30 +00001325 client=client,
1326 cache_dir=cipd_cache_dir,
1327 stats={
1328 'duration': total_duration,
1329 'get_client_duration': get_client_duration,
iannuccib58d10d2017-03-18 02:00:25 -07001330 },
Junji Watanabe38b28b02020-04-23 10:23:30 +00001331 pins={
1332 'client_package': {
1333 'package_name': client.package_name,
1334 'version': client.instance_id,
1335 },
1336 'packages': package_pins,
1337 })
nodirbe642ff2016-06-09 15:51:51 -07001338
1339
def create_option_parser():
  """Creates the option parser for the run_isolated command line.

  Registers, in order: the general execution options, the two data sources
  (isolate server and Content Addressed Storage), the cache options, the CIPD
  options, the named cache options, the process containment options, the
  debugging options and the authentication options.

  Returns:
    The logging_utils.OptionParserWithLogging instance, with the default of
    'cache' set to 'cache'.
  """
  parser = logging_utils.OptionParserWithLogging(
      usage='%prog <options> [command to run or extra args]',
      version=__version__,
      log_file=RUN_ISOLATED_LOG_FILE)
  parser.add_option(
      '--clean',
      action='store_true',
      help='Cleans the cache, trimming if necessary and remove corrupted items '
      'and returns without executing anything; use with -v to know what '
      'was done')
  parser.add_option(
      '--json',
      help='dump output metadata to json file. When used, run_isolated returns '
      'non-zero only on internal failure')
  parser.add_option(
      '--hard-timeout', type='float', help='Enforce hard timeout in execution')
  parser.add_option(
      '--grace-period',
      type='float',
      help='Grace period between SIGTERM and SIGKILL')
  parser.add_option(
      '--relative-cwd',
      help='Ignore the isolated \'relative_cwd\' and use this one instead')
  parser.add_option(
      '--env',
      default=[],
      action='append',
      help='Environment variables to set for the child process')
  parser.add_option(
      '--env-prefix',
      default=[],
      action='append',
      help='Specify a VAR=./path/fragment to put in the environment variable '
      'before executing the command. The path fragment must be relative '
      'to the isolated run directory, and must not contain a `..` token. '
      'The path will be made absolute and prepended to the indicated '
      '$VAR using the OS\'s path separator. Multiple items for the same '
      '$VAR will be prepended in order.')
  parser.add_option(
      '--bot-file',
      help='Path to a file describing the state of the host. The content is '
      'defined by on_before_task() in bot_config.')
  parser.add_option(
      '--switch-to-account',
      help='If given, switches LUCI_CONTEXT to given logical service account '
      '(e.g. "task" or "system") before launching the isolated process.')
  parser.add_option(
      '--output',
      action='append',
      help='Specifies an output to return. If no outputs are specified, all '
      'files located in ${ISOLATED_OUTDIR} will be returned; '
      'otherwise, outputs in both ${ISOLATED_OUTDIR} and those '
      'specified by --output option (there can be multiple) will be '
      'returned. Note that if a file in OUT_DIR has the same path '
      'as an --output option, the --output version will be returned.')
  parser.add_option(
      '-a',
      '--argsfile',
      # This is actually handled in parse_args; it's included here purely so it
      # can make it into the help text.
      help='Specify a file containing a JSON array of arguments to this '
      'script. If --argsfile is provided, no other argument may be '
      'provided on the command line.')
  parser.add_option(
      '--report-on-exception',
      action='store_true',
      help='Whether report exception during execution to isolate server. '
      'This flag should only be used in swarming bot.')

  group = optparse.OptionGroup(parser, 'Data source - Isolate server')
  # Deprecated. Isolate server is being migrated to RBE-CAS.
  # Remove --isolated and isolate server options after migration.
  group.add_option(
      '-s', '--isolated',
      help='Hash of the .isolated to grab from the isolate server.')
  isolateserver.add_isolate_server_options(group)
  parser.add_option_group(group)

  group = optparse.OptionGroup(parser,
                               'Data source - Content Addressed Storage')
  group.add_option(
      '--cas-instance', help='Full CAS instance name for input/output files.')
  group.add_option(
      '--cas-digest',
      help='Digest of the input root on RBE-CAS. The format is '
      '`{hash}/{size_bytes}`.')
  parser.add_option_group(group)

  # Cache options.
  isolateserver.add_cache_options(parser)
  add_cas_cache_options(parser)

  cipd.add_cipd_options(parser)

  group = optparse.OptionGroup(parser, 'Named caches')
  group.add_option(
      '--named-cache',
      dest='named_caches',
      action='append',
      nargs=3,
      default=[],
      help='A named cache to request. Accepts 3 arguments: name, path, hint. '
      'name identifies the cache, must match regex [a-z0-9_]{1,4096}. '
      'path is a path relative to the run dir where the cache directory '
      'must be put to. '
      'This option can be specified more than once.')
  group.add_option(
      '--named-cache-root',
      default='named_caches',
      help='Cache root directory. Default=%default')
  parser.add_option_group(group)

  # These options are registered on the group, not on the parser, so that
  # --help lists them under 'Process containment' instead of leaving that
  # section empty. Parsing and defaults are unaffected.
  group = optparse.OptionGroup(parser, 'Process containment')
  group.add_option(
      '--lower-priority', action='store_true',
      help='Lowers the child process priority')
  group.add_option(
      '--containment-type',
      choices=('NONE', 'AUTO', 'JOB_OBJECT', 'NSJAIL'),
      default='NONE',
      help='Type of container to use')
  group.add_option(
      '--limit-processes',
      type='int',
      default=0,
      help='Maximum number of active processes in the containment')
  group.add_option(
      '--limit-total-committed-memory',
      type='int',
      default=0,
      help='Maximum sum of committed memory in the containment')
  parser.add_option_group(group)

  group = optparse.OptionGroup(parser, 'Debugging')
  group.add_option(
      '--leak-temp-dir',
      action='store_true',
      help='Deliberately leak isolate\'s temp dir for later examination. '
      'Default: %default')
  group.add_option('--root-dir', help='Use a directory instead of a random one')
  parser.add_option_group(group)

  auth.add_auth_options(parser)

  parser.set_defaults(cache='cache')
  return parser
1487
1488
def add_cas_cache_options(parser):
  """Registers the 'CAS cache management' option group on |parser|.

  The group provides --cas-cache (defaults to 'cas-cache') and --kvs-dir
  (defaults to the empty string).
  """
  cas_group = optparse.OptionGroup(parser, 'CAS cache management')

  cas_cache_help = (
      'Directory to keep a local cache of the files. Accelerates download '
      'by reusing already downloaded files. Default=%default')
  cas_group.add_option(
      '--cas-cache', metavar='DIR', default='cas-cache', help=cas_cache_help)

  kvs_dir_help = 'CAS cache dir using kvs for small files. Default=%default'
  cas_group.add_option('--kvs-dir', default='', help=kvs_dir_help)

  parser.add_option_group(cas_group)
1502
1503
def process_cas_cache_options(options):
  """Returns the content addressed cache selected by --cas-cache.

  When options.cas_cache is empty, an in-memory cache is returned. Otherwise a
  disk cache located at the absolute path of options.cas_cache is created with
  trimming disabled.
  """
  if not options.cas_cache:
    return local_caching.MemoryContentAddressedCache()

  cache_policies = local_caching.CachePolicies(
      max_cache_size=options.max_cache_size,
      min_free_space=options.min_free_space,
      # The CAS cache does not use max_items for now.
      max_items=None,
      max_age_secs=MAX_AGE_SECS)
  cache_path = six.text_type(os.path.abspath(options.cas_cache))
  return local_caching.DiskContentAddressedCache(
      cache_path, cache_policies, trim=False)
1516
1517
def process_named_cache_options(parser, options, time_fn=None):
  """Checks the named cache options and builds the named cache.

  Args:
    parser: option parser; its error() method is called on invalid options.
    options: parsed options; named_caches, named_cache_root and min_free_space
        are read.
    time_fn: passed as is to local_caching.NamedCache.

  Returns:
    A local_caching.NamedCache rooted at --named-cache-root, or None when
    --named-cache-root is empty.
  """
  requested = options.named_caches
  if requested and not options.named_cache_root:
    parser.error('--named-cache is specified, but --named-cache-root is empty')

  for cache_name, cache_path, size_hint in requested:
    if not CACHE_NAME_RE.match(cache_name):
      parser.error('cache name %r does not match %r' %
                   (cache_name, CACHE_NAME_RE.pattern))
    if not cache_path:
      parser.error('cache path cannot be empty')
    try:
      int(size_hint)
    except ValueError:
      parser.error('cache hint must be a number')

  if not options.named_cache_root:
    return None

  # Make these configurable later if there is use case but for now it's fairly
  # safe values.
  # In practice, a fair chunk of bots are already recycled on a daily schedule
  # so this code doesn't have any effect to them, unless they are preloaded
  # with a really old cache.
  one_tib = 1024 * 1024 * 1024 * 1024
  cache_policies = local_caching.CachePolicies(
      max_cache_size=one_tib,
      min_free_space=options.min_free_space,
      max_items=50,
      max_age_secs=MAX_AGE_SECS)
  cache_root = six.text_type(os.path.abspath(options.named_cache_root))
  named = local_caching.NamedCache(cache_root, cache_policies, time_fn=time_fn)
  # Touch the requested named caches to minimize thrashing between tasks that
  # request some (but not all) of the same named caches.
  requested_names = [cache_name for cache_name, _, _ in options.named_caches]
  named.touch(*requested_names)
  return named
1551
1552
def parse_args(args):
  """Parses the command line, expanding --argsfile when it is given.

  Args:
    args: list of command line arguments.

  Returns:
    Tuple (parser, options, args) where parser is the parser returned by
    create_option_parser(), and options and args are what its parse_args()
    returned. options.cipd_enabled is converted with
    distutils.util.strtobool() when it is neither a bool nor an int.
  """
  # Create a fake mini-parser just to get out the "-a" command. Note that
  # it's not documented here; instead, it's documented in create_option_parser
  # even though that parser will never actually get to parse it. This is
  # because --argsfile is exclusive with all other options and arguments.
  file_argparse = argparse.ArgumentParser(add_help=False)
  file_argparse.add_argument('-a', '--argsfile')
  (file_args, nonfile_args) = file_argparse.parse_known_args(args)
  if file_args.argsfile:
    if nonfile_args:
      file_argparse.error('Can\'t specify --argsfile with '
                          'any other arguments (%s)' % nonfile_args)
    try:
      with open(file_args.argsfile, 'r') as f:
        args = json.load(f)
    except (IOError, OSError, ValueError) as e:
      # We don't error out here. "args" is left unchanged, i.e. it still only
      # holds the --argsfile flag, which the full parser below accepts; no
      # command is parsed out of it.
      print('Couldn\'t read arguments: %s' % e, file=sys.stderr)

  # Even if we failed to read the args, just call the normal parser now.
  parser = create_option_parser()
  options, args = parser.parse_args(args)
  if not isinstance(options.cipd_enabled, (bool, int)):
    options.cipd_enabled = distutils.util.strtobool(options.cipd_enabled)
  return (parser, options, args)
1581
1582
def _calc_named_cache_hint(named_cache, named_caches):
  """Returns the expected size of the missing named caches.

  Args:
    named_cache: object whose 'available' attribute holds the names of the
        named caches already present, or None when there is no named cache.
    named_caches: iterable of (name, path, hint) as parsed from --named-cache;
        hint is anything int() accepts.

  Returns:
    The sum of the positive hints of the requested caches whose name is not in
    named_cache.available; 0 when named_cache is None.
  """
  if named_cache is None:
    # process_named_cache_options() returns None when --named-cache-root is
    # empty; there is nothing to look up in that case.
    return 0
  present = named_cache.available
  logging.info('available named cache %s', present)
  size = 0
  for name, _, hint in named_caches:
    if name in present:
      continue
    hint = int(hint)
    if hint > 0:
      logging.info('named cache hint: %s, %d', name, hint)
      size += hint
  logging.info('total size of named cache hint: %d', size)
  return size
1596
1597
def _clean_cmd(parser, options, caches, root):
  """Cleans up cache dirs/files for --clean.

  Args:
    parser: option parser; its error() method is called when an option that
        cannot be combined with --clean is set.
    options: parsed options.
    caches: list of cache objects to trim, then clean up.
    root: path whose free space is logged and that is passed to
        local_caching.trim_caches().
  """
  if options.isolated:
    parser.error('Can\'t use --isolated with --clean.')
  if options.isolate_server:
    parser.error('Can\'t use --isolate-server with --clean.')
  if options.json:
    parser.error('Can\'t use --json with --clean.')
  if options.named_caches:
    parser.error('Can\'t use --named-cache with --clean.')
  if options.cas_instance or options.cas_digest:
    parser.error('Can\'t use --cas-instance, --cas-digest with --clean.')

  logging.info('initial free space: %d', file_path.get_free_space(root))

  if options.kvs_dir:
    kvs_dir = six.text_type(options.kvs_dir)
    if fs.isdir(kvs_dir):
      # Remove the kvs dir once its size reaches the fixed threshold.
      size = file_path.get_recursive_size(kvs_dir)
      if size >= _CAS_KVS_CACHE_THRESHOLD:
        logging.info('remove kvs dir with size: %d', size)
        file_path.rmtree(kvs_dir)

  # Trim first, then clean.
  local_caching.trim_caches(
      caches,
      root,
      min_free_space=options.min_free_space,
      max_age_secs=MAX_AGE_SECS)
  logging.info('free space after trim: %d', file_path.get_free_space(root))
  for c in caches:
    c.cleanup()
  logging.info('free space after cleanup: %d', file_path.get_free_space(root))
1631
1632
aludwin7556e0c2016-10-26 08:46:10 -07001633def main(args):
Marc-Antoine Ruelee6ca622017-11-29 11:19:16 -05001634 # Warning: when --argsfile is used, the strings are unicode instances, when
1635 # parsed normally, the strings are str instances.
aludwin7556e0c2016-10-26 08:46:10 -07001636 (parser, options, args) = parse_args(args)
maruel36a963d2016-04-08 17:15:49 -07001637
Joanna Wang40959bf2021-08-12 18:10:12 +00001638 # Must be logged after parse_args(), which eventually calls
1639 # logging_utils.prepare_logging() which expects no logs before its call.
1640 logging.info('Starting run_isolated script')
1641
Junji Watanabe1d83d282021-05-11 05:50:40 +00001642 SWARMING_SERVER = os.environ.get('SWARMING_SERVER')
1643 SWARMING_TASK_ID = os.environ.get('SWARMING_TASK_ID')
1644 if options.report_on_exception and SWARMING_SERVER:
1645 task_url = None
1646 if SWARMING_TASK_ID:
1647 task_url = '%s/task?id=%s' % (SWARMING_SERVER, SWARMING_TASK_ID)
1648 on_error.report_on_exception_exit(SWARMING_SERVER, source=task_url)
Takuto Ikutad4be2f12020-05-12 02:15:25 +00001649
Marc-Antoine Ruel5028ba22017-08-25 17:37:51 -04001650 if not file_path.enable_symlink():
Marc-Antoine Ruel5a024272019-01-15 20:11:16 +00001651 logging.warning('Symlink support is not enabled')
Marc-Antoine Ruel5028ba22017-08-25 17:37:51 -04001652
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001653 named_cache = process_named_cache_options(parser, options)
Marc-Antoine Ruel0d8b0f62018-09-10 14:40:35 +00001654 # hint is 0 if there's no named cache.
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001655 hint = _calc_named_cache_hint(named_cache, options.named_caches)
1656 if hint:
1657 # Increase the --min-free-space value by the hint, and recreate the
1658 # NamedCache instance so it gets the updated CachePolicy.
1659 options.min_free_space += hint
1660 named_cache = process_named_cache_options(parser, options)
1661
Marc-Antoine Ruel7139d912018-06-15 20:04:42 +00001662 # TODO(maruel): CIPD caches should be defined at an higher level here too, so
1663 # they can be cleaned the same way.
Takuto Ikutaf1c58442020-10-20 09:03:27 +00001664
1665 isolate_cache = isolateserver.process_cache_options(options, trim=False)
1666 cas_cache = process_cas_cache_options(options)
Takuto Ikuta00cf8fc2020-01-14 01:36:00 +00001667
Marc-Antoine Ruel7139d912018-06-15 20:04:42 +00001668 caches = []
1669 if isolate_cache:
1670 caches.append(isolate_cache)
Junji Watanabeb03450b2020-09-25 05:09:27 +00001671 if cas_cache:
1672 caches.append(cas_cache)
Marc-Antoine Ruel7139d912018-06-15 20:04:42 +00001673 if named_cache:
1674 caches.append(named_cache)
Takuto Ikuta6e2ff962019-10-29 12:35:27 +00001675 root = caches[0].cache_dir if caches else six.text_type(os.getcwd())
maruel36a963d2016-04-08 17:15:49 -07001676 if options.clean:
Takuto Ikutaae391c52020-12-03 08:43:45 +00001677 _clean_cmd(parser, options, caches, root)
maruel36a963d2016-04-08 17:15:49 -07001678 return 0
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001679
1680 # Trim must still be done for the following case:
1681 # - named-cache was used
1682 # - some entries, with a large hint, where missing
1683 # - --min-free-space was increased accordingly, thus trimming is needed
1684 # Otherwise, this will have no effect, as bot_main calls run_isolated with
1685 # --clean after each task.
Takuto Ikutac9ddff22021-02-18 07:58:39 +00001686 additional_buffer = _FREE_SPACE_BUFFER_FOR_CIPD_PACKAGES
Takuto Ikuta91cb5ca2021-03-17 07:19:30 +00001687 if options.kvs_dir:
Takuto Ikuta7f45c592021-02-09 05:57:05 +00001688 additional_buffer += _CAS_KVS_CACHE_THRESHOLD
Junji Watanabeaee69ad2021-04-28 03:17:34 +00001689 # Add some buffer for Go CLI.
1690 min_free_space = options.min_free_space + additional_buffer
1691
1692 def trim_caches_fn(stats):
1693 start = time.time()
1694 local_caching.trim_caches(
1695 caches, root, min_free_space=min_free_space, max_age_secs=MAX_AGE_SECS)
1696 duration = time.time() - start
1697 stats['duration'] = duration
1698 logging.info('trim_caches: took %d seconds', duration)
maruel36a963d2016-04-08 17:15:49 -07001699
Takuto Ikuta1ce61362021-11-16 05:44:17 +00001700 # Save state of cas cache not to overwrite state from go client.
Takuto Ikutaf1c58442020-10-20 09:03:27 +00001701 if cas_cache:
1702 cas_cache.save()
1703 cas_cache = None
1704
Takuto Ikutadc496672021-11-12 05:58:59 +00001705 if not args:
1706 parser.error('command to run is required.')
nodir55be77b2016-05-03 09:39:57 -07001707
Vadim Shtayura5d1efce2014-02-04 10:55:43 -08001708 auth.process_auth_options(parser, options)
nodir55be77b2016-05-03 09:39:57 -07001709
Takuto Ikutaae767b32020-05-11 01:22:19 +00001710 isolateserver.process_isolate_server_options(parser, options, False)
Junji Watanabeed9ce352020-09-25 12:32:07 +00001711 if ISOLATED_OUTDIR_PARAMETER in args and (not options.isolate_server and
1712 not options.cas_instance):
1713 parser.error('%s in args requires --isolate-server or --cas-instance' %
1714 ISOLATED_OUTDIR_PARAMETER)
1715
1716 if options.isolated and not options.isolate_server:
1717 parser.error('--isolated requires --isolate-server')
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001718
nodir90bc8dc2016-06-15 13:35:21 -07001719 if options.root_dir:
Takuto Ikuta6e2ff962019-10-29 12:35:27 +00001720 options.root_dir = six.text_type(os.path.abspath(options.root_dir))
Takuto Ikutad46ea762020-10-07 05:43:22 +00001721 else:
1722 options.root_dir = six.text_type(tempfile.mkdtemp(prefix='root'))
maruel12e30012015-10-09 11:55:35 -07001723 if options.json:
Takuto Ikuta6e2ff962019-10-29 12:35:27 +00001724 options.json = six.text_type(os.path.abspath(options.json))
nodir55be77b2016-05-03 09:39:57 -07001725
Marc-Antoine Ruel19dd8872017-11-28 18:33:39 -05001726 if any('=' not in i for i in options.env):
1727 parser.error(
1728 '--env required key=value form. value can be skipped to delete '
1729 'the variable')
Marc-Antoine Ruel7a68f712017-12-01 18:45:18 -05001730 options.env = dict(i.split('=', 1) for i in options.env)
Marc-Antoine Ruel19dd8872017-11-28 18:33:39 -05001731
1732 prefixes = {}
1733 cwd = os.path.realpath(os.getcwd())
1734 for item in options.env_prefix:
1735 if '=' not in item:
1736 parser.error(
1737 '--env-prefix %r is malformed, must be in the form `VAR=./path`'
1738 % item)
Marc-Antoine Ruel7a68f712017-12-01 18:45:18 -05001739 key, opath = item.split('=', 1)
Marc-Antoine Ruel19dd8872017-11-28 18:33:39 -05001740 if os.path.isabs(opath):
1741 parser.error('--env-prefix %r path is bad, must be relative.' % opath)
1742 opath = os.path.normpath(opath)
1743 if not os.path.realpath(os.path.join(cwd, opath)).startswith(cwd):
1744 parser.error(
Junji Watanabe38b28b02020-04-23 10:23:30 +00001745 '--env-prefix %r path is bad, must be relative and not contain `..`.'
1746 % opath)
Marc-Antoine Ruel19dd8872017-11-28 18:33:39 -05001747 prefixes.setdefault(key, []).append(opath)
1748 options.env_prefix = prefixes
Robert Iannuccibf5f84c2017-11-22 12:56:50 -08001749
nodirbe642ff2016-06-09 15:51:51 -07001750 cipd.validate_cipd_options(parser, options)
1751
Junji Watanabedc2f89e2021-11-08 08:44:30 +00001752 install_packages_fn = copy_local_packages
Ye Kuang1d096cb2020-06-26 08:38:21 +00001753 tmp_cipd_cache_dir = None
vadimsh902948e2017-01-20 15:57:32 -08001754 if options.cipd_enabled:
Ye Kuang1d096cb2020-06-26 08:38:21 +00001755 cache_dir = options.cipd_cache
1756 if not cache_dir:
1757 tmp_cipd_cache_dir = six.text_type(tempfile.mkdtemp())
1758 cache_dir = tmp_cipd_cache_dir
Takuto Ikuta1ce61362021-11-16 05:44:17 +00001759 install_packages_fn = (
1760 lambda run_dir, cas_dir, nsjail_dir: install_client_and_packages(
1761 run_dir,
1762 cipd.parse_package_args(options.cipd_packages),
1763 options.cipd_server,
1764 options.cipd_client_package,
1765 options.cipd_client_version,
1766 cache_dir=cache_dir,
1767 cas_dir=cas_dir,
1768 nsjail_dir=nsjail_dir,
1769 ))
nodirbe642ff2016-06-09 15:51:51 -07001770
nodird6160682017-02-02 13:03:35 -08001771 @contextlib.contextmanager
Junji Watanabeaee69ad2021-04-28 03:17:34 +00001772 def install_named_caches(run_dir, stats):
nodird6160682017-02-02 13:03:35 -08001773 # WARNING: this function depends on "options" variable defined in the outer
1774 # function.
Takuto Ikuta6e2ff962019-10-29 12:35:27 +00001775 assert six.text_type(run_dir), repr(run_dir)
Marc-Antoine Ruel49f9f8d2018-05-24 15:57:06 -04001776 assert os.path.isabs(run_dir), run_dir
Takuto Ikuta6e2ff962019-10-29 12:35:27 +00001777 named_caches = [(os.path.join(run_dir, six.text_type(relpath)), name)
1778 for name, relpath, _ in options.named_caches]
Junji Watanabeaee69ad2021-04-28 03:17:34 +00001779 install_start = time.time()
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001780 for path, name in named_caches:
Marc-Antoine Ruele79ddbf2018-06-13 18:33:07 +00001781 named_cache.install(path, name)
Junji Watanabeaee69ad2021-04-28 03:17:34 +00001782 install_duration = time.time() - install_start
1783 stats['install']['duration'] = install_duration
1784 logging.info('named_caches: install took %d seconds', install_duration)
nodird6160682017-02-02 13:03:35 -08001785 try:
1786 yield
1787 finally:
dnje289d132017-07-07 11:16:44 -07001788 # Uninstall each named cache, returning it to the cache pool. If an
1789 # uninstall fails for a given cache, it will remain in the task's
1790 # temporary space, get cleaned up by the Swarming bot, and be lost.
1791 #
1792 # If the Swarming bot cannot clean up the cache, it will handle it like
1793 # any other bot file that could not be removed.
Junji Watanabeaee69ad2021-04-28 03:17:34 +00001794 uninstall_start = time.time()
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001795 for path, name in reversed(named_caches):
Marc-Antoine Ruele79ddbf2018-06-13 18:33:07 +00001796 try:
Marc-Antoine Ruele9558372018-08-03 03:41:22 +00001797 # uninstall() doesn't trim but does call save() implicitly. Trimming
1798 # *must* be done manually via periodic 'run_isolated.py --clean'.
Marc-Antoine Ruele79ddbf2018-06-13 18:33:07 +00001799 named_cache.uninstall(path, name)
1800 except local_caching.NamedCacheError:
Takuto Ikuta463ecdd2021-03-05 09:35:38 +00001801 if sys.platform == 'win32':
1802 # Show running processes.
1803 sys.stderr.write("running process\n")
1804 subprocess42.check_call(['tasklist.exe', '/V'], stdout=sys.stderr)
1805
Junji Watanabed2ab86b2021-08-13 07:20:23 +00001806 error = (
1807 'Error while removing named cache %r at %r. The cache will be'
1808 ' lost.' % (path, name))
1809 logging.exception(error)
1810 on_error.report(error)
Junji Watanabeaee69ad2021-04-28 03:17:34 +00001811 uninstall_duration = time.time() - uninstall_start
1812 stats['uninstall']['duration'] = uninstall_duration
1813 logging.info('named_caches: uninstall took %d seconds',
1814 uninstall_duration)
nodirf33b8d62016-10-26 22:34:58 -07001815
Takuto Ikutaf3caa9b2020-11-02 05:38:26 +00001816 command = args
1817 if options.relative_cwd:
1818 a = os.path.normpath(os.path.abspath(options.relative_cwd))
1819 if not a.startswith(os.getcwd()):
1820 parser.error(
1821 '--relative-cwd must not try to escape the working directory')
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -05001822
Marc-Antoine Ruel1b65f4e2019-05-02 21:56:58 +00001823 containment_type = subprocess42.Containment.NONE
1824 if options.containment_type == 'AUTO':
1825 containment_type = subprocess42.Containment.AUTO
1826 if options.containment_type == 'JOB_OBJECT':
1827 containment_type = subprocess42.Containment.JOB_OBJECT
Anirudh Mathukumilli92d57b62021-08-04 23:21:57 +00001828 if options.containment_type == 'NSJAIL':
1829 containment_type = subprocess42.Containment.NSJAIL
1830 # TODO(https://crbug.com/1227833): This object should eventually contain the
1831 # path to the nsjail binary and the nsjail configuration file.
Marc-Antoine Ruel1b65f4e2019-05-02 21:56:58 +00001832 containment = subprocess42.Containment(
1833 containment_type=containment_type,
1834 limit_processes=options.limit_processes,
1835 limit_total_committed_memory=options.limit_total_committed_memory)
1836
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -05001837 data = TaskData(
1838 command=command,
Marc-Antoine Ruel95068cf2017-12-07 21:35:05 -05001839 relative_cwd=options.relative_cwd,
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -05001840 isolated_hash=options.isolated,
1841 storage=None,
1842 isolate_cache=isolate_cache,
Junji Watanabe54925c32020-09-08 00:56:18 +00001843 cas_instance=options.cas_instance,
1844 cas_digest=options.cas_digest,
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -05001845 outputs=options.output,
1846 install_named_caches=install_named_caches,
1847 leak_temp_dir=options.leak_temp_dir,
1848 root_dir=_to_unicode(options.root_dir),
1849 hard_timeout=options.hard_timeout,
1850 grace_period=options.grace_period,
1851 bot_file=options.bot_file,
1852 switch_to_account=options.switch_to_account,
1853 install_packages_fn=install_packages_fn,
Junji Watanabeb03450b2020-09-25 05:09:27 +00001854 cas_cache_dir=options.cas_cache,
1855 cas_cache_policies=local_caching.CachePolicies(
1856 max_cache_size=options.max_cache_size,
1857 min_free_space=options.min_free_space,
1858 max_items=None,
1859 max_age_secs=None,
1860 ),
Takuto Ikuta91cb5ca2021-03-17 07:19:30 +00001861 cas_kvs=options.kvs_dir,
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -05001862 env=options.env,
Marc-Antoine Ruel03c6fd12019-04-30 12:12:55 +00001863 env_prefix=options.env_prefix,
Marc-Antoine Ruel1b65f4e2019-05-02 21:56:58 +00001864 lower_priority=bool(options.lower_priority),
Junji Watanabeaee69ad2021-04-28 03:17:34 +00001865 containment=containment,
1866 trim_caches_fn=trim_caches_fn)
nodirbe642ff2016-06-09 15:51:51 -07001867 try:
nodir90bc8dc2016-06-15 13:35:21 -07001868 if options.isolate_server:
Marc-Antoine Ruelb8513132018-11-20 19:48:53 +00001869 server_ref = isolate_storage.ServerRef(
nodir90bc8dc2016-06-15 13:35:21 -07001870 options.isolate_server, options.namespace)
Marc-Antoine Ruelb8513132018-11-20 19:48:53 +00001871 storage = isolateserver.get_storage(server_ref)
nodir90bc8dc2016-06-15 13:35:21 -07001872 with storage:
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -05001873 data = data._replace(storage=storage)
nodirf33b8d62016-10-26 22:34:58 -07001874 # Hashing schemes used by |storage| and |isolate_cache| MUST match.
Marc-Antoine Ruelb8513132018-11-20 19:48:53 +00001875 assert storage.server_ref.hash_algo == server_ref.hash_algo
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -05001876 return run_tha_test(data, options.json)
1877 return run_tha_test(data, options.json)
Junji Watanabe38b28b02020-04-23 10:23:30 +00001878 except (cipd.Error, local_caching.NamedCacheError,
1879 local_caching.NoMoreSpace) as ex:
Marc-Antoine Ruelf899c482019-10-10 23:32:06 +00001880 print(ex.message, file=sys.stderr)
Junji Watanabed2ab86b2021-08-13 07:20:23 +00001881 on_error.report(None)
nodirbe642ff2016-06-09 15:51:51 -07001882 return 1
Ye Kuang1d096cb2020-06-26 08:38:21 +00001883 finally:
1884 if tmp_cipd_cache_dir is not None:
1885 try:
1886 file_path.rmtree(tmp_cipd_cache_dir)
1887 except OSError:
1888 logging.exception('Remove tmp_cipd_cache_dir=%s failed',
1889 tmp_cipd_cache_dir)
1890 # Best effort clean up. Failed to do so doesn't affect the outcome.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001891
1892
if __name__ == '__main__':
  # Script entry point; nothing below runs when this module is imported.
  # NOTE(review): presumably this turns off OS-level error reporting for the
  # process -- confirm against subprocess42.inhibit_os_error_reporting().
  subprocess42.inhibit_os_error_reporting()
  # Make sure the process always runs with the correct encoding.
  fix_encoding.fix_encoding()
  # The user agent handed to the net module names this script and its version.
  user_agent = 'run_isolated.py/' + __version__
  net.set_user_agent(user_agent)
  # Run main() on the command-line arguments (program name stripped) and use
  # its return value as the process exit status.
  exit_code = main(sys.argv[1:])
  sys.exit(exit_code)
Marc-Antoine Ruel90c98162013-12-18 15:11:57 -05001898 sys.exit(main(sys.argv[1:]))