blob: b89b673fedfbf07857196ecd79b04e3d2e96efd1 [file] [log] [blame]
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001#!/usr/bin/env python
maruelea586f32016-04-05 11:11:33 -07002# Copyright 2012 The LUCI Authors. All rights reserved.
maruelf1f5e2a2016-05-25 17:10:39 -07003# Use of this source code is governed under the Apache License, Version 2.0
4# that can be found in the LICENSE file.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00005
nodir55be77b2016-05-03 09:39:57 -07006"""Runs a command with optional isolated input/output.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00007
run_isolated takes care of setting up a temporary environment, running a
command, and tearing it down.
nodir55be77b2016-05-03 09:39:57 -070010
Marc-Antoine Rueleed2f3a2019-03-14 00:00:40 +000011It handles downloading and uploading isolated files, mapping CIPD packages and
12reusing stateful named caches.
13
14The isolated files, CIPD packages and named caches are kept as a global LRU
15cache.
Marc-Antoine Ruel2283ad12014-02-09 11:14:57 -050016
Roberto Carrillo71ade6d2018-10-08 22:30:24 +000017Any ${EXECUTABLE_SUFFIX} on the command line or the environment variables passed
18with the --env option will be replaced with ".exe" string on Windows and "" on
19other platforms.
nodirbe642ff2016-06-09 15:51:51 -070020
Roberto Carrillo71ade6d2018-10-08 22:30:24 +000021Any ${ISOLATED_OUTDIR} on the command line or the environment variables passed
22with the --env option will be replaced by the location of a temporary directory
23upon execution of the command specified in the .isolated file. All content
24written to this directory will be uploaded upon termination and the .isolated
25file describing this directory will be printed to stdout.
bpastene447c1992016-06-20 15:21:47 -070026
Marc-Antoine Rueleed2f3a2019-03-14 00:00:40 +000027Any ${SWARMING_BOT_FILE} on the command line or the environment variables passed
28with the --env option will be replaced by the value of the --bot-file parameter.
29This file is used by a swarming bot to communicate state of the host to tasks.
30It is written to by the swarming bot's on_before_task() hook in the swarming
31server's custom bot_config.py.
32
33See
34https://chromium.googlesource.com/infra/luci/luci-py.git/+/master/appengine/swarming/doc/Magic-Values.md
35for all the variables.
36
37See
38https://chromium.googlesource.com/infra/luci/luci-py.git/+/master/appengine/swarming/swarming_bot/config/bot_config.py
39for more information about bot_config.py.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000040"""
41
Marc-Antoine Ruelf899c482019-10-10 23:32:06 +000042from __future__ import print_function
43
44__version__ = '1.0.1'
maruel@chromium.orgdedbf492013-09-12 20:42:11 +000045
aludwin7556e0c2016-10-26 08:46:10 -070046import argparse
maruel064c0a32016-04-05 11:47:15 -070047import base64
iannucci96fcccc2016-08-30 15:52:22 -070048import collections
vadimsh232f5a82017-01-20 19:23:44 -080049import contextlib
Ye Kuangfff1e502020-07-13 13:21:57 +000050import distutils
Sadaf Matinkhoo10743a62018-03-29 16:28:58 -040051import errno
aludwin7556e0c2016-10-26 08:46:10 -070052import json
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000053import logging
54import optparse
55import os
Takuto Ikuta5c59a842020-01-24 03:05:24 +000056import platform
Marc-Antoine Ruel8b11dbd2018-05-18 14:31:22 -040057import re
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000058import sys
59import tempfile
maruel064c0a32016-04-05 11:47:15 -070060import time
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000061
Marc-Antoine Ruel016c7602019-04-02 18:31:13 +000062from utils import tools
63tools.force_local_third_party()
vadimsh@chromium.orga4326472013-08-24 02:05:41 +000064
Marc-Antoine Ruel016c7602019-04-02 18:31:13 +000065# third_party/
66from depot_tools import fix_encoding
Takuto Ikuta6e2ff962019-10-29 12:35:27 +000067import six
Marc-Antoine Ruel016c7602019-04-02 18:31:13 +000068
69# pylint: disable=ungrouped-imports
70import auth
71import cipd
72import isolate_storage
73import isolateserver
74import local_caching
75from libs import luci_context
Vadim Shtayura6b555c12014-07-23 16:22:18 -070076from utils import file_path
maruel12e30012015-10-09 11:55:35 -070077from utils import fs
maruel064c0a32016-04-05 11:47:15 -070078from utils import large
Marc-Antoine Ruelf74cffe2015-07-15 15:21:34 -040079from utils import logging_utils
Ye Kuang2dd17442020-04-22 08:45:52 +000080from utils import net
Marc-Antoine Ruelcfb60852014-07-02 15:22:00 -040081from utils import on_error
Marc-Antoine Ruelc44f5722015-01-08 16:10:01 -050082from utils import subprocess42
maruel@chromium.orgdedbf492013-09-12 20:42:11 +000083
vadimsh@chromium.orga4326472013-08-24 02:05:41 +000084
# Magic variables that can be found in the isolate task command line. They are
# substituted by replace_parameters() before the command is run.
ISOLATED_OUTDIR_PARAMETER = '${ISOLATED_OUTDIR}'
EXECUTABLE_SUFFIX_PARAMETER = '${EXECUTABLE_SUFFIX}'
SWARMING_BOT_FILE_PARAMETER = '${SWARMING_BOT_FILE}'


# The name of the log file to use.
RUN_ISOLATED_LOG_FILE = 'run_isolated.log'


# The name of the log to use for the run_test_cases.py command.
RUN_TEST_CASES_LOG = 'run_test_cases.log'


# Use short names for temporary directories. This is driven by Windows, which
# imposes a relatively short maximum path length of 260 characters, often
# referred to as MAX_PATH. It is relatively easy to create files with longer
# path length. A use case is with recursive dependency trees like npm packages.
#
# It is recommended to start the script with a `root_dir` as short as
# possible.
# - ir stands for isolated_run
# - io stands for isolated_out
# - it stands for isolated_tmp
# - ic stands for isolated_client
# - cc presumably stands for cas_client (see _CAS_CLIENT_DIR)
ISOLATED_RUN_DIR = u'ir'
ISOLATED_OUT_DIR = u'io'
ISOLATED_TMP_DIR = u'it'
ISOLATED_CLIENT_DIR = u'ic'
_CAS_CLIENT_DIR = u'cc'

# TODO(tikuta): take these parameters from luci-config?
# Update tag by `./client/update_isolated.sh`.
# Or take revision from
# https://ci.chromium.org/p/infra-internal/g/infra-packagers/console
ISOLATED_PACKAGE = 'infra/tools/luci/isolated/${platform}'
ISOLATED_REVISION = 'git_revision:3ccf4cc0119188dbc4befff330348d972b15711d'
_CAS_PACKAGE = 'infra/tools/luci/cas/${platform}'
# TODO(jwata): pin a stable version.
_CAS_REVISION = 'latest'

# Valid named cache names: 1 to 4096 characters out of [a-z0-9_].
# Keep synced with task_request.py
CACHE_NAME_RE = re.compile(r'^[a-z0-9_]{1,4096}$')
129
marueld928c862017-06-08 08:20:04 -0700130OUTLIVING_ZOMBIE_MSG = """\
131*** Swarming tried multiple times to delete the %s directory and failed ***
132*** Hard failing the task ***
133
134Swarming detected that your testing script ran an executable, which may have
135started a child executable, and the main script returned early, leaving the
136children executables playing around unguided.
137
138You don't want to leave children processes outliving the task on the Swarming
139bot, do you? The Swarming bot doesn't.
140
141How to fix?
142- For any process that starts children processes, make sure all children
143 processes terminated properly before each parent process exits. This is
144 especially important in very deep process trees.
145 - This must be done properly both in normal successful task and in case of
146 task failure. Cleanup is very important.
147- The Swarming bot sends a SIGTERM in case of timeout.
148 - You have %s seconds to comply after the signal was sent to the process
149 before the process is forcibly killed.
150- To achieve not leaking children processes in case of signals on timeout, you
151 MUST handle signals in each executable / python script and propagate them to
152 children processes.
153 - When your test script (python or binary) receives a signal like SIGTERM or
154 CTRL_BREAK_EVENT on Windows), send it to all children processes and wait for
155 them to terminate before quitting.
156
157See
Marc-Antoine Ruelc7243592018-05-24 17:04:04 -0400158https://chromium.googlesource.com/infra/luci/luci-py.git/+/master/appengine/swarming/doc/Bot.md#Graceful-termination_aka-the-SIGTERM-and-SIGKILL-dance
marueld928c862017-06-08 08:20:04 -0700159for more information.
160
161*** May the SIGKILL force be with you ***
162"""
163
164
# Currently hardcoded. Eventually could be exposed as a flag once there's value.
# 3 weeks, expressed in seconds.
MAX_AGE_SECS = 21*24*60*60

# TODO(1099655): Enable this once all prod issues are gone.
_USE_GO_ISOLATED_TO_UPLOAD = False
Marc-Antoine Ruel5d7606b2018-06-15 19:06:12 +0000171
# Immutable bundle of everything needed to run one task. Field order matters:
# instances may be built positionally.
TaskData = collections.namedtuple(
    'TaskData',
    (
        # Command line to use, as a list of strings. It is used independently
        # of whatever the isolated file specifies.
        'command',
        # Directory, relative, in which the command is started.
        'relative_cwd',
        # Arguments, as a list of strings, appended to the command specified
        # in the isolated file.
        'extra_args',
        # Hash of the .isolated file to retrieve in order to recreate the tree
        # of files needed by the target executable. The command specified in
        # the .isolated is executed. Mutually exclusive with command argument.
        'isolated_hash',
        # isolateserver.Storage instance used to retrieve remote objects. It
        # references an isolateserver.StorageApi, which does the actual I/O.
        'storage',
        # isolateserver.LocalCache instance caching the retrieved objects so
        # they are not fetched constantly. Can be on-disk or in-memory.
        'isolate_cache',
        # Digest of the input root on RBE-CAS.
        'cas_digest',
        # Full CAS instance name.
        'cas_instance',
        # Paths, relative to root_dir, to put into the output isolated bundle
        # upon task completion (see link_outputs_to_outdir).
        'outputs',
        # Function (run_dir) => context manager that installs named caches
        # into |run_dir|.
        'install_named_caches',
        # When True, the temporary directory is deliberately leaked for later
        # examination.
        'leak_temp_dir',
        # Directory in which the temporary directory is created. When not
        # specified, a random temporary directory is created.
        'root_dir',
        # The process is killed if it lasts more than this many seconds.
        'hard_timeout',
        # Number of seconds to wait between SIGTERM and SIGKILL.
        'grace_period',
        # Path to a file with bot state, used in place of
        # ${SWARMING_BOT_FILE} task command line argument.
        'bot_file',
        # Logical account to switch LUCI_CONTEXT into.
        'switch_to_account',
        # Context manager dir => CipdInfo, see install_client_and_packages.
        'install_packages_fn',
        # Use go isolated client.
        'use_go_isolated',
        # Cache directory for go `isolated` or `cas` client.
        'go_cache_dir',
        # Parameters passed to go `isolated` or `cas` client.
        'go_cache_policies',
        # Environment variables to set.
        'env',
        # Environment variables to mutate with relative directories.
        # Example: {"ENV_KEY": ['relative', 'paths', 'to', 'prepend']}
        'env_prefix',
        # Lowers the task process priority.
        'lower_priority',
        # subprocess42.Containment instance. Can be None.
        'containment',
    ))
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -0500238
239
Marc-Antoine Ruelee6ca622017-11-29 11:19:16 -0500240def _to_str(s):
241 """Downgrades a unicode instance to str. Pass str through as-is."""
242 if isinstance(s, str):
243 return s
244 # This is technically incorrect, especially on Windows. In theory
245 # sys.getfilesystemencoding() should be used to use the right 'ANSI code
246 # page' on Windows, but that causes other problems, as the character set
247 # is very limited.
248 return s.encode('utf-8')
249
250
def _to_unicode(s):
  """Returns |s| as a unicode string, decoding byte strings as UTF-8.

  Unicode instances and None are passed through as-is.
  """
  already_text = isinstance(s, six.text_type) or s is None
  return s if already_text else s.decode('utf-8')
256
257
def make_temp_dir(prefix, root_dir):
  """Creates a new unique temporary directory and returns its path as text.

  Arguments:
    prefix: prefix given to the name of the created directory.
    root_dir: directory in which the new directory is created.
  """
  created = tempfile.mkdtemp(dir=root_dir, prefix=prefix)
  return six.text_type(created)
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +0000261
262
@contextlib.contextmanager
def set_luci_context_account(account, tmp_dir):
  """Context manager switching the LUCI_CONTEXT account used by the task.

  Nothing is changed in any of these cases:
  - 'account' is None or ''. This happens when run_isolated.py is called
    without the '--switch-to-account' flag. If run_isolated.py is itself
    running in some LUCI_CONTEXT environment, the task just inherits whatever
    account is already set. This may happen if users invoke run_isolated.py
    explicitly from their code.
  - LUCI_CONTEXT-based auth is not in use.
  - The requested account is already the default one.

  If the requested account is not defined in the context, switches to
  non-authenticated access. This happens for Swarming tasks that don't use
  'task' service accounts.

  Arguments:
    account: logical account ID to switch to.
    tmp_dir: directory handed to luci_context.write() as _tmpdir.
  """
  # 'local_auth' is only looked up when a switch was actually requested. See
  # LUCI_CONTEXT.md for its format.
  local_auth = luci_context.read('local_auth') if account else None
  if not local_auth or local_auth.get('default_account_id') == account:
    # Not switching, not using LUCI_CONTEXT auth at all, or already set.
    yield
    return

  known_ids = set(entry['id'] for entry in (local_auth.get('accounts') or []))
  if account not in known_ids:
    logging.warning(
        'Requested LUCI_CONTEXT account %r is not available (have only %r), '
        'disabling authentication', account, sorted(known_ids))
    local_auth.pop('default_account_id', None)
  else:
    logging.info('Switching default LUCI_CONTEXT account to %r', account)
    local_auth['default_account_id'] = account

  with luci_context.write(_tmpdir=tmp_dir, local_auth=local_auth):
    yield
309
310
def process_command(command, out_dir, bot_file):
  """Substitutes the magic parameters in every argument of a command line.

  A new list is returned; |command| itself is left untouched.

  Raises:
    ValueError if a parameter is requested in |command| but its value is not
      provided.
  """
  processed = []
  for argument in command:
    processed.append(replace_parameters(argument, out_dir, bot_file))
  return processed
319
320
def replace_parameters(arg, out_dir, bot_file):
  """Expands the magic parameter tokens found in a single string.

  ${EXECUTABLE_SUFFIX} is always expanded. ${ISOLATED_OUTDIR} requires
  |out_dir|. ${SWARMING_BOT_FILE} is expanded only when |bot_file| is given;
  otherwise a warning is logged and the token is left as-is.

  Raises:
    ValueError if a parameter is requested in |arg| but its value is not
      provided.
  """
  result = arg.replace(EXECUTABLE_SUFFIX_PARAMETER, cipd.EXECUTABLE_SUFFIX)
  substituted_path = False

  if ISOLATED_OUTDIR_PARAMETER in result:
    if not out_dir:
      raise ValueError(
          'output directory is requested in command or env var, but not '
          'provided; please specify one')
    result = result.replace(ISOLATED_OUTDIR_PARAMETER, out_dir)
    substituted_path = True

  if SWARMING_BOT_FILE_PARAMETER in result:
    if not bot_file:
      logging.warning('SWARMING_BOT_FILE_PARAMETER found in command or env '
                      'var, but no bot_file specified. Leaving parameter '
                      'unchanged.')
    else:
      result = result.replace(SWARMING_BOT_FILE_PARAMETER, bot_file)
      substituted_path = True

  if not substituted_path:
    return result
  # Slashes are converted only when a path parameter was substituted, because
  # of arguments like '${ISOLATED_OUTDIR}/foo/bar'.
  return result.replace('/', os.sep)
maruela9cfd6f2015-09-15 11:03:15 -0700350
351
Roberto Carrillo71ade6d2018-10-08 22:30:24 +0000352
def get_command_env(tmp_dir, cipd_info, run_dir, env, env_prefixes, out_dir,
                    bot_file):
  """Returns full OS environment to run a command in.

  Starts from a copy of os.environ, applies |env|, puts the directory with the
  cipd binary in front of PATH, exposes the CIPD_CACHE_DIR env var, installs
  all env_prefixes and points the temporary directory variables at |tmp_dir|.

  Args:
    tmp_dir: temp directory.
    cipd_info: CipdInfo object if cipd client is used, None if not.
    run_dir: The root directory the isolated tree is mapped in.
    env: environment variables to use. A variable with an empty value is
        removed from the environment instead of being set.
    env_prefixes: {"ENV_KEY": ['paths', 'relative', 'to', 'run_dir']}; the
        paths are joined to |run_dir| and prepended to the current value.
    out_dir: Isolated output directory. Required to be != None if any of the
        env vars contain ISOLATED_OUTDIR_PARAMETER.
    bot_file: Required to be != None if any of the env vars contain
        SWARMING_BOT_FILE_PARAMETER.

  Returns:
    dict mapping environment variable names to their values.

  Raises:
    ValueError if a value in |env| requests ISOLATED_OUTDIR_PARAMETER while
      |out_dir| is not provided.
  """
  out = os.environ.copy()
  for k, v in env.items():
    if not v:
      # An empty value means "unset this variable".
      out.pop(k, None)
    else:
      out[k] = replace_parameters(v, out_dir, bot_file)

  if cipd_info:
    bin_dir = _to_str(os.path.dirname(cipd_info.client.binary_path))
    # PATH can be absent: either the parent environment has none, or |env|
    # just removed it above. Do not crash with KeyError in that case; expose
    # the cipd directory alone.
    if 'PATH' in out:
      out['PATH'] = '%s%s%s' % (bin_dir, os.pathsep, out['PATH'])
    else:
      out['PATH'] = bin_dir
    out['CIPD_CACHE_DIR'] = _to_str(cipd_info.cache_dir)

  for key, paths in env_prefixes.items():
    assert isinstance(paths, list), paths
    paths = [os.path.normpath(os.path.join(run_dir, p)) for p in paths]
    cur = out.get(key)
    if cur:
      # Keep the pre-existing value, after the prepended paths.
      paths.append(cur)
    out[key] = _to_str(os.path.pathsep.join(paths))

  tmp_dir = _to_str(tmp_dir)
  # pylint: disable=line-too-long
  # * python respects $TMPDIR, $TEMP, and $TMP in this order, regardless of
  #   platform. So $TMPDIR must be set on all platforms.
  #   https://github.com/python/cpython/blob/2.7/Lib/tempfile.py#L155
  out['TMPDIR'] = tmp_dir
  if sys.platform == 'win32':
    # * chromium's base utils uses GetTempPath().
    #    https://cs.chromium.org/chromium/src/base/files/file_util_win.cc?q=GetTempPath
    # * Go uses GetTempPath().
    # * GetTempPath() uses %TMP%, then %TEMP%, then other stuff. So %TMP% must
    #   be set.
    #   https://docs.microsoft.com/en-us/windows/desktop/api/fileapi/nf-fileapi-gettemppathw
    out['TMP'] = tmp_dir
    # https://blogs.msdn.microsoft.com/oldnewthing/20150417-00/?p=44213
    out['TEMP'] = tmp_dir
  elif sys.platform == 'darwin':
    # * Chromium uses a hack on macOS before calling into
    #   NSTemporaryDirectory().
    #   https://cs.chromium.org/chromium/src/base/files/file_util_mac.mm?q=GetTempDir
    #   https://developer.apple.com/documentation/foundation/1409211-nstemporarydirectory
    out['MAC_CHROMIUM_TMPDIR'] = tmp_dir
  else:
    # TMPDIR is specified as the POSIX standard envvar for the temp directory.
    #   http://pubs.opengroup.org/onlinepubs/9699919799/basedefs/V1_chap08.html
    # * mktemp on linux respects $TMPDIR.
    # * Chromium respects $TMPDIR on linux.
    #   https://cs.chromium.org/chromium/src/base/files/file_util_posix.cc?q=GetTempDir
    # * Go uses $TMPDIR.
    #   https://go.googlesource.com/go/+/go1.10.3/src/os/file_unix.go#307
    pass
  return out
vadimsh232f5a82017-01-20 19:23:44 -0800423
424
def run_command(
    command, cwd, env, hard_timeout, grace_period, lower_priority, containment):
  """Runs the command and waits for it, enforcing the hard timeout.

  The process is started detached. On hard timeout, or when a stop signal is
  received by this process, the child is terminated, given |grace_period|
  seconds to exit, then killed.

  Arguments:
    command: command line, handed to subprocess42.Popen.
    cwd: working directory of the child process.
    env: environment of the child process.
    hard_timeout: seconds to wait before terminating the process; a falsy
        value means no timeout.
    grace_period: seconds to wait after termination before killing the
        process; a falsy value means waiting without limit.
    lower_priority: forwarded to subprocess42.Popen.
    containment: forwarded to subprocess42.Popen.

  Returns:
    tuple(process exit code, bool if had a hard timeout)
  """
  logging.info(
      'run_command(%s, %s, %s, %s, %s, %s)',
      command, cwd, hard_timeout, grace_period, lower_priority, containment)

  exit_code = None
  had_hard_timeout = False
  with tools.Profiler('RunTest'):
    proc = None
    # A list so that the nested handler can record the signal without a
    # nonlocal declaration.
    had_signal = []
    try:
      # TODO(maruel): This code is imperfect. It doesn't handle well signals
      # during the download phase and there's short windows were things can go
      # wrong.
      def handler(signum, _frame):
        # Only the first signal received once the process exists is acted
        # upon. It is surfaced as a TimeoutExpired so it goes through the
        # same termination path as a hard timeout.
        if proc and not had_signal:
          logging.info('Received signal %d', signum)
          had_signal.append(True)
          raise subprocess42.TimeoutExpired(command, None)

      proc = subprocess42.Popen(
          command, cwd=cwd, env=env, detached=True, close_fds=True,
          lower_priority=lower_priority, containment=containment)
      with subprocess42.set_signal_handler(subprocess42.STOP_SIGNALS, handler):
        try:
          exit_code = proc.wait(hard_timeout or None)
        except subprocess42.TimeoutExpired:
          # Reached on a real timeout or when handler() raised. Only the
          # former is reported as a hard timeout.
          if not had_signal:
            logging.warning('Hard timeout')
            had_hard_timeout = True
          logging.warning('Sending SIGTERM')
          proc.terminate()

      # Ignore signals in grace period. Forcibly give the grace period to the
      # child process.
      if exit_code is None:
        ignore = lambda *_: None
        with subprocess42.set_signal_handler(subprocess42.STOP_SIGNALS, ignore):
          try:
            exit_code = proc.wait(grace_period or None)
          except subprocess42.TimeoutExpired:
            # Now kill for real. The user can distinguish between the
            # following states:
            # - signal but process exited within grace period,
            #   hard_timed_out will be set but the process exit code will be
            #   script provided.
            # - processed exited late, exit code will be -9 on posix.
            logging.warning('Grace exhausted; sending SIGKILL')
            proc.kill()
      logging.info('Waiting for process exit')
      exit_code = proc.wait()
    except OSError as e:
      # This is not considered to be an internal error. The executable simply
      # does not exist.
      sys.stderr.write(
          '<The executable does not exist, a dependent library is missing or '
          'the command line is too long>\n'
          '<Check for missing .so/.dll in the .isolate or GN file or length of '
          'command line args>\n'
          '<Command: %s, Exception: %s>\n' % (command, e))
      if os.environ.get('SWARMING_TASK_ID'):
        # Give an additional hint when running as a swarming task.
        sys.stderr.write(
            '<See the task\'s page for commands to help diagnose this issue '
            'by reproducing the task locally>\n')
      exit_code = 1
  # The mask renders negative exit codes as unsigned 32 bits hex values.
  logging.info(
      'Command finished with exit code %d (%s)',
      exit_code, hex(0xffffffff & exit_code))
  return exit_code, had_hard_timeout
maruela9cfd6f2015-09-15 11:03:15 -0700501
502
def _run_go_cmd_and_wait(cmd):
  """Runs an external Go command, `isolated` or `cas`, until it completes.

  While this is a generic function to launch a subprocess, it has logic that
  is specific to Go `isolated` and `cas` for waiting and logging.

  Arguments:
    cmd: command line, as a list of strings.

  Returns:
    The subprocess object.

  Raises:
    ValueError if the command exits with a non-zero code, or if it is still
      running after the maximum wait and had to be stopped.
  """
  cmd_str = ' '.join(cmd)
  try:
    proc = subprocess42.Popen(cmd)

    check_period_sec = 30
    max_checks = 100
    # max timeout = max_checks * check_period_sec = 50 minutes
    for attempt in range(1, max_checks + 1):
      # Waiting in short periods and printing in between is to prevent I/O
      # timeout error during setup.
      try:
        retcode = proc.wait(check_period_sec)
      except subprocess42.TimeoutExpired:
        print('still running (after %d seconds)' % (attempt * check_period_sec))
        continue
      if retcode != 0:
        raise ValueError("retcode is not 0: %s (cmd=%s)" % (retcode, cmd_str))
      return proc

    # Every check timed out: stop the process, gently first.
    proc.terminate()
    try:
      proc.wait(check_period_sec)
    except subprocess42.TimeoutExpired:
      logging.exception(
          "failed to terminate? timeout happened after %d seconds",
          check_period_sec)
      proc.kill()
    proc.wait()
    # Raise unconditionally, because |proc| was forcefully terminated.
    raise ValueError("timedout after %d seconds (cmd=%s)" %
                     (check_period_sec * max_checks, cmd_str))
  except Exception:
    logging.exception('Failed to run Go cmd %s', cmd_str)
    raise
Ye Kuangc0cf9ca2020-07-16 08:56:51 +0000550
551
def _fetch_and_map_with_cas(cas_client, digest, instance, output_dir, cache_dir,
                            policies):
  """Fetches a CAS tree with the `cas` client and maps it into output_dir.

  Arguments:
    cas_client: path to the cas client executable.
    digest: digest passed to the client as -digest.
    instance: CAS instance passed to the client as -cas-instance.
    output_dir: directory in which the tree is created.
    cache_dir: cache directory used by the client.
    policies: object providing max_items, max_cache_size and min_free_space.

  Returns:
    dict of download stats with keys 'duration', 'items_cold' and 'items_hot'.
  """
  started_at = time.time()
  stats_fd, stats_path = tempfile.mkstemp(
      prefix=u'fetch-and-map-result-', suffix=u'.json')
  # Only the path is needed; the client writes the file itself.
  os.close(stats_fd)
  try:
    download_cmd = [cas_client, 'download']
    download_cmd += ['-digest', digest, '-cas-instance', instance]
    # flags for cache.
    download_cmd += [
        '-cache-dir', cache_dir,
        '-cache-max-items', str(policies.max_items),
        '-cache-max-size', str(policies.max_cache_size),
        '-cache-min-free-space', str(policies.min_free_space),
    ]
    # flags for output.
    download_cmd += ['-dir', output_dir, '-dump-stats-json', stats_path]
    _run_go_cmd_and_wait(download_cmd)

    with open(stats_path) as stats_file:
      stats = json.load(stats_file)

    return {
        'duration': time.time() - started_at,
        'items_cold': stats['items_cold'],
        'items_hot': stats['items_hot'],
    }
  finally:
    fs.remove(stats_path)
598
599
def _fetch_and_map_with_go_isolated(isolated_hash, storage, outdir,
                                    go_cache_dir, policies, isolated_client):
  """Fetches an isolated tree with the go `isolated` client and maps it.

  Arguments:
    isolated_hash: hash passed to the client as -isolated.
    storage: object whose server_ref provides the server url and namespace.
    outdir: directory in which the tree is created.
    go_cache_dir: cache directory used by the client.
    policies: object providing max_items, max_cache_size and min_free_space.
    isolated_client: path to the isolated client executable.

  Returns:
    tuple(bundle, stats), where bundle is an isolateserver.IsolatedBundle with
    only command and relative_cwd filled in, and stats is a dict with keys
    'duration', 'items_cold' and 'items_hot'.
  """
  started_at = time.time()
  server_ref = storage.server_ref
  result_fd, result_path = tempfile.mkstemp(
      prefix=u'fetch-and-map-result-', suffix=u'.json')
  # Only the path is needed; the client writes the file itself.
  os.close(result_fd)
  try:
    download_cmd = [isolated_client, 'download']
    download_cmd += [
        '-isolate-server', server_ref.url,
        '-namespace', server_ref.namespace,
        '-isolated', isolated_hash,
    ]
    # flags for cache
    download_cmd += [
        '-cache-dir', go_cache_dir,
        '-cache-max-items', str(policies.max_items),
        '-cache-max-size', str(policies.max_cache_size),
        '-cache-min-free-space', str(policies.min_free_space),
    ]
    # flags for output
    download_cmd += [
        '-output-dir', outdir,
        '-fetch-and-map-result-json', result_path,
    ]
    _run_go_cmd_and_wait(download_cmd)

    with open(result_path) as result_file:
      result = json.load(result_file)

    isolated = result['isolated']
    bundle = isolateserver.IsolatedBundle(filter_cb=None)
    # Only following properties are used in caller.
    bundle.command = isolated.get('command')
    bundle.relative_cwd = isolated.get('relative_cwd')

    stats = {
        'duration': time.time() - started_at,
        'items_cold': result['items_cold'],
        'items_hot': result['items_hot'],
    }
    return bundle, stats
  finally:
    fs.remove(result_path)
656
657
658# TODO(crbug.com/932396): remove this function.
def fetch_and_map(isolated_hash, storage, cache, outdir):
  """Fetches an isolated tree, creates the tree and returns (bundle, stats).

  stats is a dict with the 'duration' of the fetch in seconds, and the
  'items_cold' and 'items_hot' entries, which are base64 encoded large.pack()
  of the sorted cache.added items and of the used-but-not-added items.
  """
  started_at = time.time()
  bundle = isolateserver.fetch_isolated(
      isolated_hash=isolated_hash,
      storage=storage,
      cache=cache,
      outdir=outdir,
      use_symlinks=False)

  # Hot items are the ones used minus the ones that had to be added; Counter
  # subtraction keeps the multiplicity.
  used = collections.Counter(cache.used)
  added = collections.Counter(cache.added)
  hot = (used - added).elements()

  def _packed(items):
    return base64.b64encode(large.pack(sorted(items))).decode()

  stats = {'duration': time.time() - started_at}
  stats['items_cold'] = _packed(cache.added)
  stats['items_hot'] = _packed(hot)
  return bundle, stats
675
676
def link_outputs_to_outdir(run_dir, out_dir, outputs):
  """Copies every named output from run_dir into out_dir for upload.

  Arguments:
  - run_dir: directory the outputs are read from.
  - out_dir: directory the outputs are placed in; the needed sub directories
    are created first through isolateserver.create_directories().
  - outputs: relative paths of the outputs; nothing is done when it is empty
    or None.
  """
  if outputs:
    isolateserver.create_directories(out_dir, outputs)
    for relpath in outputs:
      source = os.path.join(run_dir, relpath)
      destination = os.path.join(out_dir, relpath)
      copy_recursively(source, destination)
687
688
def copy_recursively(src, dst):
  """Efficiently copies a file or directory from src to dst.

  `src` may be a file, directory, or a symlink to a file or directory.
  All symlinks are replaced with their targets, so the resulting
  directory structure under dst will never have any symlinks.

  To increase speed, copy_recursively hardlinks individual files into the
  (newly created) directory structure if possible, unlike Python's
  shutil.copytree().

  OSError is never propagated to the caller: a missing path or broken symlink
  is logged as a warning, any other OSError (including a chain of symlinks
  that is too long or cyclic) is logged at info level, and the entry is
  skipped.

  Arguments:
  - src: path to copy from.
  - dst: path to copy to.
  """
  # Upper bound on the number of symlinks followed for a single entry. Cyclic
  # symlinks would otherwise keep the loop below spinning forever. 40 is the
  # limit Linux applies when it resolves a path.
  max_symlink_hops = 40

  orig_src = src
  try:
    # Replace symlinks with their final target.
    hops = 0
    while fs.islink(src):
      hops += 1
      if hops > max_symlink_hops:
        # Reported through the generic OSError handler below.
        raise OSError(
            errno.ELOOP, 'Too many levels of symbolic links', orig_src)
      res = fs.readlink(src)
      # A relative target is relative to the directory holding the link; an
      # absolute target replaces the path entirely (os.path.join semantics).
      src = os.path.join(os.path.dirname(src), res)

    # If src does not exist, an OSError with ENOENT is expected from the fs
    # calls below; a warning is logged in that case.
    if fs.isfile(src):
      file_path.link_file(dst, src, file_path.HARDLINK_WITH_FALLBACK)
      return

    if not fs.exists(dst):
      os.makedirs(dst)

    for child in fs.listdir(src):
      copy_recursively(os.path.join(src, child), os.path.join(dst, child))

  except OSError as e:
    if e.errno == errno.ENOENT:
      logging.warning('Path %s does not exist or %s is a broken symlink',
                      src, orig_src)
    else:
      logging.info("Couldn't collect output file %s: %s", src, e)
aludwin0a8e17d2016-10-27 15:57:39 -0700726
727
def _upload_with_py(storage, out_dir):
  """Archives out_dir to storage with the Python isolateserver client.

  Returns:
    tuple(isolated, cold, hot)
    - isolated: first value of the results mapping returned by
      isolateserver.archive_files_to_storage().
    - cold, hot: base64 encoded large.pack() of the sorted |size| of the cold
      and hot items respectively.

  Raises:
    isolateserver.Aborted: re-raised after a note was written to stderr.
  """

  def encode_sizes(items):
    sizes = sorted(item.size for item in items)
    return base64.b64encode(large.pack(sizes)).decode()

  try:
    results, cold_items, hot_items = isolateserver.archive_files_to_storage(
        storage, [out_dir], None, verify_push=True)
    return (
        list(results.values())[0],
        encode_sizes(cold_items),
        encode_sizes(hot_items),
    )
  except isolateserver.Aborted:
    # This happens when a signal SIGTERM was received while uploading data.
    # There are 2 possible causes:
    # - The task was too slow and was about to be killed anyway due to
    #   exceeding the hard timeout.
    # - The amount of data uploaded back is very large and took too much
    #   time to archive.
    sys.stderr.write('Received SIGTERM while uploading')
    # Re-raise, so it will be treated as an internal failure.
    raise
753
754
def _upload_with_go(storage, outdir, isolated_client):
  """Uploads results back using the Go `isolated` CLI.

  The CLI writes the resulting hash and the upload stats into two temporary
  files, which are read back and then removed.

  Arguments:
  - storage: object whose |server_ref| supplies the server url and namespace.
  - outdir: directory to archive.
  - isolated_client: path to the `isolated` executable.

  Returns:
    tuple(isolated, items_cold, items_hot)
    - isolated: content of the file written via -dump-hash.
    - items_cold, items_hot: values taken from the -dump-stats-json file.

  Raises:
    Whatever _run_go_cmd_and_wait() raised, once a failure happens more than
    two minutes after the first attempt started.
  """
  server_ref = storage.server_ref
  hash_fd, isolated_path = tempfile.mkstemp(
      prefix=u'isolated-hash-', suffix=u'.txt')
  stats_fd, stats_json_path = tempfile.mkstemp(
      prefix=u'dump-stats-', suffix=u'.json')
  # Only the paths are needed, the CLI writes the files itself.
  for fd in (hash_fd, stats_fd):
    os.close(fd)
  try:
    cmd = [isolated_client, 'archive']
    cmd += ['-isolate-server', server_ref.url]
    cmd += ['-namespace', server_ref.namespace]
    # Format: <working directory>:<relative path to dir>
    cmd += ['-dirs', outdir + ':']
    # output
    cmd += ['-dump-hash', isolated_path]
    cmd += ['-dump-stats-json', stats_json_path]
    cmd += ['-quiet']

    # Will do exponential backoff, e.g. 10, 20, 40...
    # This mitigates https://crbug.com/1094369, where there is a data race on
    # the uploaded files.
    delay = 10
    deadline = time.time() + 60 * 2
    while True:
      try:
        _run_go_cmd_and_wait(cmd)
      except Exception:
        if time.time() > deadline:
          # Do not keep waiting for long on a task that leaked processes.
          raise

        on_error.report('error before %d second backoff' % delay)
        logging.exception(
            '_run_go_cmd_and_wait() failed, will retry after %d seconds',
            delay)
        time.sleep(delay)
        delay *= 2
      else:
        break

    with open(isolated_path) as hash_file:
      isolated = hash_file.read()
    with open(stats_json_path) as stats_file:
      upload_stats = json.load(stats_file)

    return isolated, upload_stats['items_cold'], upload_stats['items_hot']
  finally:
    fs.remove(isolated_path)
    fs.remove(stats_json_path)
815
816
def upload_out_dir(storage, out_dir, go_isolated_client):
  """Uploads the content of |out_dir| back, if it holds anything.

  The Go client is used when _USE_GO_ISOLATED_TO_UPLOAD is set and
  |go_isolated_client| is not None; the Python client is used otherwise.

  Returns:
    tuple(outputs_ref, stats)
    - outputs_ref: a dict referring to the results archived back to the
      isolated server, or None when out_dir is missing or empty.
    - stats: uploading stats: 'duration', 'items_cold' and 'items_hot'. The
      two item entries are empty strings when nothing was uploaded.
  """
  outputs_ref = None
  cold = hot = ''
  began = time.time()

  # A .isolated file is only generated out of this directory when files were
  # written into it.
  has_outputs = fs.isdir(out_dir) and fs.listdir(out_dir)
  if has_outputs:
    with tools.Profiler('ArchiveOutput'):
      use_go = _USE_GO_ISOLATED_TO_UPLOAD and go_isolated_client is not None
      if use_go:
        isolated, cold, hot = _upload_with_go(
            storage, out_dir, go_isolated_client)
      else:
        isolated, cold, hot = _upload_with_py(storage, out_dir)
      outputs_ref = {
          'isolated': isolated,
          'isolatedserver': storage.server_ref.url,
          'namespace': storage.server_ref.namespace,
      }

  return outputs_ref, {
      'duration': time.time() - began,
      'items_cold': cold,
      'items_hot': hot,
  }
maruela9cfd6f2015-09-15 11:03:15 -0700853
854
def upload_outdir_with_cas(cas_client, cas_instance, outdir):
  """Archives |outdir| with the `cas` CLI.

  The CLI writes the digest and the upload stats into two temporary files,
  which are read back and then removed.

  Arguments:
  - cas_client: path to the `cas` executable.
  - cas_instance: value passed as -cas-instance.
  - outdir: directory to archive.

  Returns:
    tuple(root_digest, stats)
    - root_digest: content of the file written via -dump-digest.
    - stats: dict loaded from the -dump-stats-json file, with 'duration'
      (seconds spent running the CLI and reading its output) added.
  """
  digest_fd, digest_path = tempfile.mkstemp(
      prefix=u'cas-digest', suffix=u'.txt')
  os.close(digest_fd)
  stats_fd, stats_json_path = tempfile.mkstemp(
      prefix=u'upload-stats', suffix=u'.json')
  os.close(stats_fd)

  try:
    cmd = [cas_client, 'archive']
    cmd += ['-cas-instance', cas_instance]
    # Format: <working directory>:<relative path to dir>
    cmd += ['-paths', outdir + ':']
    # output
    cmd += ['-dump-digest', digest_path]
    cmd += ['-dump-stats-json', stats_json_path]

    began = time.time()
    _run_go_cmd_and_wait(cmd)

    with open(digest_path) as digest_file:
      root_digest = digest_file.read()
    with open(stats_json_path) as stats_file:
      upload_stats = json.load(stats_file)
    upload_stats['duration'] = time.time() - began

    return root_digest, upload_stats
  finally:
    fs.remove(digest_path)
    fs.remove(stats_json_path)
901
902
def map_and_run(data, constant_run_path):
  """Runs a command with optional isolated input/output.

  Creates the run, output, temporary and client directories, installs the
  CIPD packages, fetches the inputs (isolated or CAS), runs the command,
  uploads the outputs and finally removes the directories it created unless
  data.leak_temp_dir is set.

  Arguments:
  - data: TaskData instance.
  - constant_run_path: if true and a root directory is known, the command is
    run in the fixed ISOLATED_RUN_DIR directory under that root, which is
    recreated from scratch; otherwise a fresh temporary run directory is
    created.

  Returns:
    dict with metadata about the result: 'duration', 'exit_code',
    'had_hard_timeout', 'internal_failure', 'stats', 'outputs_ref',
    'cas_output_root' and 'version', plus 'cipd_pins' when CIPD information
    is available. 'internal_failure' is None only when the whole sequence
    completed; exceptions are recorded there instead of being raised.
  """

  if data.isolate_cache:
    download_stats = {
        #'duration': 0.,
        'initial_number_items': len(data.isolate_cache),
        'initial_size': data.isolate_cache.total_size,
        #'items_cold': '<large.pack()>',
        #'items_hot': '<large.pack()>',
    }
  else:
    # TODO(tikuta): take stats from state.json in this case too.
    download_stats = {}

  # The commented out entries document keys that are filled in later on.
  result = {
      'duration': None,
      'exit_code': None,
      'had_hard_timeout': False,
      'internal_failure': 'run_isolated did not complete properly',
      'stats': {
          #'cipd': {
          #  'duration': 0.,
          #  'get_client_duration': 0.,
          #},
          'isolated': {
              'download': download_stats,
              #'upload': {
              #  'duration': 0.,
              #  'items_cold': '<large.pack()>',
              #  'items_hot': '<large.pack()>',
              #},
          },
      },
      #'cipd_pins': {
      #  'packages': [
      #    {'package_name': ..., 'version': ..., 'path': ...},
      #    ...
      #  ],
      #  'client_package': {'package_name': ..., 'version': ...},
      #},
      'outputs_ref': None,
      'cas_output_root': None,
      'version': 5,
  }

  if data.root_dir:
    file_path.ensure_tree(data.root_dir, 0o700)
  elif data.use_go_isolated:
    data = data._replace(root_dir=os.path.dirname(data.go_cache_dir))
  elif data.isolate_cache.cache_dir:
    data = data._replace(
        root_dir=os.path.dirname(data.isolate_cache.cache_dir))
  # See comment for these constants.
  # If root_dir is not specified, it is not constant.
  # TODO(maruel): This is not obvious. Change this to become an error once we
  # make the constant_run_path an exposed flag.
  if constant_run_path and data.root_dir:
    run_dir = os.path.join(data.root_dir, ISOLATED_RUN_DIR)
    if os.path.isdir(run_dir):
      file_path.rmtree(run_dir)
    os.mkdir(run_dir, 0o700)
  else:
    run_dir = make_temp_dir(ISOLATED_RUN_DIR, data.root_dir)

  # True if CAS is used for download/upload files.
  use_cas = bool(data.cas_digest)

  # storage should be normally set but don't crash if it is not. This can happen
  # as Swarming task can run without an isolate server.
  out_dir = None
  if data.storage or use_cas:
    out_dir = make_temp_dir(ISOLATED_OUT_DIR, data.root_dir)
  tmp_dir = make_temp_dir(ISOLATED_TMP_DIR, data.root_dir)
  isolated_client_dir = make_temp_dir(ISOLATED_CLIENT_DIR, data.root_dir)
  cwd = run_dir
  if data.relative_cwd:
    cwd = os.path.normpath(os.path.join(cwd, data.relative_cwd))
  command = data.command
  go_isolated_client = None
  if data.use_go_isolated:
    go_isolated_client = os.path.join(isolated_client_dir,
                                      'isolated' + cipd.EXECUTABLE_SUFFIX)

  cas_client = None
  cas_client_dir = make_temp_dir(_CAS_CLIENT_DIR, data.root_dir)
  if use_cas:
    cas_client = os.path.join(cas_client_dir, 'cas' + cipd.EXECUTABLE_SUFFIX)

  try:
    with data.install_packages_fn(run_dir, isolated_client_dir,
                                  cas_client_dir) as cipd_info:
      if cipd_info:
        result['stats']['cipd'] = cipd_info.stats
        result['cipd_pins'] = cipd_info.pins

      isolated_stats = result['stats'].setdefault('isolated', {})
      if data.isolated_hash:
        if data.use_go_isolated:
          bundle, stats = _fetch_and_map_with_go_isolated(
              isolated_hash=data.isolated_hash,
              storage=data.storage,
              outdir=run_dir,
              go_cache_dir=data.go_cache_dir,
              policies=data.go_cache_policies,
              isolated_client=go_isolated_client)
        else:
          bundle, stats = fetch_and_map(
              isolated_hash=data.isolated_hash,
              storage=data.storage,
              cache=data.isolate_cache,
              outdir=run_dir)
        isolated_stats['download'].update(stats)

        # Inject the command
        if not command and bundle.command:
          command = bundle.command + data.extra_args
          # Only set the relative directory if the isolated file specified a
          # command, and no raw command was specified.
          if bundle.relative_cwd:
            cwd = os.path.normpath(os.path.join(cwd, bundle.relative_cwd))

      elif data.cas_digest:
        stats = _fetch_and_map_with_cas(
            cas_client=cas_client,
            digest=data.cas_digest,
            instance=data.cas_instance,
            output_dir=run_dir,
            cache_dir=data.go_cache_dir,
            policies=data.go_cache_policies)
        isolated_stats['download'].update(stats)

      if not command:
        # Handle this as a task failure, not an internal failure.
        sys.stderr.write(
            '<No command was specified!>\n'
            '<Please secify a command when triggering your Swarming task>\n')
        result['exit_code'] = 1
        return result

      # A bare startswith(run_dir) would also accept a sibling directory whose
      # name merely starts with the run directory name (e.g. '<run_dir>2'), so
      # compare against the run directory followed by a path separator.
      # os.path.join(run_dir, '') appends the separator only when missing.
      if cwd != run_dir and not cwd.startswith(os.path.join(run_dir, '')):
        # Handle this as a task failure, not an internal failure. This is a
        # 'last chance' way to gate against directory escape.
        sys.stderr.write('<Relative CWD is outside of run directory!>\n')
        result['exit_code'] = 1
        return result

      if not os.path.isdir(cwd):
        # Accepts relative_cwd that does not exist.
        os.makedirs(cwd, 0o700)

      # If we have an explicit list of files to return, make sure their
      # directories exist now.
      if data.storage and data.outputs:
        isolateserver.create_directories(run_dir, data.outputs)

      with data.install_named_caches(run_dir):
        sys.stdout.flush()
        start = time.time()
        try:
          # Need to switch the default account before 'get_command_env' call,
          # so it can grab correct value of LUCI_CONTEXT env var.
          with set_luci_context_account(data.switch_to_account, tmp_dir):
            env = get_command_env(
                tmp_dir, cipd_info, run_dir, data.env, data.env_prefix, out_dir,
                data.bot_file)
            command = tools.find_executable(command, env)
            command = process_command(command, out_dir, data.bot_file)
            file_path.ensure_command_has_abs_path(command, cwd)

            result['exit_code'], result['had_hard_timeout'] = run_command(
                command, cwd, env, data.hard_timeout, data.grace_period,
                data.lower_priority, data.containment)
        finally:
          # Recorded even when running the command raised.
          result['duration'] = max(time.time() - start, 0)

      if out_dir:
        # Try to link files to the output directory, if specified.
        link_outputs_to_outdir(run_dir, out_dir, data.outputs)
        isolated_stats = result['stats'].setdefault('isolated', {})
        if use_cas:
          result['cas_output_root'], isolated_stats['upload'] = (
              upload_outdir_with_cas(cas_client, data.cas_instance, out_dir))
        else:
          # This could use |go_isolated_client|, so make sure it runs when the
          # CIPD package still exists.
          result['outputs_ref'], isolated_stats['upload'] = (
              upload_out_dir(data.storage, out_dir, go_isolated_client))
    # We successfully ran the command, set internal_failure back to
    # None (even if the command failed, it's not an internal error).
    result['internal_failure'] = None
  except Exception as e:
    # An internal error occurred. Report accordingly so the swarming task will
    # be retried automatically.
    logging.exception('internal failure: %s', e)
    result['internal_failure'] = str(e)
    on_error.report(None)

  # Clean up
  finally:
    try:
      success = True
      if data.leak_temp_dir:
        logging.warning(
            'Deliberately leaking %s for later examination', run_dir)
      else:
        # On Windows the rmtree(run_dir) call below has a synchronization
        # effect: it finishes only when all task child processes terminate
        # (since a running process locks *.exe file). out_dir is removed only
        # after that call completes (since child processes may write to
        # out_dir too and we need to wait for them to finish).
        # cas_client_dir is created unconditionally above, so it has to be
        # removed here as well or it would pile up under the root directory.
        dirs_to_remove = [run_dir, tmp_dir, isolated_client_dir, cas_client_dir]
        if out_dir:
          dirs_to_remove.append(out_dir)
        for directory in dirs_to_remove:
          if not fs.isdir(directory):
            continue
          # Track the outcome per directory: one failed removal must not
          # prevent the removal of the remaining directories.
          try:
            removed = file_path.rmtree(directory)
          except OSError as e:
            logging.error('rmtree(%r) failed: %s', directory, e)
            removed = False
          if not removed:
            success = False
            sys.stderr.write(
                OUTLIVING_ZOMBIE_MSG % (directory, data.grace_period))
            # NOTE(review): tasklist.exe only exists on Windows; elsewhere
            # this call presumably raises and ends up in the except clause
            # below - confirm that this is intended.
            subprocess42.check_call(['tasklist.exe', '/V'], stdout=sys.stderr)
            if result['exit_code'] == 0:
              result['exit_code'] = 1

      if not success and result['exit_code'] == 0:
        result['exit_code'] = 1
    except Exception as e:
      # Swallow any exception in the main finally clause.
      if out_dir:
        logging.exception('Leaking out_dir %s: %s', out_dir, e)
      result['internal_failure'] = str(e)
      on_error.report(None)
  return result
Marc-Antoine Ruel2283ad12014-02-09 11:14:57 -05001149
1150
def run_tha_test(data, result_json):
  """Runs an executable through map_and_run() and records its metadata.

  Arguments:
  - data: TaskData instance, forwarded to map_and_run().
  - result_json: File path to dump result metadata into. If set, the process
    exit code is always 0 unless an internal error occurred. If not set and
    the result has an 'outputs_ref', a legacy marker line describing it is
    printed to stdout.

  Returns:
    Process exit code that should be used.
  """
  if result_json:
    # Write a json output file right away in case we get killed.
    tools.write_json(
        result_json,
        {
            'exit_code': None,
            'had_hard_timeout': False,
            'internal_failure': 'Was terminated before completion',
            'outputs_ref': None,
            'cas_output_root': None,
            'version': 5,
        },
        dense=True)

  # run_isolated exit code. Depends on if result_json is used or not.
  result = map_and_run(data, True)
  logging.info('Result:\n%s', tools.format_json(result, dense=True))
  failed_internally = int(bool(result['internal_failure']))

  if result_json:
    # We've found tests to delete 'work' when quitting, causing an exception
    # here. Try to recreate the directory if necessary.
    file_path.ensure_tree(os.path.dirname(result_json))
    tools.write_json(result_json, result, dense=True)
    # Only return 1 if there was an internal error.
    return failed_internally

  # Marshall into old-style inline output.
  outputs_ref = result['outputs_ref']
  if outputs_ref:
    # pylint: disable=unsubscriptable-object
    legacy = {
        'hash': outputs_ref['isolated'],
        'namespace': outputs_ref['namespace'],
        'storage': outputs_ref['isolatedserver'],
    }
    sys.stdout.flush()
    print('[run_isolated_out_hack]%s[/run_isolated_out_hack]' %
          tools.format_json(legacy, dense=True))
    sys.stdout.flush()
  return result['exit_code'] or failed_internally
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001207
1208
# Yielded by 'install_client_and_packages'.
CipdInfo = collections.namedtuple(
    'CipdInfo',
    (
        # cipd.CipdClient object
        'client',
        # absolute path to bot-global cipd tag and instance cache
        'cache_dir',
        # dict with stats to return to the server
        'stats',
        # dict with installed cipd pins to return to the server
        'pins',
    ),
)
1216
1217
@contextlib.contextmanager
def noop_install_packages(_run_dir, _isolated_dir, _cas_dir):
  """Placeholder for 'install_client_and_packages' if cipd is disabled.

  Ignores all three directories and yields None instead of a CipdInfo.
  """
  yield
1222
1223
Takuto Ikuta2efc7792019-11-27 14:33:34 +00001224def _install_packages(run_dir, cipd_cache_dir, client, packages):
iannuccib58d10d2017-03-18 02:00:25 -07001225 """Calls 'cipd ensure' for packages.
1226
1227 Args:
1228 run_dir (str): root of installation.
1229 cipd_cache_dir (str): the directory to use for the cipd package cache.
1230 client (CipdClient): the cipd client to use
1231 packages: packages to install, list [(path, package_name, version), ...].
iannuccib58d10d2017-03-18 02:00:25 -07001232
1233 Returns: list of pinned packages. Looks like [
1234 {
1235 'path': 'subdirectory',
1236 'package_name': 'resolved/package/name',
1237 'version': 'deadbeef...',
1238 },
1239 ...
1240 ]
1241 """
1242 package_pins = [None]*len(packages)
1243 def insert_pin(path, name, version, idx):
1244 package_pins[idx] = {
1245 'package_name': name,
1246 # swarming deals with 'root' as '.'
1247 'path': path or '.',
1248 'version': version,
1249 }
1250
1251 by_path = collections.defaultdict(list)
1252 for i, (path, name, version) in enumerate(packages):
1253 # cipd deals with 'root' as ''
1254 if path == '.':
1255 path = ''
1256 by_path[path].append((name, version, i))
1257
1258 pins = client.ensure(
Takuto Ikuta2efc7792019-11-27 14:33:34 +00001259 run_dir,
1260 {
1261 subdir: [(name, vers) for name, vers, _ in pkgs
1262 ] for subdir, pkgs in by_path.items()
1263 },
1264 cache_dir=cipd_cache_dir,
iannuccib58d10d2017-03-18 02:00:25 -07001265 )
1266
Marc-Antoine Ruel04903a32019-10-09 21:09:25 +00001267 for subdir, pin_list in sorted(pins.items()):
iannuccib58d10d2017-03-18 02:00:25 -07001268 this_subdir = by_path[subdir]
1269 for i, (name, version) in enumerate(pin_list):
1270 insert_pin(subdir, name, version, this_subdir[i][2])
1271
Robert Iannucci461b30d2017-12-13 11:34:03 -08001272 assert None not in package_pins, (packages, pins, package_pins)
iannuccib58d10d2017-03-18 02:00:25 -07001273
1274 return package_pins
1275
1276
vadimsh232f5a82017-01-20 19:23:44 -08001277@contextlib.contextmanager
Takuto Ikuta2efc7792019-11-27 14:33:34 +00001278def install_client_and_packages(run_dir, packages, service_url,
Takuto Ikutab7ce0e32019-11-27 23:26:18 +00001279 client_package_name, client_version, cache_dir,
Junji Watanabe4b890ef2020-09-16 01:43:27 +00001280 isolated_dir, cas_dir):
vadimsh902948e2017-01-20 15:57:32 -08001281 """Bootstraps CIPD client and installs CIPD packages.
iannucci96fcccc2016-08-30 15:52:22 -07001282
vadimsh232f5a82017-01-20 19:23:44 -08001283 Yields CipdClient, stats, client info and pins (as single CipdInfo object).
1284
1285 Pins and the CIPD client info are in the form of:
iannucci96fcccc2016-08-30 15:52:22 -07001286 [
1287 {
1288 "path": path, "package_name": package_name, "version": version,
1289 },
1290 ...
1291 ]
vadimsh902948e2017-01-20 15:57:32 -08001292 (the CIPD client info is a single dictionary instead of a list)
iannucci96fcccc2016-08-30 15:52:22 -07001293
1294 such that they correspond 1:1 to all input package arguments from the command
1295 line. These dictionaries make their all the way back to swarming, where they
1296 become the arguments of CipdPackage.
nodirbe642ff2016-06-09 15:51:51 -07001297
vadimsh902948e2017-01-20 15:57:32 -08001298 If 'packages' list is empty, will bootstrap CIPD client, but won't install
1299 any packages.
1300
1301 The bootstrapped client (regardless whether 'packages' list is empty or not),
vadimsh232f5a82017-01-20 19:23:44 -08001302 will be made available to the task via $PATH.
vadimsh902948e2017-01-20 15:57:32 -08001303
nodirbe642ff2016-06-09 15:51:51 -07001304 Args:
nodir90bc8dc2016-06-15 13:35:21 -07001305 run_dir (str): root of installation.
vadimsh902948e2017-01-20 15:57:32 -08001306 packages: packages to install, list [(path, package_name, version), ...].
nodirbe642ff2016-06-09 15:51:51 -07001307 service_url (str): CIPD server url, e.g.
1308 "https://chrome-infra-packages.appspot.com."
nodir90bc8dc2016-06-15 13:35:21 -07001309 client_package_name (str): CIPD package name of CIPD client.
1310 client_version (str): Version of CIPD client.
nodirbe642ff2016-06-09 15:51:51 -07001311 cache_dir (str): where to keep cache of cipd clients, packages and tags.
Takuto Ikutab7ce0e32019-11-27 23:26:18 +00001312 isolated_dir (str): where to download isolated client.
Junji Watanabe4b890ef2020-09-16 01:43:27 +00001313 cas_dir (str): where to download cas client.
nodirbe642ff2016-06-09 15:51:51 -07001314 """
1315 assert cache_dir
nodir90bc8dc2016-06-15 13:35:21 -07001316
nodirbe642ff2016-06-09 15:51:51 -07001317 start = time.time()
nodirbe642ff2016-06-09 15:51:51 -07001318
vadimsh902948e2017-01-20 15:57:32 -08001319 cache_dir = os.path.abspath(cache_dir)
vadimsh232f5a82017-01-20 19:23:44 -08001320 cipd_cache_dir = os.path.join(cache_dir, 'cache') # tag and instance caches
nodir90bc8dc2016-06-15 13:35:21 -07001321 run_dir = os.path.abspath(run_dir)
vadimsh902948e2017-01-20 15:57:32 -08001322 packages = packages or []
nodir90bc8dc2016-06-15 13:35:21 -07001323
nodirbe642ff2016-06-09 15:51:51 -07001324 get_client_start = time.time()
Junji Watanabe4b890ef2020-09-16 01:43:27 +00001325 client_manager = cipd.get_client(cache_dir, service_url, client_package_name,
1326 client_version)
iannucci96fcccc2016-08-30 15:52:22 -07001327
nodirbe642ff2016-06-09 15:51:51 -07001328 with client_manager as client:
1329 get_client_duration = time.time() - get_client_start
nodir90bc8dc2016-06-15 13:35:21 -07001330
iannuccib58d10d2017-03-18 02:00:25 -07001331 package_pins = []
1332 if packages:
Takuto Ikuta2efc7792019-11-27 14:33:34 +00001333 package_pins = _install_packages(run_dir, cipd_cache_dir, client,
1334 packages)
iannuccib58d10d2017-03-18 02:00:25 -07001335
Takuto Ikutab7ce0e32019-11-27 23:26:18 +00001336 # Install isolated client to |isolated_dir|.
Takuto Ikuta02edca22019-11-29 10:04:51 +00001337 _install_packages(isolated_dir, cipd_cache_dir, client,
1338 [('', ISOLATED_PACKAGE, ISOLATED_REVISION)])
Takuto Ikutab7ce0e32019-11-27 23:26:18 +00001339
Junji Watanabe4b890ef2020-09-16 01:43:27 +00001340 # Install cas client to |cas_dir|.
1341 _install_packages(cas_dir, cipd_cache_dir, client,
1342 [('', _CAS_PACKAGE, _CAS_REVISION)])
1343
iannuccib58d10d2017-03-18 02:00:25 -07001344 file_path.make_tree_files_read_only(run_dir)
nodir90bc8dc2016-06-15 13:35:21 -07001345
vadimsh232f5a82017-01-20 19:23:44 -08001346 total_duration = time.time() - start
Junji Watanabe38b28b02020-04-23 10:23:30 +00001347 logging.info('Installing CIPD client and packages took %d seconds',
1348 total_duration)
nodir90bc8dc2016-06-15 13:35:21 -07001349
vadimsh232f5a82017-01-20 19:23:44 -08001350 yield CipdInfo(
Junji Watanabe38b28b02020-04-23 10:23:30 +00001351 client=client,
1352 cache_dir=cipd_cache_dir,
1353 stats={
1354 'duration': total_duration,
1355 'get_client_duration': get_client_duration,
iannuccib58d10d2017-03-18 02:00:25 -07001356 },
Junji Watanabe38b28b02020-04-23 10:23:30 +00001357 pins={
1358 'client_package': {
1359 'package_name': client.package_name,
1360 'version': client.instance_id,
1361 },
1362 'packages': package_pins,
1363 })
nodirbe642ff2016-06-09 15:51:51 -07001364
1365
def create_option_parser():
  """Builds the option parser describing every run_isolated flag.

  The flags are organized as follows:
    - general task flags, registered directly on the parser;
    - 'Data source - Isolate server' and 'Data source - Content Addressed
      Storage' groups;
    - cache and CIPD flags, registered by isolateserver.add_cache_options()
      and cipd.add_cipd_options();
    - 'Named caches', 'Process containment' and 'Debugging' groups;
    - authentication flags, registered by auth.add_auth_options().

  Returns:
    The configured logging_utils.OptionParserWithLogging instance, with the
    'cache' default set to 'cache'.
  """
  parser = logging_utils.OptionParserWithLogging(
      usage='%prog <options> [command to run or extra args]',
      version=__version__,
      log_file=RUN_ISOLATED_LOG_FILE)
  parser.add_option(
      '--clean',
      action='store_true',
      help='Cleans the cache, trimming it necessary and remove corrupted items '
      'and returns without executing anything; use with -v to know what '
      'was done')
  parser.add_option(
      '--json',
      help='dump output metadata to json file. When used, run_isolated returns '
      'non-zero only on internal failure')
  parser.add_option(
      '--hard-timeout', type='float', help='Enforce hard timeout in execution')
  parser.add_option(
      '--grace-period',
      type='float',
      help='Grace period between SIGTERM and SIGKILL')
  parser.add_option(
      '--raw-cmd',
      action='store_true',
      help='Ignore the isolated command, use the one supplied at the command '
      'line')
  parser.add_option(
      '--relative-cwd',
      help='Ignore the isolated \'relative_cwd\' and use this one instead; '
      'requires --raw-cmd')
  parser.add_option(
      '--env',
      default=[],
      action='append',
      help='Environment variables to set for the child process')
  parser.add_option(
      '--env-prefix',
      default=[],
      action='append',
      help='Specify a VAR=./path/fragment to put in the environment variable '
      'before executing the command. The path fragment must be relative '
      'to the isolated run directory, and must not contain a `..` token. '
      'The path will be made absolute and prepended to the indicated '
      '$VAR using the OS\'s path separator. Multiple items for the same '
      '$VAR will be prepended in order.')
  parser.add_option(
      '--bot-file',
      help='Path to a file describing the state of the host. The content is '
      'defined by on_before_task() in bot_config.')
  parser.add_option(
      '--switch-to-account',
      help='If given, switches LUCI_CONTEXT to given logical service account '
      '(e.g. "task" or "system") before launching the isolated process.')
  parser.add_option(
      '--output',
      action='append',
      help='Specifies an output to return. If no outputs are specified, all '
      'files located in $(ISOLATED_OUTDIR) will be returned; '
      'otherwise, outputs in both $(ISOLATED_OUTDIR) and those '
      'specified by --output option (there can be multiple) will be '
      'returned. Note that if a file in OUT_DIR has the same path '
      'as an --output option, the --output version will be returned.')
  parser.add_option(
      '-a',
      '--argsfile',
      # This is actually handled in parse_args; it's included here purely so it
      # can make it into the help text.
      help='Specify a file containing a JSON array of arguments to this '
      'script. If --argsfile is provided, no other argument may be '
      'provided on the command line.')
  parser.add_option(
      '--report-on-exception',
      action='store_true',
      help='Whether report exception during execution to isolate server. '
      'This flag should only be used in swarming bot.')

  group = optparse.OptionGroup(parser, 'Data source - Isolate server')
  # Deprecated. Isolate server is being migrated to RBE-CAS.
  # Remove --isolated and isolate server options after migration.
  group.add_option(
      '-s', '--isolated',
      help='Hash of the .isolated to grab from the isolate server.')
  isolateserver.add_isolate_server_options(group)
  parser.add_option_group(group)

  group = optparse.OptionGroup(parser,
                               'Data source - Content Addressed Storage')
  group.add_option(
      '--cas-instance', help='Full CAS instance name for input/output files.')
  group.add_option(
      '--cas-digest',
      help='Digest of the input root on RBE-CAS. The format is '
      '`{hash}/{size_bytes}`.')
  parser.add_option_group(group)

  isolateserver.add_cache_options(parser)

  cipd.add_cipd_options(parser)

  group = optparse.OptionGroup(parser, 'Named caches')
  group.add_option(
      '--named-cache',
      dest='named_caches',
      action='append',
      nargs=3,
      default=[],
      help='A named cache to request. Accepts 3 arguments: name, path, hint. '
      'name identifies the cache, must match regex [a-z0-9_]{1,4096}. '
      'path is a path relative to the run dir where the cache directory '
      'must be put to. '
      'This option can be specified more than once.')
  group.add_option(
      '--named-cache-root',
      default='named_caches',
      help='Cache root directory. Default=%default')
  parser.add_option_group(group)

  # These options are registered on the group (not directly on the parser) so
  # that they are listed under the 'Process containment' heading in --help.
  # Parsing is unaffected: an OptionGroup shares its option tables and defaults
  # with the parser it was created for.
  group = optparse.OptionGroup(parser, 'Process containment')
  group.add_option(
      '--lower-priority', action='store_true',
      help='Lowers the child process priority')
  group.add_option(
      '--containment-type',
      choices=('NONE', 'AUTO', 'JOB_OBJECT'),
      default='NONE',
      help='Type of container to use')
  group.add_option(
      '--limit-processes',
      type='int',
      default=0,
      help='Maximum number of active processes in the containment')
  group.add_option(
      '--limit-total-committed-memory',
      type='int',
      default=0,
      help='Maximum sum of committed memory in the containment')
  parser.add_option_group(group)

  group = optparse.OptionGroup(parser, 'Debugging')
  group.add_option(
      '--leak-temp-dir',
      action='store_true',
      help='Deliberately leak isolate\'s temp dir for later examination. '
      'Default: %default')
  group.add_option('--root-dir', help='Use a directory instead of a random one')
  parser.add_option_group(group)

  auth.add_auth_options(parser)

  parser.set_defaults(cache='cache')
  return parser
1517
1518
def process_named_cache_options(parser, options, time_fn=None):
  """Checks the named cache flags and builds the matching NamedCache.

  Args:
    parser: option parser; its error() method is called on invalid flags.
    options: parsed options; named_caches, named_cache_root and min_free_space
        are read.
    time_fn: forwarded as-is to local_caching.NamedCache.

  Returns:
    A local_caching.NamedCache rooted at --named-cache-root, or None when
    --named-cache-root is empty.
  """
  requested = options.named_caches
  if requested and not options.named_cache_root:
    parser.error('--named-cache is specified, but --named-cache-root is empty')

  # Each entry is a (name, path, hint) triple coming from --named-cache.
  for cache_name, rel_path, size_hint in requested:
    if CACHE_NAME_RE.match(cache_name) is None:
      parser.error(
          'cache name %r does not match %r' %
          (cache_name, CACHE_NAME_RE.pattern))
    if not rel_path:
      parser.error('cache path cannot be empty')
    try:
      int(size_hint)
    except ValueError:
      parser.error('cache hint must be a number')

  if not options.named_cache_root:
    return None

  # Make these configurable later if there is use case but for now it's fairly
  # safe values.
  # In practice, a fair chunk of bots are already recycled on a daily schedule
  # so this code doesn't have any effect to them, unless they are preloaded
  # with a really old cache.
  one_tib = 1024 * 1024 * 1024 * 1024
  policies = local_caching.CachePolicies(
      max_cache_size=one_tib,
      min_free_space=options.min_free_space,
      max_items=50,
      max_age_secs=MAX_AGE_SECS)
  abs_root = six.text_type(os.path.abspath(options.named_cache_root))
  named_cache = local_caching.NamedCache(abs_root, policies, time_fn=time_fn)
  # Touch any named caches we're going to use to minimize thrashing
  # between tasks that request some (but not all) of the same named caches.
  wanted_names = [entry[0] for entry in requested]
  named_cache.touch(*wanted_names)
  return named_cache
1552
1553
def parse_args(args):
  """Parses the command line, expanding --argsfile when it is given.

  Args:
    args: list of command line arguments, without the program name.

  Returns:
    Tuple (parser, options, args): the parser built by create_option_parser(),
    the parsed option values and the remaining positional arguments.
    options.cipd_enabled is converted with distutils.util.strtobool() when it
    is neither a bool nor an int.
  """
  # Create a fake mini-parser just to get out the "-a" command. Note that
  # it's not documented here; instead, it's documented in create_option_parser
  # even though that parser will never actually get to parse it. This is
  # because --argsfile is exclusive with all other options and arguments.
  file_argparse = argparse.ArgumentParser(add_help=False)
  file_argparse.add_argument('-a', '--argsfile')
  (file_args, nonfile_args) = file_argparse.parse_known_args(args)
  if file_args.argsfile:
    if nonfile_args:
      # The trailing space matters: the two literals are concatenated.
      file_argparse.error('Can\'t specify --argsfile with '
                          'any other arguments (%s)' % nonfile_args)
    try:
      with open(file_args.argsfile, 'r') as f:
        args = json.load(f)
    except (IOError, OSError, ValueError) as e:
      # Don't abort here: "args" is left untouched and is handed to the
      # regular parser below, which is in charge of reporting usage errors.
      print('Couldn\'t read arguments: %s' % e, file=sys.stderr)

  # Even if we failed to read the args, just call the normal parser now since it
  # will print the correct help message.
  parser = create_option_parser()
  options, args = parser.parse_args(args)
  if not isinstance(options.cipd_enabled, (bool, int)):
    options.cipd_enabled = distutils.util.strtobool(options.cipd_enabled)
  return (parser, options, args)
1582
1583
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001584def _calc_named_cache_hint(named_cache, named_caches):
1585 """Returns the expected size of the missing named caches."""
1586 present = named_cache.available
1587 size = 0
1588 for name, _, hint in named_caches:
1589 if name not in present:
Takuto Ikuta630f99d2020-07-02 12:59:35 +00001590 hint = int(hint)
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001591 if hint > 0:
1592 size += hint
1593 return size
1594
1595
def main(args):
  """Entry point: parses the flags, then cleans the caches or runs the task.

  With --clean, the local caches are trimmed and cleaned up and nothing is
  executed. Otherwise the flags are validated, a TaskData is assembled and
  handed to run_tha_test().

  Args:
    args: list of command line arguments, without the program name.

  Returns:
    0 after a --clean run; 1 when cipd.Error, local_caching.NamedCacheError or
    local_caching.NoMoreSpace is raised; otherwise the value returned by
    run_tha_test(). Invalid flags are reported through parser.error().
  """
  # Warning: when --argsfile is used, the strings are unicode instances, when
  # parsed normally, the strings are str instances.
  (parser, options, args) = parse_args(args)

  if options.report_on_exception and options.isolate_server:
    on_error.report_on_exception_exit(options.isolate_server)

  if not file_path.enable_symlink():
    logging.warning('Symlink support is not enabled')

  named_cache = process_named_cache_options(parser, options)
  # hint is 0 if there's no named cache.
  hint = _calc_named_cache_hint(named_cache, options.named_caches)
  if hint:
    # Increase the --min-free-space value by the hint, and recreate the
    # NamedCache instance so it gets the updated CachePolicy.
    options.min_free_space += hint
    named_cache = process_named_cache_options(parser, options)

  # TODO(crbug.com/932396): Remove this.
  use_go_isolated = options.cipd_enabled

  # TODO(maruel): CIPD caches should be defined at an higher level here too, so
  # they can be cleaned the same way.
  if use_go_isolated and not options.clean:
    isolate_cache = None
  else:
    isolate_cache = isolateserver.process_cache_options(options, trim=False)

  caches = []
  if isolate_cache:
    caches.append(isolate_cache)
  if named_cache:
    caches.append(named_cache)
  root = caches[0].cache_dir if caches else six.text_type(os.getcwd())
  if options.clean:
    if options.isolated:
      parser.error('Can\'t use --isolated with --clean.')
    if options.isolate_server:
      parser.error('Can\'t use --isolate-server with --clean.')
    if options.json:
      parser.error('Can\'t use --json with --clean.')
    if options.named_caches:
      parser.error('Can\'t use --named-cache with --clean.')
    if options.cas_instance or options.cas_digest:
      parser.error('Can\'t use --cas-instance, --cas-digest with --clean.')

    logging.info("initial free space: %d", file_path.get_free_space(root))
    # Trim first, then clean.
    local_caching.trim_caches(
        caches,
        root,
        min_free_space=options.min_free_space,
        max_age_secs=MAX_AGE_SECS)
    logging.info("free space after trim: %d", file_path.get_free_space(root))
    for c in caches:
      c.cleanup()
    logging.info("free space after cleanup: %d", file_path.get_free_space(root))
    return 0

  # Trim must still be done for the following case:
  # - named-cache was used
  # - some entries, with a large hint, where missing
  # - --min-free-space was increased accordingly, thus trimming is needed
  # Otherwise, this will have no effect, as bot_main calls run_isolated with
  # --clean after each task.
  if hint:
    logging.info('Additional trimming of %d bytes', hint)
    local_caching.trim_caches(
        caches,
        root,
        min_free_space=options.min_free_space,
        max_age_secs=MAX_AGE_SECS)

  if not options.isolated and not args:
    parser.error('--isolated or command to run is required.')

  auth.process_auth_options(parser, options)

  isolateserver.process_isolate_server_options(parser, options, False)
  if not options.isolate_server:
    if options.isolated:
      parser.error('--isolated requires --isolate-server')
    if ISOLATED_OUTDIR_PARAMETER in args:
      parser.error(
          '%s in args requires --isolate-server' % ISOLATED_OUTDIR_PARAMETER)

  if options.root_dir:
    options.root_dir = six.text_type(os.path.abspath(options.root_dir))
  if options.json:
    options.json = six.text_type(os.path.abspath(options.json))

  if any('=' not in i for i in options.env):
    parser.error(
        '--env required key=value form. value can be skipped to delete '
        'the variable')
  options.env = dict(i.split('=', 1) for i in options.env)

  # Group the --env-prefix values per variable, keeping the command line order.
  prefixes = {}
  cwd = os.path.realpath(os.getcwd())
  for item in options.env_prefix:
    if '=' not in item:
      parser.error(
          '--env-prefix %r is malformed, must be in the form `VAR=./path`'
          % item)
    key, opath = item.split('=', 1)
    if os.path.isabs(opath):
      parser.error('--env-prefix %r path is bad, must be relative.' % opath)
    opath = os.path.normpath(opath)
    if not os.path.realpath(os.path.join(cwd, opath)).startswith(cwd):
      parser.error(
          '--env-prefix %r path is bad, must be relative and not contain `..`.'
          % opath)
    prefixes.setdefault(key, []).append(opath)
  options.env_prefix = prefixes

  cipd.validate_cipd_options(parser, options)

  install_packages_fn = noop_install_packages
  # Only set when a temporary CIPD cache directory had to be created; it is
  # removed in the 'finally' clause at the end of this function.
  tmp_cipd_cache_dir = None
  if options.cipd_enabled:
    cache_dir = options.cipd_cache
    if not cache_dir:
      tmp_cipd_cache_dir = six.text_type(tempfile.mkdtemp())
      cache_dir = tmp_cipd_cache_dir
    install_packages_fn = (
        lambda run_dir, isolated_dir, cas_dir: install_client_and_packages(
            run_dir,
            cipd.parse_package_args(options.cipd_packages),
            options.cipd_server,
            options.cipd_client_package,
            options.cipd_client_version,
            cache_dir=cache_dir,
            isolated_dir=isolated_dir,
            cas_dir=cas_dir,
        ))

  @contextlib.contextmanager
  def install_named_caches(run_dir):
    # WARNING: this function depends on "options" variable defined in the outer
    # function.
    assert six.text_type(run_dir), repr(run_dir)
    assert os.path.isabs(run_dir), run_dir
    named_caches = [(os.path.join(run_dir, six.text_type(relpath)), name)
                    for name, relpath, _ in options.named_caches]
    for path, name in named_caches:
      named_cache.install(path, name)
    try:
      yield
    finally:
      # Uninstall each named cache, returning it to the cache pool. If an
      # uninstall fails for a given cache, it will remain in the task's
      # temporary space, get cleaned up by the Swarming bot, and be lost.
      #
      # If the Swarming bot cannot clean up the cache, it will handle it like
      # any other bot file that could not be removed.
      for path, name in reversed(named_caches):
        try:
          # uninstall() doesn't trim but does call save() implicitly. Trimming
          # *must* be done manually via periodic 'run_isolated.py --clean'.
          named_cache.uninstall(path, name)
        except local_caching.NamedCacheError:
          # The message reads "named cache <name> at <path>".
          logging.exception('Error while removing named cache %r at %r. '
                            'The cache will be lost.', name, path)

  extra_args = []
  command = []
  if options.raw_cmd:
    command = args
    if options.relative_cwd:
      a = os.path.normpath(os.path.abspath(options.relative_cwd))
      if not a.startswith(os.getcwd()):
        parser.error(
            '--relative-cwd must not try to escape the working directory')
  else:
    if options.relative_cwd:
      parser.error('--relative-cwd requires --raw-cmd')
    extra_args = args

  containment_type = subprocess42.Containment.NONE
  if options.containment_type == 'AUTO':
    containment_type = subprocess42.Containment.AUTO
  if options.containment_type == 'JOB_OBJECT':
    containment_type = subprocess42.Containment.JOB_OBJECT
  containment = subprocess42.Containment(
      containment_type=containment_type,
      limit_processes=options.limit_processes,
      limit_total_committed_memory=options.limit_total_committed_memory)

  data = TaskData(
      command=command,
      relative_cwd=options.relative_cwd,
      extra_args=extra_args,
      isolated_hash=options.isolated,
      storage=None,
      isolate_cache=isolate_cache,
      cas_instance=options.cas_instance,
      cas_digest=options.cas_digest,
      outputs=options.output,
      install_named_caches=install_named_caches,
      leak_temp_dir=options.leak_temp_dir,
      root_dir=_to_unicode(options.root_dir),
      hard_timeout=options.hard_timeout,
      grace_period=options.grace_period,
      bot_file=options.bot_file,
      switch_to_account=options.switch_to_account,
      install_packages_fn=install_packages_fn,
      use_go_isolated=use_go_isolated,
      go_cache_dir=options.cache,
      go_cache_policies=local_caching.CachePolicies(
          max_cache_size=options.max_cache_size,
          min_free_space=options.min_free_space,
          max_items=options.max_items,
          max_age_secs=None,
      ),
      env=options.env,
      env_prefix=options.env_prefix,
      lower_priority=bool(options.lower_priority),
      containment=containment)
  try:
    if options.isolate_server:
      server_ref = isolate_storage.ServerRef(
          options.isolate_server, options.namespace)
      storage = isolateserver.get_storage(server_ref)
      with storage:
        data = data._replace(storage=storage)
        # Hashing schemes used by |storage| and |isolate_cache| MUST match.
        assert storage.server_ref.hash_algo == server_ref.hash_algo
        return run_tha_test(data, options.json)
    return run_tha_test(data, options.json)
  except (cipd.Error, local_caching.NamedCacheError,
          local_caching.NoMoreSpace) as ex:
    # Exceptions have no 'message' attribute on Python 3 unless the class
    # defines one, so fall back to str(ex) in that case.
    print(getattr(ex, 'message', None) or str(ex), file=sys.stderr)
    return 1
  finally:
    if tmp_cipd_cache_dir is not None:
      try:
        file_path.rmtree(tmp_cipd_cache_dir)
      except OSError:
        logging.exception('Remove tmp_cipd_cache_dir=%s failed',
                          tmp_cipd_cache_dir)
        # Best effort clean up. Failed to do so doesn't affect the outcome.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001839
1840
if __name__ == '__main__':
  # Script entry point: prepare the process, then exit with main()'s result.
  subprocess42.inhibit_os_error_reporting()
  # Ensure that we are always running with the correct encoding.
  fix_encoding.fix_encoding()
  net.set_user_agent('run_isolated.py/%s' % __version__)
  exit_code = main(sys.argv[1:])
  sys.exit(exit_code)
Marc-Antoine Ruel90c98162013-12-18 15:11:57 -05001846 sys.exit(main(sys.argv[1:]))