blob: 005af1900ca5d0105b36d1dcf399154499e587f9 [file] [log] [blame]
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001#!/usr/bin/env python
maruelea586f32016-04-05 11:11:33 -07002# Copyright 2012 The LUCI Authors. All rights reserved.
maruelf1f5e2a2016-05-25 17:10:39 -07003# Use of this source code is governed under the Apache License, Version 2.0
4# that can be found in the LICENSE file.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00005
nodir55be77b2016-05-03 09:39:57 -07006"""Runs a command with optional isolated input/output.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00007
Marc-Antoine Rueleed2f3a2019-03-14 00:00:40 +00008run_isolated takes care of setting up a temporary environment, running a
9command, and tearing it down.
nodir55be77b2016-05-03 09:39:57 -070010
Marc-Antoine Rueleed2f3a2019-03-14 00:00:40 +000011It handles downloading and uploading isolated files, mapping CIPD packages and
12reusing stateful named caches.
13
14The isolated files, CIPD packages and named caches are kept as a global LRU
15cache.
Marc-Antoine Ruel2283ad12014-02-09 11:14:57 -050016
Roberto Carrillo71ade6d2018-10-08 22:30:24 +000017Any ${EXECUTABLE_SUFFIX} on the command line or the environment variables passed
18with the --env option will be replaced with ".exe" string on Windows and "" on
19other platforms.
nodirbe642ff2016-06-09 15:51:51 -070020
Roberto Carrillo71ade6d2018-10-08 22:30:24 +000021Any ${ISOLATED_OUTDIR} on the command line or the environment variables passed
22with the --env option will be replaced by the location of a temporary directory
23upon execution of the command specified in the .isolated file. All content
24written to this directory will be uploaded upon termination and the .isolated
25file describing this directory will be printed to stdout.
bpastene447c1992016-06-20 15:21:47 -070026
Marc-Antoine Rueleed2f3a2019-03-14 00:00:40 +000027Any ${SWARMING_BOT_FILE} on the command line or the environment variables passed
28with the --env option will be replaced by the value of the --bot-file parameter.
29This file is used by a swarming bot to communicate state of the host to tasks.
30It is written to by the swarming bot's on_before_task() hook in the swarming
31server's custom bot_config.py.
32
33See
34https://chromium.googlesource.com/infra/luci/luci-py.git/+/master/appengine/swarming/doc/Magic-Values.md
35for all the variables.
36
37See
38https://chromium.googlesource.com/infra/luci/luci-py.git/+/master/appengine/swarming/swarming_bot/config/bot_config.py
39for more information about bot_config.py.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000040"""
41
Marc-Antoine Ruelf899c482019-10-10 23:32:06 +000042from __future__ import print_function
43
44__version__ = '1.0.1'
maruel@chromium.orgdedbf492013-09-12 20:42:11 +000045
aludwin7556e0c2016-10-26 08:46:10 -070046import argparse
maruel064c0a32016-04-05 11:47:15 -070047import base64
iannucci96fcccc2016-08-30 15:52:22 -070048import collections
vadimsh232f5a82017-01-20 19:23:44 -080049import contextlib
Ye Kuangfff1e502020-07-13 13:21:57 +000050import distutils
Sadaf Matinkhoo10743a62018-03-29 16:28:58 -040051import errno
aludwin7556e0c2016-10-26 08:46:10 -070052import json
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000053import logging
54import optparse
55import os
Takuto Ikuta5c59a842020-01-24 03:05:24 +000056import platform
Marc-Antoine Ruel8b11dbd2018-05-18 14:31:22 -040057import re
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000058import sys
59import tempfile
maruel064c0a32016-04-05 11:47:15 -070060import time
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000061
Marc-Antoine Ruel016c7602019-04-02 18:31:13 +000062from utils import tools
63tools.force_local_third_party()
vadimsh@chromium.orga4326472013-08-24 02:05:41 +000064
Marc-Antoine Ruel016c7602019-04-02 18:31:13 +000065# third_party/
66from depot_tools import fix_encoding
Takuto Ikuta6e2ff962019-10-29 12:35:27 +000067import six
Marc-Antoine Ruel016c7602019-04-02 18:31:13 +000068
69# pylint: disable=ungrouped-imports
70import auth
71import cipd
72import isolate_storage
73import isolateserver
74import local_caching
75from libs import luci_context
Vadim Shtayura6b555c12014-07-23 16:22:18 -070076from utils import file_path
maruel12e30012015-10-09 11:55:35 -070077from utils import fs
maruel064c0a32016-04-05 11:47:15 -070078from utils import large
Marc-Antoine Ruelf74cffe2015-07-15 15:21:34 -040079from utils import logging_utils
Ye Kuang2dd17442020-04-22 08:45:52 +000080from utils import net
Marc-Antoine Ruelcfb60852014-07-02 15:22:00 -040081from utils import on_error
Marc-Antoine Ruelc44f5722015-01-08 16:10:01 -050082from utils import subprocess42
maruel@chromium.orgdedbf492013-09-12 20:42:11 +000083
vadimsh@chromium.orga4326472013-08-24 02:05:41 +000084
# Magic variables that can be found in the isolate task command line.
ISOLATED_OUTDIR_PARAMETER = '${ISOLATED_OUTDIR}'
EXECUTABLE_SUFFIX_PARAMETER = '${EXECUTABLE_SUFFIX}'
SWARMING_BOT_FILE_PARAMETER = '${SWARMING_BOT_FILE}'


# The name of the log file to use.
RUN_ISOLATED_LOG_FILE = 'run_isolated.log'


# The name of the log to use for the run_test_cases.py command.
RUN_TEST_CASES_LOG = 'run_test_cases.log'


# Use short names for temporary directories. This is driven by Windows, which
# imposes a relatively short maximum path length of 260 characters, often
# referred to as MAX_PATH. It is relatively easy to create files with longer
# path length. A use case is with recursive dependency trees like npm packages.
#
# It is recommended to start the script with a `root_dir` as short as
# possible.
# - ir stands for isolated_run
# - io stands for isolated_out
# - it stands for isolated_tmp
# - ic stands for isolated_client
ISOLATED_RUN_DIR = u'ir'
ISOLATED_OUT_DIR = u'io'
ISOLATED_TMP_DIR = u'it'
ISOLATED_CLIENT_DIR = u'ic'
_CAS_CLIENT_DIR = u'cc'

# TODO(tikuta): take these parameters from luci-config?
# Update tag by `./client/update_go_clients.sh`.
# Or take revision from
# https://ci.chromium.org/p/infra-internal/g/infra-packagers/console
ISOLATED_PACKAGE = 'infra/tools/luci/isolated/${platform}'
_CAS_PACKAGE = 'infra/tools/luci/cas/${platform}'
_LUCI_GO_REVISION = 'git_revision:eea9e0f87b642f8435d2ab4bc13929e2a3cfac19'

# Keep synced with task_request.py
CACHE_NAME_RE = re.compile(r'^[a-z0-9_]{1,4096}$')

# One GiB, expressed in bytes.
_FREE_SPACE_BUFFER_FOR_GO = 1024 * 1024 * 1024
Marc-Antoine Ruel8b11dbd2018-05-18 14:31:22 -0400128
marueld928c862017-06-08 08:20:04 -0700129OUTLIVING_ZOMBIE_MSG = """\
130*** Swarming tried multiple times to delete the %s directory and failed ***
131*** Hard failing the task ***
132
133Swarming detected that your testing script ran an executable, which may have
134started a child executable, and the main script returned early, leaving the
135children executables playing around unguided.
136
137You don't want to leave children processes outliving the task on the Swarming
138bot, do you? The Swarming bot doesn't.
139
140How to fix?
141- For any process that starts children processes, make sure all children
142 processes terminated properly before each parent process exits. This is
143 especially important in very deep process trees.
144 - This must be done properly both in normal successful task and in case of
145 task failure. Cleanup is very important.
146- The Swarming bot sends a SIGTERM in case of timeout.
147 - You have %s seconds to comply after the signal was sent to the process
148 before the process is forcibly killed.
149- To achieve not leaking children processes in case of signals on timeout, you
150 MUST handle signals in each executable / python script and propagate them to
151 children processes.
152 - When your test script (python or binary) receives a signal like SIGTERM or
153 CTRL_BREAK_EVENT on Windows), send it to all children processes and wait for
154 them to terminate before quitting.
155
156See
Marc-Antoine Ruelc7243592018-05-24 17:04:04 -0400157https://chromium.googlesource.com/infra/luci/luci-py.git/+/master/appengine/swarming/doc/Bot.md#Graceful-termination_aka-the-SIGTERM-and-SIGKILL-dance
marueld928c862017-06-08 08:20:04 -0700158for more information.
159
160*** May the SIGKILL force be with you ***
161"""
162
163
# Currently hardcoded. Eventually could be exposed as a flag once there's value.
# 3 weeks
MAX_AGE_SECS = 21*24*60*60

# TODO(1099655): Enable this once all prod issues are gone.
_USE_GO_ISOLATED_TO_UPLOAD = False
Marc-Antoine Ruel5d7606b2018-06-15 19:06:12 +0000170
# Immutable bundle of everything needed to describe one task run. Each field
# is documented right above its name.
TaskData = collections.namedtuple(
    'TaskData',
    [
        # List of strings; the command line to use, independent of what was
        # specified in the isolated file.
        'command',
        # Relative directory to start command into.
        'relative_cwd',
        # Hash of the .isolated file that must be retrieved to recreate the
        # tree of files to run the target executable. The command specified in
        # the .isolated is executed. Mutually exclusive with command argument.
        'isolated_hash',
        # isolateserver.Storage instance to retrieve remote objects. This
        # object has a reference to an isolateserver.StorageApi, which does
        # the actual I/O.
        'storage',
        # isolateserver.LocalCache instance to keep from retrieving the same
        # objects constantly by caching the objects retrieved. Can be on-disk
        # or in-memory.
        'isolate_cache',
        # Digest of the input root on RBE-CAS.
        'cas_digest',
        # Full CAS instance name.
        'cas_instance',
        # List of paths relative to root_dir to put into the output isolated
        # bundle upon task completion (see link_outputs_to_outdir).
        'outputs',
        # Function (run_dir) => context manager that installs named caches
        # into |run_dir|.
        'install_named_caches',
        # If True, the temporary directory will be deliberately leaked for
        # later examination.
        'leak_temp_dir',
        # Path to the directory to use to create the temporary directory. If
        # not specified, a random temporary directory is created.
        'root_dir',
        # Kills the process if it lasts more than this amount of seconds.
        'hard_timeout',
        # Number of seconds to wait between SIGTERM and SIGKILL.
        'grace_period',
        # Path to a file with bot state, used in place of ${SWARMING_BOT_FILE}
        # task command line argument.
        'bot_file',
        # Logical account to switch LUCI_CONTEXT into.
        'switch_to_account',
        # Context manager dir => CipdInfo, see install_client_and_packages.
        'install_packages_fn',
        # Use go isolated client.
        'use_go_isolated',
        # Cache directory for go `isolated` client.
        'go_cache_dir',
        # Parameters passed to go `isolated` client.
        'go_cache_policies',
        # Cache directory for `cas` client.
        'cas_cache_dir',
        # Parameters passed to `cas` client.
        'cas_cache_policies',
        # Environment variables to set.
        'env',
        # Environment variables to mutate with relative directories.
        # Example: {"ENV_KEY": ['relative', 'paths', 'to', 'prepend']}
        'env_prefix',
        # Lowers the task process priority.
        'lower_priority',
        # subprocess42.Containment instance. Can be None.
        'containment',
    ])
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -0500238
239
def _to_str(s):
  """Converts |s| to the native `str` type. Passes str through as-is.

  On Python 2 this downgrades a unicode instance to a UTF-8 encoded str. On
  Python 3 this upgrades a bytes instance to str by decoding it as UTF-8.
  """
  if isinstance(s, str):
    return s
  if isinstance(s, bytes):
    # Only reachable on Python 3: on Python 2 `bytes` is `str` and was handled
    # above. Without this branch, bytes would hit .encode() below and raise
    # AttributeError.
    return s.decode('utf-8')
  # This is technically incorrect, especially on Windows. In theory
  # sys.getfilesystemencoding() should be used to use the right 'ANSI code
  # page' on Windows, but that causes other problems, as the character set
  # is very limited.
  return s.encode('utf-8')
249
250
def _to_unicode(s):
  """Upgrades a str instance to unicode. Pass unicode and None through as-is.

  Anything else is decoded as UTF-8.
  """
  if s is None or isinstance(s, six.text_type):
    return s
  return s.decode('utf-8')
256
257
def make_temp_dir(prefix, root_dir):
  """Returns a new unique temporary directory.

  Args:
    prefix: prefix of the directory name, forwarded to tempfile.mkdtemp().
    root_dir: parent directory, forwarded to tempfile.mkdtemp() as |dir|.

  Returns:
    The path of the created directory, as a text (unicode) string.
  """
  return six.text_type(tempfile.mkdtemp(prefix=prefix, dir=root_dir))
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +0000261
262
@contextlib.contextmanager
def set_luci_context_account(account, tmp_dir):
  """Sets LUCI_CONTEXT account to be used by the task.

  If 'account' is None or '', does nothing at all. This happens when
  run_isolated.py is called without '--switch-to-account' flag. In this case,
  if run_isolated.py is running in some LUCI_CONTEXT environment, the task will
  just inherit whatever account is already set. This may happen if users invoke
  run_isolated.py explicitly from their code.

  If the requested account is not defined in the context, switches to
  non-authenticated access. This happens for Swarming tasks that don't use
  'task' service accounts.

  If not using LUCI_CONTEXT-based auth, does nothing.
  If already running as requested account, does nothing.

  Args:
    account: logical account id to switch to; falsy to keep the current one.
    tmp_dir: forwarded to luci_context.write() as |_tmpdir|.
  """
  if not account:
    # Not actually switching.
    yield
    return

  local_auth = luci_context.read('local_auth')
  if not local_auth:
    # Not using LUCI_CONTEXT auth at all.
    yield
    return

  # See LUCI_CONTEXT.md for the format of 'local_auth'.
  if local_auth.get('default_account_id') == account:
    # Already set, no need to switch.
    yield
    return

  available = {a['id'] for a in local_auth.get('accounts') or []}
  if account in available:
    logging.info('Switching default LUCI_CONTEXT account to %r', account)
    local_auth['default_account_id'] = account
  else:
    logging.warning(
        'Requested LUCI_CONTEXT account %r is not available (have only %r), '
        'disabling authentication', account, sorted(available))
    local_auth.pop('default_account_id', None)

  # The modified 'local_auth' section is only in effect inside the 'with'.
  with luci_context.write(_tmpdir=tmp_dir, local_auth=local_auth):
    yield
309
310
def process_command(command, out_dir, bot_file):
  """Replaces parameters in a command line.

  Args:
    command: iterable of command line arguments (strings).
    out_dir: value substituted for ${ISOLATED_OUTDIR}.
    bot_file: value substituted for ${SWARMING_BOT_FILE}.

  Returns:
    A new list with every argument passed through replace_parameters().

  Raises:
    ValueError if a parameter is requested in |command| but its value is not
    provided.
  """
  return [replace_parameters(arg, out_dir, bot_file) for arg in command]
319
320
def replace_parameters(arg, out_dir, bot_file):
  """Replaces parameter tokens with appropriate values in a string.

  Args:
    arg: the string to process.
    out_dir: value substituted for ${ISOLATED_OUTDIR}; must be truthy if the
        token is present in |arg|.
    bot_file: value substituted for ${SWARMING_BOT_FILE}; when falsy the token
        is left unchanged and a warning is logged.

  Returns:
    |arg| with the tokens replaced. When a path token was substituted, every
    '/' in the result is also converted to os.sep.

  Raises:
    ValueError if a parameter is requested in |arg| but its value is not
    provided.
  """
  arg = arg.replace(EXECUTABLE_SUFFIX_PARAMETER, cipd.EXECUTABLE_SUFFIX)
  replace_slash = False
  if ISOLATED_OUTDIR_PARAMETER in arg:
    if not out_dir:
      raise ValueError(
          'output directory is requested in command or env var, but not '
          'provided; please specify one')
    arg = arg.replace(ISOLATED_OUTDIR_PARAMETER, out_dir)
    replace_slash = True
  if SWARMING_BOT_FILE_PARAMETER in arg:
    if bot_file:
      arg = arg.replace(SWARMING_BOT_FILE_PARAMETER, bot_file)
      replace_slash = True
    else:
      logging.warning('SWARMING_BOT_FILE_PARAMETER found in command or env '
                      'var, but no bot_file specified. Leaving parameter '
                      'unchanged.')
  if replace_slash:
    # Replace slashes only if parameters are present
    # because of arguments like '${ISOLATED_OUTDIR}/foo/bar'
    arg = arg.replace('/', os.sep)
  return arg
maruela9cfd6f2015-09-15 11:03:15 -0700350
351
Roberto Carrillo71ade6d2018-10-08 22:30:24 +0000352
def get_command_env(tmp_dir, cipd_info, run_dir, env, env_prefixes, out_dir,
                    bot_file):
  """Returns full OS environment to run a command in.

  Sets up TEMP, puts directory with cipd binary in front of PATH, exposes
  CIPD_CACHE_DIR env var, and installs all env_prefixes.

  Args:
    tmp_dir: temp directory.
    cipd_info: CipdInfo object if cipd client is used, None if not.
    run_dir: The root directory the isolated tree is mapped in.
    env: environment variables to use. A falsy value removes the variable.
    env_prefixes: {"ENV_KEY": ['cwd', 'relative', 'paths', 'to', 'prepend']}
    out_dir: Isolated output directory. Required to be != None if any of the
        env vars contain ISOLATED_OUTDIR_PARAMETER.
    bot_file: Required to be != None if any of the env vars contain
        SWARMING_BOT_FILE_PARAMETER.

  Returns:
    A dict based on a copy of os.environ; os.environ itself is not modified.
  """
  out = os.environ.copy()
  for k, v in env.items():
    if not v:
      out.pop(k, None)
    else:
      out[k] = replace_parameters(v, out_dir, bot_file)

  if cipd_info:
    bin_dir = _to_str(os.path.dirname(cipd_info.client.binary_path))
    # PATH may be missing: either it is not set in the parent environment, or
    # |env| just removed it with an empty value. Do not raise KeyError and do
    # not leave a dangling separator in that case.
    cur_path = out.get('PATH')
    if cur_path:
      out['PATH'] = '%s%s%s' % (bin_dir, os.pathsep, cur_path)
    else:
      out['PATH'] = bin_dir
    out['CIPD_CACHE_DIR'] = _to_str(cipd_info.cache_dir)

  for key, paths in env_prefixes.items():
    assert isinstance(paths, list), paths
    paths = [os.path.normpath(os.path.join(run_dir, p)) for p in paths]
    cur = out.get(key)
    if cur:
      paths.append(cur)
    out[key] = _to_str(os.path.pathsep.join(paths))

  tmp_dir = _to_str(tmp_dir)
  # pylint: disable=line-too-long
  # * python respects $TMPDIR, $TEMP, and $TMP in this order, regardless of
  #   platform. So $TMPDIR must be set on all platforms.
  #   https://github.com/python/cpython/blob/2.7/Lib/tempfile.py#L155
  out['TMPDIR'] = tmp_dir
  if sys.platform == 'win32':
    # * chromium's base utils uses GetTempPath().
    #   https://cs.chromium.org/chromium/src/base/files/file_util_win.cc?q=GetTempPath
    # * Go uses GetTempPath().
    # * GetTempPath() uses %TMP%, then %TEMP%, then other stuff. So %TMP% must
    #   be set.
    #   https://docs.microsoft.com/en-us/windows/desktop/api/fileapi/nf-fileapi-gettemppathw
    out['TMP'] = tmp_dir
    # https://blogs.msdn.microsoft.com/oldnewthing/20150417-00/?p=44213
    out['TEMP'] = tmp_dir
  elif sys.platform == 'darwin':
    # * Chromium uses an hack on macOS before calling into
    #   NSTemporaryDirectory().
    #   https://cs.chromium.org/chromium/src/base/files/file_util_mac.mm?q=GetTempDir
    #   https://developer.apple.com/documentation/foundation/1409211-nstemporarydirectory
    out['MAC_CHROMIUM_TMPDIR'] = tmp_dir
  else:
    # TMPDIR is specified as the POSIX standard envvar for the temp directory.
    # http://pubs.opengroup.org/onlinepubs/9699919799/basedefs/V1_chap08.html
    # * mktemp on linux respects $TMPDIR.
    # * Chromium respects $TMPDIR on linux.
    #   https://cs.chromium.org/chromium/src/base/files/file_util_posix.cc?q=GetTempDir
    # * Go uses $TMPDIR.
    #   https://go.googlesource.com/go/+/go1.10.3/src/os/file_unix.go#307
    pass
  return out
vadimsh232f5a82017-01-20 19:23:44 -0800423
424
def run_command(
    command, cwd, env, hard_timeout, grace_period, lower_priority, containment):
  """Runs the command.

  The child is started detached. On hard timeout or on a stop signal, it is
  sent a terminate request, given |grace_period| to exit, then killed.

  Args:
    command: command line, forwarded to subprocess42.Popen().
    cwd: working directory of the child process.
    env: environment of the child process.
    hard_timeout: seconds to wait before terminating; a falsy value is passed
        to wait() as None.
    grace_period: seconds to wait after terminating before killing; a falsy
        value is passed to wait() as None.
    lower_priority: forwarded to subprocess42.Popen().
    containment: forwarded to subprocess42.Popen().

  Returns:
    tuple(process exit code, bool if had a hard timeout)
  """
  logging.info(
      'run_command(%s, %s, %s, %s, %s, %s)',
      command, cwd, hard_timeout, grace_period, lower_priority, containment)

  exit_code = None
  had_hard_timeout = False
  with tools.Profiler('RunTest'):
    proc = None
    # A list so that handler() can record the signal without 'nonlocal'.
    had_signal = []
    try:
      # TODO(maruel): This code is imperfect. It doesn't handle well signals
      # during the download phase and there's short windows where things can go
      # wrong.
      def handler(signum, _frame):
        if proc and not had_signal:
          logging.info('Received signal %d', signum)
          had_signal.append(True)
          # Reuse the timeout code path below to terminate the child.
          raise subprocess42.TimeoutExpired(command, None)

      proc = subprocess42.Popen(
          command, cwd=cwd, env=env, detached=True, close_fds=True,
          lower_priority=lower_priority, containment=containment)
      with subprocess42.set_signal_handler(subprocess42.STOP_SIGNALS, handler):
        try:
          exit_code = proc.wait(hard_timeout or None)
        except subprocess42.TimeoutExpired:
          if not had_signal:
            logging.warning('Hard timeout')
            had_hard_timeout = True
          logging.warning('Sending SIGTERM')
          proc.terminate()

      kill_sent = False
      # Ignore signals in grace period. Forcibly give the grace period to the
      # child process.
      if exit_code is None:
        ignore = lambda *_: None
        with subprocess42.set_signal_handler(subprocess42.STOP_SIGNALS, ignore):
          try:
            exit_code = proc.wait(grace_period or None)
          except subprocess42.TimeoutExpired:
            # Now kill for real. The user can distinguish between the
            # following states:
            # - signal but process exited within grace period,
            #   hard_timed_out will be set but the process exit code will be
            #   script provided.
            # - processed exited late, exit code will be -9 on posix.
            logging.warning('Grace exhausted; sending SIGKILL')
            proc.kill()
            kill_sent = True
      logging.info('Waiting for process exit')
      exit_code = proc.wait()

      # the process group / job object may be dangling so if we didn't kill
      # it already, give it a poke now.
      if not kill_sent:
        proc.kill()
    except OSError as e:
      # This is not considered to be an internal error. The executable simply
      # does not exist.
      sys.stderr.write(
          '<The executable does not exist, a dependent library is missing or '
          'the command line is too long>\n'
          '<Check for missing .so/.dll in the .isolate or GN file or length of '
          'command line args>\n'
          '<Command: %s, Exception: %s>\n' % (command, e))
      if os.environ.get('SWARMING_TASK_ID'):
        # Give an additional hint when running as a swarming task.
        sys.stderr.write(
            '<See the task\'s page for commands to help diagnose this issue '
            'by reproducing the task locally>\n')
      exit_code = 1
  logging.info(
      'Command finished with exit code %d (%s)',
      exit_code, hex(0xffffffff & exit_code))
  return exit_code, had_hard_timeout
maruela9cfd6f2015-09-15 11:03:15 -0700508
509
def _run_go_cmd_and_wait(cmd):
  """Runs an external Go command, `isolated` or `cas`, and waits for it.

  While this is a generic function to launch a subprocess, it has logic that
  is specific to Go `isolated` and `cas` for waiting and logging.

  Args:
    cmd: list of strings; the command line to run.

  Returns:
    The subprocess object.

  Raises:
    ValueError if the command exits with a non-zero code, or if it is still
    running after the maximum wait and had to be terminated.
  """
  cmd_str = ' '.join(cmd)
  try:
    proc = subprocess42.Popen(cmd)

    check_period_sec = 30
    max_checks = 100
    # max timeout = max_checks * check_period_sec = 50 minutes
    for i in range(max_checks):
      # Wait in short slices and print a progress line after each one. This is
      # to prevent I/O timeout error during setup.
      try:
        retcode = proc.wait(check_period_sec)
      except subprocess42.TimeoutExpired:
        print('still running (after %d seconds)' % ((i + 1) * check_period_sec))
        continue
      if retcode != 0:
        raise ValueError("retcode is not 0: %s (cmd=%s)" % (retcode, cmd_str))
      break
    else:
      # The loop never hit 'break': the process outlived every check.
      proc.terminate()
      try:
        proc.wait(check_period_sec)
      except subprocess42.TimeoutExpired:
        logging.exception(
            "failed to terminate? timeout happened after %d seconds",
            check_period_sec)
        proc.kill()
      proc.wait()
      # Raise unconditionally, because |proc| was forcefully terminated.
      raise ValueError("timedout after %d seconds (cmd=%s)" %
                       (check_period_sec * max_checks, cmd_str))

    return proc
  except Exception:
    logging.exception('Failed to run Go cmd %s', cmd_str)
    raise
Ye Kuangc0cf9ca2020-07-16 08:56:51 +0000557
558
def _fetch_and_map_with_cas(cas_client, digest, instance, output_dir, cache_dir,
                            policies):
  """Fetches a CAS tree using the `cas` client and returns download stats.

  Args:
    cas_client: path to the `cas` client executable.
    digest: digest of the tree to download.
    instance: CAS instance name, passed as -cas-instance.
    output_dir: directory to create the tree in, passed as -dir.
    cache_dir: cache directory, passed as -cache-dir.
    policies: object with |max_cache_size| and |min_free_space| attributes.

  Returns:
    dict with keys 'duration', 'items_cold' and 'items_hot'. For the empty
    directory digest, nothing is run and the stats are zero/empty.
  """

  # TODO(crbug.com/chrome-operations/49):
  # remove this after isolate to RBE-CAS migration.
  _CAS_EMPTY_DIR_DIGEST = (
      'e3b0c44298fc1c149afbf4c8996fb92427ae41e4649b934ca495991b7852b855/0')
  if digest == _CAS_EMPTY_DIR_DIGEST:
    return {
        'duration': 0.0,
        'items_cold': '',
        'items_hot': '',
    }

  start = time.time()
  # Only the path is needed: the client writes its stats there, so the handle
  # is closed right away.
  result_json_handle, result_json_path = tempfile.mkstemp(
      prefix=u'fetch-and-map-result-', suffix=u'.json')
  os.close(result_json_handle)
  try:
    cmd = [
        cas_client,
        'download',
        '-digest',
        digest,
        '-cas-instance',
        instance,
        # flags for cache.
        '-cache-dir',
        cache_dir,
        '-cache-max-size',
        str(policies.max_cache_size),
        '-cache-min-free-space',
        str(policies.min_free_space),
        # flags for output.
        '-dir',
        output_dir,
        '-dump-stats-json',
        result_json_path,
    ]
    _run_go_cmd_and_wait(cmd)

    with open(result_json_path) as json_file:
      result_json = json.load(json_file)

    return {
        'duration': time.time() - start,
        'items_cold': result_json['items_cold'],
        'items_hot': result_json['items_hot'],
    }
  finally:
    fs.remove(result_json_path)
614
615
def _fetch_and_map_with_go_isolated(isolated_hash, storage, outdir,
                                    go_cache_dir, policies, isolated_client):
  """Fetches an isolated tree using the go client and returns stats.

  Args:
    isolated_hash: hash of the .isolated file, passed as -isolated.
    storage: object whose |server_ref| provides |url| and |namespace|.
    outdir: directory to create the tree in, passed as -output-dir.
    go_cache_dir: cache directory, passed as -cache-dir.
    policies: object with |max_items|, |max_cache_size| and |min_free_space|
        attributes.
    isolated_client: path to the go `isolated` client executable.

  Returns:
    dict with keys 'duration', 'items_cold', 'items_hot',
    'initial_number_items' and 'initial_size'.
  """
  start = time.time()
  server_ref = storage.server_ref
  # Only the path is needed: the client writes its result there, so the handle
  # is closed right away.
  result_json_handle, result_json_path = tempfile.mkstemp(
      prefix=u'fetch-and-map-result-', suffix=u'.json')
  os.close(result_json_handle)
  try:
    cmd = [
        isolated_client,
        'download',
        '-isolate-server',
        server_ref.url,
        '-namespace',
        server_ref.namespace,
        '-isolated',
        isolated_hash,

        # flags for cache
        '-cache-dir',
        go_cache_dir,
        '-cache-max-items',
        str(policies.max_items),
        '-cache-max-size',
        str(policies.max_cache_size),
        '-cache-min-free-space',
        str(policies.min_free_space),

        # flags for output
        '-output-dir',
        outdir,
        '-fetch-and-map-result-json',
        result_json_path,
    ]
    _run_go_cmd_and_wait(cmd)

    with open(result_json_path) as json_file:
      result_json = json.load(json_file)

    return {
        'duration': time.time() - start,
        'items_cold': result_json['items_cold'],
        'items_hot': result_json['items_hot'],
        'initial_number_items': result_json['initial_number_items'],
        'initial_size': result_json['initial_size'],
    }
  finally:
    fs.remove(result_json_path)
668
669
# TODO(crbug.com/932396): remove this function.
def fetch_and_map(isolated_hash, storage, cache, outdir):
  """Fetches an isolated tree with the Python client and returns stats.

  Returns:
    dict with 'duration' (seconds elapsed), 'items_cold' (packed sorted
    entries of cache.added) and 'items_hot' (packed sorted entries of
    cache.used that are not accounted for by cache.added).
  """
  began = time.time()
  isolateserver.fetch_isolated(
      isolated_hash=isolated_hash,
      storage=storage,
      cache=cache,
      outdir=outdir,
      use_symlinks=False)

  def encode(sizes):
    # Stats are transported as base64 text of the large.pack()'ed sorted list.
    return base64.b64encode(large.pack(sorted(sizes))).decode()

  # Multiset difference: what was used minus what had to be added.
  used = collections.Counter(cache.used)
  added = collections.Counter(cache.added)
  reused = used - added
  elapsed = time.time() - began
  return {
      'duration': elapsed,
      'items_cold': encode(cache.added),
      'items_hot': encode(reused.elements()),
  }
687
688
def link_outputs_to_outdir(run_dir, out_dir, outputs):
  """Makes the named outputs available under out_dir so they can be uploaded.

  Does nothing when |outputs| is empty. Otherwise the needed directories are
  created under |out_dir| and each output is copied from |run_dir| with
  copy_recursively().

  Arguments:
  - run_dir: directory the outputs are relative to.
  - out_dir: directory receiving the outputs.
  - outputs: iterable of paths relative to run_dir.
  """
  if outputs:
    isolateserver.create_directories(out_dir, outputs)
    for rel_path in outputs:
      source = os.path.join(run_dir, rel_path)
      destination = os.path.join(out_dir, rel_path)
      copy_recursively(source, destination)
699
700
def copy_recursively(src, dst):
  """Efficiently copies a file or directory from src to dst.

  `src` may be a file, a directory, or a symlink to a file or directory.
  All symlinks are replaced with their targets, so the resulting directory
  structure under `dst` will never have any symlinks.

  To increase speed, copy_recursively hardlinks individual files into the
  (newly created) directory structure if possible, unlike Python's
  shutil.copytree().

  OSError is never propagated: the failure is logged and the entry is skipped.
  A chain of symlinks that is too long (e.g. symlinks pointing at each other)
  is logged and skipped as well instead of being followed forever.

  Arguments:
  - src: path to copy from.
  - dst: path to create.
  """
  # Upper bound on the number of symlinks followed for a single entry;
  # exceeding it is treated as a symlink loop.
  max_symlink_hops = 40
  orig_src = src
  try:
    # Replace symlinks with their final target.
    hops = 0
    while fs.islink(src):
      hops += 1
      if hops > max_symlink_hops:
        # islink() stays true on every member of a cycle, so without this
        # guard the loop would never terminate.
        logging.warning(
            'Too many levels of symbolic links while resolving %s (stuck at '
            '%s), skipping', orig_src, src)
        return
      res = fs.readlink(src)
      # A relative target is relative to the directory holding the link; an
      # absolute target replaces the path entirely.
      src = os.path.join(os.path.dirname(src), res)

    # Note that fs.isfile (which is a wrapper around os.path.isfile) throws
    # an exception if src does not exist. A warning will be logged in that case.
    if fs.isfile(src):
      file_path.link_file(dst, src, file_path.HARDLINK_WITH_FALLBACK)
      return

    if not fs.exists(dst):
      os.makedirs(dst)

    for child in fs.listdir(src):
      copy_recursively(os.path.join(src, child), os.path.join(dst, child))

  except OSError as e:
    if e.errno == errno.ENOENT:
      logging.warning('Path %s does not exist or %s is a broken symlink',
                      src, orig_src)
    else:
      logging.info("Couldn't collect output file %s: %s", src, e)
aludwin0a8e17d2016-10-27 15:57:39 -0700738
739
def _upload_with_py(storage, out_dir):
  """Archives |out_dir| to |storage| with the Python isolateserver client.

  Returns:
    tuple(isolated, cold, hot) where isolated is the first value of the
    archive results, and cold/hot are the base64 text of the packed, sorted
    sizes of the cold and hot items.

  Raises:
    isolateserver.Aborted: re-raised after a message is written to stderr.
  """

  def pack_sizes(items):
    sizes = sorted(item.size for item in items)
    return base64.b64encode(large.pack(sizes)).decode()

  try:
    results, cold_items, hot_items = isolateserver.archive_files_to_storage(
        storage, [out_dir], None, verify_push=True)

    isolated = list(results.values())[0]
    return isolated, pack_sizes(cold_items), pack_sizes(hot_items)

  except isolateserver.Aborted:
    # This happens when a signal SIGTERM was received while uploading data.
    # There are 2 causes:
    # - The task was too slow and was about to be killed anyway due to
    #   exceeding the hard timeout.
    # - The amount of data uploaded back is very large and took too much
    #   time to archive.
    sys.stderr.write('Received SIGTERM while uploading')
    # Re-raise, so it will be treated as an internal failure.
    raise
765
766
def _upload_with_go(storage, outdir, isolated_client):
  """Uploads results back using the Go `isolated` CLI.

  The client dumps the isolated hash and its stats into two temporary files,
  which are read back and always removed afterwards. A failing run is retried
  with an exponential backoff until two minutes have elapsed.

  Returns:
    tuple(isolated, items_cold, items_hot): the content of the hash file and
    the two stats values read from the JSON stats file.
  """
  ref = storage.server_ref
  hash_fd, hash_path = tempfile.mkstemp(
      prefix=u'isolated-hash-', suffix=u'.txt')
  stats_fd, stats_path = tempfile.mkstemp(
      prefix=u'dump-stats-', suffix=u'.json')
  # Only the paths are needed; the Go client writes the files itself.
  os.close(hash_fd)
  os.close(stats_fd)
  try:
    cmd = [isolated_client, 'archive']
    cmd.extend(['-isolate-server', ref.url])
    cmd.extend(['-namespace', ref.namespace])
    # Format: <working directory>:<relative path to dir>
    cmd.extend(['-dirs', outdir + ':'])
    # output
    cmd.extend(['-dump-hash', hash_path])
    cmd.extend(['-dump-stats-json', stats_path])
    cmd.append('-quiet')

    # Will do exponential backoff, e.g. 10, 20, 40...
    # This mitigates https://crbug.com/1094369, where there is a data race on
    # the uploaded files.
    delay = 10
    deadline = time.time() + 60 * 2
    uploaded = False
    while not uploaded:
      try:
        _run_go_cmd_and_wait(cmd)
        uploaded = True
      except Exception:
        if time.time() > deadline:
          # This is to not wait task having leaked process long time.
          raise

        on_error.report('error before %d second backoff' % delay)
        logging.exception(
            '_run_go_cmd_and_wait() failed, will retry after %d seconds',
            delay)
        time.sleep(delay)
        delay *= 2

    with open(hash_path) as hash_file:
      isolated = hash_file.read()
    with open(stats_path) as stats_file:
      upload_stats = json.load(stats_file)

    return isolated, upload_stats['items_cold'], upload_stats['items_hot']
  finally:
    fs.remove(hash_path)
    fs.remove(stats_path)
827
828
def upload_out_dir(storage, out_dir, go_isolated_client):
  """Uploads the results in |out_dir| back, if there is any.

  The Go client is used when _USE_GO_ISOLATED_TO_UPLOAD is set and
  |go_isolated_client| is not None; the Python client is used otherwise.

  Returns:
    tuple(outputs_ref, stats)
    - outputs_ref: a dict referring to the results archived back to the isolated
        server, or None when out_dir is missing or empty.
    - stats: uploading stats.
  """
  outputs_ref = None
  cold = hot = ''
  began = time.time()

  # Upload out_dir and generate a .isolated file out of this directory. It is
  # only done if files were written in the directory.
  has_outputs = fs.isdir(out_dir) and fs.listdir(out_dir)
  if has_outputs:
    with tools.Profiler('ArchiveOutput'):
      use_go = _USE_GO_ISOLATED_TO_UPLOAD and go_isolated_client is not None
      if not use_go:
        uploaded = _upload_with_py(storage, out_dir)
      else:
        uploaded = _upload_with_go(storage, out_dir, go_isolated_client)
      isolated, cold, hot = uploaded
      outputs_ref = {
          'isolated': isolated,
          'isolatedserver': storage.server_ref.url,
          'namespace': storage.server_ref.namespace,
      }

  elapsed = time.time() - began
  return outputs_ref, {
      'duration': elapsed,
      'items_cold': cold,
      'items_hot': hot,
  }
maruela9cfd6f2015-09-15 11:03:15 -0700865
866
def upload_outdir_with_cas(cas_client, cas_instance, outdir):
  """Uploads the results in |outdir| with the `cas` client.

  The client dumps the root digest and its stats into two temporary files,
  which are read back and always removed afterwards.

  Returns:
    tuple(root_digest, stats)
    - root_digest: a dict with 'cas_instance' and the 'digest' ('hash' and
        'size_bytes') of the output directory.
    - stats: uploading stats read from the client, plus 'duration'.
  """
  digest_fd, digest_path = tempfile.mkstemp(
      prefix=u'cas-digest', suffix=u'.txt')
  os.close(digest_fd)
  stats_fd, stats_path = tempfile.mkstemp(
      prefix=u'upload-stats', suffix=u'.json')
  os.close(stats_fd)

  try:
    cmd = [cas_client, 'archive']
    cmd += ['-cas-instance', cas_instance]
    # Format: <working directory>:<relative path to dir>
    cmd += ['-paths', outdir + ':']
    # output
    cmd += ['-dump-digest', digest_path]
    cmd += ['-dump-stats-json', stats_path]

    began = time.time()

    _run_go_cmd_and_wait(cmd)

    with open(digest_path) as digest_file:
      # The digest is dumped as "<hash>/<size in bytes>".
      digest_hash, digest_size = digest_file.read().split('/')
    digest = {
        'hash': digest_hash,
        'size_bytes': int(digest_size),
    }
    cas_output_root = {
        'cas_instance': cas_instance,
        'digest': digest,
    }

    with open(stats_path) as stats_file:
      stats = json.load(stats_file)
    stats['duration'] = time.time() - began

    return cas_output_root, stats
  finally:
    fs.remove(digest_path)
    fs.remove(stats_path)
921
922
def map_and_run(data, constant_run_path):
  """Runs a command with optional isolated input/output.

  Sets up the run, output, temporary and client directories under
  data.root_dir, installs packages, fetches the inputs (isolated or CAS),
  runs the command, uploads the outputs and finally removes the directories.

  Arguments:
  - data: TaskData instance.
  - constant_run_path: if true (and data.root_dir is set), the command runs in
    the fixed ISOLATED_RUN_DIR directory under data.root_dir, which is wiped
    first when it already exists; otherwise the run directory is created with
    make_temp_dir().

  Returns metadata about the result.
  """

  if data.isolate_cache:
    download_stats = {
        #'duration': 0.,
        'initial_number_items': len(data.isolate_cache),
        'initial_size': data.isolate_cache.total_size,
        #'items_cold': '<large.pack()>',
        #'items_hot': '<large.pack()>',
    }
  else:
    # TODO(tikuta): take stats from state.json in this case too.
    download_stats = {}

  result = {
      'duration': None,
      'exit_code': None,
      'had_hard_timeout': False,
      'internal_failure': 'run_isolated did not complete properly',
      'stats': {
          #'cipd': {
          #  'duration': 0.,
          #  'get_client_duration': 0.,
          #},
          'isolated': {
              'download': download_stats,
              #'upload': {
              #  'duration': 0.,
              #  'items_cold': '<large.pack()>',
              #  'items_hot': '<large.pack()>',
              #},
          },
      },
      #'cipd_pins': {
      #  'packages': [
      #    {'package_name': ..., 'version': ..., 'path': ...},
      #    ...
      #  ],
      #  'client_package': {'package_name': ..., 'version': ...},
      #},
      'outputs_ref': None,
      'cas_output_root': None,
      'version': 5,
  }

  assert os.path.isabs(data.root_dir), ("data.root_dir is not abs path: %s" %
                                        data.root_dir)
  file_path.ensure_tree(data.root_dir, 0o700)

  # See comment for these constants.
  # TODO(maruel): This is not obvious. Change this to become an error once we
  # make the constant_run_path an exposed flag.
  if constant_run_path and data.root_dir:
    run_dir = os.path.join(data.root_dir, ISOLATED_RUN_DIR)
    if os.path.isdir(run_dir):
      file_path.rmtree(run_dir)
    os.mkdir(run_dir, 0o700)
  else:
    run_dir = make_temp_dir(ISOLATED_RUN_DIR, data.root_dir)

  # True if CAS is used for download/upload files.
  use_cas = bool(data.cas_digest)

  # storage should be normally set but don't crash if it is not. This can happen
  # as Swarming task can run without an isolate server.
  out_dir = None
  if data.storage or use_cas:
    out_dir = make_temp_dir(ISOLATED_OUT_DIR, data.root_dir)
  tmp_dir = make_temp_dir(ISOLATED_TMP_DIR, data.root_dir)
  isolated_client_dir = make_temp_dir(ISOLATED_CLIENT_DIR, data.root_dir)
  cwd = run_dir
  if data.relative_cwd:
    cwd = os.path.normpath(os.path.join(cwd, data.relative_cwd))
  command = data.command
  go_isolated_client = None
  if data.use_go_isolated:
    go_isolated_client = os.path.join(isolated_client_dir,
                                      'isolated' + cipd.EXECUTABLE_SUFFIX)

  cas_client = None
  cas_client_dir = make_temp_dir(_CAS_CLIENT_DIR, data.root_dir)
  if use_cas:
    cas_client = os.path.join(cas_client_dir, 'cas' + cipd.EXECUTABLE_SUFFIX)

  try:
    with data.install_packages_fn(run_dir, isolated_client_dir,
                                  cas_client_dir) as cipd_info:
      if cipd_info:
        result['stats']['cipd'] = cipd_info.stats
        result['cipd_pins'] = cipd_info.pins

      isolated_stats = result['stats'].setdefault('isolated', {})
      if data.isolated_hash:
        if data.use_go_isolated:
          stats = _fetch_and_map_with_go_isolated(
              isolated_hash=data.isolated_hash,
              storage=data.storage,
              outdir=run_dir,
              go_cache_dir=data.go_cache_dir,
              policies=data.go_cache_policies,
              isolated_client=go_isolated_client)
        else:
          stats = fetch_and_map(
              isolated_hash=data.isolated_hash,
              storage=data.storage,
              cache=data.isolate_cache,
              outdir=run_dir)
        isolated_stats['download'].update(stats)

      elif data.cas_digest:
        stats = _fetch_and_map_with_cas(
            cas_client=cas_client,
            digest=data.cas_digest,
            instance=data.cas_instance,
            output_dir=run_dir,
            cache_dir=data.cas_cache_dir,
            policies=data.cas_cache_policies)
        isolated_stats['download'].update(stats)

      if not command:
        # Handle this as a task failure, not an internal failure.
        # NOTE(review): 'internal_failure' keeps its initial non-None value on
        # this early return - confirm that this is intended.
        sys.stderr.write(
            '<No command was specified!>\n'
            '<Please secify a command when triggering your Swarming task>\n')
        result['exit_code'] = 1
        return result

      # cwd must be run_dir itself or a path below it. The trailing separator
      # matters: a bare prefix test would accept a sibling directory whose name
      # merely starts with run_dir's name (e.g. relative_cwd='../<name>_x').
      if cwd != run_dir and not cwd.startswith(os.path.join(run_dir, '')):
        # Handle this as a task failure, not an internal failure. This is a
        # 'last chance' way to gate against directory escape.
        sys.stderr.write('<Relative CWD is outside of run directory!>\n')
        result['exit_code'] = 1
        return result

      if not os.path.isdir(cwd):
        # Accepts relative_cwd that does not exist.
        os.makedirs(cwd, 0o700)

      # If we have an explicit list of files to return, make sure their
      # directories exist now.
      if data.storage and data.outputs:
        isolateserver.create_directories(run_dir, data.outputs)

      with data.install_named_caches(run_dir):
        sys.stdout.flush()
        start = time.time()
        try:
          # Need to switch the default account before 'get_command_env' call,
          # so it can grab correct value of LUCI_CONTEXT env var.
          with set_luci_context_account(data.switch_to_account, tmp_dir):
            env = get_command_env(
                tmp_dir, cipd_info, run_dir, data.env, data.env_prefix, out_dir,
                data.bot_file)
            command = tools.find_executable(command, env)
            command = process_command(command, out_dir, data.bot_file)
            file_path.ensure_command_has_abs_path(command, cwd)

            result['exit_code'], result['had_hard_timeout'] = run_command(
                command, cwd, env, data.hard_timeout, data.grace_period,
                data.lower_priority, data.containment)
        finally:
          result['duration'] = max(time.time() - start, 0)

      # NOTE(review): the upload is placed after the named caches context and
      # inside the packages context - confirm this nesting against the
      # canonical file.
      if out_dir:
        # Try to link files to the output directory, if specified.
        link_outputs_to_outdir(run_dir, out_dir, data.outputs)
        isolated_stats = result['stats'].setdefault('isolated', {})
        if use_cas:
          result['cas_output_root'], isolated_stats['upload'] = (
              upload_outdir_with_cas(cas_client, data.cas_instance, out_dir))
        else:
          # This could use |go_isolated_client|, so make sure it runs when the
          # CIPD package still exists.
          result['outputs_ref'], isolated_stats['upload'] = (
              upload_out_dir(data.storage, out_dir, go_isolated_client))
    # We successfully ran the command, set internal_failure back to
    # None (even if the command failed, it's not an internal error).
    result['internal_failure'] = None
  except Exception as e:
    # An internal error occurred. Report accordingly so the swarming task will
    # be retried automatically.
    logging.exception('internal failure: %s', e)
    result['internal_failure'] = str(e)
    on_error.report(None)

  # Clean up
  finally:
    try:
      success = True
      if data.leak_temp_dir:
        logging.warning(
            'Deliberately leaking %s for later examination', run_dir)
      else:
        # On Windows rmtree(run_dir) call above has a synchronization effect: it
        # finishes only when all task child processes terminate (since a running
        # process locks *.exe file). Examine out_dir only after that call
        # completes (since child processes may write to out_dir too and we need
        # to wait for them to finish).
        dirs_to_remove = [run_dir, tmp_dir, isolated_client_dir, cas_client_dir]
        if out_dir:
          dirs_to_remove.append(out_dir)
        for directory in dirs_to_remove:
          if not fs.isdir(directory):
            continue
          # Always attempt the removal, even after an earlier failure, so one
          # stubborn directory does not leak all the following ones.
          try:
            removed = file_path.rmtree(directory)
          except OSError as e:
            logging.error('rmtree(%r) failed: %s', directory, e)
            removed = False
          if not removed:
            success = False
            sys.stderr.write(
                OUTLIVING_ZOMBIE_MSG % (directory, data.grace_period))
            # tasklist.exe only exists on Windows; elsewhere the call would
            # raise and be reported as an internal failure.
            if sys.platform == 'win32':
              subprocess42.check_call(['tasklist.exe', '/V'], stdout=sys.stderr)
            if result['exit_code'] == 0:
              result['exit_code'] = 1

      if not success and result['exit_code'] == 0:
        result['exit_code'] = 1
    except Exception as e:
      # Swallow any exception in the main finally clause.
      if out_dir:
        logging.exception('Leaking out_dir %s: %s', out_dir, e)
      result['internal_failure'] = str(e)
      on_error.report(None)
  return result
Marc-Antoine Ruel2283ad12014-02-09 11:14:57 -05001157
1158
def run_tha_test(data, result_json):
  """Runs an executable and records execution metadata.

  If isolated_hash is specified, downloads the dependencies in the cache,
  hardlinks them into a temporary directory and runs the command specified in
  the .isolated.

  A temporary directory is created to hold the output files. The content inside
  this directory will be uploaded back to |storage| packaged as a .isolated
  file.

  Arguments:
  - data: TaskData instance.
  - result_json: File path to dump result metadata into. If set, the process
    exit code is always 0 unless an internal error occurred.

  Returns:
    Process exit code that should be used.
  """
  if result_json:
    # Write a json output file right away in case we get killed.
    placeholder = {
        'exit_code': None,
        'had_hard_timeout': False,
        'internal_failure': 'Was terminated before completion',
        'outputs_ref': None,
        'cas_output_root': None,
        'version': 5,
    }
    tools.write_json(result_json, placeholder, dense=True)

  # run_isolated exit code. Depends on if result_json is used or not.
  result = map_and_run(data, True)
  logging.info('Result:\n%s', tools.format_json(result, dense=True))

  if result_json:
    # We've found tests to delete 'work' when quitting, causing an exception
    # here. Try to recreate the directory if necessary.
    file_path.ensure_tree(os.path.dirname(result_json))
    tools.write_json(result_json, result, dense=True)
    # Only return 1 if there was an internal error.
    return 1 if result['internal_failure'] else 0

  # Marshall into old-style inline output.
  outputs_ref = result['outputs_ref']
  if outputs_ref:
    # pylint: disable=unsubscriptable-object
    legacy_ref = {
        'hash': outputs_ref['isolated'],
        'namespace': outputs_ref['namespace'],
        'storage': outputs_ref['isolatedserver'],
    }
    sys.stdout.flush()
    print('[run_isolated_out_hack]%s[/run_isolated_out_hack]' %
          tools.format_json(legacy_ref, dense=True))
    sys.stdout.flush()
  return result['exit_code'] or (1 if result['internal_failure'] else 0)
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001215
1216
# Yielded by 'install_client_and_packages'.
CipdInfo = collections.namedtuple(
    'CipdInfo',
    (
        # cipd.CipdClient object.
        'client',
        # Absolute path to bot-global cipd tag and instance cache.
        'cache_dir',
        # Dict with stats to return to the server.
        'stats',
        # Dict with installed cipd pins to return to the server.
        'pins',
    ))
1224
1225
@contextlib.contextmanager
def noop_install_packages(_run_dir, _isolated_dir, _cas_dir):
  """Stand-in for 'install_client_and_packages' when cipd is disabled.

  Ignores its arguments, installs nothing and yields None.
  """
  yield
1230
1231
Takuto Ikuta2efc7792019-11-27 14:33:34 +00001232def _install_packages(run_dir, cipd_cache_dir, client, packages):
iannuccib58d10d2017-03-18 02:00:25 -07001233 """Calls 'cipd ensure' for packages.
1234
1235 Args:
1236 run_dir (str): root of installation.
1237 cipd_cache_dir (str): the directory to use for the cipd package cache.
1238 client (CipdClient): the cipd client to use
1239 packages: packages to install, list [(path, package_name, version), ...].
iannuccib58d10d2017-03-18 02:00:25 -07001240
1241 Returns: list of pinned packages. Looks like [
1242 {
1243 'path': 'subdirectory',
1244 'package_name': 'resolved/package/name',
1245 'version': 'deadbeef...',
1246 },
1247 ...
1248 ]
1249 """
1250 package_pins = [None]*len(packages)
1251 def insert_pin(path, name, version, idx):
1252 package_pins[idx] = {
1253 'package_name': name,
1254 # swarming deals with 'root' as '.'
1255 'path': path or '.',
1256 'version': version,
1257 }
1258
1259 by_path = collections.defaultdict(list)
1260 for i, (path, name, version) in enumerate(packages):
1261 # cipd deals with 'root' as ''
1262 if path == '.':
1263 path = ''
1264 by_path[path].append((name, version, i))
1265
1266 pins = client.ensure(
Takuto Ikuta2efc7792019-11-27 14:33:34 +00001267 run_dir,
1268 {
1269 subdir: [(name, vers) for name, vers, _ in pkgs
1270 ] for subdir, pkgs in by_path.items()
1271 },
1272 cache_dir=cipd_cache_dir,
iannuccib58d10d2017-03-18 02:00:25 -07001273 )
1274
Marc-Antoine Ruel04903a32019-10-09 21:09:25 +00001275 for subdir, pin_list in sorted(pins.items()):
iannuccib58d10d2017-03-18 02:00:25 -07001276 this_subdir = by_path[subdir]
1277 for i, (name, version) in enumerate(pin_list):
1278 insert_pin(subdir, name, version, this_subdir[i][2])
1279
Robert Iannucci461b30d2017-12-13 11:34:03 -08001280 assert None not in package_pins, (packages, pins, package_pins)
iannuccib58d10d2017-03-18 02:00:25 -07001281
1282 return package_pins
1283
1284
vadimsh232f5a82017-01-20 19:23:44 -08001285@contextlib.contextmanager
Takuto Ikuta2efc7792019-11-27 14:33:34 +00001286def install_client_and_packages(run_dir, packages, service_url,
Takuto Ikutab7ce0e32019-11-27 23:26:18 +00001287 client_package_name, client_version, cache_dir,
Junji Watanabe4b890ef2020-09-16 01:43:27 +00001288 isolated_dir, cas_dir):
vadimsh902948e2017-01-20 15:57:32 -08001289 """Bootstraps CIPD client and installs CIPD packages.
iannucci96fcccc2016-08-30 15:52:22 -07001290
vadimsh232f5a82017-01-20 19:23:44 -08001291 Yields CipdClient, stats, client info and pins (as single CipdInfo object).
1292
1293 Pins and the CIPD client info are in the form of:
iannucci96fcccc2016-08-30 15:52:22 -07001294 [
1295 {
1296 "path": path, "package_name": package_name, "version": version,
1297 },
1298 ...
1299 ]
vadimsh902948e2017-01-20 15:57:32 -08001300 (the CIPD client info is a single dictionary instead of a list)
iannucci96fcccc2016-08-30 15:52:22 -07001301
1302 such that they correspond 1:1 to all input package arguments from the command
1303 line. These dictionaries make their all the way back to swarming, where they
1304 become the arguments of CipdPackage.
nodirbe642ff2016-06-09 15:51:51 -07001305
vadimsh902948e2017-01-20 15:57:32 -08001306 If 'packages' list is empty, will bootstrap CIPD client, but won't install
1307 any packages.
1308
1309 The bootstrapped client (regardless whether 'packages' list is empty or not),
vadimsh232f5a82017-01-20 19:23:44 -08001310 will be made available to the task via $PATH.
vadimsh902948e2017-01-20 15:57:32 -08001311
nodirbe642ff2016-06-09 15:51:51 -07001312 Args:
nodir90bc8dc2016-06-15 13:35:21 -07001313 run_dir (str): root of installation.
vadimsh902948e2017-01-20 15:57:32 -08001314 packages: packages to install, list [(path, package_name, version), ...].
nodirbe642ff2016-06-09 15:51:51 -07001315 service_url (str): CIPD server url, e.g.
1316 "https://chrome-infra-packages.appspot.com."
nodir90bc8dc2016-06-15 13:35:21 -07001317 client_package_name (str): CIPD package name of CIPD client.
1318 client_version (str): Version of CIPD client.
nodirbe642ff2016-06-09 15:51:51 -07001319 cache_dir (str): where to keep cache of cipd clients, packages and tags.
Takuto Ikutab7ce0e32019-11-27 23:26:18 +00001320 isolated_dir (str): where to download isolated client.
Junji Watanabe4b890ef2020-09-16 01:43:27 +00001321 cas_dir (str): where to download cas client.
nodirbe642ff2016-06-09 15:51:51 -07001322 """
1323 assert cache_dir
nodir90bc8dc2016-06-15 13:35:21 -07001324
nodirbe642ff2016-06-09 15:51:51 -07001325 start = time.time()
nodirbe642ff2016-06-09 15:51:51 -07001326
vadimsh902948e2017-01-20 15:57:32 -08001327 cache_dir = os.path.abspath(cache_dir)
vadimsh232f5a82017-01-20 19:23:44 -08001328 cipd_cache_dir = os.path.join(cache_dir, 'cache') # tag and instance caches
nodir90bc8dc2016-06-15 13:35:21 -07001329 run_dir = os.path.abspath(run_dir)
vadimsh902948e2017-01-20 15:57:32 -08001330 packages = packages or []
nodir90bc8dc2016-06-15 13:35:21 -07001331
nodirbe642ff2016-06-09 15:51:51 -07001332 get_client_start = time.time()
Junji Watanabe4b890ef2020-09-16 01:43:27 +00001333 client_manager = cipd.get_client(cache_dir, service_url, client_package_name,
1334 client_version)
iannucci96fcccc2016-08-30 15:52:22 -07001335
nodirbe642ff2016-06-09 15:51:51 -07001336 with client_manager as client:
1337 get_client_duration = time.time() - get_client_start
nodir90bc8dc2016-06-15 13:35:21 -07001338
iannuccib58d10d2017-03-18 02:00:25 -07001339 package_pins = []
1340 if packages:
Takuto Ikuta2efc7792019-11-27 14:33:34 +00001341 package_pins = _install_packages(run_dir, cipd_cache_dir, client,
1342 packages)
iannuccib58d10d2017-03-18 02:00:25 -07001343
Takuto Ikutab7ce0e32019-11-27 23:26:18 +00001344 # Install isolated client to |isolated_dir|.
Takuto Ikuta02edca22019-11-29 10:04:51 +00001345 _install_packages(isolated_dir, cipd_cache_dir, client,
Takuto Ikuta9c4eb1d2020-10-05 03:40:14 +00001346 [('', ISOLATED_PACKAGE, _LUCI_GO_REVISION)])
Takuto Ikutab7ce0e32019-11-27 23:26:18 +00001347
Junji Watanabe4b890ef2020-09-16 01:43:27 +00001348 # Install cas client to |cas_dir|.
1349 _install_packages(cas_dir, cipd_cache_dir, client,
Takuto Ikuta9c4eb1d2020-10-05 03:40:14 +00001350 [('', _CAS_PACKAGE, _LUCI_GO_REVISION)])
Junji Watanabe4b890ef2020-09-16 01:43:27 +00001351
iannuccib58d10d2017-03-18 02:00:25 -07001352 file_path.make_tree_files_read_only(run_dir)
nodir90bc8dc2016-06-15 13:35:21 -07001353
vadimsh232f5a82017-01-20 19:23:44 -08001354 total_duration = time.time() - start
Junji Watanabe38b28b02020-04-23 10:23:30 +00001355 logging.info('Installing CIPD client and packages took %d seconds',
1356 total_duration)
nodir90bc8dc2016-06-15 13:35:21 -07001357
vadimsh232f5a82017-01-20 19:23:44 -08001358 yield CipdInfo(
Junji Watanabe38b28b02020-04-23 10:23:30 +00001359 client=client,
1360 cache_dir=cipd_cache_dir,
1361 stats={
1362 'duration': total_duration,
1363 'get_client_duration': get_client_duration,
iannuccib58d10d2017-03-18 02:00:25 -07001364 },
Junji Watanabe38b28b02020-04-23 10:23:30 +00001365 pins={
1366 'client_package': {
1367 'package_name': client.package_name,
1368 'version': client.instance_id,
1369 },
1370 'packages': package_pins,
1371 })
nodirbe642ff2016-06-09 15:51:51 -07001372
1373
def create_option_parser():
  """Builds the command line option parser used by run_isolated.

  The parser gathers the general execution flags, the two data sources
  (isolate server and Content Addressed Storage), the cache, CIPD, named cache,
  process containment, debugging and authentication options.

  Returns:
    The configured logging_utils.OptionParserWithLogging instance.
  """
  parser = logging_utils.OptionParserWithLogging(
      usage='%prog <options> [command to run or extra args]',
      version=__version__,
      log_file=RUN_ISOLATED_LOG_FILE)
  parser.add_option(
      '--clean',
      action='store_true',
      help='Cleans the cache, trimming it necessary and remove corrupted items '
      'and returns without executing anything; use with -v to know what '
      'was done')
  parser.add_option(
      '--json',
      help='dump output metadata to json file. When used, run_isolated returns '
      'non-zero only on internal failure')
  parser.add_option(
      '--hard-timeout', type='float', help='Enforce hard timeout in execution')
  parser.add_option(
      '--grace-period',
      type='float',
      help='Grace period between SIGTERM and SIGKILL')
  parser.add_option(
      '--raw-cmd',
      action='store_true',
      help='Ignore the isolated command, use the one supplied at the command '
      'line')
  parser.add_option(
      '--relative-cwd',
      help='Ignore the isolated \'relative_cwd\' and use this one instead; '
      'requires --raw-cmd')
  parser.add_option(
      '--env',
      default=[],
      action='append',
      help='Environment variables to set for the child process')
  parser.add_option(
      '--env-prefix',
      default=[],
      action='append',
      help='Specify a VAR=./path/fragment to put in the environment variable '
      'before executing the command. The path fragment must be relative '
      'to the isolated run directory, and must not contain a `..` token. '
      'The path will be made absolute and prepended to the indicated '
      '$VAR using the OS\'s path separator. Multiple items for the same '
      '$VAR will be prepended in order.')
  parser.add_option(
      '--bot-file',
      help='Path to a file describing the state of the host. The content is '
      'defined by on_before_task() in bot_config.')
  parser.add_option(
      '--switch-to-account',
      help='If given, switches LUCI_CONTEXT to given logical service account '
      '(e.g. "task" or "system") before launching the isolated process.')
  parser.add_option(
      '--output',
      action='append',
      help='Specifies an output to return. If no outputs are specified, all '
      'files located in $(ISOLATED_OUTDIR) will be returned; '
      'otherwise, outputs in both $(ISOLATED_OUTDIR) and those '
      'specified by --output option (there can be multiple) will be '
      'returned. Note that if a file in OUT_DIR has the same path '
      'as an --output option, the --output version will be returned.')
  parser.add_option(
      '-a',
      '--argsfile',
      # This is actually handled in parse_args; it's included here purely so it
      # can make it into the help text.
      help='Specify a file containing a JSON array of arguments to this '
      'script. If --argsfile is provided, no other argument may be '
      'provided on the command line.')
  parser.add_option(
      '--report-on-exception',
      action='store_true',
      help='Whether report exception during execution to isolate server. '
      'This flag should only be used in swarming bot.')

  group = optparse.OptionGroup(parser, 'Data source - Isolate server')
  # Deprecated. Isolate server is being migrated to RBE-CAS.
  # Remove --isolated and isolate server options after migration.
  group.add_option(
      '-s', '--isolated',
      help='Hash of the .isolated to grab from the isolate server.')
  isolateserver.add_isolate_server_options(group)
  parser.add_option_group(group)

  group = optparse.OptionGroup(parser,
                               'Data source - Content Addressed Storage')
  group.add_option(
      '--cas-instance', help='Full CAS instance name for input/output files.')
  group.add_option(
      '--cas-digest',
      help='Digest of the input root on RBE-CAS. The format is '
      '`{hash}/{size_bytes}`.')
  parser.add_option_group(group)

  # Cache options.
  isolateserver.add_cache_options(parser)
  add_cas_cache_options(parser)

  cipd.add_cipd_options(parser)

  group = optparse.OptionGroup(parser, 'Named caches')
  group.add_option(
      '--named-cache',
      dest='named_caches',
      action='append',
      nargs=3,
      default=[],
      help='A named cache to request. Accepts 3 arguments: name, path, hint. '
      'name identifies the cache, must match regex [a-z0-9_]{1,4096}. '
      'path is a path relative to the run dir where the cache directory '
      'must be put to. '
      'This option can be specified more than once.')
  group.add_option(
      '--named-cache-root',
      default='named_caches',
      help='Cache root directory. Default=%default')
  parser.add_option_group(group)

  # The containment options are registered on the group (not directly on the
  # parser) so that they are listed under their own section in --help; parsing
  # is unaffected since grouped options share the parser's namespace.
  group = optparse.OptionGroup(parser, 'Process containment')
  group.add_option(
      '--lower-priority', action='store_true',
      help='Lowers the child process priority')
  group.add_option(
      '--containment-type',
      choices=('NONE', 'AUTO', 'JOB_OBJECT'),
      default='NONE',
      help='Type of container to use')
  group.add_option(
      '--limit-processes',
      type='int',
      default=0,
      help='Maximum number of active processes in the containment')
  group.add_option(
      '--limit-total-committed-memory',
      type='int',
      default=0,
      help='Maximum sum of committed memory in the containment')
  parser.add_option_group(group)

  group = optparse.OptionGroup(parser, 'Debugging')
  group.add_option(
      '--leak-temp-dir',
      action='store_true',
      help='Deliberately leak isolate\'s temp dir for later examination. '
      'Default: %default')
  group.add_option('--root-dir', help='Use a directory instead of a random one')
  parser.add_option_group(group)

  auth.add_auth_options(parser)

  # Overrides the default of the 'cache' destination.
  parser.set_defaults(cache='cache')
  return parser
1527
1528
def add_cas_cache_options(parser):
  """Registers the 'CAS cache management' option group on |parser|.

  The group holds a single --cas-cache option, whose default value is
  'cas-cache'.

  Args:
    parser: optparse parser to extend in place.
  """
  cas_cache_help = (
      'Directory to keep a local cache of the files. Accelerates download '
      'by reusing already downloaded files. Default=%default')
  cas_group = optparse.OptionGroup(parser, 'CAS cache management')
  cas_group.add_option(
      '--cas-cache', metavar='DIR', default='cas-cache', help=cas_cache_help)
  parser.add_option_group(cas_group)
1538
1539
def process_cas_cache_options(options):
  """Returns the content addressed cache selected by the CAS cache options.

  Args:
    options: parsed options; cas_cache, max_cache_size and min_free_space are
        read.

  Returns:
    A local_caching.DiskContentAddressedCache rooted at the absolute path of
    --cas-cache when that option is set, otherwise a
    local_caching.MemoryContentAddressedCache.
  """
  if not options.cas_cache:
    return local_caching.MemoryContentAddressedCache()

  cas_policies = local_caching.CachePolicies(
      max_cache_size=options.max_cache_size,
      min_free_space=options.min_free_space,
      # max_items isn't used for CAS cache for now.
      max_items=None,
      max_age_secs=MAX_AGE_SECS)
  cas_cache_path = six.text_type(os.path.abspath(options.cas_cache))
  return local_caching.DiskContentAddressedCache(
      cas_cache_path, cas_policies, trim=False)
1552
1553
def process_named_cache_options(parser, options, time_fn=None):
  """Checks the named cache options and builds the matching cache object.

  Every (name, path, hint) triple in options.named_caches is validated; any
  violation is reported through parser.error().

  Args:
    parser: option parser used to report invalid values.
    options: parsed options; named_caches, named_cache_root and min_free_space
        are read.
    time_fn: forwarded as is to local_caching.NamedCache.

  Returns:
    A local_caching.NamedCache when --named-cache-root is set, None otherwise.
  """
  requested = options.named_caches
  if requested and not options.named_cache_root:
    parser.error('--named-cache is specified, but --named-cache-root is empty')

  for cache_name, rel_path, size_hint in requested:
    if not CACHE_NAME_RE.match(cache_name):
      parser.error(
          'cache name %r does not match %r' %
          (cache_name, CACHE_NAME_RE.pattern))
    if not rel_path:
      parser.error('cache path cannot be empty')
    try:
      int(size_hint)
    except ValueError:
      parser.error('cache hint must be a number')

  if not options.named_cache_root:
    return None

  # Make these configurable later if there is use case but for now it's fairly
  # safe values.
  # In practice, a fair chunk of bots are already recycled on a daily schedule
  # so this code doesn't have any effect to them, unless they are preloaded
  # with a really old cache.
  one_tib = 1024 * 1024 * 1024 * 1024
  named_policies = local_caching.CachePolicies(
      max_cache_size=one_tib,
      min_free_space=options.min_free_space,
      max_items=50,
      max_age_secs=MAX_AGE_SECS)
  abs_root = six.text_type(os.path.abspath(options.named_cache_root))
  named = local_caching.NamedCache(abs_root, named_policies, time_fn=time_fn)
  # Touch any named caches we're going to use to minimize thrashing
  # between tasks that request some (but not all) of the same named caches.
  named.touch(*[entry[0] for entry in requested])
  return named
1587
1588
def parse_args(args):
  """Parses the command line, honoring the exclusive --argsfile option.

  When -a/--argsfile is given, the arguments are loaded from that file as JSON
  and replace |args|; no other argument may be present on the command line.

  Args:
    args: list of command line arguments, without the program name.

  Returns:
    Tuple (parser, options, args): the parser built by create_option_parser()
    and the two values returned by its parse_args().
  """
  # Create a fake mini-parser just to get out the "-a" command. Note that
  # it's not documented here; instead, it's documented in create_option_parser
  # even though that parser will never actually get to parse it. This is
  # because --argsfile is exclusive with all other options and arguments.
  file_argparse = argparse.ArgumentParser(add_help=False)
  file_argparse.add_argument('-a', '--argsfile')
  (file_args, nonfile_args) = file_argparse.parse_known_args(args)
  if file_args.argsfile:
    if nonfile_args:
      # The trailing space matters: the two literals are concatenated.
      file_argparse.error('Can\'t specify --argsfile with '
                          'any other arguments (%s)' % nonfile_args)
    try:
      with open(file_args.argsfile, 'r') as f:
        args = json.load(f)
    except (IOError, OSError, ValueError) as e:
      # We don't need to error out here: "args" is left untouched and is
      # handed to the normal parser below, which reports whatever is still
      # wrong with it.
      print('Couldn\'t read arguments: %s' % e, file=sys.stderr)

  # Even if we failed to read the args, just call the normal parser now since it
  # will print the correct help message.
  parser = create_option_parser()
  options, args = parser.parse_args(args)
  # Normalize a textual --cipd-enabled value (e.g. 'true') into a 0/1 flag.
  if not isinstance(options.cipd_enabled, (bool, int)):
    options.cipd_enabled = distutils.util.strtobool(options.cipd_enabled)
  return (parser, options, args)
1617
1618
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001619def _calc_named_cache_hint(named_cache, named_caches):
1620 """Returns the expected size of the missing named caches."""
1621 present = named_cache.available
1622 size = 0
1623 for name, _, hint in named_caches:
1624 if name not in present:
Takuto Ikuta630f99d2020-07-02 12:59:35 +00001625 hint = int(hint)
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001626 if hint > 0:
1627 size += hint
1628 return size
1629
1630
def main(args):
  """Parses |args|, prepares the local caches and runs the requested task.

  With --clean, the caches are trimmed and cleaned up and nothing is executed.
  Otherwise the options are validated, a TaskData is assembled and handed to
  run_tha_test().

  Args:
    args: list of command line arguments, without the program name.

  Returns:
    The process exit code: 0 after --clean, 1 when a cipd.Error,
    local_caching.NamedCacheError or local_caching.NoMoreSpace is caught,
    otherwise the value returned by run_tha_test().
  """
  # Warning: when --argsfile is used, the strings are unicode instances, when
  # parsed normally, the strings are str instances.
  (parser, options, args) = parse_args(args)

  if options.report_on_exception and options.isolate_server:
    on_error.report_on_exception_exit(options.isolate_server)

  if not file_path.enable_symlink():
    logging.warning('Symlink support is not enabled')

  named_cache = process_named_cache_options(parser, options)
  # hint is 0 if there's no named cache.
  hint = _calc_named_cache_hint(named_cache, options.named_caches)
  if hint:
    # Increase the --min-free-space value by the hint, and recreate the
    # NamedCache instance so it gets the updated CachePolicy.
    options.min_free_space += hint
    named_cache = process_named_cache_options(parser, options)

  # TODO(crbug.com/932396): Remove this.
  use_go_isolated = options.cipd_enabled

  # TODO(maruel): CIPD caches should be defined at an higher level here too, so
  # they can be cleaned the same way.

  isolate_cache = isolateserver.process_cache_options(options, trim=False)
  cas_cache = process_cas_cache_options(options)

  caches = []
  if isolate_cache:
    caches.append(isolate_cache)
  if cas_cache:
    caches.append(cas_cache)
  if named_cache:
    caches.append(named_cache)
  # Directory whose free space is monitored while trimming.
  root = caches[0].cache_dir if caches else six.text_type(os.getcwd())
  if options.clean:
    if options.isolated:
      parser.error('Can\'t use --isolated with --clean.')
    if options.isolate_server:
      parser.error('Can\'t use --isolate-server with --clean.')
    if options.json:
      parser.error('Can\'t use --json with --clean.')
    if options.named_caches:
      parser.error('Can\'t use --named-cache with --clean.')
    if options.cas_instance or options.cas_digest:
      parser.error('Can\'t use --cas-instance, --cas-digest with --clean.')

    logging.info("initial free space: %d", file_path.get_free_space(root))
    # Trim first, then clean.
    local_caching.trim_caches(
        caches,
        root,
        min_free_space=options.min_free_space,
        max_age_secs=MAX_AGE_SECS)
    logging.info("free space after trim: %d", file_path.get_free_space(root))
    for c in caches:
      c.cleanup()
    logging.info("free space after cleanup: %d", file_path.get_free_space(root))
    return 0

  # Trim must still be done for the following case:
  # - named-cache was used
  # - some entries, with a large hint, where missing
  # - --min-free-space was increased accordingly, thus trimming is needed
  # Otherwise, this will have no effect, as bot_main calls run_isolated with
  # --clean after each task.
  local_caching.trim_caches(
      caches,
      root,
      # Add 1GB more buffer for Go CLI.
      min_free_space=options.min_free_space + _FREE_SPACE_BUFFER_FOR_GO,
      max_age_secs=MAX_AGE_SECS)

  # Save state of isolate/cas cache not to overwrite state from go client.
  if use_go_isolated:
    isolate_cache.save()
    isolate_cache = None
  if cas_cache:
    cas_cache.save()
    cas_cache = None

  if not options.isolated and not args:
    parser.error('--isolated or command to run is required.')

  auth.process_auth_options(parser, options)

  isolateserver.process_isolate_server_options(parser, options, False)
  if ISOLATED_OUTDIR_PARAMETER in args and (not options.isolate_server and
                                            not options.cas_instance):
    parser.error('%s in args requires --isolate-server or --cas-instance' %
                 ISOLATED_OUTDIR_PARAMETER)

  if options.isolated and not options.isolate_server:
    parser.error('--isolated requires --isolate-server')

  if options.root_dir:
    options.root_dir = six.text_type(os.path.abspath(options.root_dir))
  else:
    options.root_dir = six.text_type(tempfile.mkdtemp(prefix='root'))
  if options.json:
    options.json = six.text_type(os.path.abspath(options.json))

  if any('=' not in i for i in options.env):
    parser.error(
        '--env required key=value form. value can be skipped to delete '
        'the variable')
  options.env = dict(i.split('=', 1) for i in options.env)

  # Maps each variable name to the ordered list of relative paths to prepend.
  prefixes = {}
  cwd = os.path.realpath(os.getcwd())
  for item in options.env_prefix:
    if '=' not in item:
      parser.error(
          '--env-prefix %r is malformed, must be in the form `VAR=./path`'
          % item)
    key, opath = item.split('=', 1)
    if os.path.isabs(opath):
      parser.error('--env-prefix %r path is bad, must be relative.' % opath)
    opath = os.path.normpath(opath)
    if not os.path.realpath(os.path.join(cwd, opath)).startswith(cwd):
      parser.error(
          '--env-prefix %r path is bad, must be relative and not contain `..`.'
          % opath)
    prefixes.setdefault(key, []).append(opath)
  options.env_prefix = prefixes

  cipd.validate_cipd_options(parser, options)

  install_packages_fn = noop_install_packages
  # Only set when a throw-away CIPD cache directory had to be created; it is
  # removed in the 'finally' clause at the end of this function.
  tmp_cipd_cache_dir = None
  if options.cipd_enabled:
    cache_dir = options.cipd_cache
    if not cache_dir:
      tmp_cipd_cache_dir = six.text_type(tempfile.mkdtemp())
      cache_dir = tmp_cipd_cache_dir
    install_packages_fn = (
        lambda run_dir, isolated_dir, cas_dir: install_client_and_packages(
            run_dir,
            cipd.parse_package_args(options.cipd_packages),
            options.cipd_server,
            options.cipd_client_package,
            options.cipd_client_version,
            cache_dir=cache_dir,
            isolated_dir=isolated_dir,
            cas_dir=cas_dir,
        ))

  @contextlib.contextmanager
  def install_named_caches(run_dir):
    # WARNING: this function depends on "options" variable defined in the outer
    # function.
    assert six.text_type(run_dir), repr(run_dir)
    assert os.path.isabs(run_dir), run_dir
    named_caches = [(os.path.join(run_dir, six.text_type(relpath)), name)
                    for name, relpath, _ in options.named_caches]
    for path, name in named_caches:
      named_cache.install(path, name)
    try:
      yield
    finally:
      # Uninstall each named cache, returning it to the cache pool. If an
      # uninstall fails for a given cache, it will remain in the task's
      # temporary space, get cleaned up by the Swarming bot, and be lost.
      #
      # If the Swarming bot cannot clean up the cache, it will handle it like
      # any other bot file that could not be removed.
      for path, name in reversed(named_caches):
        try:
          # uninstall() doesn't trim but does call save() implicitly. Trimming
          # *must* be done manually via periodic 'run_isolated.py --clean'.
          named_cache.uninstall(path, name)
        except local_caching.NamedCacheError:
          # The message reads "named cache <name> at <path>".
          logging.exception('Error while removing named cache %r at %r. '
                            'The cache will be lost.', name, path)

  command = args
  if options.relative_cwd:
    a = os.path.normpath(os.path.abspath(options.relative_cwd))
    if not a.startswith(os.getcwd()):
      parser.error(
          '--relative-cwd must not try to escape the working directory')

  containment_type = subprocess42.Containment.NONE
  if options.containment_type == 'AUTO':
    containment_type = subprocess42.Containment.AUTO
  if options.containment_type == 'JOB_OBJECT':
    containment_type = subprocess42.Containment.JOB_OBJECT
  containment = subprocess42.Containment(
      containment_type=containment_type,
      limit_processes=options.limit_processes,
      limit_total_committed_memory=options.limit_total_committed_memory)

  data = TaskData(
      command=command,
      relative_cwd=options.relative_cwd,
      isolated_hash=options.isolated,
      storage=None,
      isolate_cache=isolate_cache,
      cas_instance=options.cas_instance,
      cas_digest=options.cas_digest,
      outputs=options.output,
      install_named_caches=install_named_caches,
      leak_temp_dir=options.leak_temp_dir,
      root_dir=_to_unicode(options.root_dir),
      hard_timeout=options.hard_timeout,
      grace_period=options.grace_period,
      bot_file=options.bot_file,
      switch_to_account=options.switch_to_account,
      install_packages_fn=install_packages_fn,
      use_go_isolated=use_go_isolated,
      go_cache_dir=options.cache,
      go_cache_policies=local_caching.CachePolicies(
          max_cache_size=options.max_cache_size,
          min_free_space=options.min_free_space,
          max_items=options.max_items,
          max_age_secs=None,
      ),
      cas_cache_dir=options.cas_cache,
      cas_cache_policies=local_caching.CachePolicies(
          max_cache_size=options.max_cache_size,
          min_free_space=options.min_free_space,
          max_items=None,
          max_age_secs=None,
      ),
      env=options.env,
      env_prefix=options.env_prefix,
      lower_priority=bool(options.lower_priority),
      containment=containment)
  try:
    if options.isolate_server:
      server_ref = isolate_storage.ServerRef(
          options.isolate_server, options.namespace)
      storage = isolateserver.get_storage(server_ref)
      with storage:
        data = data._replace(storage=storage)
        # Hashing schemes used by |storage| and |isolate_cache| MUST match.
        assert storage.server_ref.hash_algo == server_ref.hash_algo
        return run_tha_test(data, options.json)
    return run_tha_test(data, options.json)
  except (cipd.Error, local_caching.NamedCacheError,
          local_caching.NoMoreSpace) as ex:
    # Exceptions only carry a 'message' attribute on Python 3 when the class
    # defines one itself; fall back to str() so that reporting the error
    # cannot raise AttributeError.
    print(getattr(ex, 'message', None) or str(ex), file=sys.stderr)
    return 1
  finally:
    if tmp_cipd_cache_dir is not None:
      try:
        file_path.rmtree(tmp_cipd_cache_dir)
      except OSError:
        logging.exception('Remove tmp_cipd_cache_dir=%s failed',
                          tmp_cipd_cache_dir)
        # Best effort clean up. Failed to do so doesn't affect the outcome.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001884
1885
if __name__ == '__main__':
  # Script entry point: set up the process, then exit with main()'s result.
  subprocess42.inhibit_os_error_reporting()
  # Ensure that we are always running with the correct encoding.
  fix_encoding.fix_encoding()
  net.set_user_agent('run_isolated.py/' + __version__)
  exit_code = main(sys.argv[1:])
  sys.exit(exit_code)
Marc-Antoine Ruel90c98162013-12-18 15:11:57 -05001891 sys.exit(main(sys.argv[1:]))