blob: 583daf24447ce4c5dbd85ba7f08b06cb636dcffe [file] [log] [blame]
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001#!/usr/bin/env python
maruelea586f32016-04-05 11:11:33 -07002# Copyright 2012 The LUCI Authors. All rights reserved.
maruelf1f5e2a2016-05-25 17:10:39 -07003# Use of this source code is governed under the Apache License, Version 2.0
4# that can be found in the LICENSE file.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00005
nodir55be77b2016-05-03 09:39:57 -07006"""Runs a command with optional isolated input/output.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00007
run_isolated takes care of setting up a temporary environment, running a
9command, and tearing it down.
nodir55be77b2016-05-03 09:39:57 -070010
Marc-Antoine Rueleed2f3a2019-03-14 00:00:40 +000011It handles downloading and uploading isolated files, mapping CIPD packages and
12reusing stateful named caches.
13
14The isolated files, CIPD packages and named caches are kept as a global LRU
15cache.
Marc-Antoine Ruel2283ad12014-02-09 11:14:57 -050016
Roberto Carrillo71ade6d2018-10-08 22:30:24 +000017Any ${EXECUTABLE_SUFFIX} on the command line or the environment variables passed
18with the --env option will be replaced with ".exe" string on Windows and "" on
19other platforms.
nodirbe642ff2016-06-09 15:51:51 -070020
Roberto Carrillo71ade6d2018-10-08 22:30:24 +000021Any ${ISOLATED_OUTDIR} on the command line or the environment variables passed
22with the --env option will be replaced by the location of a temporary directory
23upon execution of the command specified in the .isolated file. All content
24written to this directory will be uploaded upon termination and the .isolated
25file describing this directory will be printed to stdout.
bpastene447c1992016-06-20 15:21:47 -070026
Marc-Antoine Rueleed2f3a2019-03-14 00:00:40 +000027Any ${SWARMING_BOT_FILE} on the command line or the environment variables passed
28with the --env option will be replaced by the value of the --bot-file parameter.
29This file is used by a swarming bot to communicate state of the host to tasks.
30It is written to by the swarming bot's on_before_task() hook in the swarming
31server's custom bot_config.py.
32
33See
34https://chromium.googlesource.com/infra/luci/luci-py.git/+/master/appengine/swarming/doc/Magic-Values.md
35for all the variables.
36
37See
38https://chromium.googlesource.com/infra/luci/luci-py.git/+/master/appengine/swarming/swarming_bot/config/bot_config.py
39for more information about bot_config.py.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000040"""
41
Marc-Antoine Ruelf899c482019-10-10 23:32:06 +000042from __future__ import print_function
43
44__version__ = '1.0.1'
maruel@chromium.orgdedbf492013-09-12 20:42:11 +000045
aludwin7556e0c2016-10-26 08:46:10 -070046import argparse
maruel064c0a32016-04-05 11:47:15 -070047import base64
iannucci96fcccc2016-08-30 15:52:22 -070048import collections
vadimsh232f5a82017-01-20 19:23:44 -080049import contextlib
Ye Kuangfff1e502020-07-13 13:21:57 +000050import distutils
Sadaf Matinkhoo10743a62018-03-29 16:28:58 -040051import errno
aludwin7556e0c2016-10-26 08:46:10 -070052import json
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000053import logging
54import optparse
55import os
Takuto Ikuta5c59a842020-01-24 03:05:24 +000056import platform
Marc-Antoine Ruel8b11dbd2018-05-18 14:31:22 -040057import re
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000058import sys
59import tempfile
maruel064c0a32016-04-05 11:47:15 -070060import time
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000061
Marc-Antoine Ruel016c7602019-04-02 18:31:13 +000062from utils import tools
63tools.force_local_third_party()
vadimsh@chromium.orga4326472013-08-24 02:05:41 +000064
Marc-Antoine Ruel016c7602019-04-02 18:31:13 +000065# third_party/
66from depot_tools import fix_encoding
Takuto Ikuta6e2ff962019-10-29 12:35:27 +000067import six
Marc-Antoine Ruel016c7602019-04-02 18:31:13 +000068
69# pylint: disable=ungrouped-imports
70import auth
71import cipd
72import isolate_storage
73import isolateserver
74import local_caching
75from libs import luci_context
Vadim Shtayura6b555c12014-07-23 16:22:18 -070076from utils import file_path
maruel12e30012015-10-09 11:55:35 -070077from utils import fs
maruel064c0a32016-04-05 11:47:15 -070078from utils import large
Marc-Antoine Ruelf74cffe2015-07-15 15:21:34 -040079from utils import logging_utils
Ye Kuang2dd17442020-04-22 08:45:52 +000080from utils import net
Marc-Antoine Ruelcfb60852014-07-02 15:22:00 -040081from utils import on_error
Marc-Antoine Ruelc44f5722015-01-08 16:10:01 -050082from utils import subprocess42
maruel@chromium.orgdedbf492013-09-12 20:42:11 +000083
vadimsh@chromium.orga4326472013-08-24 02:05:41 +000084
# Magic variables that can be found in the isolate task command line.
# replace_parameters() substitutes these tokens in command arguments and in
# environment variable values.
ISOLATED_OUTDIR_PARAMETER = '${ISOLATED_OUTDIR}'
EXECUTABLE_SUFFIX_PARAMETER = '${EXECUTABLE_SUFFIX}'
SWARMING_BOT_FILE_PARAMETER = '${SWARMING_BOT_FILE}'


# The name of the log file to use.
RUN_ISOLATED_LOG_FILE = 'run_isolated.log'


# The name of the log to use for the run_test_cases.py command
RUN_TEST_CASES_LOG = 'run_test_cases.log'


# Use short names for temporary directories. This is driven by Windows, which
# imposes a relatively short maximum path length of 260 characters, often
# referred to as MAX_PATH. It is relatively easy to create files with longer
# path length. A use case is with recursive dependency trees like npm packages.
#
# It is recommended to start the script with a `root_dir` as short as
# possible.
# - ir stands for isolated_run
# - io stands for isolated_out
# - it stands for isolated_tmp
# - ic stands for isolated_client
# - cc presumably stands for cas_client (not stated in the original comment)
ISOLATED_RUN_DIR = u'ir'
ISOLATED_OUT_DIR = u'io'
ISOLATED_TMP_DIR = u'it'
ISOLATED_CLIENT_DIR = u'ic'
_CAS_CLIENT_DIR = u'cc'

# TODO(tikuta): take these parameters from luci-config?
# Update tag by `./client/update_go_clients.sh`.
# Or take revision from
# https://ci.chromium.org/p/infra-internal/g/infra-packagers/console
ISOLATED_PACKAGE = 'infra/tools/luci/isolated/${platform}'
_CAS_PACKAGE = 'infra/tools/luci/cas/${platform}'
_LUCI_GO_REVISION = 'git_revision:3b0580790418214279a001a9620f28db765edadd'

# Valid named cache names: 1 to 4096 characters from [a-z0-9_].
# Keep synced with task_request.py
CACHE_NAME_RE = re.compile(r'^[a-z0-9_]{1,4096}$')

# 1024**3; presumably a byte count (1 GiB) -- its use is not visible in this
# part of the file.
_FREE_SPACE_BUFFER_FOR_GO = 1024 * 1024 * 1024
Marc-Antoine Ruel8b11dbd2018-05-18 14:31:22 -0400128
# Message template with two '%s' placeholders, in order: the directory that
# could not be deleted, then the number of seconds given to comply after the
# signal was sent.
OUTLIVING_ZOMBIE_MSG = """\
*** Swarming tried multiple times to delete the %s directory and failed ***
*** Hard failing the task ***

Swarming detected that your testing script ran an executable, which may have
started a child executable, and the main script returned early, leaving the
children executables playing around unguided.

You don't want to leave children processes outliving the task on the Swarming
bot, do you? The Swarming bot doesn't.

How to fix?
- For any process that starts children processes, make sure all children
 processes terminated properly before each parent process exits. This is
 especially important in very deep process trees.
 - This must be done properly both in normal successful task and in case of
 task failure. Cleanup is very important.
- The Swarming bot sends a SIGTERM in case of timeout.
 - You have %s seconds to comply after the signal was sent to the process
 before the process is forcibly killed.
- To achieve not leaking children processes in case of signals on timeout, you
 MUST handle signals in each executable / python script and propagate them to
 children processes.
 - When your test script (python or binary) receives a signal like SIGTERM or
 CTRL_BREAK_EVENT on Windows), send it to all children processes and wait for
 them to terminate before quitting.

See
https://chromium.googlesource.com/infra/luci/luci-py.git/+/master/appengine/swarming/doc/Bot.md#Graceful-termination_aka-the-SIGTERM-and-SIGKILL-dance
for more information.

*** May the SIGKILL force be with you ***
"""
162
163
# Currently hardcoded. Eventually could be exposed as a flag once there's value.
# 3 weeks, expressed in seconds.
MAX_AGE_SECS = 21*24*60*60

# TODO(1099655): Enable this once all prod issues are gone.
_USE_GO_ISOLATED_TO_UPLOAD = False

_CAS_KVS_CACHE_THRESHOLD = 5 * 1024 * 1024 * 1024 # 5 GiB
172
# Immutable bundle of everything needed to map and run one task.
TaskData = collections.namedtuple(
    'TaskData',
    (
        # Command line to run, as a list of strings. Used regardless of what
        # the isolated file itself specifies.
        'command',
        # Directory, relative, in which the command is started.
        'relative_cwd',
        # Hash of the .isolated file to retrieve in order to recreate the
        # tree of files for the target executable. The command specified in
        # the .isolated is executed. Mutually exclusive with the command
        # argument.
        'isolated_hash',
        # isolateserver.Storage instance used to retrieve remote objects. It
        # references an isolateserver.StorageApi, which does the actual I/O.
        'storage',
        # isolateserver.LocalCache instance that caches retrieved objects so
        # they are not fetched over and over. Can be on-disk or in-memory.
        'isolate_cache',
        # Digest of the input root on RBE-CAS.
        'cas_digest',
        # Full CAS instance name.
        'cas_instance',
        # Paths, relative to root_dir, to put into the output isolated bundle
        # once the task completes (see link_outputs_to_outdir).
        'outputs',
        # Function (run_dir) => context manager installing named caches into
        # |run_dir|.
        'install_named_caches',
        # When True, the temporary directory is deliberately leaked so it can
        # be examined later.
        'leak_temp_dir',
        # Directory in which the temporary directory is created. When not
        # specified, a random temporary directory is created.
        'root_dir',
        # The process is killed if it lasts longer than this many seconds.
        'hard_timeout',
        # Seconds to wait between SIGTERM and SIGKILL.
        'grace_period',
        # Path to a file with bot state; replaces the ${SWARMING_BOT_FILE}
        # task command line argument.
        'bot_file',
        # Logical account to switch LUCI_CONTEXT into.
        'switch_to_account',
        # Context manager dir => CipdInfo, see install_client_and_packages.
        'install_packages_fn',
        # Whether to use the go isolated client.
        'use_go_isolated',
        # Cache directory for the go `isolated` client.
        'go_cache_dir',
        # Parameters passed to the go `isolated` client.
        'go_cache_policies',
        # Cache directory for the `cas` client.
        'cas_cache_dir',
        # Parameters passed to the `cas` client.
        'cas_cache_policies',
        # Parameters for the kvs file used by the `cas` client.
        'cas_kvs',
        # Environment variables to set.
        'env',
        # Environment variables to mutate with relative directories.
        # Example: {"ENV_KEY": ['relative', 'paths', 'to', 'prepend']}
        'env_prefix',
        # Lowers the task process priority.
        'lower_priority',
        # subprocess42.Containment instance. Can be None.
        'containment',
    ))
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -0500242
243
Marc-Antoine Ruelee6ca622017-11-29 11:19:16 -0500244def _to_str(s):
245 """Downgrades a unicode instance to str. Pass str through as-is."""
246 if isinstance(s, str):
247 return s
248 # This is technically incorrect, especially on Windows. In theory
249 # sys.getfilesystemencoding() should be used to use the right 'ANSI code
250 # page' on Windows, but that causes other problems, as the character set
251 # is very limited.
252 return s.encode('utf-8')
253
254
def _to_unicode(s):
  """Returns |s| as text, decoding it from UTF-8 when it is not text already.

  None and text instances are handed back untouched.
  """
  must_decode = s is not None and not isinstance(s, six.text_type)
  return s.decode('utf-8') if must_decode else s
260
261
def make_temp_dir(prefix, root_dir):
  """Creates a fresh, uniquely named directory under |root_dir|.

  Returns:
    The path of the new directory as a text string.
  """
  created = tempfile.mkdtemp(dir=root_dir, prefix=prefix)
  return six.text_type(created)
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +0000265
266
@contextlib.contextmanager
def set_luci_context_account(account, tmp_dir):
  """Context manager making |account| the default LUCI_CONTEXT account.

  Nothing is changed in any of these situations:
  - |account| is None or ''. This is the case when run_isolated.py is called
    without '--switch-to-account'; the task simply inherits whatever account
    the surrounding LUCI_CONTEXT already has, e.g. when users invoke
    run_isolated.py explicitly from their code.
  - LUCI_CONTEXT-based auth is not in use.
  - |account| is already the default account.

  When |account| is not among the accounts defined in the context, the default
  account is removed, i.e. access becomes non-authenticated. This is what
  happens for Swarming tasks that don't use 'task' service accounts.
  """
  # 'local_auth' is only looked up when a switch was actually requested.
  local_auth = luci_context.read('local_auth') if account else None

  # See LUCI_CONTEXT.md for the format of 'local_auth'.
  if not local_auth or local_auth.get('default_account_id') == account:
    # Not switching, not using LUCI_CONTEXT auth, or already set.
    yield
    return

  known_ids = set()
  for entry in local_auth.get('accounts') or []:
    known_ids.add(entry['id'])

  if account not in known_ids:
    logging.warning(
        'Requested LUCI_CONTEXT account %r is not available (have only %r), '
        'disabling authentication', account, sorted(known_ids))
    local_auth.pop('default_account_id', None)
  else:
    logging.info('Switching default LUCI_CONTEXT account to %r', account)
    local_auth['default_account_id'] = account

  with luci_context.write(_tmpdir=tmp_dir, local_auth=local_auth):
    yield
313
314
def process_command(command, out_dir, bot_file):
  """Substitutes the magic parameters in every argument of |command|.

  Returns:
    A new list with one processed argument per entry of |command|.

  Raises:
    ValueError if a parameter is requested in |command| but its value is not
    provided.
  """
  processed = []
  for arg in command:
    processed.append(replace_parameters(arg, out_dir, bot_file))
  return processed
323
324
def replace_parameters(arg, out_dir, bot_file):
  """Expands the magic parameter tokens found in a single string.

  Handles EXECUTABLE_SUFFIX_PARAMETER, ISOLATED_OUTDIR_PARAMETER and
  SWARMING_BOT_FILE_PARAMETER. A bot file token is left as-is, with a warning,
  when |bot_file| is not provided.

  Raises:
    ValueError if the output directory is requested in |arg| but |out_dir| is
    not provided.
  """
  result = arg.replace(EXECUTABLE_SUFFIX_PARAMETER, cipd.EXECUTABLE_SUFFIX)
  path_substituted = False

  if ISOLATED_OUTDIR_PARAMETER in result:
    if not out_dir:
      raise ValueError(
          'output directory is requested in command or env var, but not '
          'provided; please specify one')
    result = result.replace(ISOLATED_OUTDIR_PARAMETER, out_dir)
    path_substituted = True

  if SWARMING_BOT_FILE_PARAMETER in result:
    if not bot_file:
      logging.warning('SWARMING_BOT_FILE_PARAMETER found in command or env '
                      'var, but no bot_file specified. Leaving parameter '
                      'unchanged.')
    else:
      result = result.replace(SWARMING_BOT_FILE_PARAMETER, bot_file)
      path_substituted = True

  if not path_substituted:
    return result
  # Slashes are converted only when a path parameter was expanded, because of
  # arguments like '${ISOLATED_OUTDIR}/foo/bar'.
  return result.replace('/', os.sep)
maruela9cfd6f2015-09-15 11:03:15 -0700354
355
Roberto Carrillo71ade6d2018-10-08 22:30:24 +0000356
def get_command_env(tmp_dir, cipd_info, run_dir, env, env_prefixes, out_dir,
                    bot_file):
  """Returns full OS environment to run a command in.

  Sets up TEMP, puts directory with cipd binary in front of PATH, exposes
  CIPD_CACHE_DIR env var, and installs all env_prefixes.

  Args:
    tmp_dir: temp directory.
    cipd_info: CipdInfo object if cipd client is used, None if not.
    run_dir: The root directory the isolated tree is mapped in.
    env: environment variables to use. A variable with an empty value is
        removed from the resulting environment.
    env_prefixes: {"ENV_KEY": ['relative', 'paths', 'to', 'prepend']}. Each
        path is joined onto run_dir and normalized before being prepended.
    out_dir: Isolated output directory. Required to be != None if any of the
        env vars contain ISOLATED_OUTDIR_PARAMETER.
    bot_file: Required to be != None if any of the env vars contain
        SWARMING_BOT_FILE_PARAMETER.

  Returns:
    dict of environment variables, based on a copy of os.environ.

  Raises:
    ValueError if an env var requests the output directory but out_dir is not
    provided (see replace_parameters).
  """
  out = os.environ.copy()
  for k, v in env.items():
    if not v:
      out.pop(k, None)
    else:
      out[k] = replace_parameters(v, out_dir, bot_file)

  if cipd_info:
    bin_dir = _to_str(os.path.dirname(cipd_info.client.binary_path))
    # PATH can be missing here, e.g. when the caller removed it by passing an
    # empty value in |env|. In that case use the cipd directory alone instead
    # of failing with KeyError; do not leave a dangling separator, since an
    # empty PATH element designates the current directory on POSIX.
    cur_path = out.get('PATH')
    if cur_path:
      out['PATH'] = '%s%s%s' % (bin_dir, os.pathsep, cur_path)
    else:
      out['PATH'] = bin_dir
    out['CIPD_CACHE_DIR'] = _to_str(cipd_info.cache_dir)

  for key, paths in env_prefixes.items():
    assert isinstance(paths, list), paths
    paths = [os.path.normpath(os.path.join(run_dir, p)) for p in paths]
    cur = out.get(key)
    if cur:
      # Keep the pre-existing value, after the prepended paths.
      paths.append(cur)
    out[key] = _to_str(os.path.pathsep.join(paths))

  tmp_dir = _to_str(tmp_dir)
  # pylint: disable=line-too-long
  # * python respects $TMPDIR, $TEMP, and $TMP in this order, regardless of
  #   platform. So $TMPDIR must be set on all platforms.
  #   https://github.com/python/cpython/blob/2.7/Lib/tempfile.py#L155
  out['TMPDIR'] = tmp_dir
  if sys.platform == 'win32':
    # * chromium's base utils uses GetTempPath().
    #    https://cs.chromium.org/chromium/src/base/files/file_util_win.cc?q=GetTempPath
    # * Go uses GetTempPath().
    # * GetTempPath() uses %TMP%, then %TEMP%, then other stuff. So %TMP% must
    #   be set.
    #   https://docs.microsoft.com/en-us/windows/desktop/api/fileapi/nf-fileapi-gettemppathw
    out['TMP'] = tmp_dir
    # https://blogs.msdn.microsoft.com/oldnewthing/20150417-00/?p=44213
    out['TEMP'] = tmp_dir
  elif sys.platform == 'darwin':
    # * Chromium uses an hack on macOS before calling into
    #   NSTemporaryDirectory().
    #   https://cs.chromium.org/chromium/src/base/files/file_util_mac.mm?q=GetTempDir
    #   https://developer.apple.com/documentation/foundation/1409211-nstemporarydirectory
    out['MAC_CHROMIUM_TMPDIR'] = tmp_dir
  else:
    # TMPDIR is specified as the POSIX standard envvar for the temp directory.
    #   http://pubs.opengroup.org/onlinepubs/9699919799/basedefs/V1_chap08.html
    # * mktemp on linux respects $TMPDIR.
    # * Chromium respects $TMPDIR on linux.
    #   https://cs.chromium.org/chromium/src/base/files/file_util_posix.cc?q=GetTempDir
    # * Go uses $TMPDIR.
    #   https://go.googlesource.com/go/+/go1.10.3/src/os/file_unix.go#307
    pass
  return out
vadimsh232f5a82017-01-20 19:23:44 -0800427
428
def run_command(
    command, cwd, env, hard_timeout, grace_period, lower_priority, containment):
  """Runs the command and waits for it, enforcing the hard timeout.

  The sequence is: wait up to |hard_timeout|; on timeout or on a stop signal,
  terminate the process; wait up to |grace_period| while ignoring further stop
  signals; then kill it.

  Args:
    command: command line handed to subprocess42.Popen.
    cwd: working directory of the child process.
    env: environment of the child process.
    hard_timeout: seconds to wait before terminating the process. A falsy
        value means waiting without a timeout.
    grace_period: seconds to wait after terminating the process before
        killing it. A falsy value means waiting without a timeout.
    lower_priority: forwarded to subprocess42.Popen.
    containment: forwarded to subprocess42.Popen.

  Returns:
    tuple(process exit code, bool if had a hard timeout)

    The exit code is 1 when starting or handling the process raised OSError;
    a diagnostic is then written to stderr.
  """
  logging.info(
      'run_command(%s, %s, %s, %s, %s, %s)',
      command, cwd, hard_timeout, grace_period, lower_priority, containment)

  exit_code = None
  had_hard_timeout = False
  with tools.Profiler('RunTest'):
    proc = None
    # A list so that handler() can record the signal without rebinding a name.
    had_signal = []
    try:
      # TODO(maruel): This code is imperfect. It doesn't handle well signals
      # during the download phase and there's short windows were things can go
      # wrong.
      def handler(signum, _frame):
        # Only the first signal received once the process exists is turned
        # into a TimeoutExpired, which interrupts the wait below.
        if proc and not had_signal:
          logging.info('Received signal %d', signum)
          had_signal.append(True)
          raise subprocess42.TimeoutExpired(command, None)

      proc = subprocess42.Popen(
          command, cwd=cwd, env=env, detached=True, close_fds=True,
          lower_priority=lower_priority, containment=containment)
      with subprocess42.set_signal_handler(subprocess42.STOP_SIGNALS, handler):
        try:
          exit_code = proc.wait(hard_timeout or None)
        except subprocess42.TimeoutExpired:
          # Raised either by the wait timing out or by handler(); only the
          # former counts as a hard timeout.
          if not had_signal:
            logging.warning('Hard timeout')
            had_hard_timeout = True
          logging.warning('Sending SIGTERM')
          proc.terminate()

      kill_sent = False
      # Ignore signals in grace period. Forcibly give the grace period to the
      # child process.
      if exit_code is None:
        ignore = lambda *_: None
        with subprocess42.set_signal_handler(subprocess42.STOP_SIGNALS, ignore):
          try:
            exit_code = proc.wait(grace_period or None)
          except subprocess42.TimeoutExpired:
            # Now kill for real. The user can distinguish between the
            # following states:
            # - signal but process exited within grace period,
            #   hard_timed_out will be set but the process exit code will be
            #   script provided.
            # - processed exited late, exit code will be -9 on posix.
            logging.warning('Grace exhausted; sending SIGKILL')
            proc.kill()
            kill_sent = True
        logging.info('Waiting for process exit')
        exit_code = proc.wait()

      # the process group / job object may be dangling so if we didn't kill
      # it already, give it a poke now.
      if not kill_sent:
        proc.kill()
    except OSError as e:
      # This is not considered to be an internal error. The executable simply
      # does not exist.
      sys.stderr.write(
          '<The executable does not exist, a dependent library is missing or '
          'the command line is too long>\n'
          '<Check for missing .so/.dll in the .isolate or GN file or length of '
          'command line args>\n'
          '<Command: %s, Exception: %s>\n' % (command, e))
      if os.environ.get('SWARMING_TASK_ID'):
        # Give an additional hint when running as a swarming task.
        sys.stderr.write(
            '<See the task\'s page for commands to help diagnose this issue '
            'by reproducing the task locally>\n')
      exit_code = 1
  # The mask shows a negative exit code as an unsigned 32-bit hex value.
  logging.info(
      'Command finished with exit code %d (%s)',
      exit_code, hex(0xffffffff & exit_code))
  return exit_code, had_hard_timeout
maruela9cfd6f2015-09-15 11:03:15 -0700512
513
def _run_go_cmd_and_wait(cmd):
  """Launches an external Go command (`isolated` or `cas`) and waits for it.

  Although this launches an arbitrary subprocess, the waiting and logging
  logic is tailored to Go `isolated` and `cas`: the process is polled in
  fixed periods and a progress line is printed after each period that elapses
  without the process exiting.

  Returns:
    The subprocess object, once it exited with return code 0.

  Raises:
    ValueError if the return code is not 0, or if the process was still
    running after all polling periods and had to be stopped. Any exception is
    logged before being re-raised.
  """
  cmd_str = ' '.join(cmd)
  poll_period_sec = 30
  # max timeout = max_polls * poll_period_sec = 50 minutes
  max_polls = 100
  try:
    proc = subprocess42.Popen(cmd)

    for elapsed_periods in range(1, max_polls + 1):
      # This is to prevent I/O timeout error during setup.
      try:
        retcode = proc.wait(poll_period_sec)
      except subprocess42.TimeoutExpired:
        print('still running (after %d seconds)' %
              (elapsed_periods * poll_period_sec))
        continue
      if retcode != 0:
        raise ValueError("retcode is not 0: %s (cmd=%s)" % (retcode, cmd_str))
      return proc

    # Every polling period elapsed and the process is still running.
    proc.terminate()
    try:
      proc.wait(poll_period_sec)
    except subprocess42.TimeoutExpired:
      logging.exception(
          "failed to terminate? timeout happened after %d seconds",
          poll_period_sec)
      proc.kill()
      proc.wait()
    # Raise unconditionally, because |proc| was forcefully terminated.
    raise ValueError("timedout after %d seconds (cmd=%s)" %
                     (poll_period_sec * max_polls, cmd_str))
  except Exception:
    logging.exception('Failed to run Go cmd %s', cmd_str)
    raise
Ye Kuangc0cf9ca2020-07-16 08:56:51 +0000561
562
Junji Watanabe4b890ef2020-09-16 01:43:27 +0000563def _fetch_and_map_with_cas(cas_client, digest, instance, output_dir, cache_dir,
Takuto Ikutaae391c52020-12-03 08:43:45 +0000564 policies, kvs_file):
Junji Watanabe4b890ef2020-09-16 01:43:27 +0000565 """
566 Fetches a CAS tree using cas client, create the tree and returns download
567 stats.
568 """
569
Takuto Ikuta34a86c52020-10-13 05:30:57 +0000570 # TODO(crbug.com/chrome-operations/49):
571 # remove this after isolate to RBE-CAS migration.
572 _CAS_EMPTY_DIR_DIGEST = (
573 'e3b0c44298fc1c149afbf4c8996fb92427ae41e4649b934ca495991b7852b855/0')
574 if digest == _CAS_EMPTY_DIR_DIGEST:
575 return {
576 'duration': 0.0,
577 'items_cold': '',
578 'items_hot': '',
579 }
580
Junji Watanabe4b890ef2020-09-16 01:43:27 +0000581 start = time.time()
582 result_json_handle, result_json_path = tempfile.mkstemp(
583 prefix=u'fetch-and-map-result-', suffix=u'.json')
584 os.close(result_json_handle)
585 try:
586 cmd = [
587 cas_client,
588 'download',
589 '-digest',
590 digest,
591 '-cas-instance',
592 instance,
593 # flags for cache.
594 '-cache-dir',
595 cache_dir,
Junji Watanabe4b890ef2020-09-16 01:43:27 +0000596 '-cache-max-size',
597 str(policies.max_cache_size),
598 '-cache-min-free-space',
599 str(policies.min_free_space),
600 # flags for output.
601 '-dir',
602 output_dir,
603 '-dump-stats-json',
604 result_json_path,
Takuto Ikuta557025b2021-02-01 08:37:40 +0000605 '-log-level',
606 'info'
Junji Watanabe4b890ef2020-09-16 01:43:27 +0000607 ]
Takuto Ikutaae391c52020-12-03 08:43:45 +0000608
609 if kvs_file:
610 cmd.extend(['-kvs-file', kvs_file])
611
Junji Watanabe4b890ef2020-09-16 01:43:27 +0000612 _run_go_cmd_and_wait(cmd)
613
614 with open(result_json_path) as json_file:
615 result_json = json.load(json_file)
616
617 return {
618 'duration': time.time() - start,
619 'items_cold': result_json['items_cold'],
620 'items_hot': result_json['items_hot'],
621 }
622 finally:
623 fs.remove(result_json_path)
624
625
def _fetch_and_map_with_go_isolated(isolated_hash, storage, outdir,
                                    go_cache_dir, policies, isolated_client):
  """Downloads an isolated tree into |outdir| with the go `isolated` client.

  Returns:
    dict with the keys 'duration', 'items_cold', 'items_hot',
    'initial_number_items' and 'initial_size'. All but 'duration' are read
    from the result JSON file written by the client.
  """
  start = time.time()
  server_ref = storage.server_ref
  fd, stats_path = tempfile.mkstemp(
      prefix=u'fetch-and-map-result-', suffix=u'.json')
  # Only the path is needed; the client writes the file itself.
  os.close(fd)
  try:
    cmd = [isolated_client, 'download']
    cmd += ['-isolate-server', server_ref.url]
    cmd += ['-namespace', server_ref.namespace]
    cmd += ['-isolated', isolated_hash]
    # flags for cache
    cmd += ['-cache-dir', go_cache_dir]
    cmd += ['-cache-max-items', str(policies.max_items)]
    cmd += ['-cache-max-size', str(policies.max_cache_size)]
    cmd += ['-cache-min-free-space', str(policies.min_free_space)]
    # flags for output
    cmd += ['-output-dir', outdir]
    cmd += ['-fetch-and-map-result-json', stats_path]

    _run_go_cmd_and_wait(cmd)

    with open(stats_path) as stats_file:
      client_stats = json.load(stats_file)

    stats = {'duration': time.time() - start}
    copied_keys = (
        'items_cold', 'items_hot', 'initial_number_items', 'initial_size')
    for key in copied_keys:
      stats[key] = client_stats[key]
    return stats
  finally:
    fs.remove(stats_path)
678
679
680# TODO(crbug.com/932396): remove this function.
def fetch_and_map(isolated_hash, storage, cache, outdir):
  """Fetches an isolated tree into |outdir| and returns download stats.

  Returns:
    dict with 'duration' (seconds), 'items_cold' (packed, base64-encoded
    sorted content of cache.added) and 'items_hot' (same encoding, for the
    entries of cache.used left after subtracting cache.added as multisets).
  """
  start = time.time()
  isolateserver.fetch_isolated(
      isolated_hash=isolated_hash,
      storage=storage,
      cache=cache,
      outdir=outdir,
      use_symlinks=False)

  def encode(items):
    return base64.b64encode(large.pack(sorted(items))).decode()

  # Multiset difference: whatever was used but not added during this fetch.
  used = collections.Counter(cache.used)
  added = collections.Counter(cache.added)
  hot = (used - added).elements()
  duration = time.time() - start
  return {
      'duration': duration,
      'items_cold': encode(cache.added),
      'items_hot': encode(hot),
  }
697
698
def link_outputs_to_outdir(run_dir, out_dir, outputs):
  """Links any named outputs to out_dir so they can be uploaded.

  Does nothing when |outputs| is empty. Otherwise the directories needed for
  |outputs| are created under |out_dir| and each output is copied from its
  location under |run_dir| with copy_recursively().
  """
  if outputs:
    isolateserver.create_directories(out_dir, outputs)
    for relpath in outputs:
      source = os.path.join(run_dir, relpath)
      destination = os.path.join(out_dir, relpath)
      copy_recursively(source, destination)
709
710
def copy_recursively(src, dst):
  """Efficiently copies a file or directory from src to dst.

  `src` may be a file, directory, or a symlink to a file or directory.
  All symlinks are replaced with their targets, so the resulting
  directory structure at dst will never have any symlinks.

  To increase speed, copy_recursively hardlinks individual files into the
  (newly created) directory structure if possible, unlike Python's
  shutil.copytree().

  OSError is never propagated to the caller: it is logged and the offending
  path is skipped. A symlink chain longer than a fixed number of hops (which
  includes every cyclic chain) is also logged and skipped.
  """
  # Upper bound on the number of symlinks followed for one path. 40 is the
  # limit Linux applies before failing path resolution with ELOOP.
  max_symlink_hops = 40
  orig_src = src
  try:
    # Replace symlinks with their final target.
    hops = 0
    while fs.islink(src):
      hops += 1
      if hops > max_symlink_hops:
        # Without this bound a cyclic symlink (a -> b -> a) would keep this
        # loop spinning forever.
        logging.warning(
            'Too many levels of symbolic links while resolving %s; skipping',
            orig_src)
        return
      res = fs.readlink(src)
      # A relative link target is relative to the directory holding the link.
      src = os.path.join(os.path.dirname(src), res)

    if fs.isfile(src):
      file_path.link_file(dst, src, file_path.HARDLINK_WITH_FALLBACK)
      return

    if not fs.exists(dst):
      os.makedirs(dst)

    # Not a regular file: treat it as a directory and recurse. An OSError
    # raised from here on (e.g. because src does not exist) is handled below.
    for child in fs.listdir(src):
      copy_recursively(os.path.join(src, child), os.path.join(dst, child))

  except OSError as e:
    if e.errno == errno.ENOENT:
      logging.warning('Path %s does not exist or %s is a broken symlink',
                      src, orig_src)
    else:
      logging.info("Couldn't collect output file %s: %s", src, e)
aludwin0a8e17d2016-10-27 15:57:39 -0700748
749
def _upload_with_py(storage, out_dir):
  """Archives |out_dir| to |storage| with the Python isolateserver code.

  Returns:
    tuple(isolated, cold, hot)
    - isolated: first value of the results mapping returned by
      isolateserver.archive_files_to_storage().
    - cold, hot: packed, base64-encoded sorted `size` values of the two item
      collections returned alongside the results.

  Raises:
    isolateserver.Aborted: re-raised after a note is written to stderr.
  """

  def pack_sizes(items):
    sizes = [item.size for item in items]
    sizes.sort()
    return base64.b64encode(large.pack(sizes)).decode()

  try:
    results, f_cold, f_hot = isolateserver.archive_files_to_storage(
        storage, [out_dir], None, verify_push=True)

    archived = list(results.values())
    return archived[0], pack_sizes(f_cold), pack_sizes(f_hot)

  except isolateserver.Aborted:
    # This happens when a signal SIGTERM was received while uploading data.
    # There is 2 causes:
    # - The task was too slow and was about to be killed anyway due to
    #   exceeding the hard timeout.
    # - The amount of data uploaded back is very large and took too much
    #   time to archive.
    sys.stderr.write('Received SIGTERM while uploading')
    # Re-raise, so it will be treated as an internal failure.
    raise
775
776
def _upload_with_go(storage, outdir, isolated_client):
  """Uploads results back using the Go `isolated` CLI.

  Arguments:
  - storage: object whose `server_ref` supplies the isolate server `url` and
    `namespace`.
  - outdir: directory to archive.
  - isolated_client: path of the client executable to run.

  Returns:
    tuple(isolated, items_cold, items_hot): the content of the file written
    via -dump-hash, and the 'items_cold' / 'items_hot' entries of the JSON
    file written via -dump-stats-json.

  The client is retried with an exponential backoff; once more than two
  minutes have passed since the first attempt, the failure is re-raised.
  """
  server_ref = storage.server_ref
  isolated_fd, isolated_path = tempfile.mkstemp(
      prefix=u'isolated-hash-', suffix=u'.txt')
  stats_fd, stats_json_path = tempfile.mkstemp(
      prefix=u'dump-stats-', suffix=u'.json')
  # The client writes both files itself; only their paths are needed.
  os.close(isolated_fd)
  os.close(stats_fd)
  try:
    cmd = [isolated_client, 'archive']
    cmd += ['-isolate-server', server_ref.url]
    cmd += ['-namespace', server_ref.namespace]
    # Format: <working directory>:<relative path to dir>
    cmd += ['-dirs', outdir + ':']
    # output
    cmd += ['-dump-hash', isolated_path]
    cmd += ['-dump-stats-json', stats_json_path]
    cmd.append('-quiet')

    # Will do exponential backoff, e.g. 10, 20, 40...
    # This mitigates https://crbug.com/1094369, where there is a data race on
    # the uploaded files.
    backoff = 10
    deadline = time.time() + 60 * 2
    while True:
      try:
        _run_go_cmd_and_wait(cmd)
      except Exception:
        if time.time() > deadline:
          # This is to not wait task having leaked process long time.
          raise

        on_error.report('error before %d second backoff' % backoff)
        logging.exception(
            '_run_go_cmd_and_wait() failed, will retry after %d seconds',
            backoff)
        time.sleep(backoff)
        backoff *= 2
      else:
        break

    with open(isolated_path) as isol_file:
      isolated = isol_file.read()
    with open(stats_json_path) as json_file:
      stats_json = json.load(json_file)

    return isolated, stats_json['items_cold'], stats_json['items_hot']
  finally:
    for path in (isolated_path, stats_json_path):
      fs.remove(path)
837
838
def upload_out_dir(storage, out_dir, go_isolated_client):
  """Uploads the results in |out_dir| back, if there is any.

  The Go client is used when _USE_GO_ISOLATED_TO_UPLOAD is set and
  |go_isolated_client| is not None; otherwise the Python uploader is used.

  Returns:
    tuple(outputs_ref, stats)
    - outputs_ref: a dict referring to the results archived back to the isolated
        server, or None when |out_dir| is missing or empty.
    - stats: uploading stats ('duration', 'items_cold', 'items_hot').
  """
  # Defaults reported when nothing is uploaded.
  outputs_ref = None
  cold = ''
  hot = ''
  start = time.time()

  # Upload out_dir and generate a .isolated file out of this directory. It is
  # only done if files were written in the directory.
  has_files = fs.isdir(out_dir) and fs.listdir(out_dir)
  if has_files:
    with tools.Profiler('ArchiveOutput'):
      use_go = _USE_GO_ISOLATED_TO_UPLOAD and go_isolated_client is not None
      if not use_go:
        isolated, cold, hot = _upload_with_py(storage, out_dir)
      else:
        isolated, cold, hot = _upload_with_go(storage, out_dir,
                                              go_isolated_client)
      outputs_ref = {
          'isolated': isolated,
          'isolatedserver': storage.server_ref.url,
          'namespace': storage.server_ref.namespace,
      }

  duration = time.time() - start
  return outputs_ref, {
      'duration': duration,
      'items_cold': cold,
      'items_hot': hot,
  }
maruela9cfd6f2015-09-15 11:03:15 -0700875
876
def upload_outdir_with_cas(cas_client, cas_instance, outdir):
  """Uploads the results in |outdir| with the cas client.

  Arguments:
  - cas_client: path of the cas client executable to run.
  - cas_instance: value passed to the client as -cas-instance.
  - outdir: directory to archive.

  Returns:
    tuple(cas_output_root, stats)
    - cas_output_root: dict with 'cas_instance' and 'digest'; the digest holds
      the 'hash' and integer 'size_bytes' parsed from the "<hash>/<size>" text
      the client writes to its -dump-digest file.
    - stats: the JSON the client writes to its -dump-stats-json file, with a
      'duration' entry (seconds) added.
  """
  digest_fd, digest_path = tempfile.mkstemp(
      prefix=u'cas-digest', suffix=u'.txt')
  os.close(digest_fd)
  stats_fd, stats_json_path = tempfile.mkstemp(
      prefix=u'upload-stats', suffix=u'.json')
  os.close(stats_fd)

  try:
    cmd = [cas_client, 'archive']
    cmd += ['-cas-instance', cas_instance]
    # Format: <working directory>:<relative path to dir>
    cmd += ['-paths', outdir + ':']
    # output
    cmd += ['-dump-digest', digest_path]
    cmd += ['-dump-stats-json', stats_json_path]

    start = time.time()

    _run_go_cmd_and_wait(cmd)

    with open(digest_path) as digest_file:
      digest = digest_file.read()
    h, s = digest.split('/')
    root_digest = {'hash': h, 'size_bytes': int(s)}
    cas_output_root = {'cas_instance': cas_instance, 'digest': root_digest}

    with open(stats_json_path) as stats_file:
      stats = json.load(stats_file)
    stats['duration'] = time.time() - start

    return cas_output_root, stats
  finally:
    for path in (digest_path, stats_json_path):
      fs.remove(path)
931
932
def map_and_run(data, constant_run_path):
  """Runs a command with optional isolated input/output.

  Arguments:
  - data: TaskData instance.
  - constant_run_path: when true (and data.root_dir is set), the run directory
    is <data.root_dir>/ISOLATED_RUN_DIR, wiped and recreated; otherwise it is
    created with make_temp_dir().

  Returns metadata about the result: a dict with 'duration', 'exit_code',
  'had_hard_timeout', 'internal_failure', 'stats', 'outputs_ref',
  'cas_output_root', 'version' and, when CIPD packages were installed,
  'cipd_pins'. Exceptions raised while mapping, running or uploading are not
  propagated; they are reported through 'internal_failure'.
  """

  if data.isolate_cache:
    download_stats = {
        #'duration': 0.,
        'initial_number_items': len(data.isolate_cache),
        'initial_size': data.isolate_cache.total_size,
        #'items_cold': '<large.pack()>',
        #'items_hot': '<large.pack()>',
    }
  else:
    # TODO(tikuta): take stats from state.json in this case too.
    download_stats = {}

  # 'internal_failure' starts out set and is only cleared once the whole
  # map/run/upload sequence below completes.
  result = {
      'duration': None,
      'exit_code': None,
      'had_hard_timeout': False,
      'internal_failure': 'run_isolated did not complete properly',
      'stats': {
          #'cipd': {
          #  'duration': 0.,
          #  'get_client_duration': 0.,
          #},
          'isolated': {
              'download': download_stats,
              #'upload': {
              #  'duration': 0.,
              #  'items_cold': '<large.pack()>',
              #  'items_hot': '<large.pack()>',
              #},
          },
      },
      #'cipd_pins': {
      #  'packages': [
      #    {'package_name': ..., 'version': ..., 'path': ...},
      #    ...
      #  ],
      #  'client_package': {'package_name': ..., 'version': ...},
      #},
      'outputs_ref': None,
      'cas_output_root': None,
      'version': 5,
  }

  assert os.path.isabs(data.root_dir), ("data.root_dir is not abs path: %s" %
                                        data.root_dir)
  file_path.ensure_tree(data.root_dir, 0o700)

  # See comment for these constants.
  # TODO(maruel): This is not obvious. Change this to become an error once we
  # make the constant_run_path an exposed flag.
  if constant_run_path and data.root_dir:
    run_dir = os.path.join(data.root_dir, ISOLATED_RUN_DIR)
    if os.path.isdir(run_dir):
      file_path.rmtree(run_dir)
    os.mkdir(run_dir, 0o700)
  else:
    run_dir = make_temp_dir(ISOLATED_RUN_DIR, data.root_dir)

  # True if CAS is used for download/upload files.
  use_cas = bool(data.cas_digest)

  # storage should be normally set but don't crash if it is not. This can happen
  # as Swarming task can run without an isolate server.
  out_dir = None
  if data.storage or use_cas:
    out_dir = make_temp_dir(ISOLATED_OUT_DIR, data.root_dir)
  tmp_dir = make_temp_dir(ISOLATED_TMP_DIR, data.root_dir)
  isolated_client_dir = make_temp_dir(ISOLATED_CLIENT_DIR, data.root_dir)
  cwd = run_dir
  if data.relative_cwd:
    cwd = os.path.normpath(os.path.join(cwd, data.relative_cwd))
  command = data.command
  go_isolated_client = None
  if data.use_go_isolated:
    go_isolated_client = os.path.join(isolated_client_dir,
                                      'isolated' + cipd.EXECUTABLE_SUFFIX)

  cas_client = None
  cas_client_dir = make_temp_dir(_CAS_CLIENT_DIR, data.root_dir)
  if use_cas:
    cas_client = os.path.join(cas_client_dir, 'cas' + cipd.EXECUTABLE_SUFFIX)

  try:
    with data.install_packages_fn(run_dir, isolated_client_dir,
                                  cas_client_dir) as cipd_info:
      if cipd_info:
        result['stats']['cipd'] = cipd_info.stats
        result['cipd_pins'] = cipd_info.pins

      isolated_stats = result['stats'].setdefault('isolated', {})
      if data.isolated_hash:
        if data.use_go_isolated:
          stats = _fetch_and_map_with_go_isolated(
              isolated_hash=data.isolated_hash,
              storage=data.storage,
              outdir=run_dir,
              go_cache_dir=data.go_cache_dir,
              policies=data.go_cache_policies,
              isolated_client=go_isolated_client)
        else:
          stats = fetch_and_map(
              isolated_hash=data.isolated_hash,
              storage=data.storage,
              cache=data.isolate_cache,
              outdir=run_dir)
        isolated_stats['download'].update(stats)

      elif data.cas_digest:
        stats = _fetch_and_map_with_cas(
            cas_client=cas_client,
            digest=data.cas_digest,
            instance=data.cas_instance,
            output_dir=run_dir,
            cache_dir=data.cas_cache_dir,
            policies=data.cas_cache_policies,
            kvs_file=data.cas_kvs)
        isolated_stats['download'].update(stats)

      if not command:
        # Handle this as a task failure, not an internal failure.
        sys.stderr.write(
            '<No command was specified!>\n'
            '<Please secify a command when triggering your Swarming task>\n')
        result['exit_code'] = 1
        return result

      # Compare on a path-component boundary: a bare startswith(run_dir) would
      # also accept a sibling directory that merely shares the prefix (e.g.
      # "<root>/ir2" when run_dir is "<root>/ir").
      inside_run_dir = (
          cwd == run_dir or cwd.startswith(os.path.join(run_dir, '')))
      if not inside_run_dir:
        # Handle this as a task failure, not an internal failure. This is a
        # 'last chance' way to gate against directory escape.
        sys.stderr.write('<Relative CWD is outside of run directory!>\n')
        result['exit_code'] = 1
        return result

      if not os.path.isdir(cwd):
        # Accepts relative_cwd that does not exist.
        os.makedirs(cwd, 0o700)

      # If we have an explicit list of files to return, make sure their
      # directories exist now.
      if data.storage and data.outputs:
        isolateserver.create_directories(run_dir, data.outputs)

      with data.install_named_caches(run_dir):
        sys.stdout.flush()
        start = time.time()
        try:
          # Need to switch the default account before 'get_command_env' call,
          # so it can grab correct value of LUCI_CONTEXT env var.
          with set_luci_context_account(data.switch_to_account, tmp_dir):
            env = get_command_env(
                tmp_dir, cipd_info, run_dir, data.env, data.env_prefix, out_dir,
                data.bot_file)
            command = tools.find_executable(command, env)
            command = process_command(command, out_dir, data.bot_file)
            file_path.ensure_command_has_abs_path(command, cwd)

            result['exit_code'], result['had_hard_timeout'] = run_command(
                command, cwd, env, data.hard_timeout, data.grace_period,
                data.lower_priority, data.containment)
        finally:
          # Recorded even when the command could not be started.
          result['duration'] = max(time.time() - start, 0)

      if out_dir:
        # Try to link files to the output directory, if specified.
        link_outputs_to_outdir(run_dir, out_dir, data.outputs)
        isolated_stats = result['stats'].setdefault('isolated', {})
        if use_cas:
          result['cas_output_root'], isolated_stats['upload'] = (
              upload_outdir_with_cas(cas_client, data.cas_instance, out_dir))
        else:
          # This could use |go_isolated_client|, so make sure it runs when the
          # CIPD package still exists.
          result['outputs_ref'], isolated_stats['upload'] = (
              upload_out_dir(data.storage, out_dir, go_isolated_client))
      # We successfully ran the command, set internal_failure back to
      # None (even if the command failed, it's not an internal error).
      result['internal_failure'] = None
  except Exception as e:
    # An internal error occurred. Report accordingly so the swarming task will
    # be retried automatically.
    logging.exception('internal failure: %s', e)
    result['internal_failure'] = str(e)
    on_error.report(None)

  # Clean up
  finally:
    try:
      success = True
      if data.leak_temp_dir:
        logging.warning(
            'Deliberately leaking %s for later examination', run_dir)
      else:
        # On Windows rmtree(run_dir) call above has a synchronization effect: it
        # finishes only when all task child processes terminate (since a running
        # process locks *.exe file). Examine out_dir only after that call
        # completes (since child processes may write to out_dir too and we need
        # to wait for them to finish).
        dirs_to_remove = [run_dir, tmp_dir, isolated_client_dir, cas_client_dir]
        if out_dir:
          dirs_to_remove.append(out_dir)
        for directory in dirs_to_remove:
          if not fs.isdir(directory):
            continue
          start = time.time()
          try:
            file_path.rmtree(directory)
          except OSError as e:
            logging.error('rmtree(%r) failed: %s', directory, e)
            success = False
          finally:
            logging.info('Cleanup: rmtree(%r) took %d seconds', directory,
                         time.time() - start)
          if not success:
            sys.stderr.write(
                OUTLIVING_ZOMBIE_MSG % (directory, data.grace_period))
            # tasklist.exe only exists on Windows; running it elsewhere would
            # raise, abort the cleanup of the remaining directories and
            # overwrite 'internal_failure' with an unrelated error.
            if sys.platform == 'win32':
              subprocess42.check_call(['tasklist.exe', '/V'], stdout=sys.stderr)
            if result['exit_code'] == 0:
              result['exit_code'] = 1

      if not success and result['exit_code'] == 0:
        result['exit_code'] = 1
    except Exception as e:
      # Swallow any exception in the main finally clause.
      if out_dir:
        logging.exception('Leaking out_dir %s: %s', out_dir, e)
      result['internal_failure'] = str(e)
      on_error.report(None)
  return result
Marc-Antoine Ruel2283ad12014-02-09 11:14:57 -05001172
1173
def run_tha_test(data, result_json):
  """Runs an executable and records execution metadata.

  If isolated_hash is specified, downloads the dependencies in the cache,
  hardlinks them into a temporary directory and runs the command specified in
  the .isolated.

  A temporary directory is created to hold the output files. The content inside
  this directory will be uploaded back to |storage| packaged as a .isolated
  file.

  Arguments:
  - data: TaskData instance.
  - result_json: File path to dump result metadata into. If set, the process
    exit code is always 0 unless an internal error occurred.

  Returns:
    Process exit code that should be used.
  """
  if result_json:
    # Write a json output file right away in case we get killed.
    placeholder = {
        'exit_code': None,
        'had_hard_timeout': False,
        'internal_failure': 'Was terminated before completion',
        'outputs_ref': None,
        'cas_output_root': None,
        'version': 5,
    }
    tools.write_json(result_json, placeholder, dense=True)

  # run_isolated exit code. Depends on if result_json is used or not.
  result = map_and_run(data, True)
  logging.info('Result:\n%s', tools.format_json(result, dense=True))
  internal_failure_code = int(bool(result['internal_failure']))

  if result_json:
    # We've found tests to delete 'work' when quitting, causing an exception
    # here. Try to recreate the directory if necessary.
    file_path.ensure_tree(os.path.dirname(result_json))
    tools.write_json(result_json, result, dense=True)
    # Only return 1 if there was an internal error.
    return internal_failure_code

  # Marshall into old-style inline output.
  outputs_ref = result['outputs_ref']
  if outputs_ref:
    # pylint: disable=unsubscriptable-object
    legacy_output = {
        'hash': outputs_ref['isolated'],
        'namespace': outputs_ref['namespace'],
        'storage': outputs_ref['isolatedserver'],
    }
    sys.stdout.flush()
    print('[run_isolated_out_hack]%s[/run_isolated_out_hack]' %
          tools.format_json(legacy_output, dense=True))
    sys.stdout.flush()
  return result['exit_code'] or internal_failure_code
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001230
1231
# Value yielded by 'install_client_and_packages'.
CipdInfo = collections.namedtuple(
    'CipdInfo',
    (
        # cipd.CipdClient object
        'client',
        # absolute path to bot-global cipd tag and instance cache
        'cache_dir',
        # dict with stats to return to the server
        'stats',
        # dict with installed cipd pins to return to the server
        'pins',
    ))
1239
1240
@contextlib.contextmanager
def noop_install_packages(_run_dir, _isolated_dir, _cas_dir):
  """Stand-in for 'install_client_and_packages' when cipd is disabled.

  Ignores all its arguments and yields None.
  """
  yield
1245
1246
Takuto Ikuta2efc7792019-11-27 14:33:34 +00001247def _install_packages(run_dir, cipd_cache_dir, client, packages):
iannuccib58d10d2017-03-18 02:00:25 -07001248 """Calls 'cipd ensure' for packages.
1249
1250 Args:
1251 run_dir (str): root of installation.
1252 cipd_cache_dir (str): the directory to use for the cipd package cache.
1253 client (CipdClient): the cipd client to use
1254 packages: packages to install, list [(path, package_name, version), ...].
iannuccib58d10d2017-03-18 02:00:25 -07001255
1256 Returns: list of pinned packages. Looks like [
1257 {
1258 'path': 'subdirectory',
1259 'package_name': 'resolved/package/name',
1260 'version': 'deadbeef...',
1261 },
1262 ...
1263 ]
1264 """
1265 package_pins = [None]*len(packages)
1266 def insert_pin(path, name, version, idx):
1267 package_pins[idx] = {
1268 'package_name': name,
1269 # swarming deals with 'root' as '.'
1270 'path': path or '.',
1271 'version': version,
1272 }
1273
1274 by_path = collections.defaultdict(list)
1275 for i, (path, name, version) in enumerate(packages):
1276 # cipd deals with 'root' as ''
1277 if path == '.':
1278 path = ''
1279 by_path[path].append((name, version, i))
1280
1281 pins = client.ensure(
Takuto Ikuta2efc7792019-11-27 14:33:34 +00001282 run_dir,
1283 {
1284 subdir: [(name, vers) for name, vers, _ in pkgs
1285 ] for subdir, pkgs in by_path.items()
1286 },
1287 cache_dir=cipd_cache_dir,
iannuccib58d10d2017-03-18 02:00:25 -07001288 )
1289
Marc-Antoine Ruel04903a32019-10-09 21:09:25 +00001290 for subdir, pin_list in sorted(pins.items()):
iannuccib58d10d2017-03-18 02:00:25 -07001291 this_subdir = by_path[subdir]
1292 for i, (name, version) in enumerate(pin_list):
1293 insert_pin(subdir, name, version, this_subdir[i][2])
1294
Robert Iannucci461b30d2017-12-13 11:34:03 -08001295 assert None not in package_pins, (packages, pins, package_pins)
iannuccib58d10d2017-03-18 02:00:25 -07001296
1297 return package_pins
1298
1299
@contextlib.contextmanager
def install_client_and_packages(run_dir, packages, service_url,
                                client_package_name, client_version, cache_dir,
                                isolated_dir, cas_dir):
  """Bootstraps the CIPD client, then installs the requested CIPD packages.

  This is a context manager. It yields a single CipdInfo object carrying the
  CipdClient, the CIPD cache directory, timing stats and the pins.

  The pins have the form:
    {
      "client_package": {"package_name": ..., "version": ...},
      "packages": <pins returned by _install_packages for |packages|>,
    }

  The package pins correspond 1:1 to the input package arguments from the
  command line. These dictionaries make their way all the way back to
  swarming, where they become the arguments of CipdPackage.

  When |packages| is empty (or None) the CIPD client is still bootstrapped, and
  the isolated and cas clients are still installed, but no task packages are
  installed and the 'packages' pin list is empty.

  The bootstrapped client (regardless whether |packages| is empty or not) is
  meant to be made available to the task via $PATH.

  Args:
    run_dir (str): root of installation.
    packages: packages to install, list [(path, package_name, version), ...].
    service_url (str): CIPD server url, e.g.
      "https://chrome-infra-packages.appspot.com."
    client_package_name (str): CIPD package name of CIPD client.
    client_version (str): Version of CIPD client.
    cache_dir (str): where to keep cache of cipd clients, packages and tags.
    isolated_dir (str): where to download isolated client.
    cas_dir (str): where to download cas client.
  """
  assert cache_dir

  overall_start = time.time()

  cache_dir = os.path.abspath(cache_dir)
  # Tag and instance caches live in a 'cache' subdirectory.
  cipd_cache_dir = os.path.join(cache_dir, 'cache')
  run_dir = os.path.abspath(run_dir)

  bootstrap_start = time.time()
  with cipd.get_client(cache_dir, service_url, client_package_name,
                       client_version) as client:
    get_client_duration = time.time() - bootstrap_start

    # Task packages first; nothing to pin when none were requested.
    if packages:
      package_pins = _install_packages(run_dir, cipd_cache_dir, client,
                                       packages)
    else:
      package_pins = []

    # Then the helper clients: isolated goes to |isolated_dir| and cas goes to
    # |cas_dir|, both at the same pinned revision.
    helper_clients = (
        (isolated_dir, ISOLATED_PACKAGE),
        (cas_dir, _CAS_PACKAGE),
    )
    for target_dir, package_name in helper_clients:
      _install_packages(target_dir, cipd_cache_dir, client,
                        [('', package_name, _LUCI_GO_REVISION)])

    file_path.make_tree_files_read_only(run_dir)

    total_duration = time.time() - overall_start
    logging.info('Installing CIPD client and packages took %d seconds',
                 total_duration)

    stats = {
        'duration': total_duration,
        'get_client_duration': get_client_duration,
    }
    pins = {
        'client_package': {
            'package_name': client.package_name,
            'version': client.instance_id,
        },
        'packages': package_pins,
    }
    yield CipdInfo(
        client=client, cache_dir=cipd_cache_dir, stats=stats, pins=pins)
nodirbe642ff2016-06-09 15:51:51 -07001387
1388
def create_option_parser():
  """Builds the option parser for run_isolated.

  Returns:
    A logging_utils.OptionParserWithLogging instance with all the general
    options plus the option groups for the isolate server, CAS, caches, CIPD,
    named caches, process containment, debugging and authentication.
  """
  parser = logging_utils.OptionParserWithLogging(
      usage='%prog <options> [command to run or extra args]',
      version=__version__,
      log_file=RUN_ISOLATED_LOG_FILE)
  parser.add_option(
      '--clean',
      action='store_true',
      help='Cleans the cache, trimming if necessary and remove corrupted items '
      'and returns without executing anything; use with -v to know what '
      'was done')
  parser.add_option(
      '--json',
      help='dump output metadata to json file. When used, run_isolated returns '
      'non-zero only on internal failure')
  parser.add_option(
      '--hard-timeout', type='float', help='Enforce hard timeout in execution')
  parser.add_option(
      '--grace-period',
      type='float',
      help='Grace period between SIGTERM and SIGKILL')
  parser.add_option(
      '--relative-cwd',
      help='Ignore the isolated \'relative_cwd\' and use this one instead')
  parser.add_option(
      '--env',
      default=[],
      action='append',
      help='Environment variables to set for the child process')
  parser.add_option(
      '--env-prefix',
      default=[],
      action='append',
      help='Specify a VAR=./path/fragment to put in the environment variable '
      'before executing the command. The path fragment must be relative '
      'to the isolated run directory, and must not contain a `..` token. '
      'The path will be made absolute and prepended to the indicated '
      '$VAR using the OS\'s path separator. Multiple items for the same '
      '$VAR will be prepended in order.')
  parser.add_option(
      '--bot-file',
      help='Path to a file describing the state of the host. The content is '
      'defined by on_before_task() in bot_config.')
  parser.add_option(
      '--switch-to-account',
      help='If given, switches LUCI_CONTEXT to given logical service account '
      '(e.g. "task" or "system") before launching the isolated process.')
  parser.add_option(
      '--output',
      action='append',
      help='Specifies an output to return. If no outputs are specified, all '
      'files located in ${ISOLATED_OUTDIR} will be returned; '
      'otherwise, outputs in both ${ISOLATED_OUTDIR} and those '
      'specified by --output option (there can be multiple) will be '
      'returned. Note that if a file in OUT_DIR has the same path '
      'as an --output option, the --output version will be returned.')
  parser.add_option(
      '-a',
      '--argsfile',
      # This is actually handled in parse_args; it's included here purely so it
      # can make it into the help text.
      help='Specify a file containing a JSON array of arguments to this '
      'script. If --argsfile is provided, no other argument may be '
      'provided on the command line.')
  parser.add_option(
      '--report-on-exception',
      action='store_true',
      help='Whether report exception during execution to isolate server. '
      'This flag should only be used in swarming bot.')

  group = optparse.OptionGroup(parser, 'Data source - Isolate server')
  # Deprecated. Isolate server is being migrated to RBE-CAS.
  # Remove --isolated and isolate server options after migration.
  group.add_option(
      '-s', '--isolated',
      help='Hash of the .isolated to grab from the isolate server.')
  isolateserver.add_isolate_server_options(group)
  parser.add_option_group(group)

  group = optparse.OptionGroup(parser,
                               'Data source - Content Addressed Storage')
  group.add_option(
      '--cas-instance', help='Full CAS instance name for input/output files.')
  group.add_option(
      '--cas-digest',
      help='Digest of the input root on RBE-CAS. The format is '
      '`{hash}/{size_bytes}`.')
  parser.add_option_group(group)

  # Cache options.
  isolateserver.add_cache_options(parser)
  add_cas_cache_options(parser)

  cipd.add_cipd_options(parser)

  group = optparse.OptionGroup(parser, 'Named caches')
  group.add_option(
      '--named-cache',
      dest='named_caches',
      action='append',
      nargs=3,
      default=[],
      help='A named cache to request. Accepts 3 arguments: name, path, hint. '
      'name identifies the cache, must match regex [a-z0-9_]{1,4096}. '
      'path is a path relative to the run dir where the cache directory '
      'must be put to. '
      'This option can be specified more than once.')
  group.add_option(
      '--named-cache-root',
      default='named_caches',
      help='Cache root directory. Default=%default')
  parser.add_option_group(group)

  # These options are registered on the group (not directly on the parser) so
  # that --help lists them under 'Process containment'. Parsing is unaffected:
  # an OptionGroup shares its option tables and defaults with its parser.
  group = optparse.OptionGroup(parser, 'Process containment')
  group.add_option(
      '--lower-priority', action='store_true',
      help='Lowers the child process priority')
  group.add_option(
      '--containment-type',
      choices=('NONE', 'AUTO', 'JOB_OBJECT'),
      default='NONE',
      help='Type of container to use')
  group.add_option(
      '--limit-processes',
      type='int',
      default=0,
      help='Maximum number of active processes in the containment')
  group.add_option(
      '--limit-total-committed-memory',
      type='int',
      default=0,
      help='Maximum sum of committed memory in the containment')
  parser.add_option_group(group)

  group = optparse.OptionGroup(parser, 'Debugging')
  group.add_option(
      '--leak-temp-dir',
      action='store_true',
      help='Deliberately leak isolate\'s temp dir for later examination. '
      'Default: %default')
  group.add_option('--root-dir', help='Use a directory instead of a random one')
  parser.add_option_group(group)

  auth.add_auth_options(parser)

  parser.set_defaults(cache='cache')
  return parser
1536
1537
def add_cas_cache_options(parser):
  """Registers the 'CAS cache management' option group on |parser|.

  Adds --cas-cache (default 'cas-cache') and --kvs-file (default '').

  Args:
    parser: the optparse parser to extend in place.
  """
  # (flag, keyword arguments) pairs, in the order they show up in --help.
  option_specs = (
      ('--cas-cache', {
          'metavar': 'DIR',
          'default': 'cas-cache',
          'help': 'Directory to keep a local cache of the files. Accelerates '
                  'download by reusing already downloaded files. '
                  'Default=%default',
      }),
      ('--kvs-file', {
          'default': '',
          'help': 'CAS cache using kvs for small files. Default=%default',
      }),
  )
  cas_group = optparse.OptionGroup(parser, 'CAS cache management')
  for flag, settings in option_specs:
    cas_group.add_option(flag, **settings)
  parser.add_option_group(cas_group)
1551
1552
def process_cas_cache_options(options):
  """Creates the content addressed cache selected by --cas-cache.

  Args:
    options: parsed options; reads cas_cache, max_cache_size and
      min_free_space.

  Returns:
    A local_caching.DiskContentAddressedCache rooted at the absolute path of
    options.cas_cache (created with trim=False) when a cache directory is
    set, otherwise a local_caching.MemoryContentAddressedCache.
  """
  if not options.cas_cache:
    return local_caching.MemoryContentAddressedCache()

  cache_policies = local_caching.CachePolicies(
      max_cache_size=options.max_cache_size,
      min_free_space=options.min_free_space,
      # max_items isn't used for CAS cache for now.
      max_items=None,
      max_age_secs=MAX_AGE_SECS)
  cache_root = six.text_type(os.path.abspath(options.cas_cache))
  return local_caching.DiskContentAddressedCache(
      cache_root, cache_policies, trim=False)
1565
1566
def process_named_cache_options(parser, options, time_fn=None):
  """Validates the named cache options and builds the cache manager.

  Every --named-cache entry is a (name, path, hint) triple. Validation failures
  are reported through parser.error().

  Args:
    parser: option parser, only used to report invalid values.
    options: parsed options; reads named_caches, named_cache_root and
      min_free_space.
    time_fn: forwarded as-is to local_caching.NamedCache.

  Returns:
    A local_caching.NamedCache rooted at the absolute path of
    options.named_cache_root, or None when no root is configured.
  """
  requested = options.named_caches
  cache_root = options.named_cache_root

  if requested and not cache_root:
    parser.error('--named-cache is specified, but --named-cache-root is empty')

  for name, path, hint in requested:
    if CACHE_NAME_RE.match(name) is None:
      parser.error(
          'cache name %r does not match %r' % (name, CACHE_NAME_RE.pattern))
    if not path:
      parser.error('cache path cannot be empty')
    try:
      int(hint)
    except ValueError:
      parser.error('cache hint must be a number')

  if not cache_root:
    return None

  # Make these configurable later if there is use case but for now it's fairly
  # safe values.
  # In practice, a fair chunk of bots are already recycled on a daily schedule
  # so this code doesn't have any effect to them, unless they are preloaded
  # with a really old cache.
  one_tib = 1024 ** 4
  cache_policies = local_caching.CachePolicies(
      max_cache_size=one_tib,
      min_free_space=options.min_free_space,
      max_items=50,
      max_age_secs=MAX_AGE_SECS)
  absolute_root = six.text_type(os.path.abspath(cache_root))
  named_cache = local_caching.NamedCache(
      absolute_root, cache_policies, time_fn=time_fn)
  # Touch any named caches we're going to use to minimize thrashing
  # between tasks that request some (but not all) of the same named caches.
  requested_names = [name for name, _, _ in requested]
  named_cache.touch(*requested_names)
  return named_cache
1600
1601
def parse_args(args):
  """Parses the command line, honoring -a/--argsfile.

  When --argsfile is given, it must be the only argument; the real argument
  list is then loaded from that file as JSON.

  Args:
    args: list of command line arguments, without the program name.

  Returns:
    A (parser, options, args) tuple: the full option parser, the parsed
    options, and the remaining positional arguments.
  """
  # Create a fake mini-parser just to get out the "-a" command. Note that
  # it's not documented here; instead, it's documented in create_option_parser
  # even though that parser will never actually get to parse it. This is
  # because --argsfile is exclusive with all other options and arguments.
  file_argparse = argparse.ArgumentParser(add_help=False)
  file_argparse.add_argument('-a', '--argsfile')
  (file_args, nonfile_args) = file_argparse.parse_known_args(args)
  if file_args.argsfile:
    if nonfile_args:
      # Note the trailing space: adjacent string literals are concatenated
      # verbatim.
      file_argparse.error('Can\'t specify --argsfile with '
                          'any other arguments (%s)' % nonfile_args)
    try:
      with open(file_args.argsfile, 'r') as f:
        args = json.load(f)
    except (IOError, OSError, ValueError) as e:
      # We don't error out here: |args| keeps its original value and is still
      # handed to the regular parser below.
      print('Couldn\'t read arguments: %s' % e, file=sys.stderr)

  # Even if we failed to read the args, just call the normal parser now.
  parser = create_option_parser()
  options, args = parser.parse_args(args)
  # The value may come in as a string (e.g. 'true'/'false'); normalize it.
  if not isinstance(options.cipd_enabled, (bool, int)):
    options.cipd_enabled = distutils.util.strtobool(options.cipd_enabled)
  return (parser, options, args)
1630
1631
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001632def _calc_named_cache_hint(named_cache, named_caches):
1633 """Returns the expected size of the missing named caches."""
1634 present = named_cache.available
1635 size = 0
1636 for name, _, hint in named_caches:
1637 if name not in present:
Takuto Ikuta630f99d2020-07-02 12:59:35 +00001638 hint = int(hint)
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001639 if hint > 0:
1640 size += hint
1641 return size
1642
1643
Takuto Ikutaae391c52020-12-03 08:43:45 +00001644def _clean_cmd(parser, options, caches, root):
Takuto Ikuta7ff4b242020-12-03 08:07:06 +00001645 """Cleanup cache dirs/files."""
1646 if options.isolated:
1647 parser.error('Can\'t use --isolated with --clean.')
1648 if options.isolate_server:
1649 parser.error('Can\'t use --isolate-server with --clean.')
1650 if options.json:
1651 parser.error('Can\'t use --json with --clean.')
1652 if options.named_caches:
1653 parser.error('Can\t use --named-cache with --clean.')
1654 if options.cas_instance or options.cas_digest:
1655 parser.error('Can\t use --cas-instance, --cas-digest with --clean.')
1656
1657 logging.info("initial free space: %d", file_path.get_free_space(root))
1658
Takuto Ikutaae391c52020-12-03 08:43:45 +00001659 if options.kvs_file and fs.isfile(six.text_type(options.kvs_file)):
Takuto Ikuta7ff4b242020-12-03 08:07:06 +00001660 # Remove kvs file if its size exceeds fixed threshold.
Takuto Ikuta80bee362020-12-03 10:51:37 +00001661 st = fs.stat(six.text_type(options.kvs_file))
Takuto Ikuta7ff4b242020-12-03 08:07:06 +00001662 if st.st_size >= _CAS_KVS_CACHE_THRESHOLD:
1663 logging.info("remove kvs file with size: %d", st.st_size)
Takuto Ikuta80bee362020-12-03 10:51:37 +00001664 fs.remove(six.text_type(options.kvs_file))
Takuto Ikuta7ff4b242020-12-03 08:07:06 +00001665
1666 # Trim first, then clean.
1667 local_caching.trim_caches(
1668 caches,
1669 root,
1670 min_free_space=options.min_free_space,
1671 max_age_secs=MAX_AGE_SECS)
1672 logging.info("free space after trim: %d", file_path.get_free_space(root))
1673 for c in caches:
1674 c.cleanup()
1675 logging.info("free space after cleanup: %d", file_path.get_free_space(root))
1676
1677
aludwin7556e0c2016-10-26 08:46:10 -07001678def main(args):
Marc-Antoine Ruelee6ca622017-11-29 11:19:16 -05001679 # Warning: when --argsfile is used, the strings are unicode instances, when
1680 # parsed normally, the strings are str instances.
aludwin7556e0c2016-10-26 08:46:10 -07001681 (parser, options, args) = parse_args(args)
maruel36a963d2016-04-08 17:15:49 -07001682
Takuto Ikuta74682862021-02-03 04:49:12 +00001683 SWARMING_SERVER = 'SWARMING_SERVER'
1684 if options.report_on_exception and SWARMING_SERVER in os.environ:
1685 on_error.report_on_exception_exit(os.environ[SWARMING_SERVER])
Takuto Ikutad4be2f12020-05-12 02:15:25 +00001686
Marc-Antoine Ruel5028ba22017-08-25 17:37:51 -04001687 if not file_path.enable_symlink():
Marc-Antoine Ruel5a024272019-01-15 20:11:16 +00001688 logging.warning('Symlink support is not enabled')
Marc-Antoine Ruel5028ba22017-08-25 17:37:51 -04001689
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001690 named_cache = process_named_cache_options(parser, options)
Marc-Antoine Ruel0d8b0f62018-09-10 14:40:35 +00001691 # hint is 0 if there's no named cache.
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001692 hint = _calc_named_cache_hint(named_cache, options.named_caches)
1693 if hint:
1694 # Increase the --min-free-space value by the hint, and recreate the
1695 # NamedCache instance so it gets the updated CachePolicy.
1696 options.min_free_space += hint
1697 named_cache = process_named_cache_options(parser, options)
1698
Takuto Ikuta5c59a842020-01-24 03:05:24 +00001699 # TODO(crbug.com/932396): Remove this.
Takuto Ikuta4a22c2c2020-06-05 02:02:23 +00001700 use_go_isolated = options.cipd_enabled
Takuto Ikuta5c59a842020-01-24 03:05:24 +00001701
Marc-Antoine Ruel7139d912018-06-15 20:04:42 +00001702 # TODO(maruel): CIPD caches should be defined at an higher level here too, so
1703 # they can be cleaned the same way.
Takuto Ikutaf1c58442020-10-20 09:03:27 +00001704
1705 isolate_cache = isolateserver.process_cache_options(options, trim=False)
1706 cas_cache = process_cas_cache_options(options)
Takuto Ikuta00cf8fc2020-01-14 01:36:00 +00001707
Marc-Antoine Ruel7139d912018-06-15 20:04:42 +00001708 caches = []
1709 if isolate_cache:
1710 caches.append(isolate_cache)
Junji Watanabeb03450b2020-09-25 05:09:27 +00001711 if cas_cache:
1712 caches.append(cas_cache)
Marc-Antoine Ruel7139d912018-06-15 20:04:42 +00001713 if named_cache:
1714 caches.append(named_cache)
Takuto Ikuta6e2ff962019-10-29 12:35:27 +00001715 root = caches[0].cache_dir if caches else six.text_type(os.getcwd())
maruel36a963d2016-04-08 17:15:49 -07001716 if options.clean:
Takuto Ikutaae391c52020-12-03 08:43:45 +00001717 _clean_cmd(parser, options, caches, root)
maruel36a963d2016-04-08 17:15:49 -07001718 return 0
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001719
1720 # Trim must still be done for the following case:
1721 # - named-cache was used
1722 # - some entries, with a large hint, where missing
1723 # - --min-free-space was increased accordingly, thus trimming is needed
1724 # Otherwise, this will have no effect, as bot_main calls run_isolated with
1725 # --clean after each task.
Takuto Ikutaa010c532020-10-21 05:42:29 +00001726 local_caching.trim_caches(
1727 caches,
1728 root,
Takuto Ikutaa32a1602021-01-20 06:55:16 +00001729 # Add 5+1GB more buffer for Go CLI.
1730 min_free_space=options.min_free_space + _CAS_KVS_CACHE_THRESHOLD +
1731 _FREE_SPACE_BUFFER_FOR_GO,
Takuto Ikutaa010c532020-10-21 05:42:29 +00001732 max_age_secs=MAX_AGE_SECS)
maruel36a963d2016-04-08 17:15:49 -07001733
Takuto Ikutaf1c58442020-10-20 09:03:27 +00001734 # Save state of isolate/cas cache not to overwrite state from go client.
1735 if use_go_isolated:
1736 isolate_cache.save()
1737 isolate_cache = None
1738 if cas_cache:
1739 cas_cache.save()
1740 cas_cache = None
1741
nodir55be77b2016-05-03 09:39:57 -07001742 if not options.isolated and not args:
1743 parser.error('--isolated or command to run is required.')
1744
Vadim Shtayura5d1efce2014-02-04 10:55:43 -08001745 auth.process_auth_options(parser, options)
nodir55be77b2016-05-03 09:39:57 -07001746
Takuto Ikutaae767b32020-05-11 01:22:19 +00001747 isolateserver.process_isolate_server_options(parser, options, False)
Junji Watanabeed9ce352020-09-25 12:32:07 +00001748 if ISOLATED_OUTDIR_PARAMETER in args and (not options.isolate_server and
1749 not options.cas_instance):
1750 parser.error('%s in args requires --isolate-server or --cas-instance' %
1751 ISOLATED_OUTDIR_PARAMETER)
1752
1753 if options.isolated and not options.isolate_server:
1754 parser.error('--isolated requires --isolate-server')
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001755
nodir90bc8dc2016-06-15 13:35:21 -07001756 if options.root_dir:
Takuto Ikuta6e2ff962019-10-29 12:35:27 +00001757 options.root_dir = six.text_type(os.path.abspath(options.root_dir))
Takuto Ikutad46ea762020-10-07 05:43:22 +00001758 else:
1759 options.root_dir = six.text_type(tempfile.mkdtemp(prefix='root'))
maruel12e30012015-10-09 11:55:35 -07001760 if options.json:
Takuto Ikuta6e2ff962019-10-29 12:35:27 +00001761 options.json = six.text_type(os.path.abspath(options.json))
nodir55be77b2016-05-03 09:39:57 -07001762
Marc-Antoine Ruel19dd8872017-11-28 18:33:39 -05001763 if any('=' not in i for i in options.env):
1764 parser.error(
1765 '--env required key=value form. value can be skipped to delete '
1766 'the variable')
Marc-Antoine Ruel7a68f712017-12-01 18:45:18 -05001767 options.env = dict(i.split('=', 1) for i in options.env)
Marc-Antoine Ruel19dd8872017-11-28 18:33:39 -05001768
1769 prefixes = {}
1770 cwd = os.path.realpath(os.getcwd())
1771 for item in options.env_prefix:
1772 if '=' not in item:
1773 parser.error(
1774 '--env-prefix %r is malformed, must be in the form `VAR=./path`'
1775 % item)
Marc-Antoine Ruel7a68f712017-12-01 18:45:18 -05001776 key, opath = item.split('=', 1)
Marc-Antoine Ruel19dd8872017-11-28 18:33:39 -05001777 if os.path.isabs(opath):
1778 parser.error('--env-prefix %r path is bad, must be relative.' % opath)
1779 opath = os.path.normpath(opath)
1780 if not os.path.realpath(os.path.join(cwd, opath)).startswith(cwd):
1781 parser.error(
Junji Watanabe38b28b02020-04-23 10:23:30 +00001782 '--env-prefix %r path is bad, must be relative and not contain `..`.'
1783 % opath)
Marc-Antoine Ruel19dd8872017-11-28 18:33:39 -05001784 prefixes.setdefault(key, []).append(opath)
1785 options.env_prefix = prefixes
Robert Iannuccibf5f84c2017-11-22 12:56:50 -08001786
nodirbe642ff2016-06-09 15:51:51 -07001787 cipd.validate_cipd_options(parser, options)
1788
vadimsh232f5a82017-01-20 19:23:44 -08001789 install_packages_fn = noop_install_packages
Ye Kuang1d096cb2020-06-26 08:38:21 +00001790 tmp_cipd_cache_dir = None
vadimsh902948e2017-01-20 15:57:32 -08001791 if options.cipd_enabled:
Ye Kuang1d096cb2020-06-26 08:38:21 +00001792 cache_dir = options.cipd_cache
1793 if not cache_dir:
1794 tmp_cipd_cache_dir = six.text_type(tempfile.mkdtemp())
1795 cache_dir = tmp_cipd_cache_dir
Takuto Ikutab7ce0e32019-11-27 23:26:18 +00001796 install_packages_fn = (
Junji Watanabe4b890ef2020-09-16 01:43:27 +00001797 lambda run_dir, isolated_dir, cas_dir: install_client_and_packages(
Ye Kuang1d096cb2020-06-26 08:38:21 +00001798 run_dir,
1799 cipd.parse_package_args(options.cipd_packages),
1800 options.cipd_server,
1801 options.cipd_client_package,
1802 options.cipd_client_version,
1803 cache_dir=cache_dir,
Junji Watanabe4b890ef2020-09-16 01:43:27 +00001804 isolated_dir=isolated_dir,
1805 cas_dir=cas_dir,
1806 ))
nodirbe642ff2016-06-09 15:51:51 -07001807
nodird6160682017-02-02 13:03:35 -08001808 @contextlib.contextmanager
nodir0ae98b32017-05-11 13:21:53 -07001809 def install_named_caches(run_dir):
nodird6160682017-02-02 13:03:35 -08001810 # WARNING: this function depends on "options" variable defined in the outer
1811 # function.
Takuto Ikuta6e2ff962019-10-29 12:35:27 +00001812 assert six.text_type(run_dir), repr(run_dir)
Marc-Antoine Ruel49f9f8d2018-05-24 15:57:06 -04001813 assert os.path.isabs(run_dir), run_dir
Takuto Ikuta6e2ff962019-10-29 12:35:27 +00001814 named_caches = [(os.path.join(run_dir, six.text_type(relpath)), name)
1815 for name, relpath, _ in options.named_caches]
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001816 for path, name in named_caches:
Marc-Antoine Ruele79ddbf2018-06-13 18:33:07 +00001817 named_cache.install(path, name)
nodird6160682017-02-02 13:03:35 -08001818 try:
1819 yield
1820 finally:
dnje289d132017-07-07 11:16:44 -07001821 # Uninstall each named cache, returning it to the cache pool. If an
1822 # uninstall fails for a given cache, it will remain in the task's
1823 # temporary space, get cleaned up by the Swarming bot, and be lost.
1824 #
1825 # If the Swarming bot cannot clean up the cache, it will handle it like
1826 # any other bot file that could not be removed.
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001827 for path, name in reversed(named_caches):
Marc-Antoine Ruele79ddbf2018-06-13 18:33:07 +00001828 try:
Marc-Antoine Ruele9558372018-08-03 03:41:22 +00001829 # uninstall() doesn't trim but does call save() implicitly. Trimming
1830 # *must* be done manually via periodic 'run_isolated.py --clean'.
Marc-Antoine Ruele79ddbf2018-06-13 18:33:07 +00001831 named_cache.uninstall(path, name)
1832 except local_caching.NamedCacheError:
1833 logging.exception('Error while removing named cache %r at %r. '
1834 'The cache will be lost.', path, name)
nodirf33b8d62016-10-26 22:34:58 -07001835
Takuto Ikutaf3caa9b2020-11-02 05:38:26 +00001836 command = args
1837 if options.relative_cwd:
1838 a = os.path.normpath(os.path.abspath(options.relative_cwd))
1839 if not a.startswith(os.getcwd()):
1840 parser.error(
1841 '--relative-cwd must not try to escape the working directory')
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -05001842
Marc-Antoine Ruel1b65f4e2019-05-02 21:56:58 +00001843 containment_type = subprocess42.Containment.NONE
1844 if options.containment_type == 'AUTO':
1845 containment_type = subprocess42.Containment.AUTO
1846 if options.containment_type == 'JOB_OBJECT':
1847 containment_type = subprocess42.Containment.JOB_OBJECT
1848 containment = subprocess42.Containment(
1849 containment_type=containment_type,
1850 limit_processes=options.limit_processes,
1851 limit_total_committed_memory=options.limit_total_committed_memory)
1852
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -05001853 data = TaskData(
1854 command=command,
Marc-Antoine Ruel95068cf2017-12-07 21:35:05 -05001855 relative_cwd=options.relative_cwd,
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -05001856 isolated_hash=options.isolated,
1857 storage=None,
1858 isolate_cache=isolate_cache,
Junji Watanabe54925c32020-09-08 00:56:18 +00001859 cas_instance=options.cas_instance,
1860 cas_digest=options.cas_digest,
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -05001861 outputs=options.output,
1862 install_named_caches=install_named_caches,
1863 leak_temp_dir=options.leak_temp_dir,
1864 root_dir=_to_unicode(options.root_dir),
1865 hard_timeout=options.hard_timeout,
1866 grace_period=options.grace_period,
1867 bot_file=options.bot_file,
1868 switch_to_account=options.switch_to_account,
1869 install_packages_fn=install_packages_fn,
Takuto Ikuta5c59a842020-01-24 03:05:24 +00001870 use_go_isolated=use_go_isolated,
Takuto Ikuta10cae642020-01-08 08:12:07 +00001871 go_cache_dir=options.cache,
Takuto Ikuta879788c2020-01-10 08:00:26 +00001872 go_cache_policies=local_caching.CachePolicies(
1873 max_cache_size=options.max_cache_size,
1874 min_free_space=options.min_free_space,
1875 max_items=options.max_items,
1876 max_age_secs=None,
1877 ),
Junji Watanabeb03450b2020-09-25 05:09:27 +00001878 cas_cache_dir=options.cas_cache,
1879 cas_cache_policies=local_caching.CachePolicies(
1880 max_cache_size=options.max_cache_size,
1881 min_free_space=options.min_free_space,
1882 max_items=None,
1883 max_age_secs=None,
1884 ),
Takuto Ikutaae391c52020-12-03 08:43:45 +00001885 cas_kvs=options.kvs_file,
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -05001886 env=options.env,
Marc-Antoine Ruel03c6fd12019-04-30 12:12:55 +00001887 env_prefix=options.env_prefix,
Marc-Antoine Ruel1b65f4e2019-05-02 21:56:58 +00001888 lower_priority=bool(options.lower_priority),
1889 containment=containment)
nodirbe642ff2016-06-09 15:51:51 -07001890 try:
nodir90bc8dc2016-06-15 13:35:21 -07001891 if options.isolate_server:
Marc-Antoine Ruelb8513132018-11-20 19:48:53 +00001892 server_ref = isolate_storage.ServerRef(
nodir90bc8dc2016-06-15 13:35:21 -07001893 options.isolate_server, options.namespace)
Marc-Antoine Ruelb8513132018-11-20 19:48:53 +00001894 storage = isolateserver.get_storage(server_ref)
nodir90bc8dc2016-06-15 13:35:21 -07001895 with storage:
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -05001896 data = data._replace(storage=storage)
nodirf33b8d62016-10-26 22:34:58 -07001897 # Hashing schemes used by |storage| and |isolate_cache| MUST match.
Marc-Antoine Ruelb8513132018-11-20 19:48:53 +00001898 assert storage.server_ref.hash_algo == server_ref.hash_algo
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -05001899 return run_tha_test(data, options.json)
1900 return run_tha_test(data, options.json)
Junji Watanabe38b28b02020-04-23 10:23:30 +00001901 except (cipd.Error, local_caching.NamedCacheError,
1902 local_caching.NoMoreSpace) as ex:
Marc-Antoine Ruelf899c482019-10-10 23:32:06 +00001903 print(ex.message, file=sys.stderr)
nodirbe642ff2016-06-09 15:51:51 -07001904 return 1
Ye Kuang1d096cb2020-06-26 08:38:21 +00001905 finally:
1906 if tmp_cipd_cache_dir is not None:
1907 try:
1908 file_path.rmtree(tmp_cipd_cache_dir)
1909 except OSError:
1910 logging.exception('Remove tmp_cipd_cache_dir=%s failed',
1911 tmp_cipd_cache_dir)
1912 # Best effort clean up. Failed to do so doesn't affect the outcome.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001913
1914
if __name__ == '__main__':
  # Script entry point: perform the one-time process setup below, then run
  # main() on the command-line arguments and exit with the value it returns.
  subprocess42.inhibit_os_error_reporting()
  # Ensure that we are always running with the correct encoding.
  fix_encoding.fix_encoding()
  # Tag the user agent registered with |net| with this script's name and
  # version.
  _user_agent = 'run_isolated.py/' + __version__
  net.set_user_agent(_user_agent)
  # Drop argv[0] (the script path); main() only receives the actual arguments.
  _exit_code = main(sys.argv[1:])
  sys.exit(_exit_code)