blob: b2cc3c7045750c8e01d4666edcd3e2c2f357ab8d [file] [log] [blame]
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001#!/usr/bin/env python
maruelea586f32016-04-05 11:11:33 -07002# Copyright 2012 The LUCI Authors. All rights reserved.
maruelf1f5e2a2016-05-25 17:10:39 -07003# Use of this source code is governed under the Apache License, Version 2.0
4# that can be found in the LICENSE file.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00005
nodir55be77b2016-05-03 09:39:57 -07006"""Runs a command with optional isolated input/output.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00007
Marc-Antoine Rueleed2f3a2019-03-14 00:00:40 +00008run_isolated takes care of setting up a temporary environment, running a
9command, and tearing it down.
nodir55be77b2016-05-03 09:39:57 -070010
Marc-Antoine Rueleed2f3a2019-03-14 00:00:40 +000011It handles downloading and uploading isolated files, mapping CIPD packages and
12reusing stateful named caches.
13
14The isolated files, CIPD packages and named caches are kept as a global LRU
15cache.
Marc-Antoine Ruel2283ad12014-02-09 11:14:57 -050016
Roberto Carrillo71ade6d2018-10-08 22:30:24 +000017Any ${EXECUTABLE_SUFFIX} on the command line or the environment variables passed
18with the --env option will be replaced with ".exe" string on Windows and "" on
19other platforms.
nodirbe642ff2016-06-09 15:51:51 -070020
Roberto Carrillo71ade6d2018-10-08 22:30:24 +000021Any ${ISOLATED_OUTDIR} on the command line or the environment variables passed
22with the --env option will be replaced by the location of a temporary directory
23upon execution of the command specified in the .isolated file. All content
24written to this directory will be uploaded upon termination and the .isolated
25file describing this directory will be printed to stdout.
bpastene447c1992016-06-20 15:21:47 -070026
Marc-Antoine Rueleed2f3a2019-03-14 00:00:40 +000027Any ${SWARMING_BOT_FILE} on the command line or the environment variables passed
28with the --env option will be replaced by the value of the --bot-file parameter.
29This file is used by a swarming bot to communicate state of the host to tasks.
30It is written to by the swarming bot's on_before_task() hook in the swarming
31server's custom bot_config.py.
32
33See
34https://chromium.googlesource.com/infra/luci/luci-py.git/+/master/appengine/swarming/doc/Magic-Values.md
35for all the variables.
36
37See
38https://chromium.googlesource.com/infra/luci/luci-py.git/+/master/appengine/swarming/swarming_bot/config/bot_config.py
39for more information about bot_config.py.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000040"""
41
Marc-Antoine Ruelf899c482019-10-10 23:32:06 +000042from __future__ import print_function
43
44__version__ = '1.0.1'
maruel@chromium.orgdedbf492013-09-12 20:42:11 +000045
aludwin7556e0c2016-10-26 08:46:10 -070046import argparse
maruel064c0a32016-04-05 11:47:15 -070047import base64
iannucci96fcccc2016-08-30 15:52:22 -070048import collections
vadimsh232f5a82017-01-20 19:23:44 -080049import contextlib
Ye Kuangfff1e502020-07-13 13:21:57 +000050import distutils
Sadaf Matinkhoo10743a62018-03-29 16:28:58 -040051import errno
aludwin7556e0c2016-10-26 08:46:10 -070052import json
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000053import logging
54import optparse
55import os
Takuto Ikuta5c59a842020-01-24 03:05:24 +000056import platform
Marc-Antoine Ruel8b11dbd2018-05-18 14:31:22 -040057import re
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000058import sys
59import tempfile
maruel064c0a32016-04-05 11:47:15 -070060import time
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000061
Marc-Antoine Ruel016c7602019-04-02 18:31:13 +000062from utils import tools
63tools.force_local_third_party()
vadimsh@chromium.orga4326472013-08-24 02:05:41 +000064
Marc-Antoine Ruel016c7602019-04-02 18:31:13 +000065# third_party/
66from depot_tools import fix_encoding
Takuto Ikuta6e2ff962019-10-29 12:35:27 +000067import six
Marc-Antoine Ruel016c7602019-04-02 18:31:13 +000068
69# pylint: disable=ungrouped-imports
Takuto Ikutad53d7bd2021-07-16 03:09:33 +000070import DEPS
Marc-Antoine Ruel016c7602019-04-02 18:31:13 +000071import auth
72import cipd
73import isolate_storage
74import isolateserver
75import local_caching
76from libs import luci_context
Vadim Shtayura6b555c12014-07-23 16:22:18 -070077from utils import file_path
maruel12e30012015-10-09 11:55:35 -070078from utils import fs
maruel064c0a32016-04-05 11:47:15 -070079from utils import large
Marc-Antoine Ruelf74cffe2015-07-15 15:21:34 -040080from utils import logging_utils
Ye Kuang2dd17442020-04-22 08:45:52 +000081from utils import net
Marc-Antoine Ruelcfb60852014-07-02 15:22:00 -040082from utils import on_error
Marc-Antoine Ruelc44f5722015-01-08 16:10:01 -050083from utils import subprocess42
maruel@chromium.orgdedbf492013-09-12 20:42:11 +000084
vadimsh@chromium.orga4326472013-08-24 02:05:41 +000085
# Placeholders recognized in the task command line and in --env values.
ISOLATED_OUTDIR_PARAMETER = '${ISOLATED_OUTDIR}'
EXECUTABLE_SUFFIX_PARAMETER = '${EXECUTABLE_SUFFIX}'
SWARMING_BOT_FILE_PARAMETER = '${SWARMING_BOT_FILE}'


# Name of the log file to use.
RUN_ISOLATED_LOG_FILE = 'run_isolated.log'


# Temporary directory names are kept as short as possible. The constraint comes
# from Windows, where paths are limited to 260 characters (MAX_PATH); deeply
# nested trees, e.g. recursive npm dependencies, reach that limit easily.
#
# For the same reason, `root_dir` should be as short as possible when starting
# the script.
# - ir: isolated_run
# - io: isolated_out
# - it: isolated_tmp
# - ic: isolated_client
ISOLATED_RUN_DIR = u'ir'
ISOLATED_OUT_DIR = u'io'
ISOLATED_TMP_DIR = u'it'
ISOLATED_CLIENT_DIR = u'ic'
_CAS_CLIENT_DIR = u'cc'
maruele2f2cb82016-07-13 14:41:03 -0700112
# TODO(tikuta): take these parameters from luci-config?
# The tag is updated by `./client/update_go_clients.sh`.
# Alternatively, take the revision from
# https://ci.chromium.org/p/infra-internal/g/infra-packagers/console
ISOLATED_PACKAGE = 'infra/tools/luci/isolated/${platform}'
_CAS_PACKAGE = 'infra/tools/luci/cas/${platform}'
_LUCI_GO_REVISION = DEPS.deps['luci-go']['packages'][0]['version']

# Must stay in sync with task_request.py.
CACHE_NAME_RE = re.compile(r'^[a-z0-9_]{1,4096}$')

_FREE_SPACE_BUFFER_FOR_CIPD_PACKAGES = 2 * 1024 ** 3
Marc-Antoine Ruel8b11dbd2018-05-18 14:31:22 -0400125
marueld928c862017-06-08 08:20:04 -0700126OUTLIVING_ZOMBIE_MSG = """\
127*** Swarming tried multiple times to delete the %s directory and failed ***
128*** Hard failing the task ***
129
130Swarming detected that your testing script ran an executable, which may have
131started a child executable, and the main script returned early, leaving the
132children executables playing around unguided.
133
134You don't want to leave children processes outliving the task on the Swarming
135bot, do you? The Swarming bot doesn't.
136
137How to fix?
138- For any process that starts children processes, make sure all children
139 processes terminated properly before each parent process exits. This is
140 especially important in very deep process trees.
141 - This must be done properly both in normal successful task and in case of
142 task failure. Cleanup is very important.
143- The Swarming bot sends a SIGTERM in case of timeout.
144 - You have %s seconds to comply after the signal was sent to the process
145 before the process is forcibly killed.
146- To achieve not leaking children processes in case of signals on timeout, you
147 MUST handle signals in each executable / python script and propagate them to
148 children processes.
149 - When your test script (python or binary) receives a signal like SIGTERM or
150 CTRL_BREAK_EVENT on Windows), send it to all children processes and wait for
151 them to terminate before quitting.
152
153See
Marc-Antoine Ruelc7243592018-05-24 17:04:04 -0400154https://chromium.googlesource.com/infra/luci/luci-py.git/+/master/appengine/swarming/doc/Bot.md#Graceful-termination_aka-the-SIGTERM-and-SIGKILL-dance
marueld928c862017-06-08 08:20:04 -0700155for more information.
156
157*** May the SIGKILL force be with you ***
158"""
159
160
# Hardcoded for now. Could be exposed as a flag once there is value in it.
# 3 weeks, in seconds.
MAX_AGE_SECS = 21 * 24 * 60 * 60

_CAS_KVS_CACHE_THRESHOLD = 5 * 1024 ** 3  # 5 GiB
166
# Bundle of everything needed to run one task. Field order is part of the
# interface since instances may be built positionally.
TaskData = collections.namedtuple(
    'TaskData',
    (
        # Command line to use, as a list of strings; independent of what was
        # specified in the isolated file.
        'command',
        # Directory, relative to the run directory, to start the command in.
        'relative_cwd',
        # Hash of the .isolated file to retrieve in order to recreate the tree
        # of files needed by the target executable. The command specified in
        # the .isolated is executed. Mutually exclusive with the command
        # argument.
        'isolated_hash',
        # isolateserver.Storage instance used to retrieve remote objects. It
        # holds a reference to an isolateserver.StorageApi, which does the
        # actual I/O.
        'storage',
        # isolateserver.LocalCache instance caching the retrieved objects so
        # they are not fetched constantly. Can be on-disk or in-memory.
        'isolate_cache',
        # Digest of the input root on RBE-CAS.
        'cas_digest',
        # Full CAS instance name.
        'cas_instance',
        # Paths, relative to root_dir, to put into the output isolated bundle
        # upon task completion (see link_outputs_to_outdir).
        'outputs',
        # Function (run_dir) => context manager that installs named caches
        # into |run_dir|.
        'install_named_caches',
        # When True, the temporary directory is deliberately leaked for later
        # examination.
        'leak_temp_dir',
        # Directory in which the temporary directory is created. A random
        # temporary directory is created if not specified.
        'root_dir',
        # The process is killed if it lasts more than this many seconds.
        'hard_timeout',
        # Seconds to wait between SIGTERM and SIGKILL.
        'grace_period',
        # Path to a file with bot state; substituted for ${SWARMING_BOT_FILE}
        # in the task command line.
        'bot_file',
        # Logical account to switch LUCI_CONTEXT into.
        'switch_to_account',
        # Context manager dir => CipdInfo, see install_client_and_packages.
        'install_packages_fn',
        # Use the go isolated client.
        'use_go_isolated',
        # Cache directory for the go `isolated` client.
        'go_cache_dir',
        # Parameters passed to the go `isolated` client.
        'go_cache_policies',
        # Cache directory for the `cas` client.
        'cas_cache_dir',
        # Parameters passed to the `cas` client.
        'cas_cache_policies',
        # Parameters for the kvs file used by the `cas` client.
        'cas_kvs',
        # Environment variables to set.
        'env',
        # Environment variables to mutate with relative directories.
        # Example: {"ENV_KEY": ['relative', 'paths', 'to', 'prepend']}
        'env_prefix',
        # Lowers the task process priority.
        'lower_priority',
        # subprocess42.Containment instance. Can be None.
        'containment',
        # Function that trims caches before cipd packages are installed and
        # isolated files are downloaded.
        'trim_caches_fn',
    ))
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -0500239
240
def _to_str(s):
  """Returns |s| as a str; str instances are returned untouched.

  Anything else is encoded as UTF-8.
  """
  if not isinstance(s, str):
    # UTF-8 is not strictly right, notably on Windows. In theory
    # sys.getfilesystemencoding() would select the proper 'ANSI code page'
    # there, but its very limited character set causes other problems.
    return s.encode('utf-8')
  return s
250
251
def _to_unicode(s):
  """Returns |s| as unicode, decoding it as UTF-8 when needed.

  Unicode instances and None are returned untouched.
  """
  if s is None or isinstance(s, six.text_type):
    return s
  return s.decode('utf-8')
257
258
def make_temp_dir(prefix, root_dir):
  """Creates a new unique temporary directory and returns its path.

  The directory name starts with |prefix| and is created via tempfile.mkdtemp()
  with dir=|root_dir|. The path is returned as unicode.
  """
  new_dir = tempfile.mkdtemp(prefix=prefix, dir=root_dir)
  return six.text_type(new_dir)
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +0000262
263
@contextlib.contextmanager
def set_luci_context_account(account, tmp_dir):
  """Context manager that makes |account| the default LUCI_CONTEXT account.

  Nothing is changed in any of these cases:
  - |account| is None or ''. This is what happens when run_isolated.py is
    called without the '--switch-to-account' flag; if it runs inside some
    LUCI_CONTEXT environment, the task simply inherits the account already
    set. This may happen when users invoke run_isolated.py explicitly from
    their code.
  - LUCI_CONTEXT-based auth is not in use.
  - |account| is already the default account.

  When the requested account is not defined in the context, the default
  account is removed, i.e. access becomes non-authenticated. This is what
  happens for Swarming tasks that don't use 'task' service accounts.

  Args:
    account: logical account ID to switch to; can be None or ''.
    tmp_dir: passed as _tmpdir to luci_context.write().
  """
  # The context is only read when a switch was actually requested.
  local_auth = luci_context.read('local_auth') if account else None

  # See LUCI_CONTEXT.md for the format of 'local_auth'.
  if not local_auth or local_auth.get('default_account_id') == account:
    # No switch requested, no LUCI_CONTEXT auth at all, or already set.
    yield
    return

  known_ids = set(a['id'] for a in local_auth.get('accounts') or [])
  if account not in known_ids:
    logging.warning(
        'Requested LUCI_CONTEXT account %r is not available (have only %r), '
        'disabling authentication', account, sorted(known_ids))
    local_auth.pop('default_account_id', None)
  else:
    logging.info('Switching default LUCI_CONTEXT account to %r', account)
    local_auth['default_account_id'] = account

  with luci_context.write(_tmpdir=tmp_dir, local_auth=local_auth):
    yield
310
311
def process_command(command, out_dir, bot_file):
  """Returns a copy of |command| with parameters replaced in every argument.

  Each argument goes through replace_parameters().

  Raises:
    ValueError if a parameter is requested in |command| but its value is not
      provided.
  """
  processed = []
  for arg in command:
    processed.append(replace_parameters(arg, out_dir, bot_file))
  return processed
320
321
def replace_parameters(arg, out_dir, bot_file):
  """Returns |arg| with the parameter tokens replaced by their values.

  - ${EXECUTABLE_SUFFIX} is always replaced.
  - ${ISOLATED_OUTDIR} is replaced by |out_dir|.
  - ${SWARMING_BOT_FILE} is replaced by |bot_file|; when |bot_file| is not
    set, a warning is logged and the token is left as-is.

  Raises:
    ValueError if ${ISOLATED_OUTDIR} is present in |arg| but |out_dir| is not
      provided.
  """
  arg = arg.replace(EXECUTABLE_SUFFIX_PARAMETER, cipd.EXECUTABLE_SUFFIX)
  has_path_param = False

  if ISOLATED_OUTDIR_PARAMETER in arg:
    if not out_dir:
      raise ValueError(
          'output directory is requested in command or env var, but not '
          'provided; please specify one')
    arg = arg.replace(ISOLATED_OUTDIR_PARAMETER, out_dir)
    has_path_param = True

  if SWARMING_BOT_FILE_PARAMETER in arg:
    if not bot_file:
      logging.warning('SWARMING_BOT_FILE_PARAMETER found in command or env '
                      'var, but no bot_file specified. Leaving parameter '
                      'unchanged.')
    else:
      arg = arg.replace(SWARMING_BOT_FILE_PARAMETER, bot_file)
      has_path_param = True

  if not has_path_param:
    return arg
  # Slashes are converted only when a path parameter was substituted, to cope
  # with arguments like '${ISOLATED_OUTDIR}/foo/bar'.
  return arg.replace('/', os.sep)
maruela9cfd6f2015-09-15 11:03:15 -0700351
352
def set_temp_dir(env, tmp_dir):
  """Sets the temp directory variables in the |env| dictionary to |tmp_dir|.

  |env| is modified in place.
  """
  tmp_dir = _to_str(tmp_dir)
  # pylint: disable=line-too-long
  # $TMPDIR is set on all platforms:
  # * python respects $TMPDIR, $TEMP, and $TMP in this order, regardless of
  #   platform.
  #   https://github.com/python/cpython/blob/2.7/Lib/tempfile.py#L155
  # * It is the POSIX standard envvar for the temp directory.
  #   http://pubs.opengroup.org/onlinepubs/9699919799/basedefs/V1_chap08.html
  # * mktemp on linux respects $TMPDIR.
  # * Chromium respects $TMPDIR on linux.
  #   https://cs.chromium.org/chromium/src/base/files/file_util_posix.cc?q=GetTempDir
  # * Go uses $TMPDIR.
  #   https://go.googlesource.com/go/+/go1.10.3/src/os/file_unix.go#307
  overrides = {'TMPDIR': tmp_dir}
  if sys.platform == 'win32':
    # * chromium's base utils uses GetTempPath().
    #   https://cs.chromium.org/chromium/src/base/files/file_util_win.cc?q=GetTempPath
    # * Go uses GetTempPath().
    # * GetTempPath() uses %TMP%, then %TEMP%, then other stuff. So %TMP% must
    #   be set.
    #   https://docs.microsoft.com/en-us/windows/desktop/api/fileapi/nf-fileapi-gettemppathw
    overrides['TMP'] = tmp_dir
    # https://blogs.msdn.microsoft.com/oldnewthing/20150417-00/?p=44213
    overrides['TEMP'] = tmp_dir
  elif sys.platform == 'darwin':
    # * Chromium uses a hack on macOS before calling into
    #   NSTemporaryDirectory().
    #   https://cs.chromium.org/chromium/src/base/files/file_util_mac.mm?q=GetTempDir
    #   https://developer.apple.com/documentation/foundation/1409211-nstemporarydirectory
    overrides['MAC_CHROMIUM_TMPDIR'] = tmp_dir
  env.update(overrides)
385 pass
386
Roberto Carrillo71ade6d2018-10-08 22:30:24 +0000387
def get_command_env(tmp_dir, cipd_info, run_dir, env, env_prefixes, out_dir,
                    bot_file):
  """Returns full OS environment to run a command in.

  Starts from a copy of os.environ, applies |env|, puts the directory with the
  cipd binary in front of PATH, exposes the CIPD_CACHE_DIR env var, writes the
  resolved cipd pins to a file exposed via
  ISOLATED_RESOLVED_PACKAGE_VERSIONS_FILE, installs all env_prefixes and
  finally sets up the temp directory variables.

  Args:
    tmp_dir: temp directory.
    cipd_info: CipdInfo object if cipd client is used, None if not.
    run_dir: The root directory the isolated tree is mapped in.
    env: environment variables to use; a variable with an empty value is
        removed from the environment.
    env_prefixes: {"ENV_KEY": ['cwd', 'relative', 'paths', 'to', 'prepend']}
    out_dir: Isolated output directory. Required to be != None if any of the
        env vars contain ISOLATED_OUTDIR_PARAMETER.
    bot_file: Required to be != None if any of the env vars contain
        SWARMING_BOT_FILE_PARAMETER.

  Raises:
    ValueError if an env var contains ISOLATED_OUTDIR_PARAMETER but |out_dir|
      is not provided.
  """
  out = os.environ.copy()
  for k, v in env.items():
    if not v:
      out.pop(k, None)
    else:
      out[k] = replace_parameters(v, out_dir, bot_file)

  if cipd_info:
    bin_dir = _to_str(os.path.dirname(cipd_info.client.binary_path))
    # PATH can be missing at this point: the inherited environment may not
    # define it, or |env| may have removed it by passing an empty value. Don't
    # crash with a KeyError in that case; PATH is then just the cipd directory.
    if 'PATH' in out:
      out['PATH'] = '%s%s%s' % (bin_dir, os.pathsep, out['PATH'])
    else:
      out['PATH'] = bin_dir
    out['CIPD_CACHE_DIR'] = _to_str(cipd_info.cache_dir)
    cipd_info_path = os.path.join(tmp_dir, 'cipd_info.json')
    with open(cipd_info_path, 'w') as f:
      json.dump(cipd_info.pins, f)
    out['ISOLATED_RESOLVED_PACKAGE_VERSIONS_FILE'] = cipd_info_path

  for key, paths in env_prefixes.items():
    assert isinstance(paths, list), paths
    paths = [os.path.normpath(os.path.join(run_dir, p)) for p in paths]
    # The prefixes go in front of the current value, if any.
    cur = out.get(key)
    if cur:
      paths.append(cur)
    out[key] = _to_str(os.path.pathsep.join(paths))

  set_temp_dir(out, tmp_dir)
  return out
vadimsh232f5a82017-01-20 19:23:44 -0800432
433
def run_command(
    command, cwd, env, hard_timeout, grace_period, lower_priority, containment):
  """Runs the command and waits for it, enforcing the timeouts.

  On hard timeout or on a stop signal, the child is sent SIGTERM and is given
  |grace_period| seconds to exit before being killed.

  Args:
    command: command line to run, as a list.
    cwd: directory to start the command in.
    env: environment variables for the child process.
    hard_timeout: maximum number of seconds the command may run; a falsy value
        means no limit.
    grace_period: number of seconds to wait between SIGTERM and SIGKILL; a
        falsy value means waiting without limit.
    lower_priority: passed through to subprocess42.Popen.
    containment: passed through to subprocess42.Popen.

  Returns:
    tuple(process exit code, bool if had a hard timeout)
  """
  logging.info(
      'run_command(%s, %s, %s, %s, %s, %s)',
      command, cwd, hard_timeout, grace_period, lower_priority, containment)

  exit_code = None
  had_hard_timeout = False
  with tools.Profiler('RunTest'):
    proc = None
    # Non-empty once a stop signal was received.
    signal_seen = []
    try:
      # TODO(maruel): This code is imperfect. It doesn't handle well signals
      # during the download phase and there's short windows were things can go
      # wrong.
      def on_stop_signal(signum, _frame):
        # Only the first signal counts, and only once the child was started.
        if not proc or signal_seen:
          return
        logging.info('Received signal %d', signum)
        signal_seen.append(True)
        # Interrupts the proc.wait() call below.
        raise subprocess42.TimeoutExpired(command, None)

      proc = subprocess42.Popen(
          command, cwd=cwd, env=env, detached=True, close_fds=True,
          lower_priority=lower_priority, containment=containment)
      with subprocess42.set_signal_handler(
          subprocess42.STOP_SIGNALS, on_stop_signal):
        try:
          exit_code = proc.wait(hard_timeout or None)
        except subprocess42.TimeoutExpired:
          # Raised either by the wait timing out or by on_stop_signal().
          if not signal_seen:
            logging.warning('Hard timeout')
            had_hard_timeout = True
          logging.warning('Sending SIGTERM')
          proc.terminate()

      kill_sent = False
      if exit_code is None:
        # Signals are ignored during the grace period, so that the child
        # process is forcibly given the whole grace period.
        def ignore_signal(*_):
          return None

        with subprocess42.set_signal_handler(
            subprocess42.STOP_SIGNALS, ignore_signal):
          try:
            exit_code = proc.wait(grace_period or None)
          except subprocess42.TimeoutExpired:
            # Time to kill for real. The user can tell these states apart:
            # - signal but process exited within grace period,
            #   hard_timed_out will be set but the process exit code will be
            #   script provided.
            # - processed exited late, exit code will be -9 on posix.
            logging.warning('Grace exhausted; sending SIGKILL')
            proc.kill()
            kill_sent = True
        logging.info('Waiting for process exit')
        exit_code = proc.wait()

      if not kill_sent:
        # The process group / job object may be dangling; give it a poke since
        # it wasn't killed already.
        proc.kill()
    except OSError as e:
      # This is not considered to be an internal error. The executable simply
      # does not exist.
      sys.stderr.write(
          '<The executable does not exist, a dependent library is missing or '
          'the command line is too long>\n'
          '<Check for missing .so/.dll in the .isolate or GN file or length of '
          'command line args>\n'
          '<Command: %s>\n'
          '<Exception: %s>\n' % (command, e))
      if os.environ.get('SWARMING_TASK_ID'):
        # Additional hint when running as a swarming task.
        sys.stderr.write(
            '<See the task\'s page for commands to help diagnose this issue '
            'by reproducing the task locally>\n')
      exit_code = 1
  logging.info(
      'Command finished with exit code %d (%s)',
      exit_code, hex(0xffffffff & exit_code))
  return exit_code, had_hard_timeout
maruela9cfd6f2015-09-15 11:03:15 -0700518
519
def _run_go_cmd_and_wait(cmd, tmp_dir):
  """
  Runs an external Go command, `isolated` or `cas`, and waits for completion.

  While this is a generic function to launch a subprocess, it has logic that
  is specific to Go `isolated` and `cas` for waiting and logging.

  Args:
    cmd: command line to run, as a list of strings.
    tmp_dir: directory the temp dir environment variables of the subprocess
        are pointed to.

  Returns:
    The subprocess object

  Raises:
    subprocess42.CalledProcessError if the command exits with a non-zero code.
    ValueError if the command had to be stopped after the maximum timeout.
  """
  cmd_str = ' '.join(cmd)
  check_period_sec = 30
  max_checks = 100
  try:
    env = os.environ.copy()
    set_temp_dir(env, tmp_dir)
    proc = subprocess42.Popen(cmd, env=env)

    # max timeout = max_checks * check_period_sec = 50 minutes
    for attempt in range(1, max_checks + 1):
      try:
        retcode = proc.wait(check_period_sec)
      except subprocess42.TimeoutExpired:
        # The periodic output is to prevent I/O timeout error during setup.
        elapsed_sec = attempt * check_period_sec
        print('still running (after %d seconds)' % elapsed_sec)
        continue
      if retcode != 0:
        raise subprocess42.CalledProcessError(retcode, cmd=cmd_str)
      return proc

    # Still running after all the checks: stop the process, gently at first.
    proc.terminate()
    try:
      proc.wait(check_period_sec)
    except subprocess42.TimeoutExpired:
      logging.exception(
          "failed to terminate? timeout happened after %d seconds",
          check_period_sec)
      proc.kill()
    proc.wait()
    # Raise unconditionally, because |proc| was forcefully terminated.
    raise ValueError("timedout after %d seconds (cmd=%s)" %
                     (check_period_sec * max_checks, cmd_str))
  except Exception:
    logging.exception('Failed to run Go cmd %s', cmd_str)
    raise
Ye Kuangc0cf9ca2020-07-16 08:56:51 +0000569
570
def _fetch_and_map_with_cas(cas_client, digest, instance, output_dir, cache_dir,
                            policies, kvs_dir, tmp_dir):
  """
  Fetches a CAS tree using cas client, create the tree and returns download
  stats.

  When the download fails and |kvs_dir| is set, the kvs cache directory is
  removed and the download is retried once.

  Args:
    cas_client: path to the `cas` client executable.
    digest: digest of the tree to download.
    instance: CAS instance name.
    output_dir: directory the tree is created in.
    cache_dir: cache directory for the `cas` client.
    policies: cache policies; max_cache_size and min_free_space are used.
    kvs_dir: directory of the kvs cache passed to the client; can be empty.
    tmp_dir: temp directory for the `cas` subprocess.

  Returns:
    dict with the 'duration' in seconds, and the 'items_cold' and 'items_hot'
    values reported by the client.
  """
  start = time.time()
  result_json_handle, result_json_path = tempfile.mkstemp(
      prefix=u'fetch-and-map-result-', suffix=u'.json')
  # Only the path is needed; the client writes the file itself.
  os.close(result_json_handle)

  # Everything that can fail from here on is inside the try block, so the
  # result file is always removed.
  try:
    cmd = [
        cas_client,
        'download',
        '-digest',
        digest,
        '-cas-instance',
        instance,
        # flags for cache.
        '-cache-dir',
        cache_dir,
        '-cache-max-size',
        str(policies.max_cache_size),
        '-cache-min-free-space',
        str(policies.min_free_space),
        # flags for output.
        '-dir',
        output_dir,
        '-dump-stats-json',
        result_json_path,
        '-log-level',
        'info',
    ]

    if kvs_dir:
      cmd.extend(['-kvs-dir', kvs_dir])

    try:
      _run_go_cmd_and_wait(cmd, tmp_dir)
    except subprocess42.CalledProcessError as ex:
      if not kvs_dir:
        raise
      # Retry once without the kvs cache, in case it caused the failure.
      logging.exception('Failed to run cas, removing kvs cache dir and retry.')
      on_error.report("Failed to run cas %s" % ex)
      file_path.rmtree(kvs_dir)
      _run_go_cmd_and_wait(cmd, tmp_dir)

    with open(result_json_path) as json_file:
      result_json = json.load(json_file)

    return {
        'duration': time.time() - start,
        'items_cold': result_json['items_cold'],
        'items_hot': result_json['items_hot'],
    }
  finally:
    fs.remove(result_json_path)
Junji Watanabe4b890ef2020-09-16 01:43:27 +0000632
633
def _fetch_and_map_with_go_isolated(isolated_hash, storage, outdir,
                                    go_cache_dir, policies, isolated_client,
                                    tmp_dir):
  """Downloads an isolated tree into |outdir| with the Go isolated client.

  The client binary is invoked with its 'download' subcommand and asked to
  dump its statistics into a temporary JSON file, which is read back and then
  always deleted.

  Arguments:
  - isolated_hash: value passed to the client's -isolated flag.
  - storage: object whose server_ref provides the server url and namespace.
  - outdir: directory passed as -output-dir.
  - go_cache_dir: directory passed as -cache-dir.
  - policies: object providing max_items, max_cache_size and min_free_space.
  - isolated_client: path to the client executable.
  - tmp_dir: forwarded to _run_go_cmd_and_wait().

  Returns:
    dict with 'duration' (seconds spent in this function) plus the
    'items_cold', 'items_hot', 'initial_number_items' and 'initial_size'
    values reported by the client.
  """
  began = time.time()
  ref = storage.server_ref
  stats_fd, stats_path = tempfile.mkstemp(
      prefix=u'fetch-and-map-result-', suffix=u'.json')
  # Only the path is needed; the client writes the file itself.
  os.close(stats_fd)
  try:
    source_flags = [
        '-isolate-server', ref.url,
        '-namespace', ref.namespace,
        '-isolated', isolated_hash,
    ]
    cache_flags = [
        '-cache-dir', go_cache_dir,
        '-cache-max-items', str(policies.max_items),
        '-cache-max-size', str(policies.max_cache_size),
        '-cache-min-free-space', str(policies.min_free_space),
    ]
    output_flags = [
        '-output-dir', outdir,
        '-fetch-and-map-result-json', stats_path,
    ]
    _run_go_cmd_and_wait(
        [isolated_client, 'download'] + source_flags + cache_flags +
        output_flags, tmp_dir)

    with open(stats_path) as stats_file:
      reported = json.load(stats_file)

    stats = {'duration': time.time() - began}
    for key in ('items_cold', 'items_hot', 'initial_number_items',
                'initial_size'):
      stats[key] = reported[key]
    return stats
  finally:
    fs.remove(stats_path)
687
688
689# TODO(crbug.com/932396): remove this function.
def fetch_and_map(isolated_hash, storage, cache, outdir):
  """Fetches an isolated tree into |outdir| and returns download stats.

  The work is delegated to isolateserver.fetch_isolated() with symlinks
  disabled.

  Returns:
    dict with 'duration' in seconds, plus 'items_cold' and 'items_hot', each a
    base64 text encoding of large.pack() applied to a sorted list. Cold items
    are cache.added; hot items are the entries of cache.used left over once
    the entries of cache.added are subtracted (multiset difference).
  """

  def encode(values):
    return base64.b64encode(large.pack(sorted(values))).decode()

  began = time.time()
  isolateserver.fetch_isolated(
      isolated_hash=isolated_hash,
      storage=storage,
      cache=cache,
      outdir=outdir,
      use_symlinks=False)
  used = collections.Counter(cache.used)
  added = collections.Counter(cache.added)
  reused = (used - added).elements()
  elapsed = time.time() - began
  return {
      'duration': elapsed,
      'items_cold': encode(cache.added),
      'items_hot': encode(reused),
  }
706
707
def link_outputs_to_outdir(run_dir, out_dir, outputs):
  """Makes every named output available under out_dir so it can be uploaded.

  Does nothing when |outputs| is empty. Otherwise the needed directories are
  created in out_dir and each output is copied (or hardlinked) from run_dir
  through copy_recursively().

  NOTE(review): an earlier version of this docstring said an error is raised
  when the file already exists in out_dir; copy_recursively() logs OSError
  instead of raising, so confirm before relying on that.
  """
  if outputs:
    isolateserver.create_directories(out_dir, outputs)
    for rel_path in outputs:
      source = os.path.join(run_dir, rel_path)
      target = os.path.join(out_dir, rel_path)
      copy_recursively(source, target)
718
719
def copy_recursively(src, dst):
  """Efficiently copies a file or directory from src to dst.

  `src` may be a file, directory, or a symlink to a file or directory.
  All symlinks are replaced with their targets, so the resulting
  directory structure under dst will never have any symlinks.

  To increase speed, copy_recursively links individual files into the
  (newly created) directory structure using
  file_path.HARDLINK_WITH_FALLBACK, unlike Python's shutil.copytree().

  Nothing is raised for a missing path, a broken symlink or a symlink cycle:
  those are logged and the entry is skipped. Any OSError raised while copying
  is logged as well and swallowed.

  Arguments:
  - src: path to copy from.
  - dst: path to create.
  """
  orig_src = src
  try:
    # Replace symlinks with their final target. Every path already visited is
    # remembered so that a cycle (a -> b -> a), where resolution can keep
    # handing back a path that is still a symlink, ends the loop instead of
    # spinning forever.
    visited = set()
    while fs.islink(src):
      if src in visited:
        logging.warning('Symlink cycle detected while resolving %s', orig_src)
        return
      visited.add(src)
      res = fs.readlink(src)
      src = os.path.realpath(os.path.join(os.path.dirname(src), res))

    if not fs.exists(src):
      logging.warning('Path %s does not exist or %s is a broken symlink', src,
                      orig_src)
      return

    if fs.isfile(src):
      file_path.link_file(dst, src, file_path.HARDLINK_WITH_FALLBACK)
      return

    if not fs.exists(dst):
      os.makedirs(dst)

    for child in fs.listdir(src):
      copy_recursively(os.path.join(src, child), os.path.join(dst, child))

  except OSError as e:
    if e.errno == errno.ENOENT:
      logging.warning('Path %s does not exist or %s is a broken symlink',
                      src, orig_src)
    else:
      logging.info("Couldn't collect output file %s: %s", src, e)
aludwin0a8e17d2016-10-27 15:57:39 -0700760
761
def _upload_with_py(storage, out_dir):
  """Archives |out_dir| to |storage| with the Python isolateserver client.

  Returns:
    tuple(isolated, cold, hot)
    - isolated: first value of the results returned by
      isolateserver.archive_files_to_storage().
    - cold, hot: base64 text encoding of large.pack() applied to the sorted
      `size` attributes of the cold and hot items respectively.

  Raises:
    isolateserver.Aborted: re-raised after a note is written to stderr.
  """

  def encode_sizes(items):
    sizes = [item.size for item in items]
    sizes.sort()
    return base64.b64encode(large.pack(sizes)).decode()

  try:
    archived, cold_items, hot_items = isolateserver.archive_files_to_storage(
        storage, [out_dir], None, verify_push=True)

    first_isolated = list(archived.values())[0]
    return first_isolated, encode_sizes(cold_items), encode_sizes(hot_items)

  except isolateserver.Aborted:
    # This happens when a signal SIGTERM was received while uploading data.
    # There are 2 causes:
    # - The task was too slow and was about to be killed anyway due to
    #   exceeding the hard timeout.
    # - The amount of data uploaded back is very large and took too much
    #   time to archive.
    sys.stderr.write('Received SIGTERM while uploading')
    # Re-raise, so it will be treated as an internal failure.
    raise
787
788
def upload_out_dir(storage, out_dir):
  """Uploads the content of |out_dir|, if it is a non-empty directory.

  A .isolated file is generated out of the directory as part of the upload.

  Returns:
    tuple(outputs_ref, stats)
    - outputs_ref: None when nothing was uploaded, otherwise a dict with the
      keys 'isolated', 'isolatedserver' and 'namespace' referring to the
      archived results.
    - stats: dict with 'duration' in seconds, 'items_cold' and 'items_hot';
      the last two are empty strings when nothing was uploaded.
  """
  began = time.time()
  outputs_ref = None
  cold, hot = '', ''

  # Only archive when files were actually written in the directory.
  has_content = fs.isdir(out_dir) and fs.listdir(out_dir)
  if has_content:
    with tools.Profiler('ArchiveOutput'):
      isolated, cold, hot = _upload_with_py(storage, out_dir)
      outputs_ref = {
          'isolated': isolated,
          'isolatedserver': storage.server_ref.url,
          'namespace': storage.server_ref.namespace,
      }

  elapsed = time.time() - began
  return outputs_ref, {
      'duration': elapsed,
      'items_cold': cold,
      'items_hot': hot,
  }
maruela9cfd6f2015-09-15 11:03:15 -0700820
821
def upload_outdir_with_cas(cas_client, cas_instance, outdir, tmp_dir):
  """Archives |outdir| with the cas client's 'archive' subcommand.

  The client is asked to dump the resulting digest and its statistics into two
  temporary files, which are read back and then always deleted.

  Arguments:
  - cas_client: path to the cas client executable.
  - cas_instance: value passed to the -cas-instance flag.
  - outdir: directory to archive.
  - tmp_dir: forwarded to _run_go_cmd_and_wait().

  Returns:
    tuple(root_digest, stats)
    - root_digest: dict with 'cas_instance' and a 'digest' dict holding the
      'hash' and integer 'size_bytes' parsed from the '<hash>/<size>' text
      written by the client.
    - stats: the client's stats JSON with a 'duration' entry added (seconds
      from just before the client was started).
  """
  digest_fd, digest_path = tempfile.mkstemp(
      prefix=u'cas-digest', suffix=u'.txt')
  os.close(digest_fd)
  stats_fd, stats_json_path = tempfile.mkstemp(
      prefix=u'upload-stats', suffix=u'.json')
  os.close(stats_fd)

  try:
    archive_cmd = [cas_client, 'archive']
    archive_cmd += ['-cas-instance', cas_instance]
    # Format: <working directory>:<relative path to dir>
    archive_cmd += ['-paths', outdir + ':']
    # output
    archive_cmd += ['-dump-digest', digest_path]
    archive_cmd += ['-dump-stats-json', stats_json_path]

    began = time.time()

    _run_go_cmd_and_wait(archive_cmd, tmp_dir)

    with open(digest_path) as digest_file:
      digest_hash, digest_size = digest_file.read().split('/')
    cas_output_root = {
        'cas_instance': cas_instance,
        'digest': {
            'hash': digest_hash,
            'size_bytes': int(digest_size)
        }
    }
    with open(stats_json_path) as stats_file:
      stats = json.load(stats_file)

    stats['duration'] = time.time() - began

    return cas_output_root, stats
  finally:
    fs.remove(digest_path)
    fs.remove(stats_json_path)
876
877
def map_and_run(data, constant_run_path):
  """Runs a command with optional isolated input/output.

  Sets up the run, output, temporary and client directories under
  data.root_dir, installs CIPD packages, downloads the inputs (isolated or
  CAS), runs the command, uploads the outputs and finally removes the
  directories unless data.leak_temp_dir is set.

  Arguments:
  - data: TaskData instance.
  - constant_run_path: when true (and data.root_dir is set), the run
        directory is the fixed path <root_dir>/ISOLATED_RUN_DIR, which is
        deleted and recreated; otherwise a fresh directory is made with
        make_temp_dir().

  Returns metadata about the result: a dict holding 'duration', 'exit_code',
  'had_hard_timeout', 'internal_failure' (None when no internal error
  happened), 'stats', 'outputs_ref', 'cas_output_root' and 'version', plus
  'cipd_pins' when CIPD packages were installed.
  """

  if data.isolate_cache:
    download_stats = {
        #'duration': 0.,
        'initial_number_items': len(data.isolate_cache),
        'initial_size': data.isolate_cache.total_size,
        #'items_cold': '<large.pack()>',
        #'items_hot': '<large.pack()>',
    }
  else:
    # TODO(tikuta): take stats from state.json in this case too.
    download_stats = {}

  result = {
      'duration': None,
      'exit_code': None,
      'had_hard_timeout': False,
      'internal_failure': 'run_isolated did not complete properly',
      'stats': {
          'trim_caches': {
              'duration': 0,
          },
          #'cipd': {
          #  'duration': 0.,
          #  'get_client_duration': 0.,
          #},
          'isolated': {
              'download': download_stats,
              #'upload': {
              #  'duration': 0.,
              #  'items_cold': '<large.pack()>',
              #  'items_hot': '<large.pack()>',
              #},
          },
          'named_caches': {
              'install': {
                  'duration': 0,
              },
              'uninstall': {
                  'duration': 0,
              },
          },
          'cleanup': {
              'duration': 0,
          }
      },
      #'cipd_pins': {
      #  'packages': [
      #    {'package_name': ..., 'version': ..., 'path': ...},
      #    ...
      #  ],
      #  'client_package': {'package_name': ..., 'version': ...},
      #},
      'outputs_ref': None,
      'cas_output_root': None,
      'version': 5,
  }

  assert os.path.isabs(data.root_dir), ("data.root_dir is not abs path: %s" %
                                        data.root_dir)
  file_path.ensure_tree(data.root_dir, 0o700)

  # See comment for these constants.
  # TODO(maruel): This is not obvious. Change this to become an error once we
  # make the constant_run_path an exposed flag.
  if constant_run_path and data.root_dir:
    run_dir = os.path.join(data.root_dir, ISOLATED_RUN_DIR)
    if os.path.isdir(run_dir):
      file_path.rmtree(run_dir)
    os.mkdir(run_dir, 0o700)
  else:
    run_dir = make_temp_dir(ISOLATED_RUN_DIR, data.root_dir)

  # True if CAS is used for download/upload files.
  use_cas = bool(data.cas_digest)

  # storage should be normally set but don't crash if it is not. This can happen
  # as Swarming task can run without an isolate server.
  out_dir = None
  if data.storage or use_cas:
    out_dir = make_temp_dir(ISOLATED_OUT_DIR, data.root_dir)
  tmp_dir = make_temp_dir(ISOLATED_TMP_DIR, data.root_dir)
  isolated_client_dir = make_temp_dir(ISOLATED_CLIENT_DIR, data.root_dir)
  cwd = run_dir
  if data.relative_cwd:
    cwd = os.path.normpath(os.path.join(cwd, data.relative_cwd))
  command = data.command
  go_isolated_client = None
  if data.use_go_isolated:
    go_isolated_client = os.path.join(isolated_client_dir,
                                      'isolated' + cipd.EXECUTABLE_SUFFIX)

  cas_client = None
  cas_client_dir = make_temp_dir(_CAS_CLIENT_DIR, data.root_dir)
  if use_cas:
    cas_client = os.path.join(cas_client_dir, 'cas' + cipd.EXECUTABLE_SUFFIX)

  data.trim_caches_fn(result['stats']['trim_caches'])

  try:
    with data.install_packages_fn(run_dir, isolated_client_dir,
                                  cas_client_dir) as cipd_info:
      if cipd_info:
        result['stats']['cipd'] = cipd_info.stats
        result['cipd_pins'] = cipd_info.pins

      isolated_stats = result['stats'].setdefault('isolated', {})
      if data.isolated_hash:
        if data.use_go_isolated:
          stats = _fetch_and_map_with_go_isolated(
              isolated_hash=data.isolated_hash,
              storage=data.storage,
              outdir=run_dir,
              go_cache_dir=data.go_cache_dir,
              policies=data.go_cache_policies,
              isolated_client=go_isolated_client,
              tmp_dir=tmp_dir)
        else:
          stats = fetch_and_map(
              isolated_hash=data.isolated_hash,
              storage=data.storage,
              cache=data.isolate_cache,
              outdir=run_dir)
        isolated_stats['download'].update(stats)

      elif data.cas_digest:
        stats = _fetch_and_map_with_cas(
            cas_client=cas_client,
            digest=data.cas_digest,
            instance=data.cas_instance,
            output_dir=run_dir,
            cache_dir=data.cas_cache_dir,
            policies=data.cas_cache_policies,
            kvs_dir=data.cas_kvs,
            tmp_dir=tmp_dir)
        isolated_stats['download'].update(stats)

      if not command:
        # Handle this as a task failure, not an internal failure.
        sys.stderr.write(
            '<No command was specified!>\n'
            '<Please secify a command when triggering your Swarming task>\n')
        result['exit_code'] = 1
        return result

      # Handle this as a task failure, not an internal failure. This is a
      # 'last chance' way to gate against directory escape. The comparison is
      # done against run_dir plus a trailing separator: a plain string prefix
      # test would also accept a sibling directory such as '<run_dir>x'.
      if cwd != run_dir and not cwd.startswith(os.path.join(run_dir, '')):
        sys.stderr.write('<Relative CWD is outside of run directory!>\n')
        result['exit_code'] = 1
        return result

      if not os.path.isdir(cwd):
        # Accepts relative_cwd that does not exist.
        os.makedirs(cwd, 0o700)

      # If we have an explicit list of files to return, make sure their
      # directories exist now.
      if data.storage and data.outputs:
        isolateserver.create_directories(run_dir, data.outputs)

      with data.install_named_caches(run_dir, result['stats']['named_caches']):
        sys.stdout.flush()
        start = time.time()
        try:
          # Need to switch the default account before 'get_command_env' call,
          # so it can grab correct value of LUCI_CONTEXT env var.
          with set_luci_context_account(data.switch_to_account, tmp_dir):
            env = get_command_env(
                tmp_dir, cipd_info, run_dir, data.env, data.env_prefix, out_dir,
                data.bot_file)
            command = tools.find_executable(command, env)
            command = process_command(command, out_dir, data.bot_file)
            file_path.ensure_command_has_abs_path(command, cwd)

            result['exit_code'], result['had_hard_timeout'] = run_command(
                command, cwd, env, data.hard_timeout, data.grace_period,
                data.lower_priority, data.containment)
        finally:
          result['duration'] = max(time.time() - start, 0)

      if out_dir:
        # Try to link files to the output directory, if specified.
        link_outputs_to_outdir(run_dir, out_dir, data.outputs)
        isolated_stats = result['stats'].setdefault('isolated', {})
        if use_cas:
          result['cas_output_root'], isolated_stats['upload'] = (
              upload_outdir_with_cas(cas_client, data.cas_instance, out_dir,
                                     tmp_dir))
        else:
          # This could use |go_isolated_client|, so make sure it runs when the
          # CIPD package still exists.
          result['outputs_ref'], isolated_stats['upload'] = (
              upload_out_dir(data.storage, out_dir))
    # We successfully ran the command, set internal_failure back to
    # None (even if the command failed, it's not an internal error).
    result['internal_failure'] = None
  except Exception as e:
    # An internal error occurred. Report accordingly so the swarming task will
    # be retried automatically.
    logging.exception('internal failure: %s', e)
    result['internal_failure'] = str(e)
    on_error.report(None)

  # Clean up
  finally:
    try:
      cleanup_start = time.time()
      success = True
      if data.leak_temp_dir:
        logging.warning(
            'Deliberately leaking %s for later examination', run_dir)
      else:
        # On Windows the rmtree(run_dir) call below has a synchronization
        # effect: it finishes only when all task child processes terminate
        # (since a running process locks *.exe file).
        dirs_to_remove = [run_dir, tmp_dir, isolated_client_dir, cas_client_dir]
        if out_dir:
          dirs_to_remove.append(out_dir)
        for directory in dirs_to_remove:
          if not fs.isdir(directory):
            continue
          # Tracks this directory only, so that the diagnostics below are not
          # repeated for directories removed fine after an earlier failure.
          removed = True
          rm_start = time.time()
          try:
            file_path.rmtree(directory)
          except OSError as e:
            logging.error('rmtree(%r) failed: %s', directory, e)
            removed = False
            success = False
          finally:
            logging.info('Cleanup: rmtree(%r) took %d seconds', directory,
                         time.time() - rm_start)
          if not removed:
            sys.stderr.write(
                OUTLIVING_ZOMBIE_MSG % (directory, data.grace_period))
            # Dump the process list to help find what still holds the files.
            if sys.platform == 'win32':
              subprocess42.check_call(['tasklist.exe', '/V'], stdout=sys.stderr)
            else:
              subprocess42.check_call(['ps', 'axu'], stdout=sys.stderr)
            if result['exit_code'] == 0:
              result['exit_code'] = 1

      if not success and result['exit_code'] == 0:
        result['exit_code'] = 1
    except Exception as e:
      # Swallow any exception in the main finally clause.
      if out_dir:
        logging.exception('Leaking out_dir %s: %s', out_dir, e)
      result['internal_failure'] = str(e)
      on_error.report(None)
    finally:
      cleanup_duration = time.time() - cleanup_start
      result['stats']['cleanup']['duration'] = cleanup_duration
      logging.info('Cleanup: removing directories took %d seconds',
                   cleanup_duration)
  return result
Marc-Antoine Ruel2283ad12014-02-09 11:14:57 -05001145
1146
def run_tha_test(data, result_json):
  """Runs the task through map_and_run() and reports its metadata.

  When |result_json| is set, a placeholder result is written to it before
  anything runs, and it is overwritten with the real result afterwards. When
  it is not set and outputs were archived, a reference to them is printed to
  stdout between [run_isolated_out_hack] markers.

  Arguments:
  - data: TaskData instance.
  - result_json: File path to dump result metadata into. If set, the process
        exit code is always 0 unless an internal error occurred.

  Returns:
    Process exit code that should be used.
  """
  if result_json:
    # Write a json output file right away in case we get killed.
    placeholder = {
        'exit_code': None,
        'had_hard_timeout': False,
        'internal_failure': 'Was terminated before completion',
        'outputs_ref': None,
        'cas_output_root': None,
        'version': 5,
    }
    tools.write_json(result_json, placeholder, dense=True)

  # run_isolated exit code. Depends on if result_json is used or not.
  result = map_and_run(data, True)
  logging.info('Result:\n%s', tools.format_json(result, dense=True))

  internal_error_code = 1 if result['internal_failure'] else 0

  if result_json:
    # We've found tests to delete 'work' when quitting, causing an exception
    # here. Try to recreate the directory if necessary.
    file_path.ensure_tree(os.path.dirname(result_json))
    tools.write_json(result_json, result, dense=True)
    # Only return 1 if there was an internal error.
    return internal_error_code

  # Marshall into old-style inline output.
  outputs_ref = result['outputs_ref']
  if outputs_ref:
    # pylint: disable=unsubscriptable-object
    inline_ref = {
        'hash': outputs_ref['isolated'],
        'namespace': outputs_ref['namespace'],
        'storage': outputs_ref['isolatedserver'],
    }
    sys.stdout.flush()
    print('[run_isolated_out_hack]%s[/run_isolated_out_hack]' %
          tools.format_json(inline_ref, dense=True))
    sys.stdout.flush()
  return result['exit_code'] or internal_error_code
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001203
1204
iannuccib58d10d2017-03-18 02:00:25 -07001205# Yielded by 'install_client_and_packages'.
CipdInfo = collections.namedtuple(
    'CipdInfo',
    (
        # cipd.CipdClient object
        'client',
        # absolute path to bot-global cipd tag and instance cache
        'cache_dir',
        # dict with stats to return to the server
        'stats',
        # dict with installed cipd pins to return to the server
        'pins',
    ))
1212
1213
@contextlib.contextmanager
def noop_install_packages(_run_dir, _isolated_dir, _cas_dir):
  """Stand-in for 'install_client_and_packages' when cipd is disabled.

  Ignores all its arguments and yields None in place of a CipdInfo.
  """
  yield
1218
1219
def _install_packages(run_dir, cipd_cache_dir, client, packages):
  """Installs |packages| through client.ensure() and returns their pins.

  Packages are grouped by install subdirectory before the single ensure()
  call; the returned pins are then put back in the order of |packages|.

  Args:
    run_dir (str): root of installation.
    cipd_cache_dir (str): the directory to use for the cipd package cache.
    client (CipdClient): the cipd client to use
    packages: packages to install, list [(path, package_name, version), ...].

  Returns: list of pinned packages, one per entry of |packages| and in the
    same order. Looks like [
    {
      'path': 'subdirectory',
      'package_name': 'resolved/package/name',
      'version': 'deadbeef...',
    },
    ...
  ]
  """
  package_pins = [None] * len(packages)

  # Maps subdir -> [(name, version, index in |packages|), ...].
  by_path = collections.defaultdict(list)
  for index, (path, name, version) in enumerate(packages):
    # cipd deals with 'root' as ''
    subdir = '' if path == '.' else path
    by_path[subdir].append((name, version, index))

  wanted = {}
  for subdir, entries in by_path.items():
    wanted[subdir] = [(name, version) for name, version, _ in entries]

  pins = client.ensure(run_dir, wanted, cache_dir=cipd_cache_dir)

  for subdir in sorted(pins):
    requested = by_path[subdir]
    for position, (name, version) in enumerate(pins[subdir]):
      # Pins come back in request order; the recorded index says where the
      # package sat in |packages|.
      package_pins[requested[position][2]] = {
          'package_name': name,
          # swarming deals with 'root' as '.'
          'path': subdir or '.',
          'version': version,
      }

  assert None not in package_pins, (packages, pins, package_pins)

  return package_pins
1271
1272
@contextlib.contextmanager
def install_client_and_packages(run_dir, packages, service_url,
                                client_package_name, client_version, cache_dir,
                                isolated_dir, cas_dir):
  """Bootstraps the CIPD client, installs packages and yields a CipdInfo.

  The CIPD client is obtained through cipd.get_client() and stays open for as
  long as the caller remains inside the context. While it is open:
    - the requested |packages| (if any) are installed under |run_dir|;
    - the isolated client is installed into |isolated_dir|;
    - the cas client is installed into |cas_dir|;
    - files under |run_dir| are made read only.

  The yielded CipdInfo carries the client, the CIPD cache directory, timing
  stats ('duration' and 'get_client_duration', in seconds) and the pins:
    {
      "client_package": {"package_name": ..., "version": ...},
      "packages": <value returned by _install_packages(), or [] when no
                   package was requested>,
    }

  If |packages| is empty or None, the CIPD client is still bootstrapped and the
  isolated/cas clients are still installed, but no other package is.

  Args:
    run_dir (str): root of installation.
    packages: packages to install, list [(path, package_name, version), ...].
    service_url (str): CIPD server url, e.g.
        "https://chrome-infra-packages.appspot.com".
    client_package_name (str): CIPD package name of CIPD client.
    client_version (str): Version of CIPD client.
    cache_dir (str): where to keep cache of cipd clients, packages and tags.
        Must not be empty.
    isolated_dir (str): where to download isolated client.
    cas_dir (str): where to download cas client.
  """
  assert cache_dir

  started = time.time()

  abs_cache_dir = os.path.abspath(cache_dir)
  # Tag and instance caches live in a dedicated sub directory.
  cipd_cache_dir = os.path.join(abs_cache_dir, 'cache')
  abs_run_dir = os.path.abspath(run_dir)

  client_started = time.time()
  with cipd.get_client(abs_cache_dir, service_url, client_package_name,
                       client_version) as client:
    get_client_duration = time.time() - client_started

    # Only hit CIPD for user packages when some were actually requested.
    package_pins = (
        _install_packages(abs_run_dir, cipd_cache_dir, client, packages)
        if packages else [])

    # The isolated and cas clients are always installed, each one at the root
    # ('') of its own directory and pinned at _LUCI_GO_REVISION.
    for tool_dir, tool_package in ((isolated_dir, ISOLATED_PACKAGE),
                                   (cas_dir, _CAS_PACKAGE)):
      _install_packages(tool_dir, cipd_cache_dir, client,
                        [('', tool_package, _LUCI_GO_REVISION)])

    file_path.make_tree_files_read_only(abs_run_dir)

    total_duration = time.time() - started
    logging.info('Installing CIPD client and packages took %d seconds',
                 total_duration)

    stats = {
        'duration': total_duration,
        'get_client_duration': get_client_duration,
    }
    pins = {
        'client_package': {
            'package_name': client.package_name,
            'version': client.instance_id,
        },
        'packages': package_pins,
    }
    yield CipdInfo(
        client=client, cache_dir=cipd_cache_dir, stats=stats, pins=pins)
nodirbe642ff2016-06-09 15:51:51 -07001360
1361
def create_option_parser():
  """Builds the option parser used by run_isolated.

  The parser is a logging_utils.OptionParserWithLogging. Options are organized
  in groups: data sources (isolate server, CAS), cache options, CIPD options,
  named caches, process containment, debugging and authentication.

  Note that -a/--argsfile is only declared here so it shows up in the help
  text; it is effectively consumed by parse_args().

  Returns:
    The fully configured option parser, with the default of --cache set to
    'cache'.
  """
  parser = logging_utils.OptionParserWithLogging(
      usage='%prog <options> [command to run or extra args]',
      version=__version__,
      log_file=RUN_ISOLATED_LOG_FILE)
  parser.add_option(
      '--clean',
      action='store_true',
      help='Cleans the cache, trimming it if necessary and remove corrupted '
      'items and returns without executing anything; use with -v to know '
      'what was done')
  parser.add_option(
      '--json',
      help='dump output metadata to json file. When used, run_isolated returns '
      'non-zero only on internal failure')
  parser.add_option(
      '--hard-timeout', type='float', help='Enforce hard timeout in execution')
  parser.add_option(
      '--grace-period',
      type='float',
      help='Grace period between SIGTERM and SIGKILL')
  parser.add_option(
      '--relative-cwd',
      help='Ignore the isolated \'relative_cwd\' and use this one instead')
  parser.add_option(
      '--env',
      default=[],
      action='append',
      help='Environment variables to set for the child process')
  parser.add_option(
      '--env-prefix',
      default=[],
      action='append',
      help='Specify a VAR=./path/fragment to put in the environment variable '
      'before executing the command. The path fragment must be relative '
      'to the isolated run directory, and must not contain a `..` token. '
      'The path will be made absolute and prepended to the indicated '
      '$VAR using the OS\'s path separator. Multiple items for the same '
      '$VAR will be prepended in order.')
  parser.add_option(
      '--bot-file',
      help='Path to a file describing the state of the host. The content is '
      'defined by on_before_task() in bot_config.')
  parser.add_option(
      '--switch-to-account',
      help='If given, switches LUCI_CONTEXT to given logical service account '
      '(e.g. "task" or "system") before launching the isolated process.')
  parser.add_option(
      '--output',
      action='append',
      help='Specifies an output to return. If no outputs are specified, all '
      'files located in $(ISOLATED_OUTDIR) will be returned; '
      'otherwise, outputs in both $(ISOLATED_OUTDIR) and those '
      'specified by --output option (there can be multiple) will be '
      'returned. Note that if a file in OUT_DIR has the same path '
      'as an --output option, the --output version will be returned.')
  parser.add_option(
      '-a',
      '--argsfile',
      # This is actually handled in parse_args; it's included here purely so it
      # can make it into the help text.
      help='Specify a file containing a JSON array of arguments to this '
      'script. If --argsfile is provided, no other argument may be '
      'provided on the command line.')
  parser.add_option(
      '--report-on-exception',
      action='store_true',
      help='Whether report exception during execution to isolate server. '
      'This flag should only be used in swarming bot.')

  group = optparse.OptionGroup(parser, 'Data source - Isolate server')
  # Deprecated. Isolate server is being migrated to RBE-CAS.
  # Remove --isolated and isolate server options after migration.
  group.add_option(
      '-s', '--isolated',
      help='Hash of the .isolated to grab from the isolate server.')
  isolateserver.add_isolate_server_options(group)
  parser.add_option_group(group)

  group = optparse.OptionGroup(parser,
                               'Data source - Content Addressed Storage')
  group.add_option(
      '--cas-instance', help='Full CAS instance name for input/output files.')
  group.add_option(
      '--cas-digest',
      help='Digest of the input root on RBE-CAS. The format is '
      '`{hash}/{size_bytes}`.')
  parser.add_option_group(group)

  # Cache options.
  isolateserver.add_cache_options(parser)
  add_cas_cache_options(parser)

  cipd.add_cipd_options(parser)

  group = optparse.OptionGroup(parser, 'Named caches')
  group.add_option(
      '--named-cache',
      dest='named_caches',
      action='append',
      nargs=3,
      default=[],
      help='A named cache to request. Accepts 3 arguments: name, path, hint. '
      'name identifies the cache, must match regex [a-z0-9_]{1,4096}. '
      'path is a path relative to the run dir where the cache directory '
      'must be put to. '
      'This option can be specified more than once.')
  group.add_option(
      '--named-cache-root',
      default='named_caches',
      help='Cache root directory. Default=%default')
  parser.add_option_group(group)

  # These options must be registered on |group|, not on |parser|, otherwise
  # the 'Process containment' section of the help text ends up empty. Parsing
  # is unaffected: grouped options are parsed like top-level ones.
  group = optparse.OptionGroup(parser, 'Process containment')
  group.add_option(
      '--lower-priority', action='store_true',
      help='Lowers the child process priority')
  group.add_option(
      '--containment-type',
      choices=('NONE', 'AUTO', 'JOB_OBJECT'),
      default='NONE',
      help='Type of container to use')
  group.add_option(
      '--limit-processes',
      type='int',
      default=0,
      help='Maximum number of active processes in the containment')
  group.add_option(
      '--limit-total-committed-memory',
      type='int',
      default=0,
      help='Maximum sum of committed memory in the containment')
  parser.add_option_group(group)

  group = optparse.OptionGroup(parser, 'Debugging')
  group.add_option(
      '--leak-temp-dir',
      action='store_true',
      help='Deliberately leak isolate\'s temp dir for later examination. '
      'Default: %default')
  group.add_option('--root-dir', help='Use a directory instead of a random one')
  parser.add_option_group(group)

  auth.add_auth_options(parser)

  parser.set_defaults(cache='cache')
  return parser
1509
1510
def add_cas_cache_options(parser):
  """Registers the 'CAS cache management' option group on |parser|.

  Two options are declared:
    --cas-cache: directory of the local CAS cache, defaults to 'cas-cache'.
    --kvs-dir: CAS cache dir using kvs for small files, defaults to ''.

  Args:
    parser: optparse parser that receives the new option group.
  """
  cas_group = optparse.OptionGroup(parser, 'CAS cache management')
  # (flags, keyword arguments) for each option, in help-text order.
  option_specs = (
      (('--cas-cache',), {
          'metavar': 'DIR',
          'default': 'cas-cache',
          'help': 'Directory to keep a local cache of the files. Accelerates '
                  'download by reusing already downloaded files. '
                  'Default=%default',
      }),
      (('--kvs-dir',), {
          'default': '',
          'help': 'CAS cache dir using kvs for small files. Default=%default',
      }),
  )
  for flags, settings in option_specs:
    cas_group.add_option(*flags, **settings)
  parser.add_option_group(cas_group)
1524
1525
def process_cas_cache_options(options):
  """Returns the CAS cache object selected by the parsed |options|.

  When --cas-cache is set, a local_caching.DiskContentAddressedCache rooted at
  the absolute path of that directory is returned; it is created with
  trim=False. Otherwise a local_caching.MemoryContentAddressedCache is
  returned.

  Args:
    options: parsed options; reads cas_cache, max_cache_size and
        min_free_space.
  """
  if not options.cas_cache:
    return local_caching.MemoryContentAddressedCache()

  cache_policies = local_caching.CachePolicies(
      max_cache_size=options.max_cache_size,
      min_free_space=options.min_free_space,
      # max_items isn't used for CAS cache for now.
      max_items=None,
      max_age_secs=MAX_AGE_SECS)
  cache_path = six.text_type(os.path.abspath(options.cas_cache))
  return local_caching.DiskContentAddressedCache(
      cache_path, cache_policies, trim=False)
1538
1539
def process_named_cache_options(parser, options, time_fn=None):
  """Validates the named cache options and builds the named cache object.

  Each --named-cache entry is a (name, path, hint) triple. Validation failures
  are reported through parser.error():
    - entries were given but --named-cache-root is empty;
    - a name does not match CACHE_NAME_RE;
    - a path is empty;
    - a hint cannot be converted with int().

  Args:
    parser: option parser, only used to report errors.
    options: parsed options; reads named_caches, named_cache_root and
        min_free_space.
    time_fn: forwarded as is to local_caching.NamedCache.

  Returns:
    A local_caching.NamedCache rooted at the absolute --named-cache-root, with
    the requested cache names already touched, or None when
    --named-cache-root is empty.
  """
  requested = options.named_caches
  cache_root = options.named_cache_root

  if requested and not cache_root:
    parser.error('--named-cache is specified, but --named-cache-root is empty')

  for cache_name, rel_path, size_hint in requested:
    if CACHE_NAME_RE.match(cache_name) is None:
      parser.error(
          'cache name %r does not match %r' %
          (cache_name, CACHE_NAME_RE.pattern))
    if not rel_path:
      parser.error('cache path cannot be empty')
    try:
      int(size_hint)
    except ValueError:
      parser.error('cache hint must be a number')

  if not cache_root:
    return None

  # Make these configurable later if there is use case but for now it's fairly
  # safe values.
  # In practice, a fair chunk of bots are already recycled on a daily schedule
  # so this code doesn't have any effect to them, unless they are preloaded
  # with a really old cache.
  one_tib = 1024 * 1024 * 1024 * 1024
  cache_policies = local_caching.CachePolicies(
      max_cache_size=one_tib,
      min_free_space=options.min_free_space,
      max_items=50,
      max_age_secs=MAX_AGE_SECS)
  abs_root = six.text_type(os.path.abspath(cache_root))
  named_cache = local_caching.NamedCache(
      abs_root, cache_policies, time_fn=time_fn)
  # Touch any named caches we're going to use to minimize thrashing
  # between tasks that request some (but not all) of the same named caches.
  names_in_use = [entry[0] for entry in options.named_caches]
  named_cache.touch(*names_in_use)
  return named_cache
1573
1574
def parse_args(args):
  """Parses the command line, honoring -a/--argsfile.

  When --argsfile is given, it must be the only argument; the file must
  contain a JSON array of arguments, which then replaces |args|.

  Args:
    args: list of command line arguments, without the program name.

  Returns:
    Tuple (parser, options, args) where parser is the one returned by
    create_option_parser(), and options/args are what it parsed.
    options.cipd_enabled is converted with distutils.util.strtobool() when it
    is neither a bool nor an int.
  """
  # Create a fake mini-parser just to get out the "-a" command. Note that
  # it's not documented here; instead, it's documented in create_option_parser
  # even though that parser will never actually get to parse it. This is
  # because --argsfile is exclusive with all other options and arguments.
  file_argparse = argparse.ArgumentParser(add_help=False)
  file_argparse.add_argument('-a', '--argsfile')
  (file_args, nonfile_args) = file_argparse.parse_known_args(args)
  if file_args.argsfile:
    if nonfile_args:
      # Mind the trailing space: the two literals are concatenated.
      file_argparse.error('Can\'t specify --argsfile with '
                          'any other arguments (%s)' % nonfile_args)
    try:
      with open(file_args.argsfile, 'r') as f:
        args = json.load(f)
    except (IOError, OSError, ValueError) as e:
      # Don't error out here, only report the problem: |args| is left as it
      # was passed in (it still holds the --argsfile flag) and parsing goes on
      # with the normal parser below.
      print('Couldn\'t read arguments: %s' % e, file=sys.stderr)

  # Even if we failed to read the args, just call the normal parser now.
  parser = create_option_parser()
  options, args = parser.parse_args(args)
  if not isinstance(options.cipd_enabled, (bool, int)):
    options.cipd_enabled = distutils.util.strtobool(options.cipd_enabled)
  return (parser, options, args)
1603
1604
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001605def _calc_named_cache_hint(named_cache, named_caches):
1606 """Returns the expected size of the missing named caches."""
1607 present = named_cache.available
1608 size = 0
1609 for name, _, hint in named_caches:
1610 if name not in present:
Takuto Ikuta630f99d2020-07-02 12:59:35 +00001611 hint = int(hint)
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001612 if hint > 0:
1613 size += hint
1614 return size
1615
1616
Takuto Ikutaae391c52020-12-03 08:43:45 +00001617def _clean_cmd(parser, options, caches, root):
Takuto Ikuta7ff4b242020-12-03 08:07:06 +00001618 """Cleanup cache dirs/files."""
1619 if options.isolated:
1620 parser.error('Can\'t use --isolated with --clean.')
1621 if options.isolate_server:
1622 parser.error('Can\'t use --isolate-server with --clean.')
1623 if options.json:
1624 parser.error('Can\'t use --json with --clean.')
1625 if options.named_caches:
1626 parser.error('Can\t use --named-cache with --clean.')
1627 if options.cas_instance or options.cas_digest:
1628 parser.error('Can\t use --cas-instance, --cas-digest with --clean.')
1629
1630 logging.info("initial free space: %d", file_path.get_free_space(root))
1631
Takuto Ikuta91cb5ca2021-03-17 07:19:30 +00001632 if options.kvs_dir and fs.isdir(six.text_type(options.kvs_dir)):
Takuto Ikuta7ff4b242020-12-03 08:07:06 +00001633 # Remove kvs file if its size exceeds fixed threshold.
Takuto Ikutab1b70062021-03-22 01:02:41 +00001634 kvs_dir = six.text_type(options.kvs_dir)
1635 size = file_path.get_recursive_size(kvs_dir)
Takuto Ikuta91cb5ca2021-03-17 07:19:30 +00001636 if size >= _CAS_KVS_CACHE_THRESHOLD:
1637 logging.info("remove kvs dir with size: %d", size)
Takuto Ikutab1b70062021-03-22 01:02:41 +00001638 file_path.rmtree(kvs_dir)
Takuto Ikuta7ff4b242020-12-03 08:07:06 +00001639
1640 # Trim first, then clean.
1641 local_caching.trim_caches(
1642 caches,
1643 root,
1644 min_free_space=options.min_free_space,
1645 max_age_secs=MAX_AGE_SECS)
1646 logging.info("free space after trim: %d", file_path.get_free_space(root))
1647 for c in caches:
1648 c.cleanup()
1649 logging.info("free space after cleanup: %d", file_path.get_free_space(root))
1650
1651
aludwin7556e0c2016-10-26 08:46:10 -07001652def main(args):
Marc-Antoine Ruelee6ca622017-11-29 11:19:16 -05001653 # Warning: when --argsfile is used, the strings are unicode instances, when
1654 # parsed normally, the strings are str instances.
aludwin7556e0c2016-10-26 08:46:10 -07001655 (parser, options, args) = parse_args(args)
maruel36a963d2016-04-08 17:15:49 -07001656
Junji Watanabe1d83d282021-05-11 05:50:40 +00001657 SWARMING_SERVER = os.environ.get('SWARMING_SERVER')
1658 SWARMING_TASK_ID = os.environ.get('SWARMING_TASK_ID')
1659 if options.report_on_exception and SWARMING_SERVER:
1660 task_url = None
1661 if SWARMING_TASK_ID:
1662 task_url = '%s/task?id=%s' % (SWARMING_SERVER, SWARMING_TASK_ID)
1663 on_error.report_on_exception_exit(SWARMING_SERVER, source=task_url)
Takuto Ikutad4be2f12020-05-12 02:15:25 +00001664
Marc-Antoine Ruel5028ba22017-08-25 17:37:51 -04001665 if not file_path.enable_symlink():
Marc-Antoine Ruel5a024272019-01-15 20:11:16 +00001666 logging.warning('Symlink support is not enabled')
Marc-Antoine Ruel5028ba22017-08-25 17:37:51 -04001667
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001668 named_cache = process_named_cache_options(parser, options)
Marc-Antoine Ruel0d8b0f62018-09-10 14:40:35 +00001669 # hint is 0 if there's no named cache.
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001670 hint = _calc_named_cache_hint(named_cache, options.named_caches)
1671 if hint:
1672 # Increase the --min-free-space value by the hint, and recreate the
1673 # NamedCache instance so it gets the updated CachePolicy.
1674 options.min_free_space += hint
1675 named_cache = process_named_cache_options(parser, options)
1676
Takuto Ikuta5c59a842020-01-24 03:05:24 +00001677 # TODO(crbug.com/932396): Remove this.
Takuto Ikuta4a22c2c2020-06-05 02:02:23 +00001678 use_go_isolated = options.cipd_enabled
Takuto Ikuta5c59a842020-01-24 03:05:24 +00001679
Marc-Antoine Ruel7139d912018-06-15 20:04:42 +00001680 # TODO(maruel): CIPD caches should be defined at an higher level here too, so
1681 # they can be cleaned the same way.
Takuto Ikutaf1c58442020-10-20 09:03:27 +00001682
1683 isolate_cache = isolateserver.process_cache_options(options, trim=False)
1684 cas_cache = process_cas_cache_options(options)
Takuto Ikuta00cf8fc2020-01-14 01:36:00 +00001685
Marc-Antoine Ruel7139d912018-06-15 20:04:42 +00001686 caches = []
1687 if isolate_cache:
1688 caches.append(isolate_cache)
Junji Watanabeb03450b2020-09-25 05:09:27 +00001689 if cas_cache:
1690 caches.append(cas_cache)
Marc-Antoine Ruel7139d912018-06-15 20:04:42 +00001691 if named_cache:
1692 caches.append(named_cache)
Takuto Ikuta6e2ff962019-10-29 12:35:27 +00001693 root = caches[0].cache_dir if caches else six.text_type(os.getcwd())
maruel36a963d2016-04-08 17:15:49 -07001694 if options.clean:
Takuto Ikutaae391c52020-12-03 08:43:45 +00001695 _clean_cmd(parser, options, caches, root)
maruel36a963d2016-04-08 17:15:49 -07001696 return 0
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001697
1698 # Trim must still be done for the following case:
1699 # - named-cache was used
1700 # - some entries, with a large hint, where missing
1701 # - --min-free-space was increased accordingly, thus trimming is needed
1702 # Otherwise, this will have no effect, as bot_main calls run_isolated with
1703 # --clean after each task.
Takuto Ikutac9ddff22021-02-18 07:58:39 +00001704 additional_buffer = _FREE_SPACE_BUFFER_FOR_CIPD_PACKAGES
Takuto Ikuta91cb5ca2021-03-17 07:19:30 +00001705 if options.kvs_dir:
Takuto Ikuta7f45c592021-02-09 05:57:05 +00001706 additional_buffer += _CAS_KVS_CACHE_THRESHOLD
Junji Watanabeaee69ad2021-04-28 03:17:34 +00001707 # Add some buffer for Go CLI.
1708 min_free_space = options.min_free_space + additional_buffer
1709
1710 def trim_caches_fn(stats):
1711 start = time.time()
1712 local_caching.trim_caches(
1713 caches, root, min_free_space=min_free_space, max_age_secs=MAX_AGE_SECS)
1714 duration = time.time() - start
1715 stats['duration'] = duration
1716 logging.info('trim_caches: took %d seconds', duration)
maruel36a963d2016-04-08 17:15:49 -07001717
Takuto Ikutaf1c58442020-10-20 09:03:27 +00001718 # Save state of isolate/cas cache not to overwrite state from go client.
1719 if use_go_isolated:
1720 isolate_cache.save()
1721 isolate_cache = None
1722 if cas_cache:
1723 cas_cache.save()
1724 cas_cache = None
1725
nodir55be77b2016-05-03 09:39:57 -07001726 if not options.isolated and not args:
1727 parser.error('--isolated or command to run is required.')
1728
Vadim Shtayura5d1efce2014-02-04 10:55:43 -08001729 auth.process_auth_options(parser, options)
nodir55be77b2016-05-03 09:39:57 -07001730
Takuto Ikutaae767b32020-05-11 01:22:19 +00001731 isolateserver.process_isolate_server_options(parser, options, False)
Junji Watanabeed9ce352020-09-25 12:32:07 +00001732 if ISOLATED_OUTDIR_PARAMETER in args and (not options.isolate_server and
1733 not options.cas_instance):
1734 parser.error('%s in args requires --isolate-server or --cas-instance' %
1735 ISOLATED_OUTDIR_PARAMETER)
1736
1737 if options.isolated and not options.isolate_server:
1738 parser.error('--isolated requires --isolate-server')
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001739
nodir90bc8dc2016-06-15 13:35:21 -07001740 if options.root_dir:
Takuto Ikuta6e2ff962019-10-29 12:35:27 +00001741 options.root_dir = six.text_type(os.path.abspath(options.root_dir))
Takuto Ikutad46ea762020-10-07 05:43:22 +00001742 else:
1743 options.root_dir = six.text_type(tempfile.mkdtemp(prefix='root'))
maruel12e30012015-10-09 11:55:35 -07001744 if options.json:
Takuto Ikuta6e2ff962019-10-29 12:35:27 +00001745 options.json = six.text_type(os.path.abspath(options.json))
nodir55be77b2016-05-03 09:39:57 -07001746
Marc-Antoine Ruel19dd8872017-11-28 18:33:39 -05001747 if any('=' not in i for i in options.env):
1748 parser.error(
1749 '--env required key=value form. value can be skipped to delete '
1750 'the variable')
Marc-Antoine Ruel7a68f712017-12-01 18:45:18 -05001751 options.env = dict(i.split('=', 1) for i in options.env)
Marc-Antoine Ruel19dd8872017-11-28 18:33:39 -05001752
1753 prefixes = {}
1754 cwd = os.path.realpath(os.getcwd())
1755 for item in options.env_prefix:
1756 if '=' not in item:
1757 parser.error(
1758 '--env-prefix %r is malformed, must be in the form `VAR=./path`'
1759 % item)
Marc-Antoine Ruel7a68f712017-12-01 18:45:18 -05001760 key, opath = item.split('=', 1)
Marc-Antoine Ruel19dd8872017-11-28 18:33:39 -05001761 if os.path.isabs(opath):
1762 parser.error('--env-prefix %r path is bad, must be relative.' % opath)
1763 opath = os.path.normpath(opath)
1764 if not os.path.realpath(os.path.join(cwd, opath)).startswith(cwd):
1765 parser.error(
Junji Watanabe38b28b02020-04-23 10:23:30 +00001766 '--env-prefix %r path is bad, must be relative and not contain `..`.'
1767 % opath)
Marc-Antoine Ruel19dd8872017-11-28 18:33:39 -05001768 prefixes.setdefault(key, []).append(opath)
1769 options.env_prefix = prefixes
Robert Iannuccibf5f84c2017-11-22 12:56:50 -08001770
nodirbe642ff2016-06-09 15:51:51 -07001771 cipd.validate_cipd_options(parser, options)
1772
vadimsh232f5a82017-01-20 19:23:44 -08001773 install_packages_fn = noop_install_packages
Ye Kuang1d096cb2020-06-26 08:38:21 +00001774 tmp_cipd_cache_dir = None
vadimsh902948e2017-01-20 15:57:32 -08001775 if options.cipd_enabled:
Ye Kuang1d096cb2020-06-26 08:38:21 +00001776 cache_dir = options.cipd_cache
1777 if not cache_dir:
1778 tmp_cipd_cache_dir = six.text_type(tempfile.mkdtemp())
1779 cache_dir = tmp_cipd_cache_dir
Takuto Ikutab7ce0e32019-11-27 23:26:18 +00001780 install_packages_fn = (
Junji Watanabe4b890ef2020-09-16 01:43:27 +00001781 lambda run_dir, isolated_dir, cas_dir: install_client_and_packages(
Ye Kuang1d096cb2020-06-26 08:38:21 +00001782 run_dir,
1783 cipd.parse_package_args(options.cipd_packages),
1784 options.cipd_server,
1785 options.cipd_client_package,
1786 options.cipd_client_version,
1787 cache_dir=cache_dir,
Junji Watanabe4b890ef2020-09-16 01:43:27 +00001788 isolated_dir=isolated_dir,
1789 cas_dir=cas_dir,
1790 ))
nodirbe642ff2016-06-09 15:51:51 -07001791
nodird6160682017-02-02 13:03:35 -08001792 @contextlib.contextmanager
Junji Watanabeaee69ad2021-04-28 03:17:34 +00001793 def install_named_caches(run_dir, stats):
nodird6160682017-02-02 13:03:35 -08001794 # WARNING: this function depends on "options" variable defined in the outer
1795 # function.
Takuto Ikuta6e2ff962019-10-29 12:35:27 +00001796 assert six.text_type(run_dir), repr(run_dir)
Marc-Antoine Ruel49f9f8d2018-05-24 15:57:06 -04001797 assert os.path.isabs(run_dir), run_dir
Takuto Ikuta6e2ff962019-10-29 12:35:27 +00001798 named_caches = [(os.path.join(run_dir, six.text_type(relpath)), name)
1799 for name, relpath, _ in options.named_caches]
Junji Watanabeaee69ad2021-04-28 03:17:34 +00001800 install_start = time.time()
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001801 for path, name in named_caches:
Marc-Antoine Ruele79ddbf2018-06-13 18:33:07 +00001802 named_cache.install(path, name)
Junji Watanabeaee69ad2021-04-28 03:17:34 +00001803 install_duration = time.time() - install_start
1804 stats['install']['duration'] = install_duration
1805 logging.info('named_caches: install took %d seconds', install_duration)
nodird6160682017-02-02 13:03:35 -08001806 try:
1807 yield
1808 finally:
dnje289d132017-07-07 11:16:44 -07001809 # Uninstall each named cache, returning it to the cache pool. If an
1810 # uninstall fails for a given cache, it will remain in the task's
1811 # temporary space, get cleaned up by the Swarming bot, and be lost.
1812 #
1813 # If the Swarming bot cannot clean up the cache, it will handle it like
1814 # any other bot file that could not be removed.
Junji Watanabeaee69ad2021-04-28 03:17:34 +00001815 uninstall_start = time.time()
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001816 for path, name in reversed(named_caches):
Marc-Antoine Ruele79ddbf2018-06-13 18:33:07 +00001817 try:
Marc-Antoine Ruele9558372018-08-03 03:41:22 +00001818 # uninstall() doesn't trim but does call save() implicitly. Trimming
1819 # *must* be done manually via periodic 'run_isolated.py --clean'.
Marc-Antoine Ruele79ddbf2018-06-13 18:33:07 +00001820 named_cache.uninstall(path, name)
1821 except local_caching.NamedCacheError:
Takuto Ikuta463ecdd2021-03-05 09:35:38 +00001822 if sys.platform == 'win32':
1823 # Show running processes.
1824 sys.stderr.write("running process\n")
1825 subprocess42.check_call(['tasklist.exe', '/V'], stdout=sys.stderr)
1826
Marc-Antoine Ruele79ddbf2018-06-13 18:33:07 +00001827 logging.exception('Error while removing named cache %r at %r. '
1828 'The cache will be lost.', path, name)
Junji Watanabeaee69ad2021-04-28 03:17:34 +00001829 uninstall_duration = time.time() - uninstall_start
1830 stats['uninstall']['duration'] = uninstall_duration
1831 logging.info('named_caches: uninstall took %d seconds',
1832 uninstall_duration)
nodirf33b8d62016-10-26 22:34:58 -07001833
Takuto Ikutaf3caa9b2020-11-02 05:38:26 +00001834 command = args
1835 if options.relative_cwd:
1836 a = os.path.normpath(os.path.abspath(options.relative_cwd))
1837 if not a.startswith(os.getcwd()):
1838 parser.error(
1839 '--relative-cwd must not try to escape the working directory')
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -05001840
Marc-Antoine Ruel1b65f4e2019-05-02 21:56:58 +00001841 containment_type = subprocess42.Containment.NONE
1842 if options.containment_type == 'AUTO':
1843 containment_type = subprocess42.Containment.AUTO
1844 if options.containment_type == 'JOB_OBJECT':
1845 containment_type = subprocess42.Containment.JOB_OBJECT
1846 containment = subprocess42.Containment(
1847 containment_type=containment_type,
1848 limit_processes=options.limit_processes,
1849 limit_total_committed_memory=options.limit_total_committed_memory)
1850
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -05001851 data = TaskData(
1852 command=command,
Marc-Antoine Ruel95068cf2017-12-07 21:35:05 -05001853 relative_cwd=options.relative_cwd,
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -05001854 isolated_hash=options.isolated,
1855 storage=None,
1856 isolate_cache=isolate_cache,
Junji Watanabe54925c32020-09-08 00:56:18 +00001857 cas_instance=options.cas_instance,
1858 cas_digest=options.cas_digest,
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -05001859 outputs=options.output,
1860 install_named_caches=install_named_caches,
1861 leak_temp_dir=options.leak_temp_dir,
1862 root_dir=_to_unicode(options.root_dir),
1863 hard_timeout=options.hard_timeout,
1864 grace_period=options.grace_period,
1865 bot_file=options.bot_file,
1866 switch_to_account=options.switch_to_account,
1867 install_packages_fn=install_packages_fn,
Takuto Ikuta5c59a842020-01-24 03:05:24 +00001868 use_go_isolated=use_go_isolated,
Takuto Ikuta10cae642020-01-08 08:12:07 +00001869 go_cache_dir=options.cache,
Takuto Ikuta879788c2020-01-10 08:00:26 +00001870 go_cache_policies=local_caching.CachePolicies(
1871 max_cache_size=options.max_cache_size,
1872 min_free_space=options.min_free_space,
1873 max_items=options.max_items,
1874 max_age_secs=None,
1875 ),
Junji Watanabeb03450b2020-09-25 05:09:27 +00001876 cas_cache_dir=options.cas_cache,
1877 cas_cache_policies=local_caching.CachePolicies(
1878 max_cache_size=options.max_cache_size,
1879 min_free_space=options.min_free_space,
1880 max_items=None,
1881 max_age_secs=None,
1882 ),
Takuto Ikuta91cb5ca2021-03-17 07:19:30 +00001883 cas_kvs=options.kvs_dir,
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -05001884 env=options.env,
Marc-Antoine Ruel03c6fd12019-04-30 12:12:55 +00001885 env_prefix=options.env_prefix,
Marc-Antoine Ruel1b65f4e2019-05-02 21:56:58 +00001886 lower_priority=bool(options.lower_priority),
Junji Watanabeaee69ad2021-04-28 03:17:34 +00001887 containment=containment,
1888 trim_caches_fn=trim_caches_fn)
nodirbe642ff2016-06-09 15:51:51 -07001889 try:
nodir90bc8dc2016-06-15 13:35:21 -07001890 if options.isolate_server:
Marc-Antoine Ruelb8513132018-11-20 19:48:53 +00001891 server_ref = isolate_storage.ServerRef(
nodir90bc8dc2016-06-15 13:35:21 -07001892 options.isolate_server, options.namespace)
Marc-Antoine Ruelb8513132018-11-20 19:48:53 +00001893 storage = isolateserver.get_storage(server_ref)
nodir90bc8dc2016-06-15 13:35:21 -07001894 with storage:
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -05001895 data = data._replace(storage=storage)
nodirf33b8d62016-10-26 22:34:58 -07001896 # Hashing schemes used by |storage| and |isolate_cache| MUST match.
Marc-Antoine Ruelb8513132018-11-20 19:48:53 +00001897 assert storage.server_ref.hash_algo == server_ref.hash_algo
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -05001898 return run_tha_test(data, options.json)
1899 return run_tha_test(data, options.json)
Junji Watanabe38b28b02020-04-23 10:23:30 +00001900 except (cipd.Error, local_caching.NamedCacheError,
1901 local_caching.NoMoreSpace) as ex:
Marc-Antoine Ruelf899c482019-10-10 23:32:06 +00001902 print(ex.message, file=sys.stderr)
nodirbe642ff2016-06-09 15:51:51 -07001903 return 1
Ye Kuang1d096cb2020-06-26 08:38:21 +00001904 finally:
1905 if tmp_cipd_cache_dir is not None:
1906 try:
1907 file_path.rmtree(tmp_cipd_cache_dir)
1908 except OSError:
1909 logging.exception('Remove tmp_cipd_cache_dir=%s failed',
1910 tmp_cipd_cache_dir)
1911 # Best effort clean up. Failed to do so doesn't affect the outcome.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001912
1913
if __name__ == '__main__':
  # Script entry point: the process-wide setup calls below run, in this
  # order, before main() is invoked.
  subprocess42.inhibit_os_error_reporting()
  # Ensure that we are always running with the correct encoding.
  fix_encoding.fix_encoding()
  # The user agent handed to net names this script and its version.
  user_agent = 'run_isolated.py/' + __version__
  net.set_user_agent(user_agent)
  # main() receives the command line without the program name; its return
  # value becomes the process exit status.
  cli_args = sys.argv[1:]
  exit_code = main(cli_args)
  sys.exit(exit_code)