blob: 089c1fafe5bbc6786c5fca9e234ae9911f62a267 [file] [log] [blame]
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001#!/usr/bin/env python
maruelea586f32016-04-05 11:11:33 -07002# Copyright 2012 The LUCI Authors. All rights reserved.
maruelf1f5e2a2016-05-25 17:10:39 -07003# Use of this source code is governed under the Apache License, Version 2.0
4# that can be found in the LICENSE file.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00005
nodir55be77b2016-05-03 09:39:57 -07006"""Runs a command with optional isolated input/output.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00007
run_isolated takes care of setting up a temporary environment, running a
9command, and tearing it down.
nodir55be77b2016-05-03 09:39:57 -070010
Marc-Antoine Rueleed2f3a2019-03-14 00:00:40 +000011It handles downloading and uploading isolated files, mapping CIPD packages and
12reusing stateful named caches.
13
14The isolated files, CIPD packages and named caches are kept as a global LRU
15cache.
Marc-Antoine Ruel2283ad12014-02-09 11:14:57 -050016
Roberto Carrillo71ade6d2018-10-08 22:30:24 +000017Any ${EXECUTABLE_SUFFIX} on the command line or the environment variables passed
18with the --env option will be replaced with ".exe" string on Windows and "" on
19other platforms.
nodirbe642ff2016-06-09 15:51:51 -070020
Roberto Carrillo71ade6d2018-10-08 22:30:24 +000021Any ${ISOLATED_OUTDIR} on the command line or the environment variables passed
22with the --env option will be replaced by the location of a temporary directory
23upon execution of the command specified in the .isolated file. All content
24written to this directory will be uploaded upon termination and the .isolated
25file describing this directory will be printed to stdout.
bpastene447c1992016-06-20 15:21:47 -070026
Marc-Antoine Rueleed2f3a2019-03-14 00:00:40 +000027Any ${SWARMING_BOT_FILE} on the command line or the environment variables passed
28with the --env option will be replaced by the value of the --bot-file parameter.
29This file is used by a swarming bot to communicate state of the host to tasks.
30It is written to by the swarming bot's on_before_task() hook in the swarming
31server's custom bot_config.py.
32
33See
34https://chromium.googlesource.com/infra/luci/luci-py.git/+/master/appengine/swarming/doc/Magic-Values.md
35for all the variables.
36
37See
38https://chromium.googlesource.com/infra/luci/luci-py.git/+/master/appengine/swarming/swarming_bot/config/bot_config.py
39for more information about bot_config.py.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000040"""
41
Marc-Antoine Ruelf899c482019-10-10 23:32:06 +000042from __future__ import print_function
43
44__version__ = '1.0.1'
maruel@chromium.orgdedbf492013-09-12 20:42:11 +000045
aludwin7556e0c2016-10-26 08:46:10 -070046import argparse
maruel064c0a32016-04-05 11:47:15 -070047import base64
iannucci96fcccc2016-08-30 15:52:22 -070048import collections
vadimsh232f5a82017-01-20 19:23:44 -080049import contextlib
Ye Kuangfff1e502020-07-13 13:21:57 +000050import distutils
Sadaf Matinkhoo10743a62018-03-29 16:28:58 -040051import errno
aludwin7556e0c2016-10-26 08:46:10 -070052import json
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000053import logging
54import optparse
55import os
Takuto Ikuta5c59a842020-01-24 03:05:24 +000056import platform
Marc-Antoine Ruel8b11dbd2018-05-18 14:31:22 -040057import re
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000058import sys
59import tempfile
maruel064c0a32016-04-05 11:47:15 -070060import time
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000061
Marc-Antoine Ruel016c7602019-04-02 18:31:13 +000062from utils import tools
63tools.force_local_third_party()
vadimsh@chromium.orga4326472013-08-24 02:05:41 +000064
Marc-Antoine Ruel016c7602019-04-02 18:31:13 +000065# third_party/
66from depot_tools import fix_encoding
Takuto Ikuta6e2ff962019-10-29 12:35:27 +000067import six
Marc-Antoine Ruel016c7602019-04-02 18:31:13 +000068
69# pylint: disable=ungrouped-imports
Takuto Ikutad53d7bd2021-07-16 03:09:33 +000070import DEPS
Marc-Antoine Ruel016c7602019-04-02 18:31:13 +000071import auth
72import cipd
73import isolate_storage
74import isolateserver
75import local_caching
76from libs import luci_context
Vadim Shtayura6b555c12014-07-23 16:22:18 -070077from utils import file_path
maruel12e30012015-10-09 11:55:35 -070078from utils import fs
maruel064c0a32016-04-05 11:47:15 -070079from utils import large
Marc-Antoine Ruelf74cffe2015-07-15 15:21:34 -040080from utils import logging_utils
Ye Kuang2dd17442020-04-22 08:45:52 +000081from utils import net
Marc-Antoine Ruelcfb60852014-07-02 15:22:00 -040082from utils import on_error
Marc-Antoine Ruelc44f5722015-01-08 16:10:01 -050083from utils import subprocess42
maruel@chromium.orgdedbf492013-09-12 20:42:11 +000084
vadimsh@chromium.orga4326472013-08-24 02:05:41 +000085
# Magic variables that can be found in the isolate task command line. They are
# the tokens substituted by replace_parameters() in command arguments and
# environment variable values.
ISOLATED_OUTDIR_PARAMETER = '${ISOLATED_OUTDIR}'
EXECUTABLE_SUFFIX_PARAMETER = '${EXECUTABLE_SUFFIX}'
SWARMING_BOT_FILE_PARAMETER = '${SWARMING_BOT_FILE}'


# The name of the log file to use.
RUN_ISOLATED_LOG_FILE = 'run_isolated.log'
94
maruele2f2cb82016-07-13 14:41:03 -070095
# Use short names for temporary directories. This is driven by Windows, which
# imposes a relatively short maximum path length of 260 characters, often
# referred to as MAX_PATH. It is relatively easy to create files with longer
# path length. A use case is with recursive dependency trees like npm packages.
#
# It is recommended to start the script with a `root_dir` as short as
# possible.
# - ir stands for isolated_run
# - io stands for isolated_out
# - it stands for isolated_tmp
# - ic stands for isolated_client
# - cc stands for cas_client
ISOLATED_RUN_DIR = u'ir'
ISOLATED_OUT_DIR = u'io'
ISOLATED_TMP_DIR = u'it'
ISOLATED_CLIENT_DIR = u'ic'
_CAS_CLIENT_DIR = u'cc'
maruele2f2cb82016-07-13 14:41:03 -0700112
# TODO(tikuta): take these parameter from luci-config?
# Package paths of the Go `isolated` and `cas` clients. The '${platform}' token
# is kept verbatim in these strings; it is not expanded here.
ISOLATED_PACKAGE = 'infra/tools/luci/isolated/${platform}'
_CAS_PACKAGE = 'infra/tools/luci/cas/${platform}'
# Version recorded for the first package of the 'luci-go' entry in DEPS.
_LUCI_GO_REVISION = DEPS.deps['luci-go']['packages'][0]['version']

# Keep synced with task_request.py
# Accepts 1 to 4096 characters drawn from lowercase ASCII letters, digits and
# underscore.
CACHE_NAME_RE = re.compile(r'^[a-z0-9_]{1,4096}$')

# 2 GiB.
# NOTE(review): presumably the amount of free disk space to keep available for
# CIPD packages; confirm against the code that uses it.
_FREE_SPACE_BUFFER_FOR_CIPD_PACKAGES = 2 * 1024 * 1024 * 1024
Marc-Antoine Ruel8b11dbd2018-05-18 14:31:22 -0400122
marueld928c862017-06-08 08:20:04 -0700123OUTLIVING_ZOMBIE_MSG = """\
124*** Swarming tried multiple times to delete the %s directory and failed ***
125*** Hard failing the task ***
126
127Swarming detected that your testing script ran an executable, which may have
128started a child executable, and the main script returned early, leaving the
129children executables playing around unguided.
130
131You don't want to leave children processes outliving the task on the Swarming
132bot, do you? The Swarming bot doesn't.
133
134How to fix?
135- For any process that starts children processes, make sure all children
136 processes terminated properly before each parent process exits. This is
137 especially important in very deep process trees.
138 - This must be done properly both in normal successful task and in case of
139 task failure. Cleanup is very important.
140- The Swarming bot sends a SIGTERM in case of timeout.
141 - You have %s seconds to comply after the signal was sent to the process
142 before the process is forcibly killed.
143- To achieve not leaking children processes in case of signals on timeout, you
144 MUST handle signals in each executable / python script and propagate them to
145 children processes.
146 - When your test script (python or binary) receives a signal like SIGTERM or
147 CTRL_BREAK_EVENT on Windows), send it to all children processes and wait for
148 them to terminate before quitting.
149
150See
Marc-Antoine Ruelc7243592018-05-24 17:04:04 -0400151https://chromium.googlesource.com/infra/luci/luci-py.git/+/master/appengine/swarming/doc/Bot.md#Graceful-termination_aka-the-SIGTERM-and-SIGKILL-dance
marueld928c862017-06-08 08:20:04 -0700152for more information.
153
154*** May the SIGKILL force be with you ***
155"""
156
157
# Currently hardcoded. Eventually could be exposed as a flag once there's value.
# 3 weeks, expressed in seconds.
MAX_AGE_SECS = 21*24*60*60

# NOTE(review): presumably a size threshold for the kvs cache used by the `cas`
# client; confirm against the code that uses it.
_CAS_KVS_CACHE_THRESHOLD = 5 * 1024 * 1024 * 1024  # 5 GiB
163
# Immutable bundle of everything needed to run one task. Fields are listed in
# positional order; each one is described right above its name.
TaskData = collections.namedtuple(
    'TaskData',
    (
        # Command line to run, as a list of strings. It is used regardless of
        # what the isolated file specifies.
        'command',
        # Directory, relative to the mapped tree, to start the command in.
        'relative_cwd',
        # Hash of the .isolated file to fetch in order to recreate the tree of
        # files needed by the target executable. The command specified in the
        # .isolated is executed. Mutually exclusive with command argument.
        'isolated_hash',
        # isolateserver.Storage instance used to retrieve remote objects. It
        # holds a reference to an isolateserver.StorageApi, which performs the
        # actual I/O.
        'storage',
        # isolateserver.LocalCache instance that caches retrieved objects so
        # they are not fetched over and over. Can be on-disk or in-memory.
        'isolate_cache',
        # Digest of the input root on RBE-CAS.
        'cas_digest',
        # Full CAS instance name.
        'cas_instance',
        # Paths, relative to root_dir, to put into the output isolated bundle
        # upon task completion (see link_outputs_to_outdir).
        'outputs',
        # Function (run_dir) => context manager that installs named caches
        # into |run_dir|.
        'install_named_caches',
        # When True, the temporary directory is deliberately leaked for later
        # examination.
        'leak_temp_dir',
        # Directory in which the temporary directory is created. If not
        # specified, a random temporary directory is created.
        'root_dir',
        # The process is killed if it lasts more than this many seconds.
        'hard_timeout',
        # Number of seconds to wait between SIGTERM and SIGKILL.
        'grace_period',
        # Path to a file with bot state, used in place of ${SWARMING_BOT_FILE}
        # task command line argument.
        'bot_file',
        # Logical account to switch LUCI_CONTEXT into.
        'switch_to_account',
        # Context manager dir => CipdInfo, see install_client_and_packages.
        'install_packages_fn',
        # Use go isolated client.
        'use_go_isolated',
        # Cache directory for go `isolated` client.
        'go_cache_dir',
        # Parameters passed to go `isolated` client.
        'go_cache_policies',
        # Cache directory for `cas` client.
        'cas_cache_dir',
        # Parameters passed to `cas` client.
        'cas_cache_policies',
        # Parameters for kvs file used by `cas` client.
        'cas_kvs',
        # Environment variables to set.
        'env',
        # Environment variables to mutate with relative directories.
        # Example: {"ENV_KEY": ['relative', 'paths', 'to', 'prepend']}
        'env_prefix',
        # Lowers the task process priority.
        'lower_priority',
        # subprocess42.Containment instance. Can be None.
        'containment',
        # Function that trims caches before cipd packages are installed and
        # isolated files are downloaded.
        'trim_caches_fn',
    ))
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -0500236
237
Marc-Antoine Ruelee6ca622017-11-29 11:19:16 -0500238def _to_str(s):
239 """Downgrades a unicode instance to str. Pass str through as-is."""
240 if isinstance(s, str):
241 return s
242 # This is technically incorrect, especially on Windows. In theory
243 # sys.getfilesystemencoding() should be used to use the right 'ANSI code
244 # page' on Windows, but that causes other problems, as the character set
245 # is very limited.
246 return s.encode('utf-8')
247
248
def _to_unicode(s):
  """Returns |s| as text, decoding it from UTF-8 when it is not text already.

  None and text (six.text_type) values are returned unchanged.
  """
  needs_decoding = s is not None and not isinstance(s, six.text_type)
  return s.decode('utf-8') if needs_decoding else s
254
255
def make_temp_dir(prefix, root_dir):
  """Creates a fresh, uniquely named directory under |root_dir|.

  The directory name starts with |prefix|. The path is returned as text.
  """
  new_dir = tempfile.mkdtemp(dir=root_dir, prefix=prefix)
  return six.text_type(new_dir)
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +0000259
260
@contextlib.contextmanager
def set_luci_context_account(account, tmp_dir):
  """Context manager that makes |account| the default LUCI_CONTEXT account.

  Nothing is changed in any of these cases:
  - |account| is None or ''. This happens when run_isolated.py is called
    without '--switch-to-account' flag. If run_isolated.py is running in some
    LUCI_CONTEXT environment, the task then just inherits whatever account is
    already set. This may happen if users invoke run_isolated.py explicitly
    from their code.
  - LUCI_CONTEXT-based auth is not in use.
  - The requested account is already the default one.

  If the requested account is not defined in the context, switches to
  non-authenticated access. This happens for Swarming tasks that don't use
  'task' service accounts.

  Args:
    account: logical account id to switch to; may be None or ''.
    tmp_dir: directory handed to luci_context.write() as |_tmpdir|.
  """
  # LUCI_CONTEXT is only consulted when a switch was actually requested.
  local_auth = luci_context.read('local_auth') if account else None

  # See LUCI_CONTEXT.md for the format of 'local_auth'.
  if not local_auth or local_auth.get('default_account_id') == account:
    # Not switching, not using LUCI_CONTEXT auth, or already set.
    yield
    return

  known_ids = {entry['id'] for entry in local_auth.get('accounts') or []}
  if account not in known_ids:
    logging.warning(
        'Requested LUCI_CONTEXT account %r is not available (have only %r), '
        'disabling authentication', account, sorted(known_ids))
    local_auth.pop('default_account_id', None)
  else:
    logging.info('Switching default LUCI_CONTEXT account to %r', account)
    local_auth['default_account_id'] = account

  with luci_context.write(_tmpdir=tmp_dir, local_auth=local_auth):
    yield
307
308
def process_command(command, out_dir, bot_file):
  """Expands the magic parameters in every argument of a command line.

  Args:
    command: list of command line arguments.
    out_dir: value substituted for ISOLATED_OUTDIR_PARAMETER.
    bot_file: value substituted for SWARMING_BOT_FILE_PARAMETER.

  Returns:
    A new list with one processed string per argument of |command|.

  Raises:
    ValueError if a parameter is requested in |command| but its value is not
    provided.
  """
  return [
      replace_parameters(token, out_dir, bot_file) for token in command
  ]
317
318
def replace_parameters(arg, out_dir, bot_file):
  """Expands the magic parameter tokens found in a single string.

  EXECUTABLE_SUFFIX_PARAMETER is always expanded. ISOLATED_OUTDIR_PARAMETER
  requires |out_dir|. SWARMING_BOT_FILE_PARAMETER is expanded only when
  |bot_file| is set; otherwise a warning is logged and the token is left in
  place.

  Raises:
    ValueError if a parameter is requested in |arg| but its value is not
    provided.
  """
  result = arg.replace(EXECUTABLE_SUFFIX_PARAMETER, cipd.EXECUTABLE_SUFFIX)
  path_substituted = False

  if ISOLATED_OUTDIR_PARAMETER in result:
    if not out_dir:
      raise ValueError(
          'output directory is requested in command or env var, but not '
          'provided; please specify one')
    result = result.replace(ISOLATED_OUTDIR_PARAMETER, out_dir)
    path_substituted = True

  if SWARMING_BOT_FILE_PARAMETER in result:
    if not bot_file:
      logging.warning('SWARMING_BOT_FILE_PARAMETER found in command or env '
                      'var, but no bot_file specified. Leaving parameter '
                      'unchanged.')
    else:
      result = result.replace(SWARMING_BOT_FILE_PARAMETER, bot_file)
      path_substituted = True

  # Slashes are converted to the native separator only when a path parameter
  # was expanded, to cover arguments like '${ISOLATED_OUTDIR}/foo/bar'.
  return result.replace('/', os.sep) if path_substituted else result
maruela9cfd6f2015-09-15 11:03:15 -0700348
349
def set_temp_dir(env, tmp_dir):
  """Points the temp directory variables of |env| at |tmp_dir|.

  |env| is a dictionary of environment variables and is modified in place.
  """
  tmp_dir = _to_str(tmp_dir)
  # pylint: disable=line-too-long
  # * python respects $TMPDIR, $TEMP, and $TMP in this order, regardless of
  #   platform. So $TMPDIR must be set on all platforms.
  #   https://github.com/python/cpython/blob/2.7/Lib/tempfile.py#L155
  env['TMPDIR'] = tmp_dir

  if sys.platform == 'win32':
    # * chromium's base utils uses GetTempPath().
    #   https://cs.chromium.org/chromium/src/base/files/file_util_win.cc?q=GetTempPath
    # * Go uses GetTempPath().
    # * GetTempDir() uses %TMP%, then %TEMP%, then other stuff. So %TMP% must
    #   be set.
    #   https://docs.microsoft.com/en-us/windows/desktop/api/fileapi/nf-fileapi-gettemppathw
    #   https://blogs.msdn.microsoft.com/oldnewthing/20150417-00/?p=44213
    platform_keys = ('TMP', 'TEMP')
  elif sys.platform == 'darwin':
    # * Chromium uses an hack on macOS before calling into
    #   NSTemporaryDirectory().
    #   https://cs.chromium.org/chromium/src/base/files/file_util_mac.mm?q=GetTempDir
    #   https://developer.apple.com/documentation/foundation/1409211-nstemporarydirectory
    platform_keys = ('MAC_CHROMIUM_TMPDIR',)
  else:
    # TMPDIR is specified as the POSIX standard envvar for the temp directory.
    # http://pubs.opengroup.org/onlinepubs/9699919799/basedefs/V1_chap08.html
    # * mktemp on linux respects $TMPDIR.
    # * Chromium respects $TMPDIR on linux.
    #   https://cs.chromium.org/chromium/src/base/files/file_util_posix.cc?q=GetTempDir
    # * Go uses $TMPDIR.
    #   https://go.googlesource.com/go/+/go1.10.3/src/os/file_unix.go#307
    platform_keys = ()

  for key in platform_keys:
    env[key] = tmp_dir
383
Roberto Carrillo71ade6d2018-10-08 22:30:24 +0000384
def get_command_env(tmp_dir, cipd_info, run_dir, env, env_prefixes, out_dir,
                    bot_file):
  """Returns full OS environment to run a command in.

  Sets up TEMP, puts directory with cipd binary in front of PATH, exposes
  CIPD_CACHE_DIR env var, and installs all env_prefixes.

  When |cipd_info| is set, its pins are also dumped as JSON to
  'cipd_info.json' inside |tmp_dir| and the path of that file is exposed as
  ISOLATED_RESOLVED_PACKAGE_VERSIONS_FILE.

  Args:
    tmp_dir: temp directory.
    cipd_info: CipdInfo object if cipd client is used, None if not.
    run_dir: The root directory the isolated tree is mapped in.
    env: environment variables to use. A variable with an empty value is
        removed from the resulting environment.
    env_prefixes: {"ENV_KEY": ['cwd', 'relative', 'paths', 'to', 'prepend']}
    out_dir: Isolated output directory. Required to be != None if any of the
        env vars contain ISOLATED_OUTDIR_PARAMETER.
    bot_file: Required to be != None if any of the env vars contain
        SWARMING_BOT_FILE_PARAMETER.

  Returns:
    A dict of environment variables, based on a copy of os.environ.

  Raises:
    ValueError if a value of |env| requests ISOLATED_OUTDIR_PARAMETER while
    |out_dir| is not provided (raised by replace_parameters).
  """
  out = os.environ.copy()
  for k, v in env.items():
    if not v:
      out.pop(k, None)
    else:
      out[k] = replace_parameters(v, out_dir, bot_file)

  if cipd_info:
    bin_dir = _to_str(os.path.dirname(cipd_info.client.binary_path))
    # PATH may be missing: either it was never set, or |env| carried an empty
    # PATH which removed it just above. Do not fail with KeyError then; the
    # cipd binary directory simply becomes the whole PATH.
    if 'PATH' in out:
      out['PATH'] = '%s%s%s' % (bin_dir, os.pathsep, out['PATH'])
    else:
      out['PATH'] = bin_dir
    out['CIPD_CACHE_DIR'] = _to_str(cipd_info.cache_dir)
    cipd_info_path = os.path.join(tmp_dir, 'cipd_info.json')
    with open(cipd_info_path, 'w') as f:
      json.dump(cipd_info.pins, f)
    out['ISOLATED_RESOLVED_PACKAGE_VERSIONS_FILE'] = cipd_info_path

  for key, paths in env_prefixes.items():
    assert isinstance(paths, list), paths
    # The prefixes are relative to |run_dir|; any current value of the
    # variable is kept at the end.
    paths = [os.path.normpath(os.path.join(run_dir, p)) for p in paths]
    cur = out.get(key)
    if cur:
      paths.append(cur)
    out[key] = _to_str(os.path.pathsep.join(paths))

  set_temp_dir(out, tmp_dir)
  return out
vadimsh232f5a82017-01-20 19:23:44 -0800429
430
def run_command(
    command, cwd, env, hard_timeout, grace_period, lower_priority, containment):
  """Runs the command.

  The command is started through subprocess42.Popen and waited on with
  |hard_timeout|. If that wait times out, or a stop signal is received while
  waiting, the process is sent terminate() and given |grace_period| to exit
  before kill() is sent.

  Args:
    command: command line to run, passed as-is to subprocess42.Popen.
    cwd: working directory of the process.
    env: environment of the process.
    hard_timeout: timeout for the first wait; a falsy value is passed on as
        None.
    grace_period: timeout for the wait that follows terminate(); a falsy value
        is passed on as None.
    lower_priority: passed as-is to subprocess42.Popen.
    containment: passed as-is to subprocess42.Popen.

  Returns:
    tuple(process exit code, bool if had a hard timeout)

    The exit code is 1 when an OSError is raised while starting or handling
    the process.
  """
  logging.info(
      'run_command(%s, %s, %s, %s, %s, %s)',
      command, cwd, hard_timeout, grace_period, lower_priority, containment)

  exit_code = None
  had_hard_timeout = False
  with tools.Profiler('RunTest'):
    proc = None
    # A list rather than a bool so that the nested handler() can record the
    # signal by mutating it.
    had_signal = []
    try:
      # TODO(maruel): This code is imperfect. It doesn't handle well signals
      # during the download phase and there's short windows were things can go
      # wrong.
      def handler(signum, _frame):
        # Only the first signal received once the process exists is acted
        # upon. It is surfaced as TimeoutExpired so that it goes through the
        # same termination path as a hard timeout.
        if proc and not had_signal:
          logging.info('Received signal %d', signum)
          had_signal.append(True)
          raise subprocess42.TimeoutExpired(command, None)

      proc = subprocess42.Popen(
          command, cwd=cwd, env=env, detached=True, close_fds=True,
          lower_priority=lower_priority, containment=containment)
      with subprocess42.set_signal_handler(subprocess42.STOP_SIGNALS, handler):
        try:
          exit_code = proc.wait(hard_timeout or None)
        except subprocess42.TimeoutExpired:
          # Raised either by wait() itself or by handler(); only the former is
          # reported as a hard timeout.
          if not had_signal:
            logging.warning('Hard timeout')
            had_hard_timeout = True
          logging.warning('Sending SIGTERM')
          proc.terminate()

      kill_sent = False
      # Ignore signals in grace period. Forcibly give the grace period to the
      # child process.
      if exit_code is None:
        ignore = lambda *_: None
        with subprocess42.set_signal_handler(subprocess42.STOP_SIGNALS, ignore):
          try:
            exit_code = proc.wait(grace_period or None)
          except subprocess42.TimeoutExpired:
            # Now kill for real. The user can distinguish between the
            # following states:
            # - signal but process exited within grace period,
            #   hard_timed_out will be set but the process exit code will be
            #   script provided.
            # - process exited late, exit code will be -9 on posix.
            logging.warning('Grace exhausted; sending SIGKILL')
            proc.kill()
            kill_sent = True
        logging.info('Waiting for process exit')
        exit_code = proc.wait()

      # the process group / job object may be dangling so if we didn't kill
      # it already, give it a poke now.
      if not kill_sent:
        proc.kill()
    except OSError as e:
      # This is not considered to be an internal error. The executable simply
      # does not exist.
      sys.stderr.write(
          '<The executable does not exist, a dependent library is missing or '
          'the command line is too long>\n'
          '<Check for missing .so/.dll in the .isolate or GN file or length of '
          'command line args>\n'
          '<Command: %s>\n'
          '<Exception: %s>\n' % (command, e))
      if os.environ.get('SWARMING_TASK_ID'):
        # Give an additional hint when running as a swarming task.
        sys.stderr.write(
            '<See the task\'s page for commands to help diagnose this issue '
            'by reproducing the task locally>\n')
      exit_code = 1
  # The mask renders a negative exit code as an unsigned 32-bit hex value.
  logging.info(
      'Command finished with exit code %d (%s)',
      exit_code, hex(0xffffffff & exit_code))
  return exit_code, had_hard_timeout
maruela9cfd6f2015-09-15 11:03:15 -0700515
516
def _run_go_cmd_and_wait(cmd, tmp_dir):
  """
  Runs an external Go command, `isolated` or `cas`, and wait for its completion.

  While this is a generic function to launch a subprocess, it has logic that
  is specific to Go `isolated` and `cas` for waiting and logging.

  The process is polled every 30 seconds, at most 100 times. A progress line
  is printed after each poll that times out.

  Args:
    cmd: command line to run, as a list of strings.
    tmp_dir: directory set as the temp directory in the process environment.

  Returns:
    The subprocess object

  Raises:
    subprocess42.CalledProcessError if the process exits with a non-zero code.
    ValueError if the process did not complete within the maximum timeout.
  """
  cmd_str = ' '.join(cmd)
  check_period_sec = 30
  max_checks = 100
  try:
    child_env = os.environ.copy()
    set_temp_dir(child_env, tmp_dir)
    proc = subprocess42.Popen(cmd, env=child_env)

    # max timeout = max_checks * check_period_sec = 50 minutes
    for attempt in range(max_checks):
      # This is to prevent I/O timeout error during setup.
      try:
        retcode = proc.wait(check_period_sec)
      except subprocess42.TimeoutExpired:
        print('still running (after %d seconds)' % (
            (attempt + 1) * check_period_sec))
        continue
      if retcode != 0:
        raise subprocess42.CalledProcessError(retcode, cmd=cmd_str)
      break
    else:
      # Every check timed out: stop the process, escalating to kill() when it
      # does not go away within one more check period.
      proc.terminate()
      try:
        proc.wait(check_period_sec)
      except subprocess42.TimeoutExpired:
        logging.exception(
            "failed to terminate? timeout happened after %d seconds",
            check_period_sec)
        proc.kill()
        proc.wait()
      # Raise unconditionally, because |proc| was forcefully terminated.
      raise ValueError("timedout after %d seconds (cmd=%s)" %
                       (check_period_sec * max_checks, cmd_str))

    return proc
  except Exception:
    logging.exception('Failed to run Go cmd %s', cmd_str)
    raise
Ye Kuangc0cf9ca2020-07-16 08:56:51 +0000566
567
def _fetch_and_map_with_cas(cas_client, digest, instance, output_dir, cache_dir,
                            policies, kvs_dir, tmp_dir):
  """
  Downloads a CAS tree into |output_dir| with the cas client and returns the
  download stats.

  If the client fails while |kvs_dir| is set, the failure is reported, the kvs
  directory is removed and the download is attempted one more time.

  Args:
    cas_client: path to the `cas` executable.
    digest: value passed as -digest.
    instance: value passed as -cas-instance.
    output_dir: directory the tree is created in.
    cache_dir: value passed as -cache-dir.
    policies: object providing max_cache_size and min_free_space.
    kvs_dir: value passed as -kvs-dir; the flag is omitted when falsy.
    tmp_dir: temp directory handed to the client process.

  Returns:
    dict with 'duration', 'items_cold' and 'items_hot'.
  """
  start = time.time()
  stats_fd, stats_path = tempfile.mkstemp(
      prefix=u'fetch-and-map-result-', suffix=u'.json')
  os.close(stats_fd)
  profile_dir = tempfile.mkdtemp(dir=tmp_dir)

  try:
    cache_flags = [
        '-cache-dir',
        cache_dir,
        '-cache-max-size',
        str(policies.max_cache_size),
        '-cache-min-free-space',
        str(policies.min_free_space),
    ]
    output_flags = [
        '-dir',
        output_dir,
        '-dump-stats-json',
        stats_path,
        '-log-level',
        'info',
    ]
    cmd = [cas_client, 'download', '-digest', digest, '-cas-instance', instance]
    cmd += cache_flags
    cmd += output_flags
    if kvs_dir:
      cmd += ['-kvs-dir', kvs_dir]

    try:
      _run_go_cmd_and_wait(cmd, tmp_dir)
    except subprocess42.CalledProcessError as ex:
      if not kvs_dir:
        raise
      logging.exception('Failed to run cas, removing kvs cache dir and retry.')
      on_error.report("Failed to run cas %s" % ex)
      file_path.rmtree(kvs_dir)
      _run_go_cmd_and_wait(cmd, tmp_dir)

    with open(stats_path) as stats_file:
      stats = json.load(stats_file)

    return {
        'duration': time.time() - start,
        'items_cold': stats['items_cold'],
        'items_hot': stats['items_hot'],
    }
  finally:
    # Both temporary artifacts are removed whatever the outcome.
    fs.remove(stats_path)
    file_path.rmtree(profile_dir)
Junji Watanabe4b890ef2020-09-16 01:43:27 +0000629
630
def _fetch_and_map_with_go_isolated(isolated_hash, storage, outdir,
                                    go_cache_dir, policies, isolated_client,
                                    tmp_dir):
  """Downloads an isolated tree into |outdir| using the Go isolated client.

  The client is asked to dump its fetch-and-map result into a temporary JSON
  file, which is parsed for the stats and always removed before returning.

  Arguments:
  - isolated_hash: value passed to the client's -isolated flag.
  - storage: object whose server_ref provides the server url and namespace.
  - outdir: directory passed to the client's -output-dir flag.
  - go_cache_dir: directory passed to the client's -cache-dir flag.
  - policies: object providing max_items, max_cache_size and min_free_space.
  - isolated_client: path to the Go isolated client executable.
  - tmp_dir: forwarded to _run_go_cmd_and_wait().

  Returns:
    dict with 'duration', 'items_cold', 'items_hot', 'initial_number_items'
    and 'initial_size'.
  """
  begin = time.time()
  ref = storage.server_ref
  fd, stats_path = tempfile.mkstemp(
      prefix=u'fetch-and-map-result-', suffix=u'.json')
  # Only the path is needed; the Go client writes the file itself.
  os.close(fd)
  try:
    source_flags = [
        '-isolate-server', ref.url,
        '-namespace', ref.namespace,
        '-isolated', isolated_hash,
    ]
    cache_flags = [
        '-cache-dir', go_cache_dir,
        '-cache-max-items', str(policies.max_items),
        '-cache-max-size', str(policies.max_cache_size),
        '-cache-min-free-space', str(policies.min_free_space),
    ]
    output_flags = [
        '-output-dir', outdir,
        '-fetch-and-map-result-json', stats_path,
    ]
    _run_go_cmd_and_wait(
        [isolated_client, 'download'] + source_flags + cache_flags +
        output_flags, tmp_dir)

    with open(stats_path) as f:
      fetched = json.load(f)

    stats = {'duration': time.time() - begin}
    for key in ('items_cold', 'items_hot', 'initial_number_items',
                'initial_size'):
      stats[key] = fetched[key]
    return stats
  finally:
    fs.remove(stats_path)
684
685
686# TODO(crbug.com/932396): remove this function.
def fetch_and_map(isolated_hash, storage, cache, outdir):
  """Fetches an isolated tree with the Python client and returns stats.

  Arguments:
  - isolated_hash: hash of the .isolated to fetch.
  - storage: storage object handed to isolateserver.fetch_isolated().
  - cache: cache object; its |added| and |used| lists feed the stats.
  - outdir: directory the tree is created in.

  Returns:
    dict with 'duration' and the base64 encoded, large.pack()'ed 'items_cold'
    and 'items_hot'.
  """
  begin = time.time()
  isolateserver.fetch_isolated(
      isolated_hash=isolated_hash,
      storage=storage,
      cache=cache,
      outdir=outdir,
      use_symlinks=False)

  def encode(values):
    return base64.b64encode(large.pack(sorted(values))).decode()

  # Multiset difference: what was used minus what had to be added. Those are
  # the items that were already present in the cache.
  used = collections.Counter(cache.used)
  added = collections.Counter(cache.added)
  hot_items = (used - added).elements()
  return {
      'duration': time.time() - begin,
      'items_cold': encode(cache.added),
      'items_hot': encode(hot_items),
  }
703
704
def link_outputs_to_outdir(run_dir, out_dir, outputs):
  """Makes every named output of |run_dir| available under |out_dir|.

  The directories needed for |outputs| are created in |out_dir| first, then
  each entry is handed to copy_recursively(). Nothing is done when |outputs|
  is empty or None.
  """
  if outputs:
    isolateserver.create_directories(out_dir, outputs)
    for name in outputs:
      origin = os.path.join(run_dir, name)
      target = os.path.join(out_dir, name)
      copy_recursively(origin, target)
715
716
def copy_recursively(src, dst):
  """Efficiently copies a file or directory from src to dst.

  `src` may be a file, directory, or a symlink to a file or directory.
  All symlinks are replaced with their targets, so the resulting
  directory structure in dst will never have any symlinks.

  To increase speed, copy_recursively links individual files into the
  (newly created) directory structure with file_path.HARDLINK_WITH_FALLBACK,
  unlike Python's shutil.copytree().

  Paths that do not exist, broken symlinks and cyclic symlink chains are
  logged and skipped. Any other OSError is logged too; none is propagated to
  the caller.
  """
  orig_src = src
  try:
    # Replace symlinks with their final target. os.path.realpath() may hand
    # back a path that is still a link when the chain loops, so remember every
    # link already followed to guarantee that this loop terminates.
    followed = set()
    while fs.islink(src):
      if src in followed:
        logging.warning('Path %s is part of a cyclic symlink chain (from %s)',
                        src, orig_src)
        return
      followed.add(src)
      res = fs.readlink(src)
      src = os.path.realpath(os.path.join(os.path.dirname(src), res))
    # NOTE: a link that points at one of its own ancestor directories is not
    # detected here; only loops in the link chain itself are.

    if not fs.exists(src):
      logging.warning('Path %s does not exist or %s is a broken symlink', src,
                      orig_src)
      return

    if fs.isfile(src):
      file_path.link_file(dst, src, file_path.HARDLINK_WITH_FALLBACK)
      return

    if not fs.exists(dst):
      os.makedirs(dst)

    for child in fs.listdir(src):
      copy_recursively(os.path.join(src, child), os.path.join(dst, child))

  except OSError as e:
    if e.errno == errno.ENOENT:
      logging.warning('Path %s does not exist or %s is a broken symlink',
                      src, orig_src)
    else:
      logging.info("Couldn't collect output file %s: %s", src, e)
aludwin0a8e17d2016-10-27 15:57:39 -0700757
758
def _upload_with_py(storage, out_dir):
  """Archives |out_dir| to |storage| with the Python isolateserver client.

  Returns:
    tuple(isolated, cold, hot)
    - isolated: first value of the results returned by the archival.
    - cold, hot: base64 encoded, large.pack()'ed sorted sizes of the cold and
      hot items reported by the archival.

  Raises:
    isolateserver.Aborted: re-raised after a note is written to stderr.
  """

  def encode_sizes(entries):
    sizes = [entry.size for entry in entries]
    sizes.sort()
    return base64.b64encode(large.pack(sizes)).decode()

  try:
    results, f_cold, f_hot = isolateserver.archive_files_to_storage(
        storage, [out_dir], None, verify_push=True)
    return (list(results.values())[0], encode_sizes(f_cold),
            encode_sizes(f_hot))
  except isolateserver.Aborted:
    # A SIGTERM was received while data was being uploaded. Two causes:
    # - The task was too slow and was about to be killed anyway because it
    #   exceeded the hard timeout.
    # - The amount of data uploaded back is very large and took too much time
    #   to archive.
    sys.stderr.write('Received SIGTERM while uploading')
    # Re-raise, so it will be treated as an internal failure.
    raise
784
785
def upload_out_dir(storage, out_dir):
  """Archives the content of |out_dir| to |storage|, if there is any.

  A .isolated is generated out of the directory, but only when it exists and
  has at least one entry in it.

  Returns:
    tuple(outputs_ref, stats)
    - outputs_ref: dict with 'isolated', 'isolatedserver' and 'namespace'
      referring to the archived results, or None when nothing was uploaded.
    - stats: dict with 'duration', 'items_cold' and 'items_hot'; the latter
      two are empty strings when nothing was uploaded.
  """
  begin = time.time()
  outputs_ref = None
  cold = hot = ''

  if fs.isdir(out_dir) and fs.listdir(out_dir):
    with tools.Profiler('ArchiveOutput'):
      isolated, cold, hot = _upload_with_py(storage, out_dir)
      outputs_ref = {
          'isolated': isolated,
          'isolatedserver': storage.server_ref.url,
          'namespace': storage.server_ref.namespace,
      }

  elapsed = time.time() - begin
  return outputs_ref, {
      'duration': elapsed,
      'items_cold': cold,
      'items_hot': hot,
  }
maruela9cfd6f2015-09-15 11:03:15 -0700817
818
def upload_outdir_with_cas(cas_client, cas_instance, outdir, tmp_dir):
  """Archives |outdir| to CAS with the cas client.

  The client dumps the root digest and its stats into two temporary files,
  which are parsed and always removed before returning.

  Arguments:
  - cas_client: path to the cas client executable.
  - cas_instance: value passed to the client's -cas-instance flag.
  - outdir: directory to archive.
  - tmp_dir: forwarded to _run_go_cmd_and_wait().

  Returns:
    tuple(cas_output_root, stats)
    - cas_output_root: dict with 'cas_instance' and 'digest', the latter
      holding 'hash' and 'size_bytes' of the uploaded root.
    - stats: the stats dumped by the client plus 'duration'.
  """
  fd, digest_path = tempfile.mkstemp(prefix=u'cas-digest', suffix=u'.txt')
  os.close(fd)
  fd, stats_json_path = tempfile.mkstemp(
      prefix=u'upload-stats', suffix=u'.json')
  os.close(fd)

  try:
    archive_cmd = [cas_client, 'archive', '-cas-instance', cas_instance]
    # Format: <working directory>:<relative path to dir>
    archive_cmd += ['-paths', outdir + ':']
    # Files the client writes its output to.
    archive_cmd += [
        '-dump-digest', digest_path,
        '-dump-stats-json', stats_json_path,
    ]

    begin = time.time()
    _run_go_cmd_and_wait(archive_cmd, tmp_dir)

    # The digest file holds '<hash>/<size>'.
    with open(digest_path) as f:
      content = f.read()
    digest_hash, digest_size = content.split('/')
    cas_output_root = {
        'cas_instance': cas_instance,
        'digest': {
            'hash': digest_hash,
            'size_bytes': int(digest_size),
        },
    }

    with open(stats_json_path) as f:
      stats = json.load(f)
    stats['duration'] = time.time() - begin

    return cas_output_root, stats
  finally:
    fs.remove(digest_path)
    fs.remove(stats_json_path)
873
874
def map_and_run(data, constant_run_path):
  """Runs a command with optional isolated input/output.

  Sets up the run, output, temporary and client directories under
  data.root_dir, installs packages, fetches the inputs (isolated or CAS), runs
  the command, uploads the outputs and finally removes the directories unless
  data.leak_temp_dir is set.

  Arguments:
  - data: TaskData instance.
  - constant_run_path: if true (and data.root_dir is set), the run directory
      is the fixed path <root_dir>/ISOLATED_RUN_DIR, which is wiped and
      recreated; otherwise a new directory is made with make_temp_dir().

  Returns metadata about the result, as a dict. 'internal_failure' is only
  reset to None when the whole sequence ran to completion.
  """

  if data.isolate_cache:
    download_stats = {
        #'duration': 0.,
        'initial_number_items': len(data.isolate_cache),
        'initial_size': data.isolate_cache.total_size,
        #'items_cold': '<large.pack()>',
        #'items_hot': '<large.pack()>',
    }
  else:
    # TODO(tikuta): take stats from state.json in this case too.
    download_stats = {}

  result = {
      'duration': None,
      'exit_code': None,
      'had_hard_timeout': False,
      'internal_failure': 'run_isolated did not complete properly',
      'stats': {
          'trim_caches': {
              'duration': 0,
          },
          #'cipd': {
          #  'duration': 0.,
          #  'get_client_duration': 0.,
          #},
          'isolated': {
              'download': download_stats,
              #'upload': {
              #  'duration': 0.,
              #  'items_cold': '<large.pack()>',
              #  'items_hot': '<large.pack()>',
              #},
          },
          'named_caches': {
              'install': {
                  'duration': 0,
              },
              'uninstall': {
                  'duration': 0,
              },
          },
          'cleanup': {
              'duration': 0,
          }
      },
      #'cipd_pins': {
      #  'packages': [
      #    {'package_name': ..., 'version': ..., 'path': ...},
      #    ...
      #  ],
      #  'client_package': {'package_name': ..., 'version': ...},
      #},
      'outputs_ref': None,
      'cas_output_root': None,
      'version': 5,
  }

  assert os.path.isabs(data.root_dir), ("data.root_dir is not abs path: %s" %
                                        data.root_dir)
  file_path.ensure_tree(data.root_dir, 0o700)

  # See comment for these constants.
  # TODO(maruel): This is not obvious. Change this to become an error once we
  # make the constant_run_path an exposed flag.
  if constant_run_path and data.root_dir:
    run_dir = os.path.join(data.root_dir, ISOLATED_RUN_DIR)
    if os.path.isdir(run_dir):
      file_path.rmtree(run_dir)
    os.mkdir(run_dir, 0o700)
  else:
    run_dir = make_temp_dir(ISOLATED_RUN_DIR, data.root_dir)

  # True if CAS is used for download/upload files.
  use_cas = bool(data.cas_digest)

  # storage should be normally set but don't crash if it is not. This can happen
  # as Swarming task can run without an isolate server.
  out_dir = None
  if data.storage or use_cas:
    out_dir = make_temp_dir(ISOLATED_OUT_DIR, data.root_dir)
  tmp_dir = make_temp_dir(ISOLATED_TMP_DIR, data.root_dir)
  isolated_client_dir = make_temp_dir(ISOLATED_CLIENT_DIR, data.root_dir)
  cwd = run_dir
  if data.relative_cwd:
    cwd = os.path.normpath(os.path.join(cwd, data.relative_cwd))
  command = data.command
  go_isolated_client = None
  if data.use_go_isolated:
    go_isolated_client = os.path.join(isolated_client_dir,
                                      'isolated' + cipd.EXECUTABLE_SUFFIX)

  cas_client = None
  cas_client_dir = make_temp_dir(_CAS_CLIENT_DIR, data.root_dir)
  if use_cas:
    cas_client = os.path.join(cas_client_dir, 'cas' + cipd.EXECUTABLE_SUFFIX)

  data.trim_caches_fn(result['stats']['trim_caches'])

  try:
    with data.install_packages_fn(run_dir, isolated_client_dir,
                                  cas_client_dir) as cipd_info:
      if cipd_info:
        result['stats']['cipd'] = cipd_info.stats
        result['cipd_pins'] = cipd_info.pins

      isolated_stats = result['stats'].setdefault('isolated', {})
      if data.isolated_hash:
        if data.use_go_isolated:
          stats = _fetch_and_map_with_go_isolated(
              isolated_hash=data.isolated_hash,
              storage=data.storage,
              outdir=run_dir,
              go_cache_dir=data.go_cache_dir,
              policies=data.go_cache_policies,
              isolated_client=go_isolated_client,
              tmp_dir=tmp_dir)
        else:
          stats = fetch_and_map(
              isolated_hash=data.isolated_hash,
              storage=data.storage,
              cache=data.isolate_cache,
              outdir=run_dir)
        isolated_stats['download'].update(stats)

      elif data.cas_digest:
        stats = _fetch_and_map_with_cas(
            cas_client=cas_client,
            digest=data.cas_digest,
            instance=data.cas_instance,
            output_dir=run_dir,
            cache_dir=data.cas_cache_dir,
            policies=data.cas_cache_policies,
            kvs_dir=data.cas_kvs,
            tmp_dir=tmp_dir)
        isolated_stats['download'].update(stats)

      if not command:
        # Handle this as a task failure, not an internal failure.
        sys.stderr.write(
            '<No command was specified!>\n'
            '<Please secify a command when triggering your Swarming task>\n')
        result['exit_code'] = 1
        return result

      # Compare against run_dir plus a trailing separator: a bare string
      # prefix test would also accept sibling directories whose name merely
      # starts with run_dir's name, e.g. relative_cwd '../<run_dir name>-x'.
      if cwd != run_dir and not cwd.startswith(os.path.join(run_dir, '')):
        # Handle this as a task failure, not an internal failure. This is a
        # 'last chance' way to gate against directory escape.
        sys.stderr.write('<Relative CWD is outside of run directory!>\n')
        result['exit_code'] = 1
        return result

      if not os.path.isdir(cwd):
        # Accepts relative_cwd that does not exist.
        os.makedirs(cwd, 0o700)

      # If we have an explicit list of files to return, make sure their
      # directories exist now.
      if data.storage and data.outputs:
        isolateserver.create_directories(run_dir, data.outputs)

      with data.install_named_caches(run_dir, result['stats']['named_caches']):
        sys.stdout.flush()
        start = time.time()
        try:
          # Need to switch the default account before 'get_command_env' call,
          # so it can grab correct value of LUCI_CONTEXT env var.
          with set_luci_context_account(data.switch_to_account, tmp_dir):
            env = get_command_env(
                tmp_dir, cipd_info, run_dir, data.env, data.env_prefix, out_dir,
                data.bot_file)
            command = tools.find_executable(command, env)
            command = process_command(command, out_dir, data.bot_file)
            file_path.ensure_command_has_abs_path(command, cwd)

            result['exit_code'], result['had_hard_timeout'] = run_command(
                command, cwd, env, data.hard_timeout, data.grace_period,
                data.lower_priority, data.containment)
        finally:
          # Recorded even when running the command raised.
          result['duration'] = max(time.time() - start, 0)

      if out_dir:
        # Try to link files to the output directory, if specified.
        link_outputs_to_outdir(run_dir, out_dir, data.outputs)
        isolated_stats = result['stats'].setdefault('isolated', {})
        if use_cas:
          result['cas_output_root'], isolated_stats['upload'] = (
              upload_outdir_with_cas(cas_client, data.cas_instance, out_dir,
                                     tmp_dir))
        else:
          # This could use |go_isolated_client|, so make sure it runs when the
          # CIPD package still exists.
          result['outputs_ref'], isolated_stats['upload'] = (
              upload_out_dir(data.storage, out_dir))
    # We successfully ran the command, set internal_failure back to
    # None (even if the command failed, it's not an internal error).
    result['internal_failure'] = None
  except Exception as e:
    # An internal error occurred. Report accordingly so the swarming task will
    # be retried automatically.
    logging.exception('internal failure: %s', e)
    result['internal_failure'] = str(e)
    on_error.report(None)

  # Clean up
  finally:
    try:
      cleanup_start = time.time()
      success = True
      if data.leak_temp_dir:
        logging.warning(
            'Deliberately leaking %s for later examination', run_dir)
      else:
        # On Windows the rmtree(run_dir) call below has a synchronization
        # effect: it finishes only when all task child processes terminate
        # (since a running process locks *.exe file). out_dir is removed after
        # run_dir (since child processes may write to out_dir too and we need
        # to wait for them to finish).
        dirs_to_remove = [run_dir, tmp_dir, isolated_client_dir, cas_client_dir]
        if out_dir:
          dirs_to_remove.append(out_dir)
        for directory in dirs_to_remove:
          if not fs.isdir(directory):
            continue
          start = time.time()
          try:
            file_path.rmtree(directory)
          except OSError as e:
            logging.error('rmtree(%r) failed: %s', directory, e)
            success = False
          finally:
            logging.info('Cleanup: rmtree(%r) took %d seconds', directory,
                         time.time() - start)
          if not success:
            sys.stderr.write(
                OUTLIVING_ZOMBIE_MSG % (directory, data.grace_period))
            # Dump the process list to stderr to help find what is still
            # holding on to the directory.
            if sys.platform == 'win32':
              subprocess42.check_call(['tasklist.exe', '/V'], stdout=sys.stderr)
            else:
              subprocess42.check_call(['ps', 'axu'], stdout=sys.stderr)
            if result['exit_code'] == 0:
              result['exit_code'] = 1

      if not success and result['exit_code'] == 0:
        result['exit_code'] = 1
    except Exception as e:
      # Swallow any exception in the main finally clause.
      if out_dir:
        logging.exception('Leaking out_dir %s: %s', out_dir, e)
      result['internal_failure'] = str(e)
      on_error.report(None)
    finally:
      cleanup_duration = time.time() - cleanup_start
      result['stats']['cleanup']['duration'] = cleanup_duration
      logging.info('Cleanup: removing directories took %d seconds',
                   cleanup_duration)
  return result
Marc-Antoine Ruel2283ad12014-02-09 11:14:57 -05001142
1143
def run_tha_test(data, result_json):
  """Runs the task through map_and_run() and reports its metadata.

  When |result_json| is set, a placeholder is written there before the task
  starts, in case the process gets killed, and is overwritten with the real
  metadata once the task is done. Otherwise a reference to the uploaded
  outputs, if any, is printed inline on stdout.

  Arguments:
  - data: TaskData instance.
  - result_json: File path to dump result metadata into. If set, the process
      exit code is always 0 unless an internal error occurred.

  Returns:
    Process exit code that should be used.
  """
  if result_json:
    # Write a json output file right away in case we get killed.
    tools.write_json(
        result_json, {
            'exit_code': None,
            'had_hard_timeout': False,
            'internal_failure': 'Was terminated before completion',
            'outputs_ref': None,
            'cas_output_root': None,
            'version': 5,
        },
        dense=True)

  # The exit code of run_isolated depends on whether result_json is used.
  result = map_and_run(data, True)
  logging.info('Result:\n%s', tools.format_json(result, dense=True))

  if not result_json:
    # Marshall into old-style inline output.
    outputs_ref = result['outputs_ref']
    if outputs_ref:
      # pylint: disable=unsubscriptable-object
      inline = {
          'hash': outputs_ref['isolated'],
          'namespace': outputs_ref['namespace'],
          'storage': outputs_ref['isolatedserver'],
      }
      sys.stdout.flush()
      print('[run_isolated_out_hack]%s[/run_isolated_out_hack]' %
            tools.format_json(inline, dense=True))
      sys.stdout.flush()
    return result['exit_code'] or int(bool(result['internal_failure']))

  # We've found tests to delete 'work' when quitting, causing an exception
  # here. Try to recreate the directory if necessary.
  file_path.ensure_tree(os.path.dirname(result_json))
  tools.write_json(result_json, result, dense=True)
  # Only return 1 if there was an internal error.
  return int(bool(result['internal_failure']))
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001200
1201
# Bundle yielded by 'install_client_and_packages'.
CipdInfo = collections.namedtuple(
    'CipdInfo',
    (
        # cipd.CipdClient object.
        'client',
        # Absolute path to bot-global cipd tag and instance cache.
        'cache_dir',
        # Dict with stats to return to the server.
        'stats',
        # Dict with installed cipd pins to return to the server.
        'pins',
    ))
1209
1210
@contextlib.contextmanager
def noop_install_packages(_run_dir, _isolated_dir, _cas_dir):
  """Stand-in for 'install_client_and_packages' when cipd is disabled.

  Ignores all its arguments and yields None instead of a CipdInfo.
  """
  cipd_info = None
  yield cipd_info
1215
1216
Takuto Ikuta2efc7792019-11-27 14:33:34 +00001217def _install_packages(run_dir, cipd_cache_dir, client, packages):
iannuccib58d10d2017-03-18 02:00:25 -07001218 """Calls 'cipd ensure' for packages.
1219
1220 Args:
1221 run_dir (str): root of installation.
1222 cipd_cache_dir (str): the directory to use for the cipd package cache.
1223 client (CipdClient): the cipd client to use
1224 packages: packages to install, list [(path, package_name, version), ...].
iannuccib58d10d2017-03-18 02:00:25 -07001225
1226 Returns: list of pinned packages. Looks like [
1227 {
1228 'path': 'subdirectory',
1229 'package_name': 'resolved/package/name',
1230 'version': 'deadbeef...',
1231 },
1232 ...
1233 ]
1234 """
1235 package_pins = [None]*len(packages)
1236 def insert_pin(path, name, version, idx):
1237 package_pins[idx] = {
1238 'package_name': name,
1239 # swarming deals with 'root' as '.'
1240 'path': path or '.',
1241 'version': version,
1242 }
1243
1244 by_path = collections.defaultdict(list)
1245 for i, (path, name, version) in enumerate(packages):
1246 # cipd deals with 'root' as ''
1247 if path == '.':
1248 path = ''
1249 by_path[path].append((name, version, i))
1250
1251 pins = client.ensure(
Takuto Ikuta2efc7792019-11-27 14:33:34 +00001252 run_dir,
1253 {
1254 subdir: [(name, vers) for name, vers, _ in pkgs
1255 ] for subdir, pkgs in by_path.items()
1256 },
1257 cache_dir=cipd_cache_dir,
iannuccib58d10d2017-03-18 02:00:25 -07001258 )
1259
Marc-Antoine Ruel04903a32019-10-09 21:09:25 +00001260 for subdir, pin_list in sorted(pins.items()):
iannuccib58d10d2017-03-18 02:00:25 -07001261 this_subdir = by_path[subdir]
1262 for i, (name, version) in enumerate(pin_list):
1263 insert_pin(subdir, name, version, this_subdir[i][2])
1264
Robert Iannucci461b30d2017-12-13 11:34:03 -08001265 assert None not in package_pins, (packages, pins, package_pins)
iannuccib58d10d2017-03-18 02:00:25 -07001266
1267 return package_pins
1268
1269
@contextlib.contextmanager
def install_client_and_packages(run_dir, packages, service_url,
                                client_package_name, client_version, cache_dir,
                                isolated_dir, cas_dir):
  """Bootstraps the CIPD client, then installs CIPD packages with it.

  This is a context manager. It yields a single CipdInfo object that bundles
  the CIPD client, the CIPD cache directory, timing stats and the pins.

  The pins are reported as:
    {
      "client_package": {"package_name": package_name, "version": version},
      "packages": <value returned by _install_packages() for 'packages'>,
    }

  The package pins correspond 1:1 to the input package arguments from the
  command line. These dictionaries make their way all the way back to
  swarming, where they become the arguments of CipdPackage.

  When 'packages' is empty or None, the CIPD client is still bootstrapped but
  no package is installed into |run_dir|; "packages" is then an empty list.

  Regardless of 'packages', the isolated client is installed into
  |isolated_dir| and the cas client into |cas_dir|, both at
  _LUCI_GO_REVISION. Once everything is installed, the files under |run_dir|
  are made read only.

  The bootstrapped client (regardless whether 'packages' list is empty or not),
  will be made available to the task via $PATH.

  Args:
    run_dir (str): root of installation.
    packages: packages to install, list [(path, package_name, version), ...].
    service_url (str): CIPD server url, e.g.
        "https://chrome-infra-packages.appspot.com."
    client_package_name (str): CIPD package name of CIPD client.
    client_version (str): Version of CIPD client.
    cache_dir (str): where to keep cache of cipd clients, packages and tags.
        Must not be empty.
    isolated_dir (str): where to download isolated client.
    cas_dir (str): where to download cas client.
  """
  assert cache_dir

  begin = time.time()

  cache_dir = os.path.abspath(cache_dir)
  # Tag and instance caches live in a dedicated sub directory.
  cipd_cache_dir = os.path.join(cache_dir, 'cache')
  run_dir = os.path.abspath(run_dir)
  requested = packages or []

  client_begin = time.time()
  manager = cipd.get_client(cache_dir, service_url, client_package_name,
                            client_version)

  with manager as client:
    get_client_duration = time.time() - client_begin

    if requested:
      package_pins = _install_packages(run_dir, cipd_cache_dir, client,
                                       requested)
    else:
      package_pins = []

    # Install the isolated client to |isolated_dir|, then the cas client to
    # |cas_dir|. Both are always installed; their pins are not reported.
    go_clients = (
        (isolated_dir, ISOLATED_PACKAGE),
        (cas_dir, _CAS_PACKAGE),
    )
    for target_dir, package_name in go_clients:
      _install_packages(target_dir, cipd_cache_dir, client,
                        [('', package_name, _LUCI_GO_REVISION)])

    file_path.make_tree_files_read_only(run_dir)

    total_duration = time.time() - begin
    logging.info('Installing CIPD client and packages took %d seconds',
                 total_duration)

    stats = {
        'duration': total_duration,
        'get_client_duration': get_client_duration,
    }
    pins = {
        'client_package': {
            'package_name': client.package_name,
            'version': client.instance_id,
        },
        'packages': package_pins,
    }
    yield CipdInfo(
        client=client, cache_dir=cipd_cache_dir, stats=stats, pins=pins)
nodirbe642ff2016-06-09 15:51:51 -07001357
1358
def create_option_parser():
  """Builds the option parser describing the run_isolated command line.

  The parser is a logging_utils.OptionParserWithLogging. On top of the general
  options, it registers the isolate server, CAS, cache, CIPD, named cache,
  process containment, debugging and authentication options.

  Returns:
    The fully configured parser; its 'cache' default is set to 'cache'.
  """
  parser = logging_utils.OptionParserWithLogging(
      usage='%prog <options> [command to run or extra args]',
      version=__version__,
      log_file=RUN_ISOLATED_LOG_FILE)
  parser.add_option(
      '--clean',
      action='store_true',
      help='Cleans the cache, trimming it necessary and remove corrupted items '
      'and returns without executing anything; use with -v to know what '
      'was done')
  parser.add_option(
      '--json',
      help='dump output metadata to json file. When used, run_isolated returns '
      'non-zero only on internal failure')
  parser.add_option(
      '--hard-timeout', type='float', help='Enforce hard timeout in execution')
  parser.add_option(
      '--grace-period',
      type='float',
      help='Grace period between SIGTERM and SIGKILL')
  parser.add_option(
      '--relative-cwd',
      help='Ignore the isolated \'relative_cwd\' and use this one instead')
  parser.add_option(
      '--env',
      default=[],
      action='append',
      help='Environment variables to set for the child process')
  parser.add_option(
      '--env-prefix',
      default=[],
      action='append',
      help='Specify a VAR=./path/fragment to put in the environment variable '
      'before executing the command. The path fragment must be relative '
      'to the isolated run directory, and must not contain a `..` token. '
      'The path will be made absolute and prepended to the indicated '
      '$VAR using the OS\'s path separator. Multiple items for the same '
      '$VAR will be prepended in order.')
  parser.add_option(
      '--bot-file',
      help='Path to a file describing the state of the host. The content is '
      'defined by on_before_task() in bot_config.')
  parser.add_option(
      '--switch-to-account',
      help='If given, switches LUCI_CONTEXT to given logical service account '
      '(e.g. "task" or "system") before launching the isolated process.')
  parser.add_option(
      '--output',
      action='append',
      help='Specifies an output to return. If no outputs are specified, all '
      'files located in $(ISOLATED_OUTDIR) will be returned; '
      'otherwise, outputs in both $(ISOLATED_OUTDIR) and those '
      'specified by --output option (there can be multiple) will be '
      'returned. Note that if a file in OUT_DIR has the same path '
      'as an --output option, the --output version will be returned.')
  parser.add_option(
      '-a',
      '--argsfile',
      # This is actually handled in parse_args; it's included here purely so it
      # can make it into the help text.
      help='Specify a file containing a JSON array of arguments to this '
      'script. If --argsfile is provided, no other argument may be '
      'provided on the command line.')
  parser.add_option(
      '--report-on-exception',
      action='store_true',
      help='Whether report exception during execution to isolate server. '
      'This flag should only be used in swarming bot.')

  group = optparse.OptionGroup(parser, 'Data source - Isolate server')
  # Deprecated. Isolate server is being migrated to RBE-CAS.
  # Remove --isolated and isolate server options after migration.
  group.add_option(
      '-s', '--isolated',
      help='Hash of the .isolated to grab from the isolate server.')
  isolateserver.add_isolate_server_options(group)
  parser.add_option_group(group)

  group = optparse.OptionGroup(parser,
                               'Data source - Content Addressed Storage')
  group.add_option(
      '--cas-instance', help='Full CAS instance name for input/output files.')
  group.add_option(
      '--cas-digest',
      help='Digest of the input root on RBE-CAS. The format is '
      '`{hash}/{size_bytes}`.')
  parser.add_option_group(group)

  # Cache options.
  isolateserver.add_cache_options(parser)
  add_cas_cache_options(parser)

  cipd.add_cipd_options(parser)

  group = optparse.OptionGroup(parser, 'Named caches')
  group.add_option(
      '--named-cache',
      dest='named_caches',
      action='append',
      nargs=3,
      default=[],
      help='A named cache to request. Accepts 3 arguments: name, path, hint. '
      'name identifies the cache, must match regex [a-z0-9_]{1,4096}. '
      'path is a path relative to the run dir where the cache directory '
      'must be put to. '
      'This option can be specified more than once.')
  group.add_option(
      '--named-cache-root',
      default='named_caches',
      help='Cache root directory. Default=%default')
  parser.add_option_group(group)

  # These options must be registered on the group (not on the parser),
  # otherwise the 'Process containment' section of --help is empty and the
  # options are listed among the general ones. Parsing is unaffected: a group
  # shares its option mappings and defaults with its parser.
  group = optparse.OptionGroup(parser, 'Process containment')
  group.add_option(
      '--lower-priority', action='store_true',
      help='Lowers the child process priority')
  group.add_option(
      '--containment-type',
      choices=('NONE', 'AUTO', 'JOB_OBJECT'),
      default='NONE',
      help='Type of container to use')
  group.add_option(
      '--limit-processes',
      type='int',
      default=0,
      help='Maximum number of active processes in the containment')
  group.add_option(
      '--limit-total-committed-memory',
      type='int',
      default=0,
      help='Maximum sum of committed memory in the containment')
  parser.add_option_group(group)

  group = optparse.OptionGroup(parser, 'Debugging')
  group.add_option(
      '--leak-temp-dir',
      action='store_true',
      help='Deliberately leak isolate\'s temp dir for later examination. '
      'Default: %default')
  group.add_option('--root-dir', help='Use a directory instead of a random one')
  parser.add_option_group(group)

  auth.add_auth_options(parser)

  parser.set_defaults(cache='cache')
  return parser
1506
1507
def add_cas_cache_options(parser):
  """Registers the 'CAS cache management' option group on |parser|.

  The group holds two options:
    --cas-cache: directory of the local CAS cache, 'cas-cache' by default.
    --kvs-dir: CAS cache dir using kvs for small files, empty by default.

  Args:
    parser: optparse parser the option group is attached to.
  """
  # (flag, keyword arguments of add_option) for each option of the group.
  option_specs = (
      ('--cas-cache', {
          'metavar': 'DIR',
          'default': 'cas-cache',
          'help': 'Directory to keep a local cache of the files. Accelerates '
                  'download by reusing already downloaded files. '
                  'Default=%default',
      }),
      ('--kvs-dir', {
          'default': '',
          'help': 'CAS cache dir using kvs for small files. Default=%default',
      }),
  )
  cas_group = optparse.OptionGroup(parser, 'CAS cache management')
  for flag, settings in option_specs:
    cas_group.add_option(flag, **settings)
  parser.add_option_group(cas_group)
1521
1522
def process_cas_cache_options(options):
  """Returns the content addressed cache selected by --cas-cache.

  Args:
    options: parsed options; reads cas_cache, max_cache_size and
        min_free_space.

  Returns:
    A local_caching.DiskContentAddressedCache rooted at the absolute path of
    options.cas_cache (created with trim=False), or a
    local_caching.MemoryContentAddressedCache when options.cas_cache is empty.
  """
  if not options.cas_cache:
    return local_caching.MemoryContentAddressedCache()

  cache_policies = local_caching.CachePolicies(
      max_cache_size=options.max_cache_size,
      min_free_space=options.min_free_space,
      # max_items isn't used for CAS cache for now.
      max_items=None,
      max_age_secs=MAX_AGE_SECS)
  cache_dir = six.text_type(os.path.abspath(options.cas_cache))
  return local_caching.DiskContentAddressedCache(
      cache_dir, cache_policies, trim=False)
1535
1536
def process_named_cache_options(parser, options, time_fn=None):
  """Validates the named cache options and builds the matching NamedCache.

  Every (name, path, hint) triple of options.named_caches is checked: the name
  must match CACHE_NAME_RE, the path must not be empty and the hint must be
  convertible with int(). Failures are reported through parser.error().

  Args:
    parser: option parser, used to report invalid values.
    options: parsed options; reads named_caches, named_cache_root and
        min_free_space.
    time_fn: forwarded as is to local_caching.NamedCache.

  Returns:
    A local_caching.NamedCache rooted at the absolute path of
    options.named_cache_root, on which every requested cache was touched, or
    None when options.named_cache_root is empty.
  """
  requested = options.named_caches
  cache_root = options.named_cache_root

  if requested and not cache_root:
    parser.error('--named-cache is specified, but --named-cache-root is empty')

  for name, path, hint in requested:
    if not CACHE_NAME_RE.match(name):
      parser.error(
          'cache name %r does not match %r' % (name, CACHE_NAME_RE.pattern))
    if not path:
      parser.error('cache path cannot be empty')
    try:
      int(hint)
    except ValueError:
      parser.error('cache hint must be a number')

  if not cache_root:
    return None

  # Make these configurable later if there is use case but for now it's fairly
  # safe values.
  # In practice, a fair chunk of bots are already recycled on a daily schedule
  # so this code doesn't have any effect to them, unless they are preloaded
  # with a really old cache.
  one_tib = 1024 * 1024 * 1024 * 1024
  cache_policies = local_caching.CachePolicies(
      max_cache_size=one_tib,
      min_free_space=options.min_free_space,
      max_items=50,
      max_age_secs=MAX_AGE_SECS)
  abs_root = six.text_type(os.path.abspath(cache_root))
  named_cache = local_caching.NamedCache(
      abs_root, cache_policies, time_fn=time_fn)
  # Touch any named caches we're going to use to minimize thrashing
  # between tasks that request some (but not all) of the same named caches.
  requested_names = [name for name, _, _ in requested]
  named_cache.touch(*requested_names)
  return named_cache
1570
1571
def _strtobool(value):
  """Converts a truth value string to 1 or 0.

  Behaves like distutils.util.strtobool(), which it replaces because distutils
  is deprecated and no longer shipped with Python 3.12 and later.

  Args:
    value (str): one of y, yes, t, true, on, 1 (true) or n, no, f, false, off,
        0 (false); case insensitive.

  Returns:
    1 for a true value, 0 for a false one.

  Raises:
    ValueError: if value is none of the accepted strings.
  """
  lowered = value.lower()
  if lowered in ('y', 'yes', 't', 'true', 'on', '1'):
    return 1
  if lowered in ('n', 'no', 'f', 'false', 'off', '0'):
    return 0
  raise ValueError('invalid truth value %r' % (lowered,))


def parse_args(args):
  """Parses the command line, loading it from --argsfile when requested.

  Args:
    args: list of command line arguments, without the program name.

  Returns:
    Tuple (parser, options, args): the parser made by create_option_parser(),
    the parsed options and the remaining positional arguments.
    options.cipd_enabled is normalized to a bool/int.
  """
  # Create a fake mini-parser just to get out the "-a" command. Note that
  # it's not documented here; instead, it's documented in create_option_parser
  # even though that parser will never actually get to parse it. This is
  # because --argsfile is exclusive with all other options and arguments.
  file_argparse = argparse.ArgumentParser(add_help=False)
  file_argparse.add_argument('-a', '--argsfile')
  (file_args, nonfile_args) = file_argparse.parse_known_args(args)
  if file_args.argsfile:
    if nonfile_args:
      # Mind the trailing space: the two literals are concatenated.
      file_argparse.error('Can\'t specify --argsfile with '
                          'any other arguments (%s)' % nonfile_args)
    try:
      with open(file_args.argsfile, 'r') as f:
        args = json.load(f)
    except (IOError, OSError, ValueError) as e:
      # We don't error out here: "args" is left untouched, i.e. it still only
      # holds the --argsfile flag, and is handed to the regular parser below.
      print('Couldn\'t read arguments: %s' % e, file=sys.stderr)

  # Even if we failed to read the args, just call the normal parser now.
  parser = create_option_parser()
  options, args = parser.parse_args(args)
  if not isinstance(options.cipd_enabled, (bool, int)):
    # The value came in as a string, e.g. 'true' or '0'.
    options.cipd_enabled = _strtobool(options.cipd_enabled)
  return (parser, options, args)
1600
1601
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001602def _calc_named_cache_hint(named_cache, named_caches):
1603 """Returns the expected size of the missing named caches."""
1604 present = named_cache.available
1605 size = 0
1606 for name, _, hint in named_caches:
1607 if name not in present:
Takuto Ikuta630f99d2020-07-02 12:59:35 +00001608 hint = int(hint)
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001609 if hint > 0:
Takuto Ikuta74686842021-07-30 04:11:03 +00001610 logging.info("named cache hint: %s, %d", name, hint)
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001611 size += hint
Takuto Ikuta74686842021-07-30 04:11:03 +00001612 logging.info("total size of named cache hint: %d", size)
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001613 return size
1614
1615
Takuto Ikutaae391c52020-12-03 08:43:45 +00001616def _clean_cmd(parser, options, caches, root):
Takuto Ikuta7ff4b242020-12-03 08:07:06 +00001617 """Cleanup cache dirs/files."""
1618 if options.isolated:
1619 parser.error('Can\'t use --isolated with --clean.')
1620 if options.isolate_server:
1621 parser.error('Can\'t use --isolate-server with --clean.')
1622 if options.json:
1623 parser.error('Can\'t use --json with --clean.')
1624 if options.named_caches:
1625 parser.error('Can\t use --named-cache with --clean.')
1626 if options.cas_instance or options.cas_digest:
1627 parser.error('Can\t use --cas-instance, --cas-digest with --clean.')
1628
1629 logging.info("initial free space: %d", file_path.get_free_space(root))
1630
Takuto Ikuta91cb5ca2021-03-17 07:19:30 +00001631 if options.kvs_dir and fs.isdir(six.text_type(options.kvs_dir)):
Takuto Ikuta7ff4b242020-12-03 08:07:06 +00001632 # Remove kvs file if its size exceeds fixed threshold.
Takuto Ikutab1b70062021-03-22 01:02:41 +00001633 kvs_dir = six.text_type(options.kvs_dir)
1634 size = file_path.get_recursive_size(kvs_dir)
Takuto Ikuta91cb5ca2021-03-17 07:19:30 +00001635 if size >= _CAS_KVS_CACHE_THRESHOLD:
1636 logging.info("remove kvs dir with size: %d", size)
Takuto Ikutab1b70062021-03-22 01:02:41 +00001637 file_path.rmtree(kvs_dir)
Takuto Ikuta7ff4b242020-12-03 08:07:06 +00001638
1639 # Trim first, then clean.
1640 local_caching.trim_caches(
1641 caches,
1642 root,
1643 min_free_space=options.min_free_space,
1644 max_age_secs=MAX_AGE_SECS)
1645 logging.info("free space after trim: %d", file_path.get_free_space(root))
1646 for c in caches:
1647 c.cleanup()
1648 logging.info("free space after cleanup: %d", file_path.get_free_space(root))
1649
1650
aludwin7556e0c2016-10-26 08:46:10 -07001651def main(args):
Marc-Antoine Ruelee6ca622017-11-29 11:19:16 -05001652 # Warning: when --argsfile is used, the strings are unicode instances, when
1653 # parsed normally, the strings are str instances.
aludwin7556e0c2016-10-26 08:46:10 -07001654 (parser, options, args) = parse_args(args)
maruel36a963d2016-04-08 17:15:49 -07001655
Junji Watanabe1d83d282021-05-11 05:50:40 +00001656 SWARMING_SERVER = os.environ.get('SWARMING_SERVER')
1657 SWARMING_TASK_ID = os.environ.get('SWARMING_TASK_ID')
1658 if options.report_on_exception and SWARMING_SERVER:
1659 task_url = None
1660 if SWARMING_TASK_ID:
1661 task_url = '%s/task?id=%s' % (SWARMING_SERVER, SWARMING_TASK_ID)
1662 on_error.report_on_exception_exit(SWARMING_SERVER, source=task_url)
Takuto Ikutad4be2f12020-05-12 02:15:25 +00001663
Marc-Antoine Ruel5028ba22017-08-25 17:37:51 -04001664 if not file_path.enable_symlink():
Marc-Antoine Ruel5a024272019-01-15 20:11:16 +00001665 logging.warning('Symlink support is not enabled')
Marc-Antoine Ruel5028ba22017-08-25 17:37:51 -04001666
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001667 named_cache = process_named_cache_options(parser, options)
Marc-Antoine Ruel0d8b0f62018-09-10 14:40:35 +00001668 # hint is 0 if there's no named cache.
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001669 hint = _calc_named_cache_hint(named_cache, options.named_caches)
1670 if hint:
1671 # Increase the --min-free-space value by the hint, and recreate the
1672 # NamedCache instance so it gets the updated CachePolicy.
1673 options.min_free_space += hint
1674 named_cache = process_named_cache_options(parser, options)
1675
Takuto Ikuta5c59a842020-01-24 03:05:24 +00001676 # TODO(crbug.com/932396): Remove this.
Takuto Ikuta4a22c2c2020-06-05 02:02:23 +00001677 use_go_isolated = options.cipd_enabled
Takuto Ikuta5c59a842020-01-24 03:05:24 +00001678
Marc-Antoine Ruel7139d912018-06-15 20:04:42 +00001679 # TODO(maruel): CIPD caches should be defined at an higher level here too, so
1680 # they can be cleaned the same way.
Takuto Ikutaf1c58442020-10-20 09:03:27 +00001681
1682 isolate_cache = isolateserver.process_cache_options(options, trim=False)
1683 cas_cache = process_cas_cache_options(options)
Takuto Ikuta00cf8fc2020-01-14 01:36:00 +00001684
Marc-Antoine Ruel7139d912018-06-15 20:04:42 +00001685 caches = []
1686 if isolate_cache:
1687 caches.append(isolate_cache)
Junji Watanabeb03450b2020-09-25 05:09:27 +00001688 if cas_cache:
1689 caches.append(cas_cache)
Marc-Antoine Ruel7139d912018-06-15 20:04:42 +00001690 if named_cache:
1691 caches.append(named_cache)
Takuto Ikuta6e2ff962019-10-29 12:35:27 +00001692 root = caches[0].cache_dir if caches else six.text_type(os.getcwd())
maruel36a963d2016-04-08 17:15:49 -07001693 if options.clean:
Takuto Ikutaae391c52020-12-03 08:43:45 +00001694 _clean_cmd(parser, options, caches, root)
maruel36a963d2016-04-08 17:15:49 -07001695 return 0
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001696
1697 # Trim must still be done for the following case:
1698 # - named-cache was used
1699 # - some entries, with a large hint, where missing
1700 # - --min-free-space was increased accordingly, thus trimming is needed
1701 # Otherwise, this will have no effect, as bot_main calls run_isolated with
1702 # --clean after each task.
Takuto Ikutac9ddff22021-02-18 07:58:39 +00001703 additional_buffer = _FREE_SPACE_BUFFER_FOR_CIPD_PACKAGES
Takuto Ikuta91cb5ca2021-03-17 07:19:30 +00001704 if options.kvs_dir:
Takuto Ikuta7f45c592021-02-09 05:57:05 +00001705 additional_buffer += _CAS_KVS_CACHE_THRESHOLD
Junji Watanabeaee69ad2021-04-28 03:17:34 +00001706 # Add some buffer for Go CLI.
1707 min_free_space = options.min_free_space + additional_buffer
1708
1709 def trim_caches_fn(stats):
1710 start = time.time()
1711 local_caching.trim_caches(
1712 caches, root, min_free_space=min_free_space, max_age_secs=MAX_AGE_SECS)
1713 duration = time.time() - start
1714 stats['duration'] = duration
1715 logging.info('trim_caches: took %d seconds', duration)
maruel36a963d2016-04-08 17:15:49 -07001716
Takuto Ikutaf1c58442020-10-20 09:03:27 +00001717 # Save state of isolate/cas cache not to overwrite state from go client.
1718 if use_go_isolated:
1719 isolate_cache.save()
1720 isolate_cache = None
1721 if cas_cache:
1722 cas_cache.save()
1723 cas_cache = None
1724
nodir55be77b2016-05-03 09:39:57 -07001725 if not options.isolated and not args:
1726 parser.error('--isolated or command to run is required.')
1727
Vadim Shtayura5d1efce2014-02-04 10:55:43 -08001728 auth.process_auth_options(parser, options)
nodir55be77b2016-05-03 09:39:57 -07001729
Takuto Ikutaae767b32020-05-11 01:22:19 +00001730 isolateserver.process_isolate_server_options(parser, options, False)
Junji Watanabeed9ce352020-09-25 12:32:07 +00001731 if ISOLATED_OUTDIR_PARAMETER in args and (not options.isolate_server and
1732 not options.cas_instance):
1733 parser.error('%s in args requires --isolate-server or --cas-instance' %
1734 ISOLATED_OUTDIR_PARAMETER)
1735
1736 if options.isolated and not options.isolate_server:
1737 parser.error('--isolated requires --isolate-server')
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001738
nodir90bc8dc2016-06-15 13:35:21 -07001739 if options.root_dir:
Takuto Ikuta6e2ff962019-10-29 12:35:27 +00001740 options.root_dir = six.text_type(os.path.abspath(options.root_dir))
Takuto Ikutad46ea762020-10-07 05:43:22 +00001741 else:
1742 options.root_dir = six.text_type(tempfile.mkdtemp(prefix='root'))
maruel12e30012015-10-09 11:55:35 -07001743 if options.json:
Takuto Ikuta6e2ff962019-10-29 12:35:27 +00001744 options.json = six.text_type(os.path.abspath(options.json))
nodir55be77b2016-05-03 09:39:57 -07001745
Marc-Antoine Ruel19dd8872017-11-28 18:33:39 -05001746 if any('=' not in i for i in options.env):
1747 parser.error(
1748 '--env required key=value form. value can be skipped to delete '
1749 'the variable')
Marc-Antoine Ruel7a68f712017-12-01 18:45:18 -05001750 options.env = dict(i.split('=', 1) for i in options.env)
Marc-Antoine Ruel19dd8872017-11-28 18:33:39 -05001751
1752 prefixes = {}
1753 cwd = os.path.realpath(os.getcwd())
1754 for item in options.env_prefix:
1755 if '=' not in item:
1756 parser.error(
1757 '--env-prefix %r is malformed, must be in the form `VAR=./path`'
1758 % item)
Marc-Antoine Ruel7a68f712017-12-01 18:45:18 -05001759 key, opath = item.split('=', 1)
Marc-Antoine Ruel19dd8872017-11-28 18:33:39 -05001760 if os.path.isabs(opath):
1761 parser.error('--env-prefix %r path is bad, must be relative.' % opath)
1762 opath = os.path.normpath(opath)
1763 if not os.path.realpath(os.path.join(cwd, opath)).startswith(cwd):
1764 parser.error(
Junji Watanabe38b28b02020-04-23 10:23:30 +00001765 '--env-prefix %r path is bad, must be relative and not contain `..`.'
1766 % opath)
Marc-Antoine Ruel19dd8872017-11-28 18:33:39 -05001767 prefixes.setdefault(key, []).append(opath)
1768 options.env_prefix = prefixes
Robert Iannuccibf5f84c2017-11-22 12:56:50 -08001769
nodirbe642ff2016-06-09 15:51:51 -07001770 cipd.validate_cipd_options(parser, options)
1771
vadimsh232f5a82017-01-20 19:23:44 -08001772 install_packages_fn = noop_install_packages
Ye Kuang1d096cb2020-06-26 08:38:21 +00001773 tmp_cipd_cache_dir = None
vadimsh902948e2017-01-20 15:57:32 -08001774 if options.cipd_enabled:
Ye Kuang1d096cb2020-06-26 08:38:21 +00001775 cache_dir = options.cipd_cache
1776 if not cache_dir:
1777 tmp_cipd_cache_dir = six.text_type(tempfile.mkdtemp())
1778 cache_dir = tmp_cipd_cache_dir
Takuto Ikutab7ce0e32019-11-27 23:26:18 +00001779 install_packages_fn = (
Junji Watanabe4b890ef2020-09-16 01:43:27 +00001780 lambda run_dir, isolated_dir, cas_dir: install_client_and_packages(
Ye Kuang1d096cb2020-06-26 08:38:21 +00001781 run_dir,
1782 cipd.parse_package_args(options.cipd_packages),
1783 options.cipd_server,
1784 options.cipd_client_package,
1785 options.cipd_client_version,
1786 cache_dir=cache_dir,
Junji Watanabe4b890ef2020-09-16 01:43:27 +00001787 isolated_dir=isolated_dir,
1788 cas_dir=cas_dir,
1789 ))
nodirbe642ff2016-06-09 15:51:51 -07001790
nodird6160682017-02-02 13:03:35 -08001791 @contextlib.contextmanager
Junji Watanabeaee69ad2021-04-28 03:17:34 +00001792 def install_named_caches(run_dir, stats):
nodird6160682017-02-02 13:03:35 -08001793 # WARNING: this function depends on "options" variable defined in the outer
1794 # function.
Takuto Ikuta6e2ff962019-10-29 12:35:27 +00001795 assert six.text_type(run_dir), repr(run_dir)
Marc-Antoine Ruel49f9f8d2018-05-24 15:57:06 -04001796 assert os.path.isabs(run_dir), run_dir
Takuto Ikuta6e2ff962019-10-29 12:35:27 +00001797 named_caches = [(os.path.join(run_dir, six.text_type(relpath)), name)
1798 for name, relpath, _ in options.named_caches]
Junji Watanabeaee69ad2021-04-28 03:17:34 +00001799 install_start = time.time()
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001800 for path, name in named_caches:
Marc-Antoine Ruele79ddbf2018-06-13 18:33:07 +00001801 named_cache.install(path, name)
Junji Watanabeaee69ad2021-04-28 03:17:34 +00001802 install_duration = time.time() - install_start
1803 stats['install']['duration'] = install_duration
1804 logging.info('named_caches: install took %d seconds', install_duration)
nodird6160682017-02-02 13:03:35 -08001805 try:
1806 yield
1807 finally:
dnje289d132017-07-07 11:16:44 -07001808 # Uninstall each named cache, returning it to the cache pool. If an
1809 # uninstall fails for a given cache, it will remain in the task's
1810 # temporary space, get cleaned up by the Swarming bot, and be lost.
1811 #
1812 # If the Swarming bot cannot clean up the cache, it will handle it like
1813 # any other bot file that could not be removed.
Junji Watanabeaee69ad2021-04-28 03:17:34 +00001814 uninstall_start = time.time()
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001815 for path, name in reversed(named_caches):
Marc-Antoine Ruele79ddbf2018-06-13 18:33:07 +00001816 try:
Marc-Antoine Ruele9558372018-08-03 03:41:22 +00001817 # uninstall() doesn't trim but does call save() implicitly. Trimming
1818 # *must* be done manually via periodic 'run_isolated.py --clean'.
Marc-Antoine Ruele79ddbf2018-06-13 18:33:07 +00001819 named_cache.uninstall(path, name)
1820 except local_caching.NamedCacheError:
Takuto Ikuta463ecdd2021-03-05 09:35:38 +00001821 if sys.platform == 'win32':
1822 # Show running processes.
1823 sys.stderr.write("running process\n")
1824 subprocess42.check_call(['tasklist.exe', '/V'], stdout=sys.stderr)
1825
Marc-Antoine Ruele79ddbf2018-06-13 18:33:07 +00001826 logging.exception('Error while removing named cache %r at %r. '
1827 'The cache will be lost.', path, name)
Junji Watanabeaee69ad2021-04-28 03:17:34 +00001828 uninstall_duration = time.time() - uninstall_start
1829 stats['uninstall']['duration'] = uninstall_duration
1830 logging.info('named_caches: uninstall took %d seconds',
1831 uninstall_duration)
nodirf33b8d62016-10-26 22:34:58 -07001832
Takuto Ikutaf3caa9b2020-11-02 05:38:26 +00001833 command = args
1834 if options.relative_cwd:
1835 a = os.path.normpath(os.path.abspath(options.relative_cwd))
1836 if not a.startswith(os.getcwd()):
1837 parser.error(
1838 '--relative-cwd must not try to escape the working directory')
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -05001839
Marc-Antoine Ruel1b65f4e2019-05-02 21:56:58 +00001840 containment_type = subprocess42.Containment.NONE
1841 if options.containment_type == 'AUTO':
1842 containment_type = subprocess42.Containment.AUTO
1843 if options.containment_type == 'JOB_OBJECT':
1844 containment_type = subprocess42.Containment.JOB_OBJECT
1845 containment = subprocess42.Containment(
1846 containment_type=containment_type,
1847 limit_processes=options.limit_processes,
1848 limit_total_committed_memory=options.limit_total_committed_memory)
1849
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -05001850 data = TaskData(
1851 command=command,
Marc-Antoine Ruel95068cf2017-12-07 21:35:05 -05001852 relative_cwd=options.relative_cwd,
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -05001853 isolated_hash=options.isolated,
1854 storage=None,
1855 isolate_cache=isolate_cache,
Junji Watanabe54925c32020-09-08 00:56:18 +00001856 cas_instance=options.cas_instance,
1857 cas_digest=options.cas_digest,
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -05001858 outputs=options.output,
1859 install_named_caches=install_named_caches,
1860 leak_temp_dir=options.leak_temp_dir,
1861 root_dir=_to_unicode(options.root_dir),
1862 hard_timeout=options.hard_timeout,
1863 grace_period=options.grace_period,
1864 bot_file=options.bot_file,
1865 switch_to_account=options.switch_to_account,
1866 install_packages_fn=install_packages_fn,
Takuto Ikuta5c59a842020-01-24 03:05:24 +00001867 use_go_isolated=use_go_isolated,
Takuto Ikuta10cae642020-01-08 08:12:07 +00001868 go_cache_dir=options.cache,
Takuto Ikuta879788c2020-01-10 08:00:26 +00001869 go_cache_policies=local_caching.CachePolicies(
1870 max_cache_size=options.max_cache_size,
1871 min_free_space=options.min_free_space,
1872 max_items=options.max_items,
1873 max_age_secs=None,
1874 ),
Junji Watanabeb03450b2020-09-25 05:09:27 +00001875 cas_cache_dir=options.cas_cache,
1876 cas_cache_policies=local_caching.CachePolicies(
1877 max_cache_size=options.max_cache_size,
1878 min_free_space=options.min_free_space,
1879 max_items=None,
1880 max_age_secs=None,
1881 ),
Takuto Ikuta91cb5ca2021-03-17 07:19:30 +00001882 cas_kvs=options.kvs_dir,
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -05001883 env=options.env,
Marc-Antoine Ruel03c6fd12019-04-30 12:12:55 +00001884 env_prefix=options.env_prefix,
Marc-Antoine Ruel1b65f4e2019-05-02 21:56:58 +00001885 lower_priority=bool(options.lower_priority),
Junji Watanabeaee69ad2021-04-28 03:17:34 +00001886 containment=containment,
1887 trim_caches_fn=trim_caches_fn)
nodirbe642ff2016-06-09 15:51:51 -07001888 try:
nodir90bc8dc2016-06-15 13:35:21 -07001889 if options.isolate_server:
Marc-Antoine Ruelb8513132018-11-20 19:48:53 +00001890 server_ref = isolate_storage.ServerRef(
nodir90bc8dc2016-06-15 13:35:21 -07001891 options.isolate_server, options.namespace)
Marc-Antoine Ruelb8513132018-11-20 19:48:53 +00001892 storage = isolateserver.get_storage(server_ref)
nodir90bc8dc2016-06-15 13:35:21 -07001893 with storage:
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -05001894 data = data._replace(storage=storage)
nodirf33b8d62016-10-26 22:34:58 -07001895 # Hashing schemes used by |storage| and |isolate_cache| MUST match.
Marc-Antoine Ruelb8513132018-11-20 19:48:53 +00001896 assert storage.server_ref.hash_algo == server_ref.hash_algo
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -05001897 return run_tha_test(data, options.json)
1898 return run_tha_test(data, options.json)
Junji Watanabe38b28b02020-04-23 10:23:30 +00001899 except (cipd.Error, local_caching.NamedCacheError,
1900 local_caching.NoMoreSpace) as ex:
Marc-Antoine Ruelf899c482019-10-10 23:32:06 +00001901 print(ex.message, file=sys.stderr)
nodirbe642ff2016-06-09 15:51:51 -07001902 return 1
Ye Kuang1d096cb2020-06-26 08:38:21 +00001903 finally:
1904 if tmp_cipd_cache_dir is not None:
1905 try:
1906 file_path.rmtree(tmp_cipd_cache_dir)
1907 except OSError:
1908 logging.exception('Remove tmp_cipd_cache_dir=%s failed',
1909 tmp_cipd_cache_dir)
1910 # Best effort clean up. Failed to do so doesn't affect the outcome.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001911
1912
if __name__ == '__main__':
  # Script entry point: one-time process setup, then hand the command line
  # (without the program name) to main() and exit with whatever it returns.
  subprocess42.inhibit_os_error_reporting()
  # Must run before anything is printed so that the process always uses the
  # correct encoding.
  fix_encoding.fix_encoding()
  # Identify this tool and its version in outgoing requests.
  _user_agent = 'run_isolated.py/' + __version__
  net.set_user_agent(_user_agent)
  _exit_code = main(sys.argv[1:])
  sys.exit(_exit_code)