blob: f904e1b473b90b8d322c8a7da975eb8121ab8985 [file] [log] [blame]
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001#!/usr/bin/env python
maruelea586f32016-04-05 11:11:33 -07002# Copyright 2012 The LUCI Authors. All rights reserved.
maruelf1f5e2a2016-05-25 17:10:39 -07003# Use of this source code is governed under the Apache License, Version 2.0
4# that can be found in the LICENSE file.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00005
nodir55be77b2016-05-03 09:39:57 -07006"""Runs a command with optional isolated input/output.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00007
run_isolated takes care of setting up a temporary environment, running a
9command, and tearing it down.
nodir55be77b2016-05-03 09:39:57 -070010
Marc-Antoine Rueleed2f3a2019-03-14 00:00:40 +000011It handles downloading and uploading isolated files, mapping CIPD packages and
12reusing stateful named caches.
13
14The isolated files, CIPD packages and named caches are kept as a global LRU
15cache.
Marc-Antoine Ruel2283ad12014-02-09 11:14:57 -050016
Roberto Carrillo71ade6d2018-10-08 22:30:24 +000017Any ${EXECUTABLE_SUFFIX} on the command line or the environment variables passed
18with the --env option will be replaced with ".exe" string on Windows and "" on
19other platforms.
nodirbe642ff2016-06-09 15:51:51 -070020
Roberto Carrillo71ade6d2018-10-08 22:30:24 +000021Any ${ISOLATED_OUTDIR} on the command line or the environment variables passed
22with the --env option will be replaced by the location of a temporary directory
23upon execution of the command specified in the .isolated file. All content
24written to this directory will be uploaded upon termination and the .isolated
25file describing this directory will be printed to stdout.
bpastene447c1992016-06-20 15:21:47 -070026
Marc-Antoine Rueleed2f3a2019-03-14 00:00:40 +000027Any ${SWARMING_BOT_FILE} on the command line or the environment variables passed
28with the --env option will be replaced by the value of the --bot-file parameter.
29This file is used by a swarming bot to communicate state of the host to tasks.
30It is written to by the swarming bot's on_before_task() hook in the swarming
31server's custom bot_config.py.
32
33See
34https://chromium.googlesource.com/infra/luci/luci-py.git/+/master/appengine/swarming/doc/Magic-Values.md
35for all the variables.
36
37See
38https://chromium.googlesource.com/infra/luci/luci-py.git/+/master/appengine/swarming/swarming_bot/config/bot_config.py
39for more information about bot_config.py.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000040"""
41
Marc-Antoine Ruelf899c482019-10-10 23:32:06 +000042from __future__ import print_function
43
44__version__ = '1.0.1'
maruel@chromium.orgdedbf492013-09-12 20:42:11 +000045
aludwin7556e0c2016-10-26 08:46:10 -070046import argparse
maruel064c0a32016-04-05 11:47:15 -070047import base64
iannucci96fcccc2016-08-30 15:52:22 -070048import collections
vadimsh232f5a82017-01-20 19:23:44 -080049import contextlib
Ye Kuangfff1e502020-07-13 13:21:57 +000050import distutils
Sadaf Matinkhoo10743a62018-03-29 16:28:58 -040051import errno
aludwin7556e0c2016-10-26 08:46:10 -070052import json
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000053import logging
54import optparse
55import os
Takuto Ikuta5c59a842020-01-24 03:05:24 +000056import platform
Marc-Antoine Ruel8b11dbd2018-05-18 14:31:22 -040057import re
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000058import sys
59import tempfile
maruel064c0a32016-04-05 11:47:15 -070060import time
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000061
Marc-Antoine Ruel016c7602019-04-02 18:31:13 +000062from utils import tools
63tools.force_local_third_party()
vadimsh@chromium.orga4326472013-08-24 02:05:41 +000064
Marc-Antoine Ruel016c7602019-04-02 18:31:13 +000065# third_party/
66from depot_tools import fix_encoding
Takuto Ikuta6e2ff962019-10-29 12:35:27 +000067import six
Marc-Antoine Ruel016c7602019-04-02 18:31:13 +000068
69# pylint: disable=ungrouped-imports
70import auth
71import cipd
72import isolate_storage
73import isolateserver
74import local_caching
75from libs import luci_context
Vadim Shtayura6b555c12014-07-23 16:22:18 -070076from utils import file_path
maruel12e30012015-10-09 11:55:35 -070077from utils import fs
maruel064c0a32016-04-05 11:47:15 -070078from utils import large
Marc-Antoine Ruelf74cffe2015-07-15 15:21:34 -040079from utils import logging_utils
Ye Kuang2dd17442020-04-22 08:45:52 +000080from utils import net
Marc-Antoine Ruelcfb60852014-07-02 15:22:00 -040081from utils import on_error
Marc-Antoine Ruelc44f5722015-01-08 16:10:01 -050082from utils import subprocess42
maruel@chromium.orgdedbf492013-09-12 20:42:11 +000083
vadimsh@chromium.orga4326472013-08-24 02:05:41 +000084
# Magic variables that can be found in the isolate task command line (and, per
# the module docstring, in environment variables passed with --env). They are
# substituted by replace_parameters():
# - ${ISOLATED_OUTDIR} is replaced by the output directory.
# - ${EXECUTABLE_SUFFIX} is replaced by cipd.EXECUTABLE_SUFFIX.
# - ${SWARMING_BOT_FILE} is replaced by the bot file path, when one is given.
ISOLATED_OUTDIR_PARAMETER = '${ISOLATED_OUTDIR}'
EXECUTABLE_SUFFIX_PARAMETER = '${EXECUTABLE_SUFFIX}'
SWARMING_BOT_FILE_PARAMETER = '${SWARMING_BOT_FILE}'


# The name of the log file to use.
RUN_ISOLATED_LOG_FILE = 'run_isolated.log'
93
maruele2f2cb82016-07-13 14:41:03 -070094
# Use short names for temporary directories. This is driven by Windows, which
# imposes a relatively short maximum path length of 260 characters, often
# referred to as MAX_PATH. It is relatively easy to create files with longer
# path length. A use case is with recursive dependency trees like npm packages.
#
# It is recommended to start the script with a `root_dir` as short as
# possible.
# - ir stands for isolated_run
# - io stands for isolated_out
# - it stands for isolated_tmp
# - ic stands for isolated_client
# - cc stands for cas_client
ISOLATED_RUN_DIR = u'ir'
ISOLATED_OUT_DIR = u'io'
ISOLATED_TMP_DIR = u'it'
ISOLATED_CLIENT_DIR = u'ic'
_CAS_CLIENT_DIR = u'cc'
maruele2f2cb82016-07-13 14:41:03 -0700111
# CIPD package names of the Go `isolated` and `cas` clients, and the revision
# tag to use for them.
# TODO(tikuta): take these parameter from luci-config?
# Update tag by `./client/update_go_clients.sh`.
# Or take revision from
# https://ci.chromium.org/p/infra-internal/g/infra-packagers/console
ISOLATED_PACKAGE = 'infra/tools/luci/isolated/${platform}'
_CAS_PACKAGE = 'infra/tools/luci/cas/${platform}'
_LUCI_GO_REVISION = 'git_revision:4a7aac4e8f17bee1f995442ee032775855ce251e'

# Valid named cache names: 1 to 4096 characters out of lowercase ASCII
# letters, digits and underscore.
# Keep synced with task_request.py
CACHE_NAME_RE = re.compile(r'^[a-z0-9_]{1,4096}$')

# 2 GiB.
# NOTE(review): presumably the amount of free disk space set aside for CIPD
# packages; the code using it is not in this part of the file - confirm.
_FREE_SPACE_BUFFER_FOR_CIPD_PACKAGES = 2 * 1024 * 1024 * 1024
Marc-Antoine Ruel8b11dbd2018-05-18 14:31:22 -0400124
marueld928c862017-06-08 08:20:04 -0700125OUTLIVING_ZOMBIE_MSG = """\
126*** Swarming tried multiple times to delete the %s directory and failed ***
127*** Hard failing the task ***
128
129Swarming detected that your testing script ran an executable, which may have
130started a child executable, and the main script returned early, leaving the
131children executables playing around unguided.
132
133You don't want to leave children processes outliving the task on the Swarming
134bot, do you? The Swarming bot doesn't.
135
136How to fix?
137- For any process that starts children processes, make sure all children
138 processes terminated properly before each parent process exits. This is
139 especially important in very deep process trees.
140 - This must be done properly both in normal successful task and in case of
141 task failure. Cleanup is very important.
142- The Swarming bot sends a SIGTERM in case of timeout.
143 - You have %s seconds to comply after the signal was sent to the process
144 before the process is forcibly killed.
145- To achieve not leaking children processes in case of signals on timeout, you
146 MUST handle signals in each executable / python script and propagate them to
147 children processes.
148 - When your test script (python or binary) receives a signal like SIGTERM or
149 CTRL_BREAK_EVENT on Windows), send it to all children processes and wait for
150 them to terminate before quitting.
151
152See
Marc-Antoine Ruelc7243592018-05-24 17:04:04 -0400153https://chromium.googlesource.com/infra/luci/luci-py.git/+/master/appengine/swarming/doc/Bot.md#Graceful-termination_aka-the-SIGTERM-and-SIGKILL-dance
marueld928c862017-06-08 08:20:04 -0700154for more information.
155
156*** May the SIGKILL force be with you ***
157"""
158
159
# Currently hardcoded. Eventually could be exposed as a flag once there's value.
# 3 weeks, expressed in seconds.
MAX_AGE_SECS = 21*24*60*60

# Whether to upload with the Go `isolated` client. Kept off for now.
# TODO(1099655): Enable this once all prod issues are gone.
_USE_GO_ISOLATED_TO_UPLOAD = False

# NOTE(review): presumably a size threshold related to the kvs file used by the
# `cas` client; the code using it is not in this part of the file - confirm.
_CAS_KVS_CACHE_THRESHOLD = 5 * 1024 * 1024 * 1024 # 5 GiB
168
# Immutable bundle of everything needed to map and run a single task.
TaskData = collections.namedtuple(
    'TaskData',
    (
        # Command line to run, as a list of strings. Used regardless of what
        # the isolated file specifies.
        'command',
        # Directory, relative, in which the command is started.
        'relative_cwd',
        # Hash of the .isolated file to fetch in order to recreate the tree of
        # files needed by the target executable. The command found in the
        # .isolated is executed. Mutually exclusive with command argument.
        'isolated_hash',
        # isolateserver.Storage instance used to retrieve remote objects. It
        # holds a reference to an isolateserver.StorageApi, which performs the
        # actual I/O.
        'storage',
        # isolateserver.LocalCache instance that caches retrieved objects so
        # they are not fetched over and over. Can be on-disk or in-memory.
        'isolate_cache',
        # Digest of the input root on RBE-CAS.
        'cas_digest',
        # Full CAS instance name.
        'cas_instance',
        # Paths, relative to root_dir, to put into the output isolated bundle
        # once the task completes (see link_outputs_to_outdir).
        'outputs',
        # Function (run_dir) => context manager that installs named caches
        # into |run_dir|.
        'install_named_caches',
        # When True, the temporary directory is deliberately leaked so it can
        # be examined later.
        'leak_temp_dir',
        # Directory in which the temporary directory is created. A random
        # temporary directory is created when not specified.
        'root_dir',
        # The process is killed if it runs for more than this many seconds.
        'hard_timeout',
        # Seconds to wait between SIGTERM and SIGKILL.
        'grace_period',
        # Path to a file with bot state; substituted for the
        # ${SWARMING_BOT_FILE} task command line argument.
        'bot_file',
        # Logical account to switch LUCI_CONTEXT into.
        'switch_to_account',
        # Context manager dir => CipdInfo, see install_client_and_packages.
        'install_packages_fn',
        # Use go isolated client.
        'use_go_isolated',
        # Cache directory of the go `isolated` client.
        'go_cache_dir',
        # Parameters handed to the go `isolated` client.
        'go_cache_policies',
        # Cache directory of the `cas` client.
        'cas_cache_dir',
        # Parameters handed to the `cas` client.
        'cas_cache_policies',
        # Parameters for the kvs file used by the `cas` client.
        'cas_kvs',
        # Environment variables to set.
        'env',
        # Environment variables to mutate with relative directories.
        # Example: {"ENV_KEY": ['relative', 'paths', 'to', 'prepend']}
        'env_prefix',
        # Lowers the task process priority.
        'lower_priority',
        # subprocess42.Containment instance. Can be None.
        'containment',
    ))
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -0500238
239
Marc-Antoine Ruelee6ca622017-11-29 11:19:16 -0500240def _to_str(s):
241 """Downgrades a unicode instance to str. Pass str through as-is."""
242 if isinstance(s, str):
243 return s
244 # This is technically incorrect, especially on Windows. In theory
245 # sys.getfilesystemencoding() should be used to use the right 'ANSI code
246 # page' on Windows, but that causes other problems, as the character set
247 # is very limited.
248 return s.encode('utf-8')
249
250
def _to_unicode(s):
  """Returns |s| as a unicode string.

  None and values that already are unicode text are returned untouched; any
  other value is decoded as UTF-8.
  """
  already_ok = s is None or isinstance(s, six.text_type)
  return s if already_ok else s.decode('utf-8')
256
257
def make_temp_dir(prefix, root_dir):
  """Creates a fresh, uniquely named temporary directory.

  The directory is created inside |root_dir| with a name starting with
  |prefix|. Its path is returned as a unicode string.
  """
  created = tempfile.mkdtemp(prefix=prefix, dir=root_dir)
  return six.text_type(created)
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +0000261
262
@contextlib.contextmanager
def set_luci_context_account(account, tmp_dir):
  """Context manager that makes |account| the default LUCI_CONTEXT account.

  Nothing is changed in any of these cases:
  - |account| is None or '', i.e. run_isolated.py was called without the
    '--switch-to-account' flag. If run_isolated.py itself runs inside some
    LUCI_CONTEXT environment, the task simply inherits the account already
    set. This may happen when users call run_isolated.py explicitly from their
    code.
  - LUCI_CONTEXT-based auth is not in use.
  - The requested account already is the default one.

  When the requested account is not defined in the context, the task is
  switched to non-authenticated access. This is the case for Swarming tasks
  that don't use 'task' service accounts.
  """
  # The context is only read when a switch was actually requested.
  local_auth = luci_context.read('local_auth') if account else None

  # See LUCI_CONTEXT.md for the format of 'local_auth'.
  if not local_auth or local_auth.get('default_account_id') == account:
    # Not switching, not using LUCI_CONTEXT auth, or already set.
    yield
    return

  known_ids = set(a['id'] for a in local_auth.get('accounts') or [])
  if account not in known_ids:
    logging.warning(
        'Requested LUCI_CONTEXT account %r is not available (have only %r), '
        'disabling authentication', account, sorted(known_ids))
    local_auth.pop('default_account_id', None)
  else:
    logging.info('Switching default LUCI_CONTEXT account to %r', account)
    local_auth['default_account_id'] = account

  with luci_context.write(_tmpdir=tmp_dir, local_auth=local_auth):
    yield
309
310
def process_command(command, out_dir, bot_file):
  """Substitutes the magic parameters in every argument of a command line.

  Returns:
    A new list with one processed argument per item of |command|.

  Raises:
    ValueError if a parameter is requested in |command| but its value is not
    provided.
  """
  processed = []
  for argument in command:
    processed.append(replace_parameters(argument, out_dir, bot_file))
  return processed
319
320
def replace_parameters(arg, out_dir, bot_file):
  """Substitutes the magic parameter tokens found in a single string.

  Returns:
    |arg| with the tokens replaced. When the output directory or the bot file
    was substituted, every '/' in the result is converted to os.sep.

  Raises:
    ValueError if a parameter is requested in |arg| but its value is not
    provided.
  """
  arg = arg.replace(EXECUTABLE_SUFFIX_PARAMETER, cipd.EXECUTABLE_SUFFIX)
  substituted_path = False

  if ISOLATED_OUTDIR_PARAMETER in arg:
    if not out_dir:
      raise ValueError(
          'output directory is requested in command or env var, but not '
          'provided; please specify one')
    arg = arg.replace(ISOLATED_OUTDIR_PARAMETER, out_dir)
    substituted_path = True

  if SWARMING_BOT_FILE_PARAMETER in arg:
    if not bot_file:
      logging.warning('SWARMING_BOT_FILE_PARAMETER found in command or env '
                      'var, but no bot_file specified. Leaving parameter '
                      'unchanged.')
    else:
      arg = arg.replace(SWARMING_BOT_FILE_PARAMETER, bot_file)
      substituted_path = True

  if not substituted_path:
    return arg
  # Slashes are only converted when a path parameter was substituted, to
  # support arguments like '${ISOLATED_OUTDIR}/foo/bar'.
  return arg.replace('/', os.sep)
maruela9cfd6f2015-09-15 11:03:15 -0700350
351
def set_temp_dir(env, tmp_dir):
  """Points the temp directory variables of the |env| dictionary to |tmp_dir|.

  |env| is modified in place.
  """
  # pylint: disable=line-too-long
  # Additional variables to set, on top of $TMPDIR, keyed by sys.platform.
  per_platform_vars = {
      # * chromium's base utils uses GetTempPath().
      #   https://cs.chromium.org/chromium/src/base/files/file_util_win.cc?q=GetTempPath
      # * Go uses GetTempPath().
      # * GetTempPath() uses %TMP%, then %TEMP%, then other stuff. So %TMP%
      #   must be set.
      #   https://docs.microsoft.com/en-us/windows/desktop/api/fileapi/nf-fileapi-gettemppathw
      #   https://blogs.msdn.microsoft.com/oldnewthing/20150417-00/?p=44213
      'win32': ('TMP', 'TEMP'),
      # * Chromium uses a hack on macOS before calling into
      #   NSTemporaryDirectory().
      #   https://cs.chromium.org/chromium/src/base/files/file_util_mac.mm?q=GetTempDir
      #   https://developer.apple.com/documentation/foundation/1409211-nstemporarydirectory
      'darwin': ('MAC_CHROMIUM_TMPDIR',),
  }
  native_path = _to_str(tmp_dir)

  # python respects $TMPDIR, $TEMP, and $TMP in this order, regardless of
  # platform, so $TMPDIR is set everywhere.
  # https://github.com/python/cpython/blob/2.7/Lib/tempfile.py#L155
  #
  # On other POSIX platforms nothing more is needed: TMPDIR is the POSIX
  # standard envvar for the temp directory.
  # http://pubs.opengroup.org/onlinepubs/9699919799/basedefs/V1_chap08.html
  # * mktemp on linux respects $TMPDIR.
  # * Chromium respects $TMPDIR on linux.
  #   https://cs.chromium.org/chromium/src/base/files/file_util_posix.cc?q=GetTempDir
  # * Go uses $TMPDIR.
  #   https://go.googlesource.com/go/+/go1.10.3/src/os/file_unix.go#307
  env['TMPDIR'] = native_path
  for name in per_platform_vars.get(sys.platform, ()):
    env[name] = native_path
385
Roberto Carrillo71ade6d2018-10-08 22:30:24 +0000386
def get_command_env(tmp_dir, cipd_info, run_dir, env, env_prefixes, out_dir,
                    bot_file):
  """Returns full OS environment to run a command in.

  Starts from a copy of os.environ, applies |env|, puts the directory with the
  cipd binary in front of PATH, exposes the CIPD_CACHE_DIR env var, installs
  all env_prefixes and sets up the temp directory variables.

  Args:
    tmp_dir: temp directory.
    cipd_info: CipdInfo object if cipd client is used, None if not.
    run_dir: The root directory the isolated tree is mapped in.
    env: environment variables to use. A variable with an empty value is
        removed from the resulting environment.
    env_prefixes: {"ENV_KEY": ['cwd', 'relative', 'paths', 'to', 'prepend']}
    out_dir: Isolated output directory. Required to be != None if any of the
        env vars contain ISOLATED_OUTDIR_PARAMETER.
    bot_file: Required to be != None if any of the env vars contain
        SWARMING_BOT_FILE_PARAMETER.

  Returns:
    dict of environment variables.

  Raises:
    ValueError if a value of |env| requests the output directory but |out_dir|
    is not provided.
  """
  out = os.environ.copy()
  for k, v in env.items():
    if not v:
      out.pop(k, None)
    else:
      out[k] = replace_parameters(v, out_dir, bot_file)

  if cipd_info:
    bin_dir = _to_str(os.path.dirname(cipd_info.client.binary_path))
    # PATH may be missing, either because the parent environment has none or
    # because |env| just removed it with an empty value. Handle it the same way
    # as env_prefixes below instead of raising KeyError, and do not leave a
    # dangling separator behind.
    cur_path = out.get('PATH')
    if cur_path:
      out['PATH'] = '%s%s%s' % (bin_dir, os.pathsep, cur_path)
    else:
      out['PATH'] = bin_dir
    out['CIPD_CACHE_DIR'] = _to_str(cipd_info.cache_dir)

  for key, paths in env_prefixes.items():
    assert isinstance(paths, list), paths
    # The prefixes are relative to the directory the tree is mapped in.
    paths = [os.path.normpath(os.path.join(run_dir, p)) for p in paths]
    cur = out.get(key)
    if cur:
      # Keep the existing value, after the prepended paths.
      paths.append(cur)
    out[key] = _to_str(os.path.pathsep.join(paths))

  set_temp_dir(out, tmp_dir)
  return out
vadimsh232f5a82017-01-20 19:23:44 -0800427
428
def run_command(
    command, cwd, env, hard_timeout, grace_period, lower_priority, containment):
  """Runs the command and waits for it to complete.

  The process is first waited on for up to |hard_timeout| seconds. If this
  timeout expires, or if one of subprocess42.STOP_SIGNALS is received in the
  meantime, the process is sent SIGTERM and is given up to |grace_period|
  seconds to exit, after which it is killed.

  Args:
    command: command line to run, passed to subprocess42.Popen.
    cwd: working directory to start the process in.
    env: environment variables for the process.
    hard_timeout: seconds to wait for before terminating the process. A falsy
        value is converted to None before being passed to proc.wait().
    grace_period: seconds to wait for between the termination request and the
        kill. A falsy value is converted to None before being passed to
        proc.wait().
    lower_priority: passed as-is to subprocess42.Popen.
    containment: passed as-is to subprocess42.Popen.

  Returns:
    tuple(process exit code, bool if had a hard timeout)
  """
  logging.info(
      'run_command(%s, %s, %s, %s, %s, %s)',
      command, cwd, hard_timeout, grace_period, lower_priority, containment)

  exit_code = None
  had_hard_timeout = False
  with tools.Profiler('RunTest'):
    proc = None
    # A list is used so that handler() below can record the signal by mutating
    # it.
    had_signal = []
    try:
      # TODO(maruel): This code is imperfect. It doesn't handle well signals
      # during the download phase and there's short windows where things can go
      # wrong.
      def handler(signum, _frame):
        # Only the first signal received once the process is started is acted
        # upon. It is reported through the same exception as a timeout so both
        # cases share the termination code below.
        if proc and not had_signal:
          logging.info('Received signal %d', signum)
          had_signal.append(True)
          raise subprocess42.TimeoutExpired(command, None)

      proc = subprocess42.Popen(
          command, cwd=cwd, env=env, detached=True, close_fds=True,
          lower_priority=lower_priority, containment=containment)
      with subprocess42.set_signal_handler(subprocess42.STOP_SIGNALS, handler):
        try:
          exit_code = proc.wait(hard_timeout or None)
        except subprocess42.TimeoutExpired:
          # It is a hard timeout only when it was not caused by a signal.
          if not had_signal:
            logging.warning('Hard timeout')
            had_hard_timeout = True
          logging.warning('Sending SIGTERM')
          proc.terminate()

      kill_sent = False
      # Ignore signals in grace period. Forcibly give the grace period to the
      # child process.
      if exit_code is None:
        ignore = lambda *_: None
        with subprocess42.set_signal_handler(subprocess42.STOP_SIGNALS, ignore):
          try:
            exit_code = proc.wait(grace_period or None)
          except subprocess42.TimeoutExpired:
            # Now kill for real. The user can distinguish between the
            # following states:
            # - signal but process exited within grace period,
            #   hard_timed_out will be set but the process exit code will be
            #   script provided.
            # - processed exited late, exit code will be -9 on posix.
            logging.warning('Grace exhausted; sending SIGKILL')
            proc.kill()
            kill_sent = True
      logging.info('Waiting for process exit')
      exit_code = proc.wait()

      # The process group / job object may be dangling so if we didn't kill
      # it already, give it a poke now.
      if not kill_sent:
        proc.kill()
    except OSError as e:
      # This is not considered to be an internal error. The executable simply
      # does not exist.
      sys.stderr.write(
          '<The executable does not exist, a dependent library is missing or '
          'the command line is too long>\n'
          '<Check for missing .so/.dll in the .isolate or GN file or length of '
          'command line args>\n'
          '<Command: %s, Exception: %s>\n' % (command, e))
      if os.environ.get('SWARMING_TASK_ID'):
        # Give an additional hint when running as a swarming task.
        sys.stderr.write(
            '<See the task\'s page for commands to help diagnose this issue '
            'by reproducing the task locally>\n')
      exit_code = 1
  # The exit code is also logged as an unsigned 32 bits hexadecimal value.
  logging.info(
      'Command finished with exit code %d (%s)',
      exit_code, hex(0xffffffff & exit_code))
  return exit_code, had_hard_timeout
maruela9cfd6f2015-09-15 11:03:15 -0700512
513
def _run_go_cmd_and_wait(cmd, tmp_dir):
  """Starts an external Go command, `isolated` or `cas`, and waits for it.

  This is a generic subprocess launcher, except for the waiting and logging
  logic, which is specific to Go `isolated` and `cas`. The command runs with
  the current environment, with the temp directory variables pointed to
  |tmp_dir|.

  Returns:
    The subprocess object, once the command exited with code 0.

  Raises:
    ValueError if the command exits with a non-zero code or is still running
    once the maximum wait time is over. Any failure is logged before being
    re-raised.
  """
  poll_period_sec = 30
  # max timeout = max_polls * poll_period_sec = 50 minutes
  max_polls = 100
  printable_cmd = ' '.join(cmd)
  try:
    child_env = os.environ.copy()
    set_temp_dir(child_env, tmp_dir)
    proc = subprocess42.Popen(cmd, env=child_env)

    for attempt in range(1, max_polls + 1):
      # Waiting in short periods with a progress message in between is to
      # prevent I/O timeout error during setup.
      try:
        retcode = proc.wait(poll_period_sec)
      except subprocess42.TimeoutExpired:
        print('still running (after %d seconds)' % (attempt * poll_period_sec))
        continue
      if retcode != 0:
        raise ValueError(
            "retcode is not 0: %s (cmd=%s)" % (retcode, printable_cmd))
      return proc

    # Only reached when every wait above timed out: stop the process, gently
    # first, then forcibly.
    proc.terminate()
    try:
      proc.wait(poll_period_sec)
    except subprocess42.TimeoutExpired:
      logging.exception(
          "failed to terminate? timeout happened after %d seconds",
          poll_period_sec)
      proc.kill()
    proc.wait()
    # Raise unconditionally, because |proc| was forcefully terminated.
    raise ValueError("timedout after %d seconds (cmd=%s)" %
                     (poll_period_sec * max_polls, printable_cmd))
  except Exception:
    logging.exception('Failed to run Go cmd %s', printable_cmd)
    raise
Ye Kuangc0cf9ca2020-07-16 08:56:51 +0000563
564
Junji Watanabe4b890ef2020-09-16 01:43:27 +0000565def _fetch_and_map_with_cas(cas_client, digest, instance, output_dir, cache_dir,
Takuto Ikuta0f8a19c2021-03-02 00:50:38 +0000566 policies, kvs_file, tmp_dir):
Junji Watanabe4b890ef2020-09-16 01:43:27 +0000567 """
568 Fetches a CAS tree using cas client, create the tree and returns download
569 stats.
570 """
571
Takuto Ikuta34a86c52020-10-13 05:30:57 +0000572 # TODO(crbug.com/chrome-operations/49):
573 # remove this after isolate to RBE-CAS migration.
574 _CAS_EMPTY_DIR_DIGEST = (
575 'e3b0c44298fc1c149afbf4c8996fb92427ae41e4649b934ca495991b7852b855/0')
576 if digest == _CAS_EMPTY_DIR_DIGEST:
577 return {
578 'duration': 0.0,
579 'items_cold': '',
580 'items_hot': '',
581 }
582
Junji Watanabe4b890ef2020-09-16 01:43:27 +0000583 start = time.time()
584 result_json_handle, result_json_path = tempfile.mkstemp(
585 prefix=u'fetch-and-map-result-', suffix=u'.json')
586 os.close(result_json_handle)
587 try:
588 cmd = [
589 cas_client,
590 'download',
591 '-digest',
592 digest,
593 '-cas-instance',
594 instance,
595 # flags for cache.
596 '-cache-dir',
597 cache_dir,
Junji Watanabe4b890ef2020-09-16 01:43:27 +0000598 '-cache-max-size',
599 str(policies.max_cache_size),
600 '-cache-min-free-space',
601 str(policies.min_free_space),
602 # flags for output.
603 '-dir',
604 output_dir,
605 '-dump-stats-json',
606 result_json_path,
Takuto Ikuta557025b2021-02-01 08:37:40 +0000607 '-log-level',
608 'info'
Junji Watanabe4b890ef2020-09-16 01:43:27 +0000609 ]
Takuto Ikutaae391c52020-12-03 08:43:45 +0000610
611 if kvs_file:
612 cmd.extend(['-kvs-file', kvs_file])
613
Takuto Ikuta0f8a19c2021-03-02 00:50:38 +0000614 _run_go_cmd_and_wait(cmd, tmp_dir)
Junji Watanabe4b890ef2020-09-16 01:43:27 +0000615
616 with open(result_json_path) as json_file:
617 result_json = json.load(json_file)
618
619 return {
620 'duration': time.time() - start,
621 'items_cold': result_json['items_cold'],
622 'items_hot': result_json['items_hot'],
623 }
624 finally:
625 fs.remove(result_json_path)
626
627
def _fetch_and_map_with_go_isolated(isolated_hash, storage, outdir,
                                    go_cache_dir, policies, isolated_client,
                                    tmp_dir):
  """Downloads an isolated tree into |outdir| with the go `isolated` client.

  Returns:
    dict of stats with the keys 'duration', 'items_cold', 'items_hot',
    'initial_number_items' and 'initial_size'.
  """
  began = time.time()
  ref = storage.server_ref
  # The client dumps its stats into this file. Only the path is needed here,
  # so the handle is closed right away.
  fd, stats_path = tempfile.mkstemp(
      prefix=u'fetch-and-map-result-', suffix=u'.json')
  os.close(fd)
  try:
    cmd = [
        isolated_client, 'download',
        '-isolate-server', ref.url,
        '-namespace', ref.namespace,
        '-isolated', isolated_hash,
    ]
    # flags for cache
    cmd += [
        '-cache-dir', go_cache_dir,
        '-cache-max-items', str(policies.max_items),
        '-cache-max-size', str(policies.max_cache_size),
        '-cache-min-free-space', str(policies.min_free_space),
    ]
    # flags for output
    cmd += [
        '-output-dir', outdir,
        '-fetch-and-map-result-json', stats_path,
    ]
    _run_go_cmd_and_wait(cmd, tmp_dir)

    with open(stats_path) as stats_file:
      stats = json.load(stats_file)

    return {
        'duration': time.time() - began,
        'items_cold': stats['items_cold'],
        'items_hot': stats['items_hot'],
        'initial_number_items': stats['initial_number_items'],
        'initial_size': stats['initial_size'],
    }
  finally:
    fs.remove(stats_path)
681
682
# TODO(crbug.com/932396): remove this function.
def fetch_and_map(isolated_hash, storage, cache, outdir):
  """Downloads an isolated tree into |outdir| and returns download stats.

  Items are reported as 'cold' when they were added to |cache| during this
  call and as 'hot' when they were used without having been added.
  """
  started = time.time()
  isolateserver.fetch_isolated(
      isolated_hash=isolated_hash,
      storage=storage,
      cache=cache,
      outdir=outdir,
      use_symlinks=False)

  # Multiset difference: every use that is not accounted for by an addition.
  used = collections.Counter(cache.used)
  added = collections.Counter(cache.added)
  hot_items = (used - added).elements()

  def encode(items):
    return base64.b64encode(large.pack(sorted(items))).decode()

  elapsed = time.time() - started
  return {
      'duration': elapsed,
      'items_cold': encode(cache.added),
      'items_hot': encode(hot_items),
  }
700
701
def link_outputs_to_outdir(run_dir, out_dir, outputs):
  """Makes every named output of |run_dir| available under |out_dir|.

  Each entry of |outputs| is a path relative to |run_dir|; it is copied (or
  hardlinked) to the same relative path under |out_dir| so that it gets
  uploaded. Does nothing when |outputs| is empty or None.

  OSError raised while copying an entry is logged by copy_recursively(), not
  propagated.
  """
  if outputs:
    isolateserver.create_directories(out_dir, outputs)
    for relpath in outputs:
      copy_recursively(
          os.path.join(run_dir, relpath), os.path.join(out_dir, relpath))
712
713
def copy_recursively(src, dst):
  """Efficiently copies a file or directory from src to dst.

  `src` may be a file, directory, or a symlink to a file or directory.
  All symlinks are replaced with their targets, so the resulting
  directory structure under `dst` will never have any symlinks.

  To increase speed, copy_recursively hardlinks individual files into the
  (newly created) directory structure if possible, unlike Python's
  shutil.copytree().

  Errors are never propagated: an OSError is logged (as a warning when the
  path is missing, as info otherwise) and a symlink chain that is too long,
  e.g. because it is cyclic, is logged as a warning and skipped.
  """
  # Upper bound on the number of symlinks followed for a single path. A cyclic
  # chain (a -> b -> a) would otherwise make the loop below spin forever.
  max_symlink_hops = 40
  orig_src = src
  try:
    # Replace symlinks with their final target.
    hops = 0
    while fs.islink(src):
      hops += 1
      if hops > max_symlink_hops:
        logging.warning(
            'Too many levels of symbolic links while resolving %s; skipping',
            orig_src)
        return
      res = fs.readlink(src)
      # A relative target is resolved against the directory of the link.
      src = os.path.join(os.path.dirname(src), res)

    # Note that fs.isfile (which is a wrapper around os.path.isfile) throws
    # an exception if src does not exist. A warning will be logged in that case.
    if fs.isfile(src):
      file_path.link_file(dst, src, file_path.HARDLINK_WITH_FALLBACK)
      return

    if not fs.exists(dst):
      os.makedirs(dst)

    for child in fs.listdir(src):
      copy_recursively(os.path.join(src, child), os.path.join(dst, child))

  except OSError as e:
    if e.errno == errno.ENOENT:
      logging.warning('Path %s does not exist or %s is a broken symlink',
                      src, orig_src)
    else:
      logging.info("Couldn't collect output file %s: %s", src, e)
aludwin0a8e17d2016-10-27 15:57:39 -0700751
752
def _upload_with_py(storage, out_dir):
  """Archives |out_dir| to |storage| with the Python isolateserver client.

  Returns:
    tuple(isolated, cold, hot) where |isolated| is the first value of the
    results mapping returned by the archival, and |cold| / |hot| are the
    base64 encoded, large.pack()'ed sorted sizes of the cold / hot items.
  """

  def pack_sizes(items):
    sizes = sorted(item.size for item in items)
    return base64.b64encode(large.pack(sizes)).decode()

  try:
    results, cold_items, hot_items = isolateserver.archive_files_to_storage(
        storage, [out_dir], None, verify_push=True)
    return (list(results.values())[0], pack_sizes(cold_items),
            pack_sizes(hot_items))
  except isolateserver.Aborted:
    # A SIGTERM was received while uploading. Either the task was too slow and
    # was about to be killed for exceeding the hard timeout, or the amount of
    # data to upload was very large and archiving took too long.
    sys.stderr.write('Received SIGTERM while uploading')
    # Propagate it so it is treated as an internal failure.
    raise
778
779
def _upload_with_go(storage, outdir, isolated_client, tmp_dir=None):
  """Uploads results back using the Go `isolated` CLI.

  Arguments:
  - storage: object whose |server_ref| gives the isolate server url and
    namespace.
  - outdir: directory to archive.
  - isolated_client: path to the Go `isolated` executable.
  - tmp_dir: directory forwarded to _run_go_cmd_and_wait(). Defaults to the
    system temporary directory when not provided.

  Returns:
    tuple(isolated, items_cold, items_hot) where |isolated| is the content of
    the hash file dumped by the client, and the two others come from its stats
    json.

  Raises:
    Whatever _run_go_cmd_and_wait() raised last, once retries have been going
    on for more than two minutes.
  """
  if tmp_dir is None:
    # Existing callers do not pass |tmp_dir|; without a value the call to
    # _run_go_cmd_and_wait() below cannot even be made.
    # NOTE(review): assumes any writable scratch directory is acceptable
    # there - confirm against _run_go_cmd_and_wait().
    tmp_dir = tempfile.gettempdir()

  server_ref = storage.server_ref
  isolated_handle, isolated_path = tempfile.mkstemp(
      prefix=u'isolated-hash-', suffix=u'.txt')
  stats_json_handle, stats_json_path = tempfile.mkstemp(
      prefix=u'dump-stats-', suffix=u'.json')
  # Only the paths are needed; the Go client writes the files itself.
  os.close(isolated_handle)
  os.close(stats_json_handle)
  try:
    cmd = [
        isolated_client,
        'archive',
        '-isolate-server',
        server_ref.url,
        '-namespace',
        server_ref.namespace,
        '-dirs',
        # Format: <working directory>:<relative path to dir>
        outdir + ':',

        # output
        '-dump-hash',
        isolated_path,
        '-dump-stats-json',
        stats_json_path,
        '-quiet',
    ]
    # Will do exponential backoff, e.g. 10, 20, 40...
    # This mitigates https://crbug.com/1094369, where there is a data race on
    # the uploaded files.
    backoff = 10
    started = time.time()
    while True:
      try:
        _run_go_cmd_and_wait(cmd, tmp_dir)
        break
      except Exception:
        if time.time() > started + 60 * 2:
          # This is to not wait task having leaked process long time.
          raise

        on_error.report('error before %d second backoff' % backoff)
        logging.exception(
            '_run_go_cmd_and_wait() failed, will retry after %d seconds',
            backoff)
        time.sleep(backoff)
        backoff *= 2

    with open(isolated_path) as isol_file:
      isolated = isol_file.read()
    with open(stats_json_path) as json_file:
      stats_json = json.load(json_file)

    return isolated, stats_json['items_cold'], stats_json['items_hot']
  finally:
    fs.remove(isolated_path)
    fs.remove(stats_json_path)
840
841
def upload_out_dir(storage, out_dir, go_isolated_client):
  """Archives the content of |out_dir| back to the isolate server, if any.

  Nothing is uploaded when |out_dir| is not a directory or is empty.

  Returns:
    tuple(outputs_ref, stats)
    - outputs_ref: a dict referring to the results archived back to the
      isolated server, or None when nothing was uploaded.
    - stats: uploading stats ('duration', 'items_cold', 'items_hot').
  """
  started = time.time()
  outputs_ref = None
  cold = ''
  hot = ''

  # A .isolated file is only generated when files were actually written.
  if fs.isdir(out_dir) and fs.listdir(out_dir):
    with tools.Profiler('ArchiveOutput'):
      use_go = _USE_GO_ISOLATED_TO_UPLOAD and go_isolated_client is not None
      if use_go:
        isolated, cold, hot = _upload_with_go(storage, out_dir,
                                              go_isolated_client)
      else:
        isolated, cold, hot = _upload_with_py(storage, out_dir)
      outputs_ref = {
          'isolated': isolated,
          'isolatedserver': storage.server_ref.url,
          'namespace': storage.server_ref.namespace,
      }

  elapsed = time.time() - started
  return outputs_ref, {
      'duration': elapsed,
      'items_cold': cold,
      'items_hot': hot,
  }
maruela9cfd6f2015-09-15 11:03:15 -0700878
879
def upload_outdir_with_cas(cas_client, cas_instance, outdir, tmp_dir):
  """Archives |outdir| to CAS with the Go `cas` client.

  Arguments:
  - cas_client: path to the `cas` executable.
  - cas_instance: CAS instance to upload to.
  - outdir: directory to archive.
  - tmp_dir: forwarded as is to _run_go_cmd_and_wait().

  Returns:
    tuple(cas_output_root, stats)
    - cas_output_root: dict with the CAS instance and the root digest (hash
      and size in bytes) of the uploaded directory.
    - stats: uploading stats dumped by the client, plus 'duration'.
  """
  # The client reports the digest and its stats through two files; only the
  # paths are needed here.
  fd, digest_path = tempfile.mkstemp(prefix=u'cas-digest', suffix=u'.txt')
  os.close(fd)
  fd, stats_json_path = tempfile.mkstemp(
      prefix=u'upload-stats', suffix=u'.json')
  os.close(fd)

  try:
    cmd = [cas_client, 'archive']
    cmd += ['-cas-instance', cas_instance]
    # Format: <working directory>:<relative path to dir>
    cmd += ['-paths', outdir + ':']
    # output
    cmd += ['-dump-digest', digest_path]
    cmd += ['-dump-stats-json', stats_json_path]

    started = time.time()
    _run_go_cmd_and_wait(cmd, tmp_dir)

    with open(digest_path) as digest_file:
      raw_digest = digest_file.read()
    # The digest is dumped as "<hash>/<size>".
    digest_hash, digest_size = raw_digest.split('/')
    cas_output_root = {
        'cas_instance': cas_instance,
        'digest': {
            'hash': digest_hash,
            'size_bytes': int(digest_size)
        }
    }

    with open(stats_json_path) as stats_file:
      stats = json.load(stats_file)
    stats['duration'] = time.time() - started

    return cas_output_root, stats
  finally:
    fs.remove(digest_path)
    fs.remove(stats_json_path)
934
935
def map_and_run(data, constant_run_path):
  """Runs a command with optional isolated input/output.

  Sets up the run, output, temporary and client directories under
  |data.root_dir|, installs CIPD packages, downloads the inputs (isolated or
  CAS), runs the command, uploads the outputs and finally removes the
  directories it created.

  Arguments:
  - data: TaskData instance.
  - constant_run_path: when true (and data.root_dir is set), the run directory
    is always <root_dir>/ISOLATED_RUN_DIR, recreated from scratch; otherwise a
    fresh directory is created with make_temp_dir().

  Returns metadata about the result, as a dict. 'internal_failure' is None
  when the run completed, else a description of what went wrong.
  """

  if data.isolate_cache:
    download_stats = {
        #'duration': 0.,
        'initial_number_items': len(data.isolate_cache),
        'initial_size': data.isolate_cache.total_size,
        #'items_cold': '<large.pack()>',
        #'items_hot': '<large.pack()>',
    }
  else:
    # TODO(tikuta): take stats from state.json in this case too.
    download_stats = {}

  result = {
      'duration': None,
      'exit_code': None,
      'had_hard_timeout': False,
      'internal_failure': 'run_isolated did not complete properly',
      'stats': {
          #'cipd': {
          #  'duration': 0.,
          #  'get_client_duration': 0.,
          #},
          'isolated': {
              'download': download_stats,
              #'upload': {
              #  'duration': 0.,
              #  'items_cold': '<large.pack()>',
              #  'items_hot': '<large.pack()>',
              #},
          },
      },
      #'cipd_pins': {
      #  'packages': [
      #    {'package_name': ..., 'version': ..., 'path': ...},
      #    ...
      #  ],
      #  'client_package': {'package_name': ..., 'version': ...},
      #},
      'outputs_ref': None,
      'cas_output_root': None,
      'version': 5,
  }

  assert os.path.isabs(data.root_dir), ("data.root_dir is not abs path: %s" %
                                        data.root_dir)
  file_path.ensure_tree(data.root_dir, 0o700)

  # See comment for these constants.
  # TODO(maruel): This is not obvious. Change this to become an error once we
  # make the constant_run_path an exposed flag.
  if constant_run_path and data.root_dir:
    run_dir = os.path.join(data.root_dir, ISOLATED_RUN_DIR)
    if os.path.isdir(run_dir):
      file_path.rmtree(run_dir)
    os.mkdir(run_dir, 0o700)
  else:
    run_dir = make_temp_dir(ISOLATED_RUN_DIR, data.root_dir)

  # True if CAS is used for download/upload files.
  use_cas = bool(data.cas_digest)

  # storage should be normally set but don't crash if it is not. This can happen
  # as Swarming task can run without an isolate server.
  out_dir = None
  if data.storage or use_cas:
    out_dir = make_temp_dir(ISOLATED_OUT_DIR, data.root_dir)
  tmp_dir = make_temp_dir(ISOLATED_TMP_DIR, data.root_dir)
  isolated_client_dir = make_temp_dir(ISOLATED_CLIENT_DIR, data.root_dir)
  cwd = run_dir
  if data.relative_cwd:
    cwd = os.path.normpath(os.path.join(cwd, data.relative_cwd))
  command = data.command
  go_isolated_client = None
  if data.use_go_isolated:
    go_isolated_client = os.path.join(isolated_client_dir,
                                      'isolated' + cipd.EXECUTABLE_SUFFIX)

  cas_client = None
  cas_client_dir = make_temp_dir(_CAS_CLIENT_DIR, data.root_dir)
  if use_cas:
    cas_client = os.path.join(cas_client_dir, 'cas' + cipd.EXECUTABLE_SUFFIX)

  try:
    with data.install_packages_fn(run_dir, isolated_client_dir,
                                  cas_client_dir) as cipd_info:
      if cipd_info:
        result['stats']['cipd'] = cipd_info.stats
        result['cipd_pins'] = cipd_info.pins

      isolated_stats = result['stats'].setdefault('isolated', {})
      if data.isolated_hash:
        if data.use_go_isolated:
          stats = _fetch_and_map_with_go_isolated(
              isolated_hash=data.isolated_hash,
              storage=data.storage,
              outdir=run_dir,
              go_cache_dir=data.go_cache_dir,
              policies=data.go_cache_policies,
              isolated_client=go_isolated_client,
              tmp_dir=tmp_dir)
        else:
          stats = fetch_and_map(
              isolated_hash=data.isolated_hash,
              storage=data.storage,
              cache=data.isolate_cache,
              outdir=run_dir)
        isolated_stats['download'].update(stats)

      elif data.cas_digest:
        stats = _fetch_and_map_with_cas(
            cas_client=cas_client,
            digest=data.cas_digest,
            instance=data.cas_instance,
            output_dir=run_dir,
            cache_dir=data.cas_cache_dir,
            policies=data.cas_cache_policies,
            kvs_file=data.cas_kvs,
            tmp_dir=tmp_dir)
        isolated_stats['download'].update(stats)

      # NOTE(review): the two early returns below leave
      # result['internal_failure'] at its initial non-empty value although
      # their comments call these task failures - confirm this is intended.
      if not command:
        # Handle this as a task failure, not an internal failure.
        sys.stderr.write(
            '<No command was specified!>\n'
            '<Please secify a command when triggering your Swarming task>\n')
        result['exit_code'] = 1
        return result

      # Compare on a path component boundary: a bare prefix test would accept
      # a sibling directory such as '<run_dir>2'.
      if cwd != run_dir and not cwd.startswith(os.path.join(run_dir, '')):
        # Handle this as a task failure, not an internal failure. This is a
        # 'last chance' way to gate against directory escape.
        sys.stderr.write('<Relative CWD is outside of run directory!>\n')
        result['exit_code'] = 1
        return result

      if not os.path.isdir(cwd):
        # Accepts relative_cwd that does not exist.
        os.makedirs(cwd, 0o700)

      # If we have an explicit list of files to return, make sure their
      # directories exist now.
      if data.storage and data.outputs:
        isolateserver.create_directories(run_dir, data.outputs)

      with data.install_named_caches(run_dir):
        sys.stdout.flush()
        start = time.time()
        try:
          # Need to switch the default account before 'get_command_env' call,
          # so it can grab correct value of LUCI_CONTEXT env var.
          with set_luci_context_account(data.switch_to_account, tmp_dir):
            env = get_command_env(
                tmp_dir, cipd_info, run_dir, data.env, data.env_prefix, out_dir,
                data.bot_file)
            command = tools.find_executable(command, env)
            command = process_command(command, out_dir, data.bot_file)
            file_path.ensure_command_has_abs_path(command, cwd)

            result['exit_code'], result['had_hard_timeout'] = run_command(
                command, cwd, env, data.hard_timeout, data.grace_period,
                data.lower_priority, data.containment)
        finally:
          result['duration'] = max(time.time() - start, 0)

      if out_dir:
        # Try to link files to the output directory, if specified.
        link_outputs_to_outdir(run_dir, out_dir, data.outputs)
        if use_cas:
          result['cas_output_root'], isolated_stats['upload'] = (
              upload_outdir_with_cas(cas_client, data.cas_instance, out_dir,
                                     tmp_dir))
        else:
          # This could use |go_isolated_client|, so make sure it runs when the
          # CIPD package still exists.
          result['outputs_ref'], isolated_stats['upload'] = (
              upload_out_dir(data.storage, out_dir, go_isolated_client))
    # We successfully ran the command, set internal_failure back to
    # None (even if the command failed, it's not an internal error).
    result['internal_failure'] = None
  except Exception as e:
    # An internal error occurred. Report accordingly so the swarming task will
    # be retried automatically.
    logging.exception('internal failure: %s', e)
    result['internal_failure'] = str(e)
    on_error.report(None)

  # Clean up
  finally:
    try:
      success = True
      if data.leak_temp_dir:
        logging.warning(
            'Deliberately leaking %s for later examination', run_dir)
      else:
        # On Windows rmtree(run_dir) call above has a synchronization effect: it
        # finishes only when all task child processes terminate (since a running
        # process locks *.exe file). Examine out_dir only after that call
        # completes (since child processes may write to out_dir too and we need
        # to wait for them to finish).
        dirs_to_remove = [run_dir, tmp_dir, isolated_client_dir, cas_client_dir]
        if out_dir:
          dirs_to_remove.append(out_dir)
        for directory in dirs_to_remove:
          if not fs.isdir(directory):
            continue
          start = time.time()
          # Tracked per directory so that one failure is not reported again
          # for every directory removed after it.
          removed = True
          try:
            file_path.rmtree(directory)
          except OSError as e:
            logging.error('rmtree(%r) failed: %s', directory, e)
            removed = False
            success = False
          finally:
            logging.info('Cleanup: rmtree(%r) took %d seconds', directory,
                         time.time() - start)
          if not removed:
            sys.stderr.write(
                OUTLIVING_ZOMBIE_MSG % (directory, data.grace_period))
            if sys.platform == 'win32':
              # tasklist.exe only exists on Windows; running it elsewhere
              # would raise and turn this into an internal failure.
              subprocess42.check_call(['tasklist.exe', '/V'], stdout=sys.stderr)
            if result['exit_code'] == 0:
              result['exit_code'] = 1

      if not success and result['exit_code'] == 0:
        result['exit_code'] = 1
    except Exception as e:
      # Swallow any exception in the main finally clause.
      if out_dir:
        logging.exception('Leaking out_dir %s: %s', out_dir, e)
      result['internal_failure'] = str(e)
      on_error.report(None)
  return result
Marc-Antoine Ruel2283ad12014-02-09 11:14:57 -05001178
1179
def run_tha_test(data, result_json):
  """Runs the task described by |data| and records execution metadata.

  The actual work is delegated to map_and_run(); this function only takes care
  of reporting the outcome, either through |result_json| or through the legacy
  inline marker printed to stdout.

  Arguments:
    - data: TaskData instance.
    - result_json: File path to dump result metadata into. If set, the process
      exit code is always 0 unless an internal error occurred.

  Returns:
    Process exit code that should be used.
  """
  if result_json:
    # Leave a placeholder behind right away, in case we get killed before the
    # real result can be written.
    placeholder = {
        'exit_code': None,
        'had_hard_timeout': False,
        'internal_failure': 'Was terminated before completion',
        'outputs_ref': None,
        'cas_output_root': None,
        'version': 5,
    }
    tools.write_json(result_json, placeholder, dense=True)

  result = map_and_run(data, True)
  logging.info('Result:\n%s', tools.format_json(result, dense=True))
  internal_error = int(bool(result['internal_failure']))

  if result_json:
    # Tests have been seen deleting 'work' when quitting, which makes the
    # write below fail. Recreate the directory if necessary.
    file_path.ensure_tree(os.path.dirname(result_json))
    tools.write_json(result_json, result, dense=True)
    # The task exit code lives in the json file; only an internal error makes
    # the process itself fail.
    return internal_error

  # Marshall into old-style inline output.
  outputs_ref = result['outputs_ref']
  if outputs_ref:
    # pylint: disable=unsubscriptable-object
    inline = {
        'hash': outputs_ref['isolated'],
        'namespace': outputs_ref['namespace'],
        'storage': outputs_ref['isolatedserver'],
    }
    sys.stdout.flush()
    print('[run_isolated_out_hack]%s[/run_isolated_out_hack]' %
          tools.format_json(inline, dense=True))
    sys.stdout.flush()
  return result['exit_code'] or internal_error
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001236
1237
# Yielded by 'install_client_and_packages'.
#
# Fields:
# - client: cipd.CipdClient object.
# - cache_dir: absolute path to bot-global cipd tag and instance cache.
# - stats: dict with stats to return to the server.
# - pins: dict with installed cipd pins to return to the server.
CipdInfo = collections.namedtuple(
    'CipdInfo', ('client', 'cache_dir', 'stats', 'pins'))
1245
1246
@contextlib.contextmanager
def noop_install_packages(_run_dir, _isolated_dir, _cas_dir):
  """Stands in for 'install_client_and_packages' when cipd is disabled.

  Accepts and ignores the same leading directories, installs nothing and
  yields None in place of a CipdInfo.
  """
  yield
1251
1252
Takuto Ikuta2efc7792019-11-27 14:33:34 +00001253def _install_packages(run_dir, cipd_cache_dir, client, packages):
iannuccib58d10d2017-03-18 02:00:25 -07001254 """Calls 'cipd ensure' for packages.
1255
1256 Args:
1257 run_dir (str): root of installation.
1258 cipd_cache_dir (str): the directory to use for the cipd package cache.
1259 client (CipdClient): the cipd client to use
1260 packages: packages to install, list [(path, package_name, version), ...].
iannuccib58d10d2017-03-18 02:00:25 -07001261
1262 Returns: list of pinned packages. Looks like [
1263 {
1264 'path': 'subdirectory',
1265 'package_name': 'resolved/package/name',
1266 'version': 'deadbeef...',
1267 },
1268 ...
1269 ]
1270 """
1271 package_pins = [None]*len(packages)
1272 def insert_pin(path, name, version, idx):
1273 package_pins[idx] = {
1274 'package_name': name,
1275 # swarming deals with 'root' as '.'
1276 'path': path or '.',
1277 'version': version,
1278 }
1279
1280 by_path = collections.defaultdict(list)
1281 for i, (path, name, version) in enumerate(packages):
1282 # cipd deals with 'root' as ''
1283 if path == '.':
1284 path = ''
1285 by_path[path].append((name, version, i))
1286
1287 pins = client.ensure(
Takuto Ikuta2efc7792019-11-27 14:33:34 +00001288 run_dir,
1289 {
1290 subdir: [(name, vers) for name, vers, _ in pkgs
1291 ] for subdir, pkgs in by_path.items()
1292 },
1293 cache_dir=cipd_cache_dir,
iannuccib58d10d2017-03-18 02:00:25 -07001294 )
1295
Marc-Antoine Ruel04903a32019-10-09 21:09:25 +00001296 for subdir, pin_list in sorted(pins.items()):
iannuccib58d10d2017-03-18 02:00:25 -07001297 this_subdir = by_path[subdir]
1298 for i, (name, version) in enumerate(pin_list):
1299 insert_pin(subdir, name, version, this_subdir[i][2])
1300
Robert Iannucci461b30d2017-12-13 11:34:03 -08001301 assert None not in package_pins, (packages, pins, package_pins)
iannuccib58d10d2017-03-18 02:00:25 -07001302
1303 return package_pins
1304
1305
@contextlib.contextmanager
def install_client_and_packages(run_dir, packages, service_url,
                                client_package_name, client_version, cache_dir,
                                isolated_dir, cas_dir):
  """Bootstraps the CIPD client, then installs the requested CIPD packages.

  Yields a single CipdInfo object carrying the CipdClient, the cache
  directory, timing stats and the pins.

  The pins and the CIPD client info have the following form:
    [
      {
        "path": path, "package_name": package_name, "version": version,
      },
      ...
    ]
  (the CIPD client info is a single dictionary instead of a list)

  They correspond 1:1 to all input package arguments from the command line.
  These dictionaries make their way all the way back to swarming, where they
  become the arguments of CipdPackage.

  When 'packages' is empty the CIPD client is still bootstrapped, but no
  user package is installed. The isolated and cas clients are always
  installed into |isolated_dir| and |cas_dir|.

  The bootstrapped client (regardless whether 'packages' list is empty or not),
  will be made available to the task via $PATH.

  Args:
    run_dir (str): root of installation.
    packages: packages to install, list [(path, package_name, version), ...].
    service_url (str): CIPD server url, e.g.
      "https://chrome-infra-packages.appspot.com."
    client_package_name (str): CIPD package name of CIPD client.
    client_version (str): Version of CIPD client.
    cache_dir (str): where to keep cache of cipd clients, packages and tags.
    isolated_dir (str): where to download isolated client.
    cas_dir (str): where to download cas client.
  """
  assert cache_dir

  started_at = time.time()

  cache_dir = os.path.abspath(cache_dir)
  # The tag and instance caches live in a dedicated sub directory.
  cipd_cache_dir = os.path.join(cache_dir, 'cache')
  run_dir = os.path.abspath(run_dir)
  if not packages:
    packages = []

  client_started_at = time.time()
  with cipd.get_client(cache_dir, service_url, client_package_name,
                       client_version) as client:
    get_client_duration = time.time() - client_started_at

    # User requested packages go to |run_dir|; nothing to pin when there is
    # none.
    package_pins = (
        _install_packages(run_dir, cipd_cache_dir, client, packages)
        if packages else [])

    # Install the isolated client to |isolated_dir|, then the cas client to
    # |cas_dir|. Both are pinned to the same luci-go revision.
    for tool_dir, tool_package in ((isolated_dir, ISOLATED_PACKAGE),
                                   (cas_dir, _CAS_PACKAGE)):
      _install_packages(tool_dir, cipd_cache_dir, client,
                        [('', tool_package, _LUCI_GO_REVISION)])

    file_path.make_tree_files_read_only(run_dir)

    total_duration = time.time() - started_at
    logging.info('Installing CIPD client and packages took %d seconds',
                 total_duration)

    stats = {
        'duration': total_duration,
        'get_client_duration': get_client_duration,
    }
    pins = {
        'client_package': {
            'package_name': client.package_name,
            'version': client.instance_id,
        },
        'packages': package_pins,
    }
    yield CipdInfo(
        client=client, cache_dir=cipd_cache_dir, stats=stats, pins=pins)
nodirbe642ff2016-06-09 15:51:51 -07001393
1394
def create_option_parser():
  """Builds the command line option parser of run_isolated.

  Registers the top level options, then one option group per feature (isolate
  server, CAS, caches, CIPD, named caches, process containment, debugging and
  authentication).

  Returns:
    The configured logging_utils.OptionParserWithLogging instance.
  """
  parser = logging_utils.OptionParserWithLogging(
      usage='%prog <options> [command to run or extra args]',
      version=__version__,
      log_file=RUN_ISOLATED_LOG_FILE)
  parser.add_option(
      '--clean',
      action='store_true',
      help='Cleans the cache, trimming it necessary and remove corrupted items '
      'and returns without executing anything; use with -v to know what '
      'was done')
  parser.add_option(
      '--json',
      help='dump output metadata to json file. When used, run_isolated returns '
      'non-zero only on internal failure')
  parser.add_option(
      '--hard-timeout', type='float', help='Enforce hard timeout in execution')
  parser.add_option(
      '--grace-period',
      type='float',
      help='Grace period between SIGTERM and SIGKILL')
  parser.add_option(
      '--relative-cwd',
      help='Ignore the isolated \'relative_cwd\' and use this one instead')
  parser.add_option(
      '--env',
      default=[],
      action='append',
      help='Environment variables to set for the child process')
  parser.add_option(
      '--env-prefix',
      default=[],
      action='append',
      help='Specify a VAR=./path/fragment to put in the environment variable '
      'before executing the command. The path fragment must be relative '
      'to the isolated run directory, and must not contain a `..` token. '
      'The path will be made absolute and prepended to the indicated '
      '$VAR using the OS\'s path separator. Multiple items for the same '
      '$VAR will be prepended in order.')
  parser.add_option(
      '--bot-file',
      help='Path to a file describing the state of the host. The content is '
      'defined by on_before_task() in bot_config.')
  parser.add_option(
      '--switch-to-account',
      help='If given, switches LUCI_CONTEXT to given logical service account '
      '(e.g. "task" or "system") before launching the isolated process.')
  parser.add_option(
      '--output',
      action='append',
      # The placeholder is spelled ${ISOLATED_OUTDIR}, as documented in the
      # module docstring.
      help='Specifies an output to return. If no outputs are specified, all '
      'files located in ${ISOLATED_OUTDIR} will be returned; '
      'otherwise, outputs in both ${ISOLATED_OUTDIR} and those '
      'specified by --output option (there can be multiple) will be '
      'returned. Note that if a file in OUT_DIR has the same path '
      'as an --output option, the --output version will be returned.')
  parser.add_option(
      '-a',
      '--argsfile',
      # This is actually handled in parse_args; it's included here purely so it
      # can make it into the help text.
      help='Specify a file containing a JSON array of arguments to this '
      'script. If --argsfile is provided, no other argument may be '
      'provided on the command line.')
  parser.add_option(
      '--report-on-exception',
      action='store_true',
      help='Whether report exception during execution to isolate server. '
      'This flag should only be used in swarming bot.')

  group = optparse.OptionGroup(parser, 'Data source - Isolate server')
  # Deprecated. Isolate server is being migrated to RBE-CAS.
  # Remove --isolated and isolate server options after migration.
  group.add_option(
      '-s', '--isolated',
      help='Hash of the .isolated to grab from the isolate server.')
  isolateserver.add_isolate_server_options(group)
  parser.add_option_group(group)

  group = optparse.OptionGroup(parser,
                               'Data source - Content Addressed Storage')
  group.add_option(
      '--cas-instance', help='Full CAS instance name for input/output files.')
  group.add_option(
      '--cas-digest',
      help='Digest of the input root on RBE-CAS. The format is '
      '`{hash}/{size_bytes}`.')
  parser.add_option_group(group)

  # Cache options.
  isolateserver.add_cache_options(parser)
  add_cas_cache_options(parser)

  cipd.add_cipd_options(parser)

  group = optparse.OptionGroup(parser, 'Named caches')
  group.add_option(
      '--named-cache',
      dest='named_caches',
      action='append',
      nargs=3,
      default=[],
      help='A named cache to request. Accepts 3 arguments: name, path, hint. '
      'name identifies the cache, must match regex [a-z0-9_]{1,4096}. '
      'path is a path relative to the run dir where the cache directory '
      'must be put to. '
      'This option can be specified more than once.')
  group.add_option(
      '--named-cache-root',
      default='named_caches',
      help='Cache root directory. Default=%default')
  parser.add_option_group(group)

  # These options must be registered on the group, not on the parser,
  # otherwise the 'Process containment' section of --help stays empty.
  group = optparse.OptionGroup(parser, 'Process containment')
  group.add_option(
      '--lower-priority', action='store_true',
      help='Lowers the child process priority')
  group.add_option(
      '--containment-type',
      choices=('NONE', 'AUTO', 'JOB_OBJECT'),
      default='NONE',
      help='Type of container to use')
  group.add_option(
      '--limit-processes',
      type='int',
      default=0,
      help='Maximum number of active processes in the containment')
  group.add_option(
      '--limit-total-committed-memory',
      type='int',
      default=0,
      help='Maximum sum of committed memory in the containment')
  parser.add_option_group(group)

  group = optparse.OptionGroup(parser, 'Debugging')
  group.add_option(
      '--leak-temp-dir',
      action='store_true',
      help='Deliberately leak isolate\'s temp dir for later examination. '
      'Default: %default')
  group.add_option('--root-dir', help='Use a directory instead of a random one')
  parser.add_option_group(group)

  auth.add_auth_options(parser)

  parser.set_defaults(cache='cache')
  return parser
1542
1543
def add_cas_cache_options(parser):
  """Registers the 'CAS cache management' option group on |parser|.

  The group holds --cas-cache (local cache directory, 'cas-cache' by default)
  and --kvs-file (empty by default).
  """
  cas_group = optparse.OptionGroup(parser, 'CAS cache management')

  cas_cache_help = (
      'Directory to keep a local cache of the files. Accelerates download '
      'by reusing already downloaded files. Default=%default')
  cas_group.add_option(
      '--cas-cache', metavar='DIR', default='cas-cache', help=cas_cache_help)

  kvs_file_help = 'CAS cache using kvs for small files. Default=%default'
  cas_group.add_option('--kvs-file', default='', help=kvs_file_help)

  parser.add_option_group(cas_group)
1557
1558
def process_cas_cache_options(options):
  """Creates the CAS content addressed cache described by |options|.

  Returns a local_caching.DiskContentAddressedCache rooted at the absolute
  path of --cas-cache when that option is set, otherwise a
  local_caching.MemoryContentAddressedCache. The disk cache is created with
  trim=False.
  """
  if not options.cas_cache:
    return local_caching.MemoryContentAddressedCache()

  cache_policies = local_caching.CachePolicies(
      max_cache_size=options.max_cache_size,
      min_free_space=options.min_free_space,
      # max_items isn't used for CAS cache for now.
      max_items=None,
      max_age_secs=MAX_AGE_SECS)
  cache_path = six.text_type(os.path.abspath(options.cas_cache))
  return local_caching.DiskContentAddressedCache(
      cache_path, cache_policies, trim=False)
1571
1572
def process_named_cache_options(parser, options, time_fn=None):
  """Validates the named cache options and creates the NamedCache.

  Every (name, path, hint) entry of options.named_caches is checked; the first
  invalid one is reported through parser.error().

  Args:
    parser: option parser used to report invalid options.
    options: parsed options; reads named_caches, named_cache_root and
        min_free_space.
    time_fn: forwarded as-is to local_caching.NamedCache.

  Returns:
    A local_caching.NamedCache rooted at --named-cache-root, or None when
    --named-cache-root is empty.
  """
  requested = options.named_caches
  if requested and not options.named_cache_root:
    parser.error('--named-cache is specified, but --named-cache-root is empty')

  for cache_name, cache_path, cache_hint in requested:
    if not CACHE_NAME_RE.match(cache_name):
      parser.error(
          'cache name %r does not match %r' %
          (cache_name, CACHE_NAME_RE.pattern))
    if not cache_path:
      parser.error('cache path cannot be empty')
    try:
      int(cache_hint)
    except ValueError:
      parser.error('cache hint must be a number')

  if not options.named_cache_root:
    return None

  # Make these configurable later if there is use case but for now it's fairly
  # safe values.
  # In practice, a fair chunk of bots are already recycled on a daily schedule
  # so this code doesn't have any effect to them, unless they are preloaded
  # with a really old cache.
  one_tib = 1024*1024*1024*1024
  policies = local_caching.CachePolicies(
      max_cache_size=one_tib,
      min_free_space=options.min_free_space,
      max_items=50,
      max_age_secs=MAX_AGE_SECS)
  named_cache_root = six.text_type(os.path.abspath(options.named_cache_root))
  named_cache = local_caching.NamedCache(
      named_cache_root, policies, time_fn=time_fn)
  # Touch any named caches we're going to use to minimize thrashing
  # between tasks that request some (but not all) of the same named caches.
  requested_names = [entry_name for entry_name, _, _ in options.named_caches]
  named_cache.touch(*requested_names)
  return named_cache
1606
1607
def parse_args(args):
  """Parses the command line, expanding --argsfile when it is given.

  Args:
    args: list of command line arguments.

  Returns:
    Tuple (parser, options, args) where parser is the parser built by
    create_option_parser() and (options, args) is what it parsed.
  """
  # Create a fake mini-parser just to get out the "-a" command. Note that
  # it's not documented here; instead, it's documented in create_option_parser
  # even though that parser will never actually get to parse it. This is
  # because --argsfile is exclusive with all other options and arguments.
  file_argparse = argparse.ArgumentParser(add_help=False)
  file_argparse.add_argument('-a', '--argsfile')
  (file_args, nonfile_args) = file_argparse.parse_known_args(args)
  if file_args.argsfile:
    if nonfile_args:
      # The two literals are concatenated: the trailing space is required.
      file_argparse.error('Can\'t specify --argsfile with '
                          'any other arguments (%s)' % nonfile_args)
    try:
      with open(file_args.argsfile, 'r') as f:
        loaded_args = json.load(f)
      if not isinstance(loaded_args, list):
        # --argsfile is documented as a JSON array; anything else cannot be
        # handed to the option parser.
        raise ValueError(
            'expected a JSON array, got %s' % type(loaded_args).__name__)
      args = loaded_args
    except (IOError, OSError, ValueError) as e:
      # We don't need to error out here - "args" is left untouched, so it
      # only holds the --argsfile flag and the regular parser below is still
      # run on it.
      print('Couldn\'t read arguments: %s' % e, file=sys.stderr)

  # Even if we failed to read the args, just call the normal parser now since it
  # will print the correct help message.
  parser = create_option_parser()
  options, args = parser.parse_args(args)
  if not isinstance(options.cipd_enabled, (bool, int)):
    options.cipd_enabled = distutils.util.strtobool(options.cipd_enabled)
  return (parser, options, args)
1636
1637
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001638def _calc_named_cache_hint(named_cache, named_caches):
1639 """Returns the expected size of the missing named caches."""
1640 present = named_cache.available
1641 size = 0
1642 for name, _, hint in named_caches:
1643 if name not in present:
Takuto Ikuta630f99d2020-07-02 12:59:35 +00001644 hint = int(hint)
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001645 if hint > 0:
1646 size += hint
1647 return size
1648
1649
Takuto Ikutaae391c52020-12-03 08:43:45 +00001650def _clean_cmd(parser, options, caches, root):
Takuto Ikuta7ff4b242020-12-03 08:07:06 +00001651 """Cleanup cache dirs/files."""
1652 if options.isolated:
1653 parser.error('Can\'t use --isolated with --clean.')
1654 if options.isolate_server:
1655 parser.error('Can\'t use --isolate-server with --clean.')
1656 if options.json:
1657 parser.error('Can\'t use --json with --clean.')
1658 if options.named_caches:
1659 parser.error('Can\t use --named-cache with --clean.')
1660 if options.cas_instance or options.cas_digest:
1661 parser.error('Can\t use --cas-instance, --cas-digest with --clean.')
1662
1663 logging.info("initial free space: %d", file_path.get_free_space(root))
1664
Takuto Ikutaae391c52020-12-03 08:43:45 +00001665 if options.kvs_file and fs.isfile(six.text_type(options.kvs_file)):
Takuto Ikuta7ff4b242020-12-03 08:07:06 +00001666 # Remove kvs file if its size exceeds fixed threshold.
Takuto Ikuta80bee362020-12-03 10:51:37 +00001667 st = fs.stat(six.text_type(options.kvs_file))
Takuto Ikuta7ff4b242020-12-03 08:07:06 +00001668 if st.st_size >= _CAS_KVS_CACHE_THRESHOLD:
1669 logging.info("remove kvs file with size: %d", st.st_size)
Takuto Ikuta80bee362020-12-03 10:51:37 +00001670 fs.remove(six.text_type(options.kvs_file))
Takuto Ikuta7ff4b242020-12-03 08:07:06 +00001671
1672 # Trim first, then clean.
1673 local_caching.trim_caches(
1674 caches,
1675 root,
1676 min_free_space=options.min_free_space,
1677 max_age_secs=MAX_AGE_SECS)
1678 logging.info("free space after trim: %d", file_path.get_free_space(root))
1679 for c in caches:
1680 c.cleanup()
1681 logging.info("free space after cleanup: %d", file_path.get_free_space(root))
1682
1683
aludwin7556e0c2016-10-26 08:46:10 -07001684def main(args):
Marc-Antoine Ruelee6ca622017-11-29 11:19:16 -05001685 # Warning: when --argsfile is used, the strings are unicode instances, when
1686 # parsed normally, the strings are str instances.
aludwin7556e0c2016-10-26 08:46:10 -07001687 (parser, options, args) = parse_args(args)
maruel36a963d2016-04-08 17:15:49 -07001688
Takuto Ikuta74682862021-02-03 04:49:12 +00001689 SWARMING_SERVER = 'SWARMING_SERVER'
1690 if options.report_on_exception and SWARMING_SERVER in os.environ:
1691 on_error.report_on_exception_exit(os.environ[SWARMING_SERVER])
Takuto Ikutad4be2f12020-05-12 02:15:25 +00001692
Marc-Antoine Ruel5028ba22017-08-25 17:37:51 -04001693 if not file_path.enable_symlink():
Marc-Antoine Ruel5a024272019-01-15 20:11:16 +00001694 logging.warning('Symlink support is not enabled')
Marc-Antoine Ruel5028ba22017-08-25 17:37:51 -04001695
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001696 named_cache = process_named_cache_options(parser, options)
Marc-Antoine Ruel0d8b0f62018-09-10 14:40:35 +00001697 # hint is 0 if there's no named cache.
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001698 hint = _calc_named_cache_hint(named_cache, options.named_caches)
1699 if hint:
1700 # Increase the --min-free-space value by the hint, and recreate the
1701 # NamedCache instance so it gets the updated CachePolicy.
1702 options.min_free_space += hint
1703 named_cache = process_named_cache_options(parser, options)
1704
Takuto Ikuta5c59a842020-01-24 03:05:24 +00001705 # TODO(crbug.com/932396): Remove this.
Takuto Ikuta4a22c2c2020-06-05 02:02:23 +00001706 use_go_isolated = options.cipd_enabled
Takuto Ikuta5c59a842020-01-24 03:05:24 +00001707
Marc-Antoine Ruel7139d912018-06-15 20:04:42 +00001708 # TODO(maruel): CIPD caches should be defined at an higher level here too, so
1709 # they can be cleaned the same way.
Takuto Ikutaf1c58442020-10-20 09:03:27 +00001710
1711 isolate_cache = isolateserver.process_cache_options(options, trim=False)
1712 cas_cache = process_cas_cache_options(options)
Takuto Ikuta00cf8fc2020-01-14 01:36:00 +00001713
Marc-Antoine Ruel7139d912018-06-15 20:04:42 +00001714 caches = []
1715 if isolate_cache:
1716 caches.append(isolate_cache)
Junji Watanabeb03450b2020-09-25 05:09:27 +00001717 if cas_cache:
1718 caches.append(cas_cache)
Marc-Antoine Ruel7139d912018-06-15 20:04:42 +00001719 if named_cache:
1720 caches.append(named_cache)
Takuto Ikuta6e2ff962019-10-29 12:35:27 +00001721 root = caches[0].cache_dir if caches else six.text_type(os.getcwd())
maruel36a963d2016-04-08 17:15:49 -07001722 if options.clean:
Takuto Ikutaae391c52020-12-03 08:43:45 +00001723 _clean_cmd(parser, options, caches, root)
maruel36a963d2016-04-08 17:15:49 -07001724 return 0
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001725
1726 # Trim must still be done for the following case:
1727 # - named-cache was used
1728 # - some entries, with a large hint, where missing
1729 # - --min-free-space was increased accordingly, thus trimming is needed
1730 # Otherwise, this will have no effect, as bot_main calls run_isolated with
1731 # --clean after each task.
Takuto Ikutac9ddff22021-02-18 07:58:39 +00001732 additional_buffer = _FREE_SPACE_BUFFER_FOR_CIPD_PACKAGES
Takuto Ikuta7f45c592021-02-09 05:57:05 +00001733 if options.kvs_file:
1734 additional_buffer += _CAS_KVS_CACHE_THRESHOLD
Takuto Ikutaa010c532020-10-21 05:42:29 +00001735 local_caching.trim_caches(
1736 caches,
1737 root,
Takuto Ikutac9ddff22021-02-18 07:58:39 +00001738 # Add some buffer for Go CLI.
Takuto Ikuta7f45c592021-02-09 05:57:05 +00001739 min_free_space=options.min_free_space + additional_buffer,
Takuto Ikutaa010c532020-10-21 05:42:29 +00001740 max_age_secs=MAX_AGE_SECS)
maruel36a963d2016-04-08 17:15:49 -07001741
Takuto Ikutaf1c58442020-10-20 09:03:27 +00001742 # Save state of isolate/cas cache not to overwrite state from go client.
1743 if use_go_isolated:
1744 isolate_cache.save()
1745 isolate_cache = None
1746 if cas_cache:
1747 cas_cache.save()
1748 cas_cache = None
1749
nodir55be77b2016-05-03 09:39:57 -07001750 if not options.isolated and not args:
1751 parser.error('--isolated or command to run is required.')
1752
Vadim Shtayura5d1efce2014-02-04 10:55:43 -08001753 auth.process_auth_options(parser, options)
nodir55be77b2016-05-03 09:39:57 -07001754
Takuto Ikutaae767b32020-05-11 01:22:19 +00001755 isolateserver.process_isolate_server_options(parser, options, False)
Junji Watanabeed9ce352020-09-25 12:32:07 +00001756 if ISOLATED_OUTDIR_PARAMETER in args and (not options.isolate_server and
1757 not options.cas_instance):
1758 parser.error('%s in args requires --isolate-server or --cas-instance' %
1759 ISOLATED_OUTDIR_PARAMETER)
1760
1761 if options.isolated and not options.isolate_server:
1762 parser.error('--isolated requires --isolate-server')
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001763
nodir90bc8dc2016-06-15 13:35:21 -07001764 if options.root_dir:
Takuto Ikuta6e2ff962019-10-29 12:35:27 +00001765 options.root_dir = six.text_type(os.path.abspath(options.root_dir))
Takuto Ikutad46ea762020-10-07 05:43:22 +00001766 else:
1767 options.root_dir = six.text_type(tempfile.mkdtemp(prefix='root'))
maruel12e30012015-10-09 11:55:35 -07001768 if options.json:
Takuto Ikuta6e2ff962019-10-29 12:35:27 +00001769 options.json = six.text_type(os.path.abspath(options.json))
nodir55be77b2016-05-03 09:39:57 -07001770
Marc-Antoine Ruel19dd8872017-11-28 18:33:39 -05001771 if any('=' not in i for i in options.env):
1772 parser.error(
1773 '--env required key=value form. value can be skipped to delete '
1774 'the variable')
Marc-Antoine Ruel7a68f712017-12-01 18:45:18 -05001775 options.env = dict(i.split('=', 1) for i in options.env)
Marc-Antoine Ruel19dd8872017-11-28 18:33:39 -05001776
1777 prefixes = {}
1778 cwd = os.path.realpath(os.getcwd())
1779 for item in options.env_prefix:
1780 if '=' not in item:
1781 parser.error(
1782 '--env-prefix %r is malformed, must be in the form `VAR=./path`'
1783 % item)
Marc-Antoine Ruel7a68f712017-12-01 18:45:18 -05001784 key, opath = item.split('=', 1)
Marc-Antoine Ruel19dd8872017-11-28 18:33:39 -05001785 if os.path.isabs(opath):
1786 parser.error('--env-prefix %r path is bad, must be relative.' % opath)
1787 opath = os.path.normpath(opath)
1788 if not os.path.realpath(os.path.join(cwd, opath)).startswith(cwd):
1789 parser.error(
Junji Watanabe38b28b02020-04-23 10:23:30 +00001790 '--env-prefix %r path is bad, must be relative and not contain `..`.'
1791 % opath)
Marc-Antoine Ruel19dd8872017-11-28 18:33:39 -05001792 prefixes.setdefault(key, []).append(opath)
1793 options.env_prefix = prefixes
Robert Iannuccibf5f84c2017-11-22 12:56:50 -08001794
nodirbe642ff2016-06-09 15:51:51 -07001795 cipd.validate_cipd_options(parser, options)
1796
vadimsh232f5a82017-01-20 19:23:44 -08001797 install_packages_fn = noop_install_packages
Ye Kuang1d096cb2020-06-26 08:38:21 +00001798 tmp_cipd_cache_dir = None
vadimsh902948e2017-01-20 15:57:32 -08001799 if options.cipd_enabled:
Ye Kuang1d096cb2020-06-26 08:38:21 +00001800 cache_dir = options.cipd_cache
1801 if not cache_dir:
1802 tmp_cipd_cache_dir = six.text_type(tempfile.mkdtemp())
1803 cache_dir = tmp_cipd_cache_dir
Takuto Ikutab7ce0e32019-11-27 23:26:18 +00001804 install_packages_fn = (
Junji Watanabe4b890ef2020-09-16 01:43:27 +00001805 lambda run_dir, isolated_dir, cas_dir: install_client_and_packages(
Ye Kuang1d096cb2020-06-26 08:38:21 +00001806 run_dir,
1807 cipd.parse_package_args(options.cipd_packages),
1808 options.cipd_server,
1809 options.cipd_client_package,
1810 options.cipd_client_version,
1811 cache_dir=cache_dir,
Junji Watanabe4b890ef2020-09-16 01:43:27 +00001812 isolated_dir=isolated_dir,
1813 cas_dir=cas_dir,
1814 ))
nodirbe642ff2016-06-09 15:51:51 -07001815
nodird6160682017-02-02 13:03:35 -08001816 @contextlib.contextmanager
nodir0ae98b32017-05-11 13:21:53 -07001817 def install_named_caches(run_dir):
nodird6160682017-02-02 13:03:35 -08001818 # WARNING: this function depends on "options" variable defined in the outer
1819 # function.
Takuto Ikuta6e2ff962019-10-29 12:35:27 +00001820 assert six.text_type(run_dir), repr(run_dir)
Marc-Antoine Ruel49f9f8d2018-05-24 15:57:06 -04001821 assert os.path.isabs(run_dir), run_dir
Takuto Ikuta6e2ff962019-10-29 12:35:27 +00001822 named_caches = [(os.path.join(run_dir, six.text_type(relpath)), name)
1823 for name, relpath, _ in options.named_caches]
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001824 for path, name in named_caches:
Marc-Antoine Ruele79ddbf2018-06-13 18:33:07 +00001825 named_cache.install(path, name)
nodird6160682017-02-02 13:03:35 -08001826 try:
1827 yield
1828 finally:
dnje289d132017-07-07 11:16:44 -07001829 # Uninstall each named cache, returning it to the cache pool. If an
1830 # uninstall fails for a given cache, it will remain in the task's
1831 # temporary space, get cleaned up by the Swarming bot, and be lost.
1832 #
1833 # If the Swarming bot cannot clean up the cache, it will handle it like
1834 # any other bot file that could not be removed.
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001835 for path, name in reversed(named_caches):
Marc-Antoine Ruele79ddbf2018-06-13 18:33:07 +00001836 try:
Marc-Antoine Ruele9558372018-08-03 03:41:22 +00001837 # uninstall() doesn't trim but does call save() implicitly. Trimming
1838 # *must* be done manually via periodic 'run_isolated.py --clean'.
Marc-Antoine Ruele79ddbf2018-06-13 18:33:07 +00001839 named_cache.uninstall(path, name)
1840 except local_caching.NamedCacheError:
1841 logging.exception('Error while removing named cache %r at %r. '
1842 'The cache will be lost.', path, name)
nodirf33b8d62016-10-26 22:34:58 -07001843
Takuto Ikutaf3caa9b2020-11-02 05:38:26 +00001844 command = args
1845 if options.relative_cwd:
1846 a = os.path.normpath(os.path.abspath(options.relative_cwd))
1847 if not a.startswith(os.getcwd()):
1848 parser.error(
1849 '--relative-cwd must not try to escape the working directory')
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -05001850
Marc-Antoine Ruel1b65f4e2019-05-02 21:56:58 +00001851 containment_type = subprocess42.Containment.NONE
1852 if options.containment_type == 'AUTO':
1853 containment_type = subprocess42.Containment.AUTO
1854 if options.containment_type == 'JOB_OBJECT':
1855 containment_type = subprocess42.Containment.JOB_OBJECT
1856 containment = subprocess42.Containment(
1857 containment_type=containment_type,
1858 limit_processes=options.limit_processes,
1859 limit_total_committed_memory=options.limit_total_committed_memory)
1860
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -05001861 data = TaskData(
1862 command=command,
Marc-Antoine Ruel95068cf2017-12-07 21:35:05 -05001863 relative_cwd=options.relative_cwd,
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -05001864 isolated_hash=options.isolated,
1865 storage=None,
1866 isolate_cache=isolate_cache,
Junji Watanabe54925c32020-09-08 00:56:18 +00001867 cas_instance=options.cas_instance,
1868 cas_digest=options.cas_digest,
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -05001869 outputs=options.output,
1870 install_named_caches=install_named_caches,
1871 leak_temp_dir=options.leak_temp_dir,
1872 root_dir=_to_unicode(options.root_dir),
1873 hard_timeout=options.hard_timeout,
1874 grace_period=options.grace_period,
1875 bot_file=options.bot_file,
1876 switch_to_account=options.switch_to_account,
1877 install_packages_fn=install_packages_fn,
Takuto Ikuta5c59a842020-01-24 03:05:24 +00001878 use_go_isolated=use_go_isolated,
Takuto Ikuta10cae642020-01-08 08:12:07 +00001879 go_cache_dir=options.cache,
Takuto Ikuta879788c2020-01-10 08:00:26 +00001880 go_cache_policies=local_caching.CachePolicies(
1881 max_cache_size=options.max_cache_size,
1882 min_free_space=options.min_free_space,
1883 max_items=options.max_items,
1884 max_age_secs=None,
1885 ),
Junji Watanabeb03450b2020-09-25 05:09:27 +00001886 cas_cache_dir=options.cas_cache,
1887 cas_cache_policies=local_caching.CachePolicies(
1888 max_cache_size=options.max_cache_size,
1889 min_free_space=options.min_free_space,
1890 max_items=None,
1891 max_age_secs=None,
1892 ),
Takuto Ikutaae391c52020-12-03 08:43:45 +00001893 cas_kvs=options.kvs_file,
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -05001894 env=options.env,
Marc-Antoine Ruel03c6fd12019-04-30 12:12:55 +00001895 env_prefix=options.env_prefix,
Marc-Antoine Ruel1b65f4e2019-05-02 21:56:58 +00001896 lower_priority=bool(options.lower_priority),
1897 containment=containment)
nodirbe642ff2016-06-09 15:51:51 -07001898 try:
nodir90bc8dc2016-06-15 13:35:21 -07001899 if options.isolate_server:
Marc-Antoine Ruelb8513132018-11-20 19:48:53 +00001900 server_ref = isolate_storage.ServerRef(
nodir90bc8dc2016-06-15 13:35:21 -07001901 options.isolate_server, options.namespace)
Marc-Antoine Ruelb8513132018-11-20 19:48:53 +00001902 storage = isolateserver.get_storage(server_ref)
nodir90bc8dc2016-06-15 13:35:21 -07001903 with storage:
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -05001904 data = data._replace(storage=storage)
nodirf33b8d62016-10-26 22:34:58 -07001905 # Hashing schemes used by |storage| and |isolate_cache| MUST match.
Marc-Antoine Ruelb8513132018-11-20 19:48:53 +00001906 assert storage.server_ref.hash_algo == server_ref.hash_algo
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -05001907 return run_tha_test(data, options.json)
1908 return run_tha_test(data, options.json)
Junji Watanabe38b28b02020-04-23 10:23:30 +00001909 except (cipd.Error, local_caching.NamedCacheError,
1910 local_caching.NoMoreSpace) as ex:
Marc-Antoine Ruelf899c482019-10-10 23:32:06 +00001911 print(ex.message, file=sys.stderr)
nodirbe642ff2016-06-09 15:51:51 -07001912 return 1
Ye Kuang1d096cb2020-06-26 08:38:21 +00001913 finally:
1914 if tmp_cipd_cache_dir is not None:
1915 try:
1916 file_path.rmtree(tmp_cipd_cache_dir)
1917 except OSError:
1918 logging.exception('Remove tmp_cipd_cache_dir=%s failed',
1919 tmp_cipd_cache_dir)
1920 # Best effort clean up. Failed to do so doesn't affect the outcome.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001921
1922
if __name__ == '__main__':
  # Script entry point: perform the one-time process-wide setup, then hand the
  # command line arguments to main() and exit with whatever it returns.
  subprocess42.inhibit_os_error_reporting()
  # Make sure the process always runs with the correct encoding.
  fix_encoding.fix_encoding()
  # Identify this tool (and its version) in the user agent used by net.
  user_agent = 'run_isolated.py/' + __version__
  net.set_user_agent(user_agent)
  exit_code = main(sys.argv[1:])
  sys.exit(exit_code)