#!/usr/bin/env python
# Copyright 2012 The LUCI Authors. All rights reserved.
# Use of this source code is governed under the Apache License, Version 2.0
# that can be found in the LICENSE file.

"""Runs a command with optional isolated input/output.

run_isolated takes care of setting up a temporary environment, running a
command, and tearing it down.

It handles downloading and uploading isolated files, mapping CIPD packages and
reusing stateful named caches.

The isolated files, CIPD packages and named caches are kept as a global LRU
cache.

Any ${EXECUTABLE_SUFFIX} on the command line or the environment variables passed
with the --env option will be replaced with ".exe" string on Windows and "" on
other platforms.

Any ${ISOLATED_OUTDIR} on the command line or the environment variables passed
with the --env option will be replaced by the location of a temporary directory
upon execution of the command specified in the .isolated file. All content
written to this directory will be uploaded upon termination and the .isolated
file describing this directory will be printed to stdout.

Any ${SWARMING_BOT_FILE} on the command line or the environment variables passed
with the --env option will be replaced by the value of the --bot-file parameter.
This file is used by a swarming bot to communicate state of the host to tasks.
It is written to by the swarming bot's on_before_task() hook in the swarming
server's custom bot_config.py.

See
https://chromium.googlesource.com/infra/luci/luci-py.git/+/master/appengine/swarming/doc/Magic-Values.md
for all the variables.

See
https://chromium.googlesource.com/infra/luci/luci-py.git/+/master/appengine/swarming/swarming_bot/config/bot_config.py
for more information about bot_config.py.
"""

from __future__ import print_function

__version__ = '1.0.1'

import argparse
import base64
import collections
import contextlib
import distutils
import errno
import json
import logging
import optparse
import os
import platform
import re
import sys
import tempfile
import time

from utils import tools
tools.force_local_third_party()

# third_party/
from depot_tools import fix_encoding
import six

# pylint: disable=ungrouped-imports
import auth
import cipd
import isolate_storage
import isolateserver
import local_caching
from libs import luci_context
from utils import file_path
from utils import fs
from utils import large
from utils import logging_utils
from utils import net
from utils import on_error
from utils import subprocess42


# Magic variables that can be found in the isolate task command line.
ISOLATED_OUTDIR_PARAMETER = '${ISOLATED_OUTDIR}'
EXECUTABLE_SUFFIX_PARAMETER = '${EXECUTABLE_SUFFIX}'
SWARMING_BOT_FILE_PARAMETER = '${SWARMING_BOT_FILE}'


# The name of the log file to use.
RUN_ISOLATED_LOG_FILE = 'run_isolated.log'


# The name of the log to use for the run_test_cases.py command
RUN_TEST_CASES_LOG = 'run_test_cases.log'


# Use short names for temporary directories. This is driven by Windows, which
# imposes a relatively short maximum path length of 260 characters, often
# referred to as MAX_PATH. It is relatively easy to create files with longer
# path length. A use case is with recursive dependency trees like npm packages.
#
# It is recommended to start the script with a `root_dir` as short as
# possible.
# - ir stands for isolated_run
# - io stands for isolated_out
# - it stands for isolated_tmp
# - ic stands for isolated_client
# - cc stands for cas_client
ISOLATED_RUN_DIR = u'ir'
ISOLATED_OUT_DIR = u'io'
ISOLATED_TMP_DIR = u'it'
ISOLATED_CLIENT_DIR = u'ic'
_CAS_CLIENT_DIR = u'cc'

# TODO(tikuta): take these parameter from luci-config?
# Update tag by `./client/update_isolated.sh`.
# Or take revision from
# https://ci.chromium.org/p/infra-internal/g/infra-packagers/console
ISOLATED_PACKAGE = 'infra/tools/luci/isolated/${platform}'
ISOLATED_REVISION = 'git_revision:3ccf4cc0119188dbc4befff330348d972b15711d'
_CAS_PACKAGE = 'infra/tools/luci/cas/${platform}'
# TODO(jwata): pin a stable version.
_CAS_REVISION = 'latest'

# Keep synced with task_request.py
CACHE_NAME_RE = re.compile(r'^[a-z0-9_]{1,4096}$')


# Message printed when the run directory could not be deleted after the task.
# Takes two %s arguments, in order: the directory name and the grace period in
# seconds.
OUTLIVING_ZOMBIE_MSG = """\
*** Swarming tried multiple times to delete the %s directory and failed ***
*** Hard failing the task ***

Swarming detected that your testing script ran an executable, which may have
started a child executable, and the main script returned early, leaving the
children executables playing around unguided.

You don't want to leave children processes outliving the task on the Swarming
bot, do you? The Swarming bot doesn't.

How to fix?
- For any process that starts children processes, make sure all children
  processes terminated properly before each parent process exits. This is
  especially important in very deep process trees.
  - This must be done properly both in normal successful task and in case of
    task failure. Cleanup is very important.
- The Swarming bot sends a SIGTERM in case of timeout.
  - You have %s seconds to comply after the signal was sent to the process
    before the process is forcibly killed.
- To achieve not leaking children processes in case of signals on timeout, you
  MUST handle signals in each executable / python script and propagate them to
  children processes.
  - When your test script (python or binary) receives a signal like SIGTERM or
    CTRL_BREAK_EVENT on Windows), send it to all children processes and wait for
    them to terminate before quitting.

See
https://chromium.googlesource.com/infra/luci/luci-py.git/+/master/appengine/swarming/doc/Bot.md#Graceful-termination_aka-the-SIGTERM-and-SIGKILL-dance
for more information.

*** May the SIGKILL force be with you ***
"""


# Currently hardcoded. Eventually could be exposed as a flag once there's value.
# 3 weeks
MAX_AGE_SECS = 21*24*60*60

# TODO(1099655): Enable this once all prod issues are gone.
_USE_GO_ISOLATED_TO_UPLOAD = False

# Immutable bundle of all the parameters describing one task to run.
TaskData = collections.namedtuple(
    'TaskData',
    [
        # List of strings; the command line to use, independent of what was
        # specified in the isolated file.
        'command',
        # Relative directory to start command into.
        'relative_cwd',
        # List of strings; the arguments to add to the command specified in the
        # isolated file.
        'extra_args',
        # Hash of the .isolated file that must be retrieved to recreate the tree
        # of files to run the target executable. The command specified in the
        # .isolated is executed. Mutually exclusive with command argument.
        'isolated_hash',
        # isolateserver.Storage instance to retrieve remote objects. This object
        # has a reference to an isolateserver.StorageApi, which does the actual
        # I/O.
        'storage',
        # isolateserver.LocalCache instance to keep from retrieving the same
        # objects constantly by caching the objects retrieved. Can be on-disk or
        # in-memory.
        'isolate_cache',
        # Digest of the input root on RBE-CAS.
        'cas_digest',
        # Full CAS instance name.
        'cas_instance',
        # List of paths relative to root_dir to put into the output isolated
        # bundle upon task completion (see link_outputs_to_outdir).
        'outputs',
        # Function (run_dir) => context manager that installs named caches into
        # |run_dir|.
        'install_named_caches',
        # If True, the temporary directory will be deliberately leaked for later
        # examination.
        'leak_temp_dir',
        # Path to the directory to use to create the temporary directory. If not
        # specified, a random temporary directory is created.
        'root_dir',
        # Kills the process if it lasts more than this amount of seconds.
        'hard_timeout',
        # Number of seconds to wait between SIGTERM and SIGKILL.
        'grace_period',
        # Path to a file with bot state, used in place of ${SWARMING_BOT_FILE}
        # task command line argument.
        'bot_file',
        # Logical account to switch LUCI_CONTEXT into.
        'switch_to_account',
        # Context manager dir => CipdInfo, see install_client_and_packages.
        'install_packages_fn',
        # Use go isolated client.
        'use_go_isolated',
        # Cache directory for go `isolated` client.
        'go_cache_dir',
        # Parameters passed to go `isolated` client.
        'go_cache_policies',
        # Cache directory for `cas` client.
        'cas_cache_dir',
        # Parameters passed to `cas` client.
        'cas_cache_policies',
        # Environment variables to set.
        'env',
        # Environment variables to mutate with relative directories.
        # Example: {"ENV_KEY": ['relative', 'paths', 'to', 'prepend']}
        'env_prefix',
        # Lowers the task process priority.
        'lower_priority',
        # subprocess42.Containment instance. Can be None.
        'containment',
    ])


def _to_str(s):
  """Downgrades a unicode instance to str. Pass str through as-is.

  Args:
    s: a str instance, or an object with an encode() method (a unicode
       instance on python 2).

  Returns:
    |s| itself when it is already a str, otherwise |s| encoded as UTF-8.
  """
  if isinstance(s, str):
    return s
  # This is technically incorrect, especially on Windows. In theory
  # sys.getfilesystemencoding() should be used to use the right 'ANSI code
  # page' on Windows, but that causes other problems, as the character set
  # is very limited.
  return s.encode('utf-8')


def _to_unicode(s):
  """Upgrades a str instance to unicode. Pass unicode through as-is.

  Args:
    s: a six.text_type instance, None, or an object with a decode() method.

  Returns:
    |s| itself when it is None or already six.text_type, otherwise |s| decoded
    as UTF-8.
  """
  if isinstance(s, six.text_type) or s is None:
    return s
  return s.decode('utf-8')


def make_temp_dir(prefix, root_dir):
  """Returns a new unique temporary directory.

  Args:
    prefix: prefix of the directory name, passed to tempfile.mkdtemp().
    root_dir: directory in which the new directory is created, passed as |dir|
              to tempfile.mkdtemp().

  Returns:
    The path of the created directory, as six.text_type.
  """
  return six.text_type(tempfile.mkdtemp(prefix=prefix, dir=root_dir))


@contextlib.contextmanager
def set_luci_context_account(account, tmp_dir):
  """Sets LUCI_CONTEXT account to be used by the task.

  If 'account' is None or '', does nothing at all. This happens when
  run_isolated.py is called without '--switch-to-account' flag. In this case,
  if run_isolated.py is running in some LUCI_CONTEXT environment, the task will
  just inherit whatever account is already set. This may happen if users invoke
  run_isolated.py explicitly from their code.

  If the requested account is not defined in the context, switches to
  non-authenticated access. This happens for Swarming tasks that don't use
  'task' service accounts.

  If not using LUCI_CONTEXT-based auth, does nothing.
  If already running as requested account, does nothing.

  Args:
    account: logical account ID to switch to; can be None or ''.
    tmp_dir: passed as |_tmpdir| to luci_context.write() when the context has
             to be rewritten.

  Yields:
    None, once, with the modified context (if any) in effect for the duration
    of the 'with' block.
  """
  if not account:
    # Not actually switching.
    yield
    return

  local_auth = luci_context.read('local_auth')
  if not local_auth:
    # Not using LUCI_CONTEXT auth at all.
    yield
    return

  # See LUCI_CONTEXT.md for the format of 'local_auth'.
  if local_auth.get('default_account_id') == account:
    # Already set, no need to switch.
    yield
    return

  available = {a['id'] for a in local_auth.get('accounts') or []}
  if account in available:
    logging.info('Switching default LUCI_CONTEXT account to %r', account)
    local_auth['default_account_id'] = account
  else:
    logging.warning(
        'Requested LUCI_CONTEXT account %r is not available (have only %r), '
        'disabling authentication', account, sorted(available))
    # Without a default account the task runs unauthenticated.
    local_auth.pop('default_account_id', None)

  with luci_context.write(_tmpdir=tmp_dir, local_auth=local_auth):
    yield


def process_command(command, out_dir, bot_file):
  """Replaces parameters in a command line.

  Args:
    command: list of strings; each one is processed independently with
             replace_parameters().
    out_dir: value substituted for ISOLATED_OUTDIR_PARAMETER.
    bot_file: value substituted for SWARMING_BOT_FILE_PARAMETER.

  Returns:
    A new list with the processed arguments, in the same order.

  Raises:
    ValueError if a parameter is requested in |command| but its value is not
    provided.
  """
  return [replace_parameters(arg, out_dir, bot_file) for arg in command]


def replace_parameters(arg, out_dir, bot_file):
  """Replaces parameter tokens with appropriate values in a string.

  Args:
    arg: string in which the tokens are looked up.
    out_dir: value substituted for ISOLATED_OUTDIR_PARAMETER.
    bot_file: value substituted for SWARMING_BOT_FILE_PARAMETER. When falsy,
              the token is left unchanged and a warning is logged.

  Returns:
    |arg| with the tokens replaced. When an out_dir or bot_file substitution
    happened, every '/' in the result is also replaced with os.sep.

  Raises:
    ValueError if a parameter is requested in |arg| but its value is not
    provided.
  """
  arg = arg.replace(EXECUTABLE_SUFFIX_PARAMETER, cipd.EXECUTABLE_SUFFIX)
  replace_slash = False
  if ISOLATED_OUTDIR_PARAMETER in arg:
    if not out_dir:
      raise ValueError(
          'output directory is requested in command or env var, but not '
          'provided; please specify one')
    arg = arg.replace(ISOLATED_OUTDIR_PARAMETER, out_dir)
    replace_slash = True
  if SWARMING_BOT_FILE_PARAMETER in arg:
    if bot_file:
      arg = arg.replace(SWARMING_BOT_FILE_PARAMETER, bot_file)
      replace_slash = True
    else:
      logging.warning('SWARMING_BOT_FILE_PARAMETER found in command or env '
                      'var, but no bot_file specified. Leaving parameter '
                      'unchanged.')
  if replace_slash:
    # Replace slashes only if parameters are present
    # because of arguments like '${ISOLATED_OUTDIR}/foo/bar'
    arg = arg.replace('/', os.sep)
  return arg



def get_command_env(tmp_dir, cipd_info, run_dir, env, env_prefixes, out_dir,
                    bot_file):
  """Returns full OS environment to run a command in.

  Sets up TEMP, puts directory with cipd binary in front of PATH, exposes
  CIPD_CACHE_DIR env var, and installs all env_prefixes.

  Args:
    tmp_dir: temp directory.
    cipd_info: CipdInfo object if cipd client is used, None if not.
    run_dir: The root directory the isolated tree is mapped in.
    env: environment variables to use. A variable with an empty value is
        removed from the resulting environment.
    env_prefixes: {"ENV_KEY": ['cwd', 'relative', 'paths', 'to', 'prepend']}
    out_dir: Isolated output directory. Required to be != None if any of the
        env vars contain ISOLATED_OUTDIR_PARAMETER.
    bot_file: Required to be != None if any of the env vars contain
        SWARMING_BOT_FILE_PARAMETER.

  Returns:
    A dict, starting from a copy of os.environ, with the changes applied.
  """
  out = os.environ.copy()
  for k, v in env.items():
    if not v:
      out.pop(k, None)
    else:
      out[k] = replace_parameters(v, out_dir, bot_file)

  if cipd_info:
    bin_dir = _to_str(os.path.dirname(cipd_info.client.binary_path))
    # PATH can be missing: either it is not set in the process environment or
    # it was just removed through |env|. Do not fail in that case, and do not
    # leave a dangling separator behind.
    cur_path = out.get('PATH')
    if cur_path:
      out['PATH'] = '%s%s%s' % (bin_dir, os.pathsep, cur_path)
    else:
      out['PATH'] = bin_dir
    out['CIPD_CACHE_DIR'] = _to_str(cipd_info.cache_dir)

  for key, paths in env_prefixes.items():
    assert isinstance(paths, list), paths
    paths = [os.path.normpath(os.path.join(run_dir, p)) for p in paths]
    cur = out.get(key)
    if cur:
      # The pre-existing value goes last so the prefixes take precedence.
      paths.append(cur)
    out[key] = _to_str(os.path.pathsep.join(paths))

  tmp_dir = _to_str(tmp_dir)
  # pylint: disable=line-too-long
  # * python respects $TMPDIR, $TEMP, and $TMP in this order, regardless of
  #   platform. So $TMPDIR must be set on all platforms.
  #   https://github.com/python/cpython/blob/2.7/Lib/tempfile.py#L155
  out['TMPDIR'] = tmp_dir
  if sys.platform == 'win32':
    # * chromium's base utils uses GetTempPath().
    #   https://cs.chromium.org/chromium/src/base/files/file_util_win.cc?q=GetTempPath
    # * Go uses GetTempPath().
    # * GetTempDir() uses %TMP%, then %TEMP%, then other stuff. So %TMP% must be
    #   set.
    #   https://docs.microsoft.com/en-us/windows/desktop/api/fileapi/nf-fileapi-gettemppathw
    out['TMP'] = tmp_dir
    # https://blogs.msdn.microsoft.com/oldnewthing/20150417-00/?p=44213
    out['TEMP'] = tmp_dir
  elif sys.platform == 'darwin':
    # * Chromium uses an hack on macOS before calling into
    #   NSTemporaryDirectory().
    #   https://cs.chromium.org/chromium/src/base/files/file_util_mac.mm?q=GetTempDir
    #   https://developer.apple.com/documentation/foundation/1409211-nstemporarydirectory
    out['MAC_CHROMIUM_TMPDIR'] = tmp_dir
  else:
    # TMPDIR is specified as the POSIX standard envvar for the temp directory.
    # http://pubs.opengroup.org/onlinepubs/9699919799/basedefs/V1_chap08.html
    # * mktemp on linux respects $TMPDIR.
    # * Chromium respects $TMPDIR on linux.
    #   https://cs.chromium.org/chromium/src/base/files/file_util_posix.cc?q=GetTempDir
    # * Go uses $TMPDIR.
    #   https://go.googlesource.com/go/+/go1.10.3/src/os/file_unix.go#307
    pass
  return out


def run_command(
    command, cwd, env, hard_timeout, grace_period, lower_priority, containment):
  """Runs the command.

  Args:
    command: list of strings; the command line to run.
    cwd: directory to start the command in.
    env: environment variables for the child process.
    hard_timeout: seconds to wait for the process before sending SIGTERM; a
        falsy value is passed to wait() as None.
    grace_period: seconds to wait after SIGTERM before sending SIGKILL; a
        falsy value is passed to wait() as None.
    lower_priority: forwarded to subprocess42.Popen().
    containment: forwarded to subprocess42.Popen().

  Returns:
    tuple(process exit code, bool if had a hard timeout)
  """
  logging.info(
      'run_command(%s, %s, %s, %s, %s, %s)',
      command, cwd, hard_timeout, grace_period, lower_priority, containment)

  exit_code = None
  had_hard_timeout = False
  with tools.Profiler('RunTest'):
    proc = None
    # A list is used so the nested handler can record the signal without
    # rebinding a name of the enclosing scope.
    had_signal = []
    try:
      # TODO(maruel): This code is imperfect. It doesn't handle well signals
      # during the download phase and there's short windows were things can go
      # wrong.
      def handler(signum, _frame):
        if proc and not had_signal:
          logging.info('Received signal %d', signum)
          had_signal.append(True)
          # Reuse the timeout code path below to terminate the child.
          raise subprocess42.TimeoutExpired(command, None)

      proc = subprocess42.Popen(
          command, cwd=cwd, env=env, detached=True, close_fds=True,
          lower_priority=lower_priority, containment=containment)
      with subprocess42.set_signal_handler(subprocess42.STOP_SIGNALS, handler):
        try:
          exit_code = proc.wait(hard_timeout or None)
        except subprocess42.TimeoutExpired:
          if not had_signal:
            logging.warning('Hard timeout')
            had_hard_timeout = True
          logging.warning('Sending SIGTERM')
          proc.terminate()

      # Ignore signals in grace period. Forcibly give the grace period to the
      # child process.
      if exit_code is None:
        ignore = lambda *_: None
        with subprocess42.set_signal_handler(subprocess42.STOP_SIGNALS, ignore):
          try:
            exit_code = proc.wait(grace_period or None)
          except subprocess42.TimeoutExpired:
            # Now kill for real. The user can distinguish between the
            # following states:
            # - signal but process exited within grace period,
            #   hard_timed_out will be set but the process exit code will be
            #   script provided.
            # - processed exited late, exit code will be -9 on posix.
            logging.warning('Grace exhausted; sending SIGKILL')
            proc.kill()
        logging.info('Waiting for process exit')
        exit_code = proc.wait()
    except OSError as e:
      # This is not considered to be an internal error. The executable simply
      # does not exist.
      sys.stderr.write(
          '<The executable does not exist, a dependent library is missing or '
          'the command line is too long>\n'
          '<Check for missing .so/.dll in the .isolate or GN file or length of '
          'command line args>\n'
          '<Command: %s, Exception: %s>\n' % (command, e))
      if os.environ.get('SWARMING_TASK_ID'):
        # Give an additional hint when running as a swarming task.
        sys.stderr.write(
            '<See the task\'s page for commands to help diagnose this issue '
            'by reproducing the task locally>\n')
      exit_code = 1
  # The mask shows negative exit codes as their unsigned 32 bits value.
  logging.info(
      'Command finished with exit code %d (%s)',
      exit_code, hex(0xffffffff & exit_code))
  return exit_code, had_hard_timeout


def _run_go_cmd_and_wait(cmd):
  """
  Runs an external Go command, `isolated` or `cas`, and wait for its completion.

  While this is a generic function to launch a subprocess, it has logic that
  is specific to Go `isolated` and `cas` for waiting and logging.

  Args:
    cmd: list of strings; the command line to run.

  Returns:
    The subprocess object

  Raises:
    ValueError if the process exits with a non-zero code, or if it is still
    running after max_checks * check_period_sec seconds. Any exception is
    logged before being re-raised.
  """
  cmd_str = ' '.join(cmd)
  try:
    proc = subprocess42.Popen(cmd)

    exceeded_max_timeout = True
    check_period_sec = 30
    max_checks = 100
    # max timeout = max_checks * check_period_sec = 50 minutes
    for i in range(max_checks):
      # This is to prevent I/O timeout error during setup.
      try:
        retcode = proc.wait(check_period_sec)
        if retcode != 0:
          raise ValueError("retcode is not 0: %s (cmd=%s)" % (retcode, cmd_str))
        exceeded_max_timeout = False
        break
      except subprocess42.TimeoutExpired:
        print('still running (after %d seconds)' % ((i + 1) * check_period_sec))

    if exceeded_max_timeout:
      proc.terminate()
      try:
        proc.wait(check_period_sec)
      except subprocess42.TimeoutExpired:
        logging.exception(
            "failed to terminate? timeout happened after %d seconds",
            check_period_sec)
        proc.kill()
        proc.wait()
      # Raise unconditionally, because |proc| was forcefully terminated.
      raise ValueError("timedout after %d seconds (cmd=%s)" %
                       (check_period_sec * max_checks, cmd_str))

    return proc
  except Exception:
    logging.exception('Failed to run Go cmd %s', cmd_str)
    raise


def _fetch_and_map_with_cas(cas_client, digest, instance, output_dir, cache_dir,
                            policies):
  """
  Fetches a CAS tree using cas client, create the tree and returns download
  stats.

  Args:
    cas_client: path to the `cas` executable.
    digest: value of the -digest flag.
    instance: value of the -cas-instance flag.
    output_dir: value of the -dir flag.
    cache_dir: value of the -cache-dir flag.
    policies: object whose max_cache_size and min_free_space attributes are
        passed as -cache-max-size and -cache-min-free-space.

  Returns:
    dict with 'duration' (seconds spent in this function) and 'items_cold' and
    'items_hot', copied from the stats JSON file written by the client.
  """

  start = time.time()
  # Only the path is needed: the file is written by the client and read back
  # below, so the handle is closed right away.
  result_json_handle, result_json_path = tempfile.mkstemp(
      prefix=u'fetch-and-map-result-', suffix=u'.json')
  os.close(result_json_handle)
  try:
    cmd = [
        cas_client,
        'download',
        '-digest',
        digest,
        '-cas-instance',
        instance,
        # flags for cache.
        '-cache-dir',
        cache_dir,
        '-cache-max-size',
        str(policies.max_cache_size),
        '-cache-min-free-space',
        str(policies.min_free_space),
        # flags for output.
        '-dir',
        output_dir,
        '-dump-stats-json',
        result_json_path,
    ]
    _run_go_cmd_and_wait(cmd)

    with open(result_json_path) as json_file:
      result_json = json.load(json_file)

    return {
        'duration': time.time() - start,
        'items_cold': result_json['items_cold'],
        'items_hot': result_json['items_hot'],
    }
  finally:
    fs.remove(result_json_path)


def _fetch_and_map_with_go_isolated(isolated_hash, storage, outdir,
                                    go_cache_dir, policies, isolated_client):
  """
  Fetches an isolated tree using go client, create the tree and returns
  (bundle, stats).

  Args:
    isolated_hash: value of the -isolated flag.
    storage: object whose server_ref provides the url and namespace passed as
        -isolate-server and -namespace.
    outdir: value of the -output-dir flag.
    go_cache_dir: value of the -cache-dir flag.
    policies: object whose max_items, max_cache_size and min_free_space
        attributes are passed as the -cache-* flags.
    isolated_client: path to the `isolated` executable.

  Returns:
    tuple(isolateserver.IsolatedBundle with only command and relative_cwd set,
    dict with 'duration', 'items_cold' and 'items_hot').
  """
  start = time.time()
  server_ref = storage.server_ref
  # Only the path is needed: the file is written by the client and read back
  # below, so the handle is closed right away.
  result_json_handle, result_json_path = tempfile.mkstemp(
      prefix=u'fetch-and-map-result-', suffix=u'.json')
  os.close(result_json_handle)
  try:
    cmd = [
        isolated_client,
        'download',
        '-isolate-server',
        server_ref.url,
        '-namespace',
        server_ref.namespace,
        '-isolated',
        isolated_hash,

        # flags for cache
        '-cache-dir',
        go_cache_dir,
        '-cache-max-items',
        str(policies.max_items),
        '-cache-max-size',
        str(policies.max_cache_size),
        '-cache-min-free-space',
        str(policies.min_free_space),

        # flags for output
        '-output-dir',
        outdir,
        '-fetch-and-map-result-json',
        result_json_path,
    ]
    _run_go_cmd_and_wait(cmd)

    with open(result_json_path) as json_file:
      result_json = json.load(json_file)

    isolated = result_json['isolated']
    bundle = isolateserver.IsolatedBundle(filter_cb=None)
    # Only following properties are used in caller.
    bundle.command = isolated.get('command')
    bundle.relative_cwd = isolated.get('relative_cwd')

    return bundle, {
        'duration': time.time() - start,
        'items_cold': result_json['items_cold'],
        'items_hot': result_json['items_hot'],
    }
  finally:
    fs.remove(result_json_path)


# TODO(crbug.com/932396): remove this function.
def fetch_and_map(isolated_hash, storage, cache, outdir):
  """Fetches an isolated tree, create the tree and returns (bundle, stats).

  Args:
    isolated_hash: hash of the .isolated file to fetch.
    storage: forwarded to isolateserver.fetch_isolated().
    cache: forwarded to isolateserver.fetch_isolated(); its |used| and |added|
        attributes are read afterwards to compute the stats.
    outdir: directory in which the tree is created.

  Returns:
    tuple(bundle returned by isolateserver.fetch_isolated(), dict with
    'duration' in seconds and 'items_cold' / 'items_hot', each one being the
    sorted items packed with large.pack() then base64 encoded).
  """
  start = time.time()
  bundle = isolateserver.fetch_isolated(
      isolated_hash=isolated_hash,
      storage=storage,
      cache=cache,
      outdir=outdir,
      use_symlinks=False)
  # Hot items are the used ones minus the ones that were just added; Counter
  # subtraction keeps duplicates that were used more often than added.
  hot = (collections.Counter(cache.used) -
         collections.Counter(cache.added)).elements()
  return bundle, {
      'duration': time.time() - start,
      'items_cold': base64.b64encode(large.pack(sorted(cache.added))).decode(),
      'items_hot': base64.b64encode(large.pack(sorted(hot))).decode(),
  }


def link_outputs_to_outdir(run_dir, out_dir, outputs):
  """Copies every named output from run_dir into out_dir for upload.

  Each entry of |outputs| is a path relative to |run_dir|; it is copied to the
  same relative path below |out_dir| with copy_recursively(), after the needed
  directories were created in |out_dir|.

  Does nothing when |outputs| is empty or None.
  """
  if outputs:
    isolateserver.create_directories(out_dir, outputs)
    for relpath in outputs:
      source = os.path.join(run_dir, relpath)
      destination = os.path.join(out_dir, relpath)
      copy_recursively(source, destination)
689
690
def copy_recursively(src, dst):
  """Efficiently copies a file or directory from src to dst.

  `src` may be a file, directory, or a symlink to a file or directory.
  All symlinks are replaced with their targets, so the resulting
  directory structure in dst will never have any symlinks.

  To increase speed, copy_recursively hardlinks individual files into the
  (newly created) directory structure if possible, unlike Python's
  shutil.copytree().

  This is best effort: OSError is logged instead of being raised, and a
  symlink chain that loops back on itself is logged and skipped.

  Arguments:
  - src: path to copy from.
  - dst: path to copy to. Missing directories are created.
  """
  orig_src = src
  try:
    # Replace symlinks with their final target. Every path of the chain is
    # remembered: reaching the same path twice means the chain is cyclic and
    # would otherwise be followed forever.
    seen = {src}
    while fs.islink(src):
      res = fs.readlink(src)
      src = os.path.join(os.path.dirname(src), res)
      if src in seen:
        logging.warning('Symlink %s is cyclic, skipping it', orig_src)
        return
      seen.add(src)

    # Note that fs.isfile (which is a wrapper around os.path.isfile) throws
    # an exception if src does not exist. A warning will be logged in that case.
    if fs.isfile(src):
      file_path.link_file(dst, src, file_path.HARDLINK_WITH_FALLBACK)
      return

    if not fs.exists(dst):
      os.makedirs(dst)

    for child in fs.listdir(src):
      copy_recursively(os.path.join(src, child), os.path.join(dst, child))

  except OSError as e:
    if e.errno == errno.ENOENT:
      logging.warning('Path %s does not exist or %s is a broken symlink',
                      src, orig_src)
    else:
      logging.info("Couldn't collect output file %s: %s", src, e)
aludwin0a8e17d2016-10-27 15:57:39 -0700728
729
def _upload_with_py(storage, out_dir):
  """Archives |out_dir| to |storage| with the Python isolateserver client.

  Returns:
    tuple(isolated, cold, hot)
    - isolated: first value of the results returned by
      isolateserver.archive_files_to_storage().
    - cold, hot: the sorted sizes of the cold and hot items, packed with
      large.pack() and base64-encoded.

  Raises:
    isolateserver.Aborted: re-raised after a note was written to stderr.
  """

  def pack_sizes(items):
    sizes = [item.size for item in items]
    sizes.sort()
    return base64.b64encode(large.pack(sizes)).decode()

  try:
    results, cold_items, hot_items = isolateserver.archive_files_to_storage(
        storage, [out_dir], None, verify_push=True)

    isolated = list(results.values())[0]
    cold = pack_sizes(cold_items)
    hot = pack_sizes(hot_items)
    return isolated, cold, hot

  except isolateserver.Aborted:
    # This happens when a signal SIGTERM was received while uploading data.
    # There are 2 causes:
    # - The task was too slow and was about to be killed anyway due to
    #   exceeding the hard timeout.
    # - The amount of data uploaded back is very large and took too much
    #   time to archive.
    sys.stderr.write('Received SIGTERM while uploading')
    # Re-raise, so it will be treated as an internal failure.
    raise
755
756
def _upload_with_go(storage, outdir, isolated_client):
  """Uploads results back using the Go `isolated` CLI.

  The command is retried after an exponentially growing pause (10, 20, 40...
  seconds). Once more than two minutes have passed since the first attempt, a
  failure is re-raised instead of being retried.

  Arguments:
  - storage: object whose server_ref provides the server url and namespace.
  - outdir: directory to archive.
  - isolated_client: path to the `isolated` executable.

  Returns:
    tuple(isolated, items_cold, items_hot): the content of the file written
    through -dump-hash, and the 'items_cold' and 'items_hot' entries of the
    file written through -dump-stats-json.
  """
  server = storage.server_ref
  hash_fd, hash_path = tempfile.mkstemp(
      prefix=u'isolated-hash-', suffix=u'.txt')
  stats_fd, stats_path = tempfile.mkstemp(
      prefix=u'dump-stats-', suffix=u'.json')
  # Only the paths are passed to the command; the handles are not used.
  os.close(hash_fd)
  os.close(stats_fd)
  try:
    cmd = [isolated_client, 'archive']
    cmd += ['-isolate-server', server.url]
    cmd += ['-namespace', server.namespace]
    # Format: <working directory>:<relative path to dir>
    cmd += ['-dirs', outdir + ':']
    # output
    cmd += ['-dump-hash', hash_path]
    cmd += ['-dump-stats-json', stats_path]
    cmd.append('-quiet')

    # Will do exponential backoff, e.g. 10, 20, 40...
    # This mitigates https://crbug.com/1094369, where there is a data race on
    # the uploaded files.
    delay = 10
    deadline = time.time() + 60 * 2
    done = False
    while not done:
      try:
        _run_go_cmd_and_wait(cmd)
        done = True
      except Exception:
        if time.time() > deadline:
          # Give up, so a task with a leaked process is not waited on for a
          # long time.
          raise

        on_error.report('error before %d second backoff' % delay)
        logging.exception(
            '_run_go_cmd_and_wait() failed, will retry after %d seconds',
            delay)
        time.sleep(delay)
        delay *= 2

    with open(hash_path) as hash_file:
      isolated = hash_file.read()
    with open(stats_path) as stats_file:
      stats = json.load(stats_file)

    return isolated, stats['items_cold'], stats['items_hot']
  finally:
    fs.remove(hash_path)
    fs.remove(stats_path)
817
818
def upload_out_dir(storage, out_dir, go_isolated_client):
  """Uploads the content of |out_dir| back, if there is any.

  The upload is done only when |out_dir| is a non-empty directory. The Go
  client is used when _USE_GO_ISOLATED_TO_UPLOAD is set and
  |go_isolated_client| is not None; the Python client is used otherwise.

  Returns:
    tuple(outputs_ref, stats)
    - outputs_ref: a dict referring to the results archived back to the
      isolated server, or None if nothing was uploaded.
    - stats: uploading stats; 'items_cold' and 'items_hot' are empty strings
      if nothing was uploaded.
  """
  outputs_ref = None
  cold = ''
  hot = ''
  began = time.time()

  has_outputs = fs.isdir(out_dir) and fs.listdir(out_dir)
  if has_outputs:
    with tools.Profiler('ArchiveOutput'):
      use_go = _USE_GO_ISOLATED_TO_UPLOAD and go_isolated_client is not None
      if use_go:
        uploaded = _upload_with_go(storage, out_dir, go_isolated_client)
      else:
        uploaded = _upload_with_py(storage, out_dir)
      isolated, cold, hot = uploaded
      outputs_ref = {
          'isolated': isolated,
          'isolatedserver': storage.server_ref.url,
          'namespace': storage.server_ref.namespace,
      }

  return outputs_ref, {
      'duration': time.time() - began,
      'items_cold': cold,
      'items_hot': hot,
  }
856
def upload_outdir_with_cas(cas_client, cas_instance, outdir):
  """Uploads the content of |outdir| with the `cas` CLI.

  Arguments:
  - cas_client: path to the `cas` executable.
  - cas_instance: value passed to -cas-instance.
  - outdir: directory to archive.

  Returns:
    tuple(cas_output_root, stats)
    - cas_output_root: dict with 'cas_instance' and the 'digest' of the
      output directory, parsed from the "<hash>/<size>" text written through
      -dump-digest.
    - stats: content of the -dump-stats-json file, plus a 'duration' entry
      that covers running the command and reading its output files.
  """
  digest_fd, digest_path = tempfile.mkstemp(
      prefix=u'cas-digest', suffix=u'.txt')
  os.close(digest_fd)
  stats_fd, stats_path = tempfile.mkstemp(
      prefix=u'upload-stats', suffix=u'.json')
  os.close(stats_fd)

  try:
    cmd = [cas_client, 'archive']
    cmd += ['-cas-instance', cas_instance]
    # Format: <working directory>:<relative path to dir>
    cmd += ['-paths', outdir + ':']
    # output
    cmd += ['-dump-digest', digest_path]
    cmd += ['-dump-stats-json', stats_path]

    began = time.time()

    _run_go_cmd_and_wait(cmd)

    with open(digest_path) as digest_file:
      digest_text = digest_file.read()
    digest_hash, digest_size = digest_text.split('/')
    digest = {
        'hash': digest_hash,
        'size_bytes': int(digest_size),
    }
    cas_output_root = {
        'cas_instance': cas_instance,
        'digest': digest,
    }
    with open(stats_path) as stats_file:
      stats = json.load(stats_file)

    stats['duration'] = time.time() - began

    return cas_output_root, stats
  finally:
    fs.remove(digest_path)
    fs.remove(stats_path)
911
912
def map_and_run(data, constant_run_path):
  """Runs a command with optional isolated input/output.

  Creates the run, output, temp and client directories, installs the CIPD
  packages, fetches the inputs (isolated or CAS), runs the command, uploads
  the content of the output directory and finally removes the directories.

  Arguments:
  - data: TaskData instance.
  - constant_run_path: if true and a root directory is known, the command runs
        in the fixed <root_dir>/ISOLATED_RUN_DIR directory, which is wiped
        first; otherwise a new temporary directory is created.

  Returns:
    dict with metadata about the result. 'internal_failure' is None unless
    run_isolated itself failed. An 'exit_code' of 0 is turned into 1 when a
    directory could not be removed cleanly.
  """

  if data.isolate_cache:
    download_stats = {
        #'duration': 0.,
        'initial_number_items': len(data.isolate_cache),
        'initial_size': data.isolate_cache.total_size,
        #'items_cold': '<large.pack()>',
        #'items_hot': '<large.pack()>',
    }
  else:
    # TODO(tikuta): take stats from state.json in this case too.
    download_stats = {}

  result = {
      'duration': None,
      'exit_code': None,
      'had_hard_timeout': False,
      'internal_failure': 'run_isolated did not complete properly',
      'stats': {
          #'cipd': {
          #  'duration': 0.,
          #  'get_client_duration': 0.,
          #},
          'isolated': {
              'download': download_stats,
              #'upload': {
              #  'duration': 0.,
              #  'items_cold': '<large.pack()>',
              #  'items_hot': '<large.pack()>',
              #},
          },
      },
      #'cipd_pins': {
      #  'packages': [
      #    {'package_name': ..., 'version': ..., 'path': ...},
      #    ...
      #  ],
      #  'client_package': {'package_name': ..., 'version': ...},
      #},
      'outputs_ref': None,
      'cas_output_root': None,
      'version': 5,
  }

  if data.root_dir:
    file_path.ensure_tree(data.root_dir, 0o700)
  elif data.use_go_isolated:
    data = data._replace(root_dir=os.path.dirname(data.go_cache_dir))
  elif data.isolate_cache.cache_dir:
    data = data._replace(
        root_dir=os.path.dirname(data.isolate_cache.cache_dir))
  # See comment for these constants.
  # If root_dir is not specified, it is not constant.
  # TODO(maruel): This is not obvious. Change this to become an error once we
  # make the constant_run_path an exposed flag.
  if constant_run_path and data.root_dir:
    run_dir = os.path.join(data.root_dir, ISOLATED_RUN_DIR)
    if os.path.isdir(run_dir):
      file_path.rmtree(run_dir)
    os.mkdir(run_dir, 0o700)
  else:
    run_dir = make_temp_dir(ISOLATED_RUN_DIR, data.root_dir)

  # True if CAS is used for download/upload files.
  use_cas = bool(data.cas_digest)

  # storage should be normally set but don't crash if it is not. This can happen
  # as Swarming task can run without an isolate server.
  out_dir = None
  if data.storage or use_cas:
    out_dir = make_temp_dir(ISOLATED_OUT_DIR, data.root_dir)
  tmp_dir = make_temp_dir(ISOLATED_TMP_DIR, data.root_dir)
  isolated_client_dir = make_temp_dir(ISOLATED_CLIENT_DIR, data.root_dir)
  cwd = run_dir
  if data.relative_cwd:
    cwd = os.path.normpath(os.path.join(cwd, data.relative_cwd))
  command = data.command
  go_isolated_client = None
  if data.use_go_isolated:
    go_isolated_client = os.path.join(isolated_client_dir,
                                      'isolated' + cipd.EXECUTABLE_SUFFIX)

  cas_client = None
  cas_client_dir = make_temp_dir(_CAS_CLIENT_DIR, data.root_dir)
  if use_cas:
    cas_client = os.path.join(cas_client_dir, 'cas' + cipd.EXECUTABLE_SUFFIX)

  try:
    with data.install_packages_fn(run_dir, isolated_client_dir,
                                  cas_client_dir) as cipd_info:
      if cipd_info:
        result['stats']['cipd'] = cipd_info.stats
        result['cipd_pins'] = cipd_info.pins

      isolated_stats = result['stats'].setdefault('isolated', {})
      if data.isolated_hash:
        if data.use_go_isolated:
          bundle, stats = _fetch_and_map_with_go_isolated(
              isolated_hash=data.isolated_hash,
              storage=data.storage,
              outdir=run_dir,
              go_cache_dir=data.go_cache_dir,
              policies=data.go_cache_policies,
              isolated_client=go_isolated_client)
        else:
          bundle, stats = fetch_and_map(
              isolated_hash=data.isolated_hash,
              storage=data.storage,
              cache=data.isolate_cache,
              outdir=run_dir)
        isolated_stats['download'].update(stats)

        # Inject the command
        if not command and bundle.command:
          command = bundle.command + data.extra_args
          # Only set the relative directory if the isolated file specified a
          # command, and no raw command was specified.
          if bundle.relative_cwd:
            cwd = os.path.normpath(os.path.join(cwd, bundle.relative_cwd))

      elif data.cas_digest:
        stats = _fetch_and_map_with_cas(
            cas_client=cas_client,
            digest=data.cas_digest,
            instance=data.cas_instance,
            output_dir=run_dir,
            cache_dir=data.cas_cache_dir,
            policies=data.cas_cache_policies)
        isolated_stats['download'].update(stats)

      if not command:
        # Handle this as a task failure, not an internal failure.
        sys.stderr.write(
            '<No command was specified!>\n'
            '<Please secify a command when triggering your Swarming task>\n')
        result['exit_code'] = 1
        return result

      # The trailing separator matters: a bare prefix test would accept a
      # sibling directory whose name merely starts with the run directory
      # name, e.g. <root>/ir2 for <root>/ir.
      if cwd != run_dir and not cwd.startswith(os.path.join(run_dir, '')):
        # Handle this as a task failure, not an internal failure. This is a
        # 'last chance' way to gate against directory escape.
        sys.stderr.write('<Relative CWD is outside of run directory!>\n')
        result['exit_code'] = 1
        return result

      if not os.path.isdir(cwd):
        # Accepts relative_cwd that does not exist.
        os.makedirs(cwd, 0o700)

      # If we have an explicit list of files to return, make sure their
      # directories exist now.
      if data.storage and data.outputs:
        isolateserver.create_directories(run_dir, data.outputs)

      with data.install_named_caches(run_dir):
        sys.stdout.flush()
        start = time.time()
        try:
          # Need to switch the default account before 'get_command_env' call,
          # so it can grab correct value of LUCI_CONTEXT env var.
          with set_luci_context_account(data.switch_to_account, tmp_dir):
            env = get_command_env(
                tmp_dir, cipd_info, run_dir, data.env, data.env_prefix, out_dir,
                data.bot_file)
            command = tools.find_executable(command, env)
            command = process_command(command, out_dir, data.bot_file)
            file_path.ensure_command_has_abs_path(command, cwd)

            result['exit_code'], result['had_hard_timeout'] = run_command(
                command, cwd, env, data.hard_timeout, data.grace_period,
                data.lower_priority, data.containment)
        finally:
          result['duration'] = max(time.time() - start, 0)

      if out_dir:
        # Try to link files to the output directory, if specified.
        link_outputs_to_outdir(run_dir, out_dir, data.outputs)
        isolated_stats = result['stats'].setdefault('isolated', {})
        if use_cas:
          result['cas_output_root'], isolated_stats['upload'] = (
              upload_outdir_with_cas(cas_client, data.cas_instance, out_dir))
        else:
          # This could use |go_isolated_client|, so make sure it runs when the
          # CIPD package still exists.
          result['outputs_ref'], isolated_stats['upload'] = (
              upload_out_dir(data.storage, out_dir, go_isolated_client))
      # We successfully ran the command, set internal_failure back to
      # None (even if the command failed, it's not an internal error).
      result['internal_failure'] = None
  except Exception as e:
    # An internal error occurred. Report accordingly so the swarming task will
    # be retried automatically.
    logging.exception('internal failure: %s', e)
    result['internal_failure'] = str(e)
    on_error.report(None)

  # Clean up
  finally:
    try:
      success = True
      if data.leak_temp_dir:
        logging.warning(
            'Deliberately leaking %s for later examination', run_dir)
      else:
        # On Windows the rmtree(run_dir) call below has a synchronization
        # effect: it finishes only when all task child processes terminate
        # (since a running process locks *.exe file). run_dir is removed first
        # and out_dir last (since child processes may write to out_dir too and
        # we need to wait for them to finish).
        dirs_to_remove = [run_dir, tmp_dir, isolated_client_dir, cas_client_dir]
        if out_dir:
          dirs_to_remove.append(out_dir)
        for directory in dirs_to_remove:
          if not fs.isdir(directory):
            continue
          # Always attempt the removal, even if an earlier directory failed,
          # so that one failure does not leak every remaining directory.
          try:
            removed = file_path.rmtree(directory)
          except OSError as e:
            logging.error('rmtree(%r) failed: %s', directory, e)
            removed = False
          if removed:
            continue
          success = False
          sys.stderr.write(
              OUTLIVING_ZOMBIE_MSG % (directory, data.grace_period))
          # Dump the process list to help finding the process that outlived
          # the task. tasklist.exe only exists on Windows.
          if sys.platform == 'win32':
            list_processes = ['tasklist.exe', '/V']
          else:
            list_processes = ['ps', 'axu']
          subprocess42.check_call(list_processes, stdout=sys.stderr)
          if result['exit_code'] == 0:
            result['exit_code'] = 1

      if not success and result['exit_code'] == 0:
        result['exit_code'] = 1
    except Exception as e:
      # Swallow any exception in the main finally clause.
      if out_dir:
        logging.exception('Leaking out_dir %s: %s', out_dir, e)
      result['internal_failure'] = str(e)
      on_error.report(None)
  return result
Marc-Antoine Ruel2283ad12014-02-09 11:14:57 -05001159
1160
def run_tha_test(data, result_json):
  """Runs the task through map_and_run() and reports its metadata.

  When |result_json| is set, a placeholder result is written to it before the
  task starts, so that the file exists even if the process is killed, and the
  real result replaces it once the task is done.

  When |result_json| is not set and the task produced an outputs_ref, the
  reference is printed to stdout between [run_isolated_out_hack] markers.

  Arguments:
  - data: TaskData instance.
  - result_json: File path to dump result metadata into. If set, the process
        exit code is always 0 unless an internal error occurred.

  Returns:
    Process exit code that should be used.
  """
  if result_json:
    # Write a json output file right away in case we get killed.
    placeholder = {
        'exit_code': None,
        'had_hard_timeout': False,
        'internal_failure': 'Was terminated before completion',
        'outputs_ref': None,
        'cas_output_root': None,
        'version': 5,
    }
    tools.write_json(result_json, placeholder, dense=True)

  # run_isolated exit code. Depends on if result_json is used or not.
  result = map_and_run(data, True)
  logging.info('Result:\n%s', tools.format_json(result, dense=True))

  if result_json:
    # We've found tests to delete 'work' when quitting, causing an exception
    # here. Try to recreate the directory if necessary.
    file_path.ensure_tree(os.path.dirname(result_json))
    tools.write_json(result_json, result, dense=True)
    # Only return 1 if there was an internal error.
    return int(bool(result['internal_failure']))

  # Marshall into old-style inline output.
  if result['outputs_ref']:
    # pylint: disable=unsubscriptable-object
    legacy = {
        'hash': result['outputs_ref']['isolated'],
        'namespace': result['outputs_ref']['namespace'],
        'storage': result['outputs_ref']['isolatedserver'],
    }
    sys.stdout.flush()
    print('[run_isolated_out_hack]%s[/run_isolated_out_hack]' %
          tools.format_json(legacy, dense=True))
    sys.stdout.flush()
  return result['exit_code'] or int(bool(result['internal_failure']))
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001217
1218
# Yielded by 'install_client_and_packages'.
CipdInfo = collections.namedtuple(
    'CipdInfo',
    (
        # cipd.CipdClient object
        'client',
        # absolute path to bot-global cipd tag and instance cache
        'cache_dir',
        # dict with stats to return to the server
        'stats',
        # dict with installed cipd pins to return to the server
        'pins',
    ))
1226
1227
@contextlib.contextmanager
def noop_install_packages(_run_dir, _isolated_dir, _cas_dir):
  """Stand-in for 'install_client_and_packages' when cipd is disabled.

  Ignores its arguments, installs nothing and yields None.
  """
  yield
1232
1233
Takuto Ikuta2efc7792019-11-27 14:33:34 +00001234def _install_packages(run_dir, cipd_cache_dir, client, packages):
iannuccib58d10d2017-03-18 02:00:25 -07001235 """Calls 'cipd ensure' for packages.
1236
1237 Args:
1238 run_dir (str): root of installation.
1239 cipd_cache_dir (str): the directory to use for the cipd package cache.
1240 client (CipdClient): the cipd client to use
1241 packages: packages to install, list [(path, package_name, version), ...].
iannuccib58d10d2017-03-18 02:00:25 -07001242
1243 Returns: list of pinned packages. Looks like [
1244 {
1245 'path': 'subdirectory',
1246 'package_name': 'resolved/package/name',
1247 'version': 'deadbeef...',
1248 },
1249 ...
1250 ]
1251 """
1252 package_pins = [None]*len(packages)
1253 def insert_pin(path, name, version, idx):
1254 package_pins[idx] = {
1255 'package_name': name,
1256 # swarming deals with 'root' as '.'
1257 'path': path or '.',
1258 'version': version,
1259 }
1260
1261 by_path = collections.defaultdict(list)
1262 for i, (path, name, version) in enumerate(packages):
1263 # cipd deals with 'root' as ''
1264 if path == '.':
1265 path = ''
1266 by_path[path].append((name, version, i))
1267
1268 pins = client.ensure(
Takuto Ikuta2efc7792019-11-27 14:33:34 +00001269 run_dir,
1270 {
1271 subdir: [(name, vers) for name, vers, _ in pkgs
1272 ] for subdir, pkgs in by_path.items()
1273 },
1274 cache_dir=cipd_cache_dir,
iannuccib58d10d2017-03-18 02:00:25 -07001275 )
1276
Marc-Antoine Ruel04903a32019-10-09 21:09:25 +00001277 for subdir, pin_list in sorted(pins.items()):
iannuccib58d10d2017-03-18 02:00:25 -07001278 this_subdir = by_path[subdir]
1279 for i, (name, version) in enumerate(pin_list):
1280 insert_pin(subdir, name, version, this_subdir[i][2])
1281
Robert Iannucci461b30d2017-12-13 11:34:03 -08001282 assert None not in package_pins, (packages, pins, package_pins)
iannuccib58d10d2017-03-18 02:00:25 -07001283
1284 return package_pins
1285
1286
vadimsh232f5a82017-01-20 19:23:44 -08001287@contextlib.contextmanager
Takuto Ikuta2efc7792019-11-27 14:33:34 +00001288def install_client_and_packages(run_dir, packages, service_url,
Takuto Ikutab7ce0e32019-11-27 23:26:18 +00001289 client_package_name, client_version, cache_dir,
Junji Watanabe4b890ef2020-09-16 01:43:27 +00001290 isolated_dir, cas_dir):
vadimsh902948e2017-01-20 15:57:32 -08001291 """Bootstraps CIPD client and installs CIPD packages.
iannucci96fcccc2016-08-30 15:52:22 -07001292
vadimsh232f5a82017-01-20 19:23:44 -08001293 Yields CipdClient, stats, client info and pins (as single CipdInfo object).
1294
1295 Pins and the CIPD client info are in the form of:
iannucci96fcccc2016-08-30 15:52:22 -07001296 [
1297 {
1298 "path": path, "package_name": package_name, "version": version,
1299 },
1300 ...
1301 ]
vadimsh902948e2017-01-20 15:57:32 -08001302 (the CIPD client info is a single dictionary instead of a list)
iannucci96fcccc2016-08-30 15:52:22 -07001303
1304 such that they correspond 1:1 to all input package arguments from the command
1305 line. These dictionaries make their all the way back to swarming, where they
1306 become the arguments of CipdPackage.
nodirbe642ff2016-06-09 15:51:51 -07001307
vadimsh902948e2017-01-20 15:57:32 -08001308 If 'packages' list is empty, will bootstrap CIPD client, but won't install
1309 any packages.
1310
1311 The bootstrapped client (regardless whether 'packages' list is empty or not),
vadimsh232f5a82017-01-20 19:23:44 -08001312 will be made available to the task via $PATH.
vadimsh902948e2017-01-20 15:57:32 -08001313
nodirbe642ff2016-06-09 15:51:51 -07001314 Args:
nodir90bc8dc2016-06-15 13:35:21 -07001315 run_dir (str): root of installation.
vadimsh902948e2017-01-20 15:57:32 -08001316 packages: packages to install, list [(path, package_name, version), ...].
nodirbe642ff2016-06-09 15:51:51 -07001317 service_url (str): CIPD server url, e.g.
1318 "https://chrome-infra-packages.appspot.com."
nodir90bc8dc2016-06-15 13:35:21 -07001319 client_package_name (str): CIPD package name of CIPD client.
1320 client_version (str): Version of CIPD client.
nodirbe642ff2016-06-09 15:51:51 -07001321 cache_dir (str): where to keep cache of cipd clients, packages and tags.
Takuto Ikutab7ce0e32019-11-27 23:26:18 +00001322 isolated_dir (str): where to download isolated client.
Junji Watanabe4b890ef2020-09-16 01:43:27 +00001323 cas_dir (str): where to download cas client.
nodirbe642ff2016-06-09 15:51:51 -07001324 """
1325 assert cache_dir
nodir90bc8dc2016-06-15 13:35:21 -07001326
nodirbe642ff2016-06-09 15:51:51 -07001327 start = time.time()
nodirbe642ff2016-06-09 15:51:51 -07001328
vadimsh902948e2017-01-20 15:57:32 -08001329 cache_dir = os.path.abspath(cache_dir)
vadimsh232f5a82017-01-20 19:23:44 -08001330 cipd_cache_dir = os.path.join(cache_dir, 'cache') # tag and instance caches
nodir90bc8dc2016-06-15 13:35:21 -07001331 run_dir = os.path.abspath(run_dir)
vadimsh902948e2017-01-20 15:57:32 -08001332 packages = packages or []
nodir90bc8dc2016-06-15 13:35:21 -07001333
nodirbe642ff2016-06-09 15:51:51 -07001334 get_client_start = time.time()
Junji Watanabe4b890ef2020-09-16 01:43:27 +00001335 client_manager = cipd.get_client(cache_dir, service_url, client_package_name,
1336 client_version)
iannucci96fcccc2016-08-30 15:52:22 -07001337
nodirbe642ff2016-06-09 15:51:51 -07001338 with client_manager as client:
1339 get_client_duration = time.time() - get_client_start
nodir90bc8dc2016-06-15 13:35:21 -07001340
iannuccib58d10d2017-03-18 02:00:25 -07001341 package_pins = []
1342 if packages:
Takuto Ikuta2efc7792019-11-27 14:33:34 +00001343 package_pins = _install_packages(run_dir, cipd_cache_dir, client,
1344 packages)
iannuccib58d10d2017-03-18 02:00:25 -07001345
Takuto Ikutab7ce0e32019-11-27 23:26:18 +00001346 # Install isolated client to |isolated_dir|.
Takuto Ikuta02edca22019-11-29 10:04:51 +00001347 _install_packages(isolated_dir, cipd_cache_dir, client,
1348 [('', ISOLATED_PACKAGE, ISOLATED_REVISION)])
Takuto Ikutab7ce0e32019-11-27 23:26:18 +00001349
Junji Watanabe4b890ef2020-09-16 01:43:27 +00001350 # Install cas client to |cas_dir|.
1351 _install_packages(cas_dir, cipd_cache_dir, client,
1352 [('', _CAS_PACKAGE, _CAS_REVISION)])
1353
iannuccib58d10d2017-03-18 02:00:25 -07001354 file_path.make_tree_files_read_only(run_dir)
nodir90bc8dc2016-06-15 13:35:21 -07001355
vadimsh232f5a82017-01-20 19:23:44 -08001356 total_duration = time.time() - start
Junji Watanabe38b28b02020-04-23 10:23:30 +00001357 logging.info('Installing CIPD client and packages took %d seconds',
1358 total_duration)
nodir90bc8dc2016-06-15 13:35:21 -07001359
vadimsh232f5a82017-01-20 19:23:44 -08001360 yield CipdInfo(
Junji Watanabe38b28b02020-04-23 10:23:30 +00001361 client=client,
1362 cache_dir=cipd_cache_dir,
1363 stats={
1364 'duration': total_duration,
1365 'get_client_duration': get_client_duration,
iannuccib58d10d2017-03-18 02:00:25 -07001366 },
Junji Watanabe38b28b02020-04-23 10:23:30 +00001367 pins={
1368 'client_package': {
1369 'package_name': client.package_name,
1370 'version': client.instance_id,
1371 },
1372 'packages': package_pins,
1373 })
nodirbe642ff2016-06-09 15:51:51 -07001374
1375
def create_option_parser():
  """Builds the option parser used by run_isolated.

  The general options are registered directly on the parser. Related options
  are gathered in option groups so that they show up under their own heading
  in the --help output. Isolate server, cache, CIPD and auth options are
  registered by their respective modules.

  Returns:
    The logging_utils.OptionParserWithLogging instance, with the default value
    of 'cache' set to 'cache'.
  """
  parser = logging_utils.OptionParserWithLogging(
      usage='%prog <options> [command to run or extra args]',
      version=__version__,
      log_file=RUN_ISOLATED_LOG_FILE)
  parser.add_option(
      '--clean',
      action='store_true',
      help='Cleans the cache, trimming if necessary and remove corrupted items '
      'and returns without executing anything; use with -v to know what '
      'was done')
  parser.add_option(
      '--json',
      help='dump output metadata to json file. When used, run_isolated returns '
      'non-zero only on internal failure')
  parser.add_option(
      '--hard-timeout', type='float', help='Enforce hard timeout in execution')
  parser.add_option(
      '--grace-period',
      type='float',
      help='Grace period between SIGTERM and SIGKILL')
  parser.add_option(
      '--raw-cmd',
      action='store_true',
      help='Ignore the isolated command, use the one supplied at the command '
      'line')
  parser.add_option(
      '--relative-cwd',
      help='Ignore the isolated \'relative_cwd\' and use this one instead; '
      'requires --raw-cmd')
  parser.add_option(
      '--env',
      default=[],
      action='append',
      help='Environment variables to set for the child process')
  parser.add_option(
      '--env-prefix',
      default=[],
      action='append',
      help='Specify a VAR=./path/fragment to put in the environment variable '
      'before executing the command. The path fragment must be relative '
      'to the isolated run directory, and must not contain a `..` token. '
      'The path will be made absolute and prepended to the indicated '
      '$VAR using the OS\'s path separator. Multiple items for the same '
      '$VAR will be prepended in order.')
  parser.add_option(
      '--bot-file',
      help='Path to a file describing the state of the host. The content is '
      'defined by on_before_task() in bot_config.')
  parser.add_option(
      '--switch-to-account',
      help='If given, switches LUCI_CONTEXT to given logical service account '
      '(e.g. "task" or "system") before launching the isolated process.')
  parser.add_option(
      '--output',
      action='append',
      help='Specifies an output to return. If no outputs are specified, all '
      'files located in ${ISOLATED_OUTDIR} will be returned; '
      'otherwise, outputs in both ${ISOLATED_OUTDIR} and those '
      'specified by --output option (there can be multiple) will be '
      'returned. Note that if a file in OUT_DIR has the same path '
      'as an --output option, the --output version will be returned.')
  parser.add_option(
      '-a',
      '--argsfile',
      # This is actually handled in parse_args; it's included here purely so it
      # can make it into the help text.
      help='Specify a file containing a JSON array of arguments to this '
      'script. If --argsfile is provided, no other argument may be '
      'provided on the command line.')
  parser.add_option(
      '--report-on-exception',
      action='store_true',
      help='Whether report exception during execution to isolate server. '
      'This flag should only be used in swarming bot.')

  group = optparse.OptionGroup(parser, 'Data source - Isolate server')
  # Deprecated. Isolate server is being migrated to RBE-CAS.
  # Remove --isolated and isolate server options after migration.
  group.add_option(
      '-s', '--isolated',
      help='Hash of the .isolated to grab from the isolate server.')
  isolateserver.add_isolate_server_options(group)
  parser.add_option_group(group)

  group = optparse.OptionGroup(parser,
                               'Data source - Content Addressed Storage')
  group.add_option(
      '--cas-instance', help='Full CAS instance name for input/output files.')
  group.add_option(
      '--cas-digest',
      help='Digest of the input root on RBE-CAS. The format is '
      '`{hash}/{size_bytes}`.')
  parser.add_option_group(group)

  # Cache options.
  isolateserver.add_cache_options(parser)
  add_cas_cache_options(parser)

  cipd.add_cipd_options(parser)

  group = optparse.OptionGroup(parser, 'Named caches')
  group.add_option(
      '--named-cache',
      dest='named_caches',
      action='append',
      nargs=3,
      default=[],
      help='A named cache to request. Accepts 3 arguments: name, path, hint. '
      'name identifies the cache, must match regex [a-z0-9_]{1,4096}. '
      'path is a path relative to the run dir where the cache directory '
      'must be put to. '
      'This option can be specified more than once.')
  group.add_option(
      '--named-cache-root',
      default='named_caches',
      help='Cache root directory. Default=%default')
  parser.add_option_group(group)

  # These options must be registered on the group, not on the parser;
  # otherwise the 'Process containment' heading is printed empty and the
  # options are listed among the general ones in --help.
  group = optparse.OptionGroup(parser, 'Process containment')
  group.add_option(
      '--lower-priority', action='store_true',
      help='Lowers the child process priority')
  group.add_option(
      '--containment-type',
      choices=('NONE', 'AUTO', 'JOB_OBJECT'),
      default='NONE',
      help='Type of container to use')
  group.add_option(
      '--limit-processes',
      type='int',
      default=0,
      help='Maximum number of active processes in the containment')
  group.add_option(
      '--limit-total-committed-memory',
      type='int',
      default=0,
      help='Maximum sum of committed memory in the containment')
  parser.add_option_group(group)

  group = optparse.OptionGroup(parser, 'Debugging')
  group.add_option(
      '--leak-temp-dir',
      action='store_true',
      help='Deliberately leak isolate\'s temp dir for later examination. '
      'Default: %default')
  group.add_option('--root-dir', help='Use a directory instead of a random one')
  parser.add_option_group(group)

  auth.add_auth_options(parser)

  parser.set_defaults(cache='cache')
  return parser
1529
1530
def add_cas_cache_options(parser):
  """Registers the 'CAS cache management' option group on |parser|.

  The group holds a single option, --cas-cache, which names the directory
  used as local cache of files and defaults to 'cas-cache'.
  """
  cas_group = optparse.OptionGroup(parser, 'CAS cache management')
  cas_cache_help = (
      'Directory to keep a local cache of the files. Accelerates download '
      'by reusing already downloaded files. Default=%default')
  cas_group.add_option(
      '--cas-cache', metavar='DIR', default='cas-cache', help=cas_cache_help)
  parser.add_option_group(cas_group)
1540
1541
def process_cas_cache_options(options):
  """Returns the content addressed cache selected by --cas-cache.

  An empty --cas-cache value yields an in-memory cache. Otherwise a disk
  cache rooted at the absolute path of --cas-cache is returned; it is created
  with trim=False.
  """
  if not options.cas_cache:
    return local_caching.MemoryContentAddressedCache()

  cache_policies = local_caching.CachePolicies(
      max_cache_size=options.max_cache_size,
      min_free_space=options.min_free_space,
      # max_items isn't used for CAS cache for now.
      max_items=None,
      max_age_secs=MAX_AGE_SECS)
  cache_root = six.text_type(os.path.abspath(options.cas_cache))
  return local_caching.DiskContentAddressedCache(
      cache_root, cache_policies, trim=False)
1554
1555
def process_named_cache_options(parser, options, time_fn=None):
  """Checks the named cache flags and builds the matching NamedCache.

  Every (name, path, hint) triple of --named-cache is validated; any problem
  is reported through parser.error().

  Returns:
    A local_caching.NamedCache rooted at --named-cache-root, or None when
    --named-cache-root is empty.
  """
  requested = options.named_caches
  cache_root = options.named_cache_root
  if requested and not cache_root:
    parser.error('--named-cache is specified, but --named-cache-root is empty')

  for name, path, hint in requested:
    if CACHE_NAME_RE.match(name) is None:
      parser.error(
          'cache name %r does not match %r' % (name, CACHE_NAME_RE.pattern))
    if not path:
      parser.error('cache path cannot be empty')
    try:
      int(hint)
    except ValueError:
      parser.error('cache hint must be a number')

  if not cache_root:
    return None

  # Make these configurable later if there is use case but for now it's fairly
  # safe values.
  # In practice, a fair chunk of bots are already recycled on a daily schedule
  # so this code doesn't have any effect to them, unless they are preloaded
  # with a really old cache.
  one_tib = 1024 ** 4
  cache_policies = local_caching.CachePolicies(
      max_cache_size=one_tib,
      min_free_space=options.min_free_space,
      max_items=50,
      max_age_secs=MAX_AGE_SECS)
  abs_root = six.text_type(os.path.abspath(cache_root))
  named_cache = local_caching.NamedCache(
      abs_root, cache_policies, time_fn=time_fn)
  # Touch any named caches we're going to use to minimize thrashing
  # between tasks that request some (but not all) of the same named caches.
  requested_names = [name for name, _, _ in requested]
  named_cache.touch(*requested_names)
  return named_cache
1589
1590
def parse_args(args):
  """Parses the command line, expanding --argsfile when it is given.

  Args:
    args: list of command line arguments, without the program name.

  Returns:
    A (parser, options, args) tuple: the parser built by
    create_option_parser(), the parsed options and the positional arguments.
    options.cipd_enabled is converted with strtobool() when it is not already
    a bool or an int.

  Exits through argparse's error() when --argsfile is combined with any other
  argument.
  """
  # Create a fake mini-parser just to get out the "-a" command. Note that
  # it's not documented here; instead, it's documented in create_option_parser
  # even though that parser will never actually get to parse it. This is
  # because --argsfile is exclusive with all other options and arguments.
  file_argparse = argparse.ArgumentParser(add_help=False)
  file_argparse.add_argument('-a', '--argsfile')
  (file_args, nonfile_args) = file_argparse.parse_known_args(args)
  if file_args.argsfile:
    if nonfile_args:
      # The two literals are concatenated; the trailing space keeps the words
      # "with" and "any" apart.
      file_argparse.error('Can\'t specify --argsfile with '
                          'any other arguments (%s)' % nonfile_args)
    try:
      with open(file_args.argsfile, 'r') as f:
        args = json.load(f)
    except (IOError, OSError, ValueError) as e:
      # Best effort: report the problem and carry on. |args| was not replaced,
      # so the original command line is handed to the regular parser below.
      print('Couldn\'t read arguments: %s' % e, file=sys.stderr)

  # Even if reading the args file failed, the regular parser still runs.
  parser = create_option_parser()
  options, args = parser.parse_args(args)
  if not isinstance(options.cipd_enabled, (bool, int)):
    # NOTE(review): distutils is removed from the standard library as of
    # Python 3.12; this call needs a replacement before running there.
    options.cipd_enabled = distutils.util.strtobool(options.cipd_enabled)
  return (parser, options, args)
1619
1620
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001621def _calc_named_cache_hint(named_cache, named_caches):
1622 """Returns the expected size of the missing named caches."""
1623 present = named_cache.available
1624 size = 0
1625 for name, _, hint in named_caches:
1626 if name not in present:
Takuto Ikuta630f99d2020-07-02 12:59:35 +00001627 hint = int(hint)
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001628 if hint > 0:
1629 size += hint
1630 return size
1631
1632
def _is_path_within(path, root):
  """Returns True if |path| is |root| itself or is located below it.

  A plain str.startswith() check wrongly accepts siblings that merely share a
  prefix with the root, e.g. '/b/work2' for the root '/b/work'.
  """
  if path == root:
    return True
  return path.startswith(root.rstrip(os.sep) + os.sep)


def main(args):
  """Parses |args|, prepares the caches and runs the task.

  Args:
    args: command line arguments, without the program name.

  Returns:
    0 once the caches were trimmed and cleaned up when --clean is used; 1 when
    a cipd.Error, local_caching.NamedCacheError or local_caching.NoMoreSpace
    is raised while running; otherwise the value returned by run_tha_test().

  Invalid option combinations are reported through parser.error().
  """
  # Warning: when --argsfile is used, the strings are unicode instances, when
  # parsed normally, the strings are str instances.
  (parser, options, args) = parse_args(args)

  if options.report_on_exception and options.isolate_server:
    on_error.report_on_exception_exit(options.isolate_server)

  if not file_path.enable_symlink():
    logging.warning('Symlink support is not enabled')

  named_cache = process_named_cache_options(parser, options)
  # hint is 0 if there's no named cache: process_named_cache_options() returns
  # None when --named-cache-root is empty, and rejects --named-cache then.
  hint = 0
  if named_cache is not None:
    hint = _calc_named_cache_hint(named_cache, options.named_caches)
  if hint:
    # Increase the --min-free-space value by the hint, and recreate the
    # NamedCache instance so it gets the updated CachePolicy.
    options.min_free_space += hint
    named_cache = process_named_cache_options(parser, options)

  # TODO(crbug.com/932396): Remove this.
  use_go_isolated = options.cipd_enabled

  # TODO(maruel): CIPD caches should be defined at an higher level here too, so
  # they can be cleaned the same way.
  # TODO(crbug.com/1131313):
  # Modifying stats.json from run_isolated.py and Go isolated/cas clients may
  # cause unexpected issues. Initialize CachePolicies when not using Go client
  # or executing --clean.
  isolate_cache = None
  if options.clean or not use_go_isolated:
    isolate_cache = isolateserver.process_cache_options(options, trim=False)
  cas_cache = None
  if options.clean:
    cas_cache = process_cas_cache_options(options)

  caches = []
  if isolate_cache:
    caches.append(isolate_cache)
  if cas_cache:
    caches.append(cas_cache)
  if named_cache:
    caches.append(named_cache)
  root = caches[0].cache_dir if caches else six.text_type(os.getcwd())
  if options.clean:
    if options.isolated:
      parser.error('Can\'t use --isolated with --clean.')
    if options.isolate_server:
      parser.error('Can\'t use --isolate-server with --clean.')
    if options.json:
      parser.error('Can\'t use --json with --clean.')
    if options.named_caches:
      parser.error('Can\'t use --named-cache with --clean.')
    if options.cas_instance or options.cas_digest:
      parser.error('Can\'t use --cas-instance, --cas-digest with --clean.')

    logging.info("initial free space: %d", file_path.get_free_space(root))
    # Trim first, then clean.
    local_caching.trim_caches(
        caches,
        root,
        min_free_space=options.min_free_space,
        max_age_secs=MAX_AGE_SECS)
    logging.info("free space after trim: %d", file_path.get_free_space(root))
    for c in caches:
      c.cleanup()
    logging.info("free space after cleanup: %d", file_path.get_free_space(root))
    return 0

  # Trim must still be done for the following case:
  # - named-cache was used
  # - some entries, with a large hint, where missing
  # - --min-free-space was increased accordingly, thus trimming is needed
  # Otherwise, this will have no effect, as bot_main calls run_isolated with
  # --clean after each task.
  if hint:
    logging.info('Additional trimming of %d bytes', hint)
    local_caching.trim_caches(
        caches,
        root,
        min_free_space=options.min_free_space,
        max_age_secs=MAX_AGE_SECS)

  if not options.isolated and not args:
    parser.error('--isolated or command to run is required.')

  auth.process_auth_options(parser, options)

  isolateserver.process_isolate_server_options(parser, options, False)
  if not options.isolate_server:
    if options.isolated:
      parser.error('--isolated requires --isolate-server')
    if ISOLATED_OUTDIR_PARAMETER in args:
      parser.error(
          '%s in args requires --isolate-server' % ISOLATED_OUTDIR_PARAMETER)

  if options.root_dir:
    options.root_dir = six.text_type(os.path.abspath(options.root_dir))
  if options.json:
    options.json = six.text_type(os.path.abspath(options.json))

  if any('=' not in i for i in options.env):
    parser.error(
        '--env required key=value form. value can be skipped to delete '
        'the variable')
  options.env = dict(i.split('=', 1) for i in options.env)

  prefixes = {}
  cwd = os.path.realpath(os.getcwd())
  for item in options.env_prefix:
    if '=' not in item:
      parser.error(
          '--env-prefix %r is malformed, must be in the form `VAR=./path`'
          % item)
    key, opath = item.split('=', 1)
    if os.path.isabs(opath):
      parser.error('--env-prefix %r path is bad, must be relative.' % opath)
    opath = os.path.normpath(opath)
    # Compare whole path components so that a sibling directory sharing a
    # prefix with the current directory is rejected too.
    if not _is_path_within(os.path.realpath(os.path.join(cwd, opath)), cwd):
      parser.error(
          '--env-prefix %r path is bad, must be relative and not contain `..`.'
          % opath)
    prefixes.setdefault(key, []).append(opath)
  options.env_prefix = prefixes

  cipd.validate_cipd_options(parser, options)

  install_packages_fn = noop_install_packages
  tmp_cipd_cache_dir = None
  if options.cipd_enabled:
    cache_dir = options.cipd_cache
    if not cache_dir:
      # No CIPD cache directory was given: use a temporary one, removed in the
      # 'finally' clause at the end of this function.
      tmp_cipd_cache_dir = six.text_type(tempfile.mkdtemp())
      cache_dir = tmp_cipd_cache_dir
    install_packages_fn = (
        lambda run_dir, isolated_dir, cas_dir: install_client_and_packages(
            run_dir,
            cipd.parse_package_args(options.cipd_packages),
            options.cipd_server,
            options.cipd_client_package,
            options.cipd_client_version,
            cache_dir=cache_dir,
            isolated_dir=isolated_dir,
            cas_dir=cas_dir,
        ))

  @contextlib.contextmanager
  def install_named_caches(run_dir):
    # WARNING: this function depends on "options" variable defined in the outer
    # function.
    assert six.text_type(run_dir), repr(run_dir)
    assert os.path.isabs(run_dir), run_dir
    named_caches = [(os.path.join(run_dir, six.text_type(relpath)), name)
                    for name, relpath, _ in options.named_caches]
    for path, name in named_caches:
      named_cache.install(path, name)
    try:
      yield
    finally:
      # Uninstall each named cache, returning it to the cache pool. If an
      # uninstall fails for a given cache, it will remain in the task's
      # temporary space, get cleaned up by the Swarming bot, and be lost.
      #
      # If the Swarming bot cannot clean up the cache, it will handle it like
      # any other bot file that could not be removed.
      for path, name in reversed(named_caches):
        try:
          # uninstall() doesn't trim but does call save() implicitly. Trimming
          # *must* be done manually via periodic 'run_isolated.py --clean'.
          named_cache.uninstall(path, name)
        except local_caching.NamedCacheError:
          logging.exception('Error while removing named cache %r at %r. '
                            'The cache will be lost.', name, path)

  extra_args = []
  command = []
  if options.raw_cmd:
    command = args
    if options.relative_cwd:
      a = os.path.normpath(os.path.abspath(options.relative_cwd))
      if not _is_path_within(a, os.getcwd()):
        parser.error(
            '--relative-cwd must not try to escape the working directory')
  else:
    if options.relative_cwd:
      parser.error('--relative-cwd requires --raw-cmd')
    extra_args = args

  containment_type = subprocess42.Containment.NONE
  if options.containment_type == 'AUTO':
    containment_type = subprocess42.Containment.AUTO
  if options.containment_type == 'JOB_OBJECT':
    containment_type = subprocess42.Containment.JOB_OBJECT
  containment = subprocess42.Containment(
      containment_type=containment_type,
      limit_processes=options.limit_processes,
      limit_total_committed_memory=options.limit_total_committed_memory)

  data = TaskData(
      command=command,
      relative_cwd=options.relative_cwd,
      extra_args=extra_args,
      isolated_hash=options.isolated,
      storage=None,
      isolate_cache=isolate_cache,
      cas_instance=options.cas_instance,
      cas_digest=options.cas_digest,
      outputs=options.output,
      install_named_caches=install_named_caches,
      leak_temp_dir=options.leak_temp_dir,
      root_dir=_to_unicode(options.root_dir),
      hard_timeout=options.hard_timeout,
      grace_period=options.grace_period,
      bot_file=options.bot_file,
      switch_to_account=options.switch_to_account,
      install_packages_fn=install_packages_fn,
      use_go_isolated=use_go_isolated,
      go_cache_dir=options.cache,
      go_cache_policies=local_caching.CachePolicies(
          max_cache_size=options.max_cache_size,
          min_free_space=options.min_free_space,
          max_items=options.max_items,
          max_age_secs=None,
      ),
      cas_cache_dir=options.cas_cache,
      cas_cache_policies=local_caching.CachePolicies(
          max_cache_size=options.max_cache_size,
          min_free_space=options.min_free_space,
          max_items=None,
          max_age_secs=None,
      ),
      env=options.env,
      env_prefix=options.env_prefix,
      lower_priority=bool(options.lower_priority),
      containment=containment)
  try:
    if options.isolate_server:
      server_ref = isolate_storage.ServerRef(
          options.isolate_server, options.namespace)
      storage = isolateserver.get_storage(server_ref)
      with storage:
        data = data._replace(storage=storage)
        # Hashing schemes used by |storage| and |isolate_cache| MUST match.
        assert storage.server_ref.hash_algo == server_ref.hash_algo
        return run_tha_test(data, options.json)
    return run_tha_test(data, options.json)
  except (cipd.Error, local_caching.NamedCacheError,
          local_caching.NoMoreSpace) as ex:
    # Exceptions have no 'message' attribute on Python 3 unless their class
    # defines one; fall back to str() in that case.
    print(getattr(ex, 'message', None) or str(ex), file=sys.stderr)
    return 1
  finally:
    if tmp_cipd_cache_dir is not None:
      try:
        file_path.rmtree(tmp_cipd_cache_dir)
      except OSError:
        logging.exception('Remove tmp_cipd_cache_dir=%s failed',
                          tmp_cipd_cache_dir)
        # Best effort clean up. Failed to do so doesn't affect the outcome.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001891
1892
if __name__ == '__main__':
  # Script entry point: set up the process, then exit with main()'s result.
  subprocess42.inhibit_os_error_reporting()
  # Ensure that we are always running with the correct encoding.
  fix_encoding.fix_encoding()
  user_agent = 'run_isolated.py/' + __version__
  net.set_user_agent(user_agent)
  exit_code = main(sys.argv[1:])
  sys.exit(exit_code)
Marc-Antoine Ruel90c98162013-12-18 15:11:57 -05001898 sys.exit(main(sys.argv[1:]))