blob: e290098bfd52c9e44ecf2050b114169adaa43d6d [file] [log] [blame]
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001#!/usr/bin/env python
maruelea586f32016-04-05 11:11:33 -07002# Copyright 2012 The LUCI Authors. All rights reserved.
maruelf1f5e2a2016-05-25 17:10:39 -07003# Use of this source code is governed under the Apache License, Version 2.0
4# that can be found in the LICENSE file.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00005
nodir55be77b2016-05-03 09:39:57 -07006"""Runs a command with optional isolated input/output.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00007
run_isolated takes care of setting up a temporary environment, running a
command, and tearing it down.
nodir55be77b2016-05-03 09:39:57 -070010
Marc-Antoine Rueleed2f3a2019-03-14 00:00:40 +000011It handles downloading and uploading isolated files, mapping CIPD packages and
12reusing stateful named caches.
13
14The isolated files, CIPD packages and named caches are kept as a global LRU
15cache.
Marc-Antoine Ruel2283ad12014-02-09 11:14:57 -050016
Roberto Carrillo71ade6d2018-10-08 22:30:24 +000017Any ${EXECUTABLE_SUFFIX} on the command line or the environment variables passed
18with the --env option will be replaced with ".exe" string on Windows and "" on
19other platforms.
nodirbe642ff2016-06-09 15:51:51 -070020
Roberto Carrillo71ade6d2018-10-08 22:30:24 +000021Any ${ISOLATED_OUTDIR} on the command line or the environment variables passed
22with the --env option will be replaced by the location of a temporary directory
23upon execution of the command specified in the .isolated file. All content
24written to this directory will be uploaded upon termination and the .isolated
25file describing this directory will be printed to stdout.
bpastene447c1992016-06-20 15:21:47 -070026
Marc-Antoine Rueleed2f3a2019-03-14 00:00:40 +000027Any ${SWARMING_BOT_FILE} on the command line or the environment variables passed
28with the --env option will be replaced by the value of the --bot-file parameter.
29This file is used by a swarming bot to communicate state of the host to tasks.
30It is written to by the swarming bot's on_before_task() hook in the swarming
31server's custom bot_config.py.
32
33See
34https://chromium.googlesource.com/infra/luci/luci-py.git/+/master/appengine/swarming/doc/Magic-Values.md
35for all the variables.
36
37See
38https://chromium.googlesource.com/infra/luci/luci-py.git/+/master/appengine/swarming/swarming_bot/config/bot_config.py
39for more information about bot_config.py.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000040"""
41
Marc-Antoine Ruelf899c482019-10-10 23:32:06 +000042from __future__ import print_function
43
44__version__ = '1.0.1'
maruel@chromium.orgdedbf492013-09-12 20:42:11 +000045
aludwin7556e0c2016-10-26 08:46:10 -070046import argparse
maruel064c0a32016-04-05 11:47:15 -070047import base64
iannucci96fcccc2016-08-30 15:52:22 -070048import collections
vadimsh232f5a82017-01-20 19:23:44 -080049import contextlib
Sadaf Matinkhoo10743a62018-03-29 16:28:58 -040050import errno
aludwin7556e0c2016-10-26 08:46:10 -070051import json
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000052import logging
53import optparse
54import os
Marc-Antoine Ruel8b11dbd2018-05-18 14:31:22 -040055import re
Takuto Ikuta27c93b22019-12-11 07:56:43 +000056import subprocess
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000057import sys
58import tempfile
maruel064c0a32016-04-05 11:47:15 -070059import time
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000060
Marc-Antoine Ruel016c7602019-04-02 18:31:13 +000061from utils import tools
62tools.force_local_third_party()
vadimsh@chromium.orga4326472013-08-24 02:05:41 +000063
Marc-Antoine Ruel016c7602019-04-02 18:31:13 +000064# third_party/
65from depot_tools import fix_encoding
Takuto Ikuta6e2ff962019-10-29 12:35:27 +000066import six
Marc-Antoine Ruel016c7602019-04-02 18:31:13 +000067
68# pylint: disable=ungrouped-imports
69import auth
70import cipd
71import isolate_storage
72import isolateserver
73import local_caching
74from libs import luci_context
Vadim Shtayura6b555c12014-07-23 16:22:18 -070075from utils import file_path
maruel12e30012015-10-09 11:55:35 -070076from utils import fs
maruel064c0a32016-04-05 11:47:15 -070077from utils import large
Marc-Antoine Ruelf74cffe2015-07-15 15:21:34 -040078from utils import logging_utils
Marc-Antoine Ruelcfb60852014-07-02 15:22:00 -040079from utils import on_error
Marc-Antoine Ruelc44f5722015-01-08 16:10:01 -050080from utils import subprocess42
maruel@chromium.orgdedbf492013-09-12 20:42:11 +000081
vadimsh@chromium.orga4326472013-08-24 02:05:41 +000082
# Magic variables that can be found in the isolate task command line. Each
# token is substituted with a concrete value by replace_parameters().
ISOLATED_OUTDIR_PARAMETER = '${ISOLATED_OUTDIR}'
EXECUTABLE_SUFFIX_PARAMETER = '${EXECUTABLE_SUFFIX}'
SWARMING_BOT_FILE_PARAMETER = '${SWARMING_BOT_FILE}'


# The name of the log file to use.
RUN_ISOLATED_LOG_FILE = 'run_isolated.log'


# The name of the log to use for the run_test_cases.py command.
RUN_TEST_CASES_LOG = 'run_test_cases.log'


# Use short names for temporary directories. This is driven by Windows, which
# imposes a relatively short maximum path length of 260 characters, often
# referred to as MAX_PATH. It is relatively easy to create files with longer
# path length. A use case is with recursive dependency trees like npm packages.
#
# It is recommended to start the script with a `root_dir` as short as
# possible.
# - ir stands for isolated_run
# - io stands for isolated_out
# - it stands for isolated_tmp
# - ic stands for isolated_client
ISOLATED_RUN_DIR = u'ir'
ISOLATED_OUT_DIR = u'io'
ISOLATED_TMP_DIR = u'it'
ISOLATED_CLIENT_DIR = u'ic'

# CIPD package name and pinned revision of the Go `isolated` client.
# TODO(tikuta): take these parameters from luci-config?
# Take revision from
# https://ci.chromium.org/p/infra-internal/g/infra-packagers/console
ISOLATED_PACKAGE = 'infra/tools/luci/isolated/${platform}'
ISOLATED_REVISION = 'git_revision:4e6b4d31c342d1e7b8dbd478da7378f52652b279'

# Valid named cache names: 1 to 4096 characters among lowercase ASCII letters,
# digits and underscore.
# Keep synced with task_request.py
CACHE_NAME_RE = re.compile(r'^[a-z0-9_]{1,4096}$')
Marc-Antoine Ruel8b11dbd2018-05-18 14:31:22 -0400121
122
# Message template explaining that a directory could not be deleted because
# child processes outlived the task. It takes two %-style arguments, in order:
# the directory that could not be deleted, and the number of seconds a process
# is given between the termination signal and being forcibly killed.
OUTLIVING_ZOMBIE_MSG = """\
*** Swarming tried multiple times to delete the %s directory and failed ***
*** Hard failing the task ***

Swarming detected that your testing script ran an executable, which may have
started a child executable, and the main script returned early, leaving the
children executables playing around unguided.

You don't want to leave children processes outliving the task on the Swarming
bot, do you? The Swarming bot doesn't.

How to fix?
- For any process that starts children processes, make sure all children
  processes terminated properly before each parent process exits. This is
  especially important in very deep process trees.
  - This must be done properly both in normal successful task and in case of
    task failure. Cleanup is very important.
- The Swarming bot sends a SIGTERM in case of timeout.
  - You have %s seconds to comply after the signal was sent to the process
    before the process is forcibly killed.
- To achieve not leaking children processes in case of signals on timeout, you
  MUST handle signals in each executable / python script and propagate them to
  children processes.
  - When your test script (python or binary) receives a signal like SIGTERM or
    CTRL_BREAK_EVENT on Windows), send it to all children processes and wait for
    them to terminate before quitting.

See
https://chromium.googlesource.com/infra/luci/luci-py.git/+/master/appengine/swarming/doc/Bot.md#Graceful-termination_aka-the-SIGTERM-and-SIGKILL-dance
for more information.

*** May the SIGKILL force be with you ***
"""
156
157
# Maximum age, expressed in seconds. Currently hardcoded. Eventually could be
# exposed as a flag once there's value.
# 3 weeks
MAX_AGE_SECS = 21*24*60*60
161
162
# Immutable bundle of every parameter describing one task to run.
TaskData = collections.namedtuple(
    'TaskData',
    (
        # Command line to run, as a list of strings. Takes effect regardless
        # of what the isolated file specifies.
        'command',
        # Directory, relative, in which the command is started.
        'relative_cwd',
        # Arguments, as a list of strings, appended to the command specified
        # in the isolated file.
        'extra_args',
        # Hash of the .isolated file to retrieve in order to recreate the tree
        # of files needed to run the target executable. The command specified
        # in the .isolated is executed. Mutually exclusive with command
        # argument.
        'isolated_hash',
        # isolateserver.Storage instance used to retrieve remote objects. It
        # references an isolateserver.StorageApi, which does the actual I/O.
        'storage',
        # isolateserver.LocalCache instance caching the retrieved objects so
        # they are not fetched constantly. Can be on-disk or in-memory.
        'isolate_cache',
        # Paths, relative to root_dir, to put into the output isolated bundle
        # upon task completion (see link_outputs_to_outdir).
        'outputs',
        # Function (run_dir) => context manager that installs named caches
        # into |run_dir|.
        'install_named_caches',
        # When True, the temporary directory is deliberately leaked for later
        # examination.
        'leak_temp_dir',
        # Directory in which the temporary directory is created. When not
        # specified, a random temporary directory is created.
        'root_dir',
        # The process is killed if it lasts more than this many seconds.
        'hard_timeout',
        # Seconds to wait between SIGTERM and SIGKILL.
        'grace_period',
        # Path to a file with bot state, substituted for ${SWARMING_BOT_FILE}
        # in the task command line.
        'bot_file',
        # Logical account to switch LUCI_CONTEXT into.
        'switch_to_account',
        # Context manager dir => CipdInfo, see install_client_and_packages.
        'install_packages_fn',
        # Whether to use the go isolated client.
        'use_go_isolated',
        # Cache directory for the go isolated client.
        'go_cache_dir',
        # Environment variables to set.
        'env',
        # Environment variables to mutate with relative directories.
        # Example: {"ENV_KEY": ['relative', 'paths', 'to', 'prepend']}
        'env_prefix',
        # Whether to lower the task process priority.
        'lower_priority',
        # subprocess42.Containment instance. Can be None.
        'containment',
    ))
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -0500223
224
Marc-Antoine Ruelee6ca622017-11-29 11:19:16 -0500225def _to_str(s):
226 """Downgrades a unicode instance to str. Pass str through as-is."""
227 if isinstance(s, str):
228 return s
229 # This is technically incorrect, especially on Windows. In theory
230 # sys.getfilesystemencoding() should be used to use the right 'ANSI code
231 # page' on Windows, but that causes other problems, as the character set
232 # is very limited.
233 return s.encode('utf-8')
234
235
def _to_unicode(s):
  """Returns |s| as unicode text, decoding it from UTF-8 when needed.

  None and values that already are unicode text are returned as-is.
  """
  needs_decoding = s is not None and not isinstance(s, six.text_type)
  return s.decode('utf-8') if needs_decoding else s
241
242
def make_temp_dir(prefix, root_dir):
  """Creates a unique temporary directory in |root_dir| and returns its path.

  The directory name starts with |prefix|; the path is returned as unicode
  text.
  """
  created = tempfile.mkdtemp(dir=root_dir, prefix=prefix)
  return six.text_type(created)
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +0000246
247
def change_tree_read_only(rootdir, read_only):
  """Applies the |read_only| policy to the tree rooted at |rootdir|.

  Accepted values for |read_only|:
    - 2: files and directories (except on Windows) are marked read only. This
      inhibits modifying, creating or deleting files in the test directory,
      except on Windows where creating and deleting files is still possible.
    - 1: files are marked read only but not the directories. This inhibits
      modifying files but creating or deleting files is still possible.
    - 0 or None: anything can be modified.

  Raises:
    ValueError if |read_only| is any other value.
  """
  if read_only == 2:
    file_path.make_tree_read_only(rootdir)
    return

  if read_only == 1:
    file_path.make_tree_files_read_only(rootdir)
    return

  if read_only in (0, None):
    # TODO(maruel): This is currently dangerous as long as
    # DiskContentAddressedCache.touch() is not yet changed to verify the hash
    # of the content of the files it is looking at, so that if a test modifies
    # an input file, the file must be deleted.
    file_path.make_tree_writeable(rootdir)
    return

  details = (rootdir, read_only, read_only)
  raise ValueError(
      'change_tree_read_only(%s, %s): Unknown flag %s' % details)
274
275
@contextlib.contextmanager
def set_luci_context_account(account, tmp_dir):
  """Context manager making |account| the default LUCI_CONTEXT account.

  Nothing is changed in any of these cases:
  - |account| is None or ''. This happens when run_isolated.py is called
    without the '--switch-to-account' flag. If run_isolated.py is running in
    some LUCI_CONTEXT environment, the task just inherits whatever account is
    already set. This may happen if users invoke run_isolated.py explicitly
    from their code.
  - LUCI_CONTEXT-based auth is not in use.
  - The requested account is already the default one.

  When the requested account is not defined in the context, the default
  account is removed, i.e. access becomes non-authenticated. This happens for
  Swarming tasks that don't use 'task' service accounts.
  """
  # 'local_auth' is only read when a switch was actually requested.
  local_auth = luci_context.read('local_auth') if account else None

  # See LUCI_CONTEXT.md for the format of 'local_auth'.
  if not local_auth or local_auth.get('default_account_id') == account:
    # Not switching, not using LUCI_CONTEXT auth, or already set.
    yield
    return

  known_ids = set()
  for entry in local_auth.get('accounts') or []:
    known_ids.add(entry['id'])

  if account not in known_ids:
    logging.warning(
        'Requested LUCI_CONTEXT account %r is not available (have only %r), '
        'disabling authentication', account, sorted(known_ids))
    local_auth.pop('default_account_id', None)
  else:
    logging.info('Switching default LUCI_CONTEXT account to %r', account)
    local_auth['default_account_id'] = account

  with luci_context.write(_tmpdir=tmp_dir, local_auth=local_auth):
    yield
322
323
def process_command(command, out_dir, bot_file):
  """Returns a copy of |command| with the parameters of each argument replaced.

  Every argument goes through replace_parameters().

  Raises:
    ValueError if a parameter is requested in |command| but its value is not
      provided.
  """
  processed = []
  for arg in command:
    processed.append(replace_parameters(arg, out_dir, bot_file))
  return processed
332
333
def replace_parameters(arg, out_dir, bot_file):
  """Returns |arg| with the parameter tokens replaced by their values.

  - ${EXECUTABLE_SUFFIX} is always replaced with cipd.EXECUTABLE_SUFFIX.
  - ${ISOLATED_OUTDIR} is replaced with |out_dir|.
  - ${SWARMING_BOT_FILE} is replaced with |bot_file|; when |bot_file| is not
    provided, a warning is logged and the token is left unchanged.

  Raises:
    ValueError if ${ISOLATED_OUTDIR} is requested in |arg| but |out_dir| is
      not provided.
  """
  arg = arg.replace(EXECUTABLE_SUFFIX_PARAMETER, cipd.EXECUTABLE_SUFFIX)
  has_path_param = False

  if ISOLATED_OUTDIR_PARAMETER in arg:
    if not out_dir:
      raise ValueError(
          'output directory is requested in command or env var, but not '
          'provided; please specify one')
    arg = arg.replace(ISOLATED_OUTDIR_PARAMETER, out_dir)
    has_path_param = True

  if SWARMING_BOT_FILE_PARAMETER in arg:
    if not bot_file:
      logging.warning('SWARMING_BOT_FILE_PARAMETER found in command or env '
                      'var, but no bot_file specified. Leaving parameter '
                      'unchanged.')
    else:
      arg = arg.replace(SWARMING_BOT_FILE_PARAMETER, bot_file)
      has_path_param = True

  if not has_path_param:
    return arg
  # Slashes are converted only when a path parameter was substituted, because
  # of arguments like '${ISOLATED_OUTDIR}/foo/bar'.
  return arg.replace('/', os.sep)
maruela9cfd6f2015-09-15 11:03:15 -0700363
364
Roberto Carrillo71ade6d2018-10-08 22:30:24 +0000365
def get_command_env(tmp_dir, cipd_info, run_dir, env, env_prefixes, out_dir,
                    bot_file):
  """Returns full OS environment to run a command in.

  Starts from a copy of the current process environment, applies |env|, puts
  the directory with the cipd binary in front of PATH, exposes CIPD_CACHE_DIR
  env var, installs all env_prefixes and finally sets up the temporary
  directory variables.

  Args:
    tmp_dir: temp directory.
    cipd_info: CipdInfo object if cipd client is used, None if not.
    run_dir: The root directory the isolated tree is mapped in.
    env: environment variables to use. A variable with an empty value is
        removed from the resulting environment.
    env_prefixes: {"ENV_KEY": ['cwd', 'relative', 'paths', 'to', 'prepend']}
    out_dir: Isolated output directory. Required to be != None if any of the
        env vars contain ISOLATED_OUTDIR_PARAMETER.
    bot_file: Required to be != None if any of the env vars contain
        SWARMING_BOT_FILE_PARAMETER.

  Returns:
    dict of environment variable name to value.

  Raises:
    ValueError if an |env| value requests ISOLATED_OUTDIR_PARAMETER but
      |out_dir| is not provided.
  """
  out = os.environ.copy()
  for k, v in env.items():
    if not v:
      out.pop(k, None)
    else:
      out[k] = replace_parameters(v, out_dir, bot_file)

  if cipd_info:
    bin_dir = _to_str(os.path.dirname(cipd_info.client.binary_path))
    # PATH can legitimately be missing here: it may be unset in the process
    # environment, or it was just removed above because |env| maps it to an
    # empty value. In that case the cipd directory becomes the whole PATH
    # instead of failing with KeyError.
    if 'PATH' in out:
      out['PATH'] = '%s%s%s' % (bin_dir, os.pathsep, out['PATH'])
    else:
      out['PATH'] = bin_dir
    out['CIPD_CACHE_DIR'] = _to_str(cipd_info.cache_dir)

  for key, paths in env_prefixes.items():
    assert isinstance(paths, list), paths
    paths = [os.path.normpath(os.path.join(run_dir, p)) for p in paths]
    # The prefixes go in front of the current value, if any.
    cur = out.get(key)
    if cur:
      paths.append(cur)
    out[key] = _to_str(os.path.pathsep.join(paths))

  tmp_dir = _to_str(tmp_dir)
  # pylint: disable=line-too-long
  # * python respects $TMPDIR, $TEMP, and $TMP in this order, regardless of
  #   platform. So $TMPDIR must be set on all platforms.
  #   https://github.com/python/cpython/blob/2.7/Lib/tempfile.py#L155
  out['TMPDIR'] = tmp_dir
  if sys.platform == 'win32':
    # * chromium's base utils uses GetTempPath().
    #    https://cs.chromium.org/chromium/src/base/files/file_util_win.cc?q=GetTempPath
    # * Go uses GetTempPath().
    # * GetTempDir() uses %TMP%, then %TEMP%, then other stuff. So %TMP% must
    #   be set.
    #   https://docs.microsoft.com/en-us/windows/desktop/api/fileapi/nf-fileapi-gettemppathw
    out['TMP'] = tmp_dir
    # https://blogs.msdn.microsoft.com/oldnewthing/20150417-00/?p=44213
    out['TEMP'] = tmp_dir
  elif sys.platform == 'darwin':
    # * Chromium uses an hack on macOS before calling into
    #   NSTemporaryDirectory().
    #   https://cs.chromium.org/chromium/src/base/files/file_util_mac.mm?q=GetTempDir
    #   https://developer.apple.com/documentation/foundation/1409211-nstemporarydirectory
    out['MAC_CHROMIUM_TMPDIR'] = tmp_dir
  else:
    # TMPDIR is specified as the POSIX standard envvar for the temp directory.
    # http://pubs.opengroup.org/onlinepubs/9699919799/basedefs/V1_chap08.html
    # * mktemp on linux respects $TMPDIR.
    # * Chromium respects $TMPDIR on linux.
    #   https://cs.chromium.org/chromium/src/base/files/file_util_posix.cc?q=GetTempDir
    # * Go uses $TMPDIR.
    #   https://go.googlesource.com/go/+/go1.10.3/src/os/file_unix.go#307
    pass
  return out
vadimsh232f5a82017-01-20 19:23:44 -0800436
437
def run_command(
    command, cwd, env, hard_timeout, grace_period, lower_priority, containment):
  """Runs the command.

  The command is started as a detached process. If it does not exit within
  |hard_timeout|, or if a stop signal is received while waiting, the process is
  sent a termination request, given |grace_period| to exit, then killed.

  Args:
    command: command line to run; passed as-is to subprocess42.Popen.
    cwd: directory to start the process in.
    env: environment variables of the process.
    hard_timeout: maximum time to wait for the process before terminating it.
        A falsy value is passed as None to proc.wait(), presumably meaning no
        limit.
    grace_period: time to wait after the termination request before killing
        the process. A falsy value is passed as None to proc.wait().
    lower_priority: forwarded to subprocess42.Popen.
    containment: forwarded to subprocess42.Popen.

  Returns:
    tuple(process exit code, bool if had a hard timeout)

    The exit code is 1 when the process could not be started (OSError).
  """
  logging.info(
      'run_command(%s, %s, %s, %s, %s, %s)',
      command, cwd, hard_timeout, grace_period, lower_priority, containment)

  exit_code = None
  had_hard_timeout = False
  with tools.Profiler('RunTest'):
    proc = None
    # A list is used as a mutable flag so the nested handler can record that
    # a signal was received.
    had_signal = []
    try:
      # TODO(maruel): This code is imperfect. It doesn't handle well signals
      # during the download phase and there's short windows where things can go
      # wrong.
      def handler(signum, _frame):
        # Only the first signal received once the process was started is acted
        # upon; it interrupts the wait below the same way a timeout does.
        if proc and not had_signal:
          logging.info('Received signal %d', signum)
          had_signal.append(True)
          raise subprocess42.TimeoutExpired(command, None)

      proc = subprocess42.Popen(
          command, cwd=cwd, env=env, detached=True, close_fds=True,
          lower_priority=lower_priority, containment=containment)
      with subprocess42.set_signal_handler(subprocess42.STOP_SIGNALS, handler):
        try:
          exit_code = proc.wait(hard_timeout or None)
        except subprocess42.TimeoutExpired:
          # Raised either by the wait timing out or by handler() above; only
          # the former counts as a hard timeout.
          if not had_signal:
            logging.warning('Hard timeout')
            had_hard_timeout = True
          logging.warning('Sending SIGTERM')
          proc.terminate()

      # Ignore signals in grace period. Forcibly give the grace period to the
      # child process.
      if exit_code is None:
        ignore = lambda *_: None
        with subprocess42.set_signal_handler(subprocess42.STOP_SIGNALS, ignore):
          try:
            exit_code = proc.wait(grace_period or None)
          except subprocess42.TimeoutExpired:
            # Now kill for real. The user can distinguish between the
            # following states:
            # - signal but process exited within grace period,
            #   hard_timed_out will be set but the process exit code will be
            #   script provided.
            # - processed exited late, exit code will be -9 on posix.
            logging.warning('Grace exhausted; sending SIGKILL')
            proc.kill()
      logging.info('Waiting for process exit')
      exit_code = proc.wait()
    except OSError:
      # This is not considered to be an internal error. The executable simply
      # does not exist.
      sys.stderr.write(
          '<The executable does not exist, a dependent library is missing or '
          'the command line is too long>\n'
          '<Check for missing .so/.dll in the .isolate or GN file or length of '
          'command line args>\n'
          '<Command: %s>\n' % command)
      if os.environ.get('SWARMING_TASK_ID'):
        # Give an additional hint when running as a swarming task.
        sys.stderr.write(
            '<See the task\'s page for commands to help diagnose this issue '
            'by reproducing the task locally>\n')
      exit_code = 1
  # The exit code is also logged as an unsigned 32 bits hexadecimal value.
  logging.info(
      'Command finished with exit code %d (%s)',
      exit_code, hex(0xffffffff & exit_code))
  return exit_code, had_hard_timeout
maruela9cfd6f2015-09-15 11:03:15 -0700514
515
def _fetch_and_map_with_go(isolated_hash, storage, cache, outdir, go_cache_dir,
                           isolated_client):
  """Fetches an isolated tree with the go client and creates the tree.

  The |isolated_client| executable is run with its `download` subcommand and
  reports its result through a temporary JSON file, which is always removed
  before returning.

  Returns:
    tuple(bundle, stats) where bundle is an isolateserver.IsolatedBundle with
    only command, read_only and relative_cwd filled in, and stats is a dict
    with the keys 'duration', 'items_cold' and 'items_hot'.
  """
  started_at = time.time()
  server_ref = storage.server_ref
  policies = cache.policies
  fd, result_json_path = tempfile.mkstemp(
      prefix=u'fetch-and-map-result-', suffix=u'.json')
  # Only the path is needed; the go client writes the file itself.
  os.close(fd)
  try:
    cmd = [isolated_client, 'download']
    cmd += ['-isolate-server', server_ref.url]
    cmd += ['-namespace', server_ref.namespace]
    cmd += ['-isolated', isolated_hash]
    # Flags for the cache.
    cmd += ['-cache-dir', go_cache_dir]
    cmd += ['-cache-max-items', str(policies.max_items)]
    cmd += ['-cache-max-size', str(policies.max_cache_size)]
    cmd += ['-cache-min-free-space', str(policies.min_free_space)]
    # Flags for the output.
    cmd += ['-output-dir', outdir]
    cmd += ['-fetch-and-map-result-json', result_json_path]
    subprocess42.check_call(cmd)

    with open(result_json_path) as json_file:
      result_json = json.load(json_file)

    isolated = result_json['isolated']
    bundle = isolateserver.IsolatedBundle(filter_cb=None)
    # Only the following properties are used by the caller.
    bundle.command = isolated.get('command')
    bundle.read_only = isolated.get('read_only')
    bundle.relative_cwd = isolated.get('relative_cwd')

    stats = {
        'duration': time.time() - started_at,
        'items_cold': result_json['items_cold'],
        'items_hot': result_json['items_hot'],
    }
    return bundle, stats
  finally:
    fs.remove(result_json_path)
572
573
# TODO(crbug.com/932396): remove this function.
def fetch_and_map(isolated_hash, storage, cache, outdir):
  """Fetches an isolated tree and creates the tree into |outdir|.

  Returns:
    tuple(bundle, stats) where bundle is what isolateserver.fetch_isolated()
    returned and stats is a dict with the keys 'duration', 'items_cold' and
    'items_hot'. The items are base64 encoded packed sorted lists.
  """
  started_at = time.time()
  bundle = isolateserver.fetch_isolated(
      isolated_hash=isolated_hash,
      storage=storage,
      cache=cache,
      outdir=outdir,
      use_symlinks=False)
  # Hot items are the ones that were used without having been added, counting
  # duplicates.
  used = collections.Counter(cache.used)
  added = collections.Counter(cache.added)
  hot_items = (used - added).elements()
  stats = {
      'duration': time.time() - started_at,
      'items_cold': base64.b64encode(large.pack(sorted(cache.added))),
      'items_hot': base64.b64encode(large.pack(sorted(hot_items))),
  }
  return bundle, stats
591
592
def link_outputs_to_outdir(run_dir, out_dir, outputs):
  """Makes each named output of |run_dir| available under |out_dir|.

  This is what allows the named outputs to be uploaded. Each entry of
  |outputs| is a path relative to |run_dir| and is reproduced at the same
  relative path under |out_dir|. Nothing is done when |outputs| is empty.
  """
  if outputs:
    isolateserver.create_directories(out_dir, outputs)
    for rel_path in outputs:
      src = os.path.join(run_dir, rel_path)
      dst = os.path.join(out_dir, rel_path)
      copy_recursively(src, dst)
603
604
def copy_recursively(src, dst):
  """Efficiently copies a file or directory from src to dst.

  `src` may be a file, directory, or a symlink to a file or directory.
  All symlinks are replaced with their targets, so the resulting
  directory structure in dst will never have any symlinks.

  To increase speed, copy_recursively hardlinks individual files into the
  (newly created) directory structure if possible, unlike Python's
  shutil.copytree().

  This is best effort: OSError is logged and not raised, and a chain of
  symlinks that is too long (e.g. symlinks pointing at each other) is logged
  and skipped.
  """
  # Upper bound on the number of symlinks followed to resolve |src|. A longer
  # chain is treated as a cycle, which would otherwise loop forever.
  max_symlink_hops = 40
  orig_src = src
  try:
    # Replace symlinks with their final target.
    hops = 0
    while fs.islink(src):
      hops += 1
      if hops > max_symlink_hops:
        logging.warning(
            'Too many levels of symbolic links while resolving %s; skipping',
            orig_src)
        return
      res = fs.readlink(src)
      # A relative link target is relative to the directory holding the link;
      # os.path.join() keeps an absolute target as-is.
      src = os.path.join(os.path.dirname(src), res)

    # Note that fs.isfile (which is a wrapper around os.path.isfile) throws
    # an exception if src does not exist. A warning will be logged in that case.
    if fs.isfile(src):
      file_path.link_file(dst, src, file_path.HARDLINK_WITH_FALLBACK)
      return

    if not fs.exists(dst):
      os.makedirs(dst)

    for child in fs.listdir(src):
      copy_recursively(os.path.join(src, child), os.path.join(dst, child))

  except OSError as e:
    if e.errno == errno.ENOENT:
      logging.warning('Path %s does not exist or %s is a broken symlink',
                      src, orig_src)
    else:
      logging.info("Couldn't collect output file %s: %s", src, e)
aludwin0a8e17d2016-10-27 15:57:39 -0700642
643
def upload_then_delete(storage, out_dir, leak_temp_dir):
  """Uploads the content of out_dir back, then deletes out_dir.

  Arguments:
  - storage: object handed to isolateserver.archive_files_to_storage(); its
        server_ref.url and server_ref.namespace are reported in outputs_ref.
  - out_dir: directory holding the outputs to archive. Nothing is uploaded
        when it does not exist or is empty.
  - leak_temp_dir: if true, out_dir is left on disk instead of being deleted.

  Returns:
    tuple(outputs_ref, success, stats)
    - outputs_ref: a dict referring to the results archived back to the isolated
        server, if applicable.
    - success: False if something occurred that means that the task must
        forcibly be considered a failure, e.g. zombie processes were left
        behind.
    - stats: uploading stats.

  Raises:
    isolateserver.Aborted: re-raised when the upload was interrupted.
  """
  # Upload out_dir and generate a .isolated file out of this directory. It is
  # only done if files were written in the directory.
  outputs_ref = None
  cold = []
  hot = []
  start = time.time()

  if fs.isdir(out_dir) and fs.listdir(out_dir):
    with tools.Profiler('ArchiveOutput'):
      try:
        results, f_cold, f_hot = isolateserver.archive_files_to_storage(
            storage, [out_dir], None)
        outputs_ref = {
            # dict.values() is a non-subscriptable view on Python 3, so it is
            # materialized first; the result is unchanged on Python 2.
            'isolated': list(results.values())[0],
            'isolatedserver': storage.server_ref.url,
            'namespace': storage.server_ref.namespace,
        }
        cold = sorted(i.size for i in f_cold)
        hot = sorted(i.size for i in f_hot)
      except isolateserver.Aborted:
        # This happens when a signal SIGTERM was received while uploading data.
        # There is 2 causes:
        # - The task was too slow and was about to be killed anyway due to
        #   exceeding the hard timeout.
        # - The amount of data uploaded back is very large and took too much
        #   time to archive.
        sys.stderr.write('Received SIGTERM while uploading')
        # Re-raise, so it will be treated as an internal failure.
        raise

  success = False
  try:
    if (not leak_temp_dir and fs.isdir(out_dir) and
        not file_path.rmtree(out_dir)):
      logging.error('Had difficulties removing out_dir %s', out_dir)
    else:
      success = True
  except OSError as e:
    # When this happens, it means there's a process error.
    logging.exception('Had difficulties removing out_dir %s: %s', out_dir, e)
  stats = {
      # Covers both the upload and the deletion of out_dir.
      'duration': time.time() - start,
      'items_cold': base64.b64encode(large.pack(cold)),
      'items_hot': base64.b64encode(large.pack(hot)),
  }
  return outputs_ref, success, stats
maruela9cfd6f2015-09-15 11:03:15 -0700702
703
def map_and_run(data, constant_run_path):
  """Runs a command with optional isolated input/output.

  Arguments:
  - data: TaskData instance.
  - constant_run_path: if true and a root directory is known, the run
        directory is created at the fixed path <root_dir>/ISOLATED_RUN_DIR,
        deleting any previous one; otherwise a temporary run directory is
        created with make_temp_dir().

  Returns metadata about the result, as a dict. 'internal_failure' is None
  only when the command was actually run; 'exit_code' is forced to 1 when the
  command succeeded but cleanup or upload failed.
  """
  result = {
      'duration': None,
      'exit_code': None,
      'had_hard_timeout': False,
      'internal_failure': 'run_isolated did not complete properly',
      'stats': {
          #'cipd': {
          #  'duration': 0.,
          #  'get_client_duration': 0.,
          #},
          'isolated': {
              'download': {
                  #'duration': 0.,
                  'initial_number_items': len(data.isolate_cache),
                  'initial_size': data.isolate_cache.total_size,
                  #'items_cold': '<large.pack()>',
                  #'items_hot': '<large.pack()>',
              },
              #'upload': {
              #  'duration': 0.,
              #  'items_cold': '<large.pack()>',
              #  'items_hot': '<large.pack()>',
              #},
          },
      },
      #'cipd_pins': {
      #  'packages': [
      #    {'package_name': ..., 'version': ..., 'path': ...},
      #    ...
      #  ],
      #  'client_package': {'package_name': ..., 'version': ...},
      #},
      'outputs_ref': None,
      'version': 5,
  }

  if data.root_dir:
    file_path.ensure_tree(data.root_dir, 0o700)
  elif data.isolate_cache.cache_dir:
    data = data._replace(
        root_dir=os.path.dirname(data.isolate_cache.cache_dir))
  # See comment for these constants.
  # If root_dir is not specified, it is not constant.
  # TODO(maruel): This is not obvious. Change this to become an error once we
  # make the constant_run_path an exposed flag.
  if constant_run_path and data.root_dir:
    run_dir = os.path.join(data.root_dir, ISOLATED_RUN_DIR)
    if os.path.isdir(run_dir):
      file_path.rmtree(run_dir)
    os.mkdir(run_dir, 0o700)
  else:
    run_dir = make_temp_dir(ISOLATED_RUN_DIR, data.root_dir)
  # storage should be normally set but don't crash if it is not. This can happen
  # as Swarming task can run without an isolate server.
  out_dir = make_temp_dir(
      ISOLATED_OUT_DIR, data.root_dir) if data.storage else None
  tmp_dir = make_temp_dir(ISOLATED_TMP_DIR, data.root_dir)
  isolated_client_dir = make_temp_dir(ISOLATED_CLIENT_DIR, data.root_dir)
  cwd = run_dir
  if data.relative_cwd:
    cwd = os.path.normpath(os.path.join(cwd, data.relative_cwd))
  command = data.command
  try:
    with data.install_packages_fn(run_dir, isolated_client_dir) as cipd_info:
      if cipd_info:
        result['stats']['cipd'] = cipd_info.stats
        result['cipd_pins'] = cipd_info.pins

      if data.isolated_hash:
        isolated_stats = result['stats'].setdefault('isolated', {})
        python_fallback = False
        if data.use_go_isolated:
          try:
            bundle, stats = _fetch_and_map_with_go(
                isolated_hash=data.isolated_hash,
                storage=data.storage,
                cache=data.isolate_cache,
                outdir=run_dir,
                go_cache_dir=data.go_cache_dir,
                isolated_client=os.path.join(
                    isolated_client_dir, 'isolated' + cipd.EXECUTABLE_SUFFIX))
          except subprocess.CalledProcessError as e:
            logging.error(
                'failed to run go client, fallback to python client: %s', e)
            # Start again from an empty run directory so the python client
            # does not see whatever the go client left behind.
            file_path.rmtree(run_dir)
            os.mkdir(run_dir, 0o700)
            python_fallback = True

        if not data.use_go_isolated or python_fallback:
          bundle, stats = fetch_and_map(
              isolated_hash=data.isolated_hash,
              storage=data.storage,
              cache=data.isolate_cache,
              outdir=run_dir)
        isolated_stats['download'].update(stats)
        change_tree_read_only(run_dir, bundle.read_only)
        # Inject the command
        if not command and bundle.command:
          command = bundle.command + data.extra_args
          # Only set the relative directory if the isolated file specified a
          # command, and no raw command was specified.
          if bundle.relative_cwd:
            cwd = os.path.normpath(os.path.join(cwd, bundle.relative_cwd))

      if not command:
        # Handle this as a task failure, not an internal failure.
        # NOTE(review): 'internal_failure' still holds its initial message on
        # this early return (and on the one below) - confirm this is intended.
        sys.stderr.write(
            '<No command was specified!>\n'
            '<Please secify a command when triggering your Swarming task>\n')
        result['exit_code'] = 1
        return result

      # A plain cwd.startswith(run_dir) would also accept a sibling directory
      # whose name merely starts with the run directory name (e.g. 'ir_evil'
      # next to 'ir'), so compare against run_dir followed by a separator.
      if cwd != run_dir and not cwd.startswith(os.path.join(run_dir, '')):
        # Handle this as a task failure, not an internal failure. This is a
        # 'last chance' way to gate against directory escape.
        sys.stderr.write('<Relative CWD is outside of run directory!>\n')
        result['exit_code'] = 1
        return result

      if not os.path.isdir(cwd):
        # Accepts relative_cwd that does not exist.
        os.makedirs(cwd, 0o700)

      # If we have an explicit list of files to return, make sure their
      # directories exist now.
      if data.storage and data.outputs:
        isolateserver.create_directories(run_dir, data.outputs)

      with data.install_named_caches(run_dir):
        sys.stdout.flush()
        start = time.time()
        try:
          # Need to switch the default account before 'get_command_env' call,
          # so it can grab correct value of LUCI_CONTEXT env var.
          with set_luci_context_account(data.switch_to_account, tmp_dir):
            env = get_command_env(
                tmp_dir, cipd_info, run_dir, data.env, data.env_prefix, out_dir,
                data.bot_file)
            command = tools.find_executable(command, env)
            command = process_command(command, out_dir, data.bot_file)
            file_path.ensure_command_has_abs_path(command, cwd)

            result['exit_code'], result['had_hard_timeout'] = run_command(
                command, cwd, env, data.hard_timeout, data.grace_period,
                data.lower_priority, data.containment)
        finally:
          result['duration'] = max(time.time() - start, 0)

    # We successfully ran the command, set internal_failure back to
    # None (even if the command failed, it's not an internal error).
    result['internal_failure'] = None
  except Exception as e:
    # An internal error occurred. Report accordingly so the swarming task will
    # be retried automatically.
    logging.exception('internal failure: %s', e)
    result['internal_failure'] = str(e)
    on_error.report(None)

  # Clean up
  finally:
    try:
      # Try to link files to the output directory, if specified.
      if out_dir:
        link_outputs_to_outdir(run_dir, out_dir, data.outputs)

      success = False
      if data.leak_temp_dir:
        success = True
        logging.warning(
            'Deliberately leaking %s for later examination', run_dir)
      else:
        # On Windows rmtree(run_dir) call below has a synchronization effect: it
        # finishes only when all task child processes terminate (since a running
        # process locks *.exe file). Examine out_dir only after that call
        # completes (since child processes may write to out_dir too and we need
        # to wait for them to finish).
        for directory in (run_dir, tmp_dir, isolated_client_dir):
          if not fs.isdir(directory):
            continue
          try:
            success = file_path.rmtree(directory)
          except OSError as e:
            logging.error('rmtree(%r) failed: %s', directory, e)
            success = False
          if not success:
            sys.stderr.write(
                OUTLIVING_ZOMBIE_MSG % (directory, data.grace_period))
            # A command that succeeded but left undeletable files behind is
            # reported as failed.
            if result['exit_code'] == 0:
              result['exit_code'] = 1

      # This deletes out_dir if leak_temp_dir is not set.
      if out_dir:
        isolated_stats = result['stats'].setdefault('isolated', {})
        result['outputs_ref'], success, isolated_stats['upload'] = (
            upload_then_delete(data.storage, out_dir, data.leak_temp_dir))
      if not success and result['exit_code'] == 0:
        result['exit_code'] = 1
    except Exception as e:
      # Swallow any exception in the main finally clause.
      if out_dir:
        logging.exception('Leaking out_dir %s: %s', out_dir, e)
      result['internal_failure'] = str(e)
  return result
Marc-Antoine Ruel2283ad12014-02-09 11:14:57 -0500916
917
def run_tha_test(data, result_json):
  """Runs an executable and records execution metadata.

  If isolated_hash is specified, downloads the dependencies in the cache,
  hardlinks them into a temporary directory and runs the command specified in
  the .isolated.

  A temporary directory is created to hold the output files. The content inside
  this directory will be uploaded back to |storage| packaged as a .isolated
  file.

  Arguments:
  - data: TaskData instance.
  - result_json: File path to dump result metadata into. If set, the process
        exit code is always 0 unless an internal error occurred.

  Returns:
    Process exit code that should be used.
  """
  if result_json:
    # Write a json output file right away in case we get killed.
    tools.write_json(
        result_json,
        {
            'exit_code': None,
            'had_hard_timeout': False,
            'internal_failure': 'Was terminated before completion',
            'outputs_ref': None,
            'version': 5,
        },
        dense=True)

  result = map_and_run(data, True)
  logging.info('Result:\n%s', tools.format_json(result, dense=True))

  # 1 if there was an internal error, 0 otherwise.
  internal_error = int(bool(result['internal_failure']))

  # run_isolated exit code. Depends on if result_json is used or not.
  if result_json:
    # We've found tests to delete 'work' when quitting, causing an exception
    # here. Try to recreate the directory if necessary.
    file_path.ensure_tree(os.path.dirname(result_json))
    tools.write_json(result_json, result, dense=True)
    # Only return 1 if there was an internal error.
    return internal_error

  # Marshall into old-style inline output.
  outputs_ref = result['outputs_ref']
  if outputs_ref:
    # pylint: disable=unsubscriptable-object
    inline_output = {
        'hash': outputs_ref['isolated'],
        'namespace': outputs_ref['namespace'],
        'storage': outputs_ref['isolatedserver'],
    }
    sys.stdout.flush()
    print(
        '[run_isolated_out_hack]%s[/run_isolated_out_hack]' %
        tools.format_json(inline_output, dense=True))
    sys.stdout.flush()
  return result['exit_code'] or internal_error
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +0000974
975
# Yielded by 'install_client_and_packages'.
#
# Fields:
# - client: cipd.CipdClient object.
# - cache_dir: absolute path to bot-global cipd tag and instance cache.
# - stats: dict with stats to return to the server.
# - pins: dict with installed cipd pins to return to the server.
CipdInfo = collections.namedtuple(
    'CipdInfo', ['client', 'cache_dir', 'stats', 'pins'])
983
984
@contextlib.contextmanager
def noop_install_packages(_run_dir, _isolated_dir):
  """Stand-in for 'install_client_and_packages' when cipd is disabled.

  Both arguments are ignored and the context yields None instead of a
  CipdInfo.
  """
  yield
989
990
Takuto Ikuta2efc7792019-11-27 14:33:34 +0000991def _install_packages(run_dir, cipd_cache_dir, client, packages):
iannuccib58d10d2017-03-18 02:00:25 -0700992 """Calls 'cipd ensure' for packages.
993
994 Args:
995 run_dir (str): root of installation.
996 cipd_cache_dir (str): the directory to use for the cipd package cache.
997 client (CipdClient): the cipd client to use
998 packages: packages to install, list [(path, package_name, version), ...].
iannuccib58d10d2017-03-18 02:00:25 -0700999
1000 Returns: list of pinned packages. Looks like [
1001 {
1002 'path': 'subdirectory',
1003 'package_name': 'resolved/package/name',
1004 'version': 'deadbeef...',
1005 },
1006 ...
1007 ]
1008 """
1009 package_pins = [None]*len(packages)
1010 def insert_pin(path, name, version, idx):
1011 package_pins[idx] = {
1012 'package_name': name,
1013 # swarming deals with 'root' as '.'
1014 'path': path or '.',
1015 'version': version,
1016 }
1017
1018 by_path = collections.defaultdict(list)
1019 for i, (path, name, version) in enumerate(packages):
1020 # cipd deals with 'root' as ''
1021 if path == '.':
1022 path = ''
1023 by_path[path].append((name, version, i))
1024
1025 pins = client.ensure(
Takuto Ikuta2efc7792019-11-27 14:33:34 +00001026 run_dir,
1027 {
1028 subdir: [(name, vers) for name, vers, _ in pkgs
1029 ] for subdir, pkgs in by_path.items()
1030 },
1031 cache_dir=cipd_cache_dir,
iannuccib58d10d2017-03-18 02:00:25 -07001032 )
1033
Marc-Antoine Ruel04903a32019-10-09 21:09:25 +00001034 for subdir, pin_list in sorted(pins.items()):
iannuccib58d10d2017-03-18 02:00:25 -07001035 this_subdir = by_path[subdir]
1036 for i, (name, version) in enumerate(pin_list):
1037 insert_pin(subdir, name, version, this_subdir[i][2])
1038
Robert Iannucci461b30d2017-12-13 11:34:03 -08001039 assert None not in package_pins, (packages, pins, package_pins)
iannuccib58d10d2017-03-18 02:00:25 -07001040
1041 return package_pins
1042
1043
@contextlib.contextmanager
def install_client_and_packages(run_dir, packages, service_url,
                                client_package_name, client_version, cache_dir,
                                isolated_dir):
  """Bootstraps CIPD client and installs CIPD packages.

  Yields a single CipdInfo object carrying the CipdClient, the cipd cache
  directory, timing stats and the pins.

  Pins and the CIPD client info are in the form of:
    [
      {
        "path": path, "package_name": package_name, "version": version,
      },
      ...
    ]
  (the CIPD client info is a single dictionary instead of a list)

  such that they correspond 1:1 to all input package arguments from the command
  line. These dictionaries make their way all the way back to swarming, where
  they become the arguments of CipdPackage.

  If 'packages' list is empty, will bootstrap CIPD client, but won't install
  any packages. The isolated client package is installed into |isolated_dir|
  in both cases.

  NOTE(review): the bootstrapped client is presumably exposed to the task via
  $PATH by the consumer of the yielded CipdInfo; nothing in this function
  touches $PATH - confirm against the caller.

  Args:
    run_dir (str): root of installation.
    packages: packages to install, list [(path, package_name, version), ...].
    service_url (str): CIPD server url, e.g.
      "https://chrome-infra-packages.appspot.com."
    client_package_name (str): CIPD package name of CIPD client.
    client_version (str): Version of CIPD client.
    cache_dir (str): where to keep cache of cipd clients, packages and tags.
    isolated_dir (str): where to download isolated client.
  """
  assert cache_dir

  start = time.time()

  cache_dir = os.path.abspath(cache_dir)
  # Tag and instance caches live in a subdirectory of the cipd cache.
  cipd_cache_dir = os.path.join(cache_dir, 'cache')
  run_dir = os.path.abspath(run_dir)
  packages = packages or []

  get_client_start = time.time()
  client_manager = cipd.get_client(
      service_url, client_package_name, client_version, cache_dir)

  with client_manager as client:
    get_client_duration = time.time() - get_client_start

    if packages:
      package_pins = _install_packages(
          run_dir, cipd_cache_dir, client, packages)
    else:
      package_pins = []

    # Install isolated client to |isolated_dir|.
    isolated_package = ('', ISOLATED_PACKAGE, ISOLATED_REVISION)
    _install_packages(isolated_dir, cipd_cache_dir, client, [isolated_package])

    file_path.make_tree_files_read_only(run_dir)

    total_duration = time.time() - start
    logging.info(
        'Installing CIPD client and packages took %d seconds', total_duration)

    stats = {
        'duration': total_duration,
        'get_client_duration': get_client_duration,
    }
    pins = {
        'client_package': {
            'package_name': client.package_name,
            'version': client.instance_id,
        },
        'packages': package_pins,
    }
    yield CipdInfo(
        client=client, cache_dir=cipd_cache_dir, stats=stats, pins=pins)
nodirbe642ff2016-06-09 15:51:51 -07001126
1127
def create_option_parser():
  """Creates the command line option parser of run_isolated.

  Besides the options declared here, the isolate server, cache, CIPD and
  authentication options are registered by the isolateserver, cipd and auth
  modules.

  Returns:
    A logging_utils.OptionParserWithLogging instance, with 'cache' and
    'cipd_cache' defaulting to directories of the same name.
  """
  parser = logging_utils.OptionParserWithLogging(
      usage='%prog <options> [command to run or extra args]',
      version=__version__,
      log_file=RUN_ISOLATED_LOG_FILE)
  parser.add_option(
      '--clean', action='store_true',
      help='Cleans the cache, trimming it necessary and remove corrupted items '
           'and returns without executing anything; use with -v to know what '
           'was done')
  parser.add_option(
      '--use-go-isolated',
      action='store_true',
      help='Use go isolated instead of python implementation')
  parser.add_option(
      '--json',
      help='dump output metadata to json file. When used, run_isolated returns '
           'non-zero only on internal failure')
  parser.add_option(
      '--hard-timeout', type='float', help='Enforce hard timeout in execution')
  parser.add_option(
      '--grace-period', type='float',
      help='Grace period between SIGTERM and SIGKILL')
  parser.add_option(
      '--raw-cmd', action='store_true',
      help='Ignore the isolated command, use the one supplied at the command '
           'line')
  parser.add_option(
      '--relative-cwd',
      help='Ignore the isolated \'relative_cwd\' and use this one instead; '
           'requires --raw-cmd')
  parser.add_option(
      '--env', default=[], action='append',
      help='Environment variables to set for the child process')
  parser.add_option(
      '--env-prefix', default=[], action='append',
      help='Specify a VAR=./path/fragment to put in the environment variable '
           'before executing the command. The path fragment must be relative '
           'to the isolated run directory, and must not contain a `..` token. '
           'The path will be made absolute and prepended to the indicated '
           '$VAR using the OS\'s path separator. Multiple items for the same '
           '$VAR will be prepended in order.')
  parser.add_option(
      '--bot-file',
      help='Path to a file describing the state of the host. The content is '
           'defined by on_before_task() in bot_config.')
  parser.add_option(
      '--switch-to-account',
      help='If given, switches LUCI_CONTEXT to given logical service account '
           '(e.g. "task" or "system") before launching the isolated process.')
  parser.add_option(
      '--output', action='append',
      help='Specifies an output to return. If no outputs are specified, all '
           'files located in $(ISOLATED_OUTDIR) will be returned; '
           'otherwise, outputs in both $(ISOLATED_OUTDIR) and those '
           'specified by --output option (there can be multiple) will be '
           'returned. Note that if a file in OUT_DIR has the same path '
           'as an --output option, the --output version will be returned.')
  parser.add_option(
      '-a', '--argsfile',
      # This is actually handled in parse_args; it's included here purely so it
      # can make it into the help text.
      help='Specify a file containing a JSON array of arguments to this '
           'script. If --argsfile is provided, no other argument may be '
           'provided on the command line.')

  group = optparse.OptionGroup(parser, 'Data source')
  group.add_option(
      '-s', '--isolated',
      help='Hash of the .isolated to grab from the isolate server.')
  isolateserver.add_isolate_server_options(group)
  parser.add_option_group(group)

  isolateserver.add_cache_options(parser)

  cipd.add_cipd_options(parser)

  group = optparse.OptionGroup(parser, 'Named caches')
  group.add_option(
      '--named-cache',
      dest='named_caches',
      action='append',
      nargs=3,
      default=[],
      help='A named cache to request. Accepts 3 arguments: name, path, hint. '
           'name identifies the cache, must match regex [a-z0-9_]{1,4096}. '
           'path is a path relative to the run dir where the cache directory '
           'must be put to. '
           'This option can be specified more than once.')
  group.add_option(
      '--named-cache-root', default='named_caches',
      help='Cache root directory. Default=%default')
  parser.add_option_group(group)

  # These options are registered on the group, not on the parser, so that they
  # are listed under 'Process containment' in --help. Parsing is unaffected:
  # grouped options are parsed exactly like top-level ones.
  group = optparse.OptionGroup(parser, 'Process containment')
  group.add_option(
      '--lower-priority', action='store_true',
      help='Lowers the child process priority')
  group.add_option(
      '--containment-type', choices=('NONE', 'AUTO', 'JOB_OBJECT'),
      default='NONE',
      help='Type of container to use')
  group.add_option(
      '--limit-processes', type='int', default=0,
      help='Maximum number of active processes in the containment')
  group.add_option(
      '--limit-total-committed-memory', type='int', default=0,
      help='Maximum sum of committed memory in the containment')
  parser.add_option_group(group)

  group = optparse.OptionGroup(parser, 'Debugging')
  group.add_option(
      '--leak-temp-dir',
      action='store_true',
      help='Deliberately leak isolate\'s temp dir for later examination. '
           'Default: %default')
  group.add_option(
      '--root-dir', help='Use a directory instead of a random one')
  parser.add_option_group(group)

  auth.add_auth_options(parser)

  parser.set_defaults(cache='cache', cipd_cache='cipd_cache')
  return parser
1252
1253
def process_named_cache_options(parser, options, time_fn=None):
  """Validates named cache options and builds the named cache manager.

  Arguments:
    parser: option parser; its error() method is called on invalid input.
    options: parsed options. Reads named_caches (iterable of
        (name, path, hint) triples), named_cache_root and min_free_space.
    time_fn: forwarded as-is to local_caching.NamedCache.

  Returns:
    A local_caching.NamedCache rooted at the absolute --named-cache-root, or
    None when --named-cache-root is empty.
  """
  if options.named_caches and not options.named_cache_root:
    parser.error('--named-cache is specified, but --named-cache-root is empty')
  for name, path, hint in options.named_caches:
    if not CACHE_NAME_RE.match(name):
      parser.error(
          'cache name %r does not match %r' % (name, CACHE_NAME_RE.pattern))
    if not path:
      parser.error('cache path cannot be empty')
    try:
      # int() works on both python 2 (auto-promotes to long) and python 3,
      # where the long builtin no longer exists.
      int(hint)
    except (TypeError, ValueError):
      parser.error('cache hint must be a number')
  if not options.named_cache_root:
    return None
  # Make these configurable later if there is use case but for now it's fairly
  # safe values.
  # In practice, a fair chunk of bots are already recycled on a daily schedule
  # so this code doesn't have any effect to them, unless they are preloaded
  # with a really old cache.
  policies = local_caching.CachePolicies(
      # 1TiB.
      max_cache_size=1024*1024*1024*1024,
      min_free_space=options.min_free_space,
      max_items=50,
      max_age_secs=MAX_AGE_SECS)
  root_dir = six.text_type(os.path.abspath(options.named_cache_root))
  return local_caching.NamedCache(root_dir, policies, time_fn=time_fn)
1283
1284
def parse_args(args):
  """Parses the command line, optionally loading it from a JSON args file.

  Arguments:
    args: list of command line arguments, without the program name.

  Returns:
    Tuple (parser, options, args) where parser is the full option parser and
    options/args are the result of parsing with it.
  """
  # Create a fake mini-parser just to get out the "-a" command. Note that
  # it's not documented here; instead, it's documented in create_option_parser
  # even though that parser will never actually get to parse it. This is
  # because --argsfile is exclusive with all other options and arguments.
  file_argparse = argparse.ArgumentParser(add_help=False)
  file_argparse.add_argument('-a', '--argsfile')
  (file_args, nonfile_args) = file_argparse.parse_known_args(args)
  if file_args.argsfile:
    if nonfile_args:
      # error() prints the message and exits the process.
      file_argparse.error('Can\'t specify --argsfile with '
                          'any other arguments (%s)' % nonfile_args)
    try:
      with open(file_args.argsfile, 'r') as f:
        args = json.load(f)
    except (IOError, OSError, ValueError) as e:
      # We don't need to error out here - "args" was not replaced, so the
      # regular parser below still runs on the original arguments and reports
      # whatever is missing.
      print('Couldn\'t read arguments: %s' % e, file=sys.stderr)

  # Even if we failed to read the args, just call the normal parser now since it
  # will print the correct help message.
  parser = create_option_parser()
  options, args = parser.parse_args(args)
  return (parser, options, args)
1311
1312
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001313def _calc_named_cache_hint(named_cache, named_caches):
1314 """Returns the expected size of the missing named caches."""
1315 present = named_cache.available
1316 size = 0
1317 for name, _, hint in named_caches:
1318 if name not in present:
1319 hint = long(hint)
1320 if hint > 0:
1321 size += hint
1322 return size
1323
1324
def main(args):
  """Runs run_isolated with the given command line arguments.

  Parses and validates the options, sets up the isolated and named caches,
  then either cleans the caches (--clean) or runs the requested task.

  Arguments:
    args: list of command line arguments, without the program name.

  Returns:
    Process exit code: 0 after a successful --clean, 1 when a CIPD, named
    cache or out-of-space error is raised while running, otherwise the value
    returned by run_tha_test(). Invalid options terminate through
    parser.error().
  """
  # Warning: when --argsfile is used, the strings are unicode instances, when
  # parsed normally, the strings are str instances.
  (parser, options, args) = parse_args(args)

  if not file_path.enable_symlink():
    logging.warning('Symlink support is not enabled')

  named_cache = process_named_cache_options(parser, options)
  # hint is 0 if there's no named cache.
  hint = _calc_named_cache_hint(named_cache, options.named_caches)
  if hint:
    # Increase the --min-free-space value by the hint, and recreate the
    # NamedCache instance so it gets the updated CachePolicy.
    options.min_free_space += hint
    named_cache = process_named_cache_options(parser, options)

  # TODO(maruel): CIPD caches should be defined at an higher level here too, so
  # they can be cleaned the same way.
  isolate_cache = isolateserver.process_cache_options(options, trim=False)
  caches = []
  if isolate_cache:
    caches.append(isolate_cache)
  if named_cache:
    caches.append(named_cache)
  root = caches[0].cache_dir if caches else six.text_type(os.getcwd())
  if options.clean:
    if options.isolated:
      parser.error('Can\'t use --isolated with --clean.')
    if options.isolate_server:
      parser.error('Can\'t use --isolate-server with --clean.')
    if options.json:
      parser.error('Can\'t use --json with --clean.')
    if options.named_caches:
      parser.error('Can\'t use --named-cache with --clean.')
    # Trim first, then clean.
    local_caching.trim_caches(
        caches,
        root,
        min_free_space=options.min_free_space,
        max_age_secs=MAX_AGE_SECS)
    for c in caches:
      c.cleanup()
    return 0

  # Trim must still be done for the following case:
  # - named-cache was used
  # - some entries, with a large hint, were missing
  # - --min-free-space was increased accordingly, thus trimming is needed
  # Otherwise, this will have no effect, as bot_main calls run_isolated with
  # --clean after each task.
  if hint:
    logging.info('Additional trimming of %d bytes', hint)
    local_caching.trim_caches(
        caches,
        root,
        min_free_space=options.min_free_space,
        max_age_secs=MAX_AGE_SECS)

  if not options.isolated and not args:
    parser.error('--isolated or command to run is required.')

  auth.process_auth_options(parser, options)

  isolateserver.process_isolate_server_options(
      parser, options, True, False)
  if not options.isolate_server:
    if options.isolated:
      parser.error('--isolated requires --isolate-server')
    if ISOLATED_OUTDIR_PARAMETER in args:
      parser.error(
          '%s in args requires --isolate-server' % ISOLATED_OUTDIR_PARAMETER)

  if options.root_dir:
    options.root_dir = six.text_type(os.path.abspath(options.root_dir))
  if options.json:
    options.json = six.text_type(os.path.abspath(options.json))

  if any('=' not in i for i in options.env):
    parser.error(
        '--env required key=value form. value can be skipped to delete '
        'the variable')
  # Convert the list of 'key=value' strings into a dict.
  options.env = dict(i.split('=', 1) for i in options.env)

  # Convert the list of 'VAR=./path' strings into a dict of VAR -> [paths].
  prefixes = {}
  cwd = os.path.realpath(os.getcwd())
  for item in options.env_prefix:
    if '=' not in item:
      parser.error(
          '--env-prefix %r is malformed, must be in the form `VAR=./path`'
          % item)
    key, opath = item.split('=', 1)
    if os.path.isabs(opath):
      parser.error('--env-prefix %r path is bad, must be relative.' % opath)
    opath = os.path.normpath(opath)
    # NOTE(review): this is a plain string prefix comparison, so a sibling
    # directory whose name merely starts with the cwd name also passes.
    if not os.path.realpath(os.path.join(cwd, opath)).startswith(cwd):
      parser.error(
          '--env-prefix %r path is bad, must be relative and not contain `..`.'
          % opath)
    prefixes.setdefault(key, []).append(opath)
  options.env_prefix = prefixes

  cipd.validate_cipd_options(parser, options)
  if options.use_go_isolated and not options.cipd_enabled:
    parser.error('--cipd-enabled should be set if --use-go-isolated is set.')

  install_packages_fn = noop_install_packages
  if options.cipd_enabled:
    install_packages_fn = (
        lambda run_dir, isolated_dir: install_client_and_packages(
            run_dir, cipd.parse_package_args(options.cipd_packages),
            options.cipd_server, options.cipd_client_package,
            options.cipd_client_version, cache_dir=options.cipd_cache,
            isolated_dir=isolated_dir))

  @contextlib.contextmanager
  def install_named_caches(run_dir):
    # WARNING: this function depends on "options" variable defined in the outer
    # function.
    # NOTE(review): this assert only checks that run_dir converts to a
    # non-empty text string; presumably a type check was intended - confirm.
    assert six.text_type(run_dir), repr(run_dir)
    assert os.path.isabs(run_dir), run_dir
    named_caches = [(os.path.join(run_dir, six.text_type(relpath)), name)
                    for name, relpath, _ in options.named_caches]
    for path, name in named_caches:
      named_cache.install(path, name)
    try:
      yield
    finally:
      # Uninstall each named cache, returning it to the cache pool. If an
      # uninstall fails for a given cache, it will remain in the task's
      # temporary space, get cleaned up by the Swarming bot, and be lost.
      #
      # If the Swarming bot cannot clean up the cache, it will handle it like
      # any other bot file that could not be removed.
      for path, name in reversed(named_caches):
        try:
          # uninstall() doesn't trim but does call save() implicitly. Trimming
          # *must* be done manually via periodic 'run_isolated.py --clean'.
          named_cache.uninstall(path, name)
        except local_caching.NamedCacheError:
          # Argument order matches the message: cache name first, then path.
          logging.exception('Error while removing named cache %r at %r. '
                            'The cache will be lost.', name, path)

  extra_args = []
  command = []
  if options.raw_cmd:
    command = args
    if options.relative_cwd:
      a = os.path.normpath(os.path.abspath(options.relative_cwd))
      # NOTE(review): plain string prefix comparison, see --env-prefix above.
      if not a.startswith(os.getcwd()):
        parser.error(
            '--relative-cwd must not try to escape the working directory')
  else:
    if options.relative_cwd:
      parser.error('--relative-cwd requires --raw-cmd')
    extra_args = args

  containment_type = subprocess42.Containment.NONE
  if options.containment_type == 'AUTO':
    containment_type = subprocess42.Containment.AUTO
  if options.containment_type == 'JOB_OBJECT':
    containment_type = subprocess42.Containment.JOB_OBJECT
  containment = subprocess42.Containment(
      containment_type=containment_type,
      limit_processes=options.limit_processes,
      limit_total_committed_memory=options.limit_total_committed_memory)

  data = TaskData(
      command=command,
      relative_cwd=options.relative_cwd,
      extra_args=extra_args,
      isolated_hash=options.isolated,
      storage=None,
      isolate_cache=isolate_cache,
      outputs=options.output,
      install_named_caches=install_named_caches,
      leak_temp_dir=options.leak_temp_dir,
      root_dir=_to_unicode(options.root_dir),
      hard_timeout=options.hard_timeout,
      grace_period=options.grace_period,
      bot_file=options.bot_file,
      switch_to_account=options.switch_to_account,
      install_packages_fn=install_packages_fn,
      use_go_isolated=bool(options.use_go_isolated),
      go_cache_dir=options.cache,
      env=options.env,
      env_prefix=options.env_prefix,
      lower_priority=bool(options.lower_priority),
      containment=containment)
  try:
    if options.isolate_server:
      server_ref = isolate_storage.ServerRef(
          options.isolate_server, options.namespace)
      storage = isolateserver.get_storage(server_ref)
      with storage:
        data = data._replace(storage=storage)
        # Hashing schemes used by |storage| and |isolate_cache| MUST match.
        assert storage.server_ref.hash_algo == server_ref.hash_algo
        return run_tha_test(data, options.json)
    return run_tha_test(data, options.json)
  except (
      cipd.Error,
      local_caching.NamedCacheError,
      local_caching.NoMoreSpace) as ex:
    # Exceptions have no .message attribute on python 3; fall back to str().
    print(getattr(ex, 'message', None) or str(ex), file=sys.stderr)
    return 1
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001531
1532
if __name__ == '__main__':
  # Script entry point: prepare the process environment, then hand the
  # command line (minus the program name) to main() and exit with its result.
  subprocess42.inhibit_os_error_reporting()
  # Ensure that we are always running with the correct encoding.
  fix_encoding.fix_encoding()
  exit_code = main(sys.argv[1:])
  sys.exit(exit_code)
Marc-Antoine Ruel90c98162013-12-18 15:11:57 -05001537 sys.exit(main(sys.argv[1:]))