blob: 83d684c0692f0514e569558528c60af4da012c38 [file] [log] [blame]
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001#!/usr/bin/env python
maruelea586f32016-04-05 11:11:33 -07002# Copyright 2012 The LUCI Authors. All rights reserved.
maruelf1f5e2a2016-05-25 17:10:39 -07003# Use of this source code is governed under the Apache License, Version 2.0
4# that can be found in the LICENSE file.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00005
nodir55be77b2016-05-03 09:39:57 -07006"""Runs a command with optional isolated input/output.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00007
Marc-Antoine Rueleed2f3a2019-03-14 00:00:40 +00008run_isolated takes care of setting up a temporary environment, running a
9command, and tearing it down.
nodir55be77b2016-05-03 09:39:57 -070010
Marc-Antoine Rueleed2f3a2019-03-14 00:00:40 +000011It handles downloading and uploading isolated files, mapping CIPD packages and
12reusing stateful named caches.
13
14The isolated files, CIPD packages and named caches are kept as a global LRU
15cache.
Marc-Antoine Ruel2283ad12014-02-09 11:14:57 -050016
Roberto Carrillo71ade6d2018-10-08 22:30:24 +000017Any ${EXECUTABLE_SUFFIX} on the command line or the environment variables passed
18with the --env option will be replaced with ".exe" string on Windows and "" on
19other platforms.
nodirbe642ff2016-06-09 15:51:51 -070020
Roberto Carrillo71ade6d2018-10-08 22:30:24 +000021Any ${ISOLATED_OUTDIR} on the command line or the environment variables passed
22with the --env option will be replaced by the location of a temporary directory
23upon execution of the command specified in the .isolated file. All content
24written to this directory will be uploaded upon termination and the .isolated
25file describing this directory will be printed to stdout.
bpastene447c1992016-06-20 15:21:47 -070026
Marc-Antoine Rueleed2f3a2019-03-14 00:00:40 +000027Any ${SWARMING_BOT_FILE} on the command line or the environment variables passed
28with the --env option will be replaced by the value of the --bot-file parameter.
29This file is used by a swarming bot to communicate state of the host to tasks.
30It is written to by the swarming bot's on_before_task() hook in the swarming
31server's custom bot_config.py.
32
33See
34https://chromium.googlesource.com/infra/luci/luci-py.git/+/master/appengine/swarming/doc/Magic-Values.md
35for all the variables.
36
37See
38https://chromium.googlesource.com/infra/luci/luci-py.git/+/master/appengine/swarming/swarming_bot/config/bot_config.py
39for more information about bot_config.py.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000040"""
41
Marc-Antoine Ruelf899c482019-10-10 23:32:06 +000042from __future__ import print_function
43
44__version__ = '1.0.1'
maruel@chromium.orgdedbf492013-09-12 20:42:11 +000045
aludwin7556e0c2016-10-26 08:46:10 -070046import argparse
maruel064c0a32016-04-05 11:47:15 -070047import base64
iannucci96fcccc2016-08-30 15:52:22 -070048import collections
vadimsh232f5a82017-01-20 19:23:44 -080049import contextlib
Sadaf Matinkhoo10743a62018-03-29 16:28:58 -040050import errno
aludwin7556e0c2016-10-26 08:46:10 -070051import json
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000052import logging
53import optparse
54import os
Marc-Antoine Ruel8b11dbd2018-05-18 14:31:22 -040055import re
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000056import sys
57import tempfile
maruel064c0a32016-04-05 11:47:15 -070058import time
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000059
Marc-Antoine Ruel016c7602019-04-02 18:31:13 +000060from utils import tools
61tools.force_local_third_party()
vadimsh@chromium.orga4326472013-08-24 02:05:41 +000062
Marc-Antoine Ruel016c7602019-04-02 18:31:13 +000063# third_party/
64from depot_tools import fix_encoding
Takuto Ikuta6e2ff962019-10-29 12:35:27 +000065import six
Marc-Antoine Ruel016c7602019-04-02 18:31:13 +000066
67# pylint: disable=ungrouped-imports
68import auth
69import cipd
70import isolate_storage
71import isolateserver
72import local_caching
73from libs import luci_context
Vadim Shtayura6b555c12014-07-23 16:22:18 -070074from utils import file_path
maruel12e30012015-10-09 11:55:35 -070075from utils import fs
maruel064c0a32016-04-05 11:47:15 -070076from utils import large
Marc-Antoine Ruelf74cffe2015-07-15 15:21:34 -040077from utils import logging_utils
Marc-Antoine Ruelcfb60852014-07-02 15:22:00 -040078from utils import on_error
Marc-Antoine Ruelc44f5722015-01-08 16:10:01 -050079from utils import subprocess42
maruel@chromium.orgdedbf492013-09-12 20:42:11 +000080
vadimsh@chromium.orga4326472013-08-24 02:05:41 +000081
maruele2f2cb82016-07-13 14:41:03 -070082# Magic variables that can be found in the isolate task command line.
83ISOLATED_OUTDIR_PARAMETER = '${ISOLATED_OUTDIR}'
84EXECUTABLE_SUFFIX_PARAMETER = '${EXECUTABLE_SUFFIX}'
85SWARMING_BOT_FILE_PARAMETER = '${SWARMING_BOT_FILE}'
86
87
csharp@chromium.orgff2a4662012-11-21 20:49:32 +000088# The name of the log file to use.
89RUN_ISOLATED_LOG_FILE = 'run_isolated.log'
90
maruele2f2cb82016-07-13 14:41:03 -070091
csharp@chromium.orge217f302012-11-22 16:51:53 +000092# The name of the log to use for the run_test_cases.py command
vadimsh@chromium.org8b9d56b2013-08-21 22:24:35 +000093RUN_TEST_CASES_LOG = 'run_test_cases.log'
csharp@chromium.orge217f302012-11-22 16:51:53 +000094
vadimsh@chromium.org87d63262013-04-04 19:34:21 +000095
maruele2f2cb82016-07-13 14:41:03 -070096# Use short names for temporary directories. This is driven by Windows, which
97# imposes a relatively short maximum path length of 260 characters, often
98# referred to as MAX_PATH. It is relatively easy to create files with longer
Marc-Antoine Ruel793bff32019-04-18 17:50:48 +000099# path length. A use case is with recursive dependency trees like npm packages.
maruele2f2cb82016-07-13 14:41:03 -0700100#
101# It is recommended to start the script with a `root_dir` as short as
102# possible.
103# - ir stands for isolated_run
104# - io stands for isolated_out
105# - it stands for isolated_tmp
Takuto Ikutab7ce0e32019-11-27 23:26:18 +0000106# - ic stands for isolated_client
maruele2f2cb82016-07-13 14:41:03 -0700107ISOLATED_RUN_DIR = u'ir'
108ISOLATED_OUT_DIR = u'io'
109ISOLATED_TMP_DIR = u'it'
Takuto Ikutab7ce0e32019-11-27 23:26:18 +0000110ISOLATED_CLIENT_DIR = u'ic'
maruele2f2cb82016-07-13 14:41:03 -0700111
Takuto Ikuta02edca22019-11-29 10:04:51 +0000112# TODO(tikuta): take these parameters from luci-config?
Takuto Ikutab7ce0e32019-11-27 23:26:18 +0000113# Take revision from
114# https://ci.chromium.org/p/infra-internal/g/infra-packagers/console
Takuto Ikuta02edca22019-11-29 10:04:51 +0000115ISOLATED_PACKAGE = 'infra/tools/luci/isolated/${platform}'
Takuto Ikuta84ef3682019-11-29 06:10:01 +0000116ISOLATED_REVISION = 'git_revision:2ee27ca739de90c29d46eb3af3371a42fec3ebff'
maruele2f2cb82016-07-13 14:41:03 -0700117
Marc-Antoine Ruel8b11dbd2018-05-18 14:31:22 -0400118# Keep synced with task_request.py
Lei Leife202df2019-06-11 17:33:34 +0000119CACHE_NAME_RE = re.compile(r'^[a-z0-9_]{1,4096}$')
Marc-Antoine Ruel8b11dbd2018-05-18 14:31:22 -0400120
121
marueld928c862017-06-08 08:20:04 -0700122OUTLIVING_ZOMBIE_MSG = """\
123*** Swarming tried multiple times to delete the %s directory and failed ***
124*** Hard failing the task ***
125
126Swarming detected that your testing script ran an executable, which may have
127started a child executable, and the main script returned early, leaving the
128children executables playing around unguided.
129
130You don't want to leave children processes outliving the task on the Swarming
131bot, do you? The Swarming bot doesn't.
132
133How to fix?
134- For any process that starts children processes, make sure all children
135 processes terminated properly before each parent process exits. This is
136 especially important in very deep process trees.
137 - This must be done properly both in normal successful task and in case of
138 task failure. Cleanup is very important.
139- The Swarming bot sends a SIGTERM in case of timeout.
140 - You have %s seconds to comply after the signal was sent to the process
141 before the process is forcibly killed.
142- To achieve not leaking children processes in case of signals on timeout, you
143 MUST handle signals in each executable / python script and propagate them to
144 children processes.
145 - When your test script (python or binary) receives a signal like SIGTERM or
146 CTRL_BREAK_EVENT on Windows), send it to all children processes and wait for
147 them to terminate before quitting.
148
149See
Marc-Antoine Ruelc7243592018-05-24 17:04:04 -0400150https://chromium.googlesource.com/infra/luci/luci-py.git/+/master/appengine/swarming/doc/Bot.md#Graceful-termination_aka-the-SIGTERM-and-SIGKILL-dance
marueld928c862017-06-08 08:20:04 -0700151for more information.
152
153*** May the SIGKILL force be with you ***
154"""
155
156
Marc-Antoine Ruel5d7606b2018-06-15 19:06:12 +0000157# Currently hardcoded. Eventually could be exposed as a flag once there's value.
158# 3 weeks
159MAX_AGE_SECS = 21*24*60*60
160
161
# Immutable record describing everything needed to map and run one task.
TaskData = collections.namedtuple(
    'TaskData',
    (
        # Command line to run, as a list of strings. Takes precedence over
        # whatever command the isolated file specifies.
        'command',
        # Directory, relative to the run directory, to start the command in.
        'relative_cwd',
        # Extra arguments (list of strings) appended to the command that the
        # isolated file specifies.
        'extra_args',
        # Hash of the .isolated file to fetch in order to recreate the tree
        # of files needed by the target executable. The command found in the
        # .isolated is what gets executed. Mutually exclusive with |command|.
        'isolated_hash',
        # isolateserver.Storage instance used to retrieve remote objects. It
        # references an isolateserver.StorageApi, which performs the actual
        # I/O.
        'storage',
        # isolateserver.LocalCache instance that caches retrieved objects so
        # they are not fetched over and over. May be on-disk or in-memory.
        'isolate_cache',
        # Paths, relative to root_dir, to include in the output isolated
        # bundle once the task completes (see link_outputs_to_outdir).
        'outputs',
        # Function (run_dir) => context manager installing named caches into
        # |run_dir|.
        'install_named_caches',
        # When True, the temporary directory is intentionally left behind so
        # it can be examined later.
        'leak_temp_dir',
        # Directory in which the temporary directory is created. A random
        # temporary directory is created when not specified.
        'root_dir',
        # The process is killed if it runs longer than this many seconds.
        'hard_timeout',
        # Seconds to wait between SIGTERM and SIGKILL.
        'grace_period',
        # Path to a file holding bot state; substituted for the
        # ${SWARMING_BOT_FILE} task command line argument.
        'bot_file',
        # Logical account LUCI_CONTEXT is switched into.
        'switch_to_account',
        # Context manager dir => CipdInfo, see install_client_and_packages.
        'install_packages_fn',
        # Build the tree with symlinks rather than hardlinks.
        'use_symlinks',
        # Use the go isolated client.
        'use_go_isolated',
        # Environment variables to set.
        'env',
        # Environment variables to mutate with relative directories.
        # Example: {"ENV_KEY": ['relative', 'paths', 'to', 'prepend']}
        'env_prefix',
        # Lowers the priority of the task process.
        'lower_priority',
        # subprocess42.Containment instance; may be None.
        'containment',
    ))
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -0500222
223
Marc-Antoine Ruelee6ca622017-11-29 11:19:16 -0500224def _to_str(s):
225 """Downgrades a unicode instance to str. Pass str through as-is."""
226 if isinstance(s, str):
227 return s
228 # This is technically incorrect, especially on Windows. In theory
229 # sys.getfilesystemencoding() should be used to use the right 'ANSI code
230 # page' on Windows, but that causes other problems, as the character set
231 # is very limited.
232 return s.encode('utf-8')
233
234
def _to_unicode(s):
  """Returns |s| as unicode text, decoding it as UTF-8 when needed.

  None and values that are already unicode are handed back untouched.
  """
  if s is None or isinstance(s, six.text_type):
    return s
  return s.decode('utf-8')
240
241
def make_temp_dir(prefix, root_dir):
  """Creates a brand new temporary directory and returns its unicode path.

  Args:
    prefix: prefix for the name of the new directory.
    root_dir: directory in which the new directory is created.
  """
  created = tempfile.mkdtemp(dir=root_dir, prefix=prefix)
  return six.text_type(created)
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +0000245
246
def change_tree_read_only(rootdir, read_only):
  """Applies the read-only policy |read_only| to the tree under |rootdir|.

  Args:
    rootdir: root of the tree to update.
    read_only: 0 or None to make everything writeable, 1 to make files
        read only, 2 to make both files and directories read only.

  Raises:
    ValueError if |read_only| is not one of the known flags.
  """
  if read_only == 2:
    # Both files and directories (except on Windows) become read only, which
    # prevents modifying, creating or deleting files in the test directory.
    # On Windows creating and deleting files remains possible.
    file_path.make_tree_read_only(rootdir)
    return

  if read_only == 1:
    # Only files become read only; directories stay as they are. Files cannot
    # be modified but can still be created or deleted.
    file_path.make_tree_files_read_only(rootdir)
    return

  if read_only in (0, None):
    # Everything can be modified.
    # TODO(maruel): This is currently dangerous as long as
    # DiskContentAddressedCache.touch() is not yet changed to verify the hash
    # of the content of the files it is looking at, so that if a test modifies
    # an input file, the file must be deleted.
    file_path.make_tree_writeable(rootdir)
    return

  raise ValueError(
      'change_tree_read_only(%s, %s): Unknown flag %s' %
      (rootdir, read_only, read_only))
273
274
@contextlib.contextmanager
def set_luci_context_account(account, tmp_dir):
  """Context manager making |account| the default LUCI_CONTEXT account.

  Nothing is changed in any of these cases:
  - |account| is None or ''. This is the case when run_isolated.py is called
    without the '--switch-to-account' flag; if it runs inside some
    LUCI_CONTEXT environment, the task simply inherits the account already
    set. This may happen if users invoke run_isolated.py explicitly from
    their code.
  - LUCI_CONTEXT-based auth is not in use.
  - |account| is already the default account.

  When the requested account is not defined in the context, the task is
  switched to non-authenticated access. This happens for Swarming tasks that
  don't use 'task' service accounts.

  Args:
    account: logical account ID to switch to; may be None or ''.
    tmp_dir: directory handed to luci_context.write() as |_tmpdir|.
  """
  # LUCI_CONTEXT is only consulted when a switch was actually requested.
  local_auth = luci_context.read('local_auth') if account else None

  # See LUCI_CONTEXT.md for the format of 'local_auth'.
  if not local_auth or local_auth.get('default_account_id') == account:
    # Not switching, not using LUCI_CONTEXT auth, or already set.
    yield
    return

  known_ids = set(
      entry['id'] for entry in (local_auth.get('accounts') or []))
  if account not in known_ids:
    logging.warning(
        'Requested LUCI_CONTEXT account %r is not available (have only %r), '
        'disabling authentication', account, sorted(known_ids))
    local_auth.pop('default_account_id', None)
  else:
    logging.info('Switching default LUCI_CONTEXT account to %r', account)
    local_auth['default_account_id'] = account

  with luci_context.write(_tmpdir=tmp_dir, local_auth=local_auth):
    yield
321
322
def process_command(command, out_dir, bot_file):
  """Expands the parameter tokens found in each argument of |command|.

  Args:
    command: list of strings; the command line.
    out_dir: value substituted by replace_parameters() for the output
        directory token.
    bot_file: value substituted by replace_parameters() for the bot file
        token.

  Returns:
    A new list with every argument processed by replace_parameters().

  Raises:
    ValueError if a parameter is requested in |command| but its value is not
    provided.
  """
  expanded = []
  for token in command:
    expanded.append(replace_parameters(token, out_dir, bot_file))
  return expanded
331
332
def replace_parameters(arg, out_dir, bot_file):
  """Substitutes the magic parameter tokens present in the string |arg|.

  Args:
    arg: string that may contain parameter tokens.
    out_dir: replacement for ISOLATED_OUTDIR_PARAMETER.
    bot_file: replacement for SWARMING_BOT_FILE_PARAMETER. When falsy, the
        token is left in place and a warning is logged.

  Returns:
    |arg| with the tokens substituted.

  Raises:
    ValueError if ISOLATED_OUTDIR_PARAMETER is requested in |arg| but
    |out_dir| is not provided.
  """
  arg = arg.replace(EXECUTABLE_SUFFIX_PARAMETER, cipd.EXECUTABLE_SUFFIX)
  path_substituted = False

  if ISOLATED_OUTDIR_PARAMETER in arg:
    if not out_dir:
      raise ValueError(
          'output directory is requested in command or env var, but not '
          'provided; please specify one')
    arg = arg.replace(ISOLATED_OUTDIR_PARAMETER, out_dir)
    path_substituted = True

  if SWARMING_BOT_FILE_PARAMETER in arg:
    if not bot_file:
      logging.warning('SWARMING_BOT_FILE_PARAMETER found in command or env '
                      'var, but no bot_file specified. Leaving parameter '
                      'unchanged.')
    else:
      arg = arg.replace(SWARMING_BOT_FILE_PARAMETER, bot_file)
      path_substituted = True

  # Slashes are converted only when a path parameter was substituted, to
  # support arguments like '${ISOLATED_OUTDIR}/foo/bar'.
  return arg.replace('/', os.sep) if path_substituted else arg
maruela9cfd6f2015-09-15 11:03:15 -0700362
363
Roberto Carrillo71ade6d2018-10-08 22:30:24 +0000364
def get_command_env(tmp_dir, cipd_info, run_dir, env, env_prefixes, out_dir,
                    bot_file):
  """Returns full OS environment to run a command in.

  Sets up TEMP, puts directory with cipd binary in front of PATH, exposes
  CIPD_CACHE_DIR env var, and installs all env_prefixes.

  Args:
    tmp_dir: temp directory.
    cipd_info: CipdInfo object if cipd client is used, None if not.
    run_dir: The root directory the isolated tree is mapped in.
    env: environment variables to use. A variable with an empty value is
        removed from the resulting environment.
    env_prefixes: {"ENV_KEY": ['cwd', 'relative', 'paths', 'to', 'prepend']}
    out_dir: Isolated output directory. Required to be != None if any of the
        env vars contain ISOLATED_OUTDIR_PARAMETER.
    bot_file: Required to be != None if any of the env vars contain
        SWARMING_BOT_FILE_PARAMETER.

  Returns:
    dict mapping environment variable names to values, based on a copy of
    os.environ.

  Raises:
    ValueError if an env var requests a parameter whose value is not provided
    (see replace_parameters).
  """
  out = os.environ.copy()
  for k, v in env.items():
    if not v:
      # An empty value requests the variable to be unset.
      out.pop(k, None)
    else:
      out[k] = replace_parameters(v, out_dir, bot_file)

  if cipd_info:
    bin_dir = _to_str(os.path.dirname(cipd_info.client.binary_path))
    # PATH can be missing, e.g. when |env| unset it just above. Do not raise
    # KeyError in that case, and do not leave a trailing separator behind:
    # an empty PATH entry designates the current directory on POSIX.
    cur_path = out.get('PATH')
    if cur_path:
      out['PATH'] = '%s%s%s' % (bin_dir, os.pathsep, cur_path)
    else:
      out['PATH'] = bin_dir
    out['CIPD_CACHE_DIR'] = _to_str(cipd_info.cache_dir)

  for key, paths in env_prefixes.items():
    assert isinstance(paths, list), paths
    # Prefixes are relative to run_dir; any pre-existing value is kept last.
    paths = [os.path.normpath(os.path.join(run_dir, p)) for p in paths]
    cur = out.get(key)
    if cur:
      paths.append(cur)
    out[key] = _to_str(os.path.pathsep.join(paths))

  tmp_dir = _to_str(tmp_dir)
  # pylint: disable=line-too-long
  # * python respects $TMPDIR, $TEMP, and $TMP in this order, regardless of
  #   platform. So $TMPDIR must be set on all platforms.
  #   https://github.com/python/cpython/blob/2.7/Lib/tempfile.py#L155
  out['TMPDIR'] = tmp_dir
  if sys.platform == 'win32':
    # * chromium's base utils uses GetTempPath().
    #    https://cs.chromium.org/chromium/src/base/files/file_util_win.cc?q=GetTempPath
    # * Go uses GetTempPath().
    # * GetTempDir() uses %TMP%, then %TEMP%, then other stuff. So %TMP% must
    #   be set.
    #   https://docs.microsoft.com/en-us/windows/desktop/api/fileapi/nf-fileapi-gettemppathw
    out['TMP'] = tmp_dir
    # https://blogs.msdn.microsoft.com/oldnewthing/20150417-00/?p=44213
    out['TEMP'] = tmp_dir
  elif sys.platform == 'darwin':
    # * Chromium uses an hack on macOS before calling into
    #   NSTemporaryDirectory().
    #   https://cs.chromium.org/chromium/src/base/files/file_util_mac.mm?q=GetTempDir
    #   https://developer.apple.com/documentation/foundation/1409211-nstemporarydirectory
    out['MAC_CHROMIUM_TMPDIR'] = tmp_dir
  else:
    # TMPDIR is specified as the POSIX standard envvar for the temp directory.
    #   http://pubs.opengroup.org/onlinepubs/9699919799/basedefs/V1_chap08.html
    # * mktemp on linux respects $TMPDIR.
    # * Chromium respects $TMPDIR on linux.
    #   https://cs.chromium.org/chromium/src/base/files/file_util_posix.cc?q=GetTempDir
    # * Go uses $TMPDIR.
    #   https://go.googlesource.com/go/+/go1.10.3/src/os/file_unix.go#307
    pass
  return out
vadimsh232f5a82017-01-20 19:23:44 -0800435
436
def run_command(
    command, cwd, env, hard_timeout, grace_period, lower_priority, containment):
  """Runs |command| as a child process and waits for it to terminate.

  The child is first given |hard_timeout| seconds to finish. On timeout, or
  when a stop signal is received, it is terminated and given |grace_period|
  seconds to exit before it is killed.

  Args:
    command: list of strings; the command line to run.
    cwd: directory to run the command in.
    env: environment for the child process.
    hard_timeout: seconds to wait before terminating; falsy means no limit.
    grace_period: seconds between terminate and kill; falsy means no limit.
    lower_priority: forwarded to subprocess42.Popen.
    containment: forwarded to subprocess42.Popen.

  Returns:
    tuple(process exit code, bool if had a hard timeout)
  """
  logging.info(
      'run_command(%s, %s, %s, %s, %s, %s)',
      command, cwd, hard_timeout, grace_period, lower_priority, containment)

  exit_code = None
  had_hard_timeout = False
  with tools.Profiler('RunTest'):
    proc = None
    # Non-empty once a stop signal was received while the child was running.
    signals_seen = []

    # TODO(maruel): This code is imperfect. It doesn't handle well signals
    # during the download phase and there's short windows where things can go
    # wrong.
    def on_stop_signal(signum, _frame):
      # Turns the first stop signal into a timeout so that it goes through
      # the same termination path as a hard timeout.
      if proc and not signals_seen:
        logging.info('Received signal %d', signum)
        signals_seen.append(True)
        raise subprocess42.TimeoutExpired(command, None)

    def ignore_signal(*_):
      return None

    try:
      proc = subprocess42.Popen(
          command, cwd=cwd, env=env, detached=True, close_fds=True,
          lower_priority=lower_priority, containment=containment)
      with subprocess42.set_signal_handler(
          subprocess42.STOP_SIGNALS, on_stop_signal):
        try:
          exit_code = proc.wait(hard_timeout or None)
        except subprocess42.TimeoutExpired:
          if not signals_seen:
            logging.warning('Hard timeout')
            had_hard_timeout = True
          logging.warning('Sending SIGTERM')
          proc.terminate()

      # Ignore signals in grace period. Forcibly give the grace period to the
      # child process.
      if exit_code is None:
        with subprocess42.set_signal_handler(
            subprocess42.STOP_SIGNALS, ignore_signal):
          try:
            exit_code = proc.wait(grace_period or None)
          except subprocess42.TimeoutExpired:
            # Now kill for real. The user can distinguish between the
            # following states:
            # - signal but process exited within grace period,
            #   hard_timed_out will be set but the process exit code will be
            #   script provided.
            # - processed exited late, exit code will be -9 on posix.
            logging.warning('Grace exhausted; sending SIGKILL')
            proc.kill()
        logging.info('Waiting for process exit')
        exit_code = proc.wait()
    except OSError:
      # This is not considered to be an internal error. The executable simply
      # does not exist.
      sys.stderr.write(
          '<The executable does not exist, a dependent library is missing or '
          'the command line is too long>\n'
          '<Check for missing .so/.dll in the .isolate or GN file or length of '
          'command line args>\n'
          '<Command: %s>\n' % command)
      if os.environ.get('SWARMING_TASK_ID'):
        # Give an additional hint when running as a swarming task.
        sys.stderr.write(
            "<See the task's page for commands to help diagnose this issue "
            'by reproducing the task locally>\n')
      exit_code = 1
  logging.info(
      'Command finished with exit code %d (%s)',
      exit_code, hex(0xffffffff & exit_code))
  return exit_code, had_hard_timeout
maruela9cfd6f2015-09-15 11:03:15 -0700513
514
def _fetch_and_map_with_go(isolated_hash, storage, cache, outdir,
                           isolated_client):
  """Fetches an isolated tree using the go client and creates the tree.

  The go client is asked to write a JSON summary to a temporary file, which is
  read back and always removed afterwards.

  Args:
    isolated_hash: hash of the .isolated file to download.
    storage: object whose |server_ref| provides the isolate server url and
        namespace.
    cache: object providing |cache_dir| and |policies| (max_items,
        max_cache_size, min_free_space) for the client's local cache.
    outdir: directory to map the tree into.
    isolated_client: path to the go isolated client executable.

  Returns:
    tuple(bundle, stats)
    - bundle: isolateserver.IsolatedBundle with only command, read_only and
      relative_cwd set.
    - stats: dict with 'duration', 'items_cold' and 'items_hot'; the latter
      two are taken as-is from the client's JSON result.
  """
  start = time.time()
  server_ref = storage.server_ref
  policies = cache.policies
  result_json_handle, result_json_path = tempfile.mkstemp(
      prefix=u'fetch-and-map-result-', suffix=u'.json')
  # Only the path is needed; the client writes the file itself.
  os.close(result_json_handle)
  try:
    subprocess42.check_call([
        isolated_client,
        'download',
        '-isolate-server',
        server_ref.url,
        '-namespace',
        server_ref.namespace,
        '-isolated',
        isolated_hash,

        # flags for cache
        # Command line arguments must be strings, so the numeric policy
        # values are converted explicitly.
        '-cache-dir',
        cache.cache_dir,
        '-cache-max-items',
        str(policies.max_items),
        '-cache-max-size',
        str(policies.max_cache_size),
        '-cache-min-free-space',
        str(policies.min_free_space),

        # flags for output
        '-output-dir',
        outdir,
        '-fetch-and-map-result-json',
        result_json_path,
    ])
    with open(result_json_path) as json_file:
      result_json = json.load(json_file)

    isolated = result_json['isolated']
    bundle = isolateserver.IsolatedBundle(filter_cb=None)
    # Only following properties are used in caller.
    bundle.command = isolated.get('command')
    bundle.read_only = isolated.get('read_only')
    bundle.relative_cwd = isolated.get('relative_cwd')

    return bundle, {
        'duration': time.time() - start,
        'items_cold': result_json['items_cold'],
        'items_hot': result_json['items_hot'],
    }
  finally:
    fs.remove(result_json_path)
571
572
573# TODO(crbug.com/932396): remove this function.
def fetch_and_map(isolated_hash, storage, cache, outdir, use_symlinks):
  """Downloads an isolated tree and maps it into |outdir|.

  Returns:
    tuple(bundle, stats)
    - bundle: what isolateserver.fetch_isolated() returned.
    - stats: dict with 'duration' (seconds) and base64 encoded packed
      'items_cold' (cache.added) and 'items_hot' (cache.used minus
      cache.added) entries.
  """
  started = time.time()
  bundle = isolateserver.fetch_isolated(
      isolated_hash=isolated_hash, storage=storage, cache=cache,
      outdir=outdir, use_symlinks=use_symlinks)

  # Multiset difference: each used item is counted as hot once for every use
  # beyond the times it was added.
  used_counts = collections.Counter(cache.used)
  added_counts = collections.Counter(cache.added)
  hot_items = (used_counts - added_counts).elements()

  stats = {
      'duration': time.time() - started,
      'items_cold': base64.b64encode(large.pack(sorted(cache.added))),
      'items_hot': base64.b64encode(large.pack(sorted(hot_items))),
  }
  return bundle, stats
590
591
def link_outputs_to_outdir(run_dir, out_dir, outputs):
  """Makes the named |outputs| available in |out_dir| so they get uploaded.

  Does nothing when |outputs| is empty or None.

  Args:
    run_dir: directory the outputs are relative to.
    out_dir: directory the outputs are copied into.
    outputs: list of paths relative to |run_dir|.

  Raises an error if the file already exists in that directory.
  """
  if outputs:
    isolateserver.create_directories(out_dir, outputs)
    for rel_path in outputs:
      copy_recursively(
          os.path.join(run_dir, rel_path), os.path.join(out_dir, rel_path))
602
603
def copy_recursively(src, dst):
  """Efficiently copies a file or directory from |src| to |dst|.

  |src| may be a file, a directory, or a symlink to a file or directory.
  All symlinks are replaced with their targets, so the resulting directory
  structure under |dst| will never have any symlinks.

  To increase speed, individual files are hardlinked into the (newly created)
  directory structure if possible, unlike Python's shutil.copytree().

  OSError is never propagated: it is logged instead, as a warning when the
  path does not exist and as an info message otherwise.
  """
  requested = src
  try:
    # Follow symlinks down to their final target.
    # TODO(sadafm): Explicitly handle cyclic symlinks.
    while fs.islink(src):
      src = os.path.join(os.path.dirname(src), fs.readlink(src))

    if fs.isfile(src):
      file_path.link_file(dst, src, file_path.HARDLINK_WITH_FALLBACK)
    else:
      # Not a file, so it is handled as a directory. A path that does not
      # exist is expected to surface as an OSError with ENOENT, which is
      # logged below.
      if not fs.exists(dst):
        os.makedirs(dst)
      for name in fs.listdir(src):
        copy_recursively(os.path.join(src, name), os.path.join(dst, name))
  except OSError as err:
    if err.errno != errno.ENOENT:
      logging.info("Couldn't collect output file %s: %s", src, err)
    else:
      logging.warning('Path %s does not exist or %s is a broken symlink',
                      src, requested)
aludwin0a8e17d2016-10-27 15:57:39 -0700641
642
def upload_then_delete(storage, out_dir, leak_temp_dir):
  """Uploads the content of out_dir back to storage, then deletes out_dir.

  Arguments:
  - storage: storage object passed to isolateserver.archive_files_to_storage();
    its server_ref.url and server_ref.namespace are recorded in outputs_ref.
  - out_dir: directory holding the task outputs. Nothing is uploaded if it is
    not a directory or if it is empty.
  - leak_temp_dir: if true, out_dir is left on disk instead of being deleted.

  Returns:
    tuple(outputs_ref, success, stats)
    - outputs_ref: a dict referring to the results archived back to the isolated
      server, if applicable. None if nothing was uploaded.
    - success: False if something occurred that means that the task must
      forcibly be considered a failure, e.g. zombie processes were left
      behind.
    - stats: uploading stats.

  Raises:
    isolateserver.Aborted: re-raised when the upload was interrupted.
  """
  # Upload out_dir and generate a .isolated file out of this directory. It is
  # only done if files were written in the directory.
  outputs_ref = None
  cold = []
  hot = []
  start = time.time()

  if fs.isdir(out_dir) and fs.listdir(out_dir):
    with tools.Profiler('ArchiveOutput'):
      try:
        results, f_cold, f_hot = isolateserver.archive_files_to_storage(
            storage, [out_dir], None)
        outputs_ref = {
            # dict.values() is a non-subscriptable view on Python 3, so it is
            # materialized as a list before taking the first item.
            'isolated': list(results.values())[0],
            'isolatedserver': storage.server_ref.url,
            'namespace': storage.server_ref.namespace,
        }
        cold = sorted(i.size for i in f_cold)
        hot = sorted(i.size for i in f_hot)
      except isolateserver.Aborted:
        # This happens when a signal SIGTERM was received while uploading data.
        # There are 2 causes:
        # - The task was too slow and was about to be killed anyway due to
        #   exceeding the hard timeout.
        # - The amount of data uploaded back is very large and took too much
        #   time to archive.
        sys.stderr.write('Received SIGTERM while uploading')
        # Re-raise, so it will be treated as an internal failure.
        raise

  success = False
  try:
    if (not leak_temp_dir and fs.isdir(out_dir) and
        not file_path.rmtree(out_dir)):
      logging.error('Had difficulties removing out_dir %s', out_dir)
    else:
      # Either the directory was deliberately kept, was already gone, or was
      # removed successfully.
      success = True
  except OSError as e:
    # When this happens, it means there's a process error.
    logging.exception('Had difficulties removing out_dir %s: %s', out_dir, e)
  stats = {
      'duration': time.time() - start,
      'items_cold': base64.b64encode(large.pack(cold)),
      'items_hot': base64.b64encode(large.pack(hot)),
  }
  return outputs_ref, success, stats
maruela9cfd6f2015-09-15 11:03:15 -0700701
702
def map_and_run(data, constant_run_path):
  """Runs a command with optional isolated input/output.

  Sets up the run, output, temporary and isolated client directories, installs
  the CIPD packages, optionally maps the isolated tree, runs the command and
  finally cleans up and uploads the outputs.

  Arguments:
  - data: TaskData instance.
  - constant_run_path: if true and data.root_dir is set, the run directory is
    the fixed path <root_dir>/ISOLATED_RUN_DIR, which is wiped and recreated;
    otherwise the run directory is created via make_temp_dir().

  Returns metadata about the result, as a dict with the keys 'duration',
  'exit_code', 'had_hard_timeout', 'internal_failure', 'stats', 'outputs_ref',
  'version' and, when CIPD is used, 'cipd_pins'.
  """
  result = {
      'duration': None,
      'exit_code': None,
      'had_hard_timeout': False,
      # Only reset to None once the command ran and all the context managers
      # exited cleanly.
      'internal_failure': 'run_isolated did not complete properly',
      'stats': {
          #'cipd': {
          #  'duration': 0.,
          #  'get_client_duration': 0.,
          #},
          'isolated': {
              'download': {
                  #'duration': 0.,
                  'initial_number_items': len(data.isolate_cache),
                  'initial_size': data.isolate_cache.total_size,
                  #'items_cold': '<large.pack()>',
                  #'items_hot': '<large.pack()>',
              },
              #'upload': {
              #  'duration': 0.,
              #  'items_cold': '<large.pack()>',
              #  'items_hot': '<large.pack()>',
              #},
          },
      },
      #'cipd_pins': {
      #  'packages': [
      #    {'package_name': ..., 'version': ..., 'path': ...},
      #    ...
      #  ],
      # 'client_package': {'package_name': ..., 'version': ...},
      #},
      'outputs_ref': None,
      'version': 5,
  }

  if data.root_dir:
    file_path.ensure_tree(data.root_dir, 0o700)
  elif data.isolate_cache.cache_dir:
    # Default the root to the directory containing the isolate cache.
    data = data._replace(
        root_dir=os.path.dirname(data.isolate_cache.cache_dir))
  # See comment for these constants.
  # If root_dir is not specified, it is not constant.
  # TODO(maruel): This is not obvious. Change this to become an error once we
  # make the constant_run_path an exposed flag.
  if constant_run_path and data.root_dir:
    run_dir = os.path.join(data.root_dir, ISOLATED_RUN_DIR)
    if os.path.isdir(run_dir):
      file_path.rmtree(run_dir)
    os.mkdir(run_dir, 0o700)
  else:
    run_dir = make_temp_dir(ISOLATED_RUN_DIR, data.root_dir)
  # storage should be normally set but don't crash if it is not. This can happen
  # as Swarming task can run without an isolate server.
  out_dir = make_temp_dir(
      ISOLATED_OUT_DIR, data.root_dir) if data.storage else None
  tmp_dir = make_temp_dir(ISOLATED_TMP_DIR, data.root_dir)
  isolated_client_dir = make_temp_dir(ISOLATED_CLIENT_DIR, data.root_dir)
  cwd = run_dir
  if data.relative_cwd:
    cwd = os.path.normpath(os.path.join(cwd, data.relative_cwd))
  command = data.command
  try:
    with data.install_packages_fn(run_dir, isolated_client_dir) as cipd_info:
      if cipd_info:
        result['stats']['cipd'] = cipd_info.stats
        result['cipd_pins'] = cipd_info.pins

      if data.isolated_hash:
        isolated_stats = result['stats'].setdefault('isolated', {})
        if data.use_go_isolated:
          bundle, stats = _fetch_and_map_with_go(
              isolated_hash=data.isolated_hash,
              storage=data.storage,
              cache=data.isolate_cache,
              outdir=run_dir,
              isolated_client=os.path.join(isolated_client_dir,
                                           'isolated' + cipd.EXECUTABLE_SUFFIX))
        else:
          bundle, stats = fetch_and_map(
              isolated_hash=data.isolated_hash,
              storage=data.storage,
              cache=data.isolate_cache,
              outdir=run_dir,
              use_symlinks=data.use_symlinks)
        isolated_stats['download'].update(stats)
        change_tree_read_only(run_dir, bundle.read_only)
        # Inject the command
        if not command and bundle.command:
          command = bundle.command + data.extra_args
          # Only set the relative directory if the isolated file specified a
          # command, and no raw command was specified.
          if bundle.relative_cwd:
            cwd = os.path.normpath(os.path.join(cwd, bundle.relative_cwd))

      if not command:
        # Handle this as a task failure, not an internal failure.
        sys.stderr.write(
            '<No command was specified!>\n'
            '<Please secify a command when triggering your Swarming task>\n')
        result['exit_code'] = 1
        return result

      # A bare prefix match would also accept a sibling directory whose name
      # merely starts with run_dir (e.g. '<run_dir>_other' reached through
      # '../'), so match against run_dir with a trailing path separator.
      if cwd != run_dir and not cwd.startswith(os.path.join(run_dir, '')):
        # Handle this as a task failure, not an internal failure. This is a
        # 'last chance' way to gate against directory escape.
        sys.stderr.write('<Relative CWD is outside of run directory!>\n')
        result['exit_code'] = 1
        return result

      if not os.path.isdir(cwd):
        # Accepts relative_cwd that does not exist.
        os.makedirs(cwd, 0o700)

      # If we have an explicit list of files to return, make sure their
      # directories exist now.
      if data.storage and data.outputs:
        isolateserver.create_directories(run_dir, data.outputs)

      with data.install_named_caches(run_dir):
        sys.stdout.flush()
        start = time.time()
        try:
          # Need to switch the default account before 'get_command_env' call,
          # so it can grab correct value of LUCI_CONTEXT env var.
          with set_luci_context_account(data.switch_to_account, tmp_dir):
            env = get_command_env(
                tmp_dir, cipd_info, run_dir, data.env, data.env_prefix, out_dir,
                data.bot_file)
            command = tools.find_executable(command, env)
            command = process_command(command, out_dir, data.bot_file)
            file_path.ensure_command_has_abs_path(command, cwd)

            result['exit_code'], result['had_hard_timeout'] = run_command(
                command, cwd, env, data.hard_timeout, data.grace_period,
                data.lower_priority, data.containment)
        finally:
          # Recorded even if the command could not be started or raised.
          result['duration'] = max(time.time() - start, 0)

    # We successfully ran the command, set internal_failure back to
    # None (even if the command failed, it's not an internal error).
    result['internal_failure'] = None
  except Exception as e:
    # An internal error occurred. Report accordingly so the swarming task will
    # be retried automatically.
    logging.exception('internal failure: %s', e)
    result['internal_failure'] = str(e)
    on_error.report(None)

  # Clean up
  finally:
    try:
      # Try to link files to the output directory, if specified.
      if out_dir:
        link_outputs_to_outdir(run_dir, out_dir, data.outputs)

      success = False
      if data.leak_temp_dir:
        success = True
        logging.warning(
            'Deliberately leaking %s for later examination', run_dir)
      else:
        # On Windows rmtree(run_dir) call below has a synchronization effect: it
        # finishes only when all task child processes terminate (since a running
        # process locks *.exe file). Examine out_dir only after that call
        # completes (since child processes may write to out_dir too and we need
        # to wait for them to finish).
        for directory in (run_dir, tmp_dir, isolated_client_dir):
          if not fs.isdir(directory):
            continue
          try:
            success = file_path.rmtree(directory)
          except OSError as e:
            logging.error('rmtree(%r) failed: %s', directory, e)
            success = False
          if not success:
            sys.stderr.write(
                OUTLIVING_ZOMBIE_MSG % (directory, data.grace_period))
            # A directory that cannot be deleted turns a passing task into a
            # failing one.
            if result['exit_code'] == 0:
              result['exit_code'] = 1

      # This deletes out_dir if leak_temp_dir is not set.
      if out_dir:
        isolated_stats = result['stats'].setdefault('isolated', {})
        result['outputs_ref'], success, isolated_stats['upload'] = (
            upload_then_delete(data.storage, out_dir, data.leak_temp_dir))
      if not success and result['exit_code'] == 0:
        result['exit_code'] = 1
    except Exception as e:
      # Swallow any exception in the main finally clause.
      if out_dir:
        logging.exception('Leaking out_dir %s: %s', out_dir, e)
      result['internal_failure'] = str(e)
  return result
Marc-Antoine Ruel2283ad12014-02-09 11:14:57 -0500906
907
def run_tha_test(data, result_json):
  """Runs an executable and records execution metadata.

  When an isolated hash is given, the dependencies are fetched into the cache
  and mapped into a temporary directory, and the command from the .isolated is
  run there.

  Files written to the temporary output directory are uploaded back to
  |storage|, packaged as a .isolated file.

  Arguments:
  - data: TaskData instance.
  - result_json: File path to dump result metadata into. If set, the process
    exit code is always 0 unless an internal error occurred.

  Returns:
    Process exit code that should be used.
  """
  if result_json:
    # Leave a placeholder on disk immediately, in case the process is killed
    # before the real result can be written.
    placeholder = {
        'exit_code': None,
        'had_hard_timeout': False,
        'internal_failure': 'Was terminated before completion',
        'outputs_ref': None,
        'version': 5,
    }
    tools.write_json(result_json, placeholder, dense=True)

  # The run_isolated exit code depends on whether result_json is used or not.
  result = map_and_run(data, True)
  logging.info('Result:\n%s', tools.format_json(result, dense=True))

  if result_json:
    # Some tests were found to delete 'work' when quitting, which made the
    # write below fail. Recreate the directory if necessary.
    json_dir = os.path.dirname(result_json)
    file_path.ensure_tree(json_dir)
    tools.write_json(result_json, result, dense=True)
    # Only an internal error yields a non-zero exit code in this mode.
    return int(bool(result['internal_failure']))

  # Marshall into old-style inline output.
  outputs_ref = result['outputs_ref']
  if outputs_ref:
    # pylint: disable=unsubscriptable-object
    inline_output = {
        'hash': outputs_ref['isolated'],
        'namespace': outputs_ref['namespace'],
        'storage': outputs_ref['isolatedserver'],
    }
    marker = '[run_isolated_out_hack]%s[/run_isolated_out_hack]' % (
        tools.format_json(inline_output, dense=True))
    sys.stdout.flush()
    print(marker)
    sys.stdout.flush()
  return result['exit_code'] or int(bool(result['internal_failure']))
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +0000964
965
# Value yielded by 'install_client_and_packages'. Fields:
# - client: cipd.CipdClient object.
# - cache_dir: absolute path to bot-global cipd tag and instance cache.
# - stats: dict with stats to return to the server.
# - pins: dict with installed cipd pins to return to the server.
CipdInfo = collections.namedtuple(
    'CipdInfo', ('client', 'cache_dir', 'stats', 'pins'))
973
974
@contextlib.contextmanager
def noop_install_packages(_run_dir, _isolated_dir):
  """Stands in for 'install_client_and_packages' when cipd is disabled.

  Both arguments are ignored and the context yields None.
  """
  no_cipd_info = None
  yield no_cipd_info
979
980
Takuto Ikuta2efc7792019-11-27 14:33:34 +0000981def _install_packages(run_dir, cipd_cache_dir, client, packages):
iannuccib58d10d2017-03-18 02:00:25 -0700982 """Calls 'cipd ensure' for packages.
983
984 Args:
985 run_dir (str): root of installation.
986 cipd_cache_dir (str): the directory to use for the cipd package cache.
987 client (CipdClient): the cipd client to use
988 packages: packages to install, list [(path, package_name, version), ...].
iannuccib58d10d2017-03-18 02:00:25 -0700989
990 Returns: list of pinned packages. Looks like [
991 {
992 'path': 'subdirectory',
993 'package_name': 'resolved/package/name',
994 'version': 'deadbeef...',
995 },
996 ...
997 ]
998 """
999 package_pins = [None]*len(packages)
1000 def insert_pin(path, name, version, idx):
1001 package_pins[idx] = {
1002 'package_name': name,
1003 # swarming deals with 'root' as '.'
1004 'path': path or '.',
1005 'version': version,
1006 }
1007
1008 by_path = collections.defaultdict(list)
1009 for i, (path, name, version) in enumerate(packages):
1010 # cipd deals with 'root' as ''
1011 if path == '.':
1012 path = ''
1013 by_path[path].append((name, version, i))
1014
1015 pins = client.ensure(
Takuto Ikuta2efc7792019-11-27 14:33:34 +00001016 run_dir,
1017 {
1018 subdir: [(name, vers) for name, vers, _ in pkgs
1019 ] for subdir, pkgs in by_path.items()
1020 },
1021 cache_dir=cipd_cache_dir,
iannuccib58d10d2017-03-18 02:00:25 -07001022 )
1023
Marc-Antoine Ruel04903a32019-10-09 21:09:25 +00001024 for subdir, pin_list in sorted(pins.items()):
iannuccib58d10d2017-03-18 02:00:25 -07001025 this_subdir = by_path[subdir]
1026 for i, (name, version) in enumerate(pin_list):
1027 insert_pin(subdir, name, version, this_subdir[i][2])
1028
Robert Iannucci461b30d2017-12-13 11:34:03 -08001029 assert None not in package_pins, (packages, pins, package_pins)
iannuccib58d10d2017-03-18 02:00:25 -07001030
1031 return package_pins
1032
1033
@contextlib.contextmanager
def install_client_and_packages(run_dir, packages, service_url,
                                client_package_name, client_version, cache_dir,
                                isolated_dir):
  """Bootstraps the CIPD client, then installs the requested CIPD packages.

  Yields a single CipdInfo object carrying the CipdClient, the cipd cache
  directory, the timing stats and the pins.

  The package pins are a list of dictionaries of the form:
    [
      {
        "path": path, "package_name": package_name, "version": version,
      },
      ...
    ]
  and the CIPD client pin is a single dictionary with "package_name" and
  "version".

  The package pins correspond 1:1 to the entries of 'packages'. These
  dictionaries make their way all the way back to swarming, where they become
  the arguments of CipdPackage.

  When 'packages' is empty, the CIPD client is still bootstrapped but no task
  package is installed. The isolated client package is installed into
  'isolated_dir' in both cases.

  Args:
    run_dir (str): root of installation.
    packages: packages to install, list [(path, package_name, version), ...].
    service_url (str): CIPD server url, e.g.
      "https://chrome-infra-packages.appspot.com."
    client_package_name (str): CIPD package name of CIPD client.
    client_version (str): Version of CIPD client.
    cache_dir (str): where to keep cache of cipd clients, packages and tags.
    isolated_dir (str): where to download isolated client.
  """
  assert cache_dir

  overall_start = time.time()

  cache_dir = os.path.abspath(cache_dir)
  # The tag and instance caches live in a subdirectory of the client cache.
  cipd_cache_dir = os.path.join(cache_dir, 'cache')
  run_dir = os.path.abspath(run_dir)
  packages = packages or []

  client_start = time.time()
  with cipd.get_client(service_url, client_package_name, client_version,
                       cache_dir) as client:
    get_client_duration = time.time() - client_start

    package_pins = (
        _install_packages(run_dir, cipd_cache_dir, client, packages)
        if packages else [])

    # Install isolated client to |isolated_dir|.
    isolated_client_package = [('', ISOLATED_PACKAGE, ISOLATED_REVISION)]
    _install_packages(isolated_dir, cipd_cache_dir, client,
                      isolated_client_package)

    file_path.make_tree_files_read_only(run_dir)

    total_duration = time.time() - overall_start
    logging.info(
        'Installing CIPD client and packages took %d seconds', total_duration)

    stats = {
        'duration': total_duration,
        'get_client_duration': get_client_duration,
    }
    pins = {
        'client_package': {
            'package_name': client.package_name,
            'version': client.instance_id,
        },
        'packages': package_pins,
    }
    yield CipdInfo(
        client=client, cache_dir=cipd_cache_dir, stats=stats, pins=pins)
nodirbe642ff2016-06-09 15:51:51 -07001116
1117
def create_option_parser():
  """Builds the command line option parser for run_isolated.

  General options are registered directly on the parser; the rest is split
  into the 'Data source', 'Named caches', 'Process containment' and 'Debugging'
  groups, plus whatever the isolateserver, cipd and auth helpers register.

  Returns:
    A logging_utils.OptionParserWithLogging instance whose 'cache' and
    'cipd_cache' defaults are set.
  """
  parser = logging_utils.OptionParserWithLogging(
      usage='%prog <options> [command to run or extra args]',
      version=__version__,
      log_file=RUN_ISOLATED_LOG_FILE)
  parser.add_option(
      '--clean', action='store_true',
      help='Cleans the cache, trimming it necessary and remove corrupted items '
           'and returns without executing anything; use with -v to know what '
           'was done')
  parser.add_option(
      '--use-symlinks', action='store_true',
      help='Use symlinks instead of hardlinks')
  parser.add_option(
      '--use-go-isolated',
      action='store_true',
      help='Use go isolated instead of python implementation')
  parser.add_option(
      '--json',
      help='dump output metadata to json file. When used, run_isolated returns '
           'non-zero only on internal failure')
  parser.add_option(
      '--hard-timeout', type='float', help='Enforce hard timeout in execution')
  parser.add_option(
      '--grace-period', type='float',
      help='Grace period between SIGTERM and SIGKILL')
  parser.add_option(
      '--raw-cmd', action='store_true',
      help='Ignore the isolated command, use the one supplied at the command '
           'line')
  parser.add_option(
      '--relative-cwd',
      help='Ignore the isolated \'relative_cwd\' and use this one instead; '
           'requires --raw-cmd')
  parser.add_option(
      '--env', default=[], action='append',
      help='Environment variables to set for the child process')
  parser.add_option(
      '--env-prefix', default=[], action='append',
      help='Specify a VAR=./path/fragment to put in the environment variable '
           'before executing the command. The path fragment must be relative '
           'to the isolated run directory, and must not contain a `..` token. '
           'The path will be made absolute and prepended to the indicated '
           '$VAR using the OS\'s path separator. Multiple items for the same '
           '$VAR will be prepended in order.')
  parser.add_option(
      '--bot-file',
      help='Path to a file describing the state of the host. The content is '
           'defined by on_before_task() in bot_config.')
  parser.add_option(
      '--switch-to-account',
      help='If given, switches LUCI_CONTEXT to given logical service account '
           '(e.g. "task" or "system") before launching the isolated process.')
  parser.add_option(
      '--output', action='append',
      help='Specifies an output to return. If no outputs are specified, all '
           'files located in $(ISOLATED_OUTDIR) will be returned; '
           'otherwise, outputs in both $(ISOLATED_OUTDIR) and those '
           'specified by --output option (there can be multiple) will be '
           'returned. Note that if a file in OUT_DIR has the same path '
           'as an --output option, the --output version will be returned.')
  parser.add_option(
      '-a', '--argsfile',
      # This is actually handled in parse_args; it's included here purely so it
      # can make it into the help text.
      help='Specify a file containing a JSON array of arguments to this '
           'script. If --argsfile is provided, no other argument may be '
           'provided on the command line.')

  group = optparse.OptionGroup(parser, 'Data source')
  group.add_option(
      '-s', '--isolated',
      help='Hash of the .isolated to grab from the isolate server.')
  isolateserver.add_isolate_server_options(group)
  parser.add_option_group(group)

  isolateserver.add_cache_options(parser)

  cipd.add_cipd_options(parser)

  group = optparse.OptionGroup(parser, 'Named caches')
  group.add_option(
      '--named-cache',
      dest='named_caches',
      action='append',
      nargs=3,
      default=[],
      help='A named cache to request. Accepts 3 arguments: name, path, hint. '
           'name identifies the cache, must match regex [a-z0-9_]{1,4096}. '
           'path is a path relative to the run dir where the cache directory '
           'must be put to. '
           'This option can be specified more than once.')
  group.add_option(
      '--named-cache-root', default='named_caches',
      help='Cache root directory. Default=%default')
  parser.add_option_group(group)

  # These options are registered on the group rather than on the parser, so
  # that they are listed under 'Process containment' in --help instead of
  # leaving that section empty.
  group = optparse.OptionGroup(parser, 'Process containment')
  group.add_option(
      '--lower-priority', action='store_true',
      help='Lowers the child process priority')
  group.add_option(
      '--containment-type', choices=('NONE', 'AUTO', 'JOB_OBJECT'),
      default='NONE',
      help='Type of container to use')
  group.add_option(
      '--limit-processes', type='int', default=0,
      help='Maximum number of active processes in the containment')
  group.add_option(
      '--limit-total-committed-memory', type='int', default=0,
      help='Maximum sum of committed memory in the containment')
  parser.add_option_group(group)

  group = optparse.OptionGroup(parser, 'Debugging')
  group.add_option(
      '--leak-temp-dir',
      action='store_true',
      help='Deliberately leak isolate\'s temp dir for later examination. '
           'Default: %default')
  group.add_option(
      '--root-dir', help='Use a directory instead of a random one')
  parser.add_option_group(group)

  auth.add_auth_options(parser)

  parser.set_defaults(cache='cache', cipd_cache='cipd_cache')
  return parser
1245
1246
def process_named_cache_options(parser, options, time_fn=None):
  """Validates named cache options and returns the named cache, if any.

  Arguments:
  - parser: option parser; its error() method is called on invalid options.
  - options: parsed options; named_caches, named_cache_root and min_free_space
    are read.
  - time_fn: forwarded as is to local_caching.NamedCache.

  Returns:
    A local_caching.NamedCache rooted at the absolute path of
    options.named_cache_root, or None if options.named_cache_root is empty.
  """
  if options.named_caches and not options.named_cache_root:
    parser.error('--named-cache is specified, but --named-cache-root is empty')
  for name, path, hint in options.named_caches:
    if not CACHE_NAME_RE.match(name):
      parser.error(
          'cache name %r does not match %r' % (name, CACHE_NAME_RE.pattern))
    if not path:
      parser.error('cache path cannot be empty')
    try:
      # int() instead of long(): long does not exist on Python 3, and int()
      # handles arbitrarily large values on both Python 2 and 3.
      int(hint)
    except ValueError:
      parser.error('cache hint must be a number')
  if options.named_cache_root:
    # Make these configurable later if there is use case but for now it's fairly
    # safe values.
    # In practice, a fair chunk of bots are already recycled on a daily schedule
    # so this code doesn't have any effect to them, unless they are preloaded
    # with a really old cache.
    policies = local_caching.CachePolicies(
        # 1TiB.
        max_cache_size=1024*1024*1024*1024,
        min_free_space=options.min_free_space,
        max_items=50,
        max_age_secs=MAX_AGE_SECS)
    root_dir = six.text_type(os.path.abspath(options.named_cache_root))
    return local_caching.NamedCache(root_dir, policies, time_fn=time_fn)
  return None
1276
1277
def parse_args(args):
  """Parses the command line, optionally loading it from a JSON --argsfile.

  Arguments:
    args: list of command line arguments, without the program name.

  Returns:
    Tuple (parser, options, args) where parser is the parser returned by
    create_option_parser() and (options, args) is the result of its
    parse_args() call.
  """
  # Create a fake mini-parser just to get out the "-a" command. Note that
  # it's not documented here; instead, it's documented in create_option_parser
  # even though that parser will never actually get to parse it. This is
  # because --argsfile is exclusive with all other options and arguments.
  file_argparse = argparse.ArgumentParser(add_help=False)
  file_argparse.add_argument('-a', '--argsfile')
  (file_args, nonfile_args) = file_argparse.parse_known_args(args)
  if file_args.argsfile:
    if nonfile_args:
      # The trailing space matters: the two literals are concatenated.
      file_argparse.error('Can\'t specify --argsfile with '
                          'any other arguments (%s)' % nonfile_args)
    try:
      with open(file_args.argsfile, 'r') as f:
        args = json.load(f)
    except (IOError, OSError, ValueError) as e:
      # We don't need to error out here - "args" was not replaced and still
      # holds the original command line, which is handed to the normal parser
      # below.
      print('Couldn\'t read arguments: %s' % e, file=sys.stderr)

  # Even if we failed to read the args, just call the normal parser now since it
  # is the one that knows how to report errors and print the help message.
  parser = create_option_parser()
  options, args = parser.parse_args(args)
  return (parser, options, args)
1304
1305
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001306def _calc_named_cache_hint(named_cache, named_caches):
1307 """Returns the expected size of the missing named caches."""
1308 present = named_cache.available
1309 size = 0
1310 for name, _, hint in named_caches:
1311 if name not in present:
1312 hint = long(hint)
1313 if hint > 0:
1314 size += hint
1315 return size
1316
1317
def _path_is_within(path, root):
  """Returns True if |path| is |root| itself or is located below |root|.

  A bare path.startswith(root) is not sufficient: '/a/bc' starts with '/a/b'
  without being inside of it.
  """
  root = root.rstrip(os.path.sep)
  return path == root or path.startswith(root + os.path.sep)


def main(args):
  """Parses and validates the command line, then runs or cleans up.

  Arguments:
    args: list of command line arguments, without the program name.

  Returns:
    The process exit code: 0 once --clean is done, 1 when a cipd.Error,
    local_caching.NamedCacheError or local_caching.NoMoreSpace is raised,
    otherwise the value returned by run_tha_test().
  """
  # Warning: when --argsfile is used, the strings are unicode instances, when
  # parsed normally, the strings are str instances.
  (parser, options, args) = parse_args(args)

  if not file_path.enable_symlink():
    logging.warning('Symlink support is not enabled')

  named_cache = process_named_cache_options(parser, options)
  # hint is 0 if there's no named cache.
  hint = _calc_named_cache_hint(named_cache, options.named_caches)
  if hint:
    # Increase the --min-free-space value by the hint, and recreate the
    # NamedCache instance so it gets the updated CachePolicy.
    options.min_free_space += hint
    named_cache = process_named_cache_options(parser, options)

  # TODO(maruel): CIPD caches should be defined at a higher level here too, so
  # they can be cleaned the same way.
  isolate_cache = isolateserver.process_cache_options(options, trim=False)
  caches = []
  if isolate_cache:
    caches.append(isolate_cache)
  if named_cache:
    caches.append(named_cache)
  root = caches[0].cache_dir if caches else six.text_type(os.getcwd())
  if options.clean:
    if options.isolated:
      parser.error('Can\'t use --isolated with --clean.')
    if options.isolate_server:
      parser.error('Can\'t use --isolate-server with --clean.')
    if options.json:
      parser.error('Can\'t use --json with --clean.')
    if options.named_caches:
      parser.error('Can\'t use --named-cache with --clean.')
    # Trim first, then clean.
    local_caching.trim_caches(
        caches,
        root,
        min_free_space=options.min_free_space,
        max_age_secs=MAX_AGE_SECS)
    for c in caches:
      c.cleanup()
    return 0

  # Trim must still be done for the following case:
  # - named-cache was used
  # - some entries, with a large hint, were missing
  # - --min-free-space was increased accordingly, thus trimming is needed
  # Otherwise, this will have no effect, as bot_main calls run_isolated with
  # --clean after each task.
  if hint:
    logging.info('Additional trimming of %d bytes', hint)
    local_caching.trim_caches(
        caches,
        root,
        min_free_space=options.min_free_space,
        max_age_secs=MAX_AGE_SECS)

  if not options.isolated and not args:
    parser.error('--isolated or command to run is required.')

  auth.process_auth_options(parser, options)

  isolateserver.process_isolate_server_options(
      parser, options, True, False)
  if not options.isolate_server:
    if options.isolated:
      parser.error('--isolated requires --isolate-server')
    if ISOLATED_OUTDIR_PARAMETER in args:
      parser.error(
          '%s in args requires --isolate-server' % ISOLATED_OUTDIR_PARAMETER)

  if options.root_dir:
    options.root_dir = six.text_type(os.path.abspath(options.root_dir))
  if options.json:
    options.json = six.text_type(os.path.abspath(options.json))

  if any('=' not in i for i in options.env):
    parser.error(
        '--env required key=value form. value can be skipped to delete '
        'the variable')
  options.env = dict(i.split('=', 1) for i in options.env)

  prefixes = {}
  cwd = os.path.realpath(os.getcwd())
  for item in options.env_prefix:
    if '=' not in item:
      parser.error(
          '--env-prefix %r is malformed, must be in the form `VAR=./path`'
          % item)
    key, opath = item.split('=', 1)
    if os.path.isabs(opath):
      parser.error('--env-prefix %r path is bad, must be relative.' % opath)
    opath = os.path.normpath(opath)
    # Compare on path component boundaries so a sibling directory sharing a
    # name prefix with cwd (e.g. '../cwd-other') is rejected.
    if not _path_is_within(os.path.realpath(os.path.join(cwd, opath)), cwd):
      parser.error(
          '--env-prefix %r path is bad, must be relative and not contain `..`.'
          % opath)
    prefixes.setdefault(key, []).append(opath)
  options.env_prefix = prefixes

  cipd.validate_cipd_options(parser, options)
  if options.use_go_isolated and not options.cipd_enabled:
    parser.error('--cipd-enabled should be set if --use-go-isolated is set.')

  install_packages_fn = noop_install_packages
  if options.cipd_enabled:
    install_packages_fn = (
        lambda run_dir, isolated_dir: install_client_and_packages(
            run_dir, cipd.parse_package_args(options.cipd_packages),
            options.cipd_server, options.cipd_client_package,
            options.cipd_client_version, cache_dir=options.cipd_cache,
            isolated_dir=isolated_dir))

  @contextlib.contextmanager
  def install_named_caches(run_dir):
    # WARNING: this function depends on "options" variable defined in the outer
    # function.
    # NOTE(review): this only asserts that run_dir is non-empty; it looks like
    # an isinstance(run_dir, six.text_type) check was intended - confirm.
    assert six.text_type(run_dir), repr(run_dir)
    assert os.path.isabs(run_dir), run_dir
    named_caches = [(os.path.join(run_dir, six.text_type(relpath)), name)
                    for name, relpath, _ in options.named_caches]
    for path, name in named_caches:
      named_cache.install(path, name)
    try:
      yield
    finally:
      # Uninstall each named cache, returning it to the cache pool. If an
      # uninstall fails for a given cache, it will remain in the task's
      # temporary space, get cleaned up by the Swarming bot, and be lost.
      #
      # If the Swarming bot cannot clean up the cache, it will handle it like
      # any other bot file that could not be removed.
      for path, name in reversed(named_caches):
        try:
          # uninstall() doesn't trim but does call save() implicitly. Trimming
          # *must* be done manually via periodic 'run_isolated.py --clean'.
          named_cache.uninstall(path, name)
        except local_caching.NamedCacheError:
          # The format is "named cache <name> at <path>".
          logging.exception('Error while removing named cache %r at %r. '
                            'The cache will be lost.', name, path)

  extra_args = []
  command = []
  if options.raw_cmd:
    command = args
    if options.relative_cwd:
      a = os.path.normpath(os.path.abspath(options.relative_cwd))
      # Compare on path component boundaries; see _path_is_within().
      if not _path_is_within(a, os.getcwd()):
        parser.error(
            '--relative-cwd must not try to escape the working directory')
  else:
    if options.relative_cwd:
      parser.error('--relative-cwd requires --raw-cmd')
    extra_args = args

  containment_type = subprocess42.Containment.NONE
  if options.containment_type == 'AUTO':
    containment_type = subprocess42.Containment.AUTO
  if options.containment_type == 'JOB_OBJECT':
    containment_type = subprocess42.Containment.JOB_OBJECT
  containment = subprocess42.Containment(
      containment_type=containment_type,
      limit_processes=options.limit_processes,
      limit_total_committed_memory=options.limit_total_committed_memory)

  data = TaskData(
      command=command,
      relative_cwd=options.relative_cwd,
      extra_args=extra_args,
      isolated_hash=options.isolated,
      storage=None,
      isolate_cache=isolate_cache,
      outputs=options.output,
      install_named_caches=install_named_caches,
      leak_temp_dir=options.leak_temp_dir,
      root_dir=_to_unicode(options.root_dir),
      hard_timeout=options.hard_timeout,
      grace_period=options.grace_period,
      bot_file=options.bot_file,
      switch_to_account=options.switch_to_account,
      install_packages_fn=install_packages_fn,
      use_symlinks=bool(options.use_symlinks),
      use_go_isolated=bool(options.use_go_isolated),
      env=options.env,
      env_prefix=options.env_prefix,
      lower_priority=bool(options.lower_priority),
      containment=containment)
  try:
    if options.isolate_server:
      server_ref = isolate_storage.ServerRef(
          options.isolate_server, options.namespace)
      storage = isolateserver.get_storage(server_ref)
      with storage:
        data = data._replace(storage=storage)
        # Hashing schemes used by |storage| and |isolate_cache| MUST match.
        assert storage.server_ref.hash_algo == server_ref.hash_algo
        return run_tha_test(data, options.json)
    return run_tha_test(data, options.json)
  except (
      cipd.Error,
      local_caching.NamedCacheError,
      local_caching.NoMoreSpace) as ex:
    # BaseException.message doesn't exist on python3; use it when present and
    # non-empty, fall back on str(ex) otherwise.
    print(getattr(ex, 'message', None) or str(ex), file=sys.stderr)
    return 1
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001524
1525
if __name__ == '__main__':
  # Script entry point: set up the process, then exit with main()'s result.
  subprocess42.inhibit_os_error_reporting()
  # Ensure that we are always running with the correct encoding.
  fix_encoding.fix_encoding()
  exit_code = main(sys.argv[1:])
  sys.exit(exit_code)
Marc-Antoine Ruel90c98162013-12-18 15:11:57 -05001530 sys.exit(main(sys.argv[1:]))