blob: 46b3e2ba384b488776add5ad318a61eb5322d527 [file] [log] [blame]
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001#!/usr/bin/env python
maruelea586f32016-04-05 11:11:33 -07002# Copyright 2012 The LUCI Authors. All rights reserved.
maruelf1f5e2a2016-05-25 17:10:39 -07003# Use of this source code is governed under the Apache License, Version 2.0
4# that can be found in the LICENSE file.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00005
nodir55be77b2016-05-03 09:39:57 -07006"""Runs a command with optional isolated input/output.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00007
nodir55be77b2016-05-03 09:39:57 -07008Despite name "run_isolated", can run a generic non-isolated command specified as
9args.
10
11If input isolated hash is provided, fetches it, creates a tree of hard links,
12appends args to the command in the fetched isolated and runs it.
13To improve performance, keeps a local cache.
14The local cache can safely be deleted.
Marc-Antoine Ruel2283ad12014-02-09 11:14:57 -050015
nodirbe642ff2016-06-09 15:51:51 -070016Any ${EXECUTABLE_SUFFIX} on the command line will be replaced with ".exe" string
17on Windows and "" on other platforms.
18
Marc-Antoine Ruel2283ad12014-02-09 11:14:57 -050019Any ${ISOLATED_OUTDIR} on the command line will be replaced by the location of a
20temporary directory upon execution of the command specified in the .isolated
21file. All content written to this directory will be uploaded upon termination
22and the .isolated file describing this directory will be printed to stdout.
bpastene447c1992016-06-20 15:21:47 -070023
24Any ${SWARMING_BOT_FILE} on the command line will be replaced by the value of
25the --bot-file parameter. This file is used by a swarming bot to communicate
26state of the host to tasks. It is written to by the swarming bot's
27on_before_task() hook in the swarming server's custom bot_config.py.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000028"""
29
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +000030__version__ = '0.11.0'
maruel@chromium.orgdedbf492013-09-12 20:42:11 +000031
aludwin7556e0c2016-10-26 08:46:10 -070032import argparse
maruel064c0a32016-04-05 11:47:15 -070033import base64
iannucci96fcccc2016-08-30 15:52:22 -070034import collections
vadimsh232f5a82017-01-20 19:23:44 -080035import contextlib
Sadaf Matinkhoo10743a62018-03-29 16:28:58 -040036import errno
aludwin7556e0c2016-10-26 08:46:10 -070037import json
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000038import logging
39import optparse
40import os
Marc-Antoine Ruel8b11dbd2018-05-18 14:31:22 -040041import re
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000042import sys
43import tempfile
maruel064c0a32016-04-05 11:47:15 -070044import time
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000045
vadimsh@chromium.orga4326472013-08-24 02:05:41 +000046from third_party.depot_tools import fix_encoding
47
Vadim Shtayura6b555c12014-07-23 16:22:18 -070048from utils import file_path
maruel12e30012015-10-09 11:55:35 -070049from utils import fs
maruel064c0a32016-04-05 11:47:15 -070050from utils import large
Marc-Antoine Ruelf74cffe2015-07-15 15:21:34 -040051from utils import logging_utils
Marc-Antoine Ruelcfb60852014-07-02 15:22:00 -040052from utils import on_error
Marc-Antoine Ruelc44f5722015-01-08 16:10:01 -050053from utils import subprocess42
vadimsh@chromium.orga4326472013-08-24 02:05:41 +000054from utils import tools
vadimsh@chromium.org3e97deb2013-08-24 00:56:44 +000055from utils import zip_package
vadimsh@chromium.org8b9d56b2013-08-21 22:24:35 +000056
vadimsh9c54b2c2017-07-25 14:08:29 -070057from libs import luci_context
58
Vadim Shtayurae34e13a2014-02-02 11:23:26 -080059import auth
nodirbe642ff2016-06-09 15:51:51 -070060import cipd
maruel@chromium.orgdedbf492013-09-12 20:42:11 +000061import isolateserver
Marc-Antoine Ruel8b11dbd2018-05-18 14:31:22 -040062import local_caching
maruel@chromium.orgdedbf492013-09-12 20:42:11 +000063
vadimsh@chromium.orga4326472013-08-24 02:05:41 +000064
# Absolute path to this file (can be None if running from zip on Mac).
#
# A byte string __file__ (always the case on Python 2) is decoded with the
# filesystem encoding so the resulting path is unicode; a text __file__ is
# used as-is.
THIS_FILE_PATH = os.path.abspath(
    __file__.decode(sys.getfilesystemencoding())
    if isinstance(__file__, bytes) else __file__) if __file__ else None

# Directory that contains this file (might be inside zip package).
#
# Derived from THIS_FILE_PATH rather than from __file__ again, so that it is
# None exactly when THIS_FILE_PATH is None instead of raising when __file__ is
# not set.
BASE_DIR = os.path.dirname(THIS_FILE_PATH) if THIS_FILE_PATH else None
vadimsh@chromium.org8b9d56b2013-08-21 22:24:35 +000072
# Directory that contains the currently running script file.
#
# No main script path is available when 'import run_isolated' is executed at
# the python interactive prompt (__file__ is undefined in that case), so
# MAIN_DIR is None there.
MAIN_DIR = (
    os.path.dirname(os.path.abspath(zip_package.get_main_script_path()))
    if zip_package.get_main_script_path() else None)
vadimsh@chromium.org8b9d56b2013-08-21 22:24:35 +000081
maruele2f2cb82016-07-13 14:41:03 -070082
# Magic variables that can be found in the isolate task command line.
# process_command() substitutes them in each argument:
# - ${ISOLATED_OUTDIR} is replaced by the output directory,
# - ${EXECUTABLE_SUFFIX} is replaced by cipd.EXECUTABLE_SUFFIX,
# - ${SWARMING_BOT_FILE} is replaced by the bot file path when one is given.
ISOLATED_OUTDIR_PARAMETER = '${ISOLATED_OUTDIR}'
EXECUTABLE_SUFFIX_PARAMETER = '${EXECUTABLE_SUFFIX}'
SWARMING_BOT_FILE_PARAMETER = '${SWARMING_BOT_FILE}'


# The name of the log file to use.
RUN_ISOLATED_LOG_FILE = 'run_isolated.log'


# The name of the log to use for the run_test_cases.py command
RUN_TEST_CASES_LOG = 'run_test_cases.log'


# Use short names for temporary directories. This is driven by Windows, which
# imposes a relatively short maximum path length of 260 characters, often
# referred to as MAX_PATH. It is relatively easy to create files with longer
# path length. A use case is with recursive dependency trees, like npm
# packages.
#
# It is recommended to start the script with a `root_dir` as short as
# possible.
# - ir stands for isolated_run
# - io stands for isolated_out
# - it stands for isolated_tmp
ISOLATED_RUN_DIR = u'ir'
ISOLATED_OUT_DIR = u'io'
ISOLATED_TMP_DIR = u'it'


# Keep synced with task_request.py
# Accepts 1 to 4096 characters, each a lowercase ASCII letter, a digit or an
# underscore.
CACHE_NAME_RE = re.compile(ur'^[a-z0-9_]{1,4096}$')
114
115
marueld928c862017-06-08 08:20:04 -0700116OUTLIVING_ZOMBIE_MSG = """\
117*** Swarming tried multiple times to delete the %s directory and failed ***
118*** Hard failing the task ***
119
120Swarming detected that your testing script ran an executable, which may have
121started a child executable, and the main script returned early, leaving the
122children executables playing around unguided.
123
124You don't want to leave children processes outliving the task on the Swarming
125bot, do you? The Swarming bot doesn't.
126
127How to fix?
128- For any process that starts children processes, make sure all children
129 processes terminated properly before each parent process exits. This is
130 especially important in very deep process trees.
131 - This must be done properly both in normal successful task and in case of
132 task failure. Cleanup is very important.
133- The Swarming bot sends a SIGTERM in case of timeout.
134 - You have %s seconds to comply after the signal was sent to the process
135 before the process is forcibly killed.
136- To achieve not leaking children processes in case of signals on timeout, you
137 MUST handle signals in each executable / python script and propagate them to
138 children processes.
139 - When your test script (python or binary) receives a signal like SIGTERM or
140 CTRL_BREAK_EVENT on Windows), send it to all children processes and wait for
141 them to terminate before quitting.
142
143See
Marc-Antoine Ruelc7243592018-05-24 17:04:04 -0400144https://chromium.googlesource.com/infra/luci/luci-py.git/+/master/appengine/swarming/doc/Bot.md#Graceful-termination_aka-the-SIGTERM-and-SIGKILL-dance
marueld928c862017-06-08 08:20:04 -0700145for more information.
146
147*** May the SIGKILL force be with you ***
148"""
149
150
# Currently hardcoded. Eventually could be exposed as a flag once there's value.
# 3 weeks, expressed in seconds (21 days * 24 hours * 60 minutes * 60 seconds).
MAX_AGE_SECS = 21*24*60*60
154
155
# Immutable bundle of everything needed to run one task; an instance is what
# map_and_run() receives as |data|. Each field is described right above its
# name.
TaskData = collections.namedtuple(
    'TaskData', (
        # Command line to use, as a list of strings. It is independent of
        # what was specified in the isolated file.
        'command',
        # Directory, relative, in which the command is started.
        'relative_cwd',
        # Arguments (list of strings) appended to the command specified in
        # the isolated file.
        'extra_args',
        # Hash of the .isolated file to retrieve in order to recreate the
        # tree of files needed to run the target executable. The command
        # specified in the .isolated is executed. Mutually exclusive with
        # the command argument.
        'isolated_hash',
        # isolateserver.Storage instance used to retrieve remote objects. It
        # holds a reference to an isolateserver.StorageApi, which does the
        # actual I/O.
        'storage',
        # isolateserver.LocalCache instance that caches retrieved objects so
        # the same objects are not fetched constantly. Can be on-disk or
        # in-memory.
        'isolate_cache',
        # Paths, relative to root_dir, to put into the output isolated bundle
        # upon task completion (see link_outputs_to_outdir).
        'outputs',
        # Function (run_dir) => context manager that installs named caches
        # into |run_dir|.
        'install_named_caches',
        # When True, the temporary directory is deliberately leaked for
        # later examination.
        'leak_temp_dir',
        # Directory in which the temporary directory is created. When not
        # specified, a random temporary directory is created.
        'root_dir',
        # The process is killed if it lasts more than this number of
        # seconds.
        'hard_timeout',
        # Number of seconds to wait between SIGTERM and SIGKILL.
        'grace_period',
        # Path to a file with bot state, used in place of the
        # ${SWARMING_BOT_FILE} task command line argument.
        'bot_file',
        # Logical account to switch LUCI_CONTEXT into.
        'switch_to_account',
        # Context manager dir => CipdInfo, see install_client_and_packages.
        'install_packages_fn',
        # Create the tree with symlinks instead of hardlinks.
        'use_symlinks',
        # Environment variables to set.
        'env',
        # Environment variables to mutate with relative directories.
        # Example: {"ENV_KEY": ['relative', 'paths', 'to', 'prepend']}
        'env_prefix',
    ))
208
209
def get_as_zip_package(executable=True):
  """Builds a ZipPackage holding this module and all its dependencies.

  When |executable| is True, run_isolated.py is stored as __main__.py so that
  the zip package is directly executable by python.
  """
  # Building a zip package when running from another zip package is
  # unsupported and probably unneeded.
  assert not zip_package.is_zipped_module(sys.modules[__name__])
  assert THIS_FILE_PATH
  assert BASE_DIR
  main_name = '__main__.py' if executable else None
  pkg = zip_package.ZipPackage(root=BASE_DIR)
  pkg.add_python_file(THIS_FILE_PATH, main_name)
  # Sibling modules, added in the same order as before.
  for module_file in (
      'isolate_storage.py',
      'isolated_format.py',
      'isolateserver.py',
      'auth.py',
      'cipd.py',
      'local_caching.py'):
    pkg.add_python_file(os.path.join(BASE_DIR, module_file))
  # Whole directories of supporting code.
  for subdir in ('libs', 'third_party', 'utils'):
    pkg.add_directory(os.path.join(BASE_DIR, subdir))
  return pkg
233
234
Marc-Antoine Ruelee6ca622017-11-29 11:19:16 -0500235def _to_str(s):
236 """Downgrades a unicode instance to str. Pass str through as-is."""
237 if isinstance(s, str):
238 return s
239 # This is technically incorrect, especially on Windows. In theory
240 # sys.getfilesystemencoding() should be used to use the right 'ANSI code
241 # page' on Windows, but that causes other problems, as the character set
242 # is very limited.
243 return s.encode('utf-8')
244
245
Marc-Antoine Ruel7a68f712017-12-01 18:45:18 -0500246def _to_unicode(s):
247 """Upgrades a str instance to unicode. Pass unicode through as-is."""
248 if isinstance(s, unicode) or s is None:
249 return s
250 return s.decode('utf-8')
251
252
def make_temp_dir(prefix, root_dir):
  """Returns a new unique temporary directory, as a unicode path.

  Arguments:
  - prefix: prefix of the name of the directory to create.
  - root_dir: directory to create the temporary directory in; passed as-is to
    tempfile.mkdtemp() as |dir|.
  """
  path = tempfile.mkdtemp(prefix=prefix, dir=root_dir)
  if isinstance(path, bytes):
    # A byte string path must be decoded with the filesystem encoding. A plain
    # unicode(path) uses the ASCII codec and raises UnicodeDecodeError as soon
    # as the temporary root contains a non-ASCII character.
    path = path.decode(sys.getfilesystemencoding() or 'utf-8')
  return path
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +0000256
257
def change_tree_read_only(rootdir, read_only):
  """Applies the read-only policy |read_only| to the tree at |rootdir|.

  |read_only| is one of 0 (or None), 1 or 2 and controls whether files can be
  modified and whether files can be created or deleted.

  Raises:
    ValueError if |read_only| is none of the supported values.
  """
  if read_only not in (0, 1, 2, None):
    raise ValueError(
        'change_tree_read_only(%s, %s): Unknown flag %s' %
        (rootdir, read_only, read_only))

  if read_only == 2:
    # Files and directories (except on Windows) are marked read only. This
    # inhibits modifying, creating or deleting files in the test directory,
    # except on Windows where creating and deleting files is still possible.
    file_path.make_tree_read_only(rootdir)
    return

  if read_only == 1:
    # Files are marked read only but not the directories. This inhibits
    # modifying files but creating or deleting files is still possible.
    file_path.make_tree_files_read_only(rootdir)
    return

  # read_only is 0 or None: anything can be modified.
  # TODO(maruel): This is currently dangerous as long as
  # DiskContentAddressedCache.touch() is not yet changed to verify the hash of
  # the content of the files it is looking at, so that if a test modifies an
  # input file, the file must be deleted.
  file_path.make_tree_writeable(rootdir)
284
285
@contextlib.contextmanager
def set_luci_context_account(account, tmp_dir):
  """Context manager that makes |account| the default LUCI_CONTEXT account.

  Nothing is changed in any of these cases:
  - 'account' is None or ''. This happens when run_isolated.py is called
    without '--switch-to-account' flag. If run_isolated.py is running in some
    LUCI_CONTEXT environment, the task then just inherits whatever account is
    already set. This may happen if users invoke run_isolated.py explicitly
    from their code.
  - LUCI_CONTEXT-based auth is not used.
  - The requested account is already the default one.

  If the requested account is not defined in the context, switches to
  non-authenticated access. This happens for Swarming tasks that don't use
  'task' service accounts.
  """
  # The context is only read when a switch was actually requested.
  local_auth = luci_context.read('local_auth') if account else None

  # See LUCI_CONTEXT.md for the format of 'local_auth'.
  if not local_auth or local_auth.get('default_account_id') == account:
    # Not switching, not using LUCI_CONTEXT auth at all, or already set.
    yield
    return

  known_ids = set(a['id'] for a in local_auth.get('accounts') or [])
  if account not in known_ids:
    logging.warning(
        'Requested LUCI_CONTEXT account %r is not available (have only %r), '
        'disabling authentication', account, sorted(known_ids))
    local_auth.pop('default_account_id', None)
  else:
    logging.info('Switching default LUCI_CONTEXT account to %r', account)
    local_auth['default_account_id'] = account

  with luci_context.write(_tmpdir=tmp_dir, local_auth=local_auth):
    yield
332
333
def process_command(command, out_dir, bot_file):
  """Returns a copy of |command| with the magic variables substituted.

  Arguments:
  - command: list of command line arguments.
  - out_dir: value substituted for ${ISOLATED_OUTDIR}.
  - bot_file: value substituted for ${SWARMING_BOT_FILE}; when it is not
    provided, the variable is left unchanged and a warning is logged.

  Raises:
    ValueError if a parameter is requested in |command| but its value is not
    provided.
  """
  processed = []
  for arg in command:
    arg = arg.replace(EXECUTABLE_SUFFIX_PARAMETER, cipd.EXECUTABLE_SUFFIX)
    path_substituted = False

    if ISOLATED_OUTDIR_PARAMETER in arg:
      if not out_dir:
        raise ValueError(
            'output directory is requested in command, but not provided; '
            'please specify one')
      arg = arg.replace(ISOLATED_OUTDIR_PARAMETER, out_dir)
      path_substituted = True

    if SWARMING_BOT_FILE_PARAMETER in arg:
      if not bot_file:
        logging.warning('SWARMING_BOT_FILE_PARAMETER found in command, but no '
                        'bot_file specified. Leaving parameter unchanged.')
      else:
        arg = arg.replace(SWARMING_BOT_FILE_PARAMETER, bot_file)
        path_substituted = True

    if path_substituted:
      # Slashes are converted only when a path parameter was present, because
      # of arguments like '${ISOLATED_OUTDIR}/foo/bar'.
      arg = arg.replace('/', os.sep)
    processed.append(arg)
  return processed
365
366
def get_command_env(tmp_dir, cipd_info, run_dir, env, env_prefixes):
  """Returns full OS environment to run a command in.

  Starts from a copy of os.environ, applies |env|, puts directory with cipd
  binary in front of PATH, exposes CIPD_CACHE_DIR env var, installs all
  env_prefixes and sets up the temporary directory variables.

  Args:
    tmp_dir: temp directory.
    cipd_info: CipdInfo object if cipd client is used, None if not.
    run_dir: The root directory the isolated tree is mapped in.
    env: environment variables to use; a key mapped to an empty value is
        removed from the returned environment.
    env_prefixes: {"ENV_KEY": ['cwd', 'relative', 'paths', 'to', 'prepend']}

  Returns:
    dict mapping environment variable names to values.
  """
  out = os.environ.copy()
  for k, v in env.iteritems():
    if not v:
      out.pop(k, None)
    else:
      out[k] = v

  if cipd_info:
    bin_dir = _to_str(os.path.dirname(cipd_info.client.binary_path))
    # PATH may be missing, e.g. when |env| just removed it with an empty
    # value. Indexing out['PATH'] would raise KeyError in that case.
    cur_path = out.get('PATH')
    if cur_path is None:
      out['PATH'] = bin_dir
    else:
      out['PATH'] = '%s%s%s' % (bin_dir, os.pathsep, cur_path)
    out['CIPD_CACHE_DIR'] = _to_str(cipd_info.cache_dir)

  for key, paths in env_prefixes.iteritems():
    assert isinstance(paths, list), paths
    # Prefixes are relative to run_dir; the current value, if any, goes last.
    paths = [os.path.normpath(os.path.join(run_dir, p)) for p in paths]
    cur = out.get(key)
    if cur:
      paths.append(cur)
    out[key] = _to_str(os.path.pathsep.join(paths))

  tmp_dir = _to_str(tmp_dir)
  # pylint: disable=line-too-long
  # * python respects $TMPDIR, $TEMP, and $TMP in this order, regardless of
  #   platform. So $TMPDIR must be set on all platforms.
  #   https://github.com/python/cpython/blob/2.7/Lib/tempfile.py#L155
  out['TMPDIR'] = tmp_dir
  if sys.platform == 'win32':
    # * chromium's base utils uses GetTempPath().
    #   https://cs.chromium.org/chromium/src/base/files/file_util_win.cc?q=GetTempPath
    # * Go uses GetTempPath().
    # * GetTempDir() uses %TMP%, then %TEMP%, then other stuff. So %TMP% must be
    #   set.
    #   https://docs.microsoft.com/en-us/windows/desktop/api/fileapi/nf-fileapi-gettemppathw
    out['TMP'] = tmp_dir
    # https://blogs.msdn.microsoft.com/oldnewthing/20150417-00/?p=44213
    out['TEMP'] = tmp_dir
  elif sys.platform == 'darwin':
    # * Chromium uses an hack on macOS before calling into
    #   NSTemporaryDirectory().
    #   https://cs.chromium.org/chromium/src/base/files/file_util_mac.mm?q=GetTempDir
    #   https://developer.apple.com/documentation/foundation/1409211-nstemporarydirectory
    out['MAC_CHROMIUM_TMPDIR'] = tmp_dir
  else:
    # TMPDIR is specified as the POSIX standard envvar for the temp directory.
    # http://pubs.opengroup.org/onlinepubs/9699919799/basedefs/V1_chap08.html
    # * mktemp on linux respects $TMPDIR.
    # * Chromium respects $TMPDIR on linux.
    #   https://cs.chromium.org/chromium/src/base/files/file_util_posix.cc?q=GetTempDir
    # * Go uses $TMPDIR.
    #   https://go.googlesource.com/go/+/go1.10.3/src/os/file_unix.go#307
    pass
  return out
vadimsh232f5a82017-01-20 19:23:44 -0800432
433
def run_command(command, cwd, env, hard_timeout, grace_period):
  """Runs the command.

  The process is started detached. When the hard timeout expires or a stop
  signal is received, the process is sent SIGTERM, then given the grace period
  to exit before being killed.

  Arguments:
  - command: command line to run, passed to subprocess42.Popen.
  - cwd: directory to start the command in.
  - env: environment to run the command with.
  - hard_timeout: seconds to wait for the process before terminating it; a
    falsy value is passed to wait() as None.
  - grace_period: seconds to wait after SIGTERM before killing the process; a
    falsy value is passed to wait() as None.

  Returns:
    tuple(process exit code, bool if had a hard timeout)
  """
  logging.info('run_command(%s, %s)', command, cwd)

  exit_code = None
  had_hard_timeout = False
  with tools.Profiler('RunTest'):
    proc = None
    # Non-empty once a stop signal was received; a list so that the nested
    # handler can mutate it.
    had_signal = []
    try:
      # TODO(maruel): This code is imperfect. It doesn't handle well signals
      # during the download phase and there's short windows were things can go
      # wrong.
      def handler(signum, _frame):
        if proc and not had_signal:
          logging.info('Received signal %d', signum)
          had_signal.append(True)
          # Reuse the timeout code path below to terminate the process.
          raise subprocess42.TimeoutExpired(command, None)

      proc = subprocess42.Popen(command, cwd=cwd, env=env, detached=True)
      with subprocess42.set_signal_handler(subprocess42.STOP_SIGNALS, handler):
        try:
          exit_code = proc.wait(hard_timeout or None)
        except subprocess42.TimeoutExpired:
          if not had_signal:
            logging.warning('Hard timeout')
            had_hard_timeout = True
          logging.warning('Sending SIGTERM')
          proc.terminate()

      # Ignore signals in grace period. Forcibly give the grace period to the
      # child process.
      if exit_code is None:
        ignore = lambda *_: None
        with subprocess42.set_signal_handler(subprocess42.STOP_SIGNALS, ignore):
          try:
            exit_code = proc.wait(grace_period or None)
          except subprocess42.TimeoutExpired:
            # Now kill for real. The user can distinguish between the
            # following states:
            # - signal but process exited within grace period,
            #   hard_timed_out will be set but the process exit code will be
            #   script provided.
            # - processed exited late, exit code will be -9 on posix.
            logging.warning('Grace exhausted; sending SIGKILL')
            proc.kill()
        logging.info('Waiting for process exit')
        exit_code = proc.wait()
    except OSError:
      # This is not considered to be an internal error. The executable simply
      # does not exist.
      sys.stderr.write(
          '<The executable does not exist or a dependent library is missing>\n'
          '<Check for missing .so/.dll in the .isolate or GN file>\n'
          '<Command: %s>\n' % command)
      if os.environ.get('SWARMING_TASK_ID'):
        # Give an additional hint when running as a swarming task.
        sys.stderr.write(
            '<See the task\'s page for commands to help diagnose this issue '
            'by reproducing the task locally>\n')
      exit_code = 1
  logging.info(
      'Command finished with exit code %d (%s)',
      exit_code, hex(0xffffffff & exit_code))
  return exit_code, had_hard_timeout
maruela9cfd6f2015-09-15 11:03:15 -0700503
504
def fetch_and_map(isolated_hash, storage, cache, outdir, use_symlinks):
  """Fetches an isolated tree into |outdir| and returns (bundle, stats).

  stats is a dict with the fetch duration in seconds and the base64-encoded
  large.pack() of the sorted cold items (cache.added) and hot items
  (cache.used minus cache.added).
  """
  started = time.time()
  bundle = isolateserver.fetch_isolated(
      isolated_hash=isolated_hash,
      storage=storage,
      cache=cache,
      outdir=outdir,
      use_symlinks=use_symlinks)
  elapsed = time.time() - started
  cold_items = sorted(cache.added)
  hot_items = sorted(set(cache.used) - set(cache.added))
  stats = {
    'duration': elapsed,
    'items_cold': base64.b64encode(large.pack(cold_items)),
    'items_hot': base64.b64encode(large.pack(hot_items)),
  }
  return bundle, stats
520
521
def link_outputs_to_outdir(run_dir, out_dir, outputs):
  """Copies each named output from run_dir into out_dir so it can be uploaded.

  Does nothing when |outputs| is empty. Each entry of |outputs| is a path
  relative to both run_dir and out_dir. An OSError raised while copying an
  entry is logged by copy_recursively() rather than propagated.
  """
  if outputs:
    isolateserver.create_directories(out_dir, outputs)
    for rel_path in outputs:
      source = os.path.join(run_dir, rel_path)
      destination = os.path.join(out_dir, rel_path)
      copy_recursively(source, destination)
532
533
def copy_recursively(src, dst):
  """Efficiently copies a file or directory from src to dst.

  `src` may be a file, directory, or a symlink to a file or directory.
  All symlinks are replaced with their targets, so the resulting
  directory structure in dst will never have any symlinks.

  To increase speed, copy_recursively hardlinks individual files into the
  (newly created) directory structure if possible, unlike Python's
  shutil.copytree().

  A chain of more than 40 symlinks, which includes symlinks pointing at each
  other, is considered unresolvable: a warning is logged and the entry is
  skipped. An OSError raised while copying is logged, not propagated.
  """
  # Upper bound on the number of symlinks followed for one entry, so that
  # cyclic symlinks (a -> b, b -> a) cannot loop forever.
  max_symlink_hops = 40
  orig_src = src
  try:
    # Replace symlinks with their final target.
    hops = 0
    while fs.islink(src):
      hops += 1
      if hops > max_symlink_hops:
        logging.warning(
            'Too many levels of symbolic links while resolving %s; skipping',
            orig_src)
        return
      res = fs.readlink(src)
      src = os.path.join(os.path.dirname(src), res)

    # Note that fs.isfile (which is a wrapper around os.path.isfile) throws
    # an exception if src does not exist. A warning will be logged in that case.
    if fs.isfile(src):
      file_path.link_file(dst, src, file_path.HARDLINK_WITH_FALLBACK)
      return

    if not fs.exists(dst):
      os.makedirs(dst)

    for child in fs.listdir(src):
      copy_recursively(os.path.join(src, child), os.path.join(dst, child))

  except OSError as e:
    if e.errno == errno.ENOENT:
      logging.warning('Path %s does not exist or %s is a broken symlink',
                      src, orig_src)
    else:
      logging.info("Couldn't collect output file %s: %s", src, e)
aludwin0a8e17d2016-10-27 15:57:39 -0700571
572
def delete_and_upload(storage, out_dir, leak_temp_dir):
  """Archives the content of out_dir, then deletes out_dir.

  out_dir is archived only when it is a directory that contains at least one
  entry. It is deleted afterwards unless |leak_temp_dir| is set.

  Returns:
    tuple(outputs_ref, success, stats)
    - outputs_ref: a dict referring to the results archived back to the isolated
      server, if applicable.
    - success: False if something occurred that means that the task must
      forcibly be considered a failure, e.g. zombie processes were left
      behind.
    - stats: uploading stats.
  """
  outputs_ref = None
  cold_sizes = []
  hot_sizes = []
  started = time.time()

  # Upload out_dir and generate a .isolated file out of this directory. It is
  # only done if files were written in the directory.
  if fs.isdir(out_dir) and fs.listdir(out_dir):
    with tools.Profiler('ArchiveOutput'):
      try:
        results, f_cold, f_hot = isolateserver.archive_files_to_storage(
            storage, [out_dir], None)
        isolated_id = results[0][0]
        outputs_ref = {
          'isolated': isolated_id,
          'isolatedserver': storage.location,
          'namespace': storage.namespace,
        }
        cold_sizes = sorted(i.size for i in f_cold)
        hot_sizes = sorted(i.size for i in f_hot)
      except isolateserver.Aborted:
        # This happens when a signal SIGTERM was received while uploading data.
        # There is 2 causes:
        # - The task was too slow and was about to be killed anyway due to
        #   exceeding the hard timeout.
        # - The amount of data uploaded back is very large and took too much
        #   time to archive.
        sys.stderr.write('Received SIGTERM while uploading')
        # Re-raise, so it will be treated as an internal failure.
        raise

  success = False
  try:
    # Success means nothing had to be removed (leaking was requested or
    # out_dir is not a directory) or the removal itself worked.
    if leak_temp_dir or not fs.isdir(out_dir) or file_path.rmtree(out_dir):
      success = True
    else:
      logging.error('Had difficulties removing out_dir %s', out_dir)
  except OSError as e:
    # When this happens, it means there's a process error.
    logging.exception('Had difficulties removing out_dir %s: %s', out_dir, e)

  return outputs_ref, success, {
    'duration': time.time() - started,
    'items_cold': base64.b64encode(large.pack(cold_sizes)),
    'items_hot': base64.b64encode(large.pack(hot_sizes)),
  }
maruela9cfd6f2015-09-15 11:03:15 -0700631
632
def _is_path_within(path, root):
  """Returns True if |path| is |root| itself or is located underneath it.

  The comparison is done on whole path components. A plain string prefix test
  is not sufficient: '/b/run_evil' starts with '/b/run' yet it is a sibling of
  that directory, not a descendant.
  """
  if path == root:
    return True
  root = os.path.normpath(root)
  return path == root or path.startswith(root.rstrip(os.sep) + os.sep)


def map_and_run(data, constant_run_path):
  """Runs a command with optional isolated input/output.

  Arguments:
  - data: TaskData instance.
  - constant_run_path: if true and a root directory is known, the command is
        run from the fixed directory <root_dir>/ISOLATED_RUN_DIR, which is
        deleted and recreated first. Otherwise a fresh temporary run directory
        is created.

  Returns metadata about the result, as a dict. 'internal_failure' is None
  only when the command was actually run; 'exit_code' is forced to 1 when no
  command is available, when the working directory escapes the run directory
  or when the temporary directories could not be cleaned up.
  """
  result = {
    'duration': None,
    'exit_code': None,
    'had_hard_timeout': False,
    # Pessimistic default; reset to None once the command has been run.
    'internal_failure': 'run_isolated did not complete properly',
    'stats': {
      'isolated': {
        #'cipd': {
        #  'duration': 0.,
        #  'get_client_duration': 0.,
        #},
        'download': {
          #'duration': 0.,
          'initial_number_items': len(data.isolate_cache),
          'initial_size': data.isolate_cache.total_size,
          #'items_cold': '<large.pack()>',
          #'items_hot': '<large.pack()>',
        },
        #'upload': {
        #  'duration': 0.,
        #  'items_cold': '<large.pack()>',
        #  'items_hot': '<large.pack()>',
        #},
      },
    },
    #'cipd_pins': {
    #  'packages': [
    #    {'package_name': ..., 'version': ..., 'path': ...},
    #    ...
    #  ],
    #  'client_package': {'package_name': ..., 'version': ...},
    #},
    'outputs_ref': None,
    'version': 5,
  }

  if data.root_dir:
    file_path.ensure_tree(data.root_dir, 0o700)
  elif data.isolate_cache.cache_dir:
    # Default the root directory to the parent of the isolate cache.
    data = data._replace(
        root_dir=os.path.dirname(data.isolate_cache.cache_dir))
  # See comment for these constants.
  # If root_dir is not specified, it is not constant.
  # TODO(maruel): This is not obvious. Change this to become an error once we
  # make the constant_run_path an exposed flag.
  if constant_run_path and data.root_dir:
    run_dir = os.path.join(data.root_dir, ISOLATED_RUN_DIR)
    if os.path.isdir(run_dir):
      file_path.rmtree(run_dir)
    os.mkdir(run_dir, 0o700)
  else:
    run_dir = make_temp_dir(ISOLATED_RUN_DIR, data.root_dir)
  # storage should be normally set but don't crash if it is not. This can happen
  # as Swarming task can run without an isolate server.
  out_dir = make_temp_dir(
      ISOLATED_OUT_DIR, data.root_dir) if data.storage else None
  tmp_dir = make_temp_dir(ISOLATED_TMP_DIR, data.root_dir)
  cwd = run_dir
  if data.relative_cwd:
    cwd = os.path.normpath(os.path.join(cwd, data.relative_cwd))
  command = data.command
  try:
    with data.install_packages_fn(run_dir) as cipd_info:
      if cipd_info:
        result['stats']['cipd'] = cipd_info.stats
        result['cipd_pins'] = cipd_info.pins

      if data.isolated_hash:
        isolated_stats = result['stats'].setdefault('isolated', {})
        bundle, stats = fetch_and_map(
            isolated_hash=data.isolated_hash,
            storage=data.storage,
            cache=data.isolate_cache,
            outdir=run_dir,
            use_symlinks=data.use_symlinks)
        isolated_stats['download'].update(stats)
        change_tree_read_only(run_dir, bundle.read_only)
        # Inject the command
        if not command and bundle.command:
          command = bundle.command + data.extra_args
          # Only set the relative directory if the isolated file specified a
          # command, and no raw command was specified.
          if bundle.relative_cwd:
            cwd = os.path.normpath(os.path.join(cwd, bundle.relative_cwd))

      if not command:
        # Handle this as a task failure, not an internal failure.
        sys.stderr.write(
            '<No command was specified!>\n'
            '<Please secify a command when triggering your Swarming task>\n')
        result['exit_code'] = 1
        return result

      if not _is_path_within(cwd, run_dir):
        # Handle this as a task failure, not an internal failure. This is a
        # 'last chance' way to gate against directory escape. The check is
        # done per path component so that a sibling directory whose name
        # merely starts with the run directory name is rejected too.
        sys.stderr.write('<Relative CWD is outside of run directory!>\n')
        result['exit_code'] = 1
        return result

      if not os.path.isdir(cwd):
        # Accepts relative_cwd that does not exist.
        os.makedirs(cwd, 0o700)

      # If we have an explicit list of files to return, make sure their
      # directories exist now.
      if data.storage and data.outputs:
        isolateserver.create_directories(run_dir, data.outputs)

      with data.install_named_caches(run_dir):
        sys.stdout.flush()
        start = time.time()
        try:
          # Need to switch the default account before 'get_command_env' call,
          # so it can grab correct value of LUCI_CONTEXT env var.
          with set_luci_context_account(data.switch_to_account, tmp_dir):
            env = get_command_env(
                tmp_dir, cipd_info, run_dir, data.env, data.env_prefix)
            command = tools.fix_python_cmd(command, env)
            command = process_command(command, out_dir, data.bot_file)
            file_path.ensure_command_has_abs_path(command, cwd)

            result['exit_code'], result['had_hard_timeout'] = run_command(
                command, cwd, env, data.hard_timeout, data.grace_period)
        finally:
          # Clamp at 0 so a clock going backward never reports a negative
          # duration.
          result['duration'] = max(time.time() - start, 0)

    # We successfully ran the command, set internal_failure back to
    # None (even if the command failed, it's not an internal error).
    result['internal_failure'] = None
  except Exception as e:
    # An internal error occurred. Report accordingly so the swarming task will
    # be retried automatically.
    logging.exception('internal failure: %s', e)
    result['internal_failure'] = str(e)
    on_error.report(None)

  # Clean up
  finally:
    try:
      # Try to link files to the output directory, if specified.
      if out_dir:
        link_outputs_to_outdir(run_dir, out_dir, data.outputs)

      success = False
      if data.leak_temp_dir:
        success = True
        logging.warning(
            'Deliberately leaking %s for later examination', run_dir)
      else:
        # On Windows the rmtree(run_dir) call below has a synchronization
        # effect: it finishes only when all task child processes terminate
        # (since a running process locks *.exe file). Examine out_dir only
        # after that call completes (since child processes may write to
        # out_dir too and we need to wait for them to finish).
        if fs.isdir(run_dir):
          try:
            success = file_path.rmtree(run_dir)
          except OSError as e:
            logging.error('rmtree(%r) failed: %s', run_dir, e)
            success = False
          if not success:
            sys.stderr.write(OUTLIVING_ZOMBIE_MSG % ('run', data.grace_period))
            if result['exit_code'] == 0:
              result['exit_code'] = 1
        if fs.isdir(tmp_dir):
          try:
            success = file_path.rmtree(tmp_dir)
          except OSError as e:
            logging.error('rmtree(%r) failed: %s', tmp_dir, e)
            success = False
          if not success:
            sys.stderr.write(OUTLIVING_ZOMBIE_MSG % ('temp', data.grace_period))
            if result['exit_code'] == 0:
              result['exit_code'] = 1

      # This deletes out_dir if leak_temp_dir is not set.
      if out_dir:
        isolated_stats = result['stats'].setdefault('isolated', {})
        result['outputs_ref'], success, isolated_stats['upload'] = (
            delete_and_upload(data.storage, out_dir, data.leak_temp_dir))
      if not success and result['exit_code'] == 0:
        result['exit_code'] = 1
    except Exception as e:
      # Swallow any exception in the main finally clause.
      if out_dir:
        logging.exception('Leaking out_dir %s: %s', out_dir, e)
      result['internal_failure'] = str(e)
  return result
Marc-Antoine Ruel2283ad12014-02-09 11:14:57 -0500831
832
def run_tha_test(data, result_json):
  """Runs an executable and records execution metadata.

  When data.isolated_hash is set, the dependencies are fetched into the cache
  and mapped into a temporary directory, then the command found in the
  .isolated is run. Files written to the temporary output directory are
  uploaded back to the storage as a .isolated file.

  Arguments:
  - data: TaskData instance.
  - result_json: File path to dump result metadata into. If set, the process
        exit code is always 0 unless an internal error occurred.

  Returns:
    Process exit code that should be used.
  """
  if result_json:
    # Leave a pessimistic result on disk right away, so that something
    # meaningful is there if this process gets killed before the end.
    placeholder = {
      'exit_code': None,
      'had_hard_timeout': False,
      'internal_failure': 'Was terminated before completion',
      'outputs_ref': None,
      'version': 5,
    }
    tools.write_json(result_json, placeholder, dense=True)

  # The exit code of run_isolated itself depends on whether result_json is
  # used or not.
  result = map_and_run(data, True)
  logging.info('Result:\n%s', tools.format_json(result, dense=True))

  if not result_json:
    # Marshall into old-style inline output.
    outputs_ref = result['outputs_ref']
    if outputs_ref:
      legacy = {
        'hash': outputs_ref['isolated'],
        'namespace': outputs_ref['namespace'],
        'storage': outputs_ref['isolatedserver'],
      }
      sys.stdout.flush()
      print(
          '[run_isolated_out_hack]%s[/run_isolated_out_hack]' %
          tools.format_json(legacy, dense=True))
      sys.stdout.flush()
    return result['exit_code'] or int(bool(result['internal_failure']))

  # Some tests were found to delete 'work' when quitting, which made the write
  # below raise. Recreate the directory if necessary.
  file_path.ensure_tree(os.path.dirname(result_json))
  tools.write_json(result_json, result, dense=True)
  # Only return 1 if there was an internal error.
  return int(bool(result['internal_failure']))
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +0000888
889
# Value yielded by 'install_client_and_packages'. Fields, in order:
# - client: cipd.CipdClient object.
# - cache_dir: absolute path to bot-global cipd tag and instance cache.
# - stats: dict with stats to return to the server.
# - pins: dict with installed cipd pins to return to the server.
_CIPD_INFO_FIELDS = ['client', 'cache_dir', 'stats', 'pins']
CipdInfo = collections.namedtuple('CipdInfo', _CIPD_INFO_FIELDS)
897
898
@contextlib.contextmanager
def noop_install_packages(_run_dir):
  """Placeholder for 'install_client_and_packages' if cipd is disabled.

  Context manager that ignores its argument, installs nothing and yields None
  in place of a CipdInfo.
  """
  no_cipd_info = None
  yield no_cipd_info
903
904
def _install_packages(run_dir, cipd_cache_dir, client, packages, timeout):
  """Calls 'cipd ensure' for packages.

  Args:
    run_dir (str): root of installation.
    cipd_cache_dir (str): the directory to use for the cipd package cache.
    client (CipdClient): the cipd client to use
    packages: packages to install, list [(path, package_name, version), ...].
    timeout: max duration in seconds that this function can take.

  Returns: list of pinned packages, in the same order as |packages|. Looks
  like [
    {
      'path': 'subdirectory',
      'package_name': 'resolved/package/name',
      'version': 'deadbeef...',
    },
    ...
  ]
  """
  # Group the requests per installation subdirectory. The position of each
  # request in |packages| is kept along so that its pin can be stored at the
  # same index in the returned list.
  requests_by_subdir = collections.defaultdict(list)
  for index, (path, name, version) in enumerate(packages):
    # cipd deals with 'root' as ''
    subdir = '' if path == '.' else path
    requests_by_subdir[subdir].append((name, version, index))

  ensure_spec = {}
  for subdir, requests in requests_by_subdir.items():
    ensure_spec[subdir] = [(name, version) for name, version, _ in requests]

  resolved = client.ensure(
      run_dir, ensure_spec, cache_dir=cipd_cache_dir, timeout=timeout)

  package_pins = [None] * len(packages)
  for subdir, pin_list in sorted(resolved.items()):
    requests = requests_by_subdir[subdir]
    # Pins are matched to the requests of the same subdirectory by position.
    for position, (name, version) in enumerate(pin_list):
      original_index = requests[position][2]
      package_pins[original_index] = {
        'package_name': name,
        # swarming deals with 'root' as '.'
        'path': subdir or '.',
        'version': version,
      }

  # Every requested package must have been resolved to a pin.
  assert None not in package_pins, (packages, resolved, package_pins)
  return package_pins
958
959
@contextlib.contextmanager
def install_client_and_packages(
    run_dir, packages, service_url, client_package_name,
    client_version, cache_dir, timeout=None):
  """Bootstraps CIPD client and installs CIPD packages.

  Yields a single CipdInfo object holding the CipdClient, the stats, the
  client info and the pins.

  Pins and the CIPD client info are in the form of:
    [
      {
        "path": path, "package_name": package_name, "version": version,
      },
      ...
    ]
  (the CIPD client info is a single dictionary instead of a list)

  such that they correspond 1:1 to all input package arguments from the command
  line. These dictionaries make their way all the way back to swarming, where
  they become the arguments of CipdPackage.

  If 'packages' list is empty, will bootstrap CIPD client, but won't install
  any packages.

  The bootstrapped client (regardless whether 'packages' list is empty or not),
  will be made available to the task via $PATH.

  Args:
    run_dir (str): root of installation.
    packages: packages to install, list [(path, package_name, version), ...].
    service_url (str): CIPD server url, e.g.
      "https://chrome-infra-packages.appspot.com."
    client_package_name (str): CIPD package name of CIPD client.
    client_version (str): Version of CIPD client.
    cache_dir (str): where to keep cache of cipd clients, packages and tags.
    timeout: max duration in seconds that this function can take.
  """
  assert cache_dir

  # The same time budget is shared by the client bootstrap and the package
  # installation; each call returns the timeout to hand to the next step.
  remaining_timeout = tools.sliding_timeout(timeout)
  began = time.time()

  cache_dir = os.path.abspath(cache_dir)
  # Tag and instance caches live in a subdirectory of the client cache.
  cipd_cache_dir = os.path.join(cache_dir, 'cache')
  run_dir = os.path.abspath(run_dir)
  if not packages:
    packages = []

  client_began = time.time()
  with cipd.get_client(
      service_url, client_package_name, client_version, cache_dir,
      timeout=remaining_timeout()) as client:
    get_client_duration = time.time() - client_began

    if packages:
      package_pins = _install_packages(
          run_dir, cipd_cache_dir, client, packages, remaining_timeout())
    else:
      package_pins = []

    file_path.make_tree_files_read_only(run_dir)

    total_duration = time.time() - began
    logging.info(
        'Installing CIPD client and packages took %d seconds', total_duration)

    stats = {
      'duration': total_duration,
      'get_client_duration': get_client_duration,
    }
    pins = {
      'client_package': {
        'package_name': client.package_name,
        'version': client.instance_id,
      },
      'packages': package_pins,
    }
    yield CipdInfo(
        client=client, cache_dir=cipd_cache_dir, stats=stats, pins=pins)
nodirbe642ff2016-06-09 15:51:51 -07001040
1041
def create_option_parser():
  """Creates the parser for every command line option of run_isolated.

  Options are registered on a logging_utils.OptionParserWithLogging; the
  isolate server, cache, CIPD and authentication options are contributed by
  their respective modules.

  Returns:
    The configured parser; --cache and --cipd_cache default to 'cache' and
    'cipd_cache'.
  """
  parser = logging_utils.OptionParserWithLogging(
      usage='%prog <options> [command to run or extra args]',
      version=__version__,
      log_file=RUN_ISOLATED_LOG_FILE)

  # General options.
  parser.add_option(
      '--clean',
      action='store_true',
      help=(
          'Cleans the cache, trimming it necessary and remove corrupted items '
          'and returns without executing anything; use with -v to know what '
          'was done'))
  parser.add_option(
      '--use-symlinks',
      action='store_true',
      help='Use symlinks instead of hardlinks')
  parser.add_option(
      '--json',
      help=(
          'dump output metadata to json file. When used, run_isolated returns '
          'non-zero only on internal failure'))
  parser.add_option(
      '--hard-timeout',
      type='float',
      help='Enforce hard timeout in execution')
  parser.add_option(
      '--grace-period',
      type='float',
      help='Grace period between SIGTERM and SIGKILL')
  parser.add_option(
      '--raw-cmd',
      action='store_true',
      help=(
          'Ignore the isolated command, use the one supplied at the command '
          'line'))
  parser.add_option(
      '--relative-cwd',
      help=(
          "Ignore the isolated 'relative_cwd' and use this one instead; "
          'requires --raw-cmd'))
  parser.add_option(
      '--env',
      default=[],
      action='append',
      help='Environment variables to set for the child process')
  parser.add_option(
      '--env-prefix',
      default=[],
      action='append',
      help=(
          'Specify a VAR=./path/fragment to put in the environment variable '
          'before executing the command. The path fragment must be relative '
          'to the isolated run directory, and must not contain a `..` token. '
          'The path will be made absolute and prepended to the indicated '
          "$VAR using the OS's path separator. Multiple items for the same "
          '$VAR will be prepended in order.'))
  parser.add_option(
      '--bot-file',
      help=(
          'Path to a file describing the state of the host. The content is '
          'defined by on_before_task() in bot_config.'))
  parser.add_option(
      '--switch-to-account',
      help=(
          'If given, switches LUCI_CONTEXT to given logical service account '
          '(e.g. "task" or "system") before launching the isolated process.'))
  parser.add_option(
      '--output',
      action='append',
      help=(
          'Specifies an output to return. If no outputs are specified, all '
          'files located in $(ISOLATED_OUTDIR) will be returned; '
          'otherwise, outputs in both $(ISOLATED_OUTDIR) and those '
          'specified by --output option (there can be multiple) will be '
          'returned. Note that if a file in OUT_DIR has the same path '
          'as an --output option, the --output version will be returned.'))
  # --argsfile is really consumed by parse_args(); it is only declared here so
  # that it shows up in the help text.
  parser.add_option(
      '-a', '--argsfile',
      help=(
          'Specify a file containing a JSON array of arguments to this '
          'script. If --argsfile is provided, no other argument may be '
          'provided on the command line.'))

  # Where the inputs come from.
  source_group = optparse.OptionGroup(parser, 'Data source')
  source_group.add_option(
      '-s', '--isolated',
      help='Hash of the .isolated to grab from the isolate server.')
  isolateserver.add_isolate_server_options(source_group)
  parser.add_option_group(source_group)

  isolateserver.add_cache_options(parser)

  cipd.add_cipd_options(parser)

  named_cache_group = optparse.OptionGroup(parser, 'Named caches')
  named_cache_group.add_option(
      '--named-cache',
      dest='named_caches',
      action='append',
      nargs=3,
      default=[],
      help=(
          'A named cache to request. Accepts 3 arguments: name, path, hint. '
          'name identifies the cache, must match regex [a-z0-9_]{1,4096}. '
          'path is a path relative to the run dir where the cache directory '
          'must be put to. '
          'This option can be specified more than once.'))
  named_cache_group.add_option(
      '--named-cache-root',
      default='named_caches',
      help='Cache root directory. Default=%default')
  parser.add_option_group(named_cache_group)

  troubleshooting_group = optparse.OptionGroup(parser, 'Debugging')
  troubleshooting_group.add_option(
      '--leak-temp-dir',
      action='store_true',
      help=(
          "Deliberately leak isolate's temp dir for later examination. "
          'Default: %default'))
  troubleshooting_group.add_option(
      '--root-dir',
      help='Use a directory instead of a random one')
  parser.add_option_group(troubleshooting_group)

  auth.add_auth_options(parser)

  parser.set_defaults(cache='cache', cipd_cache='cipd_cache')
  return parser
1148
1149
def process_named_cache_options(parser, options, time_fn=None):
  """Validates named cache options and returns a CacheManager.

  Arguments:
  - parser: option parser; its error() method is called on invalid input.
  - options: parsed options; named_caches, named_cache_root and, when a cache
        is created, min_free_space are read.
  - time_fn: forwarded as is to local_caching.NamedCache.

  Returns:
    A local_caching.NamedCache rooted at the absolute path of
    options.named_cache_root, or None when no cache root is set.
  """
  requested = options.named_caches
  cache_root = options.named_cache_root
  if requested and not cache_root:
    parser.error('--named-cache is specified, but --named-cache-root is empty')

  for name, path, hint in requested:
    if not CACHE_NAME_RE.match(name):
      parser.error(
          'cache name %r does not match %r' % (name, CACHE_NAME_RE.pattern))
    if not path:
      parser.error('cache path cannot be empty')
    # The hint is only checked to be an integer here; its value is not kept.
    try:
      int(hint)
    except ValueError:
      parser.error('cache hint must be a number')

  if not cache_root:
    return None

  # Make these configurable later if there is use case but for now it's fairly
  # safe values.
  # In practice, a fair chunk of bots are already recycled on a daily schedule
  # so this code doesn't have any effect to them, unless they are preloaded
  # with a really old cache.
  one_tib = 1024*1024*1024*1024
  policies = local_caching.CachePolicies(
      max_cache_size=one_tib,
      min_free_space=options.min_free_space,
      max_items=50,
      max_age_secs=MAX_AGE_SECS)
  absolute_root = unicode(os.path.abspath(cache_root))
  return local_caching.NamedCache(absolute_root, policies, time_fn=time_fn)
1179
1180
def parse_args(args):
  """Parses the command line, optionally loading it from an --argsfile.

  When -a/--argsfile is given, it must be the only argument; the file is read
  as JSON and its content replaces |args| before the regular parsing is done.

  Arguments:
  - args: list of command line arguments, without the program name.

  Returns:
    Tuple (parser, options, args) where parser is the one returned by
    create_option_parser() and (options, args) is what its parse_args()
    returned.
  """
  # Create a fake mini-parser just to get out the "-a" command. Note that
  # it's not documented here; instead, it's documented in create_option_parser
  # even though that parser will never actually get to parse it. This is
  # because --argsfile is exclusive with all other options and arguments.
  file_argparse = argparse.ArgumentParser(add_help=False)
  file_argparse.add_argument('-a', '--argsfile')
  (file_args, nonfile_args) = file_argparse.parse_known_args(args)
  if file_args.argsfile:
    if nonfile_args:
      # error() prints the message and exits the process.
      file_argparse.error('Can\'t specify --argsfile with '
                          'any other arguments (%s)' % nonfile_args)
    try:
      with open(file_args.argsfile, 'r') as f:
        args = json.load(f)
    except (IOError, OSError, ValueError) as e:
      # We don't need to error out here: 'args' keeps its original value,
      # which holds nothing but the --argsfile flag, and is handed to the
      # regular parser below.
      sys.stderr.write('Couldn\'t read arguments: %s\n' % e)

  # Even if we failed to read the args, just call the normal parser now since it
  # will print the correct help message.
  parser = create_option_parser()
  options, args = parser.parse_args(args)
  return (parser, options, args)
1207
1208
def _calc_named_cache_hint(named_cache, named_caches):
  """Returns the expected size of the missing named caches.

  Arguments:
  - named_cache: object whose 'available' attribute supports membership tests
        on cache names, or None when there is no named cache.
  - named_caches: list of (name, path, hint) where hint is a size that can be
        converted with int().

  Returns:
    Sum of the strictly positive hints of the caches whose name is not in
    named_cache.available; 0 when named_cache is None.
  """
  if named_cache is None:
    # No named cache is configured, so there is nothing to make room for.
    return 0
  present = named_cache.available
  size = 0
  for name, _, hint in named_caches:
    if name in present:
      continue
    # Negative or null hints do not count.
    hint = int(hint)
    if hint > 0:
      size += hint
  return size
1219
1220
def main(args):
  """Parses the command line, maintains the local caches and runs the task.

  Args:
    args: list of command line arguments, without the program name.

  Returns:
    The process exit code: 0 once a --clean request has completed, 1 when a
    cipd.Error, local_caching.NamedCacheError or local_caching.NotFoundError
    is caught while running the task, otherwise whatever run_tha_test()
    returns.
  """
  # Warning: when --argsfile is used, the strings are unicode instances, when
  # parsed normally, the strings are str instances.
  (parser, options, args) = parse_args(args)

  if not file_path.enable_symlink():
    logging.error('Symlink support is not enabled')

  named_cache = process_named_cache_options(parser, options)
  # hint is 0 if there's no named cache.
  hint = _calc_named_cache_hint(named_cache, options.named_caches)
  if hint:
    # Increase the --min-free-space value by the hint, and recreate the
    # NamedCache instance so it gets the updated CachePolicy.
    options.min_free_space += hint
    named_cache = process_named_cache_options(parser, options)

  # TODO(maruel): CIPD caches should be defined at a higher level here too, so
  # they can be cleaned the same way.
  isolate_cache = isolateserver.process_cache_options(options, trim=False)
  caches = []
  if isolate_cache:
    caches.append(isolate_cache)
  if named_cache:
    caches.append(named_cache)
  # Trimming is done relative to the first cache's directory, falling back to
  # the current directory when no cache is configured.
  root = caches[0].cache_dir if caches else unicode(os.getcwd())
  if options.clean:
    if options.isolated:
      parser.error('Can\'t use --isolated with --clean.')
    if options.isolate_server:
      parser.error('Can\'t use --isolate-server with --clean.')
    if options.json:
      parser.error('Can\'t use --json with --clean.')
    if options.named_caches:
      parser.error('Can\'t use --named-cache with --clean.')
    # Trim first, then clean.
    local_caching.trim_caches(
        caches,
        root,
        min_free_space=options.min_free_space,
        max_age_secs=MAX_AGE_SECS)
    for c in caches:
      c.cleanup()
    return 0

  # Trim must still be done for the following case:
  # - named-cache was used
  # - some entries, with a large hint, were missing
  # - --min-free-space was increased accordingly, thus trimming is needed
  # Otherwise, this will have no effect, as bot_main calls run_isolated with
  # --clean after each task.
  if hint:
    logging.info('Additional trimming of %d bytes', hint)
    local_caching.trim_caches(
        caches,
        root,
        min_free_space=options.min_free_space,
        max_age_secs=MAX_AGE_SECS)

  if not options.isolated and not args:
    parser.error('--isolated or command to run is required.')

  auth.process_auth_options(parser, options)

  isolateserver.process_isolate_server_options(
      parser, options, True, False)
  if not options.isolate_server:
    if options.isolated:
      parser.error('--isolated requires --isolate-server')
    if ISOLATED_OUTDIR_PARAMETER in args:
      parser.error(
          '%s in args requires --isolate-server' % ISOLATED_OUTDIR_PARAMETER)

  if options.root_dir:
    options.root_dir = unicode(os.path.abspath(options.root_dir))
  if options.json:
    options.json = unicode(os.path.abspath(options.json))

  if any('=' not in i for i in options.env):
    parser.error(
        '--env required key=value form. value can be skipped to delete '
        'the variable')
  options.env = dict(i.split('=', 1) for i in options.env)

  # Group the --env-prefix values per variable name, preserving the order in
  # which they were given.
  prefixes = {}
  cwd = os.path.realpath(os.getcwd())
  for item in options.env_prefix:
    if '=' not in item:
      parser.error(
          '--env-prefix %r is malformed, must be in the form `VAR=./path`'
          % item)
    key, opath = item.split('=', 1)
    if os.path.isabs(opath):
      parser.error('--env-prefix %r path is bad, must be relative.' % opath)
    opath = os.path.normpath(opath)
    # NOTE(review): this is a plain string prefix test, so a sibling directory
    # whose name merely starts with the cwd's name would also be accepted;
    # confirm whether a stricter containment check is wanted.
    if not os.path.realpath(os.path.join(cwd, opath)).startswith(cwd):
      parser.error(
          '--env-prefix %r path is bad, must be relative and not contain `..`.'
          % opath)
    prefixes.setdefault(key, []).append(opath)
  options.env_prefix = prefixes

  cipd.validate_cipd_options(parser, options)

  install_packages_fn = noop_install_packages
  if options.cipd_enabled:
    install_packages_fn = lambda run_dir: install_client_and_packages(
        run_dir, cipd.parse_package_args(options.cipd_packages),
        options.cipd_server, options.cipd_client_package,
        options.cipd_client_version, cache_dir=options.cipd_cache)

  @contextlib.contextmanager
  def install_named_caches(run_dir):
    """Installs the named caches under run_dir, uninstalls them on exit."""
    # WARNING: this function depends on "options" variable defined in the outer
    # function.
    assert unicode(run_dir), repr(run_dir)
    assert os.path.isabs(run_dir), run_dir
    named_caches = [
        (os.path.join(run_dir, unicode(relpath)), name)
        for name, relpath, _ in options.named_caches
    ]
    for path, name in named_caches:
      named_cache.install(path, name)
    try:
      yield
    finally:
      # Uninstall each named cache, returning it to the cache pool. If an
      # uninstall fails for a given cache, it will remain in the task's
      # temporary space, get cleaned up by the Swarming bot, and be lost.
      #
      # If the Swarming bot cannot clean up the cache, it will handle it like
      # any other bot file that could not be removed.
      for path, name in reversed(named_caches):
        try:
          # uninstall() doesn't trim but does call save() implicitly. Trimming
          # *must* be done manually via periodic 'run_isolated.py --clean'.
          named_cache.uninstall(path, name)
        except local_caching.NamedCacheError:
          # The message reads "named cache <name> at <path>", so the arguments
          # are passed in that order.
          logging.exception('Error while removing named cache %r at %r. '
                            'The cache will be lost.', name, path)

  # With --raw-cmd the positional arguments are the whole command; otherwise
  # they are passed along as extra arguments.
  extra_args = []
  command = []
  if options.raw_cmd:
    command = args
    if options.relative_cwd:
      a = os.path.normpath(os.path.abspath(options.relative_cwd))
      # NOTE(review): same string prefix caveat as for --env-prefix above.
      if not a.startswith(os.getcwd()):
        parser.error(
            '--relative-cwd must not try to escape the working directory')
  else:
    if options.relative_cwd:
      parser.error('--relative-cwd requires --raw-cmd')
    extra_args = args

  data = TaskData(
      command=command,
      relative_cwd=options.relative_cwd,
      extra_args=extra_args,
      isolated_hash=options.isolated,
      storage=None,
      isolate_cache=isolate_cache,
      outputs=options.output,
      install_named_caches=install_named_caches,
      leak_temp_dir=options.leak_temp_dir,
      root_dir=_to_unicode(options.root_dir),
      hard_timeout=options.hard_timeout,
      grace_period=options.grace_period,
      bot_file=options.bot_file,
      switch_to_account=options.switch_to_account,
      install_packages_fn=install_packages_fn,
      use_symlinks=options.use_symlinks,
      env=options.env,
      env_prefix=options.env_prefix)
  try:
    if options.isolate_server:
      storage = isolateserver.get_storage(
          options.isolate_server, options.namespace)
      with storage:
        data = data._replace(storage=storage)
        # Hashing schemes used by |storage| and |isolate_cache| MUST match.
        assert storage.hash_algo == isolate_cache.hash_algo
        return run_tha_test(data, options.json)
    return run_tha_test(data, options.json)
  except (
      cipd.Error,
      local_caching.NamedCacheError,
      local_caching.NotFoundError) as ex:
    print >> sys.stderr, ex.message
    return 1
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001411
1412
if __name__ == '__main__':
  # Script entry point. The two setup calls below run, in this order, before
  # main() is handed the command line.
  subprocess42.inhibit_os_error_reporting()
  # Ensure that we are always running with the correct encoding.
  fix_encoding.fix_encoding()
  # main() receives the arguments without the program name; its return value
  # becomes the process exit code.
  exit_code = main(sys.argv[1:])
  sys.exit(exit_code)
Marc-Antoine Ruel90c98162013-12-18 15:11:57 -05001417 sys.exit(main(sys.argv[1:]))