blob: 0e73119d35b9899038fa0a22372876381f5d56be [file] [log] [blame]
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001#!/usr/bin/env python
maruelea586f32016-04-05 11:11:33 -07002# Copyright 2012 The LUCI Authors. All rights reserved.
maruelf1f5e2a2016-05-25 17:10:39 -07003# Use of this source code is governed under the Apache License, Version 2.0
4# that can be found in the LICENSE file.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00005
nodir55be77b2016-05-03 09:39:57 -07006"""Runs a command with optional isolated input/output.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00007
run_isolated takes care of setting up a temporary environment, running a
command, and tearing it down.
nodir55be77b2016-05-03 09:39:57 -070010
Marc-Antoine Rueleed2f3a2019-03-14 00:00:40 +000011It handles downloading and uploading isolated files, mapping CIPD packages and
12reusing stateful named caches.
13
14The isolated files, CIPD packages and named caches are kept as a global LRU
15cache.
Marc-Antoine Ruel2283ad12014-02-09 11:14:57 -050016
Roberto Carrillo71ade6d2018-10-08 22:30:24 +000017Any ${EXECUTABLE_SUFFIX} on the command line or the environment variables passed
18with the --env option will be replaced with ".exe" string on Windows and "" on
19other platforms.
nodirbe642ff2016-06-09 15:51:51 -070020
Roberto Carrillo71ade6d2018-10-08 22:30:24 +000021Any ${ISOLATED_OUTDIR} on the command line or the environment variables passed
22with the --env option will be replaced by the location of a temporary directory
23upon execution of the command specified in the .isolated file. All content
24written to this directory will be uploaded upon termination and the .isolated
25file describing this directory will be printed to stdout.
bpastene447c1992016-06-20 15:21:47 -070026
Marc-Antoine Rueleed2f3a2019-03-14 00:00:40 +000027Any ${SWARMING_BOT_FILE} on the command line or the environment variables passed
28with the --env option will be replaced by the value of the --bot-file parameter.
29This file is used by a swarming bot to communicate state of the host to tasks.
30It is written to by the swarming bot's on_before_task() hook in the swarming
31server's custom bot_config.py.
32
33See
34https://chromium.googlesource.com/infra/luci/luci-py.git/+/master/appengine/swarming/doc/Magic-Values.md
35for all the variables.
36
37See
38https://chromium.googlesource.com/infra/luci/luci-py.git/+/master/appengine/swarming/swarming_bot/config/bot_config.py
39for more information about bot_config.py.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000040"""
41
Marc-Antoine Ruelf899c482019-10-10 23:32:06 +000042from __future__ import print_function
43
44__version__ = '1.0.1'
maruel@chromium.orgdedbf492013-09-12 20:42:11 +000045
aludwin7556e0c2016-10-26 08:46:10 -070046import argparse
maruel064c0a32016-04-05 11:47:15 -070047import base64
iannucci96fcccc2016-08-30 15:52:22 -070048import collections
vadimsh232f5a82017-01-20 19:23:44 -080049import contextlib
Sadaf Matinkhoo10743a62018-03-29 16:28:58 -040050import errno
aludwin7556e0c2016-10-26 08:46:10 -070051import json
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000052import logging
53import optparse
54import os
Marc-Antoine Ruel8b11dbd2018-05-18 14:31:22 -040055import re
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000056import sys
57import tempfile
maruel064c0a32016-04-05 11:47:15 -070058import time
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000059
Marc-Antoine Ruel016c7602019-04-02 18:31:13 +000060from utils import tools
61tools.force_local_third_party()
vadimsh@chromium.orga4326472013-08-24 02:05:41 +000062
Marc-Antoine Ruel016c7602019-04-02 18:31:13 +000063# third_party/
64from depot_tools import fix_encoding
Takuto Ikuta6e2ff962019-10-29 12:35:27 +000065import six
Marc-Antoine Ruel016c7602019-04-02 18:31:13 +000066
67# pylint: disable=ungrouped-imports
68import auth
69import cipd
70import isolate_storage
71import isolateserver
72import local_caching
73from libs import luci_context
Vadim Shtayura6b555c12014-07-23 16:22:18 -070074from utils import file_path
maruel12e30012015-10-09 11:55:35 -070075from utils import fs
maruel064c0a32016-04-05 11:47:15 -070076from utils import large
Marc-Antoine Ruelf74cffe2015-07-15 15:21:34 -040077from utils import logging_utils
Marc-Antoine Ruelcfb60852014-07-02 15:22:00 -040078from utils import on_error
Marc-Antoine Ruelc44f5722015-01-08 16:10:01 -050079from utils import subprocess42
maruel@chromium.orgdedbf492013-09-12 20:42:11 +000080
vadimsh@chromium.orga4326472013-08-24 02:05:41 +000081
# Magic variables that can be found in the isolate task command line. They are
# substituted by replace_parameters().
ISOLATED_OUTDIR_PARAMETER = '${ISOLATED_OUTDIR}'
EXECUTABLE_SUFFIX_PARAMETER = '${EXECUTABLE_SUFFIX}'
SWARMING_BOT_FILE_PARAMETER = '${SWARMING_BOT_FILE}'


# The name of the log file to use.
RUN_ISOLATED_LOG_FILE = 'run_isolated.log'


# The name of the log to use for the run_test_cases.py command
RUN_TEST_CASES_LOG = 'run_test_cases.log'


# Use short names for temporary directories. This is driven by Windows, which
# imposes a relatively short maximum path length of 260 characters, often
# referred to as MAX_PATH. It is relatively easy to create files with longer
# path length. A use case is with recursive dependency trees like npm packages.
#
# It is recommended to start the script with a `root_dir` as short as
# possible.
# - ir stands for isolated_run
# - io stands for isolated_out
# - it stands for isolated_tmp
# - ic stands for isolated_client
ISOLATED_RUN_DIR = u'ir'
ISOLATED_OUT_DIR = u'io'
ISOLATED_TMP_DIR = u'it'
ISOLATED_CLIENT_DIR = u'ic'

# TODO(tikuta): take these parameter from luci-config?
# Take revision from
# https://ci.chromium.org/p/infra-internal/g/infra-packagers/console
# NOTE(review): presumably the CIPD package name and pinned version of the
# isolated client installed under ISOLATED_CLIENT_DIR - confirm against the
# code that consumes these two constants.
ISOLATED_PACKAGE = 'infra/tools/luci/isolated/${platform}'
ISOLATED_REVISION = 'git_revision:2ee27ca739de90c29d46eb3af3371a42fec3ebff'

# Keep synced with task_request.py
# Accepts 1 to 4096 characters, each a lowercase ASCII letter, a digit or an
# underscore.
CACHE_NAME_RE = re.compile(r'^[a-z0-9_]{1,4096}$')
Marc-Antoine Ruel8b11dbd2018-05-18 14:31:22 -0400120
121
marueld928c862017-06-08 08:20:04 -0700122OUTLIVING_ZOMBIE_MSG = """\
123*** Swarming tried multiple times to delete the %s directory and failed ***
124*** Hard failing the task ***
125
126Swarming detected that your testing script ran an executable, which may have
127started a child executable, and the main script returned early, leaving the
128children executables playing around unguided.
129
130You don't want to leave children processes outliving the task on the Swarming
131bot, do you? The Swarming bot doesn't.
132
133How to fix?
134- For any process that starts children processes, make sure all children
135 processes terminated properly before each parent process exits. This is
136 especially important in very deep process trees.
137 - This must be done properly both in normal successful task and in case of
138 task failure. Cleanup is very important.
139- The Swarming bot sends a SIGTERM in case of timeout.
140 - You have %s seconds to comply after the signal was sent to the process
141 before the process is forcibly killed.
142- To achieve not leaking children processes in case of signals on timeout, you
143 MUST handle signals in each executable / python script and propagate them to
144 children processes.
145 - When your test script (python or binary) receives a signal like SIGTERM or
146 CTRL_BREAK_EVENT on Windows), send it to all children processes and wait for
147 them to terminate before quitting.
148
149See
Marc-Antoine Ruelc7243592018-05-24 17:04:04 -0400150https://chromium.googlesource.com/infra/luci/luci-py.git/+/master/appengine/swarming/doc/Bot.md#Graceful-termination_aka-the-SIGTERM-and-SIGKILL-dance
marueld928c862017-06-08 08:20:04 -0700151for more information.
152
153*** May the SIGKILL force be with you ***
154"""
155
156
# Currently hardcoded. Eventually could be exposed as a flag once there's value.
# 3 weeks, expressed in seconds (21 days * 24 h * 60 min * 60 s).
MAX_AGE_SECS = 21*24*60*60
160
161
# Immutable record of everything needed to execute one task; an instance is
# passed as the |data| argument of map_and_run(). Each field is documented
# inline, right above its name.
TaskData = collections.namedtuple(
    'TaskData',
    [
        # List of strings; the command line to use, independent of what was
        # specified in the isolated file.
        'command',
        # Relative directory to start command into.
        'relative_cwd',
        # List of strings; the arguments to add to the command specified in the
        # isolated file.
        'extra_args',
        # Hash of the .isolated file that must be retrieved to recreate the tree
        # of files to run the target executable. The command specified in the
        # .isolated is executed. Mutually exclusive with command argument.
        'isolated_hash',
        # isolateserver.Storage instance to retrieve remote objects. This object
        # has a reference to an isolateserver.StorageApi, which does the actual
        # I/O.
        'storage',
        # isolateserver.LocalCache instance to keep from retrieving the same
        # objects constantly by caching the objects retrieved. Can be on-disk or
        # in-memory.
        'isolate_cache',
        # List of paths relative to root_dir to put into the output isolated
        # bundle upon task completion (see link_outputs_to_outdir).
        'outputs',
        # Function (run_dir) => context manager that installs named caches into
        # |run_dir|.
        'install_named_caches',
        # If True, the temporary directory will be deliberately leaked for later
        # examination.
        'leak_temp_dir',
        # Path to the directory to use to create the temporary directory. If not
        # specified, a random temporary directory is created.
        'root_dir',
        # Kills the process if it lasts more than this amount of seconds.
        'hard_timeout',
        # Number of seconds to wait between SIGTERM and SIGKILL.
        'grace_period',
        # Path to a file with bot state, used in place of ${SWARMING_BOT_FILE}
        # task command line argument.
        'bot_file',
        # Logical account to switch LUCI_CONTEXT into.
        'switch_to_account',
        # Context manager dir => CipdInfo, see install_client_and_packages.
        'install_packages_fn',
        # Create tree with symlinks instead of hardlinks.
        'use_symlinks',
        # Environment variables to set.
        'env',
        # Environment variables to mutate with relative directories.
        # Example: {"ENV_KEY": ['relative', 'paths', 'to', 'prepend']}
        'env_prefix',
        # Lowers the task process priority.
        'lower_priority',
        # subprocess42.Containment instance. Can be None.
        'containment',
    ])
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -0500220
221
Marc-Antoine Ruelee6ca622017-11-29 11:19:16 -0500222def _to_str(s):
223 """Downgrades a unicode instance to str. Pass str through as-is."""
224 if isinstance(s, str):
225 return s
226 # This is technically incorrect, especially on Windows. In theory
227 # sys.getfilesystemencoding() should be used to use the right 'ANSI code
228 # page' on Windows, but that causes other problems, as the character set
229 # is very limited.
230 return s.encode('utf-8')
231
232
def _to_unicode(s):
  """Returns |s| as text; None and text instances are returned untouched.

  Anything else is decoded as UTF-8.
  """
  passthrough = s is None or isinstance(s, six.text_type)
  return s if passthrough else s.decode('utf-8')
238
239
def make_temp_dir(prefix, root_dir):
  """Creates a uniquely named directory inside |root_dir|.

  The directory name starts with |prefix|. The path is returned as a text
  (six.text_type) string.
  """
  created = tempfile.mkdtemp(dir=root_dir, prefix=prefix)
  return six.text_type(created)
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +0000243
244
def change_tree_read_only(rootdir, read_only):
  """Applies the |read_only| policy to the tree rooted at |rootdir|.

  Accepted values for |read_only|:
    2: files and directories are made read only.
    1: only files are made read only.
    0 or None: the whole tree is made writeable.

  Raises:
    ValueError if |read_only| is none of the values above.
  """
  if read_only == 2:
    # Files and directories (except on Windows) are marked read only. This
    # inhibits modifying, creating or deleting files in the test directory,
    # except on Windows where creating and deleting files is still possible.
    file_path.make_tree_read_only(rootdir)
    return

  if read_only == 1:
    # Files are marked read only but not the directories. This inhibits
    # modifying files but creating or deleting files is still possible.
    file_path.make_tree_files_read_only(rootdir)
    return

  if read_only in (0, None):
    # Anything can be modified.
    # TODO(maruel): This is currently dangerous as long as
    # DiskContentAddressedCache.touch() is not yet changed to verify the hash of
    # the content of the files it is looking at, so that if a test modifies an
    # input file, the file must be deleted.
    file_path.make_tree_writeable(rootdir)
    return

  message = 'change_tree_read_only(%s, %s): Unknown flag %s' % (
      rootdir, read_only, read_only)
  raise ValueError(message)
271
272
@contextlib.contextmanager
def set_luci_context_account(account, tmp_dir):
  """Context manager making |account| the default LUCI_CONTEXT account.

  The context is left untouched in three cases:
  - |account| is None or '', i.e. run_isolated.py was called without
    '--switch-to-account'. The task then inherits whatever account is already
    set in the surrounding LUCI_CONTEXT, if any. This may happen if users
    invoke run_isolated.py explicitly from their code.
  - There is no 'local_auth' section, i.e. LUCI_CONTEXT-based auth is not used.
  - |account| is already the default account.

  Otherwise a new LUCI_CONTEXT is written, using |tmp_dir|, for the duration
  of the 'with' block. If |account| is not one of the accounts listed in the
  context, the default account is removed instead, which switches to
  non-authenticated access. This happens for Swarming tasks that don't use
  'task' service accounts.
  """
  # luci_context is only consulted when a switch was actually requested.
  local_auth = luci_context.read('local_auth') if account else None

  # See LUCI_CONTEXT.md for the format of 'local_auth'.
  if not local_auth or local_auth.get('default_account_id') == account:
    # Nothing was requested, LUCI_CONTEXT auth is not used, or the account is
    # already the default one.
    yield
    return

  known_ids = set(
      entry['id'] for entry in (local_auth.get('accounts') or []))
  if account not in known_ids:
    logging.warning(
        'Requested LUCI_CONTEXT account %r is not available (have only %r), '
        'disabling authentication', account, sorted(known_ids))
    local_auth.pop('default_account_id', None)
  else:
    logging.info('Switching default LUCI_CONTEXT account to %r', account)
    local_auth['default_account_id'] = account

  with luci_context.write(_tmpdir=tmp_dir, local_auth=local_auth):
    yield
319
320
def process_command(command, out_dir, bot_file):
  """Returns a copy of |command| with the parameters of each argument replaced.

  Every argument goes through replace_parameters().

  Raises:
    ValueError if a parameter is requested in |command| but its value is not
    provided.
  """
  processed = []
  for argument in command:
    processed.append(replace_parameters(argument, out_dir, bot_file))
  return processed
329
330
def replace_parameters(arg, out_dir, bot_file):
  """Returns |arg| with the known parameter tokens substituted.

  - EXECUTABLE_SUFFIX_PARAMETER becomes cipd.EXECUTABLE_SUFFIX.
  - ISOLATED_OUTDIR_PARAMETER becomes |out_dir|.
  - SWARMING_BOT_FILE_PARAMETER becomes |bot_file|; when |bot_file| is not
    provided, a warning is logged and the token is left in place.

  Raises:
    ValueError if the output directory is requested in |arg| but |out_dir| is
    not provided.
  """
  arg = arg.replace(EXECUTABLE_SUFFIX_PARAMETER, cipd.EXECUTABLE_SUFFIX)

  wants_out_dir = ISOLATED_OUTDIR_PARAMETER in arg
  if wants_out_dir:
    if not out_dir:
      raise ValueError(
          'output directory is requested in command or env var, but not '
          'provided; please specify one')
    arg = arg.replace(ISOLATED_OUTDIR_PARAMETER, out_dir)

  bot_file_inserted = False
  if SWARMING_BOT_FILE_PARAMETER in arg:
    if not bot_file:
      logging.warning('SWARMING_BOT_FILE_PARAMETER found in command or env '
                      'var, but no bot_file specified. Leaving parameter '
                      'unchanged.')
    else:
      arg = arg.replace(SWARMING_BOT_FILE_PARAMETER, bot_file)
      bot_file_inserted = True

  if wants_out_dir or bot_file_inserted:
    # Slashes are converted only when a path was substituted, to support
    # arguments like '${ISOLATED_OUTDIR}/foo/bar' while leaving every other
    # argument untouched.
    arg = arg.replace('/', os.sep)
  return arg
maruela9cfd6f2015-09-15 11:03:15 -0700360
361
Roberto Carrillo71ade6d2018-10-08 22:30:24 +0000362
def get_command_env(tmp_dir, cipd_info, run_dir, env, env_prefixes, out_dir,
                    bot_file):
  """Returns full OS environment to run a command in.

  Starts from a copy of os.environ, applies |env|, puts the directory with the
  cipd binary in front of PATH, exposes CIPD_CACHE_DIR env var, installs all
  env_prefixes, then points the temporary directory variables at |tmp_dir|.

  Args:
    tmp_dir: temp directory.
    cipd_info: CipdInfo object if cipd client is used, None if not.
    run_dir: The root directory the isolated tree is mapped in.
    env: environment variables to use. A variable with an empty value is
        removed from the environment; other values go through
        replace_parameters().
    env_prefixes: {"ENV_KEY": ['cwd', 'relative', 'paths', 'to', 'prepend']}
    out_dir: Isolated output directory. Required to be != None if any of the
        env vars contain ISOLATED_OUTDIR_PARAMETER.
    bot_file: Required to be != None if any of the env vars contain
        SWARMING_BOT_FILE_PARAMETER.

  Raises:
    ValueError if a value of |env| requests the output directory but |out_dir|
    is not provided.
  """
  out = os.environ.copy()
  for k, v in env.items():
    if not v:
      out.pop(k, None)
    else:
      out[k] = replace_parameters(v, out_dir, bot_file)

  if cipd_info:
    bin_dir = os.path.dirname(cipd_info.client.binary_path)
    # PATH may be missing: it can be unset in the parent environment or have
    # been removed just above by an empty 'PATH' entry in |env|. Handle it the
    # same way env_prefixes does below, instead of failing with a KeyError.
    path_entries = [_to_str(bin_dir)]
    cur_path = out.get('PATH')
    if cur_path:
      path_entries.append(cur_path)
    out['PATH'] = os.pathsep.join(path_entries)
    out['CIPD_CACHE_DIR'] = _to_str(cipd_info.cache_dir)

  for key, paths in env_prefixes.items():
    assert isinstance(paths, list), paths
    paths = [os.path.normpath(os.path.join(run_dir, p)) for p in paths]
    cur = out.get(key)
    if cur:
      paths.append(cur)
    out[key] = _to_str(os.path.pathsep.join(paths))

  tmp_dir = _to_str(tmp_dir)
  # pylint: disable=line-too-long
  # * python respects $TMPDIR, $TEMP, and $TMP in this order, regardless of
  #   platform. So $TMPDIR must be set on all platforms.
  #   https://github.com/python/cpython/blob/2.7/Lib/tempfile.py#L155
  out['TMPDIR'] = tmp_dir
  if sys.platform == 'win32':
    # * chromium's base utils uses GetTempPath().
    #    https://cs.chromium.org/chromium/src/base/files/file_util_win.cc?q=GetTempPath
    # * Go uses GetTempPath().
    # * GetTempDir() uses %TMP%, then %TEMP%, then other stuff. So %TMP% must be
    #   set.
    #   https://docs.microsoft.com/en-us/windows/desktop/api/fileapi/nf-fileapi-gettemppathw
    out['TMP'] = tmp_dir
    # https://blogs.msdn.microsoft.com/oldnewthing/20150417-00/?p=44213
    out['TEMP'] = tmp_dir
  elif sys.platform == 'darwin':
    # * Chromium uses an hack on macOS before calling into
    #   NSTemporaryDirectory().
    #   https://cs.chromium.org/chromium/src/base/files/file_util_mac.mm?q=GetTempDir
    #   https://developer.apple.com/documentation/foundation/1409211-nstemporarydirectory
    out['MAC_CHROMIUM_TMPDIR'] = tmp_dir
  else:
    # TMPDIR is specified as the POSIX standard envvar for the temp directory.
    #   http://pubs.opengroup.org/onlinepubs/9699919799/basedefs/V1_chap08.html
    # * mktemp on linux respects $TMPDIR.
    # * Chromium respects $TMPDIR on linux.
    #   https://cs.chromium.org/chromium/src/base/files/file_util_posix.cc?q=GetTempDir
    # * Go uses $TMPDIR.
    #   https://go.googlesource.com/go/+/go1.10.3/src/os/file_unix.go#307
    pass
  return out
vadimsh232f5a82017-01-20 19:23:44 -0800433
434
def run_command(
    command, cwd, env, hard_timeout, grace_period, lower_priority, containment):
  """Runs the command.

  The process is started detached through subprocess42.Popen. If waiting for
  it times out, or a signal from subprocess42.STOP_SIGNALS is received while
  waiting, the process is terminated, given |grace_period| to exit, and then
  killed.

  Arguments:
    command: the command line, passed as-is to subprocess42.Popen.
    cwd: working directory of the process.
    env: environment of the process.
    hard_timeout: timeout given to the first proc.wait(); a falsy value is
        passed as None (presumably meaning no timeout - confirm in
        subprocess42).
    grace_period: timeout given to proc.wait() after terminate() was called; a
        falsy value is passed as None.
    lower_priority: forwarded to subprocess42.Popen.
    containment: forwarded to subprocess42.Popen.

  Returns:
    tuple(process exit code, bool if had a hard timeout)

    The exit code is 1 when an OSError was raised, e.g. because the process
    could not be started. The bool is only set when the wait expired without a
    signal having been received.
  """
  logging.info(
      'run_command(%s, %s, %s, %s, %s, %s)',
      command, cwd, hard_timeout, grace_period, lower_priority, containment)

  exit_code = None
  had_hard_timeout = False
  with tools.Profiler('RunTest'):
    proc = None
    # Mutable flag shared with handler(); a non-empty list means a stop signal
    # was already received.
    had_signal = []
    try:
      # TODO(maruel): This code is imperfect. It doesn't handle well signals
      # during the download phase and there's short windows were things can go
      # wrong.
      def handler(signum, _frame):
        # Only the first signal received once the process was started is
        # converted into a TimeoutExpired, so it is handled like a timeout by
        # the wait below.
        if proc and not had_signal:
          logging.info('Received signal %d', signum)
          had_signal.append(True)
          raise subprocess42.TimeoutExpired(command, None)

      proc = subprocess42.Popen(
          command, cwd=cwd, env=env, detached=True, close_fds=True,
          lower_priority=lower_priority, containment=containment)
      with subprocess42.set_signal_handler(subprocess42.STOP_SIGNALS, handler):
        try:
          exit_code = proc.wait(hard_timeout or None)
        except subprocess42.TimeoutExpired:
          # Reached either on a real timeout or through handler(); only the
          # former counts as a hard timeout.
          if not had_signal:
            logging.warning('Hard timeout')
            had_hard_timeout = True
          logging.warning('Sending SIGTERM')
          proc.terminate()

      # Ignore signals in grace period. Forcibly give the grace period to the
      # child process.
      if exit_code is None:
        ignore = lambda *_: None
        with subprocess42.set_signal_handler(subprocess42.STOP_SIGNALS, ignore):
          try:
            exit_code = proc.wait(grace_period or None)
          except subprocess42.TimeoutExpired:
            # Now kill for real. The user can distinguish between the
            # following states:
            # - signal but process exited within grace period,
            #   hard_timed_out will be set but the process exit code will be
            #   script provided.
            # - processed exited late, exit code will be -9 on posix.
            logging.warning('Grace exhausted; sending SIGKILL')
            proc.kill()
      logging.info('Waiting for process exit')
      exit_code = proc.wait()
    except OSError:
      # This is not considered to be an internal error. The executable simply
      # does not exist.
      sys.stderr.write(
          '<The executable does not exist, a dependent library is missing or '
          'the command line is too long>\n'
          '<Check for missing .so/.dll in the .isolate or GN file or length of '
          'command line args>\n'
          '<Command: %s>\n' % command)
      if os.environ.get('SWARMING_TASK_ID'):
        # Give an additional hint when running as a swarming task.
        sys.stderr.write(
            '<See the task\'s page for commands to help diagnose this issue '
            'by reproducing the task locally>\n')
      exit_code = 1
  # The mask makes the hexadecimal form of a negative exit code readable as an
  # unsigned 32 bits value.
  logging.info(
      'Command finished with exit code %d (%s)',
      exit_code, hex(0xffffffff & exit_code))
  return exit_code, had_hard_timeout
maruela9cfd6f2015-09-15 11:03:15 -0700511
512
def fetch_and_map(isolated_hash, storage, cache, outdir, use_symlinks):
  """Fetches an isolated tree into |outdir| and returns (bundle, stats).

  stats holds the duration of the operation and the packed, base64 encoded,
  sorted lists of cold items (cache.added) and hot items (entries of
  cache.used left once the entries of cache.added are subtracted).
  """
  began = time.time()
  bundle = isolateserver.fetch_isolated(
      isolated_hash=isolated_hash,
      storage=storage,
      cache=cache,
      outdir=outdir,
      use_symlinks=use_symlinks)

  # Multiset difference, so an item used more often than it was added still
  # counts as hot for the extra uses.
  used_counts = collections.Counter(cache.used)
  added_counts = collections.Counter(cache.added)
  hot_items = (used_counts - added_counts).elements()

  stats = {
      'duration': time.time() - began,
      'items_cold': base64.b64encode(large.pack(sorted(cache.added))),
      'items_hot': base64.b64encode(large.pack(sorted(hot_items))),
  }
  return bundle, stats
529
530
def link_outputs_to_outdir(run_dir, out_dir, outputs):
  """Makes every named output available under |out_dir| so it gets uploaded.

  Each entry of |outputs| is a path relative to |run_dir|; it is reproduced at
  the same relative path under |out_dir| with copy_recursively(). Does nothing
  when |outputs| is empty.

  NOTE(review): this docstring used to state that an error is raised if the
  file already exists in that directory - confirm against file_path.link_file.
  """
  if outputs:
    isolateserver.create_directories(out_dir, outputs)
    for relpath in outputs:
      source = os.path.join(run_dir, relpath)
      destination = os.path.join(out_dir, relpath)
      copy_recursively(source, destination)
541
542
def copy_recursively(src, dst):
  """Efficiently copies the file or directory |src| to |dst|.

  |src| may be a file, a directory, or a symlink to a file or directory.
  All symlinks are replaced with their targets, so the resulting directory
  structure in |dst| will never have any symlinks.

  To increase speed, copy_recursively hardlinks individual files into the
  (newly created) directory structure if possible, unlike Python's
  shutil.copytree().

  OSError is never propagated to the caller: a missing path or broken symlink
  is logged as a warning, any other OSError (including a symlink chain that is
  cyclic or too long) is logged at info level, and the item is skipped.
  """
  # Upper bound on the number of symlinks followed for a single item, so that
  # a cyclic chain (a -> b -> a) cannot loop forever. 40 is the limit the
  # Linux kernel applies when resolving a path.
  max_symlink_hops = 40
  orig_src = src
  try:
    # Replace symlinks with their final target.
    hops = 0
    while fs.islink(src):
      hops += 1
      if hops > max_symlink_hops:
        # Reported through the OSError handler below, like the OS would do.
        raise OSError(errno.ELOOP, os.strerror(errno.ELOOP), src)
      res = fs.readlink(src)
      # A relative target is relative to the directory holding the link; an
      # absolute target replaces the path entirely (os.path.join semantics).
      src = os.path.join(os.path.dirname(src), res)

    # A regular file is linked in place and terminates the recursion.
    if fs.isfile(src):
      file_path.link_file(dst, src, file_path.HARDLINK_WITH_FALLBACK)
      return

    if not fs.exists(dst):
      os.makedirs(dst)

    # NOTE(review): when src does not exist, the OSError handled below
    # presumably comes from fs.listdir() - confirm.
    for child in fs.listdir(src):
      copy_recursively(os.path.join(src, child), os.path.join(dst, child))

  except OSError as e:
    if e.errno == errno.ENOENT:
      logging.warning('Path %s does not exist or %s is a broken symlink',
                      src, orig_src)
    else:
      logging.info("Couldn't collect output file %s: %s", src, e)
aludwin0a8e17d2016-10-27 15:57:39 -0700580
581
def upload_then_delete(storage, out_dir, leak_temp_dir):
  """Uploads the content of |out_dir| back, then deletes |out_dir|.

  Arguments:
    storage: object given to isolateserver.archive_files_to_storage(); its
        server_ref.url and server_ref.namespace are reported in outputs_ref.
    out_dir: directory containing the outputs of the task.
    leak_temp_dir: if true, |out_dir| is left on disk.

  Returns:
    tuple(outputs_ref, success, stats)
    - outputs_ref: a dict referring to the results archived back to the isolated
      server, if applicable. None if |out_dir| is missing or empty.
    - success: False if something occurred that means that the task must
      forcibly be considered a failure, e.g. zombie processes were left
      behind. Concretely, False when |out_dir| could not be deleted.
    - stats: uploading stats.

  Raises:
    isolateserver.Aborted if the upload was interrupted.
  """
  # Upload out_dir and generate a .isolated file out of this directory. It is
  # only done if files were written in the directory.
  outputs_ref = None
  cold = []
  hot = []
  start = time.time()

  if fs.isdir(out_dir) and fs.listdir(out_dir):
    with tools.Profiler('ArchiveOutput'):
      try:
        results, f_cold, f_hot = isolateserver.archive_files_to_storage(
            storage, [out_dir], None)
        outputs_ref = {
            # dict.values() is a view on python3 and cannot be indexed; go
            # through a list so this works on both python2 and python3.
            'isolated': list(results.values())[0],
            'isolatedserver': storage.server_ref.url,
            'namespace': storage.server_ref.namespace,
        }
        cold = sorted(i.size for i in f_cold)
        hot = sorted(i.size for i in f_hot)
      except isolateserver.Aborted:
        # This happens when a signal SIGTERM was received while uploading data.
        # There is 2 causes:
        # - The task was too slow and was about to be killed anyway due to
        #   exceeding the hard timeout.
        # - The amount of data uploaded back is very large and took too much
        #   time to archive.
        sys.stderr.write('Received SIGTERM while uploading')
        # Re-raise, so it will be treated as an internal failure.
        raise

  success = False
  try:
    if (not leak_temp_dir and fs.isdir(out_dir) and
        not file_path.rmtree(out_dir)):
      logging.error('Had difficulties removing out_dir %s', out_dir)
    else:
      success = True
  except OSError as e:
    # When this happens, it means there's a process error. |success| stays
    # False.
    logging.exception('Had difficulties removing out_dir %s: %s', out_dir, e)
  stats = {
      'duration': time.time() - start,
      'items_cold': base64.b64encode(large.pack(cold)),
      'items_hot': base64.b64encode(large.pack(hot)),
  }
  return outputs_ref, success, stats
maruela9cfd6f2015-09-15 11:03:15 -0700640
641
def map_and_run(data, constant_run_path):
  """Runs a command with optional isolated input/output.

  Sets up the run, output, temp and isolated-client directories, installs CIPD
  packages and named caches through the callables carried by |data|, optionally
  fetches and maps the isolated tree, runs the command, then cleans up and
  uploads the output directory.

  Arguments:
  - data: TaskData instance.
  - constant_run_path: when true and a root directory is known, the run
    directory is <root_dir>/ISOLATED_RUN_DIR (wiped and recreated); otherwise a
    fresh directory is obtained from make_temp_dir().

  Returns metadata about the result, as a dict with keys 'duration',
  'exit_code', 'had_hard_timeout', 'internal_failure', 'stats', 'outputs_ref',
  'version' and optionally 'cipd_pins'.
  """
  result = {
      'duration': None,
      'exit_code': None,
      'had_hard_timeout': False,
      'internal_failure': 'run_isolated did not complete properly',
      'stats': {
          #'cipd': {
          #  'duration': 0.,
          #  'get_client_duration': 0.,
          #},
          'isolated': {
              'download': {
                  #'duration': 0.,
                  'initial_number_items': len(data.isolate_cache),
                  'initial_size': data.isolate_cache.total_size,
                  #'items_cold': '<large.pack()>',
                  #'items_hot': '<large.pack()>',
              },
              #'upload': {
              #  'duration': 0.,
              #  'items_cold': '<large.pack()>',
              #  'items_hot': '<large.pack()>',
              #},
          },
      },
      #'cipd_pins': {
      #  'packages': [
      #    {'package_name': ..., 'version': ..., 'path': ...},
      #    ...
      #  ],
      #  'client_package': {'package_name': ..., 'version': ...},
      #},
      'outputs_ref': None,
      'version': 5,
  }

  if data.root_dir:
    file_path.ensure_tree(data.root_dir, 0o700)
  elif data.isolate_cache.cache_dir:
    data = data._replace(
        root_dir=os.path.dirname(data.isolate_cache.cache_dir))
  # See comment for these constants.
  # If root_dir is not specified, it is not constant.
  # TODO(maruel): This is not obvious. Change this to become an error once we
  # make the constant_run_path an exposed flag.
  if constant_run_path and data.root_dir:
    run_dir = os.path.join(data.root_dir, ISOLATED_RUN_DIR)
    if os.path.isdir(run_dir):
      file_path.rmtree(run_dir)
    os.mkdir(run_dir, 0o700)
  else:
    run_dir = make_temp_dir(ISOLATED_RUN_DIR, data.root_dir)
  # storage should be normally set but don't crash if it is not. This can happen
  # as Swarming task can run without an isolate server.
  out_dir = make_temp_dir(
      ISOLATED_OUT_DIR, data.root_dir) if data.storage else None
  tmp_dir = make_temp_dir(ISOLATED_TMP_DIR, data.root_dir)
  isolated_client_dir = make_temp_dir(ISOLATED_CLIENT_DIR, data.root_dir)
  cwd = run_dir
  if data.relative_cwd:
    cwd = os.path.normpath(os.path.join(cwd, data.relative_cwd))
  command = data.command
  try:
    with data.install_packages_fn(run_dir, isolated_client_dir) as cipd_info:
      if cipd_info:
        result['stats']['cipd'] = cipd_info.stats
        result['cipd_pins'] = cipd_info.pins

      if data.isolated_hash:
        isolated_stats = result['stats'].setdefault('isolated', {})
        bundle, stats = fetch_and_map(
            isolated_hash=data.isolated_hash,
            storage=data.storage,
            cache=data.isolate_cache,
            outdir=run_dir,
            use_symlinks=data.use_symlinks)
        isolated_stats['download'].update(stats)
        change_tree_read_only(run_dir, bundle.read_only)
        # Inject the command
        if not command and bundle.command:
          command = bundle.command + data.extra_args
          # Only set the relative directory if the isolated file specified a
          # command, and no raw command was specified.
          if bundle.relative_cwd:
            cwd = os.path.normpath(os.path.join(cwd, bundle.relative_cwd))

      if not command:
        # Handle this as a task failure, not an internal failure.
        sys.stderr.write(
            '<No command was specified!>\n'
            '<Please secify a command when triggering your Swarming task>\n')
        result['exit_code'] = 1
        # The early return skips the reset done after the 'with' block below,
        # so clear the default internal failure message explicitly.
        result['internal_failure'] = None
        return result

      # run_dir itself or anything strictly below it is acceptable. A plain
      # startswith(run_dir) would also accept a sibling directory whose name
      # merely begins with run_dir's name, so compare against run_dir with a
      # trailing path separator.
      if cwd != run_dir and not cwd.startswith(os.path.join(run_dir, '')):
        # Handle this as a task failure, not an internal failure. This is a
        # 'last chance' way to gate against directory escape.
        sys.stderr.write('<Relative CWD is outside of run directory!>\n')
        result['exit_code'] = 1
        # Same as above: the reset after the 'with' block is skipped.
        result['internal_failure'] = None
        return result

      if not os.path.isdir(cwd):
        # Accepts relative_cwd that does not exist.
        os.makedirs(cwd, 0o700)

      # If we have an explicit list of files to return, make sure their
      # directories exist now.
      if data.storage and data.outputs:
        isolateserver.create_directories(run_dir, data.outputs)

      with data.install_named_caches(run_dir):
        sys.stdout.flush()
        start = time.time()
        try:
          # Need to switch the default account before 'get_command_env' call,
          # so it can grab correct value of LUCI_CONTEXT env var.
          with set_luci_context_account(data.switch_to_account, tmp_dir):
            env = get_command_env(
                tmp_dir, cipd_info, run_dir, data.env, data.env_prefix, out_dir,
                data.bot_file)
            command = tools.find_executable(command, env)
            command = process_command(command, out_dir, data.bot_file)
            file_path.ensure_command_has_abs_path(command, cwd)

            result['exit_code'], result['had_hard_timeout'] = run_command(
                command, cwd, env, data.hard_timeout, data.grace_period,
                data.lower_priority, data.containment)
        finally:
          # Recorded even when run_command() raises.
          result['duration'] = max(time.time() - start, 0)

    # We successfully ran the command, set internal_failure back to
    # None (even if the command failed, it's not an internal error).
    result['internal_failure'] = None
  except Exception as e:
    # An internal error occurred. Report accordingly so the swarming task will
    # be retried automatically.
    logging.exception('internal failure: %s', e)
    result['internal_failure'] = str(e)
    on_error.report(None)

  # Clean up
  finally:
    try:
      # Try to link files to the output directory, if specified.
      if out_dir:
        link_outputs_to_outdir(run_dir, out_dir, data.outputs)

      success = False
      if data.leak_temp_dir:
        success = True
        logging.warning(
            'Deliberately leaking %s for later examination', run_dir)
      else:
        # On Windows rmtree(run_dir) call above has a synchronization effect: it
        # finishes only when all task child processes terminate (since a running
        # process locks *.exe file). Examine out_dir only after that call
        # completes (since child processes may write to out_dir too and we need
        # to wait for them to finish).
        for directory in (run_dir, tmp_dir, isolated_client_dir):
          if not fs.isdir(directory):
            continue
          try:
            success = file_path.rmtree(directory)
          except OSError as e:
            logging.error('rmtree(%r) failed: %s', directory, e)
            success = False
          if not success:
            sys.stderr.write(
                OUTLIVING_ZOMBIE_MSG % (directory, data.grace_period))
            if result['exit_code'] == 0:
              result['exit_code'] = 1

      # This deletes out_dir if leak_temp_dir is not set.
      if out_dir:
        isolated_stats = result['stats'].setdefault('isolated', {})
        result['outputs_ref'], success, isolated_stats['upload'] = (
            upload_then_delete(data.storage, out_dir, data.leak_temp_dir))
      if not success and result['exit_code'] == 0:
        result['exit_code'] = 1
    except Exception as e:
      # Swallow any exception in the main finally clause.
      if out_dir:
        logging.exception('Leaking out_dir %s: %s', out_dir, e)
      result['internal_failure'] = str(e)
  return result
Marc-Antoine Ruel2283ad12014-02-09 11:14:57 -0500836
837
def run_tha_test(data, result_json):
  """Runs an executable and records execution metadata.

  If isolated_hash is specified, downloads the dependencies in the cache,
  hardlinks them into a temporary directory and runs the command specified in
  the .isolated.

  A temporary directory is created to hold the output files. The content inside
  this directory will be uploaded back to |storage| packaged as a .isolated
  file.

  Arguments:
  - data: TaskData instance.
  - result_json: File path to dump result metadata into. If set, the process
    exit code is always 0 unless an internal error occurred.

  Returns:
    Process exit code that should be used.
  """
  if result_json:
    # Write a json output file right away in case we get killed.
    result = {
        'exit_code': None,
        'had_hard_timeout': False,
        'internal_failure': 'Was terminated before completion',
        'outputs_ref': None,
        'version': 5,
    }
    tools.write_json(result_json, result, dense=True)

  # run_isolated exit code. Depends on if result_json is used or not.
  result = map_and_run(data, True)
  logging.info('Result:\n%s', tools.format_json(result, dense=True))

  if result_json:
    # We've found tests to delete 'work' when quitting, causing an exception
    # here. Try to recreate the directory if necessary.
    file_path.ensure_tree(os.path.dirname(result_json))
    tools.write_json(result_json, result, dense=True)
    # Only return 1 if there was an internal error.
    return int(bool(result['internal_failure']))

  # Marshall into old-style inline output.
  if result['outputs_ref']:
    # pylint: disable=unsubscriptable-object
    # Kept in a dedicated local so the |data| argument is not shadowed.
    legacy_ref = {
        'hash': result['outputs_ref']['isolated'],
        'namespace': result['outputs_ref']['namespace'],
        'storage': result['outputs_ref']['isolatedserver'],
    }
    # Flush before and after so the marker line is not interleaved with other
    # buffered output.
    sys.stdout.flush()
    print(
        '[run_isolated_out_hack]%s[/run_isolated_out_hack]' %
        tools.format_json(legacy_ref, dense=True))
    sys.stdout.flush()
  return result['exit_code'] or int(bool(result['internal_failure']))
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +0000894
895
# Yielded by 'install_client_and_packages'.
CipdInfo = collections.namedtuple('CipdInfo', [
    'client',     # cipd.CipdClient object
    'cache_dir',  # absolute path to bot-global cipd tag and instance cache
    'stats',      # dict with stats to return to the server
    'pins',       # dict with installed cipd pins to return to the server
])
903
904
@contextlib.contextmanager
def noop_install_packages(_run_dir, _isolated_dir):
  """Placeholder for 'install_client_and_packages' if cipd is disabled.

  Both arguments are ignored. Yields None in place of a CipdInfo.
  """
  yield None
909
910
Takuto Ikuta2efc7792019-11-27 14:33:34 +0000911def _install_packages(run_dir, cipd_cache_dir, client, packages):
iannuccib58d10d2017-03-18 02:00:25 -0700912 """Calls 'cipd ensure' for packages.
913
914 Args:
915 run_dir (str): root of installation.
916 cipd_cache_dir (str): the directory to use for the cipd package cache.
917 client (CipdClient): the cipd client to use
918 packages: packages to install, list [(path, package_name, version), ...].
iannuccib58d10d2017-03-18 02:00:25 -0700919
920 Returns: list of pinned packages. Looks like [
921 {
922 'path': 'subdirectory',
923 'package_name': 'resolved/package/name',
924 'version': 'deadbeef...',
925 },
926 ...
927 ]
928 """
929 package_pins = [None]*len(packages)
930 def insert_pin(path, name, version, idx):
931 package_pins[idx] = {
932 'package_name': name,
933 # swarming deals with 'root' as '.'
934 'path': path or '.',
935 'version': version,
936 }
937
938 by_path = collections.defaultdict(list)
939 for i, (path, name, version) in enumerate(packages):
940 # cipd deals with 'root' as ''
941 if path == '.':
942 path = ''
943 by_path[path].append((name, version, i))
944
945 pins = client.ensure(
Takuto Ikuta2efc7792019-11-27 14:33:34 +0000946 run_dir,
947 {
948 subdir: [(name, vers) for name, vers, _ in pkgs
949 ] for subdir, pkgs in by_path.items()
950 },
951 cache_dir=cipd_cache_dir,
iannuccib58d10d2017-03-18 02:00:25 -0700952 )
953
Marc-Antoine Ruel04903a32019-10-09 21:09:25 +0000954 for subdir, pin_list in sorted(pins.items()):
iannuccib58d10d2017-03-18 02:00:25 -0700955 this_subdir = by_path[subdir]
956 for i, (name, version) in enumerate(pin_list):
957 insert_pin(subdir, name, version, this_subdir[i][2])
958
Robert Iannucci461b30d2017-12-13 11:34:03 -0800959 assert None not in package_pins, (packages, pins, package_pins)
iannuccib58d10d2017-03-18 02:00:25 -0700960
961 return package_pins
962
963
@contextlib.contextmanager
def install_client_and_packages(run_dir, packages, service_url,
                                client_package_name, client_version, cache_dir,
                                isolated_dir):
  """Bootstraps CIPD client and installs CIPD packages.

  Yields CipdClient, stats, client info and pins (as single CipdInfo object).

  Pins and the CIPD client info are in the form of:
    [
      {
        "path": path, "package_name": package_name, "version": version,
      },
      ...
    ]
  (the CIPD client info is a single dictionary instead of a list)

  such that they correspond 1:1 to all input package arguments from the command
  line. These dictionaries make their way all the way back to swarming, where
  they become the arguments of CipdPackage.

  If 'packages' list is empty, will bootstrap CIPD client, but won't install
  any packages.

  The bootstrapped client (regardless whether 'packages' list is empty or not),
  will be made available to the task via $PATH.

  The isolated client package (ISOLATED_PACKAGE at ISOLATED_REVISION) is always
  installed into |isolated_dir|, whether or not 'packages' is empty.

  Args:
    run_dir (str): root of installation.
    packages: packages to install, list [(path, package_name, version), ...].
    service_url (str): CIPD server url, e.g.
      "https://chrome-infra-packages.appspot.com."
    client_package_name (str): CIPD package name of CIPD client.
    client_version (str): Version of CIPD client.
    cache_dir (str): where to keep cache of cipd clients, packages and tags.
    isolated_dir (str): where to download isolated client.
  """
  assert cache_dir

  start = time.time()

  cache_dir = os.path.abspath(cache_dir)
  cipd_cache_dir = os.path.join(cache_dir, 'cache')  # tag and instance caches
  run_dir = os.path.abspath(run_dir)
  packages = packages or []

  get_client_start = time.time()
  client_manager = cipd.get_client(service_url, client_package_name,
                                   client_version, cache_dir)

  with client_manager as client:
    get_client_duration = time.time() - get_client_start

    package_pins = []
    if packages:
      package_pins = _install_packages(run_dir, cipd_cache_dir, client,
                                       packages)

    # Install isolated client to |isolated_dir|.
    _install_packages(isolated_dir, cipd_cache_dir, client,
                      [('', ISOLATED_PACKAGE, ISOLATED_REVISION)])

    file_path.make_tree_files_read_only(run_dir)

    total_duration = time.time() - start
    logging.info(
        'Installing CIPD client and packages took %d seconds', total_duration)

    # The client context stays open for as long as the caller's 'with' body
    # runs.
    yield CipdInfo(
        client=client,
        cache_dir=cipd_cache_dir,
        stats={
            'duration': total_duration,
            'get_client_duration': get_client_duration,
        },
        pins={
            'client_package': {
                'package_name': client.package_name,
                'version': client.instance_id,
            },
            'packages': package_pins,
        })
nodirbe642ff2016-06-09 15:51:51 -07001046
1047
def create_option_parser():
  """Returns the option parser for run_isolated.

  General options are registered directly on the parser; the remaining ones are
  organized in the 'Data source', 'Named caches', 'Process containment' and
  'Debugging' groups, plus whatever isolateserver, cipd and auth add.
  """
  parser = logging_utils.OptionParserWithLogging(
      usage='%prog <options> [command to run or extra args]',
      version=__version__,
      log_file=RUN_ISOLATED_LOG_FILE)
  parser.add_option(
      '--clean', action='store_true',
      help='Cleans the cache, trimming it if necessary and remove corrupted '
           'items and returns without executing anything; use with -v to know '
           'what was done')
  parser.add_option(
      '--use-symlinks', action='store_true',
      help='Use symlinks instead of hardlinks')
  parser.add_option(
      '--json',
      help='dump output metadata to json file. When used, run_isolated returns '
           'non-zero only on internal failure')
  parser.add_option(
      '--hard-timeout', type='float', help='Enforce hard timeout in execution')
  parser.add_option(
      '--grace-period', type='float',
      help='Grace period between SIGTERM and SIGKILL')
  parser.add_option(
      '--raw-cmd', action='store_true',
      help='Ignore the isolated command, use the one supplied at the command '
           'line')
  parser.add_option(
      '--relative-cwd',
      help='Ignore the isolated \'relative_cwd\' and use this one instead; '
           'requires --raw-cmd')
  parser.add_option(
      '--env', default=[], action='append',
      help='Environment variables to set for the child process')
  parser.add_option(
      '--env-prefix', default=[], action='append',
      help='Specify a VAR=./path/fragment to put in the environment variable '
           'before executing the command. The path fragment must be relative '
           'to the isolated run directory, and must not contain a `..` token. '
           'The path will be made absolute and prepended to the indicated '
           '$VAR using the OS\'s path separator. Multiple items for the same '
           '$VAR will be prepended in order.')
  parser.add_option(
      '--bot-file',
      help='Path to a file describing the state of the host. The content is '
           'defined by on_before_task() in bot_config.')
  parser.add_option(
      '--switch-to-account',
      help='If given, switches LUCI_CONTEXT to given logical service account '
           '(e.g. "task" or "system") before launching the isolated process.')
  parser.add_option(
      '--output', action='append',
      help='Specifies an output to return. If no outputs are specified, all '
           'files located in $(ISOLATED_OUTDIR) will be returned; '
           'otherwise, outputs in both $(ISOLATED_OUTDIR) and those '
           'specified by --output option (there can be multiple) will be '
           'returned. Note that if a file in OUT_DIR has the same path '
           'as an --output option, the --output version will be returned.')
  parser.add_option(
      '-a', '--argsfile',
      # This is actually handled in parse_args; it's included here purely so it
      # can make it into the help text.
      help='Specify a file containing a JSON array of arguments to this '
           'script. If --argsfile is provided, no other argument may be '
           'provided on the command line.')

  group = optparse.OptionGroup(parser, 'Data source')
  group.add_option(
      '-s', '--isolated',
      help='Hash of the .isolated to grab from the isolate server.')
  isolateserver.add_isolate_server_options(group)
  parser.add_option_group(group)

  isolateserver.add_cache_options(parser)

  cipd.add_cipd_options(parser)

  group = optparse.OptionGroup(parser, 'Named caches')
  group.add_option(
      '--named-cache',
      dest='named_caches',
      action='append',
      nargs=3,
      default=[],
      help='A named cache to request. Accepts 3 arguments: name, path, hint. '
           'name identifies the cache, must match regex [a-z0-9_]{1,4096}. '
           'path is a path relative to the run dir where the cache directory '
           'must be put to. '
           'This option can be specified more than once.')
  group.add_option(
      '--named-cache-root', default='named_caches',
      help='Cache root directory. Default=%default')
  parser.add_option_group(group)

  # These options are registered on the group, not on the parser, so that they
  # are listed under the 'Process containment' heading in --help. Parsing is
  # unaffected: options of a group registered with add_option_group() are
  # recognized by the parser like any other option.
  group = optparse.OptionGroup(parser, 'Process containment')
  group.add_option(
      '--lower-priority', action='store_true',
      help='Lowers the child process priority')
  group.add_option(
      '--containment-type', choices=('NONE', 'AUTO', 'JOB_OBJECT'),
      default='NONE',
      help='Type of container to use')
  group.add_option(
      '--limit-processes', type='int', default=0,
      help='Maximum number of active processes in the containment')
  group.add_option(
      '--limit-total-committed-memory', type='int', default=0,
      help='Maximum sum of committed memory in the containment')
  parser.add_option_group(group)

  group = optparse.OptionGroup(parser, 'Debugging')
  group.add_option(
      '--leak-temp-dir',
      action='store_true',
      help='Deliberately leak isolate\'s temp dir for later examination. '
           'Default: %default')
  group.add_option(
      '--root-dir', help='Use a directory instead of a random one')
  parser.add_option_group(group)

  auth.add_auth_options(parser)

  parser.set_defaults(cache='cache', cipd_cache='cipd_cache')
  return parser
1171
1172
def process_named_cache_options(parser, options, time_fn=None):
  """Validates named cache options and returns a NamedCache, if enabled.

  Arguments:
  - parser: option parser; its error() method is called on invalid input.
  - options: parsed options; named_caches, named_cache_root and, when a root is
    set, min_free_space are read.
  - time_fn: forwarded as-is to local_caching.NamedCache.

  Returns:
    A local_caching.NamedCache instance rooted at the absolute path of
    options.named_cache_root, or None when options.named_cache_root is empty.
  """
  if options.named_caches and not options.named_cache_root:
    parser.error('--named-cache is specified, but --named-cache-root is empty')
  for name, path, hint in options.named_caches:
    if not CACHE_NAME_RE.match(name):
      parser.error(
          'cache name %r does not match %r' % (name, CACHE_NAME_RE.pattern))
    if not path:
      parser.error('cache path cannot be empty')
    try:
      # int() instead of long(): long does not exist on python3, and int()
      # transparently returns a long for large values on python2.
      int(hint)
    except ValueError:
      parser.error('cache hint must be a number')
  if options.named_cache_root:
    # Make these configurable later if there is use case but for now it's fairly
    # safe values.
    # In practice, a fair chunk of bots are already recycled on a daily schedule
    # so this code doesn't have any effect to them, unless they are preloaded
    # with a really old cache.
    policies = local_caching.CachePolicies(
        # 1TiB.
        max_cache_size=1024*1024*1024*1024,
        min_free_space=options.min_free_space,
        max_items=50,
        max_age_secs=MAX_AGE_SECS)
    root_dir = six.text_type(os.path.abspath(options.named_cache_root))
    return local_caching.NamedCache(root_dir, policies, time_fn=time_fn)
  return None
1202
1203
def parse_args(args):
  """Parses the command line, expanding --argsfile if present.

  Arguments:
  - args: list of command line arguments, without the program name.

  Returns:
    Tuple (parser, options, args) where parser is the parser returned by
    create_option_parser(), and options and args are what it parsed.

  Exits through the parser error path if --argsfile is combined with any other
  argument.
  """
  # Create a fake mini-parser just to get out the "-a" command. Note that
  # it's not documented here; instead, it's documented in create_option_parser
  # even though that parser will never actually get to parse it. This is
  # because --argsfile is exclusive with all other options and arguments.
  file_argparse = argparse.ArgumentParser(add_help=False)
  file_argparse.add_argument('-a', '--argsfile')
  (file_args, nonfile_args) = file_argparse.parse_known_args(args)
  if file_args.argsfile:
    if nonfile_args:
      # Note the trailing space: the two literals are concatenated.
      file_argparse.error('Can\'t specify --argsfile with '
                          'any other arguments (%s)' % nonfile_args)
    try:
      with open(file_args.argsfile, 'r') as f:
        args = json.load(f)
    except (IOError, OSError, ValueError) as e:
      # We don't need to error out here - "args" keeps its original value, so
      # the regular parser below still runs on it and reports any problem.
      print('Couldn\'t read arguments: %s' % e, file=sys.stderr)

  # Even if we failed to read the args, just call the normal parser now since it
  # will print the correct help message.
  parser = create_option_parser()
  options, args = parser.parse_args(args)
  return (parser, options, args)
1230
1231
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001232def _calc_named_cache_hint(named_cache, named_caches):
1233 """Returns the expected size of the missing named caches."""
1234 present = named_cache.available
1235 size = 0
1236 for name, _, hint in named_caches:
1237 if name not in present:
1238 hint = long(hint)
1239 if hint > 0:
1240 size += hint
1241 return size
1242
1243
def main(args):
  """Entry point: validates the options, then either cleans caches or runs.

  Steps, in order:
  - parse the command line (including --argsfile);
  - set up the named cache and the isolate cache, growing --min-free-space by
    the size hint of the missing named caches;
  - with --clean: trim and clean up the caches, then return;
  - otherwise validate the remaining options, build a TaskData and hand it to
    run_tha_test().

  Args:
    args: list of command line arguments, without the program name.

  Returns:
    0 after a --clean run, 1 when a cipd.Error, local_caching.NamedCacheError
    or local_caching.NoMoreSpace is caught, otherwise whatever run_tha_test()
    returns. Invalid options are reported through parser.error(), which is
    presumably not expected to return.
  """
  # Warning: when --argsfile is used, the strings are unicode instances, when
  # parsed normally, the strings are str instances.
  (parser, options, args) = parse_args(args)

  if not file_path.enable_symlink():
    logging.warning('Symlink support is not enabled')

  named_cache = process_named_cache_options(parser, options)
  # hint is 0 if there's no named cache.
  hint = _calc_named_cache_hint(named_cache, options.named_caches)
  if hint:
    # Increase the --min-free-space value by the hint, and recreate the
    # NamedCache instance so it gets the updated CachePolicy.
    options.min_free_space += hint
    named_cache = process_named_cache_options(parser, options)

  # TODO(maruel): CIPD caches should be defined at an higher level here too, so
  # they can be cleaned the same way.
  isolate_cache = isolateserver.process_cache_options(options, trim=False)
  caches = []
  if isolate_cache:
    caches.append(isolate_cache)
  if named_cache:
    caches.append(named_cache)
  # Directory handed to trim_caches(): the first cache's directory when there
  # is one, the current directory otherwise.
  root = caches[0].cache_dir if caches else six.text_type(os.getcwd())
  if options.clean:
    if options.isolated:
      parser.error('Can\'t use --isolated with --clean.')
    if options.isolate_server:
      parser.error('Can\'t use --isolate-server with --clean.')
    if options.json:
      parser.error('Can\'t use --json with --clean.')
    if options.named_caches:
      parser.error('Can\'t use --named-cache with --clean.')
    # Trim first, then clean.
    local_caching.trim_caches(
        caches,
        root,
        min_free_space=options.min_free_space,
        max_age_secs=MAX_AGE_SECS)
    for c in caches:
      c.cleanup()
    return 0

  # Trim must still be done for the following case:
  # - named-cache was used
  # - some entries, with a large hint, were missing
  # - --min-free-space was increased accordingly, thus trimming is needed
  # Otherwise, this will have no effect, as bot_main calls run_isolated with
  # --clean after each task.
  if hint:
    logging.info('Additional trimming of %d bytes', hint)
    local_caching.trim_caches(
        caches,
        root,
        min_free_space=options.min_free_space,
        max_age_secs=MAX_AGE_SECS)

  if not options.isolated and not args:
    parser.error('--isolated or command to run is required.')

  auth.process_auth_options(parser, options)

  isolateserver.process_isolate_server_options(
      parser, options, True, False)
  if not options.isolate_server:
    if options.isolated:
      parser.error('--isolated requires --isolate-server')
    if ISOLATED_OUTDIR_PARAMETER in args:
      parser.error(
          '%s in args requires --isolate-server' % ISOLATED_OUTDIR_PARAMETER)

  if options.root_dir:
    options.root_dir = six.text_type(os.path.abspath(options.root_dir))
  if options.json:
    options.json = six.text_type(os.path.abspath(options.json))

  # --env: list of 'key=value' strings turned into a dict.
  if any('=' not in i for i in options.env):
    parser.error(
        '--env required key=value form. value can be skipped to delete '
        'the variable')
  options.env = dict(i.split('=', 1) for i in options.env)

  # --env-prefix: list of 'VAR=./path' strings turned into a dict mapping each
  # variable to the list of its (normalized, relative) paths.
  prefixes = {}
  cwd = os.path.realpath(os.getcwd())
  for item in options.env_prefix:
    if '=' not in item:
      parser.error(
          '--env-prefix %r is malformed, must be in the form `VAR=./path`'
          % item)
    key, opath = item.split('=', 1)
    if os.path.isabs(opath):
      parser.error('--env-prefix %r path is bad, must be relative.' % opath)
    opath = os.path.normpath(opath)
    # NOTE(review): this is a plain string prefix test, so a sibling directory
    # whose name merely starts with cwd's name would also pass - confirm
    # whether that matters here.
    if not os.path.realpath(os.path.join(cwd, opath)).startswith(cwd):
      parser.error(
          '--env-prefix %r path is bad, must be relative and not contain `..`.'
          % opath)
    prefixes.setdefault(key, []).append(opath)
  options.env_prefix = prefixes

  cipd.validate_cipd_options(parser, options)

  install_packages_fn = noop_install_packages
  if options.cipd_enabled:
    install_packages_fn = (
        lambda run_dir, isolated_dir: install_client_and_packages(
            run_dir, cipd.parse_package_args(options.cipd_packages),
            options.cipd_server, options.cipd_client_package,
            options.cipd_client_version, cache_dir=options.cipd_cache,
            isolated_dir=isolated_dir))

  @contextlib.contextmanager
  def install_named_caches(run_dir):
    # WARNING: this function depends on "options" variable defined in the outer
    # function.
    # NOTE(review): this only asserts that the text form of run_dir is
    # non-empty; an isinstance() check may have been intended - confirm.
    assert six.text_type(run_dir), repr(run_dir)
    assert os.path.isabs(run_dir), run_dir
    named_caches = [(os.path.join(run_dir, six.text_type(relpath)), name)
                    for name, relpath, _ in options.named_caches]
    for path, name in named_caches:
      named_cache.install(path, name)
    try:
      yield
    finally:
      # Uninstall each named cache, returning it to the cache pool. If an
      # uninstall fails for a given cache, it will remain in the task's
      # temporary space, get cleaned up by the Swarming bot, and be lost.
      #
      # If the Swarming bot cannot clean up the cache, it will handle it like
      # any other bot file that could not be removed.
      for path, name in reversed(named_caches):
        try:
          # uninstall() doesn't trim but does call save() implicitly. Trimming
          # *must* be done manually via periodic 'run_isolated.py --clean'.
          named_cache.uninstall(path, name)
        except local_caching.NamedCacheError:
          # The message reads "<cache name> at <path>", so name goes first.
          logging.exception('Error while removing named cache %r at %r. '
                            'The cache will be lost.', name, path)

  # With --raw-cmd the positional arguments are the command itself; without
  # it they are passed along as extra arguments.
  extra_args = []
  command = []
  if options.raw_cmd:
    command = args
    if options.relative_cwd:
      a = os.path.normpath(os.path.abspath(options.relative_cwd))
      if not a.startswith(os.getcwd()):
        parser.error(
            '--relative-cwd must not try to escape the working directory')
  else:
    if options.relative_cwd:
      parser.error('--relative-cwd requires --raw-cmd')
    extra_args = args

  # Any value other than 'AUTO' or 'JOB_OBJECT' means no containment.
  containment_type = subprocess42.Containment.NONE
  if options.containment_type == 'AUTO':
    containment_type = subprocess42.Containment.AUTO
  if options.containment_type == 'JOB_OBJECT':
    containment_type = subprocess42.Containment.JOB_OBJECT
  containment = subprocess42.Containment(
      containment_type=containment_type,
      limit_processes=options.limit_processes,
      limit_total_committed_memory=options.limit_total_committed_memory)

  data = TaskData(
      command=command,
      relative_cwd=options.relative_cwd,
      extra_args=extra_args,
      isolated_hash=options.isolated,
      storage=None,
      isolate_cache=isolate_cache,
      outputs=options.output,
      install_named_caches=install_named_caches,
      leak_temp_dir=options.leak_temp_dir,
      root_dir=_to_unicode(options.root_dir),
      hard_timeout=options.hard_timeout,
      grace_period=options.grace_period,
      bot_file=options.bot_file,
      switch_to_account=options.switch_to_account,
      install_packages_fn=install_packages_fn,
      use_symlinks=bool(options.use_symlinks),
      env=options.env,
      env_prefix=options.env_prefix,
      lower_priority=bool(options.lower_priority),
      containment=containment)
  try:
    if options.isolate_server:
      server_ref = isolate_storage.ServerRef(
          options.isolate_server, options.namespace)
      storage = isolateserver.get_storage(server_ref)
      with storage:
        data = data._replace(storage=storage)
        # Hashing schemes used by |storage| and |isolate_cache| MUST match.
        assert storage.server_ref.hash_algo == server_ref.hash_algo
        return run_tha_test(data, options.json)
    return run_tha_test(data, options.json)
  except (
      cipd.Error,
      local_caching.NamedCacheError,
      local_caching.NoMoreSpace) as ex:
    # Exceptions have no .message attribute on python 3 (and it may be empty
    # on python 2); fall back to the string form so the error is always shown.
    print(getattr(ex, 'message', None) or str(ex), file=sys.stderr)
    return 1
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001447
1448
if __name__ == '__main__':
  # Script entry point: prepare the process, then exit with main()'s result.
  subprocess42.inhibit_os_error_reporting()
  # Ensure that we are always running with the correct encoding.
  fix_encoding.fix_encoding()
  cli_args = sys.argv[1:]
  sys.exit(main(cli_args))