blob: 86230f160dc57155ab5826302b117504304f82b6 [file] [log] [blame]
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001#!/usr/bin/env python
maruelea586f32016-04-05 11:11:33 -07002# Copyright 2012 The LUCI Authors. All rights reserved.
maruelf1f5e2a2016-05-25 17:10:39 -07003# Use of this source code is governed under the Apache License, Version 2.0
4# that can be found in the LICENSE file.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00005
nodir55be77b2016-05-03 09:39:57 -07006"""Runs a command with optional isolated input/output.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00007
run_isolated takes care of setting up a temporary environment, running a
command, and tearing it down.
nodir55be77b2016-05-03 09:39:57 -070010
Marc-Antoine Rueleed2f3a2019-03-14 00:00:40 +000011It handles downloading and uploading isolated files, mapping CIPD packages and
12reusing stateful named caches.
13
14The isolated files, CIPD packages and named caches are kept as a global LRU
15cache.
Marc-Antoine Ruel2283ad12014-02-09 11:14:57 -050016
Roberto Carrillo71ade6d2018-10-08 22:30:24 +000017Any ${EXECUTABLE_SUFFIX} on the command line or the environment variables passed
18with the --env option will be replaced with ".exe" string on Windows and "" on
19other platforms.
nodirbe642ff2016-06-09 15:51:51 -070020
Roberto Carrillo71ade6d2018-10-08 22:30:24 +000021Any ${ISOLATED_OUTDIR} on the command line or the environment variables passed
22with the --env option will be replaced by the location of a temporary directory
23upon execution of the command specified in the .isolated file. All content
24written to this directory will be uploaded upon termination and the .isolated
25file describing this directory will be printed to stdout.
bpastene447c1992016-06-20 15:21:47 -070026
Marc-Antoine Rueleed2f3a2019-03-14 00:00:40 +000027Any ${SWARMING_BOT_FILE} on the command line or the environment variables passed
28with the --env option will be replaced by the value of the --bot-file parameter.
29This file is used by a swarming bot to communicate state of the host to tasks.
30It is written to by the swarming bot's on_before_task() hook in the swarming
31server's custom bot_config.py.
32
33See
34https://chromium.googlesource.com/infra/luci/luci-py.git/+/master/appengine/swarming/doc/Magic-Values.md
35for all the variables.
36
37See
38https://chromium.googlesource.com/infra/luci/luci-py.git/+/master/appengine/swarming/swarming_bot/config/bot_config.py
39for more information about bot_config.py.
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000040"""
41
Marc-Antoine Ruelf899c482019-10-10 23:32:06 +000042from __future__ import print_function
43
44__version__ = '1.0.1'
maruel@chromium.orgdedbf492013-09-12 20:42:11 +000045
aludwin7556e0c2016-10-26 08:46:10 -070046import argparse
maruel064c0a32016-04-05 11:47:15 -070047import base64
iannucci96fcccc2016-08-30 15:52:22 -070048import collections
vadimsh232f5a82017-01-20 19:23:44 -080049import contextlib
Sadaf Matinkhoo10743a62018-03-29 16:28:58 -040050import errno
aludwin7556e0c2016-10-26 08:46:10 -070051import json
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000052import logging
53import optparse
54import os
Takuto Ikuta5c59a842020-01-24 03:05:24 +000055import platform
Marc-Antoine Ruel8b11dbd2018-05-18 14:31:22 -040056import re
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000057import sys
58import tempfile
maruel064c0a32016-04-05 11:47:15 -070059import time
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000060
Marc-Antoine Ruel016c7602019-04-02 18:31:13 +000061from utils import tools
62tools.force_local_third_party()
vadimsh@chromium.orga4326472013-08-24 02:05:41 +000063
Marc-Antoine Ruel016c7602019-04-02 18:31:13 +000064# third_party/
65from depot_tools import fix_encoding
Takuto Ikuta6e2ff962019-10-29 12:35:27 +000066import six
Marc-Antoine Ruel016c7602019-04-02 18:31:13 +000067
68# pylint: disable=ungrouped-imports
69import auth
70import cipd
71import isolate_storage
72import isolateserver
73import local_caching
74from libs import luci_context
Vadim Shtayura6b555c12014-07-23 16:22:18 -070075from utils import file_path
maruel12e30012015-10-09 11:55:35 -070076from utils import fs
maruel064c0a32016-04-05 11:47:15 -070077from utils import large
Marc-Antoine Ruelf74cffe2015-07-15 15:21:34 -040078from utils import logging_utils
Ye Kuang2dd17442020-04-22 08:45:52 +000079from utils import net
Marc-Antoine Ruelcfb60852014-07-02 15:22:00 -040080from utils import on_error
Marc-Antoine Ruelc44f5722015-01-08 16:10:01 -050081from utils import subprocess42
maruel@chromium.orgdedbf492013-09-12 20:42:11 +000082
vadimsh@chromium.orga4326472013-08-24 02:05:41 +000083
# Magic variables that can be found in the isolate task command line or in the
# environment variables passed with --env. They are substituted by
# replace_parameters().
ISOLATED_OUTDIR_PARAMETER = '${ISOLATED_OUTDIR}'
EXECUTABLE_SUFFIX_PARAMETER = '${EXECUTABLE_SUFFIX}'
SWARMING_BOT_FILE_PARAMETER = '${SWARMING_BOT_FILE}'


# The name of the log file to use.
RUN_ISOLATED_LOG_FILE = 'run_isolated.log'


# The name of the log to use for the run_test_cases.py command.
RUN_TEST_CASES_LOG = 'run_test_cases.log'


# Use short names for temporary directories. This is driven by Windows, which
# imposes a relatively short maximum path length of 260 characters, often
# referred to as MAX_PATH. It is relatively easy to create files with longer
# path length. A use case is with recursive dependency trees like npm packages.
#
# It is recommended to start the script with a `root_dir` as short as
# possible.
# - ir stands for isolated_run
# - io stands for isolated_out
# - it stands for isolated_tmp
# - ic stands for isolated_client
ISOLATED_RUN_DIR = u'ir'
ISOLATED_OUT_DIR = u'io'
ISOLATED_TMP_DIR = u'it'
ISOLATED_CLIENT_DIR = u'ic'

# CIPD package name and pinned revision of the Go isolated client.
# TODO(tikuta): take these parameters from luci-config?
# Update tag by `./client/update_isolated.sh`.
# Or take revision from
# https://ci.chromium.org/p/infra-internal/g/infra-packagers/console
ISOLATED_PACKAGE = 'infra/tools/luci/isolated/${platform}'
ISOLATED_REVISION = 'git_revision:be4040d5064cbac78820314bb1aac02f0c2a3c3e'

# Valid named cache names: 1 to 4096 characters out of [a-z0-9_].
# Keep synced with task_request.py
CACHE_NAME_RE = re.compile(r'^[a-z0-9_]{1,4096}$')
Marc-Antoine Ruel8b11dbd2018-05-18 14:31:22 -0400123
124
marueld928c862017-06-08 08:20:04 -0700125OUTLIVING_ZOMBIE_MSG = """\
126*** Swarming tried multiple times to delete the %s directory and failed ***
127*** Hard failing the task ***
128
129Swarming detected that your testing script ran an executable, which may have
130started a child executable, and the main script returned early, leaving the
131children executables playing around unguided.
132
133You don't want to leave children processes outliving the task on the Swarming
134bot, do you? The Swarming bot doesn't.
135
136How to fix?
137- For any process that starts children processes, make sure all children
138 processes terminated properly before each parent process exits. This is
139 especially important in very deep process trees.
140 - This must be done properly both in normal successful task and in case of
141 task failure. Cleanup is very important.
142- The Swarming bot sends a SIGTERM in case of timeout.
143 - You have %s seconds to comply after the signal was sent to the process
144 before the process is forcibly killed.
145- To achieve not leaking children processes in case of signals on timeout, you
146 MUST handle signals in each executable / python script and propagate them to
147 children processes.
148 - When your test script (python or binary) receives a signal like SIGTERM or
149 CTRL_BREAK_EVENT on Windows), send it to all children processes and wait for
150 them to terminate before quitting.
151
152See
Marc-Antoine Ruelc7243592018-05-24 17:04:04 -0400153https://chromium.googlesource.com/infra/luci/luci-py.git/+/master/appengine/swarming/doc/Bot.md#Graceful-termination_aka-the-SIGTERM-and-SIGKILL-dance
marueld928c862017-06-08 08:20:04 -0700154for more information.
155
156*** May the SIGKILL force be with you ***
157"""
158
159
# Maximum age, in seconds. Currently hardcoded. Eventually could be exposed as
# a flag once there's value.
# 3 weeks = 21 days * 24 hours * 60 minutes * 60 seconds.
MAX_AGE_SECS = 21*24*60*60
163
164
# Immutable bag of everything needed to run one task. Fields are documented
# inline, in declaration order.
TaskData = collections.namedtuple(
    'TaskData',
    (
        # Command line to run, as a list of strings. Takes precedence over
        # whatever the isolated file specifies.
        'command',
        # Directory, relative to the run directory, to start the command in.
        'relative_cwd',
        # Extra arguments (list of strings) appended to the command found in
        # the isolated file.
        'extra_args',
        # Hash of the .isolated file to fetch in order to recreate the tree of
        # files needed by the target executable. The command in the .isolated
        # is executed. Mutually exclusive with the command argument.
        'isolated_hash',
        # isolateserver.Storage instance used to retrieve remote objects. It
        # references an isolateserver.StorageApi, which does the actual I/O.
        'storage',
        # isolateserver.LocalCache instance that caches retrieved objects so
        # they are not fetched over and over. Can be on-disk or in-memory.
        'isolate_cache',
        # Paths, relative to root_dir, to include in the output isolated
        # bundle once the task completes (see link_outputs_to_outdir).
        'outputs',
        # Function (run_dir) => context manager installing named caches into
        # |run_dir|.
        'install_named_caches',
        # When True, the temporary directory is intentionally leaked so it can
        # be inspected afterwards.
        'leak_temp_dir',
        # Directory in which the temporary directory is created. When not
        # specified, a random temporary directory is created.
        'root_dir',
        # The process is killed if it runs longer than this many seconds.
        'hard_timeout',
        # Seconds to wait between SIGTERM and SIGKILL.
        'grace_period',
        # Path to a file with bot state; substituted for the
        # ${SWARMING_BOT_FILE} task command line argument.
        'bot_file',
        # Logical account to switch LUCI_CONTEXT into.
        'switch_to_account',
        # Context manager dir => CipdInfo, see install_client_and_packages.
        'install_packages_fn',
        # Whether to use the go isolated client.
        'use_go_isolated',
        # Cache directory used by the go isolated client.
        'go_cache_dir',
        # Cache parameters handed to the go isolated client.
        'go_cache_policies',
        # Environment variables to set.
        'env',
        # Environment variables to mutate with relative directories.
        # Example: {"ENV_KEY": ['relative', 'paths', 'to', 'prepend']}
        'env_prefix',
        # Whether to lower the task process priority.
        'lower_priority',
        # subprocess42.Containment instance. Can be None.
        'containment',
    ))
Marc-Antoine Ruel7de52592017-12-07 10:41:12 -0500227
228
Marc-Antoine Ruelee6ca622017-11-29 11:19:16 -0500229def _to_str(s):
230 """Downgrades a unicode instance to str. Pass str through as-is."""
231 if isinstance(s, str):
232 return s
233 # This is technically incorrect, especially on Windows. In theory
234 # sys.getfilesystemencoding() should be used to use the right 'ANSI code
235 # page' on Windows, but that causes other problems, as the character set
236 # is very limited.
237 return s.encode('utf-8')
238
239
def _to_unicode(s):
  """Returns |s| as unicode text, decoding it from UTF-8 when needed.

  None and values that already are six.text_type are returned unchanged.
  """
  already_text = isinstance(s, six.text_type)
  if already_text or s is None:
    return s
  return s.decode('utf-8')
245
246
def make_temp_dir(prefix, root_dir):
  """Creates a new unique temporary directory and returns its path as text.

  The directory is created inside |root_dir| with a name starting with
  |prefix|.
  """
  created = tempfile.mkdtemp(dir=root_dir, prefix=prefix)
  return six.text_type(created)
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +0000250
251
def change_tree_read_only(rootdir, read_only):
  """Applies the read-only policy |read_only| to the tree under |rootdir|.

  |read_only| is one of:
  - 2: files and directories are made read only.
  - 1: only files are made read only.
  - 0 or None: the whole tree is made writeable.

  Raises:
    ValueError if |read_only| is none of the values above.
  """
  if read_only == 2:
    # Files and directories (except on Windows) are marked read only. This
    # inhibits modifying, creating or deleting files in the test directory,
    # except on Windows where creating and deleting files is still possible.
    file_path.make_tree_read_only(rootdir)
    return

  if read_only == 1:
    # Files are marked read only but not the directories. This inhibits
    # modifying files but creating or deleting files is still possible.
    file_path.make_tree_files_read_only(rootdir)
    return

  if read_only not in (0, None):
    raise ValueError(
        'change_tree_read_only(%s, %s): Unknown flag %s' %
        (rootdir, read_only, read_only))

  # Anything can be modified.
  # TODO(maruel): This is currently dangerous as long as
  # DiskContentAddressedCache.touch() is not yet changed to verify the hash of
  # the content of the files it is looking at, so that if a test modifies an
  # input file, the file must be deleted.
  file_path.make_tree_writeable(rootdir)
278
279
@contextlib.contextmanager
def set_luci_context_account(account, tmp_dir):
  """Context manager that makes |account| the default LUCI_CONTEXT account.

  Nothing is changed in any of these cases:
  - |account| is None or '': run_isolated.py was called without the
    '--switch-to-account' flag. If it runs inside some LUCI_CONTEXT
    environment, the task simply inherits the account already set. This may
    happen when users invoke run_isolated.py explicitly from their code.
  - LUCI_CONTEXT-based auth is not in use (no 'local_auth' section).
  - |account| already is the default account.

  Otherwise a new LUCI_CONTEXT is written (using |tmp_dir|) for the duration
  of the context. If the requested account is not defined in the context, the
  default account is dropped, i.e. the task switches to non-authenticated
  access. This happens for Swarming tasks that don't use 'task' service
  accounts.
  """
  # Stays None unless a modified 'local_auth' section has to be written.
  switched_auth = None
  if account:
    current_auth = luci_context.read('local_auth')
    # See LUCI_CONTEXT.md for the format of 'local_auth'.
    if current_auth and current_auth.get('default_account_id') != account:
      known_ids = {entry['id'] for entry in current_auth.get('accounts') or []}
      if account not in known_ids:
        logging.warning(
            'Requested LUCI_CONTEXT account %r is not available (have only '
            '%r), disabling authentication', account, sorted(known_ids))
        current_auth.pop('default_account_id', None)
      else:
        logging.info('Switching default LUCI_CONTEXT account to %r', account)
        current_auth['default_account_id'] = account
      switched_auth = current_auth

  if switched_auth is None:
    # Not switching: no account requested, no LUCI_CONTEXT auth, or the
    # requested account is already the default one.
    yield
    return

  with luci_context.write(_tmpdir=tmp_dir, local_auth=switched_auth):
    yield
326
327
def process_command(command, out_dir, bot_file):
  """Returns a copy of |command| with parameter tokens substituted.

  Each argument is processed independently by replace_parameters().

  Raises:
    ValueError if a parameter is requested in |command| but its value is not
    provided.
  """
  processed = []
  for argument in command:
    processed.append(replace_parameters(argument, out_dir, bot_file))
  return processed
336
337
def replace_parameters(arg, out_dir, bot_file):
  """Substitutes the magic parameter tokens found in the string |arg|.

  - EXECUTABLE_SUFFIX_PARAMETER becomes cipd.EXECUTABLE_SUFFIX.
  - ISOLATED_OUTDIR_PARAMETER becomes |out_dir|.
  - SWARMING_BOT_FILE_PARAMETER becomes |bot_file|; when |bot_file| is not
    provided, a warning is logged and the token is left in place.

  Raises:
    ValueError if ISOLATED_OUTDIR_PARAMETER is requested in |arg| but
    |out_dir| is not provided.
  """
  arg = arg.replace(EXECUTABLE_SUFFIX_PARAMETER, cipd.EXECUTABLE_SUFFIX)
  path_substituted = False

  if ISOLATED_OUTDIR_PARAMETER in arg:
    if not out_dir:
      raise ValueError(
          'output directory is requested in command or env var, but not '
          'provided; please specify one')
    arg = arg.replace(ISOLATED_OUTDIR_PARAMETER, out_dir)
    path_substituted = True

  if SWARMING_BOT_FILE_PARAMETER in arg:
    if not bot_file:
      logging.warning('SWARMING_BOT_FILE_PARAMETER found in command or env '
                      'var, but no bot_file specified. Leaving parameter '
                      'unchanged.')
    else:
      arg = arg.replace(SWARMING_BOT_FILE_PARAMETER, bot_file)
      path_substituted = True

  if not path_substituted:
    return arg
  # Slashes are converted only when a path parameter was substituted, because
  # of arguments like '${ISOLATED_OUTDIR}/foo/bar'.
  return arg.replace('/', os.sep)
maruela9cfd6f2015-09-15 11:03:15 -0700367
368
Roberto Carrillo71ade6d2018-10-08 22:30:24 +0000369
def get_command_env(tmp_dir, cipd_info, run_dir, env, env_prefixes, out_dir,
                    bot_file):
  """Returns full OS environment to run a command in.

  Starts from a copy of os.environ, applies |env|, puts the directory with the
  cipd binary in front of PATH, exposes the CIPD_CACHE_DIR env var, installs
  all env_prefixes and points the temp directory variables to |tmp_dir|.

  Args:
    tmp_dir: temp directory.
    cipd_info: CipdInfo object if cipd client is used, None if not.
    run_dir: The root directory the isolated tree is mapped in.
    env: environment variables to use. A variable with an empty value is
        removed from the environment; other values go through
        replace_parameters().
    env_prefixes: {"ENV_KEY": ['cwd', 'relative', 'paths', 'to', 'prepend']}
    out_dir: Isolated output directory. Required to be != None if any of the
        env vars contain ISOLATED_OUTDIR_PARAMETER.
    bot_file: Required to be != None if any of the env vars contain
        SWARMING_BOT_FILE_PARAMETER.

  Raises:
    ValueError if an env var requests ISOLATED_OUTDIR_PARAMETER but |out_dir|
    is not provided (see replace_parameters).
  """
  out = os.environ.copy()
  for k, v in env.items():
    if not v:
      out.pop(k, None)
    else:
      out[k] = replace_parameters(v, out_dir, bot_file)

  if cipd_info:
    bin_dir = _to_str(os.path.dirname(cipd_info.client.binary_path))
    # PATH may be missing, e.g. when |env| unsets it with an empty value. Do
    # not fail with KeyError in that case; like for env_prefixes below, the
    # current value is appended only when there is one.
    cur_path = out.get('PATH')
    if cur_path:
      out['PATH'] = '%s%s%s' % (bin_dir, os.pathsep, cur_path)
    else:
      out['PATH'] = bin_dir
    out['CIPD_CACHE_DIR'] = _to_str(cipd_info.cache_dir)

  for key, paths in env_prefixes.items():
    assert isinstance(paths, list), paths
    # Prefixes are relative to |run_dir|; the current value, if any, goes last.
    paths = [os.path.normpath(os.path.join(run_dir, p)) for p in paths]
    cur = out.get(key)
    if cur:
      paths.append(cur)
    out[key] = _to_str(os.pathsep.join(paths))

  tmp_dir = _to_str(tmp_dir)
  # pylint: disable=line-too-long
  # * python respects $TMPDIR, $TEMP, and $TMP in this order, regardless of
  #   platform. So $TMPDIR must be set on all platforms.
  #   https://github.com/python/cpython/blob/2.7/Lib/tempfile.py#L155
  out['TMPDIR'] = tmp_dir
  if sys.platform == 'win32':
    # * chromium's base utils uses GetTempPath().
    #   https://cs.chromium.org/chromium/src/base/files/file_util_win.cc?q=GetTempPath
    # * Go uses GetTempPath().
    # * GetTempDir() uses %TMP%, then %TEMP%, then other stuff. So %TMP% must
    #   be set.
    #   https://docs.microsoft.com/en-us/windows/desktop/api/fileapi/nf-fileapi-gettemppathw
    out['TMP'] = tmp_dir
    # https://blogs.msdn.microsoft.com/oldnewthing/20150417-00/?p=44213
    out['TEMP'] = tmp_dir
  elif sys.platform == 'darwin':
    # * Chromium uses a hack on macOS before calling into
    #   NSTemporaryDirectory().
    #   https://cs.chromium.org/chromium/src/base/files/file_util_mac.mm?q=GetTempDir
    #   https://developer.apple.com/documentation/foundation/1409211-nstemporarydirectory
    out['MAC_CHROMIUM_TMPDIR'] = tmp_dir
  else:
    # TMPDIR is specified as the POSIX standard envvar for the temp directory.
    #   http://pubs.opengroup.org/onlinepubs/9699919799/basedefs/V1_chap08.html
    # * mktemp on linux respects $TMPDIR.
    # * Chromium respects $TMPDIR on linux.
    #   https://cs.chromium.org/chromium/src/base/files/file_util_posix.cc?q=GetTempDir
    # * Go uses $TMPDIR.
    #   https://go.googlesource.com/go/+/go1.10.3/src/os/file_unix.go#307
    pass
  return out
vadimsh232f5a82017-01-20 19:23:44 -0800440
441
def run_command(
    command, cwd, env, hard_timeout, grace_period, lower_priority, containment):
  """Runs the command.

  The child is started detached. If it is still running after |hard_timeout|
  seconds, or if this process receives one of subprocess42.STOP_SIGNALS, the
  child is terminated, given |grace_period| seconds to exit, then killed.

  Args:
    command: command line to run, passed as-is to subprocess42.Popen.
    cwd: directory to start the command in.
    env: environment of the child process.
    hard_timeout: seconds to wait before terminating the child. A falsy value
        is passed as None to proc.wait().
    grace_period: seconds to wait after the termination request before killing
        the child. A falsy value is passed as None to proc.wait().
    lower_priority: forwarded to subprocess42.Popen.
    containment: forwarded to subprocess42.Popen.

  Returns:
    tuple(process exit code, bool if had a hard timeout)
  """
  logging.info(
      'run_command(%s, %s, %s, %s, %s, %s)',
      command, cwd, hard_timeout, grace_period, lower_priority, containment)

  exit_code = None
  had_hard_timeout = False
  with tools.Profiler('RunTest'):
    proc = None
    # Used as a mutable flag shared with handler(); non-empty once a stop
    # signal was received.
    had_signal = []
    try:
      # TODO(maruel): This code is imperfect. It doesn't handle well signals
      # during the download phase and there's short windows were things can go
      # wrong.
      def handler(signum, _frame):
        # Only the first signal received once the process is started is acted
        # upon. It is reported through the same exception as a timeout so both
        # share the termination code path below.
        if proc and not had_signal:
          logging.info('Received signal %d', signum)
          had_signal.append(True)
          raise subprocess42.TimeoutExpired(command, None)

      proc = subprocess42.Popen(
          command, cwd=cwd, env=env, detached=True, close_fds=True,
          lower_priority=lower_priority, containment=containment)
      with subprocess42.set_signal_handler(subprocess42.STOP_SIGNALS, handler):
        try:
          exit_code = proc.wait(hard_timeout or None)
        except subprocess42.TimeoutExpired:
          # Raised either by proc.wait() on timeout or by handler() on signal;
          # only the former counts as a hard timeout.
          if not had_signal:
            logging.warning('Hard timeout')
            had_hard_timeout = True
          logging.warning('Sending SIGTERM')
          proc.terminate()

      # Ignore signals in grace period. Forcibly give the grace period to the
      # child process.
      if exit_code is None:
        ignore = lambda *_: None
        with subprocess42.set_signal_handler(subprocess42.STOP_SIGNALS, ignore):
          try:
            exit_code = proc.wait(grace_period or None)
          except subprocess42.TimeoutExpired:
            # Now kill for real. The user can distinguish between the
            # following states:
            # - signal but process exited within grace period,
            #   hard_timed_out will be set but the process exit code will be
            #   script provided.
            # - processed exited late, exit code will be -9 on posix.
            logging.warning('Grace exhausted; sending SIGKILL')
            proc.kill()
      logging.info('Waiting for process exit')
      exit_code = proc.wait()
    except OSError as e:
      # This is not considered to be an internal error. The executable simply
      # does not exist.
      sys.stderr.write(
          '<The executable does not exist, a dependent library is missing or '
          'the command line is too long>\n'
          '<Check for missing .so/.dll in the .isolate or GN file or length of '
          'command line args>\n'
          '<Command: %s, Exception: %s>\n' % (command, e))
      if os.environ.get('SWARMING_TASK_ID'):
        # Give an additional hint when running as a swarming task.
        sys.stderr.write(
            '<See the task\'s page for commands to help diagnose this issue '
            'by reproducing the task locally>\n')
      # Failure to start the command is reported as exit code 1.
      exit_code = 1
  # The exit code is also logged masked to 32 bits and in hexadecimal.
  logging.info(
      'Command finished with exit code %d (%s)',
      exit_code, hex(0xffffffff & exit_code))
  return exit_code, had_hard_timeout
maruela9cfd6f2015-09-15 11:03:15 -0700518
519
def _fetch_and_map_with_go(isolated_hash, storage, outdir, go_cache_dir,
                           policies, isolated_client):
  """Fetches an isolated tree using the go client and creates the tree.

  Runs `<isolated_client> download` and reads back the JSON result file it
  writes. The temporary result file is always removed.

  Args:
    isolated_hash: hash of the .isolated file to fetch.
    storage: object whose |server_ref| provides the isolate server |url| and
        |namespace|.
    outdir: directory to map the tree into.
    go_cache_dir: cache directory handed to the go client.
    policies: cache policies; |max_items|, |max_cache_size| and
        |min_free_space| are handed to the go client.
    isolated_client: path to the go isolated client executable.

  Returns:
    tuple(bundle, stats) where |bundle| is an isolateserver.IsolatedBundle
    with only command, read_only and relative_cwd set, and |stats| is a dict
    with the keys 'duration', 'items_cold' and 'items_hot'.

  Raises:
    ValueError if the client exits with a non-zero code or is still running
    after the maximum timeout (in which case it is terminated first).
  """
  start = time.time()
  server_ref = storage.server_ref
  result_json_handle, result_json_path = tempfile.mkstemp(
      prefix=u'fetch-and-map-result-', suffix=u'.json')
  # Only the path is needed; the client writes the file itself.
  os.close(result_json_handle)
  try:
    cmd = [
        isolated_client,
        'download',
        '-isolate-server',
        server_ref.url,
        '-namespace',
        server_ref.namespace,
        '-isolated',
        isolated_hash,

        # flags for cache
        '-cache-dir',
        go_cache_dir,
        '-cache-max-items',
        str(policies.max_items),
        '-cache-max-size',
        str(policies.max_cache_size),
        '-cache-min-free-space',
        str(policies.min_free_space),

        # flags for output
        '-output-dir',
        outdir,
        '-fetch-and-map-result-json',
        result_json_path,
    ]
    proc = subprocess42.Popen(cmd)
    cmd_str = ' '.join(cmd)

    exceeded_max_timeout = True
    check_period_sec = 30
    max_checks = 100
    # max timeout = max_checks * check_period_sec = 50 minutes
    for i in range(max_checks):
      # Waiting in short periods and printing in between is to prevent I/O
      # timeout error during isolated setup.
      try:
        retcode = proc.wait(check_period_sec)
        if retcode != 0:
          raise ValueError("retcode is not 0: %s (cmd=%s)" % (retcode, cmd_str))
        exceeded_max_timeout = False
        break
      except subprocess42.TimeoutExpired:
        print('still running isolated (after %d seconds)' % (
            (i + 1) * check_period_sec))

    if exceeded_max_timeout:
      proc.terminate()
      try:
        proc.wait(check_period_sec)
      except subprocess42.TimeoutExpired:
        proc.kill()
      proc.wait()
      # Raise unconditionally, because |proc| was forcefully terminated.
      # The message must be formatted with '%': passing the values as a second
      # argument would leave the placeholders unformatted in the error.
      raise ValueError(
          "timedout after %d seconds (cmd=%s)" %
          (check_period_sec * max_checks, cmd_str))

    with open(result_json_path) as json_file:
      result_json = json.load(json_file)

    isolated = result_json['isolated']
    bundle = isolateserver.IsolatedBundle(filter_cb=None)
    # Only following properties are used in caller.
    bundle.command = isolated.get('command')
    bundle.read_only = isolated.get('read_only')
    bundle.relative_cwd = isolated.get('relative_cwd')

    return bundle, {
        'duration': time.time() - start,
        'items_cold': result_json['items_cold'],
        'items_hot': result_json['items_hot'],
    }
  finally:
    fs.remove(result_json_path)
604 fs.remove(result_json_path)
605
606
# TODO(crbug.com/932396): remove this function.
def fetch_and_map(isolated_hash, storage, cache, outdir):
  """Fetches an isolated tree into |outdir| and returns (bundle, stats).

  |stats| is a dict with:
  - 'duration': seconds spent in this function.
  - 'items_cold': base64 of the packed, sorted |cache.added| values.
  - 'items_hot': base64 of the packed, sorted values found in |cache.used|
    but not accounted for by |cache.added|.
  """
  started = time.time()
  bundle = isolateserver.fetch_isolated(
      isolated_hash=isolated_hash,
      storage=storage,
      cache=cache,
      outdir=outdir,
      use_symlinks=False)
  used_counts = collections.Counter(cache.used)
  added_counts = collections.Counter(cache.added)
  # Multiset difference: what was used without having just been added.
  hot_items = (used_counts - added_counts).elements()
  stats = {
      'duration': time.time() - started,
      'items_cold': base64.b64encode(large.pack(sorted(cache.added))),
      'items_hot': base64.b64encode(large.pack(sorted(hot_items))),
  }
  return bundle, stats
624
625
def link_outputs_to_outdir(run_dir, out_dir, outputs):
  """Makes the named |outputs| available in |out_dir| so they can be uploaded.

  Each entry of |outputs| is a path relative to |run_dir|; it is copied (see
  copy_recursively) to the same relative path under |out_dir|. Does nothing
  when |outputs| is empty.
  """
  if outputs:
    isolateserver.create_directories(out_dir, outputs)
    for rel_path in outputs:
      source = os.path.join(run_dir, rel_path)
      destination = os.path.join(out_dir, rel_path)
      copy_recursively(source, destination)
636
637
def copy_recursively(src, dst):
  """Efficiently copies a file or directory from src to dst.

  `src` may be a file, directory, or a symlink to a file or directory.
  All symlinks are replaced with their targets, so the resulting
  directory structure in dst will never have any symlinks.

  To increase speed, copy_recursively hardlinks individual files into the
  (newly created) directory structure if possible, unlike Python's
  shutil.copytree().

  OSError is never propagated to the caller: a missing path or broken symlink
  is logged as a warning, any other OSError is logged at info level.

  A chain of symlinks that does not resolve within a fixed number of hops
  (e.g. a -> b -> a) is logged as a warning and skipped instead of being
  followed forever. Cycles formed by a symlink pointing at one of its own
  ancestor directories are not detected here.
  """
  # Same order of magnitude as the limit kernels apply before giving up with
  # ELOOP; legitimate chains are far shorter.
  max_symlink_hops = 40
  orig_src = src
  try:
    # Replace symlinks with their final target.
    hops = 0
    while fs.islink(src):
      hops += 1
      if hops > max_symlink_hops:
        logging.warning(
            'Too many levels of symbolic links while resolving %s; skipping',
            orig_src)
        return
      res = fs.readlink(src)
      # os.path.join() discards the dirname when |res| is absolute, so this
      # handles both relative and absolute link targets.
      src = os.path.join(os.path.dirname(src), res)

    # Note that fs.isfile (which is a wrapper around os.path.isfile) throws
    # an exception if src does not exist. A warning will be logged in that case.
    if fs.isfile(src):
      file_path.link_file(dst, src, file_path.HARDLINK_WITH_FALLBACK)
      return

    if not fs.exists(dst):
      os.makedirs(dst)

    for child in fs.listdir(src):
      copy_recursively(os.path.join(src, child), os.path.join(dst, child))

  except OSError as e:
    if e.errno == errno.ENOENT:
      logging.warning('Path %s does not exist or %s is a broken symlink',
                      src, orig_src)
    else:
      logging.info("Couldn't collect output file %s: %s", src, e)
aludwin0a8e17d2016-10-27 15:57:39 -0700675
676
def upload_then_delete(storage, out_dir, leak_temp_dir):
  """Uploads the content of out_dir, then deletes out_dir.

  The upload only happens when out_dir is an existing, non-empty directory.
  The deletion is skipped when leak_temp_dir is set.

  Arguments:
  - storage: storage object handed to isolateserver.archive_files_to_storage();
    its server_ref.url and server_ref.namespace are reported back.
  - out_dir: directory holding the task outputs.
  - leak_temp_dir: when true, out_dir is left on disk.

  Returns:
    tuple(outputs_ref, success, stats)
    - outputs_ref: a dict referring to the results archived back to the isolated
        server, if applicable. None when nothing was uploaded.
    - success: False if something occurred that means that the task must
        forcibly be considered a failure, e.g. zombie processes were left
        behind. Concretely, False when removing out_dir failed.
    - stats: uploading stats.

  Raises:
    isolateserver.Aborted: re-raised when the upload was interrupted.
  """
  # Upload out_dir and generate a .isolated file out of this directory. It is
  # only done if files were written in the directory.
  outputs_ref = None
  cold = []
  hot = []
  start = time.time()

  if fs.isdir(out_dir) and fs.listdir(out_dir):
    with tools.Profiler('ArchiveOutput'):
      try:
        results, f_cold, f_hot = isolateserver.archive_files_to_storage(
            storage, [out_dir], None, verify_push=True)
        outputs_ref = {
            # Only one path was archived, so take the first value. list() is
            # needed because dict views are not subscriptable on Python 3.
            'isolated': list(results.values())[0],
            'isolatedserver': storage.server_ref.url,
            'namespace': storage.server_ref.namespace,
        }
        cold = sorted(i.size for i in f_cold)
        hot = sorted(i.size for i in f_hot)
      except isolateserver.Aborted:
        # This happens when a signal SIGTERM was received while uploading data.
        # There is 2 causes:
        # - The task was too slow and was about to be killed anyway due to
        #   exceeding the hard timeout.
        # - The amount of data uploaded back is very large and took too much
        #   time to archive.
        sys.stderr.write('Received SIGTERM while uploading')
        # Re-raise, so it will be treated as an internal failure.
        raise

  success = False
  try:
    if (not leak_temp_dir and fs.isdir(out_dir) and
        not file_path.rmtree(out_dir)):
      logging.error('Had difficulties removing out_dir %s', out_dir)
    else:
      # Either nothing had to be removed or the removal worked.
      success = True
  except OSError as e:
    # When this happens, it means there's a process error.
    logging.exception('Had difficulties removing out_dir %s: %s', out_dir, e)
  stats = {
      'duration': time.time() - start,
      'items_cold': base64.b64encode(large.pack(cold)),
      'items_hot': base64.b64encode(large.pack(hot)),
  }
  return outputs_ref, success, stats
maruela9cfd6f2015-09-15 11:03:15 -0700735
736
def map_and_run(data, constant_run_path):
  """Runs a command with optional isolated input/output.

  Sets up the run, output, temp and isolated-client directories, installs
  packages and named caches through the callbacks carried by |data|, optionally
  fetches the isolated tree, runs the command, then links/uploads outputs and
  removes the temporary directories.

  Arguments:
  - data: TaskData instance.
  - constant_run_path: when true and a root directory is known, the run
    directory is <root_dir>/ISOLATED_RUN_DIR (recreated from scratch) instead
    of a directory obtained from make_temp_dir().

  Returns metadata about the result: a dict with 'duration', 'exit_code',
  'had_hard_timeout', 'internal_failure', 'stats', 'outputs_ref', 'version'
  and, when packages were installed, 'cipd_pins'. Exceptions raised while
  running are caught and reported through 'internal_failure'.
  """

  if data.isolate_cache:
    download_stats = {
        #'duration': 0.,
        'initial_number_items': len(data.isolate_cache),
        'initial_size': data.isolate_cache.total_size,
        #'items_cold': '<large.pack()>',
        #'items_hot': '<large.pack()>',
    }
  else:
    # TODO(tikuta): take stats from state.json in this case too.
    download_stats = {}

  # 'internal_failure' starts out set so that any path which does not reach
  # the end of the command execution is reported as an internal failure.
  result = {
      'duration': None,
      'exit_code': None,
      'had_hard_timeout': False,
      'internal_failure': 'run_isolated did not complete properly',
      'stats': {
          #'cipd': {
          #  'duration': 0.,
          #  'get_client_duration': 0.,
          #},
          'isolated': {
              'download': download_stats,
              #'upload': {
              #  'duration': 0.,
              #  'items_cold': '<large.pack()>',
              #  'items_hot': '<large.pack()>',
              #},
          },
      },
      #'cipd_pins': {
      #  'packages': [
      #    {'package_name': ..., 'version': ..., 'path': ...},
      #    ...
      #  ],
      #  'client_package': {'package_name': ..., 'version': ...},
      #},
      'outputs_ref': None,
      'version': 5,
  }

  # When no root directory was given, derive one from the parent of whichever
  # cache directory is in use.
  if data.root_dir:
    file_path.ensure_tree(data.root_dir, 0o700)
  elif data.use_go_isolated:
    data = data._replace(root_dir=os.path.dirname(data.go_cache_dir))
  elif data.isolate_cache.cache_dir:
    data = data._replace(
        root_dir=os.path.dirname(data.isolate_cache.cache_dir))
  # See comment for these constants.
  # If root_dir is not specified, it is not constant.
  # TODO(maruel): This is not obvious. Change this to become an error once we
  # make the constant_run_path an exposed flag.
  if constant_run_path and data.root_dir:
    run_dir = os.path.join(data.root_dir, ISOLATED_RUN_DIR)
    if os.path.isdir(run_dir):
      file_path.rmtree(run_dir)
    os.mkdir(run_dir, 0o700)
  else:
    run_dir = make_temp_dir(ISOLATED_RUN_DIR, data.root_dir)
  # storage should be normally set but don't crash if it is not. This can happen
  # as Swarming task can run without an isolate server.
  out_dir = make_temp_dir(
      ISOLATED_OUT_DIR, data.root_dir) if data.storage else None
  tmp_dir = make_temp_dir(ISOLATED_TMP_DIR, data.root_dir)
  isolated_client_dir = make_temp_dir(ISOLATED_CLIENT_DIR, data.root_dir)
  cwd = run_dir
  if data.relative_cwd:
    cwd = os.path.normpath(os.path.join(cwd, data.relative_cwd))
  command = data.command
  try:
    with data.install_packages_fn(run_dir, isolated_client_dir) as cipd_info:
      if cipd_info:
        result['stats']['cipd'] = cipd_info.stats
        result['cipd_pins'] = cipd_info.pins

      if data.isolated_hash:
        isolated_stats = result['stats'].setdefault('isolated', {})
        if data.use_go_isolated:
          bundle, stats = _fetch_and_map_with_go(
              isolated_hash=data.isolated_hash,
              storage=data.storage,
              outdir=run_dir,
              go_cache_dir=data.go_cache_dir,
              policies=data.go_cache_policies,
              isolated_client=os.path.join(isolated_client_dir,
                                           'isolated' + cipd.EXECUTABLE_SUFFIX))
        else:
          bundle, stats = fetch_and_map(
              isolated_hash=data.isolated_hash,
              storage=data.storage,
              cache=data.isolate_cache,
              outdir=run_dir)
        isolated_stats['download'].update(stats)
        change_tree_read_only(run_dir, bundle.read_only)
        # Inject the command
        if not command and bundle.command:
          command = bundle.command + data.extra_args
          # Only set the relative directory if the isolated file specified a
          # command, and no raw command was specified.
          if bundle.relative_cwd:
            cwd = os.path.normpath(os.path.join(cwd, bundle.relative_cwd))

      if not command:
        # Handle this as a task failure, not an internal failure.
        # NOTE(review): 'internal_failure' still holds its initial message on
        # this early return - confirm whether that is intended.
        sys.stderr.write(
            '<No command was specified!>\n'
            '<Please secify a command when triggering your Swarming task>\n')
        result['exit_code'] = 1
        return result

      # Compare on a path component boundary: a bare string prefix test would
      # also accept a sibling directory whose name merely starts with the run
      # directory's name (e.g. relative_cwd '../<run dir name>_x').
      if cwd != run_dir and not cwd.startswith(os.path.join(run_dir, '')):
        # Handle this as a task failure, not an internal failure. This is a
        # 'last chance' way to gate against directory escape.
        sys.stderr.write('<Relative CWD is outside of run directory!>\n')
        result['exit_code'] = 1
        return result

      if not os.path.isdir(cwd):
        # Accepts relative_cwd that does not exist.
        os.makedirs(cwd, 0o700)

      # If we have an explicit list of files to return, make sure their
      # directories exist now.
      if data.storage and data.outputs:
        isolateserver.create_directories(run_dir, data.outputs)

      with data.install_named_caches(run_dir):
        sys.stdout.flush()
        start = time.time()
        try:
          # Need to switch the default account before 'get_command_env' call,
          # so it can grab correct value of LUCI_CONTEXT env var.
          with set_luci_context_account(data.switch_to_account, tmp_dir):
            env = get_command_env(
                tmp_dir, cipd_info, run_dir, data.env, data.env_prefix, out_dir,
                data.bot_file)
            command = tools.find_executable(command, env)
            command = process_command(command, out_dir, data.bot_file)
            file_path.ensure_command_has_abs_path(command, cwd)

            result['exit_code'], result['had_hard_timeout'] = run_command(
                command, cwd, env, data.hard_timeout, data.grace_period,
                data.lower_priority, data.containment)
        finally:
          # Recorded even when the command raised; clamped to be non-negative.
          result['duration'] = max(time.time() - start, 0)

    # We successfully ran the command, set internal_failure back to
    # None (even if the command failed, it's not an internal error).
    result['internal_failure'] = None
  except Exception as e:
    # An internal error occurred. Report accordingly so the swarming task will
    # be retried automatically.
    logging.exception('internal failure: %s', e)
    result['internal_failure'] = str(e)
    on_error.report(None)

  # Clean up
  finally:
    try:
      # Try to link files to the output directory, if specified.
      if out_dir:
        link_outputs_to_outdir(run_dir, out_dir, data.outputs)

      success = False
      if data.leak_temp_dir:
        success = True
        logging.warning(
            'Deliberately leaking %s for later examination', run_dir)
      else:
        # On Windows rmtree(run_dir) call below has a synchronization effect: it
        # finishes only when all task child processes terminate (since a running
        # process locks *.exe file). Examine out_dir only after that call
        # completes (since child processes may write to out_dir too and we need
        # to wait for them to finish).
        for directory in (run_dir, tmp_dir, isolated_client_dir):
          if not fs.isdir(directory):
            continue
          try:
            success = file_path.rmtree(directory)
          except OSError as e:
            logging.error('rmtree(%r) failed: %s', directory, e)
            success = False
          if not success:
            sys.stderr.write(
                OUTLIVING_ZOMBIE_MSG % (directory, data.grace_period))
            # A directory that cannot be removed turns an otherwise successful
            # task into a failure.
            if result['exit_code'] == 0:
              result['exit_code'] = 1

      # This deletes out_dir if leak_temp_dir is not set.
      if out_dir:
        isolated_stats = result['stats'].setdefault('isolated', {})
        result['outputs_ref'], success, isolated_stats['upload'] = (
            upload_then_delete(data.storage, out_dir, data.leak_temp_dir))
      if not success and result['exit_code'] == 0:
        result['exit_code'] = 1
    except Exception as e:
      # Swallow any exception in the main finally clause.
      if out_dir:
        logging.exception('Leaking out_dir %s: %s', out_dir, e)
      result['internal_failure'] = str(e)
      on_error.report(None)
  return result
Marc-Antoine Ruel2283ad12014-02-09 11:14:57 -0500950
951
def run_tha_test(data, result_json):
  """Runs the task through map_and_run() and reports how it went.

  When result_json is set, a placeholder result is written to it before the
  run (so something exists on disk if the process gets killed) and the real
  result overwrites it afterwards. When it is not set and outputs were
  archived, a reference to them is printed to stdout wrapped in
  [run_isolated_out_hack] markers.

  Arguments:
  - data: TaskData instance.
  - result_json: File path to dump result metadata into. If set, the process
    exit code is always 0 unless an internal error occurred.

  Returns:
    Process exit code that should be used.
  """
  if result_json:
    # Write a json output file right away in case we get killed.
    tools.write_json(
        result_json,
        {
            'exit_code': None,
            'had_hard_timeout': False,
            'internal_failure': 'Was terminated before completion',
            'outputs_ref': None,
            'version': 5,
        },
        dense=True)

  # run_isolated exit code. Depends on if result_json is used or not.
  result = map_and_run(data, True)
  logging.info('Result:\n%s', tools.format_json(result, dense=True))
  internal_error = int(bool(result['internal_failure']))

  if result_json:
    # We've found tests to delete 'work' when quitting, causing an exception
    # here. Try to recreate the directory if necessary.
    file_path.ensure_tree(os.path.dirname(result_json))
    tools.write_json(result_json, result, dense=True)
    # Only return 1 if there was an internal error.
    return internal_error

  # Marshall into old-style inline output.
  outputs_ref = result['outputs_ref']
  if outputs_ref:
    # pylint: disable=unsubscriptable-object
    legacy_ref = {
        'hash': outputs_ref['isolated'],
        'namespace': outputs_ref['namespace'],
        'storage': outputs_ref['isolatedserver'],
    }
    sys.stdout.flush()
    print(
        '[run_isolated_out_hack]%s[/run_isolated_out_hack]' %
        tools.format_json(legacy_ref, dense=True))
    sys.stdout.flush()
  return result['exit_code'] or internal_error
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001008
1009
# Yielded by 'install_client_and_packages'. Fields, in order:
# - client: cipd.CipdClient object.
# - cache_dir: absolute path to bot-global cipd tag and instance cache.
# - stats: dict with stats to return to the server.
# - pins: dict with installed cipd pins to return to the server.
CipdInfo = collections.namedtuple(
    'CipdInfo', 'client cache_dir stats pins')
1017
1018
@contextlib.contextmanager
def noop_install_packages(_run_dir, _isolated_dir):
  """Stand-in for 'install_client_and_packages' when cipd is disabled.

  Both arguments are ignored; the context yields None and installs nothing.
  """
  yield None
1023
1024
Takuto Ikuta2efc7792019-11-27 14:33:34 +00001025def _install_packages(run_dir, cipd_cache_dir, client, packages):
iannuccib58d10d2017-03-18 02:00:25 -07001026 """Calls 'cipd ensure' for packages.
1027
1028 Args:
1029 run_dir (str): root of installation.
1030 cipd_cache_dir (str): the directory to use for the cipd package cache.
1031 client (CipdClient): the cipd client to use
1032 packages: packages to install, list [(path, package_name, version), ...].
iannuccib58d10d2017-03-18 02:00:25 -07001033
1034 Returns: list of pinned packages. Looks like [
1035 {
1036 'path': 'subdirectory',
1037 'package_name': 'resolved/package/name',
1038 'version': 'deadbeef...',
1039 },
1040 ...
1041 ]
1042 """
1043 package_pins = [None]*len(packages)
1044 def insert_pin(path, name, version, idx):
1045 package_pins[idx] = {
1046 'package_name': name,
1047 # swarming deals with 'root' as '.'
1048 'path': path or '.',
1049 'version': version,
1050 }
1051
1052 by_path = collections.defaultdict(list)
1053 for i, (path, name, version) in enumerate(packages):
1054 # cipd deals with 'root' as ''
1055 if path == '.':
1056 path = ''
1057 by_path[path].append((name, version, i))
1058
1059 pins = client.ensure(
Takuto Ikuta2efc7792019-11-27 14:33:34 +00001060 run_dir,
1061 {
1062 subdir: [(name, vers) for name, vers, _ in pkgs
1063 ] for subdir, pkgs in by_path.items()
1064 },
1065 cache_dir=cipd_cache_dir,
iannuccib58d10d2017-03-18 02:00:25 -07001066 )
1067
Marc-Antoine Ruel04903a32019-10-09 21:09:25 +00001068 for subdir, pin_list in sorted(pins.items()):
iannuccib58d10d2017-03-18 02:00:25 -07001069 this_subdir = by_path[subdir]
1070 for i, (name, version) in enumerate(pin_list):
1071 insert_pin(subdir, name, version, this_subdir[i][2])
1072
Robert Iannucci461b30d2017-12-13 11:34:03 -08001073 assert None not in package_pins, (packages, pins, package_pins)
iannuccib58d10d2017-03-18 02:00:25 -07001074
1075 return package_pins
1076
1077
@contextlib.contextmanager
def install_client_and_packages(run_dir, packages, service_url,
                                client_package_name, client_version, cache_dir,
                                isolated_dir):
  """Bootstraps the CIPD client, then installs CIPD packages with it.

  Yields a single CipdInfo object carrying the client, the cipd cache
  directory, timing stats and the pins.

  The package pins are a list of
    {"path": path, "package_name": package_name, "version": version}
  dictionaries, corresponding 1:1 to the entries of 'packages'. The client
  info is a single {"package_name": ..., "version": ...} dictionary. These
  dictionaries make their way all the way back to swarming, where they become
  the arguments of CipdPackage.

  If 'packages' list is empty, will bootstrap CIPD client, but won't install
  any packages.

  The isolated client package is always installed into 'isolated_dir',
  regardless of whether 'packages' is empty or not.

  Args:
    run_dir (str): root of installation.
    packages: packages to install, list [(path, package_name, version), ...].
    service_url (str): CIPD server url, e.g.
      "https://chrome-infra-packages.appspot.com."
    client_package_name (str): CIPD package name of CIPD client.
    client_version (str): Version of CIPD client.
    cache_dir (str): where to keep cache of cipd clients, packages and tags.
    isolated_dir (str): where to download isolated client.
  """
  assert cache_dir

  overall_start = time.time()

  cache_dir = os.path.abspath(cache_dir)
  # Tag and instance caches live in a 'cache' subdirectory.
  cipd_cache_dir = os.path.join(cache_dir, 'cache')
  run_dir = os.path.abspath(run_dir)
  packages = packages or []

  client_start = time.time()
  client_manager = cipd.get_client(service_url, client_package_name,
                                   client_version, cache_dir)

  with client_manager as client:
    get_client_duration = time.time() - client_start

    if packages:
      package_pins = _install_packages(run_dir, cipd_cache_dir, client,
                                       packages)
    else:
      package_pins = []

    # Install isolated client to |isolated_dir|.
    _install_packages(isolated_dir, cipd_cache_dir, client,
                      [('', ISOLATED_PACKAGE, ISOLATED_REVISION)])

    file_path.make_tree_files_read_only(run_dir)

    total_duration = time.time() - overall_start
    logging.info(
        'Installing CIPD client and packages took %d seconds', total_duration)

    stats = {
        'duration': total_duration,
        'get_client_duration': get_client_duration,
    }
    pins = {
        'client_package': {
            'package_name': client.package_name,
            'version': client.instance_id,
        },
        'packages': package_pins,
    }
    yield CipdInfo(
        client=client, cache_dir=cipd_cache_dir, stats=stats, pins=pins)
nodirbe642ff2016-06-09 15:51:51 -07001160
1161
1162def create_option_parser():
Marc-Antoine Ruelf74cffe2015-07-15 15:21:34 -04001163 parser = logging_utils.OptionParserWithLogging(
nodir55be77b2016-05-03 09:39:57 -07001164 usage='%prog <options> [command to run or extra args]',
maruel@chromium.orgdedbf492013-09-12 20:42:11 +00001165 version=__version__,
1166 log_file=RUN_ISOLATED_LOG_FILE)
maruela9cfd6f2015-09-15 11:03:15 -07001167 parser.add_option(
maruel36a963d2016-04-08 17:15:49 -07001168 '--clean', action='store_true',
1169 help='Cleans the cache, trimming it necessary and remove corrupted items '
1170 'and returns without executing anything; use with -v to know what '
1171 'was done')
1172 parser.add_option(
maruela9cfd6f2015-09-15 11:03:15 -07001173 '--json',
1174 help='dump output metadata to json file. When used, run_isolated returns '
1175 'non-zero only on internal failure')
maruel6be7f9e2015-10-01 12:25:30 -07001176 parser.add_option(
maruel5c9e47b2015-12-18 13:02:30 -08001177 '--hard-timeout', type='float', help='Enforce hard timeout in execution')
maruel6be7f9e2015-10-01 12:25:30 -07001178 parser.add_option(
maruel5c9e47b2015-12-18 13:02:30 -08001179 '--grace-period', type='float',
maruel6be7f9e2015-10-01 12:25:30 -07001180 help='Grace period between SIGTERM and SIGKILL')
bpastene3ae09522016-06-10 17:12:59 -07001181 parser.add_option(
Marc-Antoine Ruel49e347d2017-10-24 16:52:02 -07001182 '--raw-cmd', action='store_true',
1183 help='Ignore the isolated command, use the one supplied at the command '
1184 'line')
1185 parser.add_option(
Marc-Antoine Ruel95068cf2017-12-07 21:35:05 -05001186 '--relative-cwd',
1187 help='Ignore the isolated \'relative_cwd\' and use this one instead; '
1188 'requires --raw-cmd')
1189 parser.add_option(
Marc-Antoine Ruel19dd8872017-11-28 18:33:39 -05001190 '--env', default=[], action='append',
1191 help='Environment variables to set for the child process')
1192 parser.add_option(
1193 '--env-prefix', default=[], action='append',
Robert Iannuccibf5f84c2017-11-22 12:56:50 -08001194 help='Specify a VAR=./path/fragment to put in the environment variable '
1195 'before executing the command. The path fragment must be relative '
1196 'to the isolated run directory, and must not contain a `..` token. '
1197 'The path will be made absolute and prepended to the indicated '
1198 '$VAR using the OS\'s path separator. Multiple items for the same '
1199 '$VAR will be prepended in order.')
1200 parser.add_option(
bpastene3ae09522016-06-10 17:12:59 -07001201 '--bot-file',
1202 help='Path to a file describing the state of the host. The content is '
1203 'defined by on_before_task() in bot_config.')
aludwin7556e0c2016-10-26 08:46:10 -07001204 parser.add_option(
vadimsh9c54b2c2017-07-25 14:08:29 -07001205 '--switch-to-account',
1206 help='If given, switches LUCI_CONTEXT to given logical service account '
1207 '(e.g. "task" or "system") before launching the isolated process.')
1208 parser.add_option(
aludwin0a8e17d2016-10-27 15:57:39 -07001209 '--output', action='append',
1210 help='Specifies an output to return. If no outputs are specified, all '
1211 'files located in $(ISOLATED_OUTDIR) will be returned; '
1212 'otherwise, outputs in both $(ISOLATED_OUTDIR) and those '
1213 'specified by --output option (there can be multiple) will be '
1214 'returned. Note that if a file in OUT_DIR has the same path '
1215 'as an --output option, the --output version will be returned.')
1216 parser.add_option(
aludwin7556e0c2016-10-26 08:46:10 -07001217 '-a', '--argsfile',
1218 # This is actually handled in parse_args; it's included here purely so it
1219 # can make it into the help text.
1220 help='Specify a file containing a JSON array of arguments to this '
1221 'script. If --argsfile is provided, no other argument may be '
1222 'provided on the command line.')
Marc-Antoine Ruel1b65f4e2019-05-02 21:56:58 +00001223
1224 group = optparse.OptionGroup(parser, 'Data source')
1225 group.add_option(
Marc-Antoine Ruel185ded42015-01-28 20:49:18 -05001226 '-s', '--isolated',
nodir55be77b2016-05-03 09:39:57 -07001227 help='Hash of the .isolated to grab from the isolate server.')
Marc-Antoine Ruel1b65f4e2019-05-02 21:56:58 +00001228 isolateserver.add_isolate_server_options(group)
1229 parser.add_option_group(group)
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001230
Marc-Antoine Ruela57d7db2014-10-15 20:31:19 -04001231 isolateserver.add_cache_options(parser)
nodirbe642ff2016-06-09 15:51:51 -07001232
1233 cipd.add_cipd_options(parser)
Marc-Antoine Ruel8b11dbd2018-05-18 14:31:22 -04001234
1235 group = optparse.OptionGroup(parser, 'Named caches')
1236 group.add_option(
1237 '--named-cache',
1238 dest='named_caches',
1239 action='append',
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001240 nargs=3,
Marc-Antoine Ruel8b11dbd2018-05-18 14:31:22 -04001241 default=[],
Marc-Antoine Ruelc7a704b2018-08-29 19:02:23 +00001242 help='A named cache to request. Accepts 3 arguments: name, path, hint. '
Marc-Antoine Ruel8b11dbd2018-05-18 14:31:22 -04001243 'name identifies the cache, must match regex [a-z0-9_]{1,4096}. '
1244 'path is a path relative to the run dir where the cache directory '
1245 'must be put to. '
1246 'This option can be specified more than once.')
1247 group.add_option(
1248 '--named-cache-root', default='named_caches',
1249 help='Cache root directory. Default=%default')
1250 parser.add_option_group(group)
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001251
Marc-Antoine Ruel1b65f4e2019-05-02 21:56:58 +00001252 group = optparse.OptionGroup(parser, 'Process containment')
1253 parser.add_option(
1254 '--lower-priority', action='store_true',
1255 help='Lowers the child process priority')
1256 parser.add_option(
1257 '--containment-type', choices=('NONE', 'AUTO', 'JOB_OBJECT'),
1258 default='NONE',
1259 help='Type of container to use')
1260 parser.add_option(
1261 '--limit-processes', type='int', default=0,
1262 help='Maximum number of active processes in the containment')
1263 parser.add_option(
1264 '--limit-total-committed-memory', type='int', default=0,
1265 help='Maximum sum of committed memory in the containment')
1266 parser.add_option_group(group)
1267
1268 group = optparse.OptionGroup(parser, 'Debugging')
1269 group.add_option(
Kenneth Russell61d42352014-09-15 11:41:16 -07001270 '--leak-temp-dir',
1271 action='store_true',
nodirbe642ff2016-06-09 15:51:51 -07001272 help='Deliberately leak isolate\'s temp dir for later examination. '
1273 'Default: %default')
Marc-Antoine Ruel1b65f4e2019-05-02 21:56:58 +00001274 group.add_option(
marueleb5fbee2015-09-17 13:01:36 -07001275 '--root-dir', help='Use a directory instead of a random one')
Marc-Antoine Ruel1b65f4e2019-05-02 21:56:58 +00001276 parser.add_option_group(group)
Kenneth Russell61d42352014-09-15 11:41:16 -07001277
Vadim Shtayurae34e13a2014-02-02 11:23:26 -08001278 auth.add_auth_options(parser)
nodirbe642ff2016-06-09 15:51:51 -07001279
Marc-Antoine Ruel8b11dbd2018-05-18 14:31:22 -04001280 parser.set_defaults(cache='cache', cipd_cache='cipd_cache')
nodirbe642ff2016-06-09 15:51:51 -07001281 return parser
1282
1283
def process_named_cache_options(parser, options, time_fn=None):
  """Validates named cache options and returns a NamedCache, if any.

  Arguments:
    parser: option parser; parser.error() is called for every invalid value.
    options: parsed options. Reads named_caches (a list of
        (name, path, hint) tuples), named_cache_root and min_free_space.
    time_fn: optional time function forwarded as-is to
        local_caching.NamedCache.

  Returns:
    A local_caching.NamedCache rooted at the absolute path of
    --named-cache-root, or None when --named-cache-root is empty.
  """
  if options.named_caches and not options.named_cache_root:
    parser.error('--named-cache is specified, but --named-cache-root is empty')
  for name, path, hint in options.named_caches:
    if not CACHE_NAME_RE.match(name):
      parser.error(
          'cache name %r does not match %r' % (name, CACHE_NAME_RE.pattern))
    if not path:
      parser.error('cache path cannot be empty')
    try:
      # int() is used instead of long(): long does not exist on python3 and
      # int() transparently promotes to long on python2 for large values.
      int(hint)
    except ValueError:
      parser.error('cache hint must be a number')
  if not options.named_cache_root:
    return None

  # Make these configurable later if there is use case but for now it's fairly
  # safe values.
  # In practice, a fair chunk of bots are already recycled on a daily schedule
  # so this code doesn't have any effect to them, unless they are preloaded
  # with a really old cache.
  policies = local_caching.CachePolicies(
      # 1TiB.
      max_cache_size=1024*1024*1024*1024,
      min_free_space=options.min_free_space,
      max_items=50,
      max_age_secs=MAX_AGE_SECS)
  root_dir = six.text_type(os.path.abspath(options.named_cache_root))
  cache = local_caching.NamedCache(root_dir, policies, time_fn=time_fn)
  # Touch any named caches we're going to use to minimize thrashing
  # between tasks that request some (but not all) of the same named caches.
  cache.touch(*[name for name, _, _ in options.named_caches])
  return cache
1317
1318
def parse_args(args):
  """Parses the command line, expanding --argsfile when it is used.

  Arguments:
    args: list of command line arguments, without the program name.

  Returns:
    Tuple (parser, options, args) where parser is the parser returned by
    create_option_parser() and (options, args) is what its parse_args()
    returned.
  """
  # Create a fake mini-parser just to get out the "-a" command. Note that
  # it's not documented here; instead, it's documented in create_option_parser
  # even though that parser will never actually get to parse it. This is
  # because --argsfile is exclusive with all other options and arguments.
  file_argparse = argparse.ArgumentParser(add_help=False)
  file_argparse.add_argument('-a', '--argsfile')
  (file_args, nonfile_args) = file_argparse.parse_known_args(args)
  if file_args.argsfile:
    if nonfile_args:
      # The trailing space matters: the two literals are concatenated.
      file_argparse.error('Can\'t specify --argsfile with '
                          'any other arguments (%s)' % nonfile_args)
    try:
      with open(file_args.argsfile, 'r') as f:
        args = json.load(f)
    except (IOError, OSError, ValueError) as e:
      # We don't need to error out here: "args" is only rebound when the file
      # was loaded successfully, so on failure the original command line is
      # handed to the regular parser below, which reports any problem itself.
      print('Couldn\'t read arguments: %s' % e, file=sys.stderr)

  # Even if we failed to read the args, just call the normal parser now since it
  # will print the correct help message.
  parser = create_option_parser()
  options, args = parser.parse_args(args)
  return (parser, options, args)
1345
1346
def _calc_named_cache_hint(named_cache, named_caches):
  """Returns the expected size of the missing named caches.

  Arguments:
    named_cache: object whose |available| attribute is a container of the
        names of the caches already present locally, or None when there is no
        named cache at all.
    named_caches: iterable of (name, path, hint) tuples; hint is the expected
        size of the cache and must be convertible with int().

  Returns:
    The sum of the strictly positive hints of the requested caches that are
    not in named_cache.available; 0 when named_cache is None.
  """
  if named_cache is None:
    # Without a named cache there is nothing to reserve space for.
    return 0
  present = named_cache.available
  size = 0
  for name, _, hint in named_caches:
    if name in present:
      continue
    # int() instead of long(): long does not exist on python3 and int()
    # promotes to long automatically on python2.
    hint = int(hint)
    # Zero and negative hints are ignored.
    if hint > 0:
      size += hint
  return size
1357
1358
def _is_path_within(path, root):
  """Returns True if |path| is |root| itself or is located below |root|.

  Both arguments are expected to be absolute, normalized paths. The comparison
  is done on whole path components, so '/a/bc' is not reported as being within
  '/a/b' like a raw str.startswith() check would do.
  """
  root = root.rstrip(os.sep)
  return path == root or path.startswith(root + os.sep)


def main(args):
  """Parses |args|, then either cleans the local caches or runs the task.

  Arguments:
    args: list of command line arguments, without the program name.

  Returns:
    The process exit code: 0 once --clean completed, 1 when a cipd.Error,
    local_caching.NamedCacheError or local_caching.NoMoreSpace was raised,
    otherwise whatever run_tha_test() returned.

  Invalid option combinations are reported through parser.error().
  """
  # Warning: when --argsfile is used, the strings are unicode instances, when
  # parsed normally, the strings are str instances.
  (parser, options, args) = parse_args(args)

  if not file_path.enable_symlink():
    logging.warning('Symlink support is not enabled')

  named_cache = process_named_cache_options(parser, options)
  # hint is 0 if there's no named cache.
  hint = _calc_named_cache_hint(named_cache, options.named_caches)
  if hint:
    # Increase the --min-free-space value by the hint, and recreate the
    # NamedCache instance so it gets the updated CachePolicy.
    options.min_free_space += hint
    named_cache = process_named_cache_options(parser, options)

  # TODO(crbug.com/932396): Remove this.
  use_go_isolated = (
      options.cipd_enabled and
      # TODO(crbug.com/1045281): windows other than win10 has flaky connection
      # issue.
      (sys.platform != 'win32' or platform.release() == '10'))

  # TODO(maruel): CIPD caches should be defined at an higher level here too, so
  # they can be cleaned the same way.
  if use_go_isolated:
    isolate_cache = None
  else:
    isolate_cache = isolateserver.process_cache_options(options, trim=False)

  caches = []
  if isolate_cache:
    caches.append(isolate_cache)
  if named_cache:
    caches.append(named_cache)
  root = caches[0].cache_dir if caches else six.text_type(os.getcwd())
  if options.clean:
    if options.isolated:
      parser.error('Can\'t use --isolated with --clean.')
    if options.isolate_server:
      parser.error('Can\'t use --isolate-server with --clean.')
    if options.json:
      parser.error('Can\'t use --json with --clean.')
    if options.named_caches:
      parser.error('Can\'t use --named-cache with --clean.')
    # Trim first, then clean.
    local_caching.trim_caches(
        caches,
        root,
        min_free_space=options.min_free_space,
        max_age_secs=MAX_AGE_SECS)
    for c in caches:
      c.cleanup()
    return 0

  # Trim must still be done for the following case:
  # - named-cache was used
  # - some entries, with a large hint, were missing
  # - --min-free-space was increased accordingly, thus trimming is needed
  # Otherwise, this will have no effect, as bot_main calls run_isolated with
  # --clean after each task.
  if hint:
    logging.info('Additional trimming of %d bytes', hint)
    local_caching.trim_caches(
        caches,
        root,
        min_free_space=options.min_free_space,
        max_age_secs=MAX_AGE_SECS)

  if not options.isolated and not args:
    parser.error('--isolated or command to run is required.')

  auth.process_auth_options(parser, options)

  isolateserver.process_isolate_server_options(
      parser, options, True, False)
  if not options.isolate_server:
    if options.isolated:
      parser.error('--isolated requires --isolate-server')
    if ISOLATED_OUTDIR_PARAMETER in args:
      parser.error(
          '%s in args requires --isolate-server' % ISOLATED_OUTDIR_PARAMETER)

  if options.root_dir:
    options.root_dir = six.text_type(os.path.abspath(options.root_dir))
  if options.json:
    options.json = six.text_type(os.path.abspath(options.json))

  if any('=' not in i for i in options.env):
    parser.error(
        '--env required key=value form. value can be skipped to delete '
        'the variable')
  options.env = dict(i.split('=', 1) for i in options.env)

  # Maps each variable name to the list of relative paths to prepend to it.
  prefixes = {}
  cwd = os.path.realpath(os.getcwd())
  for item in options.env_prefix:
    if '=' not in item:
      parser.error(
          '--env-prefix %r is malformed, must be in the form `VAR=./path`'
          % item)
    key, opath = item.split('=', 1)
    if os.path.isabs(opath):
      parser.error('--env-prefix %r path is bad, must be relative.' % opath)
    opath = os.path.normpath(opath)
    # Compare whole path components so that a sibling directory whose name
    # merely starts with the name of cwd is rejected too.
    if not _is_path_within(os.path.realpath(os.path.join(cwd, opath)), cwd):
      parser.error(
          '--env-prefix %r path is bad, must be relative and not contain `..`.'
          % opath)
    prefixes.setdefault(key, []).append(opath)
  options.env_prefix = prefixes

  cipd.validate_cipd_options(parser, options)

  install_packages_fn = noop_install_packages
  if options.cipd_enabled:
    install_packages_fn = (
        lambda run_dir, isolated_dir: install_client_and_packages(
            run_dir, cipd.parse_package_args(options.cipd_packages),
            options.cipd_server, options.cipd_client_package,
            options.cipd_client_version, cache_dir=options.cipd_cache,
            isolated_dir=isolated_dir))

  @contextlib.contextmanager
  def install_named_caches(run_dir):
    # WARNING: this function depends on "options" variable defined in the outer
    # function.
    assert six.text_type(run_dir), repr(run_dir)
    assert os.path.isabs(run_dir), run_dir
    named_caches = [(os.path.join(run_dir, six.text_type(relpath)), name)
                    for name, relpath, _ in options.named_caches]
    for path, name in named_caches:
      named_cache.install(path, name)
    try:
      yield
    finally:
      # Uninstall each named cache, returning it to the cache pool. If an
      # uninstall fails for a given cache, it will remain in the task's
      # temporary space, get cleaned up by the Swarming bot, and be lost.
      #
      # If the Swarming bot cannot clean up the cache, it will handle it like
      # any other bot file that could not be removed.
      for path, name in reversed(named_caches):
        try:
          # uninstall() doesn't trim but does call save() implicitly. Trimming
          # *must* be done manually via periodic 'run_isolated.py --clean'.
          named_cache.uninstall(path, name)
        except local_caching.NamedCacheError:
          # The arguments follow the order of the placeholders: the cache
          # name first, then its location.
          logging.exception('Error while removing named cache %r at %r. '
                            'The cache will be lost.', name, path)

  extra_args = []
  command = []
  if options.raw_cmd:
    command = args
    if options.relative_cwd:
      a = os.path.normpath(os.path.abspath(options.relative_cwd))
      if not _is_path_within(a, os.getcwd()):
        parser.error(
            '--relative-cwd must not try to escape the working directory')
  else:
    if options.relative_cwd:
      parser.error('--relative-cwd requires --raw-cmd')
    extra_args = args

  containment_type = subprocess42.Containment.NONE
  if options.containment_type == 'AUTO':
    containment_type = subprocess42.Containment.AUTO
  if options.containment_type == 'JOB_OBJECT':
    containment_type = subprocess42.Containment.JOB_OBJECT
  containment = subprocess42.Containment(
      containment_type=containment_type,
      limit_processes=options.limit_processes,
      limit_total_committed_memory=options.limit_total_committed_memory)

  data = TaskData(
      command=command,
      relative_cwd=options.relative_cwd,
      extra_args=extra_args,
      isolated_hash=options.isolated,
      storage=None,
      isolate_cache=isolate_cache,
      outputs=options.output,
      install_named_caches=install_named_caches,
      leak_temp_dir=options.leak_temp_dir,
      root_dir=_to_unicode(options.root_dir),
      hard_timeout=options.hard_timeout,
      grace_period=options.grace_period,
      bot_file=options.bot_file,
      switch_to_account=options.switch_to_account,
      install_packages_fn=install_packages_fn,
      use_go_isolated=use_go_isolated,
      go_cache_dir=options.cache,
      go_cache_policies=local_caching.CachePolicies(
          max_cache_size=options.max_cache_size,
          min_free_space=options.min_free_space,
          max_items=options.max_items,
          max_age_secs=None,
      ),
      env=options.env,
      env_prefix=options.env_prefix,
      lower_priority=bool(options.lower_priority),
      containment=containment)
  try:
    if options.isolate_server:
      server_ref = isolate_storage.ServerRef(
          options.isolate_server, options.namespace)
      storage = isolateserver.get_storage(server_ref)
      with storage:
        data = data._replace(storage=storage)
        # Hashing schemes used by |storage| and |isolate_cache| MUST match.
        assert storage.server_ref.hash_algo == server_ref.hash_algo
        return run_tha_test(data, options.json)
    return run_tha_test(data, options.json)
  except (
      cipd.Error,
      local_caching.NamedCacheError,
      local_caching.NoMoreSpace) as ex:
    # BaseException.message only exists on python2; fall back to the
    # exception itself, which print() converts with str().
    print(getattr(ex, 'message', ex), file=sys.stderr)
    return 1
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +00001580
1581
if __name__ == '__main__':
  # Process-wide setup done once, before any argument is parsed.
  subprocess42.inhibit_os_error_reporting()
  # Ensure that we are always running with the correct encoding.
  fix_encoding.fix_encoding()
  # Advertise the script name and its version as the user agent.
  user_agent = 'run_isolated.py/' + __version__
  net.set_user_agent(user_agent)
  # The value returned by main() becomes the process exit code.
  exit_code = main(sys.argv[1:])
  sys.exit(exit_code)
Marc-Antoine Ruel90c98162013-12-18 15:11:57 -05001587 sys.exit(main(sys.argv[1:]))