blob: fa340c624f2a6097d855d2d6665f18bcb5c8c63d [file] [log] [blame]
#!/usr/bin/env python
# Copyright 2012 The LUCI Authors. All rights reserved.
# Use of this source code is governed under the Apache License, Version 2.0
# that can be found in the LICENSE file.

"""Runs a command with optional isolated input/output.

Despite name "run_isolated", can run a generic non-isolated command specified as
args.

If input isolated hash is provided, fetches it, creates a tree of hard links,
appends args to the command in the fetched isolated and runs it.
To improve performance, keeps a local cache.
The local cache can safely be deleted.

Any ${EXECUTABLE_SUFFIX} on the command line will be replaced with ".exe" string
on Windows and "" on other platforms.

Any ${ISOLATED_OUTDIR} on the command line will be replaced by the location of a
temporary directory upon execution of the command specified in the .isolated
file. All content written to this directory will be uploaded upon termination
and the .isolated file describing this directory will be printed to stdout.

Any ${SWARMING_BOT_FILE} on the command line will be replaced by the value of
the --bot-file parameter. This file is used by a swarming bot to communicate
state of the host to tasks. It is written to by the swarming bot's
on_before_task() hook in the swarming server's custom bot_config.py.
"""
29
maruel2e8d0f52016-07-16 07:51:29 -070030__version__ = '0.8.3'
maruel@chromium.orgdedbf492013-09-12 20:42:11 +000031
maruel064c0a32016-04-05 11:47:15 -070032import base64
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000033import logging
34import optparse
35import os
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000036import sys
37import tempfile
maruel064c0a32016-04-05 11:47:15 -070038import time
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +000039
vadimsh@chromium.orga4326472013-08-24 02:05:41 +000040from third_party.depot_tools import fix_encoding
41
Vadim Shtayura6b555c12014-07-23 16:22:18 -070042from utils import file_path
maruel12e30012015-10-09 11:55:35 -070043from utils import fs
maruel064c0a32016-04-05 11:47:15 -070044from utils import large
Marc-Antoine Ruelf74cffe2015-07-15 15:21:34 -040045from utils import logging_utils
Marc-Antoine Ruelcfb60852014-07-02 15:22:00 -040046from utils import on_error
Marc-Antoine Ruelc44f5722015-01-08 16:10:01 -050047from utils import subprocess42
vadimsh@chromium.orga4326472013-08-24 02:05:41 +000048from utils import tools
vadimsh@chromium.org3e97deb2013-08-24 00:56:44 +000049from utils import zip_package
vadimsh@chromium.org8b9d56b2013-08-21 22:24:35 +000050
Vadim Shtayurae34e13a2014-02-02 11:23:26 -080051import auth
nodirbe642ff2016-06-09 15:51:51 -070052import cipd
maruel@chromium.orgdedbf492013-09-12 20:42:11 +000053import isolateserver
maruel@chromium.orgdedbf492013-09-12 20:42:11 +000054
vadimsh@chromium.orga4326472013-08-24 02:05:41 +000055
# Absolute path to this file (can be None if running from zip on Mac).
THIS_FILE_PATH = os.path.abspath(
    __file__.decode(sys.getfilesystemencoding())) if __file__ else None

# Directory that contains this file (might be inside zip package). It is
# derived from THIS_FILE_PATH rather than by decoding __file__ again, so that a
# missing __file__ yields None instead of failing on None.decode().
BASE_DIR = os.path.dirname(THIS_FILE_PATH) if THIS_FILE_PATH else None

# Directory that contains currently running script file.
if zip_package.get_main_script_path():
  MAIN_DIR = os.path.dirname(
      os.path.abspath(zip_package.get_main_script_path()))
else:
  # This happens when 'import run_isolated' is executed at the python
  # interactive prompt, in that case __file__ is undefined.
  MAIN_DIR = None


# Magic variables that can be found in the isolate task command line.
ISOLATED_OUTDIR_PARAMETER = '${ISOLATED_OUTDIR}'
EXECUTABLE_SUFFIX_PARAMETER = '${EXECUTABLE_SUFFIX}'
SWARMING_BOT_FILE_PARAMETER = '${SWARMING_BOT_FILE}'


# The name of the log file to use.
RUN_ISOLATED_LOG_FILE = 'run_isolated.log'


# The name of the log to use for the run_test_cases.py command
RUN_TEST_CASES_LOG = 'run_test_cases.log'


# Use short names for temporary directories. This is driven by Windows, which
# imposes a relatively short maximum path length of 260 characters, often
# referred to as MAX_PATH. It is relatively easy to create files with longer
# path length. A use case is with recursive dependency trees, like npm packages.
#
# It is recommended to start the script with a `root_dir` as short as
# possible.
# - ir stands for isolated_run
# - io stands for isolated_out
# - it stands for isolated_tmp
ISOLATED_RUN_DIR = u'ir'
ISOLATED_OUT_DIR = u'io'
ISOLATED_TMP_DIR = u'it'
101
102
def get_as_zip_package(executable=True):
  """Builds a ZipPackage holding this script and everything it depends on.

  When |executable| is true, run_isolated.py is stored as __main__.py, which
  makes the resulting zip package directly runnable by python.
  """
  # Creating a zip package from within another zip package is not supported
  # and is most likely never needed.
  assert not zip_package.is_zipped_module(sys.modules[__name__])
  assert THIS_FILE_PATH
  assert BASE_DIR
  package = zip_package.ZipPackage(root=BASE_DIR)

  # The entry point goes first, optionally renamed so the zip is executable.
  main_name = '__main__.py' if executable else None
  package.add_python_file(THIS_FILE_PATH, main_name)

  # Sibling modules this script imports directly.
  sibling_modules = (
      'isolated_format.py',
      'isolateserver.py',
      'auth.py',
      'cipd.py',
  )
  for module_file in sibling_modules:
    package.add_python_file(os.path.join(BASE_DIR, module_file))

  # Whole support directories.
  for subdir in ('third_party', 'utils'):
    package.add_directory(os.path.join(BASE_DIR, subdir))
  return package
123
124
def make_temp_dir(prefix, root_dir):
  """Creates a fresh, uniquely named directory and returns its unicode path.

  The directory name starts with |prefix| and is created inside |root_dir|.
  """
  created = tempfile.mkdtemp(prefix=prefix, dir=root_dir)
  return unicode(created)
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +0000128
129
def change_tree_read_only(rootdir, read_only):
  """Applies the requested read-only policy to the tree under |rootdir|.

  |read_only| is one of 0 (or None), 1 or 2; it controls whether files can be
  modified and whether files can be created or deleted.

  Raises:
    ValueError if |read_only| is not one of the known values.
  """
  if read_only == 2:
    # Both files and directories (except on Windows) become read only, which
    # blocks modifying, creating and deleting files in the test directory.
    # On Windows, creating and deleting files remains possible.
    file_path.make_tree_read_only(rootdir)
    return

  if read_only == 1:
    # Only files become read only, directories do not. Files cannot be
    # modified but can still be created or deleted.
    file_path.make_tree_files_read_only(rootdir)
    return

  if read_only in (0, None):
    # Everything can be modified.
    # TODO(maruel): This is currently dangerous as long as DiskCache.touch()
    # is not yet changed to verify the hash of the content of the files it is
    # looking at, so that if a test modifies an input file, the file must be
    # deleted.
    file_path.make_tree_writeable(rootdir)
    return

  message = 'change_tree_read_only(%s, %s): Unknown flag %s' % (
      rootdir, read_only, read_only)
  raise ValueError(message)
156
157
def process_command(command, out_dir, bot_file):
  """Expands the magic variables found in each argument of |command|.

  Returns a new list; |command| itself is not modified.

  Raises:
    ValueError if ${ISOLATED_OUTDIR} is used in |command| but |out_dir| is not
    provided.
  """
  def expand(arg):
    expanded = arg.replace(EXECUTABLE_SUFFIX_PARAMETER, cipd.EXECUTABLE_SUFFIX)
    path_substituted = False

    if ISOLATED_OUTDIR_PARAMETER in expanded:
      if not out_dir:
        raise ValueError(
            'output directory is requested in command, but not provided; '
            'please specify one')
      expanded = expanded.replace(ISOLATED_OUTDIR_PARAMETER, out_dir)
      path_substituted = True

    if SWARMING_BOT_FILE_PARAMETER in expanded:
      if not bot_file:
        logging.warning('SWARMING_BOT_FILE_PARAMETER found in command, but no '
                        'bot_file specified. Leaving parameter unchanged.')
      else:
        expanded = expanded.replace(SWARMING_BOT_FILE_PARAMETER, bot_file)
        path_substituted = True

    if not path_substituted:
      return expanded
    # Slashes are converted only when a path parameter was substituted, to
    # support arguments like '${ISOLATED_OUTDIR}/foo/bar'.
    return expanded.replace('/', os.sep)

  processed = []
  for item in command:
    processed.append(expand(item))
  return processed
189
190
def run_command(command, cwd, tmp_dir, hard_timeout, grace_period):
  """Runs the command as a detached child process and waits for it.

  The child gets a copy of the current environment in which the platform's
  temporary directory variable (TMPDIR on darwin, TEMP on win32, TMP
  otherwise) points to |tmp_dir|.

  Arguments:
    command: the command line to execute, passed as-is to subprocess42.Popen.
    cwd: working directory of the child process.
    tmp_dir: unicode path exported to the child as its temporary directory.
    hard_timeout: maximum number of seconds to wait before sending SIGTERM; a
        false value means no limit.
    grace_period: number of seconds to wait after SIGTERM before sending
        SIGKILL; a false value means no limit.

  Returns:
    tuple(process exit code, bool if had a hard timeout)
  """
  logging.info('run_command(%s, %s)' % (command, cwd))

  env = os.environ.copy()
  if sys.platform == 'darwin':
    env['TMPDIR'] = tmp_dir.encode(sys.getfilesystemencoding())
  elif sys.platform == 'win32':
    env['TEMP'] = tmp_dir.encode(sys.getfilesystemencoding())
  else:
    env['TMP'] = tmp_dir.encode(sys.getfilesystemencoding())
  exit_code = None
  had_hard_timeout = False
  with tools.Profiler('RunTest'):
    proc = None
    # A list is used so the nested handler can record the signal without
    # rebinding a name in the enclosing scope.
    had_signal = []
    try:
      # TODO(maruel): This code is imperfect. It doesn't handle well signals
      # during the download phase and there's short windows where things can go
      # wrong.
      def handler(signum, _frame):
        # Only the first signal received after the child was started is
        # converted into a TimeoutExpired, which interrupts the wait below.
        if proc and not had_signal:
          logging.info('Received signal %d', signum)
          had_signal.append(True)
          raise subprocess42.TimeoutExpired(command, None)

      proc = subprocess42.Popen(command, cwd=cwd, env=env, detached=True)
      with subprocess42.set_signal_handler(subprocess42.STOP_SIGNALS, handler):
        try:
          exit_code = proc.wait(hard_timeout or None)
        except subprocess42.TimeoutExpired:
          # TimeoutExpired without a recorded signal means the wait itself
          # expired, i.e. the hard timeout was reached.
          if not had_signal:
            logging.warning('Hard timeout')
            had_hard_timeout = True
          logging.warning('Sending SIGTERM')
          proc.terminate()

      # Ignore signals in grace period. Forcibly give the grace period to the
      # child process.
      if exit_code is None:
        ignore = lambda *_: None
        with subprocess42.set_signal_handler(subprocess42.STOP_SIGNALS, ignore):
          try:
            exit_code = proc.wait(grace_period or None)
          except subprocess42.TimeoutExpired:
            # Now kill for real. The user can distinguish between the
            # following states:
            # - signal but process exited within grace period,
            #   hard_timed_out will be set but the process exit code will be
            #   script provided.
            # - processed exited late, exit code will be -9 on posix.
            logging.warning('Grace exhausted; sending SIGKILL')
            proc.kill()
      logging.info('Waiting for proces exit')
      exit_code = proc.wait()
    except OSError:
      # This is not considered to be an internal error. The executable simply
      # does not exist.
      sys.stderr.write(
          '<The executable does not exist or a dependent library is missing>\n'
          '<Check for missing .so/.dll in the .isolate or GN file>\n'
          '<Command: %s>\n' % command)
      if os.environ.get('SWARMING_TASK_ID'):
        # Give an additional hint when running as a swarming task.
        sys.stderr.write(
            '<See the task\'s page for commands to help diagnose this issue '
            'by reproducing the task locally>\n')
      exit_code = 1
  # The exit code is also logged masked to 32 bits in hexadecimal.
  logging.info(
      'Command finished with exit code %d (%s)',
      exit_code, hex(0xffffffff & exit_code))
  return exit_code, had_hard_timeout
maruela9cfd6f2015-09-15 11:03:15 -0700267
268
def fetch_and_measure(isolated_hash, storage, cache, outdir):
  """Fetches an isolated tree into |outdir| and measures the operation.

  Returns:
    tuple(bundle, stats) where bundle is the value returned by
    isolateserver.fetch_isolated() and stats is a dict holding the fetch
    duration and the cache statistics.
  """
  begin = time.time()
  bundle = isolateserver.fetch_isolated(
      isolated_hash=isolated_hash, storage=storage, cache=cache, outdir=outdir)
  elapsed = time.time() - begin

  # Cold items are those added to the cache; hot items are those linked from
  # the cache without having been added by this fetch.
  cold_items = sorted(cache.added)
  hot_items = sorted(set(cache.linked) - set(cache.added))

  stats = {
    'duration': elapsed,
    'initial_number_items': cache.initial_number_items,
    'initial_size': cache.initial_size,
    'items_cold': base64.b64encode(large.pack(cold_items)),
    'items_hot': base64.b64encode(large.pack(hot_items)),
  }
  return bundle, stats
285
286
def delete_and_upload(storage, out_dir, leak_temp_dir):
  """Archives the content of |out_dir| to |storage|, then removes |out_dir|.

  The directory is kept when |leak_temp_dir| is set.

  Returns:
    tuple(outputs_ref, success, stats)
    - outputs_ref: a dict referring to the results archived back to the isolated
      server, or None when nothing was archived.
    - success: False if something occurred that means that the task must
      forcibly be considered a failure, e.g. zombie processes were left
      behind.
    - stats: uploading stats.
  """
  outputs_ref = None
  cold_sizes = []
  hot_sizes = []
  begin = time.time()

  # A .isolated file is generated out of the directory only if files were
  # written into it.
  if fs.isdir(out_dir) and fs.listdir(out_dir):
    with tools.Profiler('ArchiveOutput'):
      try:
        results, f_cold, f_hot = isolateserver.archive_files_to_storage(
            storage, [out_dir], None)
        outputs_ref = {
          'isolated': results[0][0],
          'isolatedserver': storage.location,
          'namespace': storage.namespace,
        }
        cold_sizes = sorted(item.size for item in f_cold)
        hot_sizes = sorted(item.size for item in f_hot)
      except isolateserver.Aborted:
        # This happens when a signal SIGTERM was received while uploading data.
        # There are 2 causes:
        # - The task was too slow and was about to be killed anyway due to
        #   exceeding the hard timeout.
        # - The amount of data uploaded back is very large and took too much
        #   time to archive.
        sys.stderr.write('Received SIGTERM while uploading')
        # Re-raise, so it will be treated as an internal failure.
        raise

  success = False
  try:
    must_delete = not leak_temp_dir and fs.isdir(out_dir)
    if must_delete and not file_path.rmtree(out_dir):
      logging.error('Had difficulties removing out_dir %s', out_dir)
    else:
      success = True
  except OSError as e:
    # When this happens, it means there's a process error.
    logging.exception('Had difficulties removing out_dir %s: %s', out_dir, e)

  stats = {
    'duration': time.time() - begin,
    'items_cold': base64.b64encode(large.pack(cold_sizes)),
    'items_hot': base64.b64encode(large.pack(hot_sizes)),
  }
  return outputs_ref, success, stats
maruela9cfd6f2015-09-15 11:03:15 -0700346
347
def _remove_dir_or_fail_task(path, description, result):
  """Deletes |path| if it exists; forces a task failure if deletion fails.

  |description| names the directory in the error message. When the directory
  cannot be removed, a successful exit code in |result| is changed to 1.
  """
  if not fs.isdir(path):
    return
  try:
    success = file_path.rmtree(path)
  except OSError as e:
    logging.error('Failure with %s', e)
    success = False
  if not success:
    sys.stderr.write(
        'Failed to delete the %s directory, forcibly failing\n'
        'the task because of it. No zombie process can outlive a\n'
        'successful task run and still be marked as successful.\n'
        'Fix your stuff.\n' % description)
    if result['exit_code'] == 0:
      result['exit_code'] = 1


def map_and_run(
    command, isolated_hash, storage, cache, leak_temp_dir, root_dir,
    hard_timeout, grace_period, bot_file, extra_args, install_packages_fn):
  """Runs a command with optional isolated input/output.

  See run_tha_test for argument documentation.

  Returns:
    A dict of metadata about the run: 'duration', 'exit_code',
    'had_hard_timeout', 'internal_failure', 'stats', 'outputs_ref' and
    'version'. Exceptions are not propagated; they are reported through
    'internal_failure'.
  """
  assert bool(command) ^ bool(isolated_hash)
  result = {
    'duration': None,
    'exit_code': None,
    'had_hard_timeout': False,
    'internal_failure': None,
    'stats': {
      # 'cipd': {
      #   'duration': 0.,
      #   'get_client_duration': 0.,
      # },
      # 'isolated': {
      #   'download': {
      #     'duration': 0.,
      #     'initial_number_items': 0,
      #     'initial_size': 0,
      #     'items_cold': '<large.pack()>',
      #     'items_hot': '<large.pack()>',
      #   },
      #   'upload': {
      #     'duration': 0.,
      #     'items_cold': '<large.pack()>',
      #     'items_hot': '<large.pack()>',
      #   },
      # },
    },
    'outputs_ref': None,
    'version': 5,
  }

  if root_dir:
    file_path.ensure_tree(root_dir, 0o700)
  else:
    root_dir = os.path.dirname(cache.cache_dir) if cache.cache_dir else None
  # See comment for these constants.
  run_dir = make_temp_dir(ISOLATED_RUN_DIR, root_dir)
  # storage should be normally set but don't crash if it is not. This can happen
  # as Swarming task can run without an isolate server.
  out_dir = make_temp_dir(ISOLATED_OUT_DIR, root_dir) if storage else None
  tmp_dir = make_temp_dir(ISOLATED_TMP_DIR, root_dir)
  cwd = run_dir

  try:
    cipd_stats = install_packages_fn(run_dir)
    if cipd_stats:
      result['stats']['cipd'] = cipd_stats

    if isolated_hash:
      isolated_stats = result['stats'].setdefault('isolated', {})
      bundle, isolated_stats['download'] = fetch_and_measure(
          isolated_hash=isolated_hash,
          storage=storage,
          cache=cache,
          outdir=run_dir)
      if not bundle.command:
        # Handle this as a task failure, not an internal failure.
        sys.stderr.write(
            '<The .isolated doesn\'t declare any command to run!>\n'
            '<Check your .isolate for missing \'command\' variable>\n')
        if os.environ.get('SWARMING_TASK_ID'):
          # Give an additional hint when running as a swarming task.
          sys.stderr.write('<This occurs at the \'isolate\' step>\n')
        result['exit_code'] = 1
        # The finally clause below still cleans up the directories.
        return result

      change_tree_read_only(run_dir, bundle.read_only)
      cwd = os.path.normpath(os.path.join(cwd, bundle.relative_cwd))
      command = bundle.command + extra_args

    command = tools.fix_python_path(command)
    command = process_command(command, out_dir, bot_file)
    file_path.ensure_command_has_abs_path(command, cwd)

    sys.stdout.flush()
    start = time.time()
    try:
      result['exit_code'], result['had_hard_timeout'] = run_command(
          command, cwd, tmp_dir, hard_timeout, grace_period)
    finally:
      result['duration'] = max(time.time() - start, 0)
  except Exception as e:
    # An internal error occurred. Report accordingly so the swarming task will
    # be retried automatically.
    logging.exception('internal failure: %s', e)
    result['internal_failure'] = str(e)
    on_error.report(None)
  finally:
    try:
      if leak_temp_dir:
        logging.warning(
            'Deliberately leaking %s for later examination', run_dir)
      else:
        # On Windows the rmtree(run_dir) call below has a synchronization
        # effect: it finishes only when all task child processes terminate
        # (since a running process locks *.exe file). Examine out_dir only
        # after that call completes (since child processes may write to
        # out_dir too and we need to wait for them to finish).
        _remove_dir_or_fail_task(run_dir, 'run', result)
        _remove_dir_or_fail_task(tmp_dir, 'temporary', result)

      # This deletes out_dir if leak_temp_dir is not set.
      if out_dir:
        isolated_stats = result['stats'].setdefault('isolated', {})
        result['outputs_ref'], success, isolated_stats['upload'] = (
            delete_and_upload(storage, out_dir, leak_temp_dir))
        # Checked only here: |success| is defined solely by the call above.
        # Directory removal failures were already accounted for.
        if not success and result['exit_code'] == 0:
          result['exit_code'] = 1
    except Exception as e:
      # Swallow any exception in the main finally clause.
      if out_dir:
        logging.exception('Leaking out_dir %s: %s', out_dir, e)
      result['internal_failure'] = str(e)
  return result
Marc-Antoine Ruel2283ad12014-02-09 11:14:57 -0500496
497
def run_tha_test(
    command, isolated_hash, storage, cache, leak_temp_dir, result_json,
    root_dir, hard_timeout, grace_period, bot_file, extra_args,
    install_packages_fn):
  """Runs an executable and records execution metadata.

  Exactly one of command and isolated_hash must be specified.

  When isolated_hash is given, the dependencies are downloaded into the cache,
  hardlinked into a temporary directory, and the command declared in the
  .isolated is run.

  A temporary directory is created to hold the output files. Its content is
  uploaded back to |storage| packaged as a .isolated file.

  Arguments:
    command: the command to run, a list of strings. Mutually exclusive with
             isolated_hash.
    isolated_hash: the SHA-1 of the .isolated file that must be retrieved to
                   recreate the tree of files to run the target executable.
                   The command specified in the .isolated is executed.
                   Mutually exclusive with command argument.
    storage: an isolateserver.Storage object to retrieve remote objects. This
             object has a reference to an isolateserver.StorageApi, which does
             the actual I/O.
    cache: an isolateserver.LocalCache to keep from retrieving the same objects
           constantly by caching the objects retrieved. Can be on-disk or
           in-memory.
    leak_temp_dir: if true, the temporary directory will be deliberately leaked
                   for later examination.
    result_json: file path to dump result metadata into. If set, the process
                 exit code is always 0 unless an internal error occurred.
    root_dir: path to the directory to use to create the temporary directory. If
              not specified, a random temporary directory is created.
    hard_timeout: kills the process if it lasts more than this amount of
                  seconds.
    grace_period: number of seconds to wait between SIGTERM and SIGKILL.
    bot_file: value substituted for ${SWARMING_BOT_FILE} in the command line.
    extra_args: optional arguments to add to the command stated in the .isolate
                file. Ignored if isolated_hash is empty.
    install_packages_fn: function (dir) => cipd_stats. Installs packages.

  Returns:
    Process exit code that should be used.
  """
  assert bool(command) ^ bool(isolated_hash)
  extra_args = extra_args or []

  outdir_requested = any(
      ISOLATED_OUTDIR_PARAMETER in arg for arg in (command or extra_args))
  if outdir_requested:
    assert storage is not None, 'storage is None although outdir is specified'

  if result_json:
    # Write a json output file right away in case we get killed.
    placeholder = {
      'exit_code': None,
      'had_hard_timeout': False,
      'internal_failure': 'Was terminated before completion',
      'outputs_ref': None,
      'version': 5,
    }
    tools.write_json(result_json, placeholder, dense=True)

  # The exit code of run_isolated depends on whether result_json is used.
  result = map_and_run(
      command, isolated_hash, storage, cache, leak_temp_dir, root_dir,
      hard_timeout, grace_period, bot_file, extra_args, install_packages_fn)
  logging.info('Result:\n%s', tools.format_json(result, dense=True))

  if result_json:
    # We've found tests to delete 'work' when quitting, causing an exception
    # here. Try to recreate the directory if necessary.
    json_dir = os.path.dirname(result_json)
    file_path.ensure_tree(json_dir)
    tools.write_json(result_json, result, dense=True)
    # Only return 1 if there was an internal error.
    return int(bool(result['internal_failure']))

  # Marshall into old-style inline output.
  outputs_ref = result['outputs_ref']
  if outputs_ref:
    data = {
      'hash': outputs_ref['isolated'],
      'namespace': outputs_ref['namespace'],
      'storage': outputs_ref['isolatedserver'],
    }
    encoded = tools.format_json(data, dense=True)
    sys.stdout.flush()
    print('[run_isolated_out_hack]%s[/run_isolated_out_hack]' % encoded)
    sys.stdout.flush()
  return result['exit_code'] or int(bool(result['internal_failure']))
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +0000587
588
def install_packages(
    run_dir, packages, service_url, client_package_name,
    client_version, cache_dir=None, timeout=None):
  """Installs packages. Returns stats.

  Args:
    run_dir (str): root of installation.
    packages: packages to install, dict {path: [(package_name, version)]}.
      Each path is relative to |run_dir| and must resolve inside it.
    service_url (str): CIPD server url, e.g.
      "https://chrome-infra-packages.appspot.com."
    client_package_name (str): CIPD package name of CIPD client.
    client_version (str): Version of CIPD client.
    cache_dir (str): where to keep cache of cipd clients, packages and tags.
      Must be provided despite the None default.
    timeout: max duration in seconds that this function can take.

  Returns:
    None if |packages| is empty, otherwise a dict with 'duration' and
    'get_client_duration', both in seconds.

  Raises:
    cipd.Error if a package path resolves outside of |run_dir|.
  """
  assert cache_dir
  if not packages:
    return None

  timeoutfn = tools.sliding_timeout(timeout)
  start = time.time()
  cache_dir = os.path.abspath(cache_dir)

  run_dir = os.path.abspath(run_dir)
  # |run_dir| with a trailing separator, so that a sibling directory sharing
  # the same name prefix (e.g. 'ir2' next to 'ir') is not mistaken for a
  # subdirectory. os.path.join() does not double the separator for a root dir.
  run_dir_prefix = os.path.join(run_dir, '')

  get_client_start = time.time()
  client_manager = cipd.get_client(
      service_url, client_package_name, client_version, cache_dir,
      timeout=timeoutfn())
  with client_manager as client:
    get_client_duration = time.time() - get_client_start
    # A distinct loop variable is used so the |packages| argument is not
    # rebound while it is being iterated.
    for path, path_packages in sorted(packages.items()):
      site_root = os.path.abspath(os.path.join(run_dir, path))
      if site_root != run_dir and not site_root.startswith(run_dir_prefix):
        raise cipd.Error('Invalid CIPD package path "%s"' % path)

      # Do not clean site_root before installation because it may contain other
      # site roots.
      file_path.ensure_tree(site_root, 0o770)
      client.ensure(
          site_root, path_packages,
          cache_dir=os.path.join(cache_dir, 'cipd_internal'),
          timeout=timeoutfn())
      file_path.make_tree_files_read_only(site_root)

  total_duration = time.time() - start
  logging.info(
      'Installing CIPD client and packages took %d seconds', total_duration)

  return {
    'duration': total_duration,
    'get_client_duration': get_client_duration,
  }
nodirbe642ff2016-06-09 15:51:51 -0700642
643
def create_option_parser():
  """Builds the command line parser used by run_isolated.

  Registers the general flags, the 'Data source' and 'Debugging' option
  groups, and the flags contributed by the isolateserver, cipd and auth
  modules, then sets the default cache locations.

  Returns:
    The configured logging_utils.OptionParserWithLogging instance.
  """
  parser = logging_utils.OptionParserWithLogging(
      usage='%prog <options> [command to run or extra args]',
      version=__version__,
      log_file=RUN_ISOLATED_LOG_FILE)

  # General flags; registered on the parser in exactly this order.
  general_flags = (
    ('--clean', {
      'action': 'store_true',
      'help':
          'Cleans the cache, trimming it necessary and remove corrupted items '
          'and returns without executing anything; use with -v to know what '
          'was done',
    }),
    ('--no-clean', {
      'action': 'store_true',
      'help':
          'Do not clean the cache automatically on startup. This is meant for '
          'bots where a separate execution with --clean was done earlier so '
          'doing it again is redundant',
    }),
    ('--json', {
      'help':
          'dump output metadata to json file. When used, run_isolated returns '
          'non-zero only on internal failure',
    }),
    ('--hard-timeout', {
      'type': 'float',
      'help': 'Enforce hard timeout in execution',
    }),
    ('--grace-period', {
      'type': 'float',
      'help': 'Grace period between SIGTERM and SIGKILL',
    }),
    ('--bot-file', {
      'help':
          'Path to a file describing the state of the host. The content is '
          'defined by on_before_task() in bot_config.',
    }),
  )
  for flag, settings in general_flags:
    parser.add_option(flag, **settings)

  # Where the isolated input comes from.
  source_group = optparse.OptionGroup(parser, 'Data source')
  source_group.add_option(
      '-s', '--isolated',
      help='Hash of the .isolated to grab from the isolate server.')
  isolateserver.add_isolate_server_options(source_group)
  parser.add_option_group(source_group)

  # Flags owned by other modules.
  isolateserver.add_cache_options(parser)
  cipd.add_cipd_options(parser)

  # Knobs meant for troubleshooting a run.
  troubleshooting_group = optparse.OptionGroup(parser, 'Debugging')
  troubleshooting_group.add_option(
      '--leak-temp-dir',
      action='store_true',
      help='Deliberately leak isolate\'s temp dir for later examination. '
           'Default: %default')
  troubleshooting_group.add_option(
      '--root-dir', help='Use a directory instead of a random one')
  parser.add_option_group(troubleshooting_group)

  auth.add_auth_options(parser)

  parser.set_defaults(cache='cache', cipd_cache='cipd_cache')
  return parser
697
698
def main(args):
  """Parses the command line, maintains the cache and runs the command.

  Args:
    args: command line arguments, without the program name.

  Returns:
    Exit code for the process: 0 after a --clean run, 1 when a cipd.Error is
    raised, otherwise whatever run_tha_test() returns.
  """
  parser = create_option_parser()
  options, args = parser.parse_args(args)

  cache = isolateserver.process_cache_options(options)
  if options.clean:
    # --clean is a standalone maintenance mode; reject flags that only make
    # sense when something is actually executed.
    incompatible = (
      (options.isolated, 'Can\'t use --isolated with --clean.'),
      (options.isolate_server, 'Can\'t use --isolate-server with --clean.'),
      (options.json, 'Can\'t use --json with --clean.'),
    )
    for value, message in incompatible:
      if value:
        parser.error(message)
    cache.cleanup()
    return 0
  if not options.no_clean:
    cache.cleanup()

  if not (options.isolated or args):
    parser.error('--isolated or command to run is required.')

  auth.process_auth_options(parser, options)

  isolateserver.process_isolate_server_options(parser, options, True, False)
  if not options.isolate_server:
    if options.isolated:
      parser.error('--isolated requires --isolate-server')
    if ISOLATED_OUTDIR_PARAMETER in args:
      parser.error(
          '%s in args requires --isolate-server' % ISOLATED_OUTDIR_PARAMETER)

  # Normalize user supplied paths to absolute unicode paths.
  if options.root_dir:
    options.root_dir = unicode(os.path.abspath(options.root_dir))
  if options.json:
    options.json = unicode(os.path.abspath(options.json))

  cipd.validate_cipd_options(parser, options)

  def install_packages_fn(run_dir):
    # The package arguments are parsed only when this callback is invoked.
    return install_packages(
        run_dir, cipd.parse_package_args(options.cipd_packages),
        options.cipd_server, options.cipd_client_package,
        options.cipd_client_version, cache_dir=options.cipd_cache)

  # With --isolated the command is not taken from args here; args are still
  # handed to run_tha_test() separately.
  command = [] if options.isolated else args

  def run_with(storage):
    # Single call site shared by the with-storage and storage-less paths.
    return run_tha_test(
        command, options.isolated, storage, cache, options.leak_temp_dir,
        options.json, options.root_dir, options.hard_timeout,
        options.grace_period, options.bot_file, args, install_packages_fn)

  try:
    if not options.isolate_server:
      return run_with(None)
    storage = isolateserver.get_storage(
        options.isolate_server, options.namespace)
    with storage:
      # Hashing schemes used by |storage| and |cache| MUST match.
      assert storage.hash_algo == cache.hash_algo
      return run_with(storage)
  except cipd.Error as ex:
    print >> sys.stderr, ex.message
    return 1
maruel@chromium.org9c72d4e2012-09-28 19:20:25 +0000762
763
if __name__ == '__main__':
  # NOTE(review): judging by its name, this suppresses OS-level crash
  # reporting -- confirm against subprocess42.
  subprocess42.inhibit_os_error_reporting()
  # Ensure that we are always running with the correct encoding.
  fix_encoding.fix_encoding()
  # The value returned by main() becomes the process exit code.
  exit_code = main(sys.argv[1:])
  sys.exit(exit_code)
Marc-Antoine Ruel90c98162013-12-18 15:11:57 -0500768 sys.exit(main(sys.argv[1:]))