blob: 45af424b9650ebd0b52c5bfc1f078234c467481e [file] [log] [blame]
Derek Beckett5fb683c2020-08-19 15:24:13 -07001# Lint as: python2, python3
Chris Sosa5e4246b2012-05-22 18:05:22 -07002# Copyright (c) 2012 The Chromium OS Authors. All rights reserved.
Sean O'Connor5346e4e2010-08-12 18:49:24 +02003# Use of this source code is governed by a BSD-style license that can be
4# found in the LICENSE file.
5
Gregory Nisbetcf8c2ed2020-07-14 18:35:49 -07006from __future__ import print_function
7
Sean O'Connor5346e4e2010-08-12 18:49:24 +02008import logging
Amin Hassani5cda21d2020-08-10 15:24:44 -07009import os
Sean O'Connor5346e4e2010-08-12 18:49:24 +020010import re
Gregory Nisbetcf8c2ed2020-07-14 18:35:49 -070011import six
Congbin Guo63ae0302019-08-12 16:37:49 -070012import sys
Derek Beckett5fb683c2020-08-19 15:24:13 -070013import six.moves.urllib.parse
Sean O'Connor5346e4e2010-08-12 18:49:24 +020014
Chris Sosa65425082013-10-16 13:26:22 -070015from autotest_lib.client.bin import utils
Amin Hassani18e39882020-08-10 15:32:10 -070016from autotest_lib.client.common_lib import error
Prashanth B32baa9b2014-03-13 13:23:01 -070017from autotest_lib.client.common_lib.cros import dev_server
David Haddock77b75c32020-05-14 01:56:32 -070018from autotest_lib.client.common_lib.cros import kernel_utils
Richard Barnette0beb14b2018-05-15 18:07:52 +000019from autotest_lib.server import autotest
Richard Barnette0beb14b2018-05-15 18:07:52 +000020from autotest_lib.server.cros.dynamic_suite import constants as ds_constants
21from autotest_lib.server.cros.dynamic_suite import tools
Dan Shif3a35f72016-01-25 11:18:14 -080022
Shelley Chen16b8df32016-10-27 16:24:21 -070023try:
24 from chromite.lib import metrics
Dan Shi5e2efb72017-02-07 11:40:23 -080025except ImportError:
26 metrics = utils.metrics_mock
Sean O'Connor5346e4e2010-08-12 18:49:24 +020027
Gwendal Grignou3e96cc22017-06-07 16:22:51 -070028
Richard Barnette621a8e42018-06-25 17:34:11 -070029def _metric_name(base_name):
30 return 'chromeos/autotest/provision/' + base_name
31
32
# Name of the provisioning script that `_get_remote_script()` looks for
# on the DUT, or downloads from the devserver when it is missing.
_QUICK_PROVISION_SCRIPT = 'quick-provision'

# PROVISION_FAILED - A flag file to indicate provision failures.  The
# file is created at the start of any AU procedure (see
# `ChromiumOSProvisioner._prepare_host()`).  The file's location in
# stateful means that on successful update it will be removed.  Thus, if
# this file exists, it indicates that we've tried and failed in a
# previous attempt to update.
PROVISION_FAILED = '/var/tmp/provision_failed'


# A flag file used to enable special handling in lab DUTs.  Some
# parts of the system in Chromium OS test images will behave in ways
# convenient to the test lab when this file is present.  Generally,
# we create this immediately after any update completes.
_LAB_MACHINE_FILE = '/mnt/stateful_partition/.labmachine'


# _TARGET_VERSION - A file containing the new version to which we plan
# to update.  This file is used by the CrOS shutdown code to detect and
# handle certain version downgrade cases.  Specifically:  Downgrading
# may trigger an unwanted powerwash in the target build when the
# following conditions are met:
#  * Source build is a v4.4 kernel with R69-10756.0.0 or later.
#  * Target build predates the R69-10756.0.0 cutoff.
# When this file is present and indicates a downgrade, the OS shutdown
# code on the DUT knows how to prevent the powerwash.
_TARGET_VERSION = '/run/update_target_version'


# _REBOOT_FAILURE_MESSAGE - This is the standard message text returned
# when the Host.reboot() method fails.  The source of this text comes
# from `wait_for_restart()` in client/common_lib/hosts/base_classes.py.

_REBOOT_FAILURE_MESSAGE = 'Host did not return from reboot'


# Port numbers, kept as strings, of the devserver and of the GsCache
# server; `_quick_provision_with_gs_cache()` swaps the former for the
# latter when building the GsCache URL.
DEVSERVER_PORT = '8082'
GS_CACHE_PORT = '8888'
72
73
class _AttributedUpdateError(error.TestFail):
    """Base class for update failures that carry an attributed cause.

    Subclasses supply `_SUMMARY`, a short description of the failure
    category, and `_CLASSIFIERS`, a list of `(pattern, classification)`
    pairs that are matched against the failure message.
    """

    def __init__(self, attribution, msg):
        full_text = '%s: %s' % (attribution, msg)
        super(_AttributedUpdateError, self).__init__(full_text)
        # Keep the bare message; classification matches against it
        # rather than against the attributed text.
        self._message = msg

    def _classify(self):
        """Find the classification of the first pattern that matches.

        @return The classification paired with the first pattern in
                `_CLASSIFIERS` that matches the start of the message,
                or `None` when no pattern matches.
        """
        hits = (label for pattern, label in self._CLASSIFIERS
                if re.match(pattern, self._message))
        return next(hits, None)

    @property
    def failure_summary(self):
        """Summarize this error for metrics reporting."""
        label = self._classify()
        if not label:
            return self._SUMMARY
        return '%s: %s' % (self._SUMMARY, label)
Richard Barnette9d43e562018-06-05 17:20:10 +000096
97
class HostUpdateError(_AttributedUpdateError):
    """Failure updating a DUT attributable to the DUT.

    Raise this when the most likely cause of the failure is a condition
    that existed on the DUT before the update started, such as a
    hardware problem, or a bug in the software on the DUT.
    """

    DUT_DOWN = 'No answer to ssh'

    _SUMMARY = 'DUT failed prior to update'
    _CLASSIFIERS = [
        (DUT_DOWN, DUT_DOWN),
        (_REBOOT_FAILURE_MESSAGE, 'Reboot failed'),
    ]

    def __init__(self, hostname, msg):
        attribution = 'Error on %s prior to update' % hostname
        super(HostUpdateError, self).__init__(attribution, msg)
117
118
class ImageInstallError(_AttributedUpdateError):
    """Failure updating a DUT when installing from the devserver.

    Raise this when the target DUT fails to download and install the
    target image from the devserver, and either the devserver or the
    DUT might be at fault.
    """

    _SUMMARY = 'Image failed to download and install'
    _CLASSIFIERS = []

    def __init__(self, hostname, devserver, msg):
        attribution = ('Download and install failed from %s onto %s'
                       % (devserver, hostname))
        super(ImageInstallError, self).__init__(attribution, msg)
134
135
class NewBuildUpdateError(_AttributedUpdateError):
    """Failure updating a DUT attributable to the target build.

    Raise this when updating to a new build fails, and the most likely
    cause of the failure is a bug in the newly installed target build.
    """

    CHROME_FAILURE = 'Chrome failed to reach login screen'
    ROLLBACK_FAILURE = 'System rolled back to previous build'

    _SUMMARY = 'New build failed'
    _CLASSIFIERS = [
        (CHROME_FAILURE, 'Chrome did not start'),
        (ROLLBACK_FAILURE, ROLLBACK_FAILURE),
    ]

    def __init__(self, update_version, msg):
        attribution = 'Failure in build %s' % update_version
        super(NewBuildUpdateError, self).__init__(attribution, msg)

    @property
    def failure_summary(self):
        """Return the fixed summary used for failures of the new build.

        This override returns a constant and does not consult
        `_SUMMARY` or `_CLASSIFIERS`.
        NOTE(review): confirm that bypassing the classifiers is intended.
        """
        return 'Build failed to work after installing'
161
Richard Barnette9d43e562018-06-05 17:20:10 +0000162
def _url_to_version(update_url):
    """Return the version based on update_url.

    @param update_url: url to the image to update to.

    @return The last element of the URL path, after any `/au/...`
            section has been removed.
    """
    # The Chrome OS version is generally the last element in the URL. The only
    # exception is delta update URLs, which are rooted under the version; e.g.,
    # http://.../update/.../0.14.755.0/au/0.14.754.0. In this case we want to
    # strip off the au section of the path before reading the version.
    url_path = six.moves.urllib.parse.urlparse(update_url).path
    version_root = re.sub('/au/.*', '', url_path)
    return version_root.rsplit('/', 1)[-1].strip()
Sean O'Connor5346e4e2010-08-12 18:49:24 +0200175
176
def url_to_image_name(update_url):
    """Return the image name based on update_url.

    From a URL like:
        http://172.22.50.205:8082/update/lumpy-release/R27-3837.0.0
    return lumpy-release/R27-3837.0.0

    The leading `len('/update/')` characters of the URL path are dropped
    unconditionally; the path is not checked for that prefix.

    @param update_url: url to the image to update to.
    @returns a string representing the image name in the update_url.

    """
    prefix_length = len('/update/')
    parsed_url = six.moves.urllib.parse.urlparse(update_url)
    return parsed_url.path[prefix_length:]
Scott Zawalskieadbf702013-03-14 09:23:06 -0400189
190
def get_update_failure_reason(exception):
    """Convert an exception into a failure reason for metrics.

    The passed in `exception` should be one raised by failure of
    `ChromiumOSProvisioner.run_provision`.  The returned string will
    describe the failure.  If the input exception value is not a truish
    value the return value will be `None`.

    The number of possible return strings is restricted to a limited
    enumeration of values so that the string may be safely used in
    Monarch metrics without worrying about cardinality of the range of
    string values.

    @param exception  Exception to be converted to a failure reason.

    @return A string suitable for use in Monarch metrics, or `None`.
    """
    if not exception:
        return None
    if isinstance(exception, _AttributedUpdateError):
        # Attributed errors know how to summarize themselves.
        return exception.failure_summary
    # Anything else is reported by exception class name only.
    return 'Unknown Error: %s' % type(exception).__name__
214
215
class ChromiumOSProvisioner(object):
    """Chromium OS specific DUT update functionality."""

    def __init__(self, update_url, host=None, interactive=True,
                 is_release_bucket=None, is_servohost=False):
        """Initializes the object.

        @param update_url: The URL we want the update to use.
        @param host: A client.common_lib.hosts.Host implementation.
        @param interactive: Bool whether we are doing an interactive update.
        @param is_release_bucket: If True, use release bucket
            gs://chromeos-releases.
        @param is_servohost: Bool whether the update target is a servohost.
        """
        self.update_url = update_url
        self.host = host
        self.interactive = interactive
        self.update_version = _url_to_version(update_url)
        self._is_release_bucket = is_release_bucket
        self._is_servohost = is_servohost


    def _run(self, cmd, *args, **kwargs):
        """Abbreviated form of self.host.run(...)"""
        return self.host.run(cmd, *args, **kwargs)


    def _rootdev(self, options=''):
        """Returns the stripped output of rootdev <options>.

        @param options: options to run rootdev.

        """
        return self._run('rootdev %s' % options).stdout.strip()


    def _reset_update_engine(self):
        """Resets the host to prepare for a clean update regardless of state."""
        # `|| true` keeps the command from failing when `stop ui` fails.
        self._run('stop ui || true')
        self._run('restart update-engine')


    def _reset_stateful_partition(self):
        """Clear any pending stateful update request."""
        cmd = ['rm', '-rf']
        for f in ('var_new', 'dev_image_new', '.update_available'):
            cmd += [os.path.join('/mnt/stateful_partition', f)]
        # TODO(b/165024723): This is a temporary measure until we figure out the
        # root cause of this bug.
        cmd += ['/mnt/stateful_partition/dev_image/share/tast/data/chromiumos/'
                'tast/local/bundles/']
        cmd += [_TARGET_VERSION, '2>&1']
        # The command is handed to the host as a list of words.
        self._run(cmd)


    def _set_target_version(self):
        """Set the "target version" for the update."""
        # Version strings that come from release buckets do not have RXX- at the
        # beginning. So remove this prefix only if the version has it.
        version_number = (self.update_version.split('-')[1]
                          if '-' in self.update_version
                          else self.update_version)
        self._run('echo %s > %s' % (version_number, _TARGET_VERSION))


    def _revert_boot_partition(self):
        """Revert the boot partition.

        @return The result of running `/postinst` on the DUT.
        """
        part = self._rootdev('-s')
        logging.warning('Reverting update; Boot partition will be %s', part)
        return self._run('/postinst %s 2>&1' % part)


    def _get_remote_script(self, script_name):
        """Ensure that `script_name` is present on the DUT.

        The given script (e.g. `quick-provision`) may be present in the
        stateful partition under /usr/local/bin, or we may have to
        download it from the devserver.

        Determine whether the script is present or must be downloaded
        and download if necessary.  Then, return a command fragment
        sufficient to run the script from wherever it now lives on the
        DUT.

        @param script_name  The name of the script as expected in
                            /usr/local/bin and on the devserver.
        @return A string with the command (minus arguments) that will
                run the target script, or `None` if the downloaded file
                does not start with a `#!` line naming an interpreter.
        """
        remote_script = '/usr/local/bin/%s' % script_name
        if self.host.path_exists(remote_script):
            return remote_script
        self.host.run('mkdir -p -m 1777 /usr/local/tmp')
        remote_tmp_script = '/usr/local/tmp/%s' % script_name
        server_name = six.moves.urllib.parse.urlparse(self.update_url)[1]
        script_url = 'http://%s/static/%s' % (server_name, script_name)
        # Download the script, then print its first line so that the
        # interpreter can be read from the `#!` line.
        fetch_script = 'curl -Ss -o %s %s && head -1 %s' % (
                remote_tmp_script, script_url, remote_tmp_script)

        first_line = self._run(fetch_script).stdout.strip()

        if first_line.startswith('#!'):
            # The downloaded copy is run through its interpreter rather
            # than executed directly.
            script_interpreter = first_line.lstrip('#!')
            if script_interpreter:
                return '%s %s' % (script_interpreter, remote_tmp_script)
        return None


    def _prepare_host(self):
        """Make sure the target DUT is working and ready for update.

        Initially, the target DUT's state is unknown.  The DUT is
        expected to be online, but we strive to be forgiving if Chrome
        and/or the update engine aren't fully functional.

        @raises HostUpdateError if the DUT is not up.
        """
        # Summary of work, and the rationale:
        #  1. Reboot, because it's a good way to clear out problems.
        #  2. Touch the PROVISION_FAILED file, to allow repair to detect
        #     failure later.
        #  3. Run the hook for host class specific preparation.
        #  4. Stop Chrome, because the system is designed to eventually
        #     reboot if Chrome is stuck in a crash loop.
        #  5. Force `update-engine` to start, because if Chrome failed
        #     to start properly, the status of the `update-engine` job
        #     will be uncertain.
        if not self.host.is_up():
            raise HostUpdateError(self.host.hostname,
                                  HostUpdateError.DUT_DOWN)
        self._reset_stateful_partition()
        # Servohost reboot logic is handled by themselves.
        if not self._is_servohost:
            self.host.reboot(timeout=self.host.REBOOT_TIMEOUT)
        self._run('touch %s' % PROVISION_FAILED)
        self.host.prepare_for_update()
        # Servohost will only update via quick provision.
        if not self._is_servohost:
            self._reset_update_engine()
        logging.info('Updating from version %s to %s.',
                     self.host.get_release_version(),
                     self.update_version)


    def _quick_provision_with_gs_cache(self, provision_command, devserver_name,
                                       image_name):
        """Run quick_provision using GsCache server.

        @param provision_command: The path of quick_provision command.
        @param devserver_name: The devserver name and port (optional).
        @param image_name: The image to be installed.
        """
        logging.info('Try quick provision with gs_cache.')
        # If enabled, the GsCache server listens on a different port on
        # the devserver.  Swap only the port component: a plain
        # str.replace() would also rewrite the digits of DEVSERVER_PORT
        # wherever else they occur in the name.
        server_host, colon, server_port = devserver_name.rpartition(':')
        if colon and server_port == DEVSERVER_PORT:
            gs_cache_server = server_host + colon + GS_CACHE_PORT
        else:
            gs_cache_server = devserver_name
        gs_cache_url = ('http://%s/download/%s'
                        % (gs_cache_server,
                           'chromeos-releases' if self._is_release_bucket
                           else 'chromeos-image-archive'))

        # Check if GS_Cache server is enabled on the server.
        self._run('curl -s -o /dev/null %s' % gs_cache_url)

        command = '%s --noreboot %s %s' % (provision_command, image_name,
                                           gs_cache_url)
        self._run(command)
        metrics.Counter(_metric_name('quick_provision')).increment(
                fields={'devserver': devserver_name, 'gs_cache': True})


    def _quick_provision_with_devserver(self, provision_command,
                                        devserver_name, image_name):
        """Run quick_provision using legacy devserver.

        @param provision_command: The path of quick_provision command.
        @param devserver_name: The devserver name and port (optional).
        @param image_name: The image to be installed.

        @raises error.TestFail if staging the artifacts on the devserver
                fails.
        """
        logging.info('Try quick provision with devserver.')
        ds = dev_server.ImageServer('http://%s' % devserver_name)
        archive_url = ('gs://chromeos-releases/%s' % image_name
                       if self._is_release_bucket else None)
        try:
            ds.stage_artifacts(image_name, ['quick_provision', 'stateful',
                                            'autotest_packages'],
                               archive_url=archive_url)
        except dev_server.DevServerException as e:
            # six.reraise() needs an exception instance as its value.
            # Under Python 3 it reads `value.__traceback__`, so passing
            # a plain string raises AttributeError instead of TestFail.
            six.reraise(error.TestFail, error.TestFail(str(e)),
                        sys.exc_info()[2])

        static_url = 'http://%s/static' % devserver_name
        command = '%s --noreboot %s %s' % (provision_command, image_name,
                                           static_url)
        self._run(command)
        metrics.Counter(_metric_name('quick_provision')).increment(
                fields={'devserver': devserver_name, 'gs_cache': False})


    def _install_update(self):
        """Install an update using the `quick-provision` script.

        This uses the `quick-provision` script to download and install
        a root FS, kernel and stateful filesystem content.  GsCache is
        tried first; if that fails for any reason the devserver is used
        instead.

        @return The kernel expected to be booted next, or `None` if the
                install failed and the DUT was reset.
        """
        logging.info('Installing image at %s onto %s',
                     self.update_url, self.host.hostname)
        server_name = six.moves.urllib.parse.urlparse(self.update_url)[1]
        image_name = url_to_image_name(self.update_url)

        logging.info('Installing image using quick-provision.')
        provision_command = self._get_remote_script(_QUICK_PROVISION_SCRIPT)
        try:
            try:
                self._quick_provision_with_gs_cache(provision_command,
                                                    server_name, image_name)
            except Exception as e:
                logging.error('Failed to quick-provision with gscache with '
                              'error %s', e)
                self._quick_provision_with_devserver(provision_command,
                                                     server_name, image_name)

            self._set_target_version()
            return kernel_utils.verify_kernel_state_after_update(self.host)
        except Exception:
            # N.B.  We handle only `Exception` here.  Non-Exception
            # classes (such as KeyboardInterrupt) are handled by our
            # caller.
            logging.exception('quick-provision script failed;')
            self._revert_boot_partition()
            self._reset_stateful_partition()
            self._reset_update_engine()
            # NOTE(review): the failure is swallowed here, so
            # `run_provision()` goes on to call `_complete_update(None)`.
            # Confirm that this is intended rather than re-raising.
            return None


    def _complete_update(self, expected_kernel):
        """Finish the update, and confirm that it succeeded.

        Initial condition is that the target build has been downloaded
        and installed on the DUT, but has not yet been booted.  This
        function is responsible for rebooting the DUT, and checking that
        the new build is running successfully.

        @param expected_kernel: kernel expected to be active after reboot.
        """
        # Regarding the 'crossystem' command below:  In some cases,
        # the update flow puts the TPM into a state such that it
        # fails verification.  We don't know why.  However, this
        # call papers over the problem by clearing the TPM during
        # the reboot.
        #
        # We ignore failures from 'crossystem'.  Although failure
        # here is unexpected, and could signal a bug, the point of
        # the exercise is to paper over problems; allowing this to
        # fail would defeat the purpose.
        self._run('crossystem clear_tpm_owner_request=1',
                  ignore_status=True)
        self.host.reboot(timeout=self.host.REBOOT_TIMEOUT)

        # Touch the lab machine file to leave a marker that
        # distinguishes this image from other test images.
        # Afterwards, we must re-run the autoreboot script because
        # it depends on the _LAB_MACHINE_FILE.
        autoreboot_cmd = ('FILE="%s" ; [ -f "$FILE" ] || '
                          '( touch "$FILE" ; start autoreboot )')
        self._run(autoreboot_cmd % _LAB_MACHINE_FILE)
        try:
            kernel_utils.verify_boot_expectations(
                    expected_kernel, NewBuildUpdateError.ROLLBACK_FAILURE,
                    self.host)
        except Exception:
            # When the system is rolled back, the provision_failed file is
            # removed. So add it back here and re-raise the exception.
            self._run('touch %s' % PROVISION_FAILED)
            raise

        logging.debug('Cleaning up old autotest directories.')
        try:
            installed_autodir = autotest.Autotest.get_installed_autodir(
                    self.host)
            self._run('rm -rf ' + installed_autodir)
        except autotest.AutodirNotFoundError:
            logging.debug('No autotest installed directory found.')


    def run_provision(self):
        """Perform a full provision of a DUT in the test lab.

        This downloads and installs the root FS and stateful partition
        content needed for the update specified in `self.host` and
        `self.update_url`.  The provision is performed according to the
        requirements for provisioning a DUT for testing the requested
        build.

        At the end of the procedure, metrics are reported describing the
        outcome of the operation.

        @returns A tuple of the form `(image_name, attributes)`, where
            `image_name` is the name of the image installed, and
            `attributes` is new attributes to be applied to the DUT.

        @raises HostUpdateError if preparing the host fails.
        @raises ImageInstallError if `_install_update()` raises.
        @raises NewBuildUpdateError if completing the update fails.
        """
        server_name = dev_server.get_resolved_hostname(self.update_url)
        metrics.Counter(_metric_name('install')).increment(
                fields={'devserver': server_name})

        # In each phase below, errors that already carry an attribution
        # pass through unchanged; anything else is wrapped in the error
        # class that matches the phase.
        try:
            self._prepare_host()
        except _AttributedUpdateError:
            raise
        except Exception as e:
            logging.exception('Failure preparing host prior to update.')
            raise HostUpdateError(self.host.hostname, str(e))

        try:
            expected_kernel = self._install_update()
        except _AttributedUpdateError:
            raise
        except Exception as e:
            logging.exception('Failure during download and install.')
            raise ImageInstallError(self.host.hostname, server_name, str(e))

        # Servohost will handle post update process themselves.
        if not self._is_servohost:
            try:
                self._complete_update(expected_kernel)
            except _AttributedUpdateError:
                raise
            except Exception as e:
                logging.exception('Failure from build after update.')
                raise NewBuildUpdateError(self.update_version, str(e))

        image_name = url_to_image_name(self.update_url)
        # update_url is different from devserver url needed to stage autotest
        # packages, therefore, resolve a new devserver url here.
        devserver_url = dev_server.ImageServer.resolve(
                image_name, self.host.hostname).url()
        repo_url = tools.get_package_url(devserver_url, image_name)
        return image_name, {ds_constants.JOB_REPO_URL: repo_url}