blob: b497b4bf6e7994fd5713fa82197581b4314cfbec [file] [log] [blame]
J. Richard Barnette24adbf42012-04-11 15:04:53 -07001# Copyright (c) 2012 The Chromium OS Authors. All rights reserved.
Dale Curtisaa5eedb2011-08-23 16:18:52 -07002# Use of this source code is governed by a BSD-style license that can be
3# found in the LICENSE file.
4
Aviv Keshet74c89a92013-02-04 15:18:30 -08005import functools
J. Richard Barnette1d78b012012-05-15 13:56:30 -07006import logging
Dan Shi0f466e82013-02-22 15:44:58 -08007import os
Simran Basid5e5e272012-09-24 15:23:59 -07008import re
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07009import time
10
mussa584b4462014-06-20 15:13:28 -070011import common
J. Richard Barnette45e93de2012-04-11 17:24:15 -070012from autotest_lib.client.bin import utils
Dan Shi9cb0eec2014-06-03 09:04:50 -070013from autotest_lib.client.common_lib import autotemp
Richard Barnette0c73ffc2012-11-19 15:21:18 -080014from autotest_lib.client.common_lib import error
15from autotest_lib.client.common_lib import global_config
Dan Shi549fb822015-03-24 18:01:11 -070016from autotest_lib.client.common_lib import lsbrelease_utils
J. Richard Barnette45e93de2012-04-11 17:24:15 -070017from autotest_lib.client.common_lib.cros import autoupdater
Richard Barnette03a0c132012-11-05 12:40:35 -080018from autotest_lib.client.common_lib.cros import dev_server
Gabe Blackb72f4fb2015-01-20 16:47:13 -080019from autotest_lib.client.common_lib.cros.graphite import autotest_es
Gabe Black1e1c41b2015-02-04 23:55:15 -080020from autotest_lib.client.common_lib.cros.graphite import autotest_stats
Hsinyu Chaoe0b08e62015-08-11 10:50:37 +000021from autotest_lib.client.cros import constants as client_constants
J. Richard Barnette84890bd2014-02-21 11:05:47 -080022from autotest_lib.client.cros import cros_ui
Cheng-Yi Chiangf4104ff2014-12-23 19:39:01 +080023from autotest_lib.client.cros.audio import cras_utils
Katherine Threlkeldab83d392015-06-18 16:45:57 -070024from autotest_lib.client.cros.input_playback import input_playback
Mussa5b589052015-10-26 17:55:26 -070025from autotest_lib.client.cros.video import constants as video_test_constants
Simran Basi5ace6f22016-01-06 17:30:44 -080026from autotest_lib.server import afe_utils
MK Ryu35d661e2014-09-25 17:44:10 -070027from autotest_lib.server import autoserv_parser
28from autotest_lib.server import autotest
29from autotest_lib.server import constants
Dan Shia1ecd5c2013-06-06 11:21:31 -070030from autotest_lib.server import utils as server_utils
Dan Shi9cb0eec2014-06-03 09:04:50 -070031from autotest_lib.server.cros import provision
Scott Zawalski89c44dd2013-02-26 09:28:02 -050032from autotest_lib.server.cros.dynamic_suite import constants as ds_constants
Simran Basi5e6339a2013-03-21 11:34:32 -070033from autotest_lib.server.cros.dynamic_suite import tools, frontend_wrappers
Dan Shi9cb0eec2014-06-03 09:04:50 -070034from autotest_lib.server.cros.faft.config.config import Config as FAFTConfig
Scottfe06ed82015-11-05 17:15:01 -080035from autotest_lib.server.cros.servo import plankton
Fang Deng96667ca2013-08-01 17:46:18 -070036from autotest_lib.server.hosts import abstract_ssh
Tom Wai-Hong Tamefe1c7f2014-01-02 14:00:11 +080037from autotest_lib.server.hosts import chameleon_host
J. Richard Barnettea7e7fdc2016-02-12 12:35:36 -080038from autotest_lib.server.hosts import cros_repair
Scottfe06ed82015-11-05 17:15:01 -080039from autotest_lib.server.hosts import plankton_host
Fang Deng5d518f42013-08-02 14:04:32 -070040from autotest_lib.server.hosts import servo_host
Simran Basidcff4252012-11-20 16:13:20 -080041from autotest_lib.site_utils.rpm_control_system import rpm_client
Simran Basid5e5e272012-09-24 15:23:59 -070042
43
# Shorthand for the global configuration object; settings are read from it
# with CONFIG.get_config_value().
CONFIG = global_config.global_config

# Board names singled out for lucid sleep handling.
# NOTE(review): the code that consumes this list is not in this part of the
# file -- confirm the exact meaning against its users.
LUCID_SLEEP_BOARDS = ['samus', 'lulu']

# A file to indicate provision failure and require Repair job to powerwash the
# dut.
PROVISION_FAILED = '/var/tmp/provision_failed'
51
class FactoryImageCheckerException(error.AutoservError):
    """Signals that the image being checked is a factory image."""
55
56
Fang Deng0ca40e22013-08-27 17:47:44 -070057class CrosHost(abstract_ssh.AbstractSSHHost):
J. Richard Barnette45e93de2012-04-11 17:24:15 -070058 """Chromium OS specific subclass of Host."""
59
    # Version label prefix, taken from provision.CROS_VERSION_PREFIX.
    VERSION_PREFIX = provision.CROS_VERSION_PREFIX

    _parser = autoserv_parser.autoserv_parser
    # AFE frontend wrapper created with a 5 minute timeout and a 10 second
    # delay; used for label lookups in stage_server_side_package().
    _AFE = frontend_wrappers.RetryingAFE(timeout_min=5, delay_sec=10)

    # Timeout values (in seconds) associated with various Chrome OS
    # state changes.
    #
    # In general, a good rule of thumb is that the timeout can be up
    # to twice the typical measured value on the slowest platform.
    # The times here have not necessarily been empirically tested to
    # meet this criterion.
    #
    # SLEEP_TIMEOUT:  Time to allow for suspend to memory.
    # RESUME_TIMEOUT: Time to allow for resume after suspend, plus
    #   time to restart the network.
    # SHUTDOWN_TIMEOUT: Time to allow for shut down.
    # BOOT_TIMEOUT: Time to allow for boot from power off.  Among
    #   other things, this must account for the 30 second dev-mode
    #   screen delay, time to start the network on the DUT, and the
    #   ssh timeout of 120 seconds.
    # USB_BOOT_TIMEOUT: Time to allow for boot from a USB device,
    #   including the 30 second dev-mode delay and time to start the
    #   network.
    # INSTALL_TIMEOUT: Time to allow for chromeos-install.
    # POWERWASH_BOOT_TIMEOUT: Time to allow for a reboot that
    #   includes powerwash.

    SLEEP_TIMEOUT = 2
    RESUME_TIMEOUT = 10
    SHUTDOWN_TIMEOUT = 10
    BOOT_TIMEOUT = 150
    USB_BOOT_TIMEOUT = 300
    INSTALL_TIMEOUT = 480
    POWERWASH_BOOT_TIMEOUT = 60

    # Minimum OS version that supports server side packaging. Older builds may
    # not have server side package built or with Autotest code change to support
    # server-side packaging.
    # Read from the AUTOSERV/min_version_support_ssp config setting when the
    # class is defined.
    MIN_VERSION_SUPPORT_SSP = CONFIG.get_config_value(
            'AUTOSERV', 'min_version_support_ssp', type=int)

    # REBOOT_TIMEOUT: How long to wait for a reboot.
    #
    # We have a long timeout to ensure we don't flakily fail due to other
    # issues. Shorter timeouts are vetted in platform_RebootAfterUpdate.
    # TODO(sbasi - crbug.com/276094) Restore to 5 mins once the 'host did not
    # return from reboot' bug is solved.
    REBOOT_TIMEOUT = 480

    # _USB_POWER_TIMEOUT: Time to allow for USB to power toggle ON and OFF.
    # _POWER_CYCLE_TIMEOUT: Time to allow for manual power cycle.
    _USB_POWER_TIMEOUT = 5
    _POWER_CYCLE_TIMEOUT = 10

    # The CROS/rpm_recovery_boards config value is a comma-separated string;
    # it is split into a list of board names here.
    _RPM_RECOVERY_BOARDS = CONFIG.get_config_value('CROS',
            'rpm_recovery_boards', type=str).split(',')

    _MAX_POWER_CYCLE_ATTEMPTS = 6
    # Marker file touched by _post_update_processing() to distinguish a lab
    # image from other test images.
    _LAB_MACHINE_FILE = '/mnt/stateful_partition/.labmachine'
    # Pattern with capture groups for the lab number, optional row, rack and
    # host number embedded in a hostname.
    _RPM_HOSTNAME_REGEX = ('chromeos(\d+)(-row(\d+))?-rack(\d+[a-z]*)'
                           '-host(\d+)')
    _LIGHTSENSOR_FILES = [ "in_illuminance0_input",
                           "in_illuminance_input",
                           "in_illuminance0_raw",
                           "in_illuminance_raw",
                           "illuminance0_input"]
    _LIGHTSENSOR_SEARCH_DIR = '/sys/bus/iio/devices'
    # label_decorator binds server_utils.add_label_detector to the two lists
    # below, so it operates on these class-level lists.
    _LABEL_FUNCTIONS = []
    _DETECTABLE_LABELS = []
    label_decorator = functools.partial(server_utils.add_label_detector,
                                        _LABEL_FUNCTIONS,
                                        _DETECTABLE_LABELS)

    # Constants used in ping_wait_up() and ping_wait_down().
    #
    # _PING_WAIT_COUNT is the approximate number of polling
    # cycles to use when waiting for a host state change.
    #
    # _PING_STATUS_DOWN and _PING_STATUS_UP are names used
    # for arguments to the internal _ping_wait_for_status()
    # method.
    _PING_WAIT_COUNT = 40
    _PING_STATUS_DOWN = False
    _PING_STATUS_UP = True

    # Allowed values for the power_method argument.

    # POWER_CONTROL_RPM: Passed as default arg for power_off/on/cycle() methods.
    # POWER_CONTROL_SERVO: Used in set_power() and power_cycle() methods.
    # POWER_CONTROL_MANUAL: Used in set_power() and power_cycle() methods.
    POWER_CONTROL_RPM = 'RPM'
    POWER_CONTROL_SERVO = 'servoj10'
    POWER_CONTROL_MANUAL = 'manual'

    POWER_CONTROL_VALID_ARGS = (POWER_CONTROL_RPM,
                                POWER_CONTROL_SERVO,
                                POWER_CONTROL_MANUAL)

    _RPM_OUTLET_CHANGED = 'outlet_changed'

    # URL pattern to download firmware image.
    _FW_IMAGE_URL_PATTERN = CONFIG.get_config_value(
            'CROS', 'firmware_url_pattern', type=str)

    # Time duration waiting for host up/down check
    _CHECK_HOST_UP_TIMEOUT_SECS = 15
167
MK Ryu35d661e2014-09-25 17:44:10 -0700168
J. Richard Barnette964fba02012-10-24 17:34:29 -0700169 @staticmethod
beeps46dadc92013-11-07 14:07:10 -0800170 def check_host(host, timeout=10):
171 """
172 Check if the given host is a chrome-os host.
173
174 @param host: An ssh host representing a device.
175 @param timeout: The timeout for the run command.
176
177 @return: True if the host device is chromeos.
178
beeps46dadc92013-11-07 14:07:10 -0800179 """
180 try:
Simran Basi933c8af2015-04-29 14:05:07 -0700181 result = host.run(
182 'grep -q CHROMEOS /etc/lsb-release && '
183 '! test -f /mnt/stateful_partition/.android_tester && '
184 '! grep -q moblab /etc/lsb-release',
185 ignore_status=True, timeout=timeout)
beeps46dadc92013-11-07 14:07:10 -0800186 except (error.AutoservRunError, error.AutoservSSHTimeout):
187 return False
188 return result.exit_status == 0
189
190
191 @staticmethod
Tom Wai-Hong Tamefe1c7f2014-01-02 14:00:11 +0800192 def _extract_arguments(args_dict, key_subset):
193 """Extract options from `args_dict` and return a subset result.
J. Richard Barnette7214e0b2013-02-06 15:20:49 -0800194
195 Take the provided dictionary of argument options and return
Tom Wai-Hong Tamefe1c7f2014-01-02 14:00:11 +0800196 a subset that represent standard arguments needed to construct
197 a test-assistant object (chameleon or servo) for a host. The
198 intent is to provide standard argument processing from
Christopher Wiley644ef3e2015-05-15 13:14:14 -0700199 CrosHost for tests that require a test-assistant board
Tom Wai-Hong Tamefe1c7f2014-01-02 14:00:11 +0800200 to operate.
201
202 @param args_dict Dictionary from which to extract the arguments.
203 @param key_subset Tuple of keys to extract from the args_dict, e.g.
204 ('servo_host', 'servo_port').
205 """
206 result = {}
207 for arg in key_subset:
208 if arg in args_dict:
209 result[arg] = args_dict[arg]
210 return result
211
212
213 @staticmethod
214 def get_chameleon_arguments(args_dict):
215 """Extract chameleon options from `args_dict` and return the result.
216
217 Recommended usage:
218 ~~~~~~~~
219 args_dict = utils.args_to_dict(args)
220 chameleon_args = hosts.CrosHost.get_chameleon_arguments(args_dict)
221 host = hosts.create_host(machine, chameleon_args=chameleon_args)
222 ~~~~~~~~
223
224 @param args_dict Dictionary from which to extract the chameleon
225 arguments.
226 """
227 return CrosHost._extract_arguments(
228 args_dict, ('chameleon_host', 'chameleon_port'))
229
230
231 @staticmethod
Scottfe06ed82015-11-05 17:15:01 -0800232 def get_plankton_arguments(args_dict):
233 """Extract chameleon options from `args_dict` and return the result.
234
235 Recommended usage:
236 ~~~~~~~~
237 args_dict = utils.args_to_dict(args)
238 plankon_args = hosts.CrosHost.get_plankton_arguments(args_dict)
239 host = hosts.create_host(machine, plankton_args=polankton_args)
240 ~~~~~~~~
241
242 @param args_dict Dictionary from which to extract the plankton
243 arguments.
244 """
245 args = CrosHost._extract_arguments(
246 args_dict, ('plankton_host', 'plankton_port'))
247 return args
248
249
250 @staticmethod
Tom Wai-Hong Tamefe1c7f2014-01-02 14:00:11 +0800251 def get_servo_arguments(args_dict):
252 """Extract servo options from `args_dict` and return the result.
J. Richard Barnette7214e0b2013-02-06 15:20:49 -0800253
254 Recommended usage:
255 ~~~~~~~~
256 args_dict = utils.args_to_dict(args)
Fang Deng0ca40e22013-08-27 17:47:44 -0700257 servo_args = hosts.CrosHost.get_servo_arguments(args_dict)
J. Richard Barnette7214e0b2013-02-06 15:20:49 -0800258 host = hosts.create_host(machine, servo_args=servo_args)
259 ~~~~~~~~
260
261 @param args_dict Dictionary from which to extract the servo
262 arguments.
263 """
Tom Wai-Hong Tamefe1c7f2014-01-02 14:00:11 +0800264 return CrosHost._extract_arguments(
265 args_dict, ('servo_host', 'servo_port'))
J. Richard Barnette134ec2c2012-04-25 12:59:37 -0700266
J. Richard Barnette964fba02012-10-24 17:34:29 -0700267
Scottfe06ed82015-11-05 17:15:01 -0800268 def _initialize(self, hostname, chameleon_args=None, servo_args=None, plankton_args=None,
Fang Denge545abb2014-12-30 18:43:47 -0800269 try_lab_servo=False, ssh_verbosity_flag='', ssh_options='',
Fang Dengd1c2b732013-08-20 12:59:46 -0700270 *args, **dargs):
Tom Wai-Hong Tamefe1c7f2014-01-02 14:00:11 +0800271 """Initialize superclasses, |self.chameleon|, and |self.servo|.
J. Richard Barnette67ccb872012-04-19 16:34:56 -0700272
Fang Denge545abb2014-12-30 18:43:47 -0800273 This method will attempt to create the test-assistant object
274 (chameleon/servo) when it is needed by the test. Check
275 the docstring of chameleon_host.create_chameleon_host and
276 servo_host.create_servo_host for how this is determined.
Fang Deng5d518f42013-08-02 14:04:32 -0700277
Fang Denge545abb2014-12-30 18:43:47 -0800278 @param hostname: Hostname of the dut.
279 @param chameleon_args: A dictionary that contains args for creating
280 a ChameleonHost. See chameleon_host for details.
281 @param servo_args: A dictionary that contains args for creating
282 a ServoHost object. See servo_host for details.
283 @param try_lab_servo: Boolean, False indicates that ServoHost should
284 not be created for a device in Cros test lab.
285 See servo_host for details.
286 @param ssh_verbosity_flag: String, to pass to the ssh command to control
287 verbosity.
288 @param ssh_options: String, other ssh options to pass to the ssh
289 command.
J. Richard Barnette67ccb872012-04-19 16:34:56 -0700290 """
Fang Deng0ca40e22013-08-27 17:47:44 -0700291 super(CrosHost, self)._initialize(hostname=hostname,
J. Richard Barnette45e93de2012-04-11 17:24:15 -0700292 *args, **dargs)
J. Richard Barnettea7e7fdc2016-02-12 12:35:36 -0800293 self._repair_strategy = cros_repair.create_repair_strategy()
J. Richard Barnettef0859852012-08-20 14:55:50 -0700294 # self.env is a dictionary of environment variable settings
295 # to be exported for commands run on the host.
296 # LIBC_FATAL_STDERR_ can be useful for diagnosing certain
297 # errors that might happen.
298 self.env['LIBC_FATAL_STDERR_'] = '1'
Fang Dengd1c2b732013-08-20 12:59:46 -0700299 self._ssh_verbosity_flag = ssh_verbosity_flag
Aviv Keshetc5947fa2013-09-04 14:06:29 -0700300 self._ssh_options = ssh_options
Fang Deng5d518f42013-08-02 14:04:32 -0700301 # TODO(fdeng): We need to simplify the
302 # process of servo and servo_host initialization.
303 # crbug.com/298432
Fang Denge545abb2014-12-30 18:43:47 -0800304 self._servo_host = servo_host.create_servo_host(
305 dut=self.hostname, servo_args=servo_args,
306 try_lab_servo=try_lab_servo)
Tom Wai-Hong Tamefe1c7f2014-01-02 14:00:11 +0800307 # TODO(waihong): Do the simplication on Chameleon too.
Tom Wai-Hong Tam3d6790d2014-04-14 16:15:47 +0800308 self._chameleon_host = chameleon_host.create_chameleon_host(
309 dut=self.hostname, chameleon_args=chameleon_args)
Scottfe06ed82015-11-05 17:15:01 -0800310 # Add plankton host if plankton args were added on command line
311 self._plankton_host = plankton_host.create_plankton_host(plankton_args)
Tom Wai-Hong Tam3d6790d2014-04-14 16:15:47 +0800312
Dan Shi4d478522014-02-14 13:46:32 -0800313 if self._servo_host is not None:
314 self.servo = self._servo_host.get_servo()
315 else:
316 self.servo = None
317
Tom Wai-Hong Tam3d6790d2014-04-14 16:15:47 +0800318 if self._chameleon_host:
Tom Wai-Hong Tameaee3402014-01-22 08:52:10 +0800319 self.chameleon = self._chameleon_host.create_chameleon_board()
Tom Wai-Hong Tamefe1c7f2014-01-02 14:00:11 +0800320 else:
Tom Wai-Hong Tam3d6790d2014-04-14 16:15:47 +0800321 self.chameleon = None
Fang Deng5d518f42013-08-02 14:04:32 -0700322
Scottfe06ed82015-11-05 17:15:01 -0800323 if self._plankton_host:
324 self.plankton_servo = self._plankton_host.get_servo()
325 logging.info('plankton_servo: %r', self.plankton_servo)
326 # Create the plankton object used to access the ec uart
Scott07a848f2016-01-12 15:04:52 -0800327 self.plankton = plankton.Plankton(self.plankton_servo,
328 self._plankton_host.get_servod_server_proxy())
Scottfe06ed82015-11-05 17:15:01 -0800329 else:
Scott07a848f2016-01-12 15:04:52 -0800330 self.plankton = None
Scottfe06ed82015-11-05 17:15:01 -0800331
Fang Deng5d518f42013-08-02 14:04:32 -0700332
Dan Shi3d7a0e12015-10-12 11:55:45 -0700333 def get_repair_image_name(self, image_type='cros'):
Scott Zawalski89c44dd2013-02-26 09:28:02 -0500334 """Generate a image_name from variables in the global config.
335
Dan Shi3d7a0e12015-10-12 11:55:45 -0700336 image_type is used to differentiate different images. Default is CrOS,
337 in which case, repair image's name follows the naming convention defined
338 in global setting CROS/stable_build_pattern.
339 If the image_type is not `cros`, the repair image will be looked up
340 using key `board_name/image_type`, e.g., daisy_spring/firmware.
341
342 @param image_type: Type of the image. Default is `cros`.
343
Dan Shi08173202015-11-12 13:08:45 -0800344 @returns a str of $board-version/$BUILD. Returns None if stable version
345 for the board and the default are both not set, e.g., stable
346 firmware version for a new board.
Scott Zawalski89c44dd2013-02-26 09:28:02 -0500347
348 """
Scott Zawalski89c44dd2013-02-26 09:28:02 -0500349 board = self._get_board_from_afe()
350 if board is None:
351 raise error.AutoservError('DUT has no board attribute, '
352 'cannot be repaired.')
Dan Shi3d7a0e12015-10-12 11:55:45 -0700353 if image_type != 'cros':
354 board = '%s/%s' % (board, image_type)
Simran Basibeb2bb22016-02-03 15:25:48 -0800355 stable_version = afe_utils.get_stable_version(board=board)
Dan Shi3d7a0e12015-10-12 11:55:45 -0700356 if image_type == 'cros':
357 build_pattern = CONFIG.get_config_value(
358 'CROS', 'stable_build_pattern')
359 stable_version = build_pattern % (board, stable_version)
Dan Shi08173202015-11-12 13:08:45 -0800360 elif image_type == 'firmware':
361 # If firmware stable version is not specified, `stable_version`
362 # from the RPC is the default stable version for CrOS image.
363 # firmware stable version must be from firmware branch, thus its
364 # value must be like board-firmware/R31-1234.0.0. Check if
365 # firmware exists in the stable version, if not, return None.
366 if 'firmware' not in stable_version:
367 return None
Dan Shi3d7a0e12015-10-12 11:55:45 -0700368 return stable_version
Scott Zawalski89c44dd2013-02-26 09:28:02 -0500369
370
Chris Sosab76e0ee2013-05-22 16:55:41 -0700371 def lookup_job_repo_url(self):
372 """Looks up the job_repo_url for the host.
373
Dan Shi8190eb82016-02-11 17:15:58 -0800374 This is kept for backwards compatibility as AU test code in older
375 branch does not use server-side packaging and calls this method through
376 the host object.
377
378 TODO(dshi): Once R50 falls off the stable branch, we should remove this
379 method.
380
Chris Sosab76e0ee2013-05-22 16:55:41 -0700381 @returns job_repo_url from AFE or None if not found.
382
383 @raises KeyError if the host does not have a job_repo_url
384 """
Dan Shibe3636a2016-02-14 22:48:01 -0800385 return afe_utils.get_host_attribute(self, ds_constants.JOB_REPO_URL)
beepscb6f1e22013-06-28 19:14:10 -0700386
387
beepsdae65fd2013-07-26 16:24:41 -0700388 def verify_job_repo_url(self, tag=''):
beepscb6f1e22013-06-28 19:14:10 -0700389 """
390 Make sure job_repo_url of this host is valid.
391
joychen03eaad92013-06-26 09:55:21 -0700392 Eg: The job_repo_url "http://lmn.cd.ab.xyx:8080/static/\
beepscb6f1e22013-06-28 19:14:10 -0700393 lumpy-release/R29-4279.0.0/autotest/packages" claims to have the
394 autotest package for lumpy-release/R29-4279.0.0. If this isn't the case,
395 download and extract it. If the devserver embedded in the url is
396 unresponsive, update the job_repo_url of the host after staging it on
397 another devserver.
398
399 @param job_repo_url: A url pointing to the devserver where the autotest
400 package for this build should be staged.
beepsdae65fd2013-07-26 16:24:41 -0700401 @param tag: The tag from the server job, in the format
402 <job_id>-<user>/<hostname>, or <hostless> for a server job.
beepscb6f1e22013-06-28 19:14:10 -0700403
404 @raises DevServerException: If we could not resolve a devserver.
405 @raises AutoservError: If we're unable to save the new job_repo_url as
406 a result of choosing a new devserver because the old one failed to
407 respond to a health check.
beeps0c865032013-07-30 11:37:06 -0700408 @raises urllib2.URLError: If the devserver embedded in job_repo_url
409 doesn't respond within the timeout.
beepscb6f1e22013-06-28 19:14:10 -0700410 """
Dan Shibe3636a2016-02-14 22:48:01 -0800411 job_repo_url = afe_utils.get_host_attribute(self,
412 ds_constants.JOB_REPO_URL)
beepscb6f1e22013-06-28 19:14:10 -0700413 if not job_repo_url:
414 logging.warning('No job repo url set on host %s', self.hostname)
415 return
416
417 logging.info('Verifying job repo url %s', job_repo_url)
418 devserver_url, image_name = tools.get_devserver_build_from_package_url(
419 job_repo_url)
420
beeps0c865032013-07-30 11:37:06 -0700421 ds = dev_server.ImageServer(devserver_url)
beepscb6f1e22013-06-28 19:14:10 -0700422
423 logging.info('Staging autotest artifacts for %s on devserver %s',
424 image_name, ds.url())
beeps687243d2013-07-18 15:29:27 -0700425
426 start_time = time.time()
Simran Basi25e7a922014-10-31 11:56:10 -0700427 ds.stage_artifacts(image_name, ['autotest_packages'])
beeps687243d2013-07-18 15:29:27 -0700428 stage_time = time.time() - start_time
429
430 # Record how much of the verification time comes from a devserver
431 # restage. If we're doing things right we should not see multiple
432 # devservers for a given board/build/branch path.
433 try:
J. Richard Barnette3cbd76b2013-11-27 12:11:25 -0800434 board, build_type, branch = server_utils.ParseBuildName(
beeps687243d2013-07-18 15:29:27 -0700435 image_name)[:3]
J. Richard Barnette3cbd76b2013-11-27 12:11:25 -0800436 except server_utils.ParseBuildNameException:
beeps687243d2013-07-18 15:29:27 -0700437 pass
438 else:
beeps0c865032013-07-30 11:37:06 -0700439 devserver = devserver_url[
Chris Sosa65425082013-10-16 13:26:22 -0700440 devserver_url.find('/') + 2:devserver_url.rfind(':')]
beeps687243d2013-07-18 15:29:27 -0700441 stats_key = {
442 'board': board,
443 'build_type': build_type,
444 'branch': branch,
beeps0c865032013-07-30 11:37:06 -0700445 'devserver': devserver.replace('.', '_'),
beeps687243d2013-07-18 15:29:27 -0700446 }
Gabe Black1e1c41b2015-02-04 23:55:15 -0800447 autotest_stats.Gauge('verify_job_repo_url').send(
beeps687243d2013-07-18 15:29:27 -0700448 '%(board)s.%(build_type)s.%(branch)s.%(devserver)s' % stats_key,
449 stage_time)
beepscb6f1e22013-06-28 19:14:10 -0700450
Scott Zawalskieadbf702013-03-14 09:23:06 -0400451
Dan Shicf4d2032015-03-12 15:04:21 -0700452 def stage_server_side_package(self, image=None):
453 """Stage autotest server-side package on devserver.
454
455 @param image: Full path of an OS image to install or a build name.
456
457 @return: A url to the autotest server-side package.
458 """
459 if image:
460 image_name = tools.get_build_from_image(image)
461 if not image_name:
462 raise error.AutoservError(
463 'Failed to parse build name from %s' % image)
464 ds = dev_server.ImageServer.resolve(image_name)
465 else:
Dan Shibe3636a2016-02-14 22:48:01 -0800466 job_repo_url = afe_utils.get_host_attribute(
467 self, ds_constants.JOB_REPO_URL)
Dan Shicf4d2032015-03-12 15:04:21 -0700468 if job_repo_url:
469 devserver_url, image_name = (
470 tools.get_devserver_build_from_package_url(job_repo_url))
471 ds = dev_server.ImageServer(devserver_url)
472 else:
473 labels = self._AFE.get_labels(
474 name__startswith=ds_constants.VERSION_PREFIX,
475 host__hostname=self.hostname)
476 if not labels:
477 raise error.AutoservError(
478 'Failed to stage server-side package. The host has '
479 'no job_report_url attribute or version label.')
480 image_name = labels[0].name[len(ds_constants.VERSION_PREFIX):]
481 ds = dev_server.ImageServer.resolve(image_name)
Dan Shica503482015-03-30 17:23:25 -0700482
483 # Get the OS version of the build, for any build older than
484 # MIN_VERSION_SUPPORT_SSP, server side packaging is not supported.
485 match = re.match('.*/R\d+-(\d+)\.', image_name)
486 if match and int(match.group(1)) < self.MIN_VERSION_SUPPORT_SSP:
487 logging.warn('Build %s is older than %s. Server side packaging is '
488 'disabled.', image_name, self.MIN_VERSION_SUPPORT_SSP)
489 return None
490
Dan Shicf4d2032015-03-12 15:04:21 -0700491 ds.stage_artifacts(image_name, ['autotest_server_package'])
492 return '%s/static/%s/%s' % (ds.url(), image_name,
493 'autotest_server_package.tar.bz2')
494
495
Dan Shi0f466e82013-02-22 15:44:58 -0800496 def _try_stateful_update(self, update_url, force_update, updater):
497 """Try to use stateful update to initialize DUT.
498
499 When DUT is already running the same version that machine_install
500 tries to install, stateful update is a much faster way to clean up
501 the DUT for testing, compared to a full reimage. It is implemeted
502 by calling autoupdater.run_update, but skipping updating root, as
503 updating the kernel is time consuming and not necessary.
504
505 @param update_url: url of the image.
506 @param force_update: Set to True to update the image even if the DUT
507 is running the same version.
508 @param updater: ChromiumOSUpdater instance used to update the DUT.
509 @returns: True if the DUT was updated with stateful update.
510
511 """
Dan Shi10b98482016-02-02 14:38:50 -0800512 # Stop service ap-update-manager to prevent rebooting during autoupdate.
513 # The service is used in jetstream boards, but not other CrOS devices.
514 self.run('sudo stop ap-update-manager', ignore_status=True)
515
J. Richard Barnette3f731032014-04-07 17:42:59 -0700516 # TODO(jrbarnette): Yes, I hate this re.match() test case.
517 # It's better than the alternative: see crbug.com/360944.
518 image_name = autoupdater.url_to_image_name(update_url)
519 release_pattern = r'^.*-release/R[0-9]+-[0-9]+\.[0-9]+\.0$'
520 if not re.match(release_pattern, image_name):
521 return False
Dan Shi0f466e82013-02-22 15:44:58 -0800522 if not updater.check_version():
523 return False
524 if not force_update:
525 logging.info('Canceling stateful update because the new and '
526 'old versions are the same.')
527 return False
528 # Following folders should be rebuilt after stateful update.
529 # A test file is used to confirm each folder gets rebuilt after
530 # the stateful update.
531 folders_to_check = ['/var', '/home', '/mnt/stateful_partition']
532 test_file = '.test_file_to_be_deleted'
533 for folder in folders_to_check:
534 touch_path = os.path.join(folder, test_file)
535 self.run('touch %s' % touch_path)
536
Chris Sosae92399e2015-04-24 11:32:59 -0700537 updater.run_update(update_root=False)
Dan Shi0f466e82013-02-22 15:44:58 -0800538
539 # Reboot to complete stateful update.
Chris Sosab76e0ee2013-05-22 16:55:41 -0700540 self.reboot(timeout=self.REBOOT_TIMEOUT, wait=True)
Dan Shi0f466e82013-02-22 15:44:58 -0800541 check_file_cmd = 'test -f %s; echo $?'
542 for folder in folders_to_check:
543 test_file_path = os.path.join(folder, test_file)
544 result = self.run(check_file_cmd % test_file_path,
545 ignore_status=True)
546 if result.exit_status == 1:
547 return False
548 return True
549
550
def _post_update_processing(self, updater, expected_kernel=None):
    """Confirm that machine_install succeeded once the DUT is updated.

    Marks the DUT as a lab machine, verifies the boot expectations and
    the installed version through `updater`, then removes any autotest
    installation found on the DUT.

    @param updater: ChromiumOSUpdater instance used to update the DUT.
    @param expected_kernel: kernel expected to be active after reboot,
            or `None` to skip rollback checking.

    @raises autoupdater.ChromiumOSError if the version check reports
            that the DUT is not running the requested build.

    """
    # The lab machine file is the marker that tells this image apart
    # from other test images.  The autoreboot job depends on that file,
    # so it is started right after the file is first created.
    marker_script = ('FILE="%s" ; [ -f "$FILE" ] || '
                     '( touch "$FILE" ; start autoreboot )')
    self.run(marker_script % self._LAB_MACHINE_FILE)

    rollback_text = ('Build %s failed to boot on %s; system rolled back '
                     'to previous build'
                     % (updater.update_version, self.hostname))
    updater.verify_boot_expectations(expected_kernel,
                                     rollback_message=rollback_text)

    # Make sure the build now running is the one we asked for.
    if not updater.check_version_to_confirm_install():
        raise autoupdater.ChromiumOSError(
                'Failed to update %s to build %s; found build '
                '%s instead' % (self.hostname,
                                updater.update_version,
                                self.get_release_version()))

    logging.debug('Cleaning up old autotest directories.')
    try:
        stale_autodir = autotest.Autotest.get_installed_autodir(self)
        self.run('rm -rf ' + stale_autodir)
    except autotest.AutodirNotFoundError:
        logging.debug('No autotest installed directory found.')
584
Dan Shi0f466e82013-02-22 15:44:58 -0800585
def _stage_image_for_update(self, image_name=None):
    """Stage a build on a devserver for an auto-update.

    The download is triggered asynchronously (`synchronous=False`).

    @param image_name: a name like lumpy-release/R27-3837.0.0.  When
            empty, the name from get_repair_image_name() is used.
    @returns a tuple of (update_url, devserver), where update_url looks
            like
            http://172.22.50.205:8082/update/lumpy-release/R27-3837.0.0
            and devserver is the resolved devserver instance.
    """
    build = image_name or self.get_repair_image_name()

    logging.info('Staging build for AU: %s', build)
    image_server = dev_server.ImageServer.resolve(build, self.hostname)
    image_server.trigger_download(build, synchronous=False)
    staged_url = tools.image_url_pattern() % (image_server.url(), build)
    return (staged_url, image_server)
Scott Zawalskieadbf702013-03-14 09:23:06 -0400602
603
def stage_image_for_servo(self, image_name=None):
    """Stage a test image on a devserver for a servo install.

    @param image_name: a name like lumpy-release/R27-3837.0.0.  When
            empty, the name from get_repair_image_name() is used.
    @returns the test image URL reported by the devserver for that
            build.
    """
    build = image_name or self.get_repair_image_name()
    logging.info('Staging build for servo install: %s', build)
    image_server = dev_server.ImageServer.resolve(build, self.hostname)
    image_server.stage_artifacts(build, ['test_image'])
    return image_server.get_test_image_url(build)
617
618
def stage_factory_image_for_servo(self, image_name):
    """Stage a factory build on a devserver and return its image URL.

    @param image_name: a name like <board>/4262.204.0

    @return: An update URL, e.g.
            http://<devserver>/static/canary-channel/<board>/4262.204.0/factory_test/chromiumos_factory_image.bin
            or `None` (after logging an error) when image_name is
            empty.

    @raises: ValueError if the factory artifact name is missing from
             the config.

    """
    if not image_name:
        logging.error('Need an image_name to stage a factory image.')
        return

    # The artifact name comes from the CROS/factory_artifact config
    # entry; an empty value means there is nothing we can stage.
    artifact_name = CONFIG.get_config_value(
            'CROS', 'factory_artifact', type=str, default='')
    if not artifact_name:
        raise ValueError('Cannot retrieve the factory artifact name from '
                         'autotest config, and hence cannot stage factory '
                         'artifacts.')

    logging.info('Staging build for servo install: %s', image_name)
    image_server = dev_server.ImageServer.resolve(image_name,
                                                  self.hostname)
    image_server.stage_artifacts(image_name, [artifact_name],
                                 archive_url=None)

    url_pattern = tools.factory_image_url_pattern()
    return url_pattern % (image_server.url(), image_name)
651
652
def machine_install(self, update_url=None, force_update=False,
                    local_devserver=False, repair=False,
                    force_full_update=False):
    """Install the DUT.

    Use stateful update if the DUT is already running the same build.
    Stateful update does not update kernel and tends to run much faster
    than a full reimage. If the DUT is running a different build, or it
    failed to do a stateful update, full update, including kernel update,
    will be applied to the DUT.

    Once a host enters machine_install its host attribute job_repo_url
    (used for package install) will be removed and then updated.

    @param update_url: The url to use for the update
            pattern: http://$devserver:###/update/$build
            If update_url is None and repair is True we will install the
            stable image listed in afe_stable_versions table. If the table
            is not setup, global_config value under CROS.stable_cros_version
            will be used instead.
    @param force_update: Force an update even if the version installed
            is the same. Default:False
    @param local_devserver: Used by test_that to allow people to
            use their local devserver. Default: False
    @param repair: Forces update to repair image. Implies force_update.
    @param force_full_update: If True, do not attempt to run stateful
            update, force a full reimage. If False, try stateful update
            first when the dut is already installed with the same version.
    @raises autoupdater.ChromiumOSError
    @raises error.AutoservError if no update URL was given and no image
            was requested on the command line.

    @returns A tuple of (image_name, host_attributes).
            image_name is the name of image installed, e.g.,
            veyron_jerry-release/R50-7871.0.0
            host_attributes is a dictionary of (attribute, value), which
            can be saved to afe_host_attributes table in database. This
            method returns a dictionary with a single entry of
            `job_repo_url`: repo_url, where repo_url is a devserver url to
            autotest packages.
    """
    devserver = None
    # Build name used when a retry has to stage the image on another
    # devserver.  It must be bound on every path: in the `repair` case
    # no build was requested explicitly, and None makes
    # _stage_image_for_update() fall back to the repair image again.
    requested_build = None
    if repair:
        update_url, devserver = self._stage_image_for_update()
        force_update = True

    if not update_url:
        # This is the base case where we have no given update URL i.e.
        # dynamic suites logic etc. This is the most flexible case where
        # we can serve an update from any of our fleet of devservers.
        requested_build = self._parser.options.image
        if not requested_build:
            raise error.AutoservError(
                    'There is no update URL, nor a method to get one.')
        if not requested_build.startswith('http://'):
            logging.debug('Update will be staged for this installation')
            update_url, devserver = self._stage_image_for_update(
                    requested_build)
        else:
            update_url = requested_build

    logging.debug('Update URL is %s', update_url)

    # Report provision stats.
    server_name = dev_server.ImageServer.get_server_name(update_url)
    server_name = server_name.replace('.', '_')
    autotest_stats.Counter('cros_host_provision.' + server_name).increment()
    autotest_stats.Counter('cros_host_provision.total').increment()

    # Create a file to indicate if provision fails. The file will be removed
    # by stateful update or full install.
    self.run('touch %s' % PROVISION_FAILED)

    update_complete = False
    updater = autoupdater.ChromiumOSUpdater(
            update_url, host=self, local_devserver=local_devserver)
    if not force_full_update:
        try:
            # If the DUT is already running the same build, try stateful
            # update first as it's much quicker than a full re-image.
            update_complete = self._try_stateful_update(
                    update_url, force_update, updater)
        except Exception as e:
            # Best effort only: a failed stateful update falls through
            # to the full update below.
            logging.exception(e)

    inactive_kernel = None
    if update_complete or (not force_update and updater.check_version()):
        logging.info('Install complete without full update')
    else:
        logging.info('DUT requires full update.')
        self.reboot(timeout=self.REBOOT_TIMEOUT, wait=True)
        # Stop service ap-update-manager to prevent rebooting during
        # autoupdate. The service is used in jetstream boards, but not other
        # CrOS devices.
        self.run('sudo stop ap-update-manager', ignore_status=True)

        num_of_attempts = provision.FLAKY_DEVSERVER_ATTEMPTS

        while num_of_attempts > 0:
            num_of_attempts -= 1
            try:
                updater.run_update()
            except Exception:
                logging.warning('Autoupdate did not complete.')
                # Do additional check for the devserver health. Ideally,
                # the autoupdater.py could raise an exception when it
                # detected network flake but that would require
                # instrumenting the update engine and parsing it log.
                if (num_of_attempts <= 0 or
                        devserver is None or
                        dev_server.ImageServer.devserver_healthy(
                                devserver.url())):
                    raise

                logging.warning('Devserver looks unhealthy. Trying another')
                update_url, devserver = self._stage_image_for_update(
                        requested_build)
                logging.debug('New Update URL is %s', update_url)
                updater = autoupdater.ChromiumOSUpdater(
                        update_url, host=self,
                        local_devserver=local_devserver)
            else:
                break

        # Give it some time in case of IO issues.
        time.sleep(10)

        # Figure out active and inactive kernel.
        active_kernel, inactive_kernel = updater.get_kernel_state()

        # Ensure inactive kernel has higher priority than active.
        if (updater.get_kernel_priority(inactive_kernel)
                < updater.get_kernel_priority(active_kernel)):
            raise autoupdater.ChromiumOSError(
                    'Update failed. The priority of the inactive kernel'
                    ' partition is less than that of the active kernel'
                    ' partition.')

        # Updater has returned successfully; reboot the host.
        self.reboot(timeout=self.REBOOT_TIMEOUT, wait=True)

    self._post_update_processing(updater, inactive_kernel)
    image_name = autoupdater.url_to_image_name(update_url)
    # update_url is different from devserver url needed to stage autotest
    # packages, therefore, resolve a new devserver url here.
    devserver_url = dev_server.ImageServer.resolve(image_name,
                                                   self.hostname).url()
    repo_url = tools.get_package_url(devserver_url, image_name)
    self.verify_software()
    return image_name, {ds_constants.JOB_REPO_URL: repo_url}
J. Richard Barnette45e93de2012-04-11 17:24:15 -0700802
803
def _clear_fw_version_labels(self, rw_only):
    """Detach firmware version labels from this host in the AFE.

    @param rw_only: True to only clear fwrw_version; otherwise, clear
            both fwro_version and fwrw_version.
    """
    stale_labels = self._AFE.get_labels(
            name__startswith=provision.FW_RW_VERSION_PREFIX,
            host__hostname=self.hostname)
    if not rw_only:
        ro_labels = self._AFE.get_labels(
                name__startswith=provision.FW_RO_VERSION_PREFIX,
                host__hostname=self.hostname)
        stale_labels = stale_labels + ro_labels
    for stale in stale_labels:
        stale.remove_hosts(hosts=[self.hostname])
819
820
def _add_fw_version_label(self, build, rw_only):
    """Attach firmware version label(s) for `build` to this host.

    @param build: Build of firmware.
    @param rw_only: True to only add fwrw_version; otherwise, add both
            fwro_version and fwrw_version.

    """
    rw_label = provision.fwrw_version_to_label(build)
    self._AFE.run('label_add_hosts', id=rw_label, hosts=[self.hostname])
    if rw_only:
        return
    ro_label = provision.fwro_version_to_label(build)
    self._AFE.run('label_add_hosts', id=ro_label, hosts=[self.hostname])
Dan Shi9cb0eec2014-06-03 09:04:50 -0700834
835
def firmware_install(self, build=None, rw_only=False):
    """Install firmware to the DUT through servo.

    Stages the firmware artifact of `build` on a devserver, downloads
    the firmware tarball into a temporary directory, programs the EC
    (only when get_ec() reports one) and the BIOS through servo, then
    resets the DUT and waits for servo's boot delay.

    Once a host enters firmware_install its fw[ro|rw]_version label will
    be removed. After the firmware is updated successfully, a new
    fw[ro|rw]_version label will be added to the host.

    @param build: The build version to which we want to provision the
                  firmware of the machine,
                  e.g. 'link-firmware/R22-2695.1.144'.
                  When empty, the firmware build from
                  get_repair_image_name(image_type='firmware') is used.
    @param rw_only: True to only install firmware to its RW portions. Keep
                    the RO portions unchanged.

    @raises error.TestError if the host has no servo, or if no build
            was given and no stable firmware build could be found.

    TODO(dshi): After bug 381718 is fixed, update here with corresponding
                exceptions that could be raised.

    """
    if not self.servo:
        raise error.TestError('Host %s does not have servo.' %
                              self.hostname)

    # TODO(fdeng): use host.get_board() after
    # crbug.com/271834 is fixed.
    board = self._get_board_from_afe()

    # If build is not set, try to install firmware from stable CrOS.
    if not build:
        build = self.get_repair_image_name(image_type='firmware')
        if not build:
            # Format the hostname into the message; passing it as a
            # second argument would leave the '%s' unexpanded.
            raise error.TestError(
                    'Failed to find stable firmware build for %s.' %
                    self.hostname)
        logging.info('Will install firmware from build %s.', build)

    config = FAFTConfig(board)
    if config.use_u_boot:
        ap_image = 'image-%s.bin' % board
    else: # Depthcharge platform
        ap_image = 'image.bin'
    ec_image = 'ec.bin'
    ds = dev_server.ImageServer.resolve(build, self.hostname)
    ds.stage_artifacts(build, ['firmware'])

    tmpd = autotemp.tempdir(unique_id='fwimage')
    try:
        fwurl = self._FW_IMAGE_URL_PATTERN % (ds.url(), build)
        local_tarball = os.path.join(tmpd.name, os.path.basename(fwurl))
        server_utils.system('wget -O %s %s' % (local_tarball, fwurl),
                            timeout=60)

        # Labels are cleared before flashing so that a failed flash does
        # not leave a stale firmware version label on the host.
        self._clear_fw_version_labels(rw_only)
        if self.get_ec():
            logging.info('Will re-program EC %snow',
                         'RW ' if rw_only else '')
            server_utils.system('tar xf %s -C %s %s' %
                                (local_tarball, tmpd.name, ec_image),
                                timeout=60)
            self.servo.program_ec(os.path.join(tmpd.name, ec_image),
                                  rw_only)
        else:
            logging.info('Not a Chrome EC, ignore re-programing it')
        logging.info('Will re-program BIOS %snow', 'RW ' if rw_only else '')
        server_utils.system('tar xf %s -C %s %s' %
                            (local_tarball, tmpd.name, ap_image),
                            timeout=60)
        self.servo.program_bios(os.path.join(tmpd.name, ap_image), rw_only)
        self.servo.get_power_state_controller().reset()
        time.sleep(self.servo.BOOT_DELAY)
        self._add_fw_version_label(build, rw_only)
    finally:
        # Always remove the temporary directory holding the tarball.
        tmpd.clean()
911
912
def show_update_engine_log(self):
    """Dump the update engine log by running `cat` on it on the host."""
    log_path = client_constants.UPDATE_ENGINE_LOG
    logging.debug('Dumping %s', log_path)
    self.run('cat %s' % log_path)
Dan Shi10e992b2013-08-30 11:02:59 -0700917
918
def _get_board_from_afe(self):
    """Look up this host's board from its AFE labels.

    Delegates to server_utils.get_board_from_afe().  Per the original
    documentation, the lookup searches for a host label of the form
    "board:<board>" and yields the "<board>" part, or `None` when there
    is not a single, unique matching label.

    @returns board from label, or `None`.
    """
    board = server_utils.get_board_from_afe(self.hostname, self._AFE)
    return board
Simran Basi833814b2013-01-29 13:13:43 -0800929
930
def get_build(self):
    """Return the current build of this Host as recorded in the AFE.

    Thin wrapper around afe_utils.get_build, which supersedes this
    method.  The wrapper remains so that test control files in older
    CrOS builds (R48, R49 etc.) that still call host.get_build, e.g.
    `provision_AutoUpdate.double`, keep working.
    TODO(sbasi): Once R50 falls into release branch, this method can be
    removed.

    @returns The current build or None if it could not find it or if there
             were multiple build labels assigned to this host.
    """
    current_build = afe_utils.get_build(self)
    return current_build
946
947
def _install_repair(self):
    """Try to repair this host by reinstalling through update-engine.

    When the host is up, install the stable "repair" version of
    Chrome OS as defined in afe_stable_versions table.  If the table is
    not setup, global_config value under CROS.stable_cros_version will
    be used instead.

    @raises AutoservRepairMethodNA if the DUT is not reachable.
    @raises ChromiumOSError if the install failed for some reason.

    """
    host_reachable = self.is_up()
    if not host_reachable:
        raise error.AutoservRepairMethodNA('DUT unreachable for install.')

    logging.info('Attempting to reimage machine to repair image.')
    try:
        afe_utils.machine_install_and_update_labels(self, repair=True)
    except autoupdater.ChromiumOSError as install_error:
        # Record the failure, then let the caller see the same error.
        logging.exception(install_error)
        logging.info('Repair via install failed.')
        raise
Scott Zawalski89c44dd2013-02-26 09:28:02 -0500969
970
Dan Shi2c88eed2013-11-12 10:18:38 -0800971 def _install_repair_with_powerwash(self):
Dan Shi9cc48452013-11-12 12:39:26 -0800972 """Attempt to powerwash first then repair this host using update-engine.
Dan Shi2c88eed2013-11-12 10:18:38 -0800973
Dan Shi9cc48452013-11-12 12:39:26 -0800974 update-engine may fail due to a bad image. In such case, powerwash
975 may help to cleanup the DUT for update-engine to work again.
Dan Shi2c88eed2013-11-12 10:18:38 -0800976
977 @raises AutoservRepairMethodNA if the DUT is not reachable.
978 @raises ChromiumOSError if the install failed for some reason.
979
980 """
981 if not self.is_up():
982 raise error.AutoservRepairMethodNA('DUT unreachable for install.')
983
984 logging.info('Attempting to powerwash the DUT.')
985 self.run('echo "fast safe" > '
986 '/mnt/stateful_partition/factory_install_reset')
987 self.reboot(timeout=self.POWERWASH_BOOT_TIMEOUT, wait=True)
988 if not self.is_up():
Dan Shi9cc48452013-11-12 12:39:26 -0800989 logging.error('Powerwash failed. DUT did not come back after '
Dan Shi2c88eed2013-11-12 10:18:38 -0800990 'reboot.')
991 raise error.AutoservRepairFailure(
992 'DUT failed to boot from powerwash after %d seconds' %
993 self.POWERWASH_BOOT_TIMEOUT)
994
995 logging.info('Powerwash succeeded.')
996 self._install_repair()
997
998
def servo_install(self, image_url=None, usb_boot_timeout=USB_BOOT_TIMEOUT,
                  install_timeout=INSTALL_TIMEOUT):
    """
    Re-install the OS on the DUT through servo.

    The steps are:
    1) install a test image on a USB storage device attached to the
       Servo board,
    2) boot that image in recovery mode,
    3) reset the TPM status (failures of the reset command are only
       logged), and then
    4) install the image with chromeos-install and power cycle the DUT.

    @param image_url: If specified use as the url to install on the DUT.
            otherwise boot the currently staged image on the USB stick.
    @param usb_boot_timeout: The usb_boot_timeout to use during reimage.
            Factory images need a longer usb_boot_timeout than regular
            cros images.
    @param install_timeout: The timeout to use when installing the chromeos
            image. Factory images need a longer install_timeout.

    @raises AutoservRepairFailure if the DUT fails to boot from USB.
    @raises AutoservError if the installed image fails to boot.

    """
    usb_stat_name = ('servo_install.usb_boot_timeout_%s'
                     % usb_boot_timeout)
    logging.info('Downloading image to USB, then booting from it. Usb boot '
                 'timeout = %s', usb_boot_timeout)
    usb_timer = autotest_stats.Timer(usb_stat_name)
    usb_timer.start()
    self.servo.install_recovery_image(image_url)
    booted_from_usb = self.wait_up(timeout=usb_boot_timeout)
    if not booted_from_usb:
        raise error.AutoservRepairFailure(
                'DUT failed to boot from USB after %d seconds' %
                usb_boot_timeout)
    usb_timer.stop()

    # The new chromeos-tpm-recovery has been merged since R44-7073.0.0.
    # In old CrOS images, this command fails. Skip the error.
    logging.info('Resetting the TPM status')
    try:
        self.run('chromeos-tpm-recovery')
    except error.AutoservRunError:
        logging.warn('chromeos-tpm-recovery is too old.')

    install_stat_name = ('servo_install.install_timeout_%s'
                         % install_timeout)
    install_timer = autotest_stats.Timer(install_stat_name)
    install_timer.start()
    logging.info('Installing image through chromeos-install.')
    self.run('chromeos-install --yes', timeout=install_timeout)
    self.halt()
    install_timer.stop()

    logging.info('Power cycling DUT through servo.')
    self.servo.get_power_state_controller().power_off()
    self.servo.switch_usbkey('off')
    # N.B. The Servo API requires that we use power_on() here
    # for two reasons:
    #  1) After turning on a DUT in recovery mode, you must turn
    #     it off and then on with power_on() once more to
    #     disable recovery mode (this is a Parrot specific
    #     requirement).
    #  2) After power_off(), the only way to turn on is with
    #     power_on() (this is a Storm specific requirement).
    self.servo.get_power_state_controller().power_on()

    logging.info('Waiting for DUT to come back up.')
    rebooted = self.wait_up(timeout=self.BOOT_TIMEOUT)
    if not rebooted:
        raise error.AutoservError('DUT failed to reboot installed '
                                  'test image after %d seconds' %
                                  self.BOOT_TIMEOUT)
1068
1069
Dan Shic1b8bdd2015-09-14 23:11:24 -07001070 def _setup_servo(self):
1071 """Try to force to create servo object if it's not set up yet.
1072 """
1073 if self.servo:
1074 return
1075
1076 try:
1077 # Setting servo_args to {} will force it to create the servo_host
1078 # object if possible.
1079 self._servo_host = servo_host.create_servo_host(
1080 dut=self.hostname, servo_args={})
1081 if self._servo_host:
1082 self.servo = self._servo_host.get_servo()
1083 else:
1084 logging.error('Failed to create servo_host object.')
1085 except Exception as e:
1086 logging.error('Failed to create servo object: %s', e)
1087
1088
J. Richard Barnettee4af8b92013-05-01 13:16:12 -07001089 def _servo_repair_reinstall(self):
Scott Zawalski62bacae2013-03-05 10:40:32 -05001090 """Reinstall the DUT utilizing servo and a test image.
1091
1092 Re-install the OS on the DUT by:
1093 1) installing a test image on a USB storage device attached to the Servo
1094 board,
Tom Wai-Hong Tam27af7332015-07-25 06:09:39 +08001095 2) booting that image in recovery mode,
1096 3) resetting the TPM status, and then
1097 4) installing the image with chromeos-install.
Scott Zawalski62bacae2013-03-05 10:40:32 -05001098
Scott Zawalski62bacae2013-03-05 10:40:32 -05001099 @raises AutoservRepairMethodNA if the device does not have servo
1100 support.
1101
1102 """
1103 if not self.servo:
1104 raise error.AutoservRepairMethodNA('Repair Reinstall NA: '
1105 'DUT has no servo support.')
1106
1107 logging.info('Attempting to recovery servo enabled device with '
1108 'servo_repair_reinstall')
1109
J. Richard Barnettee4af8b92013-05-01 13:16:12 -07001110 image_url = self.stage_image_for_servo()
Scott Zawalski62bacae2013-03-05 10:40:32 -05001111 self.servo_install(image_url)
1112
1113
def _is_firmware_repair_supported(self):
    """Check if the firmware repair is supported.

    The firmware repair is only applicable to DUTs in pools listed in
    global config CROS/pools_support_firmware_repair, a comma-separated
    list of pool names.

    @return: True if the host is in at least one of the listed pools;
             otherwise False.
    """
    logging.info('Checking if host %s can be repaired with firmware '
                 'repair.', self.hostname)
    pools = server_utils.get_labels_from_afe(self.hostname, 'pool:',
                                             self._AFE)
    configured = CONFIG.get_config_value(
            'CROS', 'pools_support_firmware_repair', type=str)
    # Strip whitespace and drop empty entries so that values such as
    # "pool_a, pool_b" or a trailing comma still match pool names.
    supported_pools = set(name.strip() for name in configured.split(',')
                          if name.strip())

    if not pools or not supported_pools:
        return False
    # Return a real boolean, as documented, rather than the set itself.
    return bool(supported_pools.intersection(pools))
1131
1132
def _firmware_repair(self):
    """Repair the DUT by reinstalling its firmware through servo.

    Installs the stable firmware (firmware_install() with no explicit
    build), then verifies the DUT.  If verification fails, falls back
    to reinstalling the CrOS image using servo.

    @raises AutoservRepairMethodNA if the host is not in a pool that
            supports firmware repair, or has no servo support.
    """
    supported = self._is_firmware_repair_supported()
    if not supported:
        logging.info('Host is not in pools that support firmware repair.')
        raise error.AutoservRepairMethodNA(
                'Firmware repair is not applicable to host %s.' %
                self.hostname)

    # To repair a DUT connected to a moblab, try to create a servo object if
    # it was failed to be created earlier as there may be a servo_host host
    # attribute for this host.
    if utils.is_moblab():
        self._setup_servo()

    if not self.servo:
        raise error.AutoservRepairMethodNA('Repair Reinstall NA: '
                                           'DUT has no servo support.')

    logging.info('Attempting to recovery servo enabled device with '
                 'firmware_repair.')
    self.firmware_install()

    logging.info('Firmware repaired. Check if the DUT can boot. If not, '
                 'reinstall the CrOS using servo.')
    try:
        self.verify()
    except Exception as verify_error:
        logging.warn('Failed to verify DUT, error: %s. Will try to repair '
                     'the DUT with servo_repair_reinstall.', verify_error)
        self._servo_repair_reinstall()
1169
1170
Scott Zawalski62bacae2013-03-05 10:40:32 -05001171 def _servo_repair_power(self):
1172 """Attempt to repair DUT using an attached Servo.
1173
J. Richard Barnette13165972016-01-13 10:53:09 -08001174 Attempt to power cycle the DUT via cold_reset.
Scott Zawalski62bacae2013-03-05 10:40:32 -05001175
1176 @raises AutoservRepairMethodNA if the device does not have servo
1177 support.
1178 @raises AutoservRepairFailure if the repair fails for any reason.
1179 """
1180 if not self.servo:
1181 raise error.AutoservRepairMethodNA('Repair Power NA: '
1182 'DUT has no servo support.')
1183
1184 logging.info('Attempting to recover servo enabled device by '
J. Richard Barnette13165972016-01-13 10:53:09 -08001185 'powering cycling with cold reset.')
1186 self.servo.get_power_state_controller().reset()
Scott Zawalski62bacae2013-03-05 10:40:32 -05001187 if self.wait_up(self.BOOT_TIMEOUT):
1188 return
1189
1190 raise error.AutoservRepairFailure('DUT did not boot after long_press.')
Richard Barnette03a0c132012-11-05 12:40:35 -08001191
1192
Richard Barnette82c35912012-11-20 10:09:10 -08001193 def _powercycle_to_repair(self):
1194 """Utilize the RPM Infrastructure to bring the host back up.
1195
1196 If the host is not up/repaired after the first powercycle we utilize
1197 auto fallback to the last good install by powercycling and rebooting the
1198 host 6 times.
Scott Zawalski62bacae2013-03-05 10:40:32 -05001199
1200 @raises AutoservRepairMethodNA if the device does not support remote
1201 power.
1202 @raises AutoservRepairFailure if the repair fails for any reason.
1203
Richard Barnette82c35912012-11-20 10:09:10 -08001204 """
Scott Zawalski62bacae2013-03-05 10:40:32 -05001205 if not self.has_power():
1206 raise error.AutoservRepairMethodNA('Device does not support power.')
1207
Richard Barnette82c35912012-11-20 10:09:10 -08001208 logging.info('Attempting repair via RPM powercycle.')
1209 failed_cycles = 0
1210 self.power_cycle()
1211 while not self.wait_up(timeout=self.BOOT_TIMEOUT):
1212 failed_cycles += 1
1213 if failed_cycles >= self._MAX_POWER_CYCLE_ATTEMPTS:
Scott Zawalski62bacae2013-03-05 10:40:32 -05001214 raise error.AutoservRepairFailure(
1215 'Powercycled host %s %d times; device did not come back'
1216 ' online.' % (self.hostname, failed_cycles))
Richard Barnette82c35912012-11-20 10:09:10 -08001217 self.power_cycle()
1218 if failed_cycles == 0:
1219 logging.info('Powercycling was successful first time.')
1220 else:
1221 logging.info('Powercycling was successful after %d failures.',
1222 failed_cycles)
1223
1224
MK Ryu35d661e2014-09-25 17:44:10 -07001225 def _reboot_repair(self):
1226 """SSH to this host and reboot."""
1227 if not self.is_up(self._CHECK_HOST_UP_TIMEOUT_SECS):
1228 raise error.AutoservRepairMethodNA('DUT unreachable for reboot.')
1229 logging.info('Attempting repair via SSH reboot.')
1230 self.reboot(timeout=self.BOOT_TIMEOUT, wait=True)
1231
1232
def check_device(self):
    """Ping the device over ssh, then clean it up and verify it.

    The three steps run in order; the first one that raises stops the
    sequence.

    @raise AutoservSSHTimeout: If the ssh ping times out.
    @raise AutoservSshPermissionDeniedError: If ssh ping fails due to
                                             permissions.
    @raise AutoservSshPingHostError: For other AutoservRunErrors during
                                     ssh_ping.
    @raises AutoservError: As appropriate, during cleanup and verify.
    """
    for step in (self.ssh_ping, self.cleanup, self.verify):
        step()
1246
1247
def confirm_servo(self):
    """Make sure a servo object exists, rebuilding it when needed.

    Nothing is done when a servo object is already present and its
    servo host is flagged `required_by_test`.  Otherwise the servo
    object and servo host are discarded and `_setup_servo()` is called
    to create them again.

    @raise AutoservError: If no servo object exists after the rebuild.
    """
    already_confirmed = (bool(self.servo) and
                         self._servo_host.required_by_test)
    if not already_confirmed:
        # Force to re-create the servo object to make sure servo is
        # verified.
        logging.debug('Rebuilding the servo object.')
        self.servo = None
        self._servo_host = None
        self._setup_servo()
        if not self.servo:
            raise error.AutoservError('Failed to create servo object.')
1263
1264
def _is_last_provision_failed(self):
    """Check whether the last provision job left its failure marker.

    @return: True if the file named by PROVISION_FAILED exists on the
             DUT, which indicates the last provision job failed.
             False if the file does not exist or the DUT can't be
             reached.
    """
    try:
        probe = self.run('test -f %s' % PROVISION_FAILED,
                         ignore_status=True, timeout=5)
    except (error.AutoservRunError, error.AutoservSSHTimeout):
        # Default to False, so that repair tries every repair method
        # when the DUT can't be reached.
        return False
    else:
        return probe.exit_status == 0
1280
1281
def repair(self):
    """Attempt to get the DUT to pass `self.check_device()`.

    This overrides the base class function for repair; it does
    not call back to the parent class, but instead offers a
    simplified implementation based on the capabilities in the
    Chrome OS test lab.

    Before repairing the DUT, the servo is prepared: on a moblab
    `self._setup_servo()` is called, and if there is a servo host but
    no servo object, the servo host is repaired and the servo object is
    fetched from it.  A failure of the servo host repair is logged and
    does not stop the DUT repair.

    Repair procedures are then tried in order, each followed by
    `self.check_device()`.  Repair ends at the first procedure for
    which both the procedure and the check succeed.  The normal
    escalation order is:
      1. `_reboot_repair`: SSH to the DUT and reboot.
      2. `_servo_repair_power`: power cycle the DUT through servo.
      3. `_firmware_repair`
      4. `_powercycle_to_repair`: power cycle the DUT through RPM.
      5. `_install_repair`
      6. `_install_repair_with_powerwash`
      7. `_servo_repair_reinstall`

    If `_is_last_provision_failed()` reports a failed provision, only
    `_firmware_repair`, `_install_repair_with_powerwash` and
    `_servo_repair_reinstall` are tried, in that order.

    Each attempt is counted in `autotest_stats` as SUCCEEDED, RepairNA
    or FAILED, both overall and per board when the board is known.

    @raises AutoservRepairTotalFailure if the repair process fails to
            fix the DUT.

    """
    # Caution: Deleting shards relies on repair to always reboot the DUT.

    # To repair a DUT connected to a moblab, try to create a servo object if
    # it was failed to be created earlier as there may be a servo_host host
    # attribute for this host.
    if utils.is_moblab():
        self._setup_servo()

    if self._servo_host and not self.servo:
        try:
            self._servo_host.repair()
        except Exception as e:
            # Best effort only: the DUT repair goes ahead regardless.
            logging.error('Could not create a healthy servo: %s', e)
        self.servo = self._servo_host.get_servo()

    # TODO(scottz): This should use something similar to label_decorator,
    # but needs to be populated in order so DUTs are repaired with the
    # least amount of effort.
    force_powerwash = self._is_last_provision_failed()
    if force_powerwash:
        logging.info('Last provision failed, try powerwash first.')
        autotest_stats.Counter(
                'repair_force_powerwash.TOTAL').increment()
        repair_funcs = [self._firmware_repair,
                        self._install_repair_with_powerwash,
                        self._servo_repair_reinstall]
    else:
        repair_funcs = [self._reboot_repair,
                        self._servo_repair_power,
                        self._firmware_repair,
                        self._powercycle_to_repair,
                        self._install_repair,
                        self._install_repair_with_powerwash,
                        self._servo_repair_reinstall]
    errors = []
    board = self._get_board_from_afe()

    def count_outcome(func, outcome):
        """Count one repair outcome, overall and for this board."""
        autotest_stats.Counter(
                '%s.%s' % (func.__name__, outcome)).increment()
        if board:
            autotest_stats.Counter(
                    '%s.%s.%s' % (func.__name__, board,
                                  outcome)).increment()

    for repair_func in repair_funcs:
        try:
            repair_func()
            self.check_device()
            count_outcome(repair_func, 'SUCCEEDED')
            if force_powerwash:
                autotest_stats.Counter(
                        'repair_force_powerwash.SUCCEEDED').increment()
            return
        except error.AutoservRepairMethodNA as e:
            count_outcome(repair_func, 'RepairNA')
            logging.warning('Repair function NA: %s', e)
            errors.append(str(e))
        except Exception as e:
            count_outcome(repair_func, 'FAILED')
            logging.warning('Failed to repair device: %s', e)
            errors.append(str(e))

    # Every procedure was either not applicable or failed.
    if force_powerwash:
        autotest_stats.Counter(
                'repair_force_powerwash.FAILED').increment()
    autotest_stats.Counter('Full_Repair_Failed').increment()
    if board:
        autotest_stats.Counter(
                'Full_Repair_Failed.%s' % board).increment()
    raise error.AutoservRepairTotalFailure(
            'All attempts at repairing the device failed:\n%s' %
            '\n'.join(errors))
Richard Barnette82c35912012-11-20 10:09:10 -08001400
1401
def close(self):
    """Close the host by delegating to the parent class `close()`."""
    super(CrosHost, self).close()
J. Richard Barnette1d78b012012-05-15 13:56:30 -07001404
1405
def get_power_supply_info(self):
    """Get the output of power_supply_info.

    power_supply_info outputs the info of each power supply, e.g.,
    Device: Line Power
      online:                  no
      type:                    Mains
      voltage (V):             0
      current (A):             0
    Device: Battery
      state:                   Discharging
      percentage:              95.9276
      technology:              Li-ion

    Above output shows two devices, Line Power and Battery, with details of
    each device listed. This function parses the output into a dictionary,
    with key being the device name, and value being a dictionary of details
    of the device info.

    Lines without a colon are ignored.  Each remaining line is split at
    its first colon only, so a value that itself contains a colon is
    kept intact.

    @return: The dictionary of power_supply_info, e.g.,
             {'Line Power': {'online': 'yes', 'type': 'main'},
              'Battery': {'vendor': 'xyz', 'percentage': '100'}}
    @raise error.AutoservRunError if power_supply_info tool is not found in
           the DUT. Caller should handle this error to avoid false failure
           on verification.
    """
    output = self.run('power_supply_info').stdout.strip()
    info = {}
    device_name = None
    device_info = {}
    for line in output.split('\n'):
        key, separator, value = line.partition(':')
        if not separator:
            continue
        key = key.strip()
        value = value.strip()
        if key == 'Device':
            # A new device section starts; file the one just finished.
            if device_name:
                info[device_name] = device_info
            device_name = value
            device_info = {}
        else:
            device_info[key] = value
    # File the last section.  This is unconditional so that a repeated
    # device name is handled the same way at the end of the output as
    # in the middle of it (the later section wins).
    if device_name:
        info[device_name] = device_info
    return info
1450
1451
def get_battery_percentage(self):
    """Get the battery percentage.

    The value is read from the 'percentage' entry of the 'Battery'
    device reported by `get_power_supply_info()`.

    @return: The battery level as a float.  Return None if the battery
             info cannot be retrieved or is not a number.
    """
    try:
        supply_info = self.get_power_supply_info()
        logging.info(supply_info)
        percentage = float(supply_info['Battery']['percentage'])
    except (KeyError, ValueError, error.AutoservRunError):
        return None
    return percentage
1464
1465
def is_ac_connected(self):
    """Check if the dut has its power adapter connected.

    The answer comes from the 'online' entry of the 'Line Power'
    device reported by `get_power_supply_info()`.

    @return: True if 'Line Power' is reported online, False if it is
             not.  None if the power supply info cannot be retrieved
             or has no such entry.
    """
    try:
        line_power = self.get_power_supply_info()['Line Power']
        online = line_power['online']
    except (KeyError, error.AutoservRunError):
        return None
    return online == 'yes'
Dan Shi49ca0932014-11-14 11:22:27 -08001476
1477
def _cleanup_poweron(self):
    """Special cleanup method to make sure hosts always get power back.

    Nothing is done unless the AFE records the `_RPM_OUTLET_CHANGED`
    attribute for this host.  Otherwise power is turned on and the
    attribute is cleared.

    If turning power on fails, the failure is reported, and what
    happens next depends on the battery:
      - battery known to be below 50%: the RPM exception is re-raised;
      - otherwise, if AC is connected: the attribute is cleared;
      - in both non-raising cases the battery level is logged.

    @raises rpm_client.RemotePowerException if power could not be
            turned on and the battery is known to be below 50%.
    """
    afe = frontend_wrappers.RetryingAFE(timeout_min=5, delay_sec=10)
    hosts = afe.get_hosts(hostname=self.hostname)
    if not hosts or self._RPM_OUTLET_CHANGED not in hosts[0].attributes:
        return
    logging.debug('This host has recently interacted with the RPM'
                  ' Infrastructure. Ensuring power is on.')
    try:
        self.power_on()
        afe.set_host_attribute(self._RPM_OUTLET_CHANGED, None,
                               hostname=self.hostname)
    except rpm_client.RemotePowerException:
        logging.error('Failed to turn Power On for this host after '
                      'cleanup through the RPM Infrastructure.')
        autotest_es.post(
                type_str='RPM_poweron_failure',
                metadata={'hostname': self.hostname})

        battery_percentage = self.get_battery_percentage()
        # Compare against None explicitly: a reading of 0.0 is a valid
        # (and critically low) level, not an unknown one.
        if battery_percentage is not None and battery_percentage < 50:
            raise
        elif self.is_ac_connected():
            logging.info('The device has power adapter connected and '
                         'charging. No need to try to turn RPM on '
                         'again.')
            afe.set_host_attribute(self._RPM_OUTLET_CHANGED, None,
                                   hostname=self.hostname)
        logging.info('Battery level is now at %s%%. The device may '
                     'still have enough power to run test, so no '
                     'exception will be raised.', battery_percentage)
1510
Simran Basi5e6339a2013-03-21 11:34:32 -07001511
beepsc87ff602013-07-31 21:53:00 -07001512 def _is_factory_image(self):
1513 """Checks if the image on the DUT is a factory image.
1514
1515 @return: True if the image on the DUT is a factory image.
1516 False otherwise.
1517 """
1518 result = self.run('[ -f /root/.factory_test ]', ignore_status=True)
1519 return result.exit_status == 0
1520
1521
def _restart_ui(self):
    """Restart the Chrome UI.

    The Chrome session identifier is read before the ui job is
    restarted, and is handed to `cros_ui.wait_for_chrome_ready()`
    afterwards.

    @raises: FactoryImageCheckerException for factory images, since
             we cannot attempt to restart ui on them.
             error.AutoservRunError for any other type of error that
             occurs while restarting ui.
    """
    on_factory_image = self._is_factory_image()
    if on_factory_image:
        raise FactoryImageCheckerException('Cannot restart ui on factory '
                                           'images')

    # TODO(jrbarnette): The command to stop/start the ui job
    # should live inside cros_ui, too.  However that would seem
    # to imply interface changes to the existing start()/restart()
    # functions, which is a bridge too far (for now).
    session_ident = cros_ui.get_chrome_session_ident(self)
    self.run('stop ui; start ui')
    cros_ui.wait_for_chrome_ready(session_ident, self)
beepsc87ff602013-07-31 21:53:00 -07001541
1542
def get_release_version(self):
    """Get the value of attribute CHROMEOS_RELEASE_VERSION from lsb-release.

    The lsb-release file is read from the DUT with `cat`, and its
    content is parsed by `lsbrelease_utils`.

    @returns The version string in lsb-release, under attribute
             CHROMEOS_RELEASE_VERSION.
    """
    read_lsb_release = 'cat "%s"' % client_constants.LSB_RELEASE
    content = self.run(read_lsb_release).stdout.strip()
    return lsbrelease_utils.get_chromeos_release_version(
            lsb_release_content=content)
1553
1554
def verify_cros_version_label(self):
    """Make sure host's cros-version label match the actual image in dut.

    Remove any cros-version: label that doesn't match that installed in
    the dut.  When at least one label was removed, the mismatch is
    reported through `autotest_es` and an exception is raised.

    @raise error.AutoservError: If any mismatch between cros-version label
                                and the build installed in dut is found.
    """
    labels = self._AFE.get_labels(
            name__startswith=ds_constants.VERSION_PREFIX,
            host__hostname=self.hostname)
    mismatch_found = False
    if labels:
        # Get CHROMEOS_RELEASE_VERSION from lsb-release, e.g., 6908.0.0.
        # Note that it's different from cros-version label, which has
        # builder and branch info, e.g.,
        # cros-version:peppy-release/R43-6908.0.0
        release_version = self.get_release_version()
        host_list = [self.hostname]
        for label in labels:
            # Remove any cros-version label that does not match
            # release_version.
            build_version = label.name[len(ds_constants.VERSION_PREFIX):]
            if not utils.version_match(build_version, release_version):
                # logging.warning rather than the deprecated
                # logging.warn alias.
                logging.warning('cros-version label "%s" does not match '
                                'release version %s. Removing the label.',
                                label.name, release_version)
                label.remove_hosts(hosts=host_list)
                mismatch_found = True
    if mismatch_found:
        autotest_es.post(use_http=True,
                         type_str='cros_version_label_mismatch',
                         metadata={'hostname': self.hostname})
        raise error.AutoservError('The host has wrong cros-version label.')
1592
1593
def verify_firmware_status(self):
    """Verify the host's firmware is in a good state.

    Hosts for which `_is_firmware_repair_supported()` is false are
    not checked.  For the others, the VBLOCK and FW_MAIN sections of
    both firmware copies are dumped with flashrom into
    /tmp/verify_firmware, and each copy is checked with
    vbutil_firmware.  The dump directory is removed afterwards, whether
    or not the check passed.

    @raise error.AutoservError: If state is not good.
    """
    if not self._is_firmware_repair_supported():
        logging.info('Do not care about firmware status when the host '
                     'is not in pools that support firmware repair.')
        return

    # Read the AP firmware and dump the sections we are interested.
    dump_cmd = ('mkdir /tmp/verify_firmware; '
                'cd /tmp/verify_firmware; '
                'for section in VBLOCK_A VBLOCK_B FW_MAIN_A FW_MAIN_B; '
                'do flashrom -r image.bin -i $section:$section; '
                'done')
    # Verify one firmware copy; both placeholders take the copy letter.
    verify_cmd = ('vbutil_firmware --verify /tmp/verify_firmware/VBLOCK_%c'
                  ' --signpubkey /usr/share/vboot/devkeys/root_key.vbpubk'
                  ' --fv /tmp/verify_firmware/FW_MAIN_%c')
    try:
        self.run(dump_cmd)
        for copy in ('A', 'B'):
            outcome = self.run(verify_cmd % (copy, copy),
                               ignore_status=True)
            if outcome.exit_status:
                raise error.AutoservError(
                        'Firmware %c is in a bad state.' % copy)
    finally:
        # Remove the temporary files.
        self.run('rm -rf /tmp/verify_firmware')
1624
1625
def verify_filesystem_write_status(self):
    """Verify the DUT's filesystem is read/writable.

    A file is created and then deleted under /mnt/stateful_partition.
    Only an exit status of exactly 1 from that command is treated as
    a failure.

    @raise error.AutoservError: if filesystem is not writable.
    """
    # try to create & delete a file
    probe_file = "/mnt/stateful_partition/test.txt"
    write_probe = 'touch %s && rm %s' % (probe_file, probe_file)
    outcome = self.run(command=write_probe, ignore_status=True)
    if outcome.exit_status != 1:
        return

    raise error.AutoservError('DUT filesystem is read-only.')
1638
1639
def cleanup(self):
    """Clean up the DUT between jobs.

    Steps, in order:
      1. Remove the file named by
         `client_constants.CLEANUP_LOGS_PAUSED_FILE`.
      2. Restart the UI; if that fails, fall back to the parent
         class cleanup.
      3. If the host has remote power, make sure power is back on.
      4. Verify the host's cros-version label.
    """
    paused_marker = client_constants.CLEANUP_LOGS_PAUSED_FILE
    self.run('rm -f %s' % paused_marker)

    try:
        self._restart_ui()
    except (error.AutotestRunError, error.AutoservRunError,
            FactoryImageCheckerException):
        logging.warning('Unable to restart ui, rebooting device.')
        # Since restarting the UI fails fall back to normal Autotest
        # cleanup routines, i.e. reboot the machine.
        super(CrosHost, self).cleanup()

    # Check if the rpm outlet was manipulated.
    rpm_controlled = self.has_power()
    if rpm_controlled:
        self._cleanup_poweron()

    self.verify_cros_version_label()
J. Richard Barnette45e93de2012-04-11 17:24:15 -07001654
1655
def reboot(self, **dargs):
    """Reboot the site host.

    The more generic RemoteHost.reboot() performs sync and sleeps
    for 5 seconds.  This is not necessary for Chrome OS devices as
    the sync should be finished in a short time during the reboot
    command.

    Unless the caller supplies them, this fills in:
      - 'reboot_cmd': a plain `reboot`, followed by `reboot -f` after
        'reboot_timeout' seconds (default 10);
      - 'fastsync': True.
    'board' is always set to the host's board name with everything up
    to the first ':' removed.

    @param dargs Keyword arguments passed on to the parent class
                 `reboot()`.
    """
    if 'reboot_cmd' not in dargs:
        force_delay = dargs.get('reboot_timeout', 10)
        dargs['reboot_cmd'] = ('sleep 1; '
                               'reboot & sleep %d; '
                               'reboot -f' % force_delay)

    # Enable fastsync to avoid running extra sync commands before reboot.
    dargs.setdefault('fastsync', True)

    # For purposes of logging reboot times:
    # Get the board name i.e. 'daisy_spring', strip the prefix and add
    # it to dargs.
    full_board_name = self.get_board()
    dargs['board'] = full_board_name.split(':', 1)[-1]

    super(CrosHost, self).reboot(**dargs)
Yu-Ju Honga2be94a2012-07-31 09:48:52 -07001680
1681
def suspend(self, **dargs):
    """Suspend the site host.

    'timeout' is always set to 'suspend_time' (default 60).  Unless
    the caller supplies 'suspend_cmd', the command clears the rtc0
    wake alarm, arms it for 'suspend_time' seconds from now, and then
    calls powerd_dbus_suspend.

    @param dargs Keyword arguments passed on to the parent class
                 `suspend()`.
    """
    wake_after = dargs.get('suspend_time', 60)
    dargs['timeout'] = wake_after
    if 'suspend_cmd' not in dargs:
        steps = ['echo 0 > /sys/class/rtc/rtc0/wakealarm',
                 'echo +%d > /sys/class/rtc/rtc0/wakealarm' % wake_after,
                 'powerd_dbus_suspend --delay=0']
        dargs['suspend_cmd'] = ' && '.join(steps)
    super(CrosHost, self).suspend(**dargs)
1694
1695
def upstart_status(self, service_name):
    """Check the status of an upstart init script.

    @param service_name: Service to look up.

    @returns True if the service is running, False otherwise.
    """
    # grep exits non-zero when nothing matches, i.e. exactly when the
    # service is not running.  That must produce a False return, not a
    # failed command, so the exit status is ignored here.
    status_output = self.run(
            'status %s | grep start/running' % service_name,
            ignore_status=True).stdout
    return status_output.strip() != ''
1705
1706
def verify_software(self):
    """Verify working software on a Chrome OS system.

    Tests for the following conditions, in order:
      1. All conditions tested by the parent version of this
         function.
      2. Sufficient inodes and space in /mnt/stateful_partition.
      3. Sufficient space in /mnt/stateful_partition/encrypted, if
         that path exists.
      4. The 'system-services' upstart job is running.
      5. update_engine answers a simple status request (skipped on
         factory images).
      6. python on the DUT can import cPickle.
      7. The cros-version label, the firmware status and the
         filesystem write status all verify.

    """
    super(CrosHost, self).verify_software()

    stateful_path = '/mnt/stateful_partition'

    # The inode requirement may be overridden per board.
    fallback_kilo_inodes = CONFIG.get_config_value(
            'SERVER', 'kilo_inodes_required', type=int, default=100)
    board_name = self.get_board().replace(ds_constants.BOARD_PREFIX, '')
    required_kilo_inodes = CONFIG.get_config_value(
            'SERVER', 'kilo_inodes_required_%s' % board_name,
            type=int, default=fallback_kilo_inodes)
    self.check_inodes(stateful_path, required_kilo_inodes)

    required_gb = CONFIG.get_config_value(
            'SERVER', 'gb_diskspace_required', type=float,
            default=20.0)
    self.check_diskspace(stateful_path, required_gb)

    # Not all targets build with encrypted stateful support.
    encrypted_path = '/mnt/stateful_partition/encrypted'
    if self.path_exists(encrypted_path):
        required_encrypted_gb = CONFIG.get_config_value(
                'SERVER', 'gb_encrypted_diskspace_required', type=float,
                default=0.1)
        self.check_diskspace(encrypted_path, required_encrypted_gb)

    services_running = self.upstart_status('system-services')
    if not services_running:
        raise error.AutoservError('Chrome failed to reach login. '
                                  'System services not running.')

    # Factory images don't run update engine,
    # goofy controls dbus on these DUTs.
    if not self._is_factory_image():
        self.run('update_engine_client --status')

    # Makes sure python is present, loads and can use built in functions.
    # We have seen cases where importing cPickle fails with undefined
    # symbols in cPickle.so.
    self.run('python -c "import cPickle"')

    self.verify_cros_version_label()
    self.verify_firmware_status()
    self.verify_filesystem_write_status()
1758
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07001759
def verify(self):
    """Verify this host by handing it to `self._repair_strategy`."""
    strategy = self._repair_strategy
    strategy.verify(self)
1762
1763
def make_ssh_command(self, user='root', port=22, opts='', hosts_file=None,
                     connect_timeout=None, alive_interval=None):
    """Override default make_ssh_command to use options tuned for Chrome OS.

    Tuning changes:
      - ConnectTimeout=30; maximum of 30 seconds allowed for an SSH
      connection failure.  Consistency with remote_access.sh.

      - ServerAliveInterval=900; which causes SSH to ping connection every
      900 seconds. In conjunction with ServerAliveCountMax ensures
      that if the connection dies, Autotest will bail out.
      Originally tried 60 secs, but saw frequent job ABORTS where
      the test completed successfully. Later increased from 180 seconds to
      900 seconds to account for tests where the DUT is suspended for
      longer periods of time.

      - ServerAliveCountMax=3; consistency with remote_access.sh.

      - ConnectionAttempts=4; reduce flakiness in connection errors;
      consistency with remote_access.sh.

      - UserKnownHostsFile=/dev/null; we don't care about the keys.
      Host keys change with every new installation, don't waste
      memory/space saving them.

      - SSH protocol forced to 2; needed for ServerAliveInterval.

    @param user User name to use for the ssh connection.
    @param port Port on the target host to use for ssh connection.
    @param opts Additional options to the ssh command.
    @param hosts_file Ignored.
    @param connect_timeout Ignored.
    @param alive_interval Ignored.
    @return The ssh command line, as a string.
    """
    ssh_prefix = '/usr/bin/ssh -a -x %s %s %s' % (
            self._ssh_verbosity_flag, self._ssh_options, opts)
    tuned_options = (' -o StrictHostKeyChecking=no'
                     ' -o UserKnownHostsFile=/dev/null -o BatchMode=yes'
                     ' -o ConnectTimeout=30 -o ServerAliveInterval=900'
                     ' -o ServerAliveCountMax=3 -o ConnectionAttempts=4'
                     ' -o Protocol=2')
    login_args = ' -l %s -p %d' % (user, port)
    return ssh_prefix + tuned_options + login_args
def syslog(self, message, tag='autotest'):
    """Log a message to syslog on the host, using `logger`.

    NOTE(review): `tag` and `message` are placed inside double quotes
    on the command line without escaping, so a value containing a
    double quote presumably breaks the command -- confirm with callers.

    @param message String message to log into syslog
    @param tag String tag prefix for syslog

    """
    logger_cmd = 'logger -t "%s" "%s"' % (tag, message)
    self.run(logger_cmd)
1814
1815
def _ping_check_status(self, status):
    """Ping the host once, and return whether it has a given status.

    @param status Check the ping status against this value.
    @return True iff `status` and the result of ping are the same
            (i.e. both True or both False).

    """
    ping_exit = utils.ping(self.hostname, tries=1, deadline=1)
    answered = (ping_exit == 0)
    # XOR is true exactly when the two values disagree.
    return not (status ^ answered)
1826
1827 def _ping_wait_for_status(self, status, timeout):
1828 """Wait for the host to have a given status (UP or DOWN).
1829
1830 Status is checked by polling. Polling will not last longer
1831 than the number of seconds in `timeout`. The polling
1832 interval will be long enough that only approximately
1833 _PING_WAIT_COUNT polling cycles will be executed, subject
1834 to a maximum interval of about one minute.
1835
1836 @param status Waiting will stop immediately if `ping` of the
1837 host returns this status.
1838 @param timeout Poll for at most this many seconds.
1839 @return True iff the host status from `ping` matched the
1840 requested status at the time of return.
1841
1842 """
1843 # _ping_check_status() takes about 1 second, hence the
1844 # "- 1" in the formula below.
1845 poll_interval = min(int(timeout / self._PING_WAIT_COUNT), 60) - 1
1846 end_time = time.time() + timeout
1847 while time.time() <= end_time:
1848 if self._ping_check_status(status):
1849 return True
1850 if poll_interval > 0:
1851 time.sleep(poll_interval)
1852
1853 # The last thing we did was sleep(poll_interval), so it may
1854 # have been too long since the last `ping`. Check one more
1855 # time, just to be sure.
1856 return self._ping_check_status(status)
1857
def ping_wait_up(self, timeout):
    """Block until the host answers `ping`, or until `timeout` expires.

    N.B. Do not treat this as a reliable replacement for
    `wait_up()`: a host that answers ping does not necessarily
    answer ssh.  Use it only when the target DUT counts as
    functional even though it can't be reached via ssh.

    @param timeout Minimum time to allow before declaring the
                   host to be non-responsive.
    @return True iff the host answered ping before the timeout.

    """
    wanted_status = self._PING_STATUS_UP
    return self._ping_wait_for_status(wanted_status, timeout)
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07001873
def ping_wait_down(self, timeout):
    """Block until the host stops answering `ping`, or `timeout` expires.

    This can serve as a slightly faster alternative to
    `wait_down()`, because it avoids potentially long ssh timeouts.

    @param timeout Minimum time to allow for the host to become
                   non-responsive.
    @return True iff the host quit answering ping before the
            timeout.

    """
    wanted_status = self._PING_STATUS_DOWN
    return self._ping_wait_for_status(wanted_status, timeout)
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07001887
def test_wait_for_sleep(self, sleep_timeout=None):
    """Wait for the client to enter low-power sleep mode.

    "Asleep" is detected by the host no longer answering ping, which
    looks the same as a system that is powered off.  To confirm the
    unit really was asleep, force a resume and then call
    `test_wait_for_resume()`.

    A test is expected to call this as part of a sequence like:

    ~~~~~~~~
        boot_id = host.get_boot_id()
        # trigger sleep on the host
        host.test_wait_for_sleep()
        # trigger resume on the host
        host.test_wait_for_resume(boot_id)
    ~~~~~~~~

    @param sleep_timeout time limit in seconds to allow the host sleep;
                         SLEEP_TIMEOUT is used when None.

    @exception TestFail The host did not go to sleep within
                        the allowed time.
    """
    limit = self.SLEEP_TIMEOUT if sleep_timeout is None else sleep_timeout
    went_down = self.ping_wait_down(timeout=limit)
    if went_down:
        return
    raise error.TestFail(
            'client failed to sleep after %d seconds' % limit)
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07001918
1919
def test_wait_for_resume(self, old_boot_id, resume_timeout=None):
    """Wait for the client to resume from low-power sleep mode.

    Pass as `old_boot_id` the value `get_boot_id()` returned before
    the host entered sleep mode; if the boot id has changed once the
    host is back, a `TestFail` exception is raised.

    See @ref test_wait_for_sleep for more on this function's
    usage.

    @param old_boot_id A boot id value obtained before the
                       target host went to sleep.
    @param resume_timeout time limit in seconds to allow the host up;
                          RESUME_TIMEOUT is used when None.

    @exception TestFail The host did not respond within the
                        allowed time.
    @exception TestFail The host responded, but the boot id test
                        indicated a reboot rather than a sleep
                        cycle.
    """
    limit = (self.RESUME_TIMEOUT if resume_timeout is None
             else resume_timeout)

    if not self.wait_up(timeout=limit):
        raise error.TestFail(
                'client failed to resume from sleep after %d seconds' %
                limit)

    current_boot_id = self.get_boot_id()
    if current_boot_id != old_boot_id:
        logging.error('client rebooted (old boot %s, new boot %s)',
                      old_boot_id, current_boot_id)
        raise error.TestFail(
                'client rebooted, but sleep was expected')
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07001954
1955
def test_wait_for_shutdown(self, shutdown_timeout=None):
    """Wait for the client to shut down.

    "Shut down" is detected by the host no longer answering ping,
    which looks the same as a system that is merely asleep.  To
    confirm the unit really was down, force a boot and then call
    test_wait_for_boot().

    A test is expected to call this as part of a sequence like:

    ~~~~~~~~
        boot_id = host.get_boot_id()
        # trigger shutdown on the host
        host.test_wait_for_shutdown()
        # trigger boot on the host
        host.test_wait_for_boot(boot_id)
    ~~~~~~~~

    @param shutdown_timeout time limit in seconds to allow the host down;
                            SHUTDOWN_TIMEOUT is used when None.
    @exception TestFail The host did not shut down within the
                        allowed time.
    """
    limit = (self.SHUTDOWN_TIMEOUT if shutdown_timeout is None
             else shutdown_timeout)
    went_down = self.ping_wait_down(timeout=limit)
    if went_down:
        return
    raise error.TestFail(
            'client failed to shut down after %d seconds' %
            limit)
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07001985
1986
def test_wait_for_boot(self, old_boot_id=None):
    """Wait for the client to boot from cold power.

    Pass as `old_boot_id` the value `get_boot_id()` returned before
    shutting down; if the boot id is unchanged once the host is
    back, a `TestFail` exception is raised.  When `old_boot_id` is
    not given, the boot id comparison is skipped.

    See @ref test_wait_for_shutdown for more on this function's
    usage.

    @param old_boot_id A boot id value obtained before the
                       shut down.

    @exception TestFail The host did not respond within the
                        allowed time.
    @exception TestFail The host responded, but the boot id test
                        indicated that there was no reboot.
    """
    if not self.wait_up(timeout=self.REBOOT_TIMEOUT):
        raise error.TestFail(
                'client failed to reboot after %d seconds' %
                self.REBOOT_TIMEOUT)

    # No reference boot id means there is nothing to compare against.
    if not old_boot_id:
        return

    if self.get_boot_id() == old_boot_id:
        logging.error('client not rebooted (boot %s)',
                      old_boot_id)
        raise error.TestFail(
                'client is back up, but did not reboot')
Simran Basid5e5e272012-09-24 15:23:59 -07002017
2018
2019 @staticmethod
def check_for_rpm_support(hostname):
    """Check whether a hostname follows the naming format of RPM powered DUTs.

    @param hostname: hostname to check for rpm support.

    @return None if the hostname does not match
            CrosHost._RPM_HOSTNAME_REGEX; otherwise the regular
            expression MatchObject produced by the match.
    """
    rpm_hostname_pattern = CrosHost._RPM_HOSTNAME_REGEX
    return re.match(rpm_hostname_pattern, hostname)
Simran Basid5e5e272012-09-24 15:23:59 -07002030
2031
def has_power(self):
    """Report whether this host's name marks it as powered by an RPM.

    @return The (truthy) regular expression MatchObject from
            `check_for_rpm_support()` if this host's hostname follows
            the defined naming format; None otherwise.
    """
    rpm_match = CrosHost.check_for_rpm_support(self.hostname)
    return rpm_match
Simran Basid5e5e272012-09-24 15:23:59 -07002039
2040
Ismail Noorbasha07fdb612013-02-14 14:13:31 -08002041 def _set_power(self, state, power_method):
2042 """Sets the power to the host via RPM, Servo or manual.
2043
2044 @param state Specifies which power state to set to DUT
2045 @param power_method Specifies which method of power control to
2046 use. By default "RPM" will be used. Valid values
2047 are the strings "RPM", "manual", "servoj10".
2048
2049 """
2050 ACCEPTABLE_STATES = ['ON', 'OFF']
2051
2052 if state.upper() not in ACCEPTABLE_STATES:
2053 raise error.TestError('State must be one of: %s.'
2054 % (ACCEPTABLE_STATES,))
2055
2056 if power_method == self.POWER_CONTROL_SERVO:
2057 logging.info('Setting servo port J10 to %s', state)
2058 self.servo.set('prtctl3_pwren', state.lower())
2059 time.sleep(self._USB_POWER_TIMEOUT)
2060 elif power_method == self.POWER_CONTROL_MANUAL:
2061 logging.info('You have %d seconds to set the AC power to %s.',
2062 self._POWER_CYCLE_TIMEOUT, state)
2063 time.sleep(self._POWER_CYCLE_TIMEOUT)
2064 else:
2065 if not self.has_power():
2066 raise error.TestFail('DUT does not have RPM connected.')
Simran Basi5e6339a2013-03-21 11:34:32 -07002067 afe = frontend_wrappers.RetryingAFE(timeout_min=5, delay_sec=10)
2068 afe.set_host_attribute(self._RPM_OUTLET_CHANGED, True,
2069 hostname=self.hostname)
Simran Basi1df55112013-09-06 11:25:09 -07002070 rpm_client.set_power(self.hostname, state.upper(), timeout_mins=5)
Simran Basid5e5e272012-09-24 15:23:59 -07002071
2072
def power_off(self, power_method=POWER_CONTROL_RPM):
    """Switch off power to this host via RPM, Servo or manual control.

    @param power_method Which method of power control to use;
                        POWER_CONTROL_RPM when omitted.  It is
                        passed straight through to `_set_power()`.

    """
    self._set_power(state='OFF', power_method=power_method)
Simran Basid5e5e272012-09-24 15:23:59 -07002082
2083
def power_on(self, power_method=POWER_CONTROL_RPM):
    """Switch on power to this host via RPM, Servo or manual control.

    @param power_method Which method of power control to use;
                        POWER_CONTROL_RPM when omitted.  It is
                        passed straight through to `_set_power()`.

    """
    self._set_power(state='ON', power_method=power_method)
2093
2094
def power_cycle(self, power_method=POWER_CONTROL_RPM):
    """Cycle power to this host by turning it OFF, then ON.

    For the servo and manual methods the cycle is an explicit
    `power_off()`, a pause of _POWER_CYCLE_TIMEOUT seconds, and a
    `power_on()`.  Any other method sends a single 'CYCLE' request
    to the RPM.

    @param power_method Which method of power control to use;
                        POWER_CONTROL_RPM when omitted.

    """
    stepwise_methods = (self.POWER_CONTROL_SERVO,
                        self.POWER_CONTROL_MANUAL)
    if power_method not in stepwise_methods:
        # NOTE(review): unlike _set_power(), this path neither checks
        # has_power() nor sets the _RPM_OUTLET_CHANGED host attribute;
        # confirm that is intended.
        rpm_client.set_power(self.hostname, 'CYCLE')
        return

    self.power_off(power_method=power_method)
    time.sleep(self._POWER_CYCLE_TIMEOUT)
    self.power_on(power_method=power_method)
Simran Basic6f1f7a2012-10-16 10:47:46 -07002110
2111
def get_platform(self):
    """Derive the platform label for this host from its firmware id.

    @returns a string representing this host's platform.
    """
    crossystem = utils.Crossystem(self)
    crossystem.init()
    # The fwid generally looks like {platform}.{firmware version},
    # e.g. Alex.X.YYY.Z or Google_Alex.X.YYY.Z, so everything before
    # the first '.' is the platform id.
    fwid = crossystem.fwid()
    platform_id = fwid.partition('.')[0].lower()
    # Newer platforms carry a 'Google_' prefix that older ones lack.
    return platform_id.replace('google_', '')
2125
2126
def get_architecture(self):
    """Look up the architecture label for this host via crossystem.

    @returns a string representing this host's architecture.
    """
    system_info = utils.Crossystem(self)
    system_info.init()
    architecture = system_info.arch()
    return architecture
2135
2136
def get_chrome_version(self):
    """Get the Chrome version number and milestone as strings.

    Runs client_constants.CHROME_VERSION_COMMAND on the host and
    hands its output to utils.parse_chrome_version().

    @return A tuple (chrome_ver, milestone) where "chrome_ver" is the
        current Chrome version number as a string (in the form "W.X.Y.Z")
        and "milestone" is the first component of the version number
        (the "W" from "W.X.Y.Z").  If the version number cannot be parsed
        in the "W.X.Y.Z" format, the "chrome_ver" will be the full output
        of "chrome --version" and the milestone will be the empty string.

    """
    result = self.run(client_constants.CHROME_VERSION_COMMAND)
    return utils.parse_chrome_version(result.stdout)
2152
J. Richard Barnetted2af5852016-02-05 15:03:10 -08002153
Aviv Keshet74c89a92013-02-04 15:18:30 -08002154 @label_decorator()
def get_board(self):
    """Build the board label for this host from /etc/lsb-release.

    @returns a string representing this host's board: the
             CHROMEOS_RELEASE_BOARD value prefixed with
             ds_constants.BOARD_PREFIX.
    """
    lsb_release = utils.parse_cmd_output('cat /etc/lsb-release',
                                         run_method=self.run)
    prefix = ds_constants.BOARD_PREFIX
    return prefix + lsb_release['CHROMEOS_RELEASE_BOARD']
Simran Basic6f1f7a2012-10-16 10:47:46 -07002164
2165
Aviv Keshet74c89a92013-02-04 15:18:30 -08002166 @label_decorator('lightsensor')
def has_lightsensor(self):
    """Determine whether this host has a light sensor.

    Searches _LIGHTSENSOR_SEARCH_DIR on the host for any of the
    file names listed in _LIGHTSENSOR_FILES.

    @returns the string 'lightsensor' if this host has a lightsensor or
             None if it does not.
    """
    search_dir = self._LIGHTSENSOR_SEARCH_DIR
    file_alternatives = '|'.join(self._LIGHTSENSOR_FILES)
    search_cmd = "find -L %s -maxdepth 4 | egrep '%s'" % (
            search_dir, file_alternatives)
    try:
        # `find -L` follows symlinks.  stderr_tee is None because a
        # symlink loop makes find print a few messages to stderr even
        # though the command still executes correctly.
        self.run(search_cmd, stdout_tee=None, stderr_tee=None)
    except error.AutoservRunError:
        # egrep exited with a return code of 1, meaning none of the
        # possible lightsensor files existed.
        return None
    return 'lightsensor'
2185
2186
Aviv Keshet74c89a92013-02-04 15:18:30 -08002187 @label_decorator('bluetooth')
def has_bluetooth(self):
    """Determine whether this host has bluetooth.

    Checks on the host for the directory /sys/class/bluetooth/hci0.

    @returns the string 'bluetooth' if this host has bluetooth or
             None if it does not.
    """
    try:
        self.run('test -d /sys/class/bluetooth/hci0')
    except error.AutoservRunError:
        # `test` exited with a return code of 1, meaning the directory
        # did not exist.
        return None
    # `test` exited with a return code of 0.
    return 'bluetooth'
2202
2203
Bill Richardson4f595f52014-02-13 16:20:26 -08002204 @label_decorator('ec')
def get_ec(self):
    """
    Determine the type of EC on this host.

    @returns a string representing this host's embedded controller type.
    At present, it only returns "ec:cros", for Chrome OS ECs. Other types
    of EC (or none) return None, since no tests depend on those.
    """
    cmd = 'mosys ec info'
    # The last field of the output should match our EC version scheme
    # when the EC is a Chrome OS EC:
    #
    #   stm | stm32f100 | snow_v1.3.139-375eb9f
    #   ti | Unknown-10de | peppy_v1.5.114-5d52788
    #
    # Non-Chrome OS ECs will look like these:
    #
    #   ENE | KB932 | 00BE107A00
    #   ite | it8518 | 3.08
    #
    # And some systems don't have ECs at all (Lumpy, for example).
    cros_ec_pattern = r'^.*\|\s*(\S+_v\d+\.\d+\.\d+-[0-9a-f]+)\s*$'

    ecinfo = self.run(command=cmd, ignore_status=True)
    if ecinfo.exit_status != 0:
        # No EC present
        logging.info("%s exited with status %d", cmd, ecinfo.exit_status)
        return None

    found = re.search(cros_ec_pattern, ecinfo.stdout)
    if not found:
        # Has an EC, but it's not a Chrome OS EC
        logging.info("%s got: %s", cmd, ecinfo.stdout)
        return None

    logging.info("EC version is %s", found.group(1))
    return 'ec:cros'
2241
2242
Alec Berg31b932b2014-04-04 16:09:11 -07002243 @label_decorator('accels')
def get_accels(self):
    """
    Determine the type of accelerometers on this host.

    @returns a string representing this host's accelerometer type.
    At present, it only returns "accel:cros-ec", for accelerometers
    attached to a Chrome OS EC, or None, if no accelerometers.
    """
    # Without the ectool binary there is nothing to query.
    if self.run('which ectool', ignore_status=True).exit_status:
        logging.info("No ectool cmd found, assuming no EC accelerometers")
        return None

    # The EC has to support the motionsense command.
    if self.run('ectool motionsense', ignore_status=True).exit_status:
        logging.info("EC does not support motionsense command "
                     "assuming no EC accelerometers")
        return None

    # The first output line tells whether EC motion sensors are active.
    active_output = self.run('ectool motionsense active').stdout
    first_line = active_output.partition('\n')[0]
    if first_line == "0":
        logging.info("Motion sense inactive, assuming no EC accelerometers")
        return None

    logging.info("EC accelerometers found")
    return 'accel:cros-ec'
2273
2274
Tom Wai-Hong Tam3d6790d2014-04-14 16:15:47 +08002275 @label_decorator('chameleon')
def has_chameleon(self):
    """Determine if a Chameleon is connected to this host.

    @returns a list containing two strings ('chameleon' and
             'chameleon:' + label, e.g. 'chameleon:hdmi') if this host
             has a Chameleon or None if it has not.
    """
    if not self._chameleon_host:
        return None
    specific_label = 'chameleon:' + self.chameleon.get_label()
    return ['chameleon', specific_label]
2287
2288
Cheng-Yi Chiangf4104ff2014-12-23 19:39:01 +08002289 @label_decorator('audio_loopback_dongle')
def has_loopback_dongle(self):
    """Determine if an audio loopback dongle is plugged to this host.

    A dongle is considered present when the CRAS node listing shows
    both a HEADPHONE node and a MIC node as plugged.

    @returns 'audio_loopback_dongle' when there is an audio loopback dongle
                                     plugged to this host.
             None                    when there is no audio loopback dongle
                                     plugged to this host.
    """
    nodes_cmd = cras_utils.get_cras_nodes_cmd()
    nodes_info = self.run(command=nodes_cmd, ignore_status=True).stdout
    if not cras_utils.node_type_is_plugged('HEADPHONE', nodes_info):
        return None
    if not cras_utils.node_type_is_plugged('MIC', nodes_info):
        return None
    return 'audio_loopback_dongle'
2305
2306
Derek Basehorec71ff622014-07-07 15:18:40 -07002307 @label_decorator('power_supply')
def get_power_supply(self):
    """
    Determine what type of power supply the host has

    @returns a string representing this host's power supply.
             'power:battery' when the device has a battery intended for
                    extended use
             'power:AC_primary' when the device has a battery not intended
                    for extended use (for moving the machine, etc)
             'power:AC_only' when the device has no battery at all.
             None when mosys reports the type as 'unknown'.
    """
    psu = self.run(command='mosys psu type', ignore_status=True)
    if psu.exit_status:
        # Not every platform includes the psu command in mosys.  When
        # it is missing, the device is assumed to have a battery.
        return 'power:battery'

    psu_type = psu.stdout.strip()
    return None if psu_type == 'unknown' else 'power:%s' % psu_type
2331
2332
Puthikorn Voravootivatfa011242014-03-14 18:45:11 -07002333 @label_decorator('storage')
def get_storage(self):
    """
    Determine the type of boot device for this host.

    Determine if the internal device is SCSI or dw_mmc device.
    Then check that it is SSD or HDD or eMMC or something else.

    Both device-name checks use the whitespace-stripped device path,
    so stray leading whitespace in the command output no longer makes
    a /dev/sd* device fall through to None.

    @returns a string representing this host's internal device type.
             'storage:ssd' when internal device is solid state drive
             'storage:hdd' when internal device is hard disk drive
             'storage:mmc' when internal device is mmc drive
             None          When internal device is something else or
                           when we are unable to determine the type
    """
    # The output should be /dev/mmcblk* for SD/eMMC or /dev/sd* for scsi
    rootdev_cmd = ' '.join(['. /usr/sbin/write_gpt.sh;',
                            '. /usr/share/misc/chromeos-common.sh;',
                            'load_base_vars;',
                            'get_fixed_dst_drive'])
    rootdev = self.run(command=rootdev_cmd, ignore_status=True)
    if rootdev.exit_status:
        logging.info("Fail to run %s", rootdev_cmd)
        return None
    rootdev_str = rootdev.stdout.strip()

    if not rootdev_str:
        return None

    rootdev_base = os.path.basename(rootdev_str)

    mmc_pattern = '/dev/mmcblk[0-9]'
    if re.match(mmc_pattern, rootdev_str):
        # Use type to determine if the internal device is eMMC or
        # something else. We can assume that MMC is always an internal
        # device.
        type_cmd = 'cat /sys/block/%s/device/type' % rootdev_base
        device_type = self.run(command=type_cmd, ignore_status=True)
        if device_type.exit_status:
            logging.info("Fail to run %s", type_cmd)
            return None

        if device_type.stdout.strip() == 'MMC':
            return 'storage:mmc'

    scsi_pattern = '/dev/sd[a-z]+'
    if re.match(scsi_pattern, rootdev_str):
        # Read symlink for /sys/block/sd* to determine if the internal
        # device is connected via ata or usb.
        link_cmd = 'readlink /sys/block/%s' % rootdev_base
        link = self.run(command=link_cmd, ignore_status=True)
        if link.exit_status:
            logging.info("Fail to run %s", link_cmd)
            return None
        if 'usb' in link.stdout.strip():
            return None

        # Read rotation to determine if the internal device is ssd or hdd.
        rotate_cmd = 'cat /sys/block/%s/queue/rotational' % rootdev_base
        rotate = self.run(command=rotate_cmd, ignore_status=True)
        if rotate.exit_status:
            logging.info("Fail to run %s", rotate_cmd)
            return None

        rotate_dict = {'0': 'storage:ssd', '1': 'storage:hdd'}
        return rotate_dict.get(rotate.stdout.strip())

    # All other internal device / error case will always fall here
    return None
2405
2406
Dan Shi4e9a2aa2014-03-24 14:28:42 -07002407 @label_decorator('servo')
def get_servo(self):
    """Report whether the host has a servo attached.

    A host whose `_servo_host` is set gets the servo label.

    @return: string 'servo' if the host has servo attached. Otherwise,
             returns None.
    """
    if self._servo_host:
        return 'servo'
    return None
2417
2418
Dan Shi5beba472014-05-28 22:46:07 -07002419 @label_decorator('video_labels')
def get_video_labels(self):
    """Run /usr/local/bin/avtest_label_detect to get a list of video labels.

    Sample output of avtest_label_detect:
    Detected label: hw_video_acc_vp8
    Detected label: webcam

    @return: A list of labels detected by tool avtest_label_detect; an
             empty list when running the tool fails.
    """
    try:
        result = self.run('/usr/local/bin/avtest_label_detect').stdout
    except error.AutoservRunError:
        # The tool is not installed.
        return []
    # Raw string: `\w` is not a valid escape in a plain string literal
    # and newer Python versions warn about it.
    return re.findall(r'^Detected label: (\w+)$', result, re.M)
2435
2436
mussa584b4462014-06-20 15:13:28 -07002437 @label_decorator('video_glitch_detection')
def is_video_glitch_detection_supported(self):
    """Determine if the board under test is supported for video glitch
    detection tests.

    The board name is the board label with ds_constants.BOARD_PREFIX
    removed; it is looked up in video_test_constants.SUPPORTED_BOARDS.

    @return: 'video_glitch_detection' if board is supported, None otherwise.
    """
    board_label = self.get_board()
    board = board_label.replace(ds_constants.BOARD_PREFIX, '')
    supported = board in video_test_constants.SUPPORTED_BOARDS
    return 'video_glitch_detection' if supported else None
mussa584b4462014-06-20 15:13:28 -07002450
mussa584b4462014-06-20 15:13:28 -07002451
Katherine Threlkeld7b97a9f2014-06-24 13:47:14 -07002452 @label_decorator('touch_labels')
def get_touch(self):
    """
    Determine whether board under test has a touchpad or touchscreen.

    Each /dev/input/event* node is probed with `evtest`, and the
    captured output is classified by InputPlayback.  Probing stops
    once both device kinds have been found.

    @return: A list of some combination of 'touchscreen' and 'touchpad',
             depending on what is present on the device.

    """
    found = []
    wanted = ['touchpad', 'touchscreen']
    player = input_playback.InputPlayback()
    event_nodes = self.run('ls /dev/input/event*').stdout.strip().split()
    filename = '/tmp/touch_labels'
    for node in event_nodes:
        # The evtest run is capped at one second and a timeout is
        # ignored; its output is captured in a temp file on the host.
        self.run('evtest %s > %s' % (node, filename), timeout=1,
                 ignore_timeout=True)
        properties = self.run('cat %s' % filename).stdout
        input_type = player._determine_input_type(properties)
        if input_type not in wanted:
            continue
        found.append(input_type)
        wanted.remove(input_type)
        if not wanted:
            break
    self.run('rm %s' % filename)

    return found
2479
Hung-ying Tyana39b0542015-06-30 10:36:42 +08002480
2481 @label_decorator('internal_display')
def has_internal_display(self):
    """Determine if the device under test is equipped with an internal
    display.

    The answer comes from the client-side graphics_utils library, with
    its command and file helpers temporarily redirected to run on this
    host.

    @return: 'internal_display' if one is present; None otherwise.
    """
    from autotest_lib.client.cros.graphics import graphics_utils
    from autotest_lib.client.common_lib import utils as common_utils

    def run_for_output(cmd):
        """Run `cmd` on this host and return its stdout."""
        return self.run(cmd).stdout

    def cat_remote_file(remote_path):
        """Return the content of `remote_path` on this host."""
        return self.run('cat %s' % remote_path).stdout

    # Hijack the necessary client functions so that we can take advantage
    # of the client lib here.
    # FIXME: find a less hacky way than this
    saved_system_output = utils.system_output
    saved_read_file = common_utils.read_file
    utils.system_output = run_for_output
    common_utils.read_file = cat_remote_file
    try:
        if graphics_utils.has_internal_display():
            return 'internal_display'
        return None
    finally:
        # Always put the real client functions back.
        utils.system_output = saved_system_output
        common_utils.read_file = saved_read_file
2510
2511
Eric Carusoee673ac2015-08-05 17:03:04 -07002512 @label_decorator('lucidsleep')
def has_lucid_sleep_support(self):
    """Determine if the device under test has support for lucid sleep.

    The board name is the board label with ds_constants.BOARD_PREFIX
    removed; it is looked up in LUCID_SLEEP_BOARDS.

    @return 'lucidsleep' if this board supports lucid sleep; None otherwise
    """
    board_label = self.get_board()
    board = board_label.replace(ds_constants.BOARD_PREFIX, '')
    if board in LUCID_SLEEP_BOARDS:
        return 'lucidsleep'
    return None
2520
2521
def is_boot_from_usb(self):
    """Check whether the DUT is booted from a removable device.

    Reads the `removable` flag in sysfs for the device reported by
    `rootdev -s -d`.

    @return: True if DUT is boot from usb.
    """
    root_device = self.run('rootdev -s -d').stdout.strip()
    block_name = os.path.basename(root_device)
    removable_flag = self.run(
            'cat /sys/block/%s/removable' % block_name).stdout.strip()
    return int(removable_flag) == 1
Helen Zhang17dae2b2014-11-11 09:25:52 -08002531
2532
def read_from_meminfo(self, key):
    """Return a memory value from /proc/meminfo.

    The value is the number that follows the ':' on the first line
    matched by `grep`, so keys that contain digits themselves (such
    as DirectMap4k) are parsed correctly.

    @param key: meminfo requested

    @return the memory value as an integer

    """
    meminfo = self.run('grep %s /proc/meminfo' % key).stdout.strip()
    logging.debug('%s', meminfo)
    # Prefer the number after the colon; fall back to the first run of
    # digits for any line that does not have the "name: value" shape.
    match = (re.search(r':\s*(\d+)', meminfo) or
             re.search(r'(\d+)', meminfo))
    return int(match.group(1))
Rohit Makasana8a4923c2015-08-13 17:04:26 -07002544
2545
def get_board_type(self):
    """
    Get the DUT's device type from /etc/lsb-release.
    DEVICETYPE can be one of CHROMEBOX, CHROMEBASE, CHROMEBOOK or more.

    @return value of DEVICETYPE param from lsb-release, or an empty
            string when grep produces no output.
    """
    grep_output = self.run('grep DEVICETYPE /etc/lsb-release',
                           ignore_status=True).stdout
    if not grep_output:
        return ''
    # The value is whatever follows the last '='.
    return grep_output.rsplit('=', 1)[-1].strip()
Gilad Arnolda76bef02015-09-29 13:55:15 -07002558
2559
def get_os_type(self):
    """Return the OS type label for this kind of host.

    @return the string 'cros'.
    """
    os_type = 'cros'
    return os_type
Simran Basia5522a32015-10-06 11:01:24 -07002562
2563
def enable_adb_testing(self):
    """Mark this host as an adb tester.

    Touches the file named by constants.ANDROID_TESTER_FILEFLAG on
    the host.
    """
    flag_path = constants.ANDROID_TESTER_FILEFLAG
    self.run('touch %s' % flag_path)
Dan Shia2872172015-10-31 01:16:51 -07002566 self.run('touch %s' % constants.ANDROID_TESTER_FILEFLAG)