blob: e2815257cf2503b458321b0762163c7be9ae2d86 [file] [log] [blame]
J. Richard Barnette24adbf42012-04-11 15:04:53 -07001# Copyright (c) 2012 The Chromium OS Authors. All rights reserved.
Dale Curtisaa5eedb2011-08-23 16:18:52 -07002# Use of this source code is governed by a BSD-style license that can be
3# found in the LICENSE file.
4
mussa584b4462014-06-20 15:13:28 -07005import ConfigParser
Aviv Keshet74c89a92013-02-04 15:18:30 -08006import functools
Christopher Wiley0ed712b2013-04-09 15:25:12 -07007import httplib
J. Richard Barnette1d78b012012-05-15 13:56:30 -07008import logging
Dan Shi0f466e82013-02-22 15:44:58 -08009import os
Simran Basid5e5e272012-09-24 15:23:59 -070010import re
Christopher Wileyd78249a2013-03-01 13:05:31 -080011import socket
J. Richard Barnette134ec2c2012-04-25 12:59:37 -070012import time
J. Richard Barnette1d78b012012-05-15 13:56:30 -070013import xmlrpclib
J. Richard Barnette134ec2c2012-04-25 12:59:37 -070014
mussa584b4462014-06-20 15:13:28 -070015import common
J. Richard Barnette45e93de2012-04-11 17:24:15 -070016from autotest_lib.client.bin import utils
Dan Shi9cb0eec2014-06-03 09:04:50 -070017from autotest_lib.client.common_lib import autotemp
Richard Barnette0c73ffc2012-11-19 15:21:18 -080018from autotest_lib.client.common_lib import error
19from autotest_lib.client.common_lib import global_config
Dan Shi549fb822015-03-24 18:01:11 -070020from autotest_lib.client.common_lib import lsbrelease_utils
J. Richard Barnette45e93de2012-04-11 17:24:15 -070021from autotest_lib.client.common_lib.cros import autoupdater
Richard Barnette03a0c132012-11-05 12:40:35 -080022from autotest_lib.client.common_lib.cros import dev_server
Christopher Wileyd78249a2013-03-01 13:05:31 -080023from autotest_lib.client.common_lib.cros import retry
Gabe Blackb72f4fb2015-01-20 16:47:13 -080024from autotest_lib.client.common_lib.cros.graphite import autotest_es
Gabe Black1e1c41b2015-02-04 23:55:15 -080025from autotest_lib.client.common_lib.cros.graphite import autotest_stats
Hsinyu Chaoe0b08e62015-08-11 10:50:37 +000026from autotest_lib.client.cros import constants as client_constants
J. Richard Barnette84890bd2014-02-21 11:05:47 -080027from autotest_lib.client.cros import cros_ui
Cheng-Yi Chiangf4104ff2014-12-23 19:39:01 +080028from autotest_lib.client.cros.audio import cras_utils
Katherine Threlkeldab83d392015-06-18 16:45:57 -070029from autotest_lib.client.cros.input_playback import input_playback
MK Ryu35d661e2014-09-25 17:44:10 -070030from autotest_lib.server import autoserv_parser
31from autotest_lib.server import autotest
32from autotest_lib.server import constants
33from autotest_lib.server import crashcollect
Dan Shia1ecd5c2013-06-06 11:21:31 -070034from autotest_lib.server import utils as server_utils
Dan Shi9cb0eec2014-06-03 09:04:50 -070035from autotest_lib.server.cros import provision
Scott Zawalski89c44dd2013-02-26 09:28:02 -050036from autotest_lib.server.cros.dynamic_suite import constants as ds_constants
Simran Basi5e6339a2013-03-21 11:34:32 -070037from autotest_lib.server.cros.dynamic_suite import tools, frontend_wrappers
Dan Shi9cb0eec2014-06-03 09:04:50 -070038from autotest_lib.server.cros.faft.config.config import Config as FAFTConfig
Fang Deng96667ca2013-08-01 17:46:18 -070039from autotest_lib.server.hosts import abstract_ssh
Tom Wai-Hong Tamefe1c7f2014-01-02 14:00:11 +080040from autotest_lib.server.hosts import chameleon_host
Fang Deng5d518f42013-08-02 14:04:32 -070041from autotest_lib.server.hosts import servo_host
Simran Basidcff4252012-11-20 16:13:20 -080042from autotest_lib.site_utils.rpm_control_system import rpm_client
Simran Basid5e5e272012-09-24 15:23:59 -070043
44
beeps32a63082013-08-22 14:02:29 -070045try:
46 import jsonrpclib
47except ImportError:
48 jsonrpclib = None
Fang Deng96667ca2013-08-01 17:46:18 -070049
Fang Dengd1c2b732013-08-20 12:59:46 -070050
# Shorthand for the global configuration object; the class attributes
# below read their CROS/AUTOSERV settings through it.
CONFIG = global_config.global_config

# Board names grouped under "lucid sleep" (consumers of this list are not
# visible in this part of the file).
LUCID_SLEEP_BOARDS = ['samus', 'lulu']

# A file to indicate provision failure and require Repair job to powerwash the
# dut.
PROVISION_FAILED = '/var/tmp/provision_failed'
58
class FactoryImageCheckerException(error.AutoservError):
    """Exception raised when an image is a factory image."""
62
63
def add_label_detector(label_function_list, label_list=None, label=None):
    """Decorator used to group functions together into the provided list.

    The decorated function is returned unchanged; decorating it only
    registers it (and, optionally, its label) in the caller-supplied lists.

    @param label_function_list: List of label detecting functions to add
                                decorated function to.
    @param label_list: List of detectable labels to add detectable labels to.
                       (Default: None)
    @param label: Label string that is detectable by this detection function
                  (Default: None)

    @returns a decorator taking the function to register.
    """
    def add_func(func):
        """Register `func` as a detector and hand it back untouched.

        @param func: The function to be added as a detector.
        """
        label_function_list.append(func)
        # A label is only recorded when one was given AND a list to collect
        # it was supplied (an empty list still counts as supplied).
        if label and label_list is not None:
            label_list.append(label)
        return func
    return add_func
82
83
Fang Deng0ca40e22013-08-27 17:47:44 -070084class CrosHost(abstract_ssh.AbstractSSHHost):
J. Richard Barnette45e93de2012-04-11 17:24:15 -070085 """Chromium OS specific subclass of Host."""
86
87 _parser = autoserv_parser.autoserv_parser
Scott Zawalski62bacae2013-03-05 10:40:32 -050088 _AFE = frontend_wrappers.RetryingAFE(timeout_min=5, delay_sec=10)
J. Richard Barnette45e93de2012-04-11 17:24:15 -070089
Richard Barnette03a0c132012-11-05 12:40:35 -080090 # Timeout values (in seconds) associated with various Chrome OS
91 # state changes.
J. Richard Barnette134ec2c2012-04-25 12:59:37 -070092 #
Richard Barnette0c73ffc2012-11-19 15:21:18 -080093 # In general, a good rule of thumb is that the timeout can be up
94 # to twice the typical measured value on the slowest platform.
95 # The times here have not necessarily been empirically tested to
96 # meet this criterion.
J. Richard Barnetteeb69d722012-06-18 17:29:44 -070097 #
98 # SLEEP_TIMEOUT: Time to allow for suspend to memory.
Richard Barnette0c73ffc2012-11-19 15:21:18 -080099 # RESUME_TIMEOUT: Time to allow for resume after suspend, plus
100 # time to restart the network.
J. Richard Barnette84890bd2014-02-21 11:05:47 -0800101 # SHUTDOWN_TIMEOUT: Time to allow for shut down.
J. Richard Barnetteeb69d722012-06-18 17:29:44 -0700102 # BOOT_TIMEOUT: Time to allow for boot from power off. Among
Richard Barnette0c73ffc2012-11-19 15:21:18 -0800103 # other things, this must account for the 30 second dev-mode
J. Richard Barnetted4649c62013-03-06 17:42:27 -0800104 # screen delay and time to start the network.
J. Richard Barnetteeb69d722012-06-18 17:29:44 -0700105 # USB_BOOT_TIMEOUT: Time to allow for boot from a USB device,
Richard Barnette0c73ffc2012-11-19 15:21:18 -0800106 # including the 30 second dev-mode delay and time to start the
J. Richard Barnetted4649c62013-03-06 17:42:27 -0800107 # network.
beepsf079cfb2013-09-18 17:49:51 -0700108 # INSTALL_TIMEOUT: Time to allow for chromeos-install.
J. Richard Barnette84890bd2014-02-21 11:05:47 -0800109 # POWERWASH_BOOT_TIMEOUT: Time to allow for a reboot that
110 # includes powerwash.
J. Richard Barnetteeb69d722012-06-18 17:29:44 -0700111
112 SLEEP_TIMEOUT = 2
J. Richard Barnetted4649c62013-03-06 17:42:27 -0800113 RESUME_TIMEOUT = 10
Tom Wai-Hong Tamfe005c22014-12-03 09:25:44 +0800114 SHUTDOWN_TIMEOUT = 10
J. Richard Barnettefbcc7122013-07-24 18:24:59 -0700115 BOOT_TIMEOUT = 60
J. Richard Barnette5bab5f52015-08-03 13:14:38 -0700116 USB_BOOT_TIMEOUT = 300
J. Richard Barnette7817b052014-08-28 09:47:29 -0700117 INSTALL_TIMEOUT = 480
Dan Shi2c88eed2013-11-12 10:18:38 -0800118 POWERWASH_BOOT_TIMEOUT = 60
Chris Sosab76e0ee2013-05-22 16:55:41 -0700119
Dan Shica503482015-03-30 17:23:25 -0700120 # Minimum OS version that supports server side packaging. Older builds may
121 # not have server side package built or with Autotest code change to support
122 # server-side packaging.
Dan Shib8540a52015-07-16 14:18:23 -0700123 MIN_VERSION_SUPPORT_SSP = CONFIG.get_config_value(
Dan Shiced09e42015-04-17 16:09:34 -0700124 'AUTOSERV', 'min_version_support_ssp', type=int)
Dan Shica503482015-03-30 17:23:25 -0700125
J. Richard Barnette84890bd2014-02-21 11:05:47 -0800126 # REBOOT_TIMEOUT: How long to wait for a reboot.
127 #
Chris Sosab76e0ee2013-05-22 16:55:41 -0700128 # We have a long timeout to ensure we don't flakily fail due to other
129 # issues. Shorter timeouts are vetted in platform_RebootAfterUpdate.
Simran Basi1160e2c2013-10-04 16:00:24 -0700130 # TODO(sbasi - crbug.com/276094) Restore to 5 mins once the 'host did not
131 # return from reboot' bug is solved.
132 REBOOT_TIMEOUT = 480
Chris Sosab76e0ee2013-05-22 16:55:41 -0700133
Ismail Noorbasha07fdb612013-02-14 14:13:31 -0800134 # _USB_POWER_TIMEOUT: Time to allow for USB to power toggle ON and OFF.
135 # _POWER_CYCLE_TIMEOUT: Time to allow for manual power cycle.
136 _USB_POWER_TIMEOUT = 5
137 _POWER_CYCLE_TIMEOUT = 10
138
beeps32a63082013-08-22 14:02:29 -0700139 _RPC_PROXY_URL = 'http://localhost:%d'
Christopher Wileydd181852013-10-10 19:56:58 -0700140 _RPC_SHUTDOWN_POLLING_PERIOD_SECONDS = 2
Peter Qiu4410db72014-06-05 10:32:41 -0700141 # Set shutdown timeout to account for the time for restarting the UI.
142 _RPC_SHUTDOWN_TIMEOUT_SECONDS = cros_ui.RESTART_UI_TIMEOUT
Richard Barnette0c73ffc2012-11-19 15:21:18 -0800143
Dan Shib8540a52015-07-16 14:18:23 -0700144 _RPM_RECOVERY_BOARDS = CONFIG.get_config_value('CROS',
Richard Barnette82c35912012-11-20 10:09:10 -0800145 'rpm_recovery_boards', type=str).split(',')
146
147 _MAX_POWER_CYCLE_ATTEMPTS = 6
148 _LAB_MACHINE_FILE = '/mnt/stateful_partition/.labmachine'
Fang Dengdeba14f2014-11-14 11:54:09 -0800149 _RPM_HOSTNAME_REGEX = ('chromeos(\d+)(-row(\d+))?-rack(\d+[a-z]*)'
150 '-host(\d+)')
Katherine Threlkeldab83d392015-06-18 16:45:57 -0700151 _LIGHTSENSOR_FILES = [ "in_illuminance0_input",
152 "in_illuminance_input",
153 "in_illuminance0_raw",
154 "in_illuminance_raw",
155 "illuminance0_input"]
Richard Barnette82c35912012-11-20 10:09:10 -0800156 _LIGHTSENSOR_SEARCH_DIR = '/sys/bus/iio/devices'
157 _LABEL_FUNCTIONS = []
Aviv Keshet74c89a92013-02-04 15:18:30 -0800158 _DETECTABLE_LABELS = []
159 label_decorator = functools.partial(add_label_detector, _LABEL_FUNCTIONS,
160 _DETECTABLE_LABELS)
J. Richard Barnette134ec2c2012-04-25 12:59:37 -0700161
J. Richard Barnetteb6de7e32013-02-14 13:28:04 -0800162 # Constants used in ping_wait_up() and ping_wait_down().
163 #
164 # _PING_WAIT_COUNT is the approximate number of polling
165 # cycles to use when waiting for a host state change.
166 #
167 # _PING_STATUS_DOWN and _PING_STATUS_UP are names used
168 # for arguments to the internal _ping_wait_for_status()
169 # method.
170 _PING_WAIT_COUNT = 40
171 _PING_STATUS_DOWN = False
172 _PING_STATUS_UP = True
173
Ismail Noorbasha07fdb612013-02-14 14:13:31 -0800174 # Allowed values for the power_method argument.
175
176 # POWER_CONTROL_RPM: Passed as default arg for power_off/on/cycle() methods.
177 # POWER_CONTROL_SERVO: Used in set_power() and power_cycle() methods.
178 # POWER_CONTROL_MANUAL: Used in set_power() and power_cycle() methods.
179 POWER_CONTROL_RPM = 'RPM'
180 POWER_CONTROL_SERVO = 'servoj10'
181 POWER_CONTROL_MANUAL = 'manual'
182
183 POWER_CONTROL_VALID_ARGS = (POWER_CONTROL_RPM,
184 POWER_CONTROL_SERVO,
185 POWER_CONTROL_MANUAL)
Richard Barnette0c73ffc2012-11-19 15:21:18 -0800186
Simran Basi5e6339a2013-03-21 11:34:32 -0700187 _RPM_OUTLET_CHANGED = 'outlet_changed'
188
Dan Shi9cb0eec2014-06-03 09:04:50 -0700189 # URL pattern to download firmware image.
Dan Shib8540a52015-07-16 14:18:23 -0700190 _FW_IMAGE_URL_PATTERN = CONFIG.get_config_value(
Dan Shi9cb0eec2014-06-03 09:04:50 -0700191 'CROS', 'firmware_url_pattern', type=str)
beeps687243d2013-07-18 15:29:27 -0700192
MK Ryu35d661e2014-09-25 17:44:10 -0700193 # File that has a list of directories to be collected
194 _LOGS_TO_COLLECT_FILE = os.path.join(
195 common.client_dir, 'common_lib', 'logs_to_collect')
196
197 # Prefix of logging message w.r.t. crash collection
198 _CRASHLOGS_PREFIX = 'collect_crashlogs'
199
200 # Time duration waiting for host up/down check
201 _CHECK_HOST_UP_TIMEOUT_SECS = 15
202
203 # A command that interacts with kernel and hardware (e.g., rm, mkdir, etc)
204 # might not be completely done deep through the hardware when the machine
205 # is powered down right after the command returns.
206 # We should wait for a few seconds to make them done. Finger crossed.
207 _SAFE_WAIT_SECS = 10
208
209
J. Richard Barnette964fba02012-10-24 17:34:29 -0700210 @staticmethod
def check_host(host, timeout=10):
    """Check if the given host is a chrome-os host.

    The probe passes only when /etc/lsb-release mentions CHROMEOS, the
    /mnt/stateful_partition/.android_tester marker is absent, and
    /etc/lsb-release does not mention moblab.

    @param host: An ssh host representing a device.
    @param timeout: The timeout for the run command.

    @return: True if the host device is chromeos; False otherwise,
             including when the probe command errors out or times out.
    """
    probe_cmd = ('grep -q CHROMEOS /etc/lsb-release && '
                 '! test -f /mnt/stateful_partition/.android_tester && '
                 '! grep -q moblab /etc/lsb-release')
    try:
        # ignore_status: a non-zero exit is an answer ("not chromeos"),
        # not an error.
        result = host.run(probe_cmd, ignore_status=True, timeout=timeout)
    except (error.AutoservRunError, error.AutoservSSHTimeout):
        return False
    return result.exit_status == 0
230
231
232 @staticmethod
Tom Wai-Hong Tamefe1c7f2014-01-02 14:00:11 +0800233 def _extract_arguments(args_dict, key_subset):
234 """Extract options from `args_dict` and return a subset result.
J. Richard Barnette7214e0b2013-02-06 15:20:49 -0800235
236 Take the provided dictionary of argument options and return
Tom Wai-Hong Tamefe1c7f2014-01-02 14:00:11 +0800237 a subset that represent standard arguments needed to construct
238 a test-assistant object (chameleon or servo) for a host. The
239 intent is to provide standard argument processing from
Christopher Wiley644ef3e2015-05-15 13:14:14 -0700240 CrosHost for tests that require a test-assistant board
Tom Wai-Hong Tamefe1c7f2014-01-02 14:00:11 +0800241 to operate.
242
243 @param args_dict Dictionary from which to extract the arguments.
244 @param key_subset Tuple of keys to extract from the args_dict, e.g.
245 ('servo_host', 'servo_port').
246 """
247 result = {}
248 for arg in key_subset:
249 if arg in args_dict:
250 result[arg] = args_dict[arg]
251 return result
252
253
254 @staticmethod
def get_chameleon_arguments(args_dict):
    """Extract chameleon options from `args_dict` and return the result.

    Recommended usage:
    ~~~~~~~~
        args_dict = utils.args_to_dict(args)
        chameleon_args = hosts.CrosHost.get_chameleon_arguments(args_dict)
        host = hosts.create_host(machine, chameleon_args=chameleon_args)
    ~~~~~~~~

    @param args_dict Dictionary from which to extract the chameleon
      arguments.

    @returns a dictionary with whichever of 'chameleon_host' and
      'chameleon_port' are present in `args_dict`.
    """
    chameleon_keys = ('chameleon_host', 'chameleon_port')
    return CrosHost._extract_arguments(args_dict, chameleon_keys)
270
271
272 @staticmethod
def get_servo_arguments(args_dict):
    """Extract servo options from `args_dict` and return the result.

    Recommended usage:
    ~~~~~~~~
        args_dict = utils.args_to_dict(args)
        servo_args = hosts.CrosHost.get_servo_arguments(args_dict)
        host = hosts.create_host(machine, servo_args=servo_args)
    ~~~~~~~~

    @param args_dict Dictionary from which to extract the servo
      arguments.

    @returns a dictionary with whichever of 'servo_host' and
      'servo_port' are present in `args_dict`.
    """
    servo_keys = ('servo_host', 'servo_port')
    return CrosHost._extract_arguments(args_dict, servo_keys)
J. Richard Barnette134ec2c2012-04-25 12:59:37 -0700288
J. Richard Barnette964fba02012-10-24 17:34:29 -0700289
def _initialize(self, hostname, chameleon_args=None, servo_args=None,
                try_lab_servo=False, ssh_verbosity_flag='', ssh_options='',
                *args, **dargs):
    """Initialize superclasses, |self.chameleon|, and |self.servo|.

    This method will attempt to create the test-assistant object
    (chameleon/servo) when it is needed by the test. Check
    the docstring of chameleon_host.create_chameleon_host and
    servo_host.create_servo_host for how this is determined.

    @param hostname: Hostname of the dut.
    @param chameleon_args: A dictionary that contains args for creating
                           a ChameleonHost. See chameleon_host for details.
    @param servo_args: A dictionary that contains args for creating
                       a ServoHost object. See servo_host for details.
    @param try_lab_servo: Boolean, False indicates that ServoHost should
                          not be created for a device in Cros test lab.
                          See servo_host for details.
    @param ssh_verbosity_flag: String, to pass to the ssh command to control
                               verbosity.
    @param ssh_options: String, other ssh options to pass to the ssh
                        command.
    @param args: Extra positional arguments, forwarded to the superclass
                 _initialize().
    @param dargs: Extra keyword arguments, forwarded to the superclass
                  _initialize().
    """
    super(CrosHost, self)._initialize(hostname=hostname,
                                      *args, **dargs)
    # self.env is a dictionary of environment variable settings
    # to be exported for commands run on the host.
    # LIBC_FATAL_STDERR_ can be useful for diagnosing certain
    # errors that might happen.
    self.env['LIBC_FATAL_STDERR_'] = '1'
    self._rpc_proxy_map = {}
    self._ssh_verbosity_flag = ssh_verbosity_flag
    self._ssh_options = ssh_options
    # TODO(fdeng): We need to simplify the
    # process of servo and servo_host initialization.
    # crbug.com/298432
    self._servo_host = servo_host.create_servo_host(
            dut=self.hostname, servo_args=servo_args,
            try_lab_servo=try_lab_servo)
    # TODO(waihong): Do the simplification on Chameleon too.
    self._chameleon_host = chameleon_host.create_chameleon_host(
            dut=self.hostname, chameleon_args=chameleon_args)

    # self.servo / self.chameleon are always set, and are None when the
    # corresponding host object was not created.
    if self._servo_host is not None:
        self.servo = self._servo_host.get_servo()
    else:
        self.servo = None

    if self._chameleon_host:
        self.chameleon = self._chameleon_host.create_chameleon_board()
    else:
        self.chameleon = None
Fang Deng5d518f42013-08-02 14:04:32 -0700342
343
def get_repair_image_name(self):
    """Generate a image_name from variables in the global config.

    The board comes from the AFE, the version from the AFE's
    'get_stable_version' RPC for that board, and the two are substituted
    into the CROS/stable_build_pattern config value.

    @returns a str of $board-version/$BUILD.

    @raises AutoservError: If the DUT has no board attribute.
    """
    board = self._get_board_from_afe()
    if board is None:
        raise error.AutoservError('DUT has no board attribute, '
                                  'cannot be repaired.')
    stable_version = self._AFE.run('get_stable_version', board=board)
    build_pattern = CONFIG.get_config_value(
            'CROS', 'stable_build_pattern')
    return build_pattern % (board, stable_version)
358
359
Scott Zawalski62bacae2013-03-05 10:40:32 -0500360 def _host_in_AFE(self):
361 """Check if the host is an object the AFE knows.
362
363 @returns the host object.
364 """
365 return self._AFE.get_hosts(hostname=self.hostname)
366
367
def lookup_job_repo_url(self):
    """Looks up the job_repo_url for the host.

    Only the first host returned by the AFE is consulted.

    @returns job_repo_url from AFE, or None if the AFE does not know the
             host or the host has no job_repo_url attribute.
    """
    hosts = self._AFE.get_hosts(hostname=self.hostname)
    if not hosts:
        return None
    attributes = hosts[0].attributes
    if ds_constants.JOB_REPO_URL in attributes:
        return attributes[ds_constants.JOB_REPO_URL]
    return None
Chris Sosab76e0ee2013-05-22 16:55:41 -0700380
381
def clear_cros_version_labels_and_job_repo_url(self):
    """Clear cros_version labels and host attribute job_repo_url.

    Does nothing when the AFE does not know this host.
    """
    if not self._host_in_AFE():
        return

    host_list = [self.hostname]
    # Every label on this host whose name starts with the version prefix.
    version_labels = self._AFE.get_labels(
            name__startswith=ds_constants.VERSION_PREFIX,
            host__hostname=self.hostname)

    for version_label in version_labels:
        version_label.remove_hosts(hosts=host_list)

    # Passing None for both values resets the job_repo_url attribute.
    self.update_job_repo_url(None, None)
396
397
def update_job_repo_url(self, devserver_url, image_name):
    """
    Updates the job_repo_url host attribute and asserts it's value.

    When either argument is empty/None the attribute is set to None.

    @param devserver_url: The devserver to use in the job_repo_url.
    @param image_name: The name of the image to use in the job_repo_url.

    @raises AutoservError: If we failed to update the job_repo_url.
    """
    repo_url = None
    if devserver_url and image_name:
        repo_url = tools.get_package_url(devserver_url, image_name)
    self._AFE.set_host_attribute(ds_constants.JOB_REPO_URL, repo_url,
                                 hostname=self.hostname)
    # Read the attribute back to confirm the AFE stored what was sent.
    if self.lookup_job_repo_url() != repo_url:
        raise error.AutoservError('Failed to update job_repo_url with %s, '
                                  'host %s' % (repo_url, self.hostname))
Scott Zawalski89c44dd2013-02-26 09:28:02 -0500415
416
def add_cros_version_labels_and_job_repo_url(self, image_name):
    """Add cros_version labels and host attribute job_repo_url.

    Does nothing when the AFE does not know this host.

    @param image_name: The name of the image e.g.
            lumpy-release/R27-3837.0.0

    """
    if not self._host_in_AFE():
        return

    cros_label = '%s%s' % (ds_constants.VERSION_PREFIX, image_name)
    devserver_url = dev_server.ImageServer.resolve(image_name).url()

    self._AFE.run('label_add_hosts', id=cros_label, hosts=[self.hostname])
    self.update_job_repo_url(devserver_url, image_name)
432
433
def verify_job_repo_url(self, tag=''):
    """
    Make sure job_repo_url of this host is valid.

    Eg: The job_repo_url "http://lmn.cd.ab.xyx:8080/static/\
    lumpy-release/R29-4279.0.0/autotest/packages" claims to have the
    autotest package for lumpy-release/R29-4279.0.0. If this isn't the case,
    download and extract it.

    The job_repo_url is read from the AFE; when the host has none, a
    warning is logged and nothing else happens.  Otherwise the
    'autotest_packages' artifact is staged on the devserver named in the
    url and the time that took is reported as a stat.

    @param tag: The tag from the server job, in the format
                <job_id>-<user>/<hostname>, or <hostless> for a server job.
                Not used by this method.

    @raises DevServerException: If we could not resolve a devserver.
    @raises AutoservError: If we're unable to save the new job_repo_url as
        a result of choosing a new devserver because the old one failed to
        respond to a health check.
    @raises urllib2.URLError: If the devserver embedded in job_repo_url
                              doesn't respond within the timeout.
    """
    job_repo_url = self.lookup_job_repo_url()
    if not job_repo_url:
        logging.warning('No job repo url set on host %s', self.hostname)
        return

    logging.info('Verifying job repo url %s', job_repo_url)
    devserver_url, image_name = tools.get_devserver_build_from_package_url(
            job_repo_url)

    ds = dev_server.ImageServer(devserver_url)

    logging.info('Staging autotest artifacts for %s on devserver %s',
                 image_name, ds.url())

    start_time = time.time()
    ds.stage_artifacts(image_name, ['autotest_packages'])
    stage_time = time.time() - start_time

    # Record how much of the verification time comes from a devserver
    # restage. If we're doing things right we should not see multiple
    # devservers for a given board/build/branch path.
    try:
        board, build_type, branch = server_utils.ParseBuildName(
                image_name)[:3]
    except server_utils.ParseBuildNameException:
        # Unparseable build names are simply not reported.
        return

    # Keep the text between the first '/' + 2 characters (i.e. past the
    # "//" of a "scheme://host:port" url) and the last ':'.
    devserver = devserver_url[
            devserver_url.find('/') + 2:devserver_url.rfind(':')]
    stats_key = {
        'board': board,
        'build_type': build_type,
        'branch': branch,
        # Dots separate the components of the stat name built below.
        'devserver': devserver.replace('.', '_'),
    }
    autotest_stats.Gauge('verify_job_repo_url').send(
            '%(board)s.%(build_type)s.%(branch)s.%(devserver)s' % stats_key,
            stage_time)
beepscb6f1e22013-06-28 19:14:10 -0700495
Scott Zawalskieadbf702013-03-14 09:23:06 -0400496
def stage_server_side_package(self, image=None):
    """Stage autotest server-side package on devserver.

    The build to stage is chosen in this order: `image` when given, else
    the host's job_repo_url attribute, else the first version label the
    AFE reports for the host.

    @param image: Full path of an OS image to install or a build name.

    @return: A url to the autotest server-side package, or None when the
             build is older than MIN_VERSION_SUPPORT_SSP.

    @raises AutoservError: If no build name can be parsed from `image`, or
            the host has neither a job_repo_url attribute nor a version
            label.
    """
    if image:
        image_name = tools.get_build_from_image(image)
        if not image_name:
            raise error.AutoservError(
                    'Failed to parse build name from %s' % image)
        ds = dev_server.ImageServer.resolve(image_name)
    else:
        job_repo_url = self.lookup_job_repo_url()
        if job_repo_url:
            devserver_url, image_name = (
                tools.get_devserver_build_from_package_url(job_repo_url))
            ds = dev_server.ImageServer(devserver_url)
        else:
            labels = self._AFE.get_labels(
                    name__startswith=ds_constants.VERSION_PREFIX,
                    host__hostname=self.hostname)
            if not labels:
                raise error.AutoservError(
                        'Failed to stage server-side package. The host has '
                        'no job_repo_url attribute or version label.')
            # The build name is the label with the version prefix removed.
            image_name = labels[0].name[len(ds_constants.VERSION_PREFIX):]
            ds = dev_server.ImageServer.resolve(image_name)

    # Get the OS version of the build, for any build older than
    # MIN_VERSION_SUPPORT_SSP, server side packaging is not supported.
    # Names that do not match the pattern are not version-checked.
    match = re.match(r'.*/R\d+-(\d+)\.', image_name)
    if match and int(match.group(1)) < self.MIN_VERSION_SUPPORT_SSP:
        logging.warning('Build %s is older than %s. Server side packaging '
                        'is disabled.', image_name,
                        self.MIN_VERSION_SUPPORT_SSP)
        return None

    ds.stage_artifacts(image_name, ['autotest_server_package'])
    return '%s/static/%s/%s' % (ds.url(), image_name,
                                'autotest_server_package.tar.bz2')
538
539
def _try_stateful_update(self, update_url, force_update, updater):
    """Try to use stateful update to initialize DUT.

    When DUT is already running the same version that machine_install
    tries to install, stateful update is a much faster way to clean up
    the DUT for testing, compared to a full reimage. It is implemented
    by calling autoupdater.run_update, but skipping updating root, as
    updating the kernel is time consuming and not necessary.

    The stateful update is only attempted for release image names, when
    updater.check_version() passes, and when `force_update` is set.

    @param update_url: url of the image.
    @param force_update: Set to True to update the image even if the DUT
        is running the same version.
    @param updater: ChromiumOSUpdater instance used to update the DUT.
    @returns: True if the DUT was updated with stateful update.

    """
    # TODO(jrbarnette): Yes, I hate this re.match() test case.
    # It's better than the alternative:  see crbug.com/360944.
    image_name = autoupdater.url_to_image_name(update_url)
    release_pattern = r'^.*-release/R[0-9]+-[0-9]+\.[0-9]+\.0$'
    if not re.match(release_pattern, image_name):
        return False
    if not updater.check_version():
        return False
    if not force_update:
        logging.info('Canceling stateful update because the new and '
                     'old versions are the same.')
        return False
    # Following folders should be rebuilt after stateful update.
    # A test file is used to confirm each folder gets rebuilt after
    # the stateful update.
    folders_to_check = ['/var', '/home', '/mnt/stateful_partition']
    test_file = '.test_file_to_be_deleted'
    marker_paths = [os.path.join(folder, test_file)
                    for folder in folders_to_check]
    for marker_path in marker_paths:
        self.run('touch %s' % marker_path)

    updater.run_update(update_root=False)

    # Reboot to complete stateful update.
    self.reboot(timeout=self.REBOOT_TIMEOUT, wait=True)
    # NOTE(review): the command ends with `echo $?`, so its exit status is
    # presumably that of `echo`, and the `exit_status == 1` branch below
    # may never fire. Confirm the intended check before changing it.
    check_file_cmd = 'test -f %s; echo $?'
    for marker_path in marker_paths:
        result = self.run(check_file_cmd % marker_path,
                          ignore_status=True)
        if result.exit_status == 1:
            return False
    return True
589
590
def _post_update_processing(self, updater, expected_kernel=None):
    """After the DUT is updated, confirm machine_install succeeded.

    @param updater: ChromiumOSUpdater instance used to update the DUT.
    @param expected_kernel: kernel expected to be active after reboot,
        or `None` to skip rollback checking.

    @raises autoupdater.ChromiumOSError: If the DUT is not running the
        build the updater meant to install.
    """
    # Touch the lab machine file to leave a marker that
    # distinguishes this image from other test images.
    # Afterwards, we must re-run the autoreboot script because
    # it depends on the _LAB_MACHINE_FILE.
    self.run('touch %s' % self._LAB_MACHINE_FILE)
    self.run('start autoreboot')
    rollback_message = (
            'Build %s failed to boot on %s; system rolled back to previous '
            'build' % (updater.update_version, self.hostname))
    updater.verify_boot_expectations(
            expected_kernel, rollback_message=rollback_message)
    # Check that we've got the build we meant to install.
    if not updater.check_version_to_confirm_install():
        raise autoupdater.ChromiumOSError(
                'Failed to update %s to build %s; found build '
                '%s instead' % (self.hostname,
                                updater.update_version,
                                self.get_release_version()))

    logging.debug('Cleaning up old autotest directories.')
    try:
        installed_autodir = autotest.Autotest.get_installed_autodir(self)
        self.run('rm -rf ' + installed_autodir)
    except autotest.AutodirNotFoundError:
        logging.debug('No autotest installed directory found.')
623
Dan Shi0f466e82013-02-22 15:44:58 -0800624
def _stage_image_for_update(self, image_name=None):
    """Stage a build on a devserver and return the update_url and devserver.

    The download is triggered with `synchronous=False`.

    @param image_name: a name like lumpy-release/R27-3837.0.0. When it is
            empty, the name returned by get_repair_image_name() is used.
    @returns a tuple with an update URL like:
            http://172.22.50.205:8082/update/lumpy-release/R27-3837.0.0
            and the devserver instance the build was staged on.
    """
    build = image_name or self.get_repair_image_name()

    logging.info('Staging build for AU: %s', build)
    image_server = dev_server.ImageServer.resolve(build)
    image_server.trigger_download(build, synchronous=False)
    update_url = tools.image_url_pattern() % (image_server.url(), build)
    return (update_url, image_server)
Scott Zawalskieadbf702013-03-14 09:23:06 -0400641
642
def stage_image_for_servo(self, image_name=None):
    """Stage a test image on a devserver and return its URL.

    @param image_name: a name like lumpy-release/R27-3837.0.0. When it is
            empty, the name returned by get_repair_image_name() is used.
    @returns the value of devserver.get_test_image_url() for the staged
            build.
    """
    build = image_name or self.get_repair_image_name()
    logging.info('Staging build for servo install: %s', build)
    image_server = dev_server.ImageServer.resolve(build)
    # Only the 'test_image' artifact is needed for a servo install.
    image_server.stage_artifacts(build, ['test_image'])
    return image_server.get_test_image_url(build)
656
657
def stage_factory_image_for_servo(self, image_name):
    """Stage a factory build on a devserver and return its image URL.

    @param image_name: a name like <board>/4262.204.0

    @return: An image URL, eg:
            http://<devserver>/static/canary-channel/<board>/4262.204.0/
            factory_test/chromiumos_factory_image.bin
            `None` is returned, after logging an error, when image_name
            is empty.

    @raises: ValueError if the factory artifact name is missing from
            the config.

    """
    if not image_name:
        logging.error('Need an image_name to stage a factory image.')
        return None

    # The artifact to stage is configured under CROS.factory_artifact.
    artifact_name = CONFIG.get_config_value(
            'CROS', 'factory_artifact', type=str, default='')
    if not artifact_name:
        raise ValueError('Cannot retrieve the factory artifact name from '
                         'autotest config, and hence cannot stage factory '
                         'artifacts.')

    logging.info('Staging build for servo install: %s', image_name)
    image_server = dev_server.ImageServer.resolve(image_name)
    image_server.stage_artifacts(image_name, [artifact_name],
                                 archive_url=None)

    url_pattern = tools.factory_image_url_pattern()
    return url_pattern % (image_server.url(), image_name)
690
691
def machine_install(self, update_url=None, force_update=False,
                    local_devserver=False, repair=False,
                    force_full_update=False):
    """Install the DUT.

    Use stateful update if the DUT is already running the same build.
    Stateful update does not update kernel and tends to run much faster
    than a full reimage. If the DUT is running a different build, or it
    failed to do a stateful update, full update, including kernel update,
    will be applied to the DUT.

    Once a host enters machine_install its cros_version label will be
    removed as well as its host attribute job_repo_url (used for
    package install).

    @param update_url: The url to use for the update
            pattern: http://$devserver:###/update/$build
            If repair is True this value is replaced by the URL of the
            freshly staged repair image (see get_repair_image_name()).
            If it is empty and repair is False, the build given by the
            parser option `image` is used.
    @param force_update: Force an update even if the version installed
            is the same. Default:False
    @param local_devserver: Used by test_that to allow people to
            use their local devserver. Default: False
    @param repair: Forces update to repair image. Implies force_update.
    @param force_full_update: If True, do not attempt to run stateful
            update, force a full reimage. If False, try stateful update
            first when the dut is already installed with the same version.
    @raises error.AutoservError if there is neither an update URL nor an
            `image` option to derive one from.
    @raises autoupdater.ChromiumOSError

    """
    devserver = None
    # Build to re-stage when a devserver turns out to be unhealthy. It must
    # be bound on every path: in repair mode it stays None, which makes
    # _stage_image_for_update() fall back to the repair image again.
    requested_build = None
    if repair:
        update_url, devserver = self._stage_image_for_update()
        force_update = True

    if not update_url and not self._parser.options.image:
        raise error.AutoservError(
                'There is no update URL, nor a method to get one.')

    if not update_url and self._parser.options.image:
        # This is the base case where we have no given update URL i.e.
        # dynamic suites logic etc. This is the most flexible case where we
        # can serve an update from any of our fleet of devservers.
        requested_build = self._parser.options.image
        if not requested_build.startswith('http://'):
            logging.debug('Update will be staged for this installation')
            update_url, devserver = self._stage_image_for_update(
                    requested_build)
        else:
            update_url = requested_build

    logging.debug('Update URL is %s', update_url)

    # Remove cros-version and job_repo_url host attribute from host.
    self.clear_cros_version_labels_and_job_repo_url()

    # Create a file to indicate if provision fails. The file will be removed
    # by stateful update or full install.
    self.run('touch %s' % PROVISION_FAILED)

    update_complete = False
    updater = autoupdater.ChromiumOSUpdater(
            update_url, host=self, local_devserver=local_devserver)
    if not force_full_update:
        try:
            # If the DUT is already running the same build, try stateful
            # update first as it's much quicker than a full re-image.
            update_complete = self._try_stateful_update(
                    update_url, force_update, updater)
        except Exception as e:
            # Best effort only: a failed stateful update falls through to
            # the full update below.
            logging.exception(e)

    inactive_kernel = None
    if update_complete or (not force_update and updater.check_version()):
        logging.info('Install complete without full update')
    else:
        logging.info('DUT requires full update.')
        self.reboot(timeout=self.REBOOT_TIMEOUT, wait=True)
        num_of_attempts = provision.FLAKY_DEVSERVER_ATTEMPTS

        while num_of_attempts > 0:
            num_of_attempts -= 1
            try:
                updater.run_update()
            except Exception:
                logging.warning('Autoupdate did not complete.')
                # Do additional check for the devserver health. Ideally,
                # the autoupdater.py could raise an exception when it
                # detected network flake but that would require
                # instrumenting the update engine and parsing it log.
                if (num_of_attempts <= 0 or
                        devserver is None or
                        dev_server.DevServer.devserver_healthy(
                                devserver.url())):
                    raise

                logging.warning('Devserver looks unhealthy. Trying another')
                update_url, devserver = self._stage_image_for_update(
                        requested_build)
                logging.debug('New Update URL is %s', update_url)
                updater = autoupdater.ChromiumOSUpdater(
                        update_url, host=self,
                        local_devserver=local_devserver)
            else:
                break

        # Give it some time in case of IO issues.
        time.sleep(10)

        # Figure out active and inactive kernel.
        active_kernel, inactive_kernel = updater.get_kernel_state()

        # Ensure inactive kernel has higher priority than active.
        if (updater.get_kernel_priority(inactive_kernel)
                < updater.get_kernel_priority(active_kernel)):
            raise autoupdater.ChromiumOSError(
                    'Update failed. The priority of the inactive kernel'
                    ' partition is less than that of the active kernel'
                    ' partition.')

        # Updater has returned successfully; reboot the host.
        self.reboot(timeout=self.REBOOT_TIMEOUT, wait=True)

    self._post_update_processing(updater, inactive_kernel)
    self.add_cros_version_labels_and_job_repo_url(
            autoupdater.url_to_image_name(update_url))
J. Richard Barnette45e93de2012-04-11 17:24:15 -0700820
821
def _clear_fw_version_labels(self):
    """Remove this host from all of its firmware version labels.

    The labels are the ones the AFE reports for this hostname whose name
    starts with provision.FW_RW_VERSION_PREFIX.
    """
    fw_labels = self._AFE.get_labels(
            name__startswith=provision.FW_RW_VERSION_PREFIX,
            host__hostname=self.hostname)
    for fw_label in fw_labels:
        fw_label.remove_hosts(hosts=[self.hostname])
829
830
def _add_fw_version_label(self, build):
    """Attach the firmware version label for `build` to this host.

    @param build: Build of firmware.

    """
    label_name = provision.fw_version_to_label(build)
    self._AFE.run('label_add_hosts',
                  id=label_name,
                  hosts=[self.hostname])
Dan Shi9cb0eec2014-06-03 09:04:50 -0700839
840
def firmware_install(self, build=None):
    """Install firmware to the DUT through its servo.

    The 'firmware' artifact of the build is staged on a devserver, the
    firmware tarball is downloaded and unpacked into a temporary
    directory, and the EC and AP (BIOS) images found in it are programmed
    via servo. Afterwards the DUT is reset through the servo power state
    controller.

    The fw_version labels of the host are removed right before the
    firmware is programmed. After the firmware is programmed and the DUT
    was reset, a new fw_version label is added to the host.

    @param build: The build version to which we want to provision the
                  firmware of the machine,
                  e.g. 'link-firmware/R22-2695.1.144'. If not set, the
                  name returned by get_repair_image_name() is used.

    @raises error.TestError if the host does not have a servo.

    TODO(dshi): After bug 381718 is fixed, update here with corresponding
    exceptions that could be raised.

    """
    if not self.servo:
        raise error.TestError('Host %s does not have servo.' %
                              self.hostname)

    # TODO(fdeng): use host.get_board() after
    # crbug.com/271834 is fixed.
    board = self._get_board_from_afe()

    # If build is not set, try to install firmware from stable CrOS.
    build = build or self.get_repair_image_name()

    # U-Boot platforms ship a board specific AP image; everything else
    # (Depthcharge platforms) uses the generic name.
    uses_u_boot = FAFTConfig(board).use_u_boot
    ap_image = ('image-%s.bin' % board) if uses_u_boot else 'image.bin'
    ec_image = 'ec.bin'

    image_server = dev_server.ImageServer.resolve(build)
    image_server.stage_artifacts(build, ['firmware'])

    workdir = autotemp.tempdir(unique_id='fwimage')
    try:
        tarball_url = self._FW_IMAGE_URL_PATTERN % (image_server.url(),
                                                    build)
        tarball_path = os.path.join(workdir.name,
                                    os.path.basename(tarball_url))
        server_utils.system('wget -O %s %s' % (tarball_path, tarball_url),
                            timeout=60)
        server_utils.system('tar xf %s -C %s %s %s' %
                            (tarball_path, workdir.name, ap_image,
                             ec_image),
                            timeout=60)
        # The "dts/*" members are extracted on a best-effort basis: a
        # failure of this command is ignored.
        server_utils.system('tar xf %s --wildcards -C %s "dts/*"' %
                            (tarball_path, workdir.name),
                            timeout=60, ignore_status=True)

        self._clear_fw_version_labels()
        logging.info('Will re-program EC now')
        self.servo.program_ec(os.path.join(workdir.name, ec_image))
        logging.info('Will re-program BIOS now')
        self.servo.program_bios(os.path.join(workdir.name, ap_image))
        self.servo.get_power_state_controller().reset()
        time.sleep(self.servo.BOOT_DELAY)
        self._add_fw_version_label(build)
    finally:
        # Always remove the temporary directory, even on failure.
        workdir.clean()
906
907
def show_update_engine_log(self):
    """Output the update engine log by running `cat` on it on the host."""
    log_path = client_constants.UPDATE_ENGINE_LOG
    logging.debug('Dumping %s', log_path)
    self.run('cat %s' % log_path)
Dan Shi10e992b2013-08-30 11:02:59 -0700912
913
def _get_board_from_afe(self):
    """Retrieve this host's board from its labels in the AFE.

    Delegates to server_utils.get_board_from_afe(). As documented for this
    method so far, that helper looks for a host label of the form
    "board:<board>" and yields the "<board>" part, or `None` if there is
    not a single, unique label matching the pattern.

    @returns board from label, or `None`.
    """
    board = server_utils.get_board_from_afe(self.hostname, self._AFE)
    return board
Simran Basi833814b2013-01-29 13:13:43 -0800924
925
def get_build(self):
    """Retrieve the current build for this Host from the AFE.

    Delegates to server_utils.get_build_from_afe(), which inspects this
    host's labels in the AFE.

    @returns The current build or None if it could not find it or if there
             were multiple build labels assigned to this host.
    """
    build = server_utils.get_build_from_afe(self.hostname, self._AFE)
    return build
Richard Barnette82c35912012-11-20 10:09:10 -0800935
936
def _install_repair(self):
    """Attempt to repair this host using the update-engine.

    If the host is up, re-install the DUT by calling machine_install() in
    repair mode, i.e. with the stable "repair" version of Chrome OS.

    @raises AutoservRepairMethodNA if the DUT is not reachable.
    @raises ChromiumOSError if the install failed for some reason.

    """
    host_reachable = self.is_up()
    if not host_reachable:
        raise error.AutoservRepairMethodNA('DUT unreachable for install.')

    logging.info('Attempting to reimage machine to repair image.')
    try:
        self.machine_install(repair=True)
    except autoupdater.ChromiumOSError as install_error:
        # Log the failure here, then let the caller decide what to do.
        logging.exception(install_error)
        logging.info('Repair via install failed.')
        raise
Scott Zawalski89c44dd2013-02-26 09:28:02 -0500958
959
def _install_repair_with_powerwash(self):
    """Attempt to powerwash first then repair this host using update-engine.

    update-engine may fail due to a bad image. In such case, powerwash
    may help to cleanup the DUT for update-engine to work again.

    @raises AutoservRepairMethodNA if the DUT is not reachable.
    @raises AutoservRepairFailure if the DUT does not come back after the
            powerwash reboot.
    @raises ChromiumOSError if the install failed for some reason.

    """
    if not self.is_up():
        raise error.AutoservRepairMethodNA('DUT unreachable for install.')

    logging.info('Attempting to powerwash the DUT.')
    # Request the powerwash by writing the reset file, then reboot.
    powerwash_cmd = ('echo "fast safe" > '
                     '/mnt/stateful_partition/factory_install_reset')
    self.run(powerwash_cmd)
    self.reboot(timeout=self.POWERWASH_BOOT_TIMEOUT, wait=True)

    if self.is_up():
        logging.info('Powerwash succeeded.')
        self._install_repair()
        return

    logging.error('Powerwash failed. DUT did not come back after '
                  'reboot.')
    raise error.AutoservRepairFailure(
            'DUT failed to boot from powerwash after %d seconds' %
            self.POWERWASH_BOOT_TIMEOUT)
986
987
def servo_install(self, image_url=None, usb_boot_timeout=USB_BOOT_TIMEOUT,
                  install_timeout=INSTALL_TIMEOUT):
    """Re-install the OS on the DUT through servo.

    The steps are:
    1) install a recovery image through servo and wait for the DUT to
       boot from it,
    2) reset the TPM status with chromeos-tpm-recovery (a failure of that
       command is tolerated),
    3) install the image with chromeos-install and halt the DUT, and
    4) power cycle the DUT through servo with the USB key switched off.

    @param image_url: Passed to servo.install_recovery_image(). As
            documented for this method so far: if specified use as the
            url to install on the DUT, otherwise boot the currently staged
            image on the USB stick.
    @param usb_boot_timeout: The usb_boot_timeout to use during reimage.
            Factory images need a longer usb_boot_timeout than regular
            cros images.
    @param install_timeout: The timeout to use when installing the chromeos
            image. Factory images need a longer install_timeout.

    @raises AutoservRepairFailure if the DUT fails to boot from USB.
    @raises AutoservError if the installed image fails to boot.

    """
    logging.info('Downloading image to USB, then booting from it. Usb boot '
                 'timeout = %s', usb_boot_timeout)
    usb_boot_timer = autotest_stats.Timer(
            'servo_install.usb_boot_timeout_%s' % usb_boot_timeout)
    usb_boot_timer.start()
    self.servo.install_recovery_image(image_url)
    if not self.wait_up(timeout=usb_boot_timeout):
        raise error.AutoservRepairFailure(
                'DUT failed to boot from USB after %d seconds' %
                usb_boot_timeout)
    usb_boot_timer.stop()

    # The new chromeos-tpm-recovery has been merged since R44-7073.0.0.
    # In old CrOS images, this command fails. Skip the error.
    logging.info('Resetting the TPM status')
    try:
        self.run('chromeos-tpm-recovery')
    except error.AutoservRunError:
        logging.warning('chromeos-tpm-recovery is too old.')

    install_timer = autotest_stats.Timer(
            'servo_install.install_timeout_%s' % install_timeout)
    install_timer.start()
    logging.info('Installing image through chromeos-install.')
    self.run('chromeos-install --yes', timeout=install_timeout)
    self.halt()
    install_timer.stop()

    logging.info('Power cycling DUT through servo.')
    self.servo.get_power_state_controller().power_off()
    self.servo.switch_usbkey('off')
    # N.B. The Servo API requires that we use power_on() here
    # for two reasons:
    #  1) After turning on a DUT in recovery mode, you must turn
    #     it off and then on with power_on() once more to
    #     disable recovery mode (this is a Parrot specific
    #     requirement).
    #  2) After power_off(), the only way to turn on is with
    #     power_on() (this is a Storm specific requirement).
    self.servo.get_power_state_controller().power_on()

    logging.info('Waiting for DUT to come back up.')
    booted = self.wait_up(timeout=self.BOOT_TIMEOUT)
    if not booted:
        raise error.AutoservError('DUT failed to reboot installed '
                                  'test image after %d seconds' %
                                  self.BOOT_TIMEOUT)
1057
1058
def _setup_servo(self):
    """Try to create the servo object if it is not set up yet.

    Nothing is done when `self.servo` is already set. Any exception raised
    while creating the servo host or the servo is logged and swallowed, so
    callers have to check `self.servo` afterwards.
    """
    if self.servo:
        return

    try:
        # Setting servo_args to {} will force it to create the servo_host
        # object if possible.
        self._servo_host = servo_host.create_servo_host(
                dut=self.hostname, servo_args={})
        if not self._servo_host:
            logging.error('Failed to create servo_host object.')
            return
        self.servo = self._servo_host.get_servo()
    except Exception as setup_error:
        logging.error('Failed to create servo object: %s', setup_error)
1076
1077
def _servo_repair_reinstall(self):
    """Reinstall the DUT utilizing servo and a test image.

    Stages the repair test image on a devserver and hands its URL to
    servo_install(), which re-installs the OS on the DUT through servo.

    @raises AutoservRepairMethodNA if the device does not have servo
            support.

    """
    # To repair a DUT connected to a moblab, try to create a servo object if
    # it was failed to be created earlier as there may be a servo_host host
    # attribute for this host.
    if utils.is_moblab():
        self._setup_servo()

    if not self.servo:
        raise error.AutoservRepairMethodNA('Repair Reinstall NA: '
                                           'DUT has no servo support.')

    logging.info('Attempting to recovery servo enabled device with '
                 'servo_repair_reinstall')

    test_image_url = self.stage_image_for_servo()
    self.servo_install(test_image_url)
1107
1108
def _servo_repair_power(self):
    """Attempt to repair DUT using an attached Servo.

    Powers the DUT off and on again through the servo power state
    controller and waits for it to come up.

    @raises AutoservRepairMethodNA if the device does not have servo
            support.
    @raises AutoservRepairFailure if the DUT does not come up within
            BOOT_TIMEOUT after the power cycle.
    """
    if not self.servo:
        raise error.AutoservRepairMethodNA('Repair Power NA: '
                                           'DUT has no servo support.')

    logging.info('Attempting to recover servo enabled device by '
                 'powering it off and on.')
    self.servo.get_power_state_controller().power_off()
    self.servo.get_power_state_controller().power_on()

    if not self.wait_up(self.BOOT_TIMEOUT):
        raise error.AutoservRepairFailure(
                'DUT did not boot after long_press.')
Richard Barnette03a0c132012-11-05 12:40:35 -08001130
1131
def _powercycle_to_repair(self):
    """Utilize the RPM Infrastructure to bring the host back up.

    The host is power cycled and then given BOOT_TIMEOUT to come up. This
    is repeated until the host is up or _MAX_POWER_CYCLE_ATTEMPTS cycles
    have failed.

    @raises AutoservRepairMethodNA if the device does not support remote
            power.
    @raises AutoservRepairFailure if the host did not come back after
            _MAX_POWER_CYCLE_ATTEMPTS power cycles.

    """
    if not self.has_power():
        raise error.AutoservRepairMethodNA('Device does not support power.')

    logging.info('Attempting repair via RPM powercycle.')
    failures = 0
    while True:
        self.power_cycle()
        if self.wait_up(timeout=self.BOOT_TIMEOUT):
            break
        failures += 1
        if failures >= self._MAX_POWER_CYCLE_ATTEMPTS:
            raise error.AutoservRepairFailure(
                    'Powercycled host %s %d times; device did not come back'
                    ' online.' % (self.hostname, failures))

    if failures:
        logging.info('Powercycling was successful after %d failures.',
                     failures)
    else:
        logging.info('Powercycling was successful first time.')
1162
1163
def _reboot_repair(self):
    """SSH to this host and reboot.

    @raises AutoservRepairMethodNA if the host is not up within
            _CHECK_HOST_UP_TIMEOUT_SECS.
    """
    reachable = self.is_up(self._CHECK_HOST_UP_TIMEOUT_SECS)
    if not reachable:
        raise error.AutoservRepairMethodNA('DUT unreachable for reboot.')

    logging.info('Attempting repair via SSH reboot.')
    self.reboot(timeout=self.BOOT_TIMEOUT, wait=True)
1170
1171
def check_device(self):
    """Check if a device is ssh-able, and if so, clean and verify it.

    The three steps run in order and the first failing one aborts the
    check by raising.

    @raise AutoservSSHTimeout: If the ssh ping times out.
    @raise AutoservSshPermissionDeniedError: If ssh ping fails due to
            permissions.
    @raise AutoservSshPingHostError: For other AutoservRunErrors during
            ssh_ping.
    @raises AutoservError: As appropriate, during cleanup and verify.
    """
    # 1. Make sure the device answers over ssh at all.
    self.ssh_ping()
    # 2. Clean the device up.
    self.cleanup()
    # 3. Verify the device.
    self.verify()
1185
1186
def confirm_servo(self):
    """Confirm servo is initialized and verified.

    Returns immediately when a servo host exists, its `required_by_test`
    flag is set and a servo object is present. Otherwise the servo host
    and servo objects are dropped and re-created through _setup_servo().

    @raise AutoservError: If servo is not initialized and verified.
    """
    # _servo_host may legitimately be None (this method resets it below and
    # _setup_servo() can leave it unset), so guard the attribute access
    # instead of failing with an AttributeError.
    servo_host_verified = (self._servo_host is not None and
                           self._servo_host.required_by_test)
    if servo_host_verified and self.servo:
        return

    # Force to re-create the servo object to make sure servo is verified.
    logging.debug('Rebuilding the servo object.')
    self.servo = None
    self._servo_host = None
    self._setup_servo()
    if not self.servo:
        raise error.AutoservError('Failed to create servo object.')
1202
1203
def _is_last_provision_failed(self):
    """Checks if the last provision job failed.

    Tests on the host whether the PROVISION_FAILED marker file exists.

    @return: True if the marker file exists, which indicates the last
             provision job failed. False otherwise.
    """
    marker_check = self.run('[ -f %s ]' % PROVISION_FAILED,
                            ignore_status=True)
    # `[ -f path ]` exits with 0 exactly when the file exists.
    marker_exists = marker_check.exit_status == 0
    return marker_exists
1213
1214
def repair_full(self):
    """Repair a host for repair level NO_PROTECTION.

    This overrides the base class function for repair; it does
    not call back to the parent class, but instead offers a
    simplified implementation based on the capabilities in the
    Chrome OS test lab.

    If a servo host is configured for the DUT but no servo object is
    available yet, the servo host is repaired first.  A failure of that
    servo host repair is logged and does not abort the DUT repair.

    The repair procedures are tried in order, and the status is verified
    with `self.check_device()` after each of them.  This is done until
    both the repair and the verifying step succeed.

    Escalation order of repair procedures from less intrusive to
    more intrusive repairs:
      1. SSH to the DUT and reboot.
      2. If there's a servo for the DUT, try to power the DUT off and
         on.
      3. If the DUT can be power-cycled via RPM, try to repair
         by power-cycling.
      4. Try to re-install to a known stable image using
         auto-update.
      5. Try to re-install with powerwash
         (`self._install_repair_with_powerwash`).
      6. If there's a servo for the DUT, try to re-install via
         the servo.

    If `self._is_last_provision_failed()` reports that the last provision
    failed, only steps 5 and 6 are attempted.

    As with the parent method, the last operation performed on
    the DUT must be to call `self.check_device()`.  An exception raised
    by a repair procedure or by `self.check_device()` is recorded and the
    next procedure is tried.

    @raises AutoservRepairTotalFailure if the repair process fails to
            fix the DUT; the message lists every recorded error.

    """
    # Caution: Deleting shards relies on repair to always reboot the DUT.

    if self._servo_host and not self.servo:
        try:
            self._servo_host.repair_full()
        except Exception as e:
            # Best effort: a broken servo must not block DUT repair.
            logging.error('Could not create a healthy servo: %s', e)
        self.servo = self._servo_host.get_servo()

    self.try_collect_crashlogs()

    # TODO(scottz): This should use something similar to label_decorator,
    # but needs to be populated in order so DUTs are repaired with the
    # least amount of effort.
    if self._is_last_provision_failed():
        logging.info('Last provision failed, try powerwash first.')
        repair_funcs = [self._install_repair_with_powerwash,
                        self._servo_repair_reinstall]
    else:
        repair_funcs = [self._reboot_repair,
                        self._servo_repair_power,
                        self._powercycle_to_repair,
                        self._install_repair,
                        self._install_repair_with_powerwash,
                        self._servo_repair_reinstall]
    errors = []
    board = self._get_board_from_afe()

    def record_outcome(func, outcome):
        """Bump the stats counters for one repair function outcome.

        @param func: The repair function that was attempted.
        @param outcome: Counter suffix, e.g. 'SUCCEEDED' or 'FAILED'.
        """
        autotest_stats.Counter(
                '%s.%s' % (func.__name__, outcome)).increment()
        if board:
            autotest_stats.Counter(
                    '%s.%s.%s' % (func.__name__, board,
                                  outcome)).increment()

    for repair_func in repair_funcs:
        try:
            repair_func()
            self.try_collect_crashlogs()
            self.check_device()
            record_outcome(repair_func, 'SUCCEEDED')
            return
        except error.AutoservRepairMethodNA as e:
            record_outcome(repair_func, 'RepairNA')
            logging.warning('Repair function NA: %s', e)
            errors.append(str(e))
        except Exception as e:
            record_outcome(repair_func, 'FAILED')
            logging.warning('Failed to repair device: %s', e)
            errors.append(str(e))

    autotest_stats.Counter('Full_Repair_Failed').increment()
    if board:
        autotest_stats.Counter(
                'Full_Repair_Failed.%s' % board).increment()
    raise error.AutoservRepairTotalFailure(
            'All attempts at repairing the device failed:\n%s' %
            '\n'.join(errors))
Richard Barnette82c35912012-11-20 10:09:10 -08001319
1320
def try_collect_crashlogs(self, check_host_up=True):
    """Collect crash-logs from the host if a crashed job left some behind.

    Nothing is collected when `self._need_crash_logs()` reports no
    crashed job, or when `check_host_up` is set and the host does not
    come up within `self._CHECK_HOST_UP_TIMEOUT_SECS`.

    Any exception is logged and suppressed, so that crash-log collection
    never turns into a repair failure.

    @param check_host_up: Flag for checking host is up. Default is True.
    """
    try:
        job_id = self._need_crash_logs()
        if not job_id:
            return
        logging.debug('%s: Job %s was crashed', self._CRASHLOGS_PREFIX,
                      job_id)
        if check_host_up and not self.is_up(
                self._CHECK_HOST_UP_TIMEOUT_SECS):
            return
        self._collect_crashlogs(job_id)
        logging.debug('%s: Completed collecting logs for the '
                      'crashed job %s', self._CRASHLOGS_PREFIX,
                      job_id)
    except Exception as err:
        # Exception should not result in repair failure.
        # Therefore, suppress all exceptions here.
        logging.error('%s: Failed while trying to collect crash-logs: %s',
                      self._CRASHLOGS_PREFIX, err)
1344
1345
def _need_crash_logs(self):
    """Look up this host's need_crash_logs attribute in the AFE.

    At most one such attribute is expected per host.

    @return: Value string of need_crash_logs attribute
             None if there is no need_crash_logs attribute
    """
    matches = self._AFE.get_host_attribute(
            constants.CRASHLOGS_HOST_ATTRIBUTE, hostname=self.hostname)
    assert len(matches) < 2
    if matches:
        return matches[0].value
    return None
1356
1357
def _collect_crashlogs(self, job_id):
    """Grab logs from the host where a job was crashed.

    First, check if PRIOR_LOGS_DIR exists in the host.
    If yes, collect them.
    Otherwise, check if a lab-machine marker (_LAB_MACHINE_FILE) exists
    in the host.
    If yes, the host was repaired automatically, and we collect normal
    system logs.
    If neither exists, collection is skipped with a warning.

    In every case a marker file holding the job id is then written into
    the crash-logs directory and the need_crash_logs host attribute is
    cleared; if prior logs were found they are removed from the host.

    @param job_id: Id of the job that was crashed.
    """
    dest_dir = crashcollect.get_crashinfo_dir(
            self, constants.CRASHLOGS_DEST_DIR_PREFIX)

    had_prior_logs = False
    if self.path_exists(client_constants.PRIOR_LOGS_DIR):
        had_prior_logs = True
        self._collect_prior_logs(dest_dir)
    elif self.path_exists(self._LAB_MACHINE_FILE):
        self._collect_system_logs(dest_dir)
    else:
        logging.warning('%s: Host was manually re-installed without '
                        '--lab_preserve_log option. Skip collecting '
                        'crash-logs.', self._CRASHLOGS_PREFIX)

    # We make crash collection be one-time effort.
    # _collect_prior_logs() and _collect_system_logs() will not throw
    # any exception, and following codes will be executed even when
    # those methods fail.
    # _collect_crashlogs() is called only when the host is up (refer
    # to try_collect_crashlogs()). We assume _collect_prior_logs() and
    # _collect_system_logs() fail rarely when the host is up.
    # In addition, it is not clear how many times we should try crash
    # collection again while not triggering next repair unnecessarily.
    # Therefore, we try crash collection one time.

    # Create a marker file as soon as log collection is done.
    # Leave the job id to this marker for gs_offloader to consume.
    marker_path = os.path.join(dest_dir, constants.CRASHLOGS_MARKER)
    with open(marker_path, 'a') as marker:
        marker.write('%s\n' % job_id)

    # Remove need_crash_logs attribute
    logging.debug('%s: Remove attribute need_crash_logs from host %s',
                  self._CRASHLOGS_PREFIX, self.hostname)
    self._AFE.set_host_attribute(constants.CRASHLOGS_HOST_ATTRIBUTE,
                                 None, hostname=self.hostname)

    if not had_prior_logs:
        return

    logging.debug('%s: Remove %s from host %s', self._CRASHLOGS_PREFIX,
                  client_constants.PRIOR_LOGS_DIR, self.hostname)
    self.run('rm -rf %s; sync' % client_constants.PRIOR_LOGS_DIR)
    # Wait for a few seconds to make sure the prior command is
    # done deep through storage.
    time.sleep(self._SAFE_WAIT_SECS)
1414
1415
def _collect_prior_logs(self, crashlogs_dir):
    """Grab prior logs that were stashed before re-installing a host.

    Failures are logged and never propagated to the caller.

    @param crashlogs_dir: Directory path where crash-logs are stored.
    """
    prior_dir = client_constants.PRIOR_LOGS_DIR
    logging.debug('%s: Found %s, collecting them...',
                  self._CRASHLOGS_PREFIX, prior_dir)
    try:
        self.collect_logs(prior_dir, crashlogs_dir, False)
        logging.debug('%s: %s is collected',
                      self._CRASHLOGS_PREFIX, prior_dir)
    except Exception as err:
        logging.error('%s: Failed to collect %s: %s',
                      self._CRASHLOGS_PREFIX, prior_dir, err)
1432
1433
def _collect_system_logs(self, crashlogs_dir):
    """Grab normal system logs from a host.

    The paths to collect are read from `self._LOGS_TO_COLLECT_FILE`.
    Paths that do not exist on the host are skipped.  A failure on one
    path is logged and does not stop collection of the remaining paths.

    @param crashlogs_dir: Directory path where crash-logs are stored.
    """
    logging.debug('%s: Found %s, collecting system logs...',
                  self._CRASHLOGS_PREFIX, self._LAB_MACHINE_FILE)
    log_paths = server_utils.parse_simple_config(
            self._LOGS_TO_COLLECT_FILE)
    for log_path in log_paths:
        try:
            if not self.path_exists(log_path):
                continue
            logging.debug('%s: Collecting %s...',
                          self._CRASHLOGS_PREFIX, log_path)
            target = server_utils.concat_path_except_last(
                    crashlogs_dir, log_path)
            self.collect_logs(log_path, target, False)
            logging.debug('%s: %s is collected',
                          self._CRASHLOGS_PREFIX, log_path)
        except Exception as err:
            logging.error('%s: Failed to collect %s: %s',
                          self._CRASHLOGS_PREFIX, log_path, err)
1455
1456
def close(self):
    """Disconnect every RPC connection, then close via the parent class."""
    self.rpc_disconnect_all()
    super(CrosHost, self).close()
J. Richard Barnette1d78b012012-05-15 13:56:30 -07001460
1461
def get_power_supply_info(self):
    """Get the output of power_supply_info.

    power_supply_info outputs the info of each power supply, e.g.,
    Device: Line Power
      online:                  no
      type:                    Mains
      voltage (V):             0
      current (A):             0
    Device: Battery
      state:                   Discharging
      percentage:              95.9276
      technology:              Li-ion

    Above output shows two devices, Line Power and Battery, with details of
    each device listed. This function parses the output into a dictionary,
    with key being the device name, and value being a dictionary of details
    of the device info.

    Each line is split on its first colon only, so a value that itself
    contains a colon is kept intact.  Lines without any colon are
    ignored, as are detail lines that appear before the first
    `Device:` line.

    @return: The dictionary of power_supply_info, e.g.,
             {'Line Power': {'online': 'yes', 'type': 'main'},
              'Battery': {'vendor': 'xyz', 'percentage': '100'}}
    @raise error.AutoservRunError if power_supply_info tool is not found in
           the DUT. Caller should handle this error to avoid false failure
           on verification.
    """
    output = self.run('power_supply_info').stdout.strip()
    info = {}
    device_name = None
    device_info = {}
    for line in output.split('\n'):
        # maxsplit=1: only the first colon separates key from value.
        pair = [v.strip() for v in line.split(':', 1)]
        if len(pair) != 2:
            continue
        key, value = pair
        if key == 'Device':
            # A new device section starts; store the one just finished.
            if device_name:
                info[device_name] = device_info
            device_name = value
            device_info = {}
        else:
            device_info[key] = value
    # Store the last device section, which no 'Device' line follows.
    if device_name and device_name not in info:
        info[device_name] = device_info
    return info
1506
1507
def get_battery_percentage(self):
    """Get the battery percentage.

    The value is read from the 'percentage' detail of the 'Battery'
    device reported by `self.get_power_supply_info()`.

    @return: The battery level as a float. Return None if the battery
             info cannot be retrieved or parsed.
    """
    try:
        supply_info = self.get_power_supply_info()
        logging.info(supply_info)
        battery = supply_info['Battery']
        return float(battery['percentage'])
    except (KeyError, ValueError, error.AutoservRunError):
        return None
1520
1521
def is_ac_connected(self):
    """Check if the dut has power adapter connected and charging.

    The answer is the 'online' detail of the 'Line Power' device
    reported by `self.get_power_supply_info()`.

    @return: True if 'online' is 'yes', False for any other value, and
             None if the information cannot be retrieved.
    """
    try:
        line_power = self.get_power_supply_info()['Line Power']
        return line_power['online'] == 'yes'
    except (KeyError, error.AutoservRunError):
        return None
Dan Shi49ca0932014-11-14 11:22:27 -08001532
1533
def _cleanup_poweron(self):
    """Special cleanup method to make sure hosts always get power back.

    Does nothing unless the host's AFE record carries the
    `self._RPM_OUTLET_CHANGED` attribute.  Otherwise the host is powered
    on and the attribute is cleared.

    If powering on fails, the failure is logged and posted, and is then
    re-raised only when the battery percentage is known and below 50.
    When the failure is not re-raised, the attribute is still cleared if
    the power adapter is reported as connected.

    @raises rpm_client.RemotePowerException if power on failed and the
            battery level is below 50 percent.
    """
    afe = frontend_wrappers.RetryingAFE(timeout_min=5, delay_sec=10)
    hosts = afe.get_hosts(hostname=self.hostname)
    if not hosts or self._RPM_OUTLET_CHANGED not in hosts[0].attributes:
        return

    def clear_outlet_changed():
        """Remove the RPM-outlet-changed attribute from this host."""
        afe.set_host_attribute(self._RPM_OUTLET_CHANGED, None,
                               hostname=self.hostname)

    logging.debug('This host has recently interacted with the RPM'
                  ' Infrastructure. Ensuring power is on.')
    try:
        self.power_on()
        clear_outlet_changed()
    except rpm_client.RemotePowerException:
        logging.error('Failed to turn Power On for this host after '
                      'cleanup through the RPM Infrastructure.')
        autotest_es.post(
                type_str='RPM_poweron_failure',
                metadata={'hostname': self.hostname})

        battery_level = self.get_battery_percentage()
        if battery_level and battery_level < 50:
            raise
        elif self.is_ac_connected():
            logging.info('The device has power adapter connected and '
                         'charging. No need to try to turn RPM on '
                         'again.')
            clear_outlet_changed()
        logging.info('Battery level is now at %s%%. The device may '
                     'still have enough power to run test, so no '
                     'exception will be raised.', battery_level)
1566
Simran Basi5e6339a2013-03-21 11:34:32 -07001567
def _is_factory_image(self):
    """Checks if the image on the DUT is a factory image.

    The check tests for the file /root/.factory_test on the DUT; the
    command's exit status is inspected rather than raised on.

    @return: True if the image on the DUT is a factory image.
             False otherwise.
    """
    probe = self.run('[ -f /root/.factory_test ]', ignore_status=True)
    return probe.exit_status == 0
1576
1577
def _restart_ui(self):
    """Restart the Chrome UI.

    The Chrome session identifier is captured before the ui job is
    stopped and started, and is then handed to
    `cros_ui.wait_for_chrome_ready()`.

    @raises: FactoryImageCheckerException for factory images, since
             we cannot attempt to restart ui on them.
             error.AutoservRunError for any other type of error that
             occurs while restarting ui.
    """
    if self._is_factory_image():
        raise FactoryImageCheckerException(
                'Cannot restart ui on factory images')

    # TODO(jrbarnette): The command to stop/start the ui job
    # should live inside cros_ui, too.  However that would seem
    # to imply interface changes to the existing start()/restart()
    # functions, which is a bridge too far (for now).
    session_ident = cros_ui.get_chrome_session_ident(self)
    self.run('stop ui; start ui')
    cros_ui.wait_for_chrome_ready(session_ident, self)
beepsc87ff602013-07-31 21:53:00 -07001597
1598
def get_release_version(self):
    """Get the value of attribute CHROMEOS_RELEASE_VERSION from lsb-release.

    The lsb-release file is read from the DUT with `cat` and parsed by
    `lsbrelease_utils.get_chromeos_release_version()`.

    @returns The version string in lsb-release, under attribute
             CHROMEOS_RELEASE_VERSION.
    """
    cat_cmd = 'cat "%s"' % client_constants.LSB_RELEASE
    lsb_text = self.run(cat_cmd).stdout.strip()
    return lsbrelease_utils.get_chromeos_release_version(
            lsb_release_content=lsb_text)
1609
1610
def verify_cros_version_label(self):
    """Make sure host's cros-version label match the actual image in dut.

    Remove any cros-version: label that doesn't match that installed in
    the dut.  If at least one label was removed, the mismatch is posted
    via `autotest_es.post()` and an exception is raised.

    The DUT is only queried for its release version when the host has at
    least one cros-version label.

    @raise error.AutoservError: If any mismatch between cros-version label
                                and the build installed in dut is found.
    """
    labels = self._AFE.get_labels(
            name__startswith=ds_constants.VERSION_PREFIX,
            host__hostname=self.hostname)
    mismatch_found = False
    if labels:
        # Get CHROMEOS_RELEASE_VERSION from lsb-release, e.g., 6908.0.0.
        # Note that it's different from cros-version label, which has
        # builder and branch info, e.g.,
        # cros-version:peppy-release/R43-6908.0.0
        release_version = self.get_release_version()
        host_list = [self.hostname]
        for label in labels:
            # Remove any cros-version label that does not match
            # release_version.
            build_version = label.name[len(ds_constants.VERSION_PREFIX):]
            if not utils.version_match(build_version, release_version):
                logging.warning('cros-version label "%s" does not match '
                                'release version %s. Removing the label.',
                                label.name, release_version)
                label.remove_hosts(hosts=host_list)
                mismatch_found = True
    if mismatch_found:
        autotest_es.post(use_http=True,
                         type_str='cros_version_label_mismatch',
                         metadata={'hostname': self.hostname})
        raise error.AutoservError('The host has wrong cros-version label.')
Dan Shi549fb822015-03-24 18:01:11 -07001647 raise error.AutoservError('The host has wrong cros-version label.')
1648
1649
def cleanup(self):
    """Clean up the DUT after a job.

    Removes the paused-cleanup-logs marker file, then restarts the UI.
    If the UI cannot be restarted, the parent class cleanup runs
    instead.  Afterwards, hosts that have power control get their power
    state restored, and the cros-version label is verified.
    """
    paused_marker = client_constants.CLEANUP_LOGS_PAUSED_FILE
    self.run('rm -f %s' % paused_marker)
    try:
        self._restart_ui()
    except (error.AutotestRunError, error.AutoservRunError,
            FactoryImageCheckerException):
        logging.warning('Unable to restart ui, rebooting device.')
        # Since restarting the UI fails fall back to normal Autotest
        # cleanup routines, i.e. reboot the machine.
        super(CrosHost, self).cleanup()

    # Check if the rpm outlet was manipulated.
    if self.has_power():
        self._cleanup_poweron()

    self.verify_cros_version_label()
J. Richard Barnette45e93de2012-04-11 17:24:15 -07001664
1665
def reboot(self, **dargs):
    """Reboot the site host.

    The more generic RemoteHost.reboot() performs sync and sleeps for 5
    seconds. This is not necessary for Chrome OS devices as the
    sync should be finished in a short time during the reboot
    command.

    Unless the caller supplies them, a default 'reboot_cmd' (a plain
    reboot followed by a forced one after 'reboot_timeout' seconds,
    default 10) and 'fastsync'=True are filled in.  The board name is
    always passed on as 'board'.

    @param dargs: Keyword arguments forwarded to the parent reboot().
    """
    if 'reboot_cmd' not in dargs:
        force_delay = dargs.get('reboot_timeout', 10)
        dargs['reboot_cmd'] = ('sleep 1; '
                               'reboot & sleep %d; '
                               'reboot -f' % force_delay)
    # Enable fastsync to avoid running extra sync commands before reboot.
    dargs.setdefault('fastsync', True)

    # For purposes of logging reboot times:
    # Get the board name i.e. 'daisy_spring'
    board_label = self.get_board()

    # Strip the prefix and add it to dargs.
    dargs['board'] = board_label.split(':', 1)[-1]
    super(CrosHost, self).reboot(**dargs)
Yu-Ju Honga2be94a2012-07-31 09:48:52 -07001690
1691
def suspend(self, **dargs):
    """Suspend the site host.

    'timeout' is always set to the suspend time ('suspend_time', default
    60 seconds).  Unless the caller supplies 'suspend_cmd', a default
    command is built that resets the RTC wake alarm, arms it for the
    suspend time, and then asks powerd to suspend.

    @param dargs: Keyword arguments forwarded to the parent suspend().
    """
    duration = dargs.get('suspend_time', 60)
    dargs['timeout'] = duration
    if 'suspend_cmd' not in dargs:
        steps = [
                'echo 0 > /sys/class/rtc/rtc0/wakealarm',
                'echo +%d > /sys/class/rtc/rtc0/wakealarm' % duration,
                'powerd_dbus_suspend --delay=0']
        dargs['suspend_cmd'] = ' && '.join(steps)
    super(CrosHost, self).suspend(**dargs)
1704
1705
def upstart_status(self, service_name):
    """Check the status of an upstart init script.

    The remote pipeline ends in `grep`, which exits non-zero when the
    service is not in the start/running state.  The command is therefore
    run with ignore_status=True so that this case yields False instead
    of an exception from `self.run()`.

    @param service_name: Service to look up.

    @returns True if the service is running, False otherwise.
    """
    result = self.run('status %s | grep start/running' % service_name,
                      ignore_status=True)
    return result.stdout.strip() != ''
1715
1716
def verify_software(self):
    """Verify working software on a Chrome OS system.

    Verification is refused while crash-logs of a crashed job still
    wait to be collected.  Otherwise, tests for the following
    conditions:
     1. All conditions tested by the parent version of this
        function.
     2. Sufficient inodes in /mnt/stateful_partition; the threshold
        can be configured per board.
     3. Sufficient space in /mnt/stateful_partition.
     4. Sufficient space in /mnt/stateful_partition/encrypted, if
        that path exists.
     5. The system-services upstart job is running.
     6. update_engine answers a simple status request (skipped on
        factory images).
     7. python can import cPickle.
     8. The cros-version label matches the installed image.

    @raises error.AutoservCrashLogCollectRequired if crash-logs need to
            be collected first.
    @raises error.AutoservError if system services are not running.
    """
    # Check if a job was crashed on this host.
    # If yes, avoid verification until crash-logs are collected.
    if self._need_crash_logs():
        raise error.AutoservCrashLogCollectRequired(
                'Need to collect crash-logs before verification')

    super(CrosHost, self).verify_software()

    stateful_path = '/mnt/stateful_partition'

    # A board-specific inode requirement overrides the global one.
    global_kilo_inodes = CONFIG.get_config_value(
            'SERVER', 'kilo_inodes_required', type=int, default=100)
    board_name = self.get_board().replace(ds_constants.BOARD_PREFIX, '')
    required_kilo_inodes = CONFIG.get_config_value(
            'SERVER', 'kilo_inodes_required_%s' % board_name,
            type=int, default=global_kilo_inodes)
    self.check_inodes(stateful_path, required_kilo_inodes)

    required_gb = CONFIG.get_config_value(
            'SERVER', 'gb_diskspace_required', type=float,
            default=20.0)
    self.check_diskspace(stateful_path, required_gb)

    encrypted_stateful_path = '/mnt/stateful_partition/encrypted'
    # Not all targets build with encrypted stateful support.
    if self.path_exists(encrypted_stateful_path):
        required_encrypted_gb = CONFIG.get_config_value(
                'SERVER', 'gb_encrypted_diskspace_required', type=float,
                default=0.1)
        self.check_diskspace(encrypted_stateful_path,
                             required_encrypted_gb)

    if not self.upstart_status('system-services'):
        raise error.AutoservError('Chrome failed to reach login. '
                                  'System services not running.')

    # Factory images don't run update engine,
    # goofy controls dbus on these DUTs.
    if not self._is_factory_image():
        self.run('update_engine_client --status')
    # Makes sure python is present, loads and can use built in functions.
    # We have seen cases where importing cPickle fails with undefined
    # symbols in cPickle.so.
    self.run('python -c "import cPickle"')

    self.verify_cros_version_label()
Dan Shi549fb822015-03-24 18:01:11 -07001769 self.verify_cros_version_label()
1770
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07001771
def verify_hardware(self):
    """Verify hardware system of a Chrome OS system.

    Check following hardware conditions:
    1. Battery level.
    2. Is power adapter connected.

    Both conditions are only logged; nothing is raised here based on
    their values.
    """
    logging.info('Battery percentage: %s', self.get_battery_percentage())
    # Query once: each call runs a command on the DUT, and asking twice
    # could give two different answers for the same log message.
    ac_connected = self.is_ac_connected()
    if ac_connected is None:
        logging.info('Can not determine if the device has power adapter '
                     'connected.')
    else:
        logging.info('Device %s power adapter connected and charging.',
                     'has' if ac_connected else 'does not have')
Dan Shi49ca0932014-11-14 11:22:27 -08001786
1787
def make_ssh_command(self, user='root', port=22, opts='', hosts_file=None,
                     connect_timeout=None, alive_interval=None):
    """Override default make_ssh_command to use options tuned for Chrome OS.

    Tuning changes:
      - ConnectTimeout=30; maximum of 30 seconds allowed for an SSH
      connection failure.  Consistency with remote_access.sh.

      - ServerAliveInterval=900; which causes SSH to ping connection every
      900 seconds. In conjunction with ServerAliveCountMax ensures
      that if the connection dies, Autotest will bail out.
      Originally tried 60 secs, but saw frequent job ABORTS where
      the test completed successfully. Later increased from 180 seconds to
      900 seconds to account for tests where the DUT is suspended for
      longer periods of time.

      - ServerAliveCountMax=3; consistency with remote_access.sh.

      - ConnectionAttempts=4; reduce flakiness in connection errors;
      consistency with remote_access.sh.

      - UserKnownHostsFile=/dev/null; we don't care about the keys.
      Host keys change with every new installation, don't waste
      memory/space saving them.

      - SSH protocol forced to 2; needed for ServerAliveInterval.

    @param user User name to use for the ssh connection.
    @param port Port on the target host to use for ssh connection.
    @param opts Additional options to the ssh command.
    @param hosts_file Ignored.
    @param connect_timeout Ignored.
    @param alive_interval Ignored.

    @return The ssh command line as a single string.
    """
    template = ('/usr/bin/ssh -a -x %s %s %s'
                ' -o StrictHostKeyChecking=no'
                ' -o UserKnownHostsFile=/dev/null -o BatchMode=yes'
                ' -o ConnectTimeout=30 -o ServerAliveInterval=900'
                ' -o ServerAliveCountMax=3 -o ConnectionAttempts=4'
                ' -o Protocol=2 -l %s -p %d')
    fields = (self._ssh_verbosity_flag, self._ssh_options,
              opts, user, port)
    return template % fields
Fang Deng96667ca2013-08-01 17:46:18 -07001830
1831
def _setup_rpc(self, port, command_name, remote_pid=None):
    """Sets up a tunnel process and performs rpc connection book keeping.

    Chrome OS on the target closes down most external ports for security.
    We could open the port, but doing that would conflict with security
    tests that check that only expected ports are open.  So, to get to
    the port on the target we use an ssh tunnel.

    This method assumes that xmlrpc and jsonrpc never conflict, since
    we can only either have an xmlrpc or a jsonrpc server listening on
    a remote port. As such, it enforces a single proxy->remote port
    policy, i.e if one starts a jsonrpc proxy/server from port A->B,
    and then tries to start an xmlrpc proxy forwarded to the same port,
    the xmlrpc proxy will override the jsonrpc tunnel process, however:

    1. None of the methods on the xmlrpc proxy will work because
    the server listening on B is jsonrpc.

    2. The xmlrpc client cannot initiate a termination of the JsonRPC
    server, as the only use case currently is goofy, which is tied to
    the factory image. It is much easier to handle a failed xmlrpc
    call on the client than it is to terminate goofy in this scenario,
    as doing the latter might leave the DUT in a hard to recover state.

    With the current implementation newer rpc proxy connections will
    terminate the tunnel processes of older rpc connections tunneling
    to the same remote port. If methods are invoked on the client
    after this has happened they will fail with connection closed errors.

    @param port: The remote forwarding port.
    @param command_name: The name of the remote process, to terminate
                         using pkill.
    @param remote_pid: Recorded in the proxy map together with the
                       command name and tunnel process; presumably the
                       pid of the remote server process. Default None.

    @return A url that we can use to initiate the rpc connection.
    """
    # Drop any older connection that tunnels to the same remote port.
    self.rpc_disconnect(port)
    tunnel_port = utils.get_unused_port()
    tunnel = self._create_ssh_tunnel(port, tunnel_port)
    self._rpc_proxy_map[port] = (command_name, tunnel, remote_pid)
    return self._RPC_PROXY_URL % tunnel_port
1872
1873
def xmlrpc_connect(self, command, port, command_name=None,
                   ready_test_name=None, timeout_seconds=10,
                   logfile='/dev/null'):
    """Start an XMLRPC server on the host and return a client for it.

    `command` should be a simple shell command that serves XMLRPC
    on `port`; it must not daemonize and must exit cleanly on
    SIGTERM.  It is launched in the background on the host with
    its output redirected to `logfile`, an ssh tunnel to `port` is
    set up through `_setup_rpc()`, and a local
    `xmlrpclib.ServerProxy` pointed at the tunnel is returned.

    Whatever was previously registered for `port` is torn down
    first with `rpc_disconnect()`.

    Building the proxy does not contact the server.  Unless
    `ready_test_name` is given, the caller must verify on its own
    that the server is up and serving.  When `ready_test_name` is
    given, that no-argument method is invoked on the proxy under
    `retry.retry` (retrying on socket.error,
    xmlrpclib.ProtocolError and httplib.BadStatusLine) for up to
    `timeout_seconds`.  If the call never succeeds, the connection
    is torn down again and the exception propagates.
    NOTE(review): the exception type raised on timeout is decided
    by retry.retry, which is not visible here - confirm.

    @param command Shell command to start the server.
    @param port Port number on which the server is expected to
                be serving.
    @param command_name String to use as input to `pkill` to
            terminate the XMLRPC server on the host.
    @param ready_test_name String containing the name of a
            method defined on the XMLRPC server.
    @param timeout_seconds Number of seconds to wait for the
            server to become ready.
    @param logfile Logfile on the host that receives the output
            of `command`.

    @return The XMLRPC client proxy.

    """
    # Drop any server/tunnel still registered for this port; if the
    # caller believes the server is down, stale tunnels must go too.
    self.rpc_disconnect(port)

    # The redirection is required: 'ssh' does not return until the
    # background children have closed stdin, stdout, and stderr.
    server_pid = self.run_background('%s >%s 2>&1' % (command, logfile))
    logging.debug('Started XMLRPC server on host %s, pid = %s',
                  self.hostname, server_pid)

    # Reach the remote port through an ssh tunnel.
    tunnel_url = self._setup_rpc(port, command_name, remote_pid=server_pid)
    proxy = xmlrpclib.ServerProxy(tunnel_url, allow_none=True)

    if ready_test_name is not None:
        retriable_errors = (socket.error,
                            xmlrpclib.ProtocolError,
                            httplib.BadStatusLine)
        # retry.retry logs every attempt; scale the delay with the
        # timeout (clamped to 0.1s..1s) to keep the log readable.
        retry_delay = min(max(timeout_seconds / 20.0, 0.1), 1)

        @retry.retry(retriable_errors,
                     timeout_min=timeout_seconds / 60.0,
                     delay_sec=retry_delay)
        def ready_test():
            """Invoke the readiness method named by ready_test_name."""
            getattr(proxy, ready_test_name)()

        # A flag plus `finally` is used so that cleanup runs for any
        # kind of failure without touching the propagating exception.
        server_ready = False
        try:
            logging.info('Waiting %d seconds for XMLRPC server '
                         'to start.', timeout_seconds)
            ready_test()
            server_ready = True
        finally:
            if not server_ready:
                logging.error('Failed to start XMLRPC server.')
                self.rpc_disconnect(port)
    logging.info('XMLRPC server started successfully.')
    return proxy
J. Richard Barnette1d78b012012-05-15 13:56:30 -07001958
J. Richard Barnette1d78b012012-05-15 13:56:30 -07001959
def syslog(self, message, tag='autotest'):
    """Log a message to syslog on the host using `logger`.

    Both `tag` and `message` are shell-quoted before being placed
    on the command line, so quotes, `$`, backticks and similar
    characters are logged literally instead of being interpreted
    by the remote shell.  A `--` separator keeps a message that
    starts with `-` from being parsed as a `logger` option.

    @param message String message to log into syslog
    @param tag String tag prefix for syslog

    """
    # Local import keeps this working on both Python 2 (pipes.quote)
    # and Python 3 (shlex.quote) without touching file-level imports.
    try:
        from shlex import quote
    except ImportError:
        from pipes import quote
    # '%s' formatting first, so non-string arguments are accepted
    # exactly as they were by the previous implementation.
    quoted_tag = quote('%s' % (tag,))
    quoted_message = quote('%s' % (message,))
    self.run('logger -t %s -- %s' % (quoted_tag, quoted_message))
1968
1969
def jsonrpc_connect(self, port):
    """Create a jsonrpc proxy to the host through an ssh tunnel.

    This exists to talk to goofy (the default system manager on
    factory images).  Unlike xmlrpc_connect, no server is started
    on the host: the only clients are factory tests, for which
    goofy is built into the image and starts at boot.  Checking
    that the remote server is healthy is left to the caller.

    The tunnel is created by `_setup_rpc()`, which first
    disconnects any older tunnel registered for `port`, so that
    repeated calls do not leak tunnel processes.

    @param port: port on the remote host that is serving this proxy.

    @return: The client proxy, or None when jsonrpclib is not
             available.
    """
    if not jsonrpclib:
        logging.warning('Jsonrpclib could not be imported. Check that '
                        'site-packages contains jsonrpclib.')
        return None

    # No command name: there is no remote process for us to kill later.
    tunnel_url = self._setup_rpc(port, None)
    client = jsonrpclib.jsonrpc.ServerProxy(tunnel_url)

    logging.info('Established a jsonrpc connection through port %s.', port)
    return client
2000
2001
def rpc_disconnect(self, port):
    """Disconnect from an RPC server on the host.

    Terminates the remote RPC server previously started for
    the given `port`.  Also closes the local ssh tunnel created
    for the connection to the host.  This function does not
    directly alter the state of a previously returned RPC
    client object; however disconnection will cause all
    subsequent calls to methods on the object to fail.

    This function does nothing if requested to disconnect a port
    that was not previously connected via _setup_rpc.

    The local tunnel is always torn down, even when stopping the
    remote server fails.  In that failure case the entry for
    `port` is kept in `_rpc_proxy_map`, so a later call will try
    to stop the remote server again.

    @param port Port number passed to a previous call to
                `_setup_rpc()`.

    @exception TestError The remote server was still running
                         after _RPC_SHUTDOWN_TIMEOUT_SECONDS.
    """
    if port not in self._rpc_proxy_map:
        return
    remote_name, tunnel_proc, remote_pid = self._rpc_proxy_map[port]
    try:
        if remote_name:
            # We use 'pkill' to find our target process rather than
            # a PID, because the host may have rebooted since
            # connecting, and we don't want to kill an innocent
            # process with the same PID.
            #
            # 'pkill' helpfully exits with status 1 if no target
            # process is found, for which run() will throw an
            # exception.  We don't want that, so we ignore the
            # status.
            self.run("pkill -f '%s'" % remote_name, ignore_status=True)
            if remote_pid:
                logging.info('Waiting for RPC server "%s" shutdown',
                             remote_name)
                start_time = time.time()
                while (time.time() - start_time <
                       self._RPC_SHUTDOWN_TIMEOUT_SECONDS):
                    running_processes = self.run(
                            "pgrep -f '%s'" % remote_name,
                            ignore_status=True).stdout.split()
                    if remote_pid not in running_processes:
                        logging.info('Shut down RPC server.')
                        break
                    time.sleep(self._RPC_SHUTDOWN_POLLING_PERIOD_SECONDS)
                else:
                    # The loop ran out of time without seeing the
                    # server's pid disappear.
                    raise error.TestError('Failed to shutdown RPC server %s' %
                                          remote_name)
    finally:
        # Close the tunnel no matter how the remote shutdown went;
        # otherwise a failed shutdown leaks the local ssh process.
        if tunnel_proc.poll() is None:
            tunnel_proc.terminate()
            logging.debug('Terminated tunnel, pid %d', tunnel_proc.pid)
        else:
            logging.debug('Tunnel pid %d terminated early, status %d',
                          tunnel_proc.pid, tunnel_proc.returncode)
    del self._rpc_proxy_map[port]
J. Richard Barnette1d78b012012-05-15 13:56:30 -07002056
2057
def rpc_disconnect_all(self):
    """Disconnect all known RPC proxy ports.

    The ports are copied into a list before iterating, because
    rpc_disconnect() deletes entries from `_rpc_proxy_map` and a
    dictionary must not change size while it is being iterated.
    """
    for port in list(self._rpc_proxy_map):
        self.rpc_disconnect(port)
J. Richard Barnette1d78b012012-05-15 13:56:30 -07002062
2063
def poor_mans_rpc(self, fun):
    """
    Build a shell command that prints a client utils expression.

    The command changes into the `bin` directory below the path
    reported by Autotest.get_installed_autodir() and runs a Python
    one-liner that imports `common` and `utils` and prints
    `utils.<fun>`.  Nothing is executed here; the caller is
    expected to pass the returned string to run().

    @param fun expression in the client utils namespace, typically
               a call such as 'get_gpu_family()'.
    @return the shell command string.
    """
    autodir = autotest.Autotest.get_installed_autodir(self)
    pieces = [
        'cd %s/bin; ' % autodir,
        'python -c "import common; import utils;',
        'print utils.%s"' % fun,
    ]
    return ''.join(pieces)
2075
2076
def _ping_check_status(self, status):
    """Ping the host a single time and compare the outcome to `status`.

    A return value of 0 from utils.ping() counts as "the host
    answered".

    @param status Expected ping outcome to compare against.
    @return True iff `status` and the ping outcome agree (both
            True or both False).

    """
    host_answered = utils.ping(self.hostname, tries=1, deadline=1) == 0
    # XOR is true exactly when the two values disagree.
    return not (status ^ host_answered)
2087
def _ping_wait_for_status(self, status, timeout):
    """Poll with `ping` until the host reaches the given status.

    Polling stops after at most `timeout` seconds.  The pause
    between polls is chosen so that roughly _PING_WAIT_COUNT
    polls fit into `timeout`, capped at about one minute.

    @param status Stop waiting as soon as `ping` of the host
                  reports this status.
    @param timeout Poll for at most this many seconds.
    @return True iff the host status from `ping` matched the
            requested status at the time of return.

    """
    # A single _ping_check_status() call takes about one second,
    # which is why one second is taken off the pause.
    pause_secs = min(int(timeout / self._PING_WAIT_COUNT), 60) - 1
    deadline = time.time() + timeout
    while True:
        if time.time() > deadline:
            break
        if self._ping_check_status(status):
            return True
        if pause_secs > 0:
            time.sleep(pause_secs)

    # We may have just slept for a whole pause, so the previous
    # ping can be stale; take one final reading before answering.
    return self._ping_check_status(status)
2118
def ping_wait_up(self, timeout):
    """Wait until the host answers `ping`.

    N.B. This is not a reliable replacement for `wait_up()`: a
    host that answers ping does not necessarily answer ssh.  Only
    use it when the target DUT can be considered functional even
    if it can't be reached via ssh.

    @param timeout Minimum time to allow before declaring the
                   host to be non-responsive.
    @return True iff the host answered to ping before the timeout.

    """
    wanted_status = self._PING_STATUS_UP
    return self._ping_wait_for_status(wanted_status, timeout)
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07002134
def ping_wait_down(self, timeout):
    """Wait until the host stops answering `ping`.

    This can serve as a slightly faster variant of `wait_down()`,
    because it avoids potentially long ssh timeouts.

    @param timeout Minimum time to allow for the host to become
                   non-responsive.
    @return True iff the host quit answering ping before the
            timeout.

    """
    wanted_status = self._PING_STATUS_DOWN
    return self._ping_wait_for_status(wanted_status, timeout)
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07002148
Tom Wai-Hong Tamfced4f62014-04-17 10:56:30 +08002149 def test_wait_for_sleep(self, sleep_timeout=None):
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07002150 """Wait for the client to enter low-power sleep mode.
2151
2152 The test for "is asleep" can't distinguish a system that is
2153 powered off; to confirm that the unit was asleep, it is
2154 necessary to force resume, and then call
2155 `test_wait_for_resume()`.
2156
2157 This function is expected to be called from a test as part
2158 of a sequence like the following:
2159
2160 ~~~~~~~~
2161 boot_id = host.get_boot_id()
2162 # trigger sleep on the host
2163 host.test_wait_for_sleep()
2164 # trigger resume on the host
2165 host.test_wait_for_resume(boot_id)
2166 ~~~~~~~~
2167
Tom Wai-Hong Tamfced4f62014-04-17 10:56:30 +08002168 @param sleep_timeout time limit in seconds to allow the host sleep.
2169
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07002170 @exception TestFail The host did not go to sleep within
2171 the allowed time.
2172 """
Tom Wai-Hong Tamfced4f62014-04-17 10:56:30 +08002173 if sleep_timeout is None:
2174 sleep_timeout = self.SLEEP_TIMEOUT
2175
2176 if not self.ping_wait_down(timeout=sleep_timeout):
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07002177 raise error.TestFail(
Tom Wai-Hong Tamfced4f62014-04-17 10:56:30 +08002178 'client failed to sleep after %d seconds' % sleep_timeout)
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07002179
2180
Tom Wai-Hong Tamfced4f62014-04-17 10:56:30 +08002181 def test_wait_for_resume(self, old_boot_id, resume_timeout=None):
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07002182 """Wait for the client to resume from low-power sleep mode.
2183
2184 The `old_boot_id` parameter should be the value from
2185 `get_boot_id()` obtained prior to entering sleep mode. A
2186 `TestFail` exception is raised if the boot id changes.
2187
2188 See @ref test_wait_for_sleep for more on this function's
2189 usage.
2190
J. Richard Barnette7214e0b2013-02-06 15:20:49 -08002191 @param old_boot_id A boot id value obtained before the
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07002192 target host went to sleep.
Tom Wai-Hong Tamfced4f62014-04-17 10:56:30 +08002193 @param resume_timeout time limit in seconds to allow the host up.
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07002194
2195 @exception TestFail The host did not respond within the
2196 allowed time.
2197 @exception TestFail The host responded, but the boot id test
2198 indicated a reboot rather than a sleep
2199 cycle.
2200 """
Tom Wai-Hong Tamfced4f62014-04-17 10:56:30 +08002201 if resume_timeout is None:
2202 resume_timeout = self.RESUME_TIMEOUT
2203
2204 if not self.wait_up(timeout=resume_timeout):
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07002205 raise error.TestFail(
2206 'client failed to resume from sleep after %d seconds' %
Tom Wai-Hong Tamfced4f62014-04-17 10:56:30 +08002207 resume_timeout)
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07002208 else:
2209 new_boot_id = self.get_boot_id()
2210 if new_boot_id != old_boot_id:
Tom Wai-Hong Tam01792682015-01-06 08:00:46 +08002211 logging.error('client rebooted (old boot %s, new boot %s)',
2212 old_boot_id, new_boot_id)
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07002213 raise error.TestFail(
Tom Wai-Hong Tam01792682015-01-06 08:00:46 +08002214 'client rebooted, but sleep was expected')
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07002215
2216
Tom Wai-Hong Tamfe005c22014-12-03 09:25:44 +08002217 def test_wait_for_shutdown(self, shutdown_timeout=None):
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07002218 """Wait for the client to shut down.
2219
2220 The test for "has shut down" can't distinguish a system that
2221 is merely asleep; to confirm that the unit was down, it is
2222 necessary to force boot, and then call test_wait_for_boot().
2223
2224 This function is expected to be called from a test as part
2225 of a sequence like the following:
2226
2227 ~~~~~~~~
2228 boot_id = host.get_boot_id()
2229 # trigger shutdown on the host
2230 host.test_wait_for_shutdown()
2231 # trigger boot on the host
2232 host.test_wait_for_boot(boot_id)
2233 ~~~~~~~~
2234
Tom Wai-Hong Tamfe005c22014-12-03 09:25:44 +08002235 @param shutdown_timeout time limit in seconds to allow the host down.
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07002236 @exception TestFail The host did not shut down within the
2237 allowed time.
2238 """
Tom Wai-Hong Tamfe005c22014-12-03 09:25:44 +08002239 if shutdown_timeout is None:
2240 shutdown_timeout = self.SHUTDOWN_TIMEOUT
2241
2242 if not self.ping_wait_down(timeout=shutdown_timeout):
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07002243 raise error.TestFail(
2244 'client failed to shut down after %d seconds' %
Tom Wai-Hong Tamfe005c22014-12-03 09:25:44 +08002245 shutdown_timeout)
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07002246
2247
2248 def test_wait_for_boot(self, old_boot_id=None):
2249 """Wait for the client to boot from cold power.
2250
2251 The `old_boot_id` parameter should be the value from
2252 `get_boot_id()` obtained prior to shutting down. A
2253 `TestFail` exception is raised if the boot id does not
2254 change. The boot id test is omitted if `old_boot_id` is not
2255 specified.
2256
2257 See @ref test_wait_for_shutdown for more on this function's
2258 usage.
2259
J. Richard Barnette7214e0b2013-02-06 15:20:49 -08002260 @param old_boot_id A boot id value obtained before the
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07002261 shut down.
2262
2263 @exception TestFail The host did not respond within the
2264 allowed time.
2265 @exception TestFail The host responded, but the boot id test
2266 indicated that there was no reboot.
2267 """
J. Richard Barnetteeb69d722012-06-18 17:29:44 -07002268 if not self.wait_up(timeout=self.REBOOT_TIMEOUT):
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07002269 raise error.TestFail(
2270 'client failed to reboot after %d seconds' %
J. Richard Barnetteeb69d722012-06-18 17:29:44 -07002271 self.REBOOT_TIMEOUT)
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07002272 elif old_boot_id:
2273 if self.get_boot_id() == old_boot_id:
Tom Wai-Hong Tam01792682015-01-06 08:00:46 +08002274 logging.error('client not rebooted (boot %s)',
2275 old_boot_id)
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07002276 raise error.TestFail(
Tom Wai-Hong Tam01792682015-01-06 08:00:46 +08002277 'client is back up, but did not reboot')
Simran Basid5e5e272012-09-24 15:23:59 -07002278
2279
@staticmethod
def check_for_rpm_support(hostname):
    """Check whether a hostname follows the RPM-powered naming format.

    The hostname is matched (anchored at its start) against
    CrosHost._RPM_HOSTNAME_REGEX.

    @param hostname: hostname to check for rpm support.

    @return None if the hostname does not follow the naming format
            defined for RPM powered DUTs in the lab; otherwise the
            regular expression MatchObject for the hostname.
    """
    rpm_hostname_pattern = CrosHost._RPM_HOSTNAME_REGEX
    return re.match(rpm_hostname_pattern, hostname)
Simran Basid5e5e272012-09-24 15:23:59 -07002291
2292
def has_power(self):
    """Report whether this host's name marks it as RPM powered.

    @return The (truthy) MatchObject from check_for_rpm_support()
            when this host's hostname follows the RPM naming
            format, otherwise None.
    """
    rpm_match = CrosHost.check_for_rpm_support(self.hostname)
    return rpm_match
Simran Basid5e5e272012-09-24 15:23:59 -07002300
2301
def _set_power(self, state, power_method):
    """Switch power to the host via RPM, Servo or manual action.

    Any `power_method` other than the Servo and manual constants
    is handled as RPM.

    @param state Power state to set on the DUT, 'ON' or 'OFF'
                 (case-insensitive).
    @param power_method Specifies which method of power control to
                        use. By default "RPM" will be used. Valid values
                        are the strings "RPM", "manual", "servoj10".

    @exception TestError `state` is not an acceptable state.
    @exception TestFail RPM was requested but has_power() reports
                        that the host is not RPM powered.

    """
    valid_states = ['ON', 'OFF']
    if state.upper() not in valid_states:
        raise error.TestError('State must be one of: %s.'
                              % (valid_states,))

    if power_method == self.POWER_CONTROL_SERVO:
        logging.info('Setting servo port J10 to %s', state)
        self.servo.set('prtctl3_pwren', state.lower())
        time.sleep(self._USB_POWER_TIMEOUT)
        return

    if power_method == self.POWER_CONTROL_MANUAL:
        # Nothing is switched here; just give the operator time to act.
        logging.info('You have %d seconds to set the AC power to %s.',
                     self._POWER_CYCLE_TIMEOUT, state)
        time.sleep(self._POWER_CYCLE_TIMEOUT)
        return

    # Everything else goes through the RPM.
    if not self.has_power():
        raise error.TestFail('DUT does not have RPM connected.')
    afe = frontend_wrappers.RetryingAFE(timeout_min=5, delay_sec=10)
    # Record on the host that its outlet state was changed.
    afe.set_host_attribute(self._RPM_OUTLET_CHANGED, True,
                           hostname=self.hostname)
    rpm_client.set_power(self.hostname, state.upper(), timeout_mins=5)
Simran Basid5e5e272012-09-24 15:23:59 -07002332
2333
def power_off(self, power_method=POWER_CONTROL_RPM):
    """Cut power to this host via RPM, Servo or manual action.

    Thin wrapper that asks _set_power() for the 'OFF' state.

    @param power_method Specifies which method of power control to
                        use. By default "RPM" will be used. Valid values
                        are the strings "RPM", "manual", "servoj10".

    """
    target_state = 'OFF'
    self._set_power(target_state, power_method)
Simran Basid5e5e272012-09-24 15:23:59 -07002343
2344
def power_on(self, power_method=POWER_CONTROL_RPM):
    """Restore power to this host via RPM, Servo or manual action.

    Thin wrapper that asks _set_power() for the 'ON' state.

    @param power_method Specifies which method of power control to
                        use. By default "RPM" will be used. Valid values
                        are the strings "RPM", "manual", "servoj10".

    """
    target_state = 'ON'
    self._set_power(target_state, power_method)
2354
2355
def power_cycle(self, power_method=POWER_CONTROL_RPM):
    """Cycle power to this host by turning it OFF, then ON.

    For Servo and manual control the cycle is done locally as
    power_off(), a pause of _POWER_CYCLE_TIMEOUT seconds, then
    power_on().  For every other method a single 'CYCLE' request
    is sent to the RPM client.

    @param power_method Specifies which method of power control to
                        use. By default "RPM" will be used. Valid values
                        are the strings "RPM", "manual", "servoj10".

    """
    locally_cycled = (self.POWER_CONTROL_SERVO,
                      self.POWER_CONTROL_MANUAL)
    if power_method not in locally_cycled:
        rpm_client.set_power(self.hostname, 'CYCLE')
        return

    self.power_off(power_method=power_method)
    time.sleep(self._POWER_CYCLE_TIMEOUT)
    self.power_on(power_method=power_method)
Simran Basic6f1f7a2012-10-16 10:47:46 -07002371
2372
def get_platform(self):
    """Work out the platform label for this host from its fwid.

    @returns a string representing this host's platform.
    """
    crossystem = utils.Crossystem(self)
    crossystem.init()
    # The fwid generally looks like {platform}.{firmware version},
    # e.g. Alex.X.YYY.Z or Google_Alex.X.YYY.Z; the part before the
    # first dot is the platform id.
    firmware_id = crossystem.fwid()
    platform_id = firmware_id.split('.')[0].lower()
    # Newer platforms carry a 'Google_' prefix, older ones do not.
    return platform_id.replace('google_', '')
2386
2387
def get_architecture(self):
    """Work out the architecture label for this host.

    The value is whatever crossystem reports as `arch` for the host.

    @returns a string representing this host's architecture.
    """
    host_crossystem = utils.Crossystem(self)
    host_crossystem.init()
    architecture = host_crossystem.arch()
    return architecture
2396
2397
def get_chrome_version(self):
    """Get the Chrome version number and milestone as strings.

    Runs client_constants.CHROME_VERSION_COMMAND on the host and
    hands its output to utils.parse_chrome_version().

    @return A tuple (chrome_ver, milestone) where "chrome_ver" is the
            current Chrome version number as a string (in the form "W.X.Y.Z")
            and "milestone" is the first component of the version number
            (the "W" from "W.X.Y.Z").  If the version number cannot be parsed
            in the "W.X.Y.Z" format, the "chrome_ver" will be the full output
            of "chrome --version" and the milestone will be the empty string.

    """
    version_result = self.run(client_constants.CHROME_VERSION_COMMAND)
    return utils.parse_chrome_version(version_result.stdout)
2413
@label_decorator()
def get_board(self):
    """Work out the board label for this host.

    The board name is read from CHROMEOS_RELEASE_BOARD in
    /etc/lsb-release on the host and prefixed with
    ds_constants.BOARD_PREFIX.

    @returns a string representing this host's board.
    """
    release_info = utils.parse_cmd_output('cat /etc/lsb-release',
                                          run_method=self.run)
    board = release_info['CHROMEOS_RELEASE_BOARD']
    label_format = ds_constants.BOARD_PREFIX + '%s'
    # Lab devices usually report the plain board name, but development
    # devices report {board_name}-signed-{key_type}.  Keep only the
    # leading component, or the leading two when the name contains
    # 'x86' (e.g. an 'x86-' prefix that belongs to the board name).
    name_parts = board.split('-')
    parts_to_keep = 2 if 'x86' in board else 1
    return label_format % '-'.join(name_parts[:parts_to_keep])
Simran Basic6f1f7a2012-10-16 10:47:46 -07002430
2431
@label_decorator('board_freq_mem')
def get_board_with_frequency_and_memory(self):
    """
    Determine the board name together with frequency and memory.

    The value is obtained by running the client utils function
    get_board_with_frequency_and_memory() on the host.

    @returns a more detailed string representing the board. Examples are
    butterfly_1.1GHz_2GB, link_1.8GHz_4GB, x86-zgb_1.7GHz_2GB
    """
    remote_script = self.poor_mans_rpc(
            'get_board_with_frequency_and_memory()')
    detailed_board = self.run(remote_script).stdout
    return 'board_freq_mem:%s' % str.strip(detailed_board)
2443
2444
@label_decorator('lightsensor')
def has_lightsensor(self):
    """Detect whether this host has a light sensor.

    Searches _LIGHTSENSOR_SEARCH_DIR on the host (following
    symlinks, at most four levels deep) for any of the names in
    _LIGHTSENSOR_FILES.

    @returns the string 'lightsensor' if this host has a lightsensor or
    None if it does not.
    """
    search_dir = self._LIGHTSENSOR_SEARCH_DIR
    name_pattern = '|'.join(self._LIGHTSENSOR_FILES)
    search_cmd = "find -L %s -maxdepth 4 | egrep '%s'" % (
            search_dir, name_pattern)
    try:
        # Symlinks are followed, so there may be a symlink loop; the
        # command still works but prints a few messages to stderr,
        # hence stderr_tee=None.
        self.run(search_cmd, stdout_tee=None, stderr_tee=None)
    except error.AutoservRunError:
        # egrep exited with status 1: none of the candidate
        # lightsensor files exist.
        return None
    return 'lightsensor'
2464
2465
@label_decorator('bluetooth')
def has_bluetooth(self):
    """Detect whether this host has bluetooth.

    The check is whether /sys/class/bluetooth/hci0 exists as a
    directory on the host.

    @returns the string 'bluetooth' if this host has bluetooth or
    None if it does not.
    """
    try:
        self.run('test -d /sys/class/bluetooth/hci0')
    except error.AutoservRunError:
        # 'test' exited non-zero: the directory does not exist.
        return None
    # 'test' exited with status 0.
    return 'bluetooth'
2481
2482
@label_decorator('gpu_family')
def get_gpu_family(self):
    """
    Determine the GPU family of this host.

    The value is obtained by running the client utils function
    get_gpu_family() on the host.

    @returns a string representing the gpu family. Examples are mali, tegra,
    pinetrail, sandybridge, ivybridge, haswell and baytrail.
    """
    remote_script = self.poor_mans_rpc('get_gpu_family()')
    family = self.run(remote_script).stdout
    return 'gpu_family:%s' % str.strip(family)
2493
2494
@label_decorator('graphics')
def get_graphics(self):
    """
    Determine the graphics label for this host.

    The decision is based only on the output of `uname -a`: when it
    contains 'arm' the host is labelled graphics:gles, otherwise
    graphics:gl.  This may change over time, but for robustness
    reasons it deliberately avoids executing code in the actual
    graphics libraries (which may not be ready and are tested by
    graphics_GLAPICheck).

    @returns a string representing this host's graphics.
    """
    kernel_info = self.run('uname -a').stdout.lower()
    return 'graphics:gles' if 'arm' in kernel_info else 'graphics:gl'
2510
2511
@label_decorator('ec')
def get_ec(self):
    """
    Determine the type of EC on this host.

    @returns a string representing this host's embedded controller type.
    At present, it only returns "ec:cros", for Chrome OS ECs. Other types
    of EC (or none) return None, since no tests depend on those.
    """
    cmd = 'mosys ec info'
    # The last field of the output is expected to follow the Chrome OS
    # EC version scheme, for example:
    #
    #   stm | stm32f100 | snow_v1.3.139-375eb9f
    #   ti | Unknown-10de | peppy_v1.5.114-5d52788
    #
    # Non-Chrome OS ECs produce output like:
    #
    #   ENE | KB932 | 00BE107A00
    #   ite | it8518 | 3.08
    #
    # Some systems have no EC at all (Lumpy, for example).
    regexp = r'^.*\|\s*(\S+_v\d+\.\d+\.\d+-[0-9a-f]+)\s*$'

    ecinfo = self.run(command=cmd, ignore_status=True)
    if ecinfo.exit_status != 0:
        logging.info("%s exited with status %d", cmd, ecinfo.exit_status)
        # No EC present
        return None

    version_match = re.search(regexp, ecinfo.stdout)
    if not version_match:
        logging.info("%s got: %s", cmd, ecinfo.stdout)
        # Has an EC, but it's not a Chrome OS EC
        return None

    logging.info("EC version is %s", version_match.groups()[0])
    return 'ec:cros'
2549
2550
@label_decorator('accels')
def get_accels(self):
    """
    Determine the type of accelerometers on this host.

    Three checks are made in turn: `ectool` is installed, the EC
    accepts the `motionsense` command, and the first line printed
    by `ectool motionsense active` is not "0".

    @returns a string representing this host's accelerometer type.
    At present, it only returns "accel:cros-ec", for accelerometers
    attached to a Chrome OS EC, or None, if no accelerometers.
    """
    # ectool has to be present at all.
    if self.run('which ectool', ignore_status=True).exit_status:
        logging.info("No ectool cmd found, assuming no EC accelerometers")
        return None

    # The EC has to understand the motionsense command.
    if self.run('ectool motionsense', ignore_status=True).exit_status:
        logging.info("EC does not support motionsense command "
                     "assuming no EC accelerometers")
        return None

    # The EC motion sensors have to be active.
    first_line = self.run('ectool motionsense active').stdout.split('\n')[0]
    if first_line == "0":
        logging.info("Motion sense inactive, assuming no EC accelerometers")
        return None

    logging.info("EC accelerometers found")
    return 'accel:cros-ec'
2581
2582
@label_decorator('chameleon')
def has_chameleon(self):
    """Report whether a Chameleon is connected to this host.

    @returns a list containing two strings ('chameleon' and
             'chameleon:' + label, e.g. 'chameleon:hdmi') if this host
             has a Chameleon or None if it has not.
    """
    if not self._chameleon_host:
        return None
    specific_label = 'chameleon:' + self.chameleon.get_label()
    return ['chameleon', specific_label]
2595
2596
Cheng-Yi Chiangf4104ff2014-12-23 19:39:01 +08002597 @label_decorator('audio_loopback_dongle')
def has_loopback_dongle(self):
    """Report whether an audio loopback dongle is plugged into this host.

    The command from cras_utils.get_cras_nodes_cmd() is run on the host
    (failures ignored) and its output is handed to
    cras_utils.node_type_is_plugged() for the 'HEADPHONE' and 'MIC' node
    types, in that order.

    @returns 'audio_loopback_dongle' when both node types are reported as
             plugged; None otherwise.
    """
    nodes_cmd = cras_utils.get_cras_nodes_cmd()
    nodes_info = self.run(command=nodes_cmd, ignore_status=True).stdout
    # all() over a generator stops at the first unplugged node type, the
    # same way a chained `and` would.
    both_plugged = all(cras_utils.node_type_is_plugged(node_type, nodes_info)
                       for node_type in ('HEADPHONE', 'MIC'))
    if both_plugged:
        return 'audio_loopback_dongle'
    return None
2613
2614
Derek Basehorec71ff622014-07-07 15:18:40 -07002615 @label_decorator('power_supply')
def get_power_supply(self):
    """
    Classify the power supply of this host using `mosys psu type`.

    @returns a string built as 'power:' + the stripped command output,
             for example:
             'power:battery'    when the device has a battery intended for
                                extended use
             'power:AC_primary' when the device has a battery not intended
                                for extended use (for moving the machine,
                                etc)
             'power:AC_only'    when the device has no battery at all.
             'power:battery' is also returned when the command exits
             non-zero, and None when the command prints 'unknown'.
    """
    result = self.run(command='mosys psu type', ignore_status=True)
    if result.exit_status:
        # Not every platform ships the mosys psu command; when it is
        # missing we assume the device has a battery.
        return 'power:battery'

    psu_type = result.stdout.strip()
    return None if psu_type == 'unknown' else 'power:%s' % psu_type
2639
2640
Puthikorn Voravootivatfa011242014-03-14 18:45:11 -07002641 @label_decorator('storage')
def get_storage(self):
    """
    Determine the type of boot device for this host.

    Determine if the internal device is SCSI or dw_mmc device.
    Then check that it is SSD or HDD or eMMC or something else.

    All probing commands are run with ignore_status=True; any command that
    exits non-zero is logged and results in None.

    @returns a string representing this host's internal device type.
             'storage:ssd' when internal device is solid state drive
             'storage:hdd' when internal device is hard disk drive
             'storage:mmc' when internal device is mmc drive
             None          When internal device is something else or
                           when we are unable to determine the type
    """
    # The output should be /dev/mmcblk* for SD/eMMC or /dev/sd* for scsi
    rootdev_cmd = ' '.join(['. /usr/sbin/write_gpt.sh;',
                            '. /usr/share/misc/chromeos-common.sh;',
                            'load_base_vars;',
                            'get_fixed_dst_drive'])
    rootdev = self.run(command=rootdev_cmd, ignore_status=True)
    if rootdev.exit_status:
        logging.info("Fail to run %s", rootdev_cmd)
        return None

    # Every check below works on the stripped device path, so stray
    # whitespace around the command output cannot defeat the anchored
    # re.match() calls.
    rootdev_str = rootdev.stdout.strip()
    if not rootdev_str:
        return None

    rootdev_base = os.path.basename(rootdev_str)

    if re.match('/dev/mmcblk[0-9]', rootdev_str):
        # Use type to determine if the internal device is eMMC or
        # something else. We can assume that MMC is always an internal
        # device.
        type_cmd = 'cat /sys/block/%s/device/type' % rootdev_base
        device_type = self.run(command=type_cmd, ignore_status=True)
        if device_type.exit_status:
            logging.info("Fail to run %s", type_cmd)
            return None

        if device_type.stdout.strip() == 'MMC':
            return 'storage:mmc'

    if re.match('/dev/sd[a-z]+', rootdev_str):
        # Read symlink for /sys/block/sd* to determine if the internal
        # device is connected via ata or usb.
        link_cmd = 'readlink /sys/block/%s' % rootdev_base
        link = self.run(command=link_cmd, ignore_status=True)
        if link.exit_status:
            logging.info("Fail to run %s", link_cmd)
            return None
        if 'usb' in link.stdout.strip():
            # A USB-attached disk is not reported as internal storage.
            return None

        # Read rotation to determine if the internal device is ssd or hdd.
        rotate_cmd = 'cat /sys/block/%s/queue/rotational' % rootdev_base
        rotate = self.run(command=rotate_cmd, ignore_status=True)
        if rotate.exit_status:
            logging.info("Fail to run %s", rotate_cmd)
            return None

        rotate_dict = {'0': 'storage:ssd', '1': 'storage:hdd'}
        # Any other rotational value yields None.
        return rotate_dict.get(rotate.stdout.strip())

    # All other internal device / error case will always fall here
    return None
2713
2714
Dan Shi4e9a2aa2014-03-24 14:28:42 -07002715 @label_decorator('servo')
def get_servo(self):
    """Report whether this host has a servo attached.

    A host with a working servo attached should carry the servo label.
    The decision is based solely on the truthiness of self._servo_host.

    @return: string 'servo' if self._servo_host is set. Otherwise,
             returns None.
    """
    if self._servo_host:
        return 'servo'
    return None
2725
2726
Dan Shi5beba472014-05-28 22:46:07 -07002727 @label_decorator('video_labels')
def get_video_labels(self):
    """Run /usr/local/bin/avtest_label_detect to get a list of video labels.

    Sample output of avtest_label_detect:
    Detected label: hw_video_acc_vp8
    Detected label: webcam

    Only lines that consist entirely of 'Detected label: <word>' contribute
    a label; every other output line is ignored.

    @return: A list of labels detected by tool avtest_label_detect, or an
             empty list when running the tool raises
             error.AutoservRunError.
    """
    # Only the remote command can raise AutoservRunError, so keep the
    # parsing outside the try block.
    try:
        result = self.run('/usr/local/bin/avtest_label_detect').stdout
    except error.AutoservRunError:
        # The tool is not installed.
        return []
    # Raw string: '\w' must reach the regex engine untouched rather than
    # being treated as a (invalid) string escape.
    return re.findall(r'^Detected label: (\w+)$', result, re.M)
2743
2744
mussa584b4462014-06-20 15:13:28 -07002745 @label_decorator('video_glitch_detection')
def is_video_glitch_detection_supported(self):
    """ Determine if a board under test is supported for video glitch
    detection tests.

    The board name (self.get_board() with ds_constants.BOARD_PREFIX
    removed) is looked up among the section names of
    client/cros/video/device_spec.conf under common.autotest_dir.

    @return: 'video_glitch_detection' if board is supported, None otherwise
             (including when the conf file cannot be parsed).
    """
    parser = ConfigParser.SafeConfigParser()
    filename = os.path.join(
            common.autotest_dir, 'client/cros/video/device_spec.conf')

    dut = self.get_board().replace(ds_constants.BOARD_PREFIX, '')

    try:
        parser.read(filename)
    except ConfigParser.Error:
        # Something went wrong while parsing the conf file.
        # ConfigParser.Error is the base class of the module's
        # exceptions; the module has no lowercase `error` attribute.
        return None

    supported_boards = parser.sections()
    return 'video_glitch_detection' if dut in supported_boards else None
2767
Katherine Threlkeld7b97a9f2014-06-24 13:47:14 -07002768 @label_decorator('touch_labels')
def get_touch(self):
    """
    Determine whether board under test has a touchpad or touchscreen.

    Each /dev/input/event* node on the host is dumped with `evtest` (given
    a one second timeout, timeouts ignored) into a scratch file, and the
    dump is classified by InputPlayback._determine_input_type().  Scanning
    stops early once both kinds have been seen; the scratch file is removed
    afterwards.

    @return: A list of some combination of 'touchscreen' and 'touchpad',
             depending on what is present on the device.

    """
    found = []
    still_wanted = ['touchpad', 'touchscreen']
    player = input_playback.InputPlayback()
    event_nodes = self.run('ls /dev/input/event*').stdout.strip().split()
    scratch_file = '/tmp/touch_labels'
    for node in event_nodes:
        self.run('evtest %s > %s' % (node, scratch_file), timeout=1,
                 ignore_timeout=True)
        dump = self.run('cat %s' % scratch_file).stdout
        kind = player._determine_input_type(dump)
        if kind not in still_wanted:
            continue
        found.append(kind)
        still_wanted.remove(kind)
        if not still_wanted:
            # Both device kinds are accounted for.
            break
    self.run('rm %s' % scratch_file)

    return found
2795
Hung-ying Tyana39b0542015-06-30 10:36:42 +08002796
2797 @label_decorator('internal_display')
def has_internal_display(self):
    """Determine if the device under test is equipped with an internal
    display.

    The answer comes from the client-side helper
    graphics_utils.has_internal_display().  While it runs,
    utils.system_output and common_utils.read_file are temporarily replaced
    with versions that go through self.run() on this host; the originals
    are restored afterwards even if the helper raises.

    @return: 'internal_display' if one is present; None otherwise.
    """
    from autotest_lib.client.cros.graphics import graphics_utils
    from autotest_lib.client.common_lib import utils as common_utils

    def remote_system_output(cmd):
        return self.run(cmd).stdout

    def remote_read_file(remote_path):
        return self.run('cat %s' % remote_path).stdout

    # Hijack the necessary client functions so that we can take advantage
    # of the client lib here.
    # FIXME: find a less hacky way than this
    saved_system_output = utils.system_output
    saved_read_file = common_utils.read_file
    utils.system_output = remote_system_output
    common_utils.read_file = remote_read_file
    try:
        if graphics_utils.has_internal_display():
            return 'internal_display'
        return None
    finally:
        # Always undo the monkey patching.
        utils.system_output = saved_system_output
        common_utils.read_file = saved_read_file
2826
2827
Eric Carusoee673ac2015-08-05 17:03:04 -07002828 @label_decorator('lucidsleep')
def has_lucid_sleep_support(self):
    """Determine if the device under test has support for lucid sleep.

    The board name is self.get_board() with ds_constants.BOARD_PREFIX
    removed; it is checked for membership in LUCID_SLEEP_BOARDS.

    @return 'lucidsleep' if this board supports lucid sleep; None otherwise
    """
    board_name = self.get_board().replace(ds_constants.BOARD_PREFIX, '')
    if board_name in LUCID_SLEEP_BOARDS:
        return 'lucidsleep'
    return None
2836
2837
def get_labels(self):
    """Return a list of labels for this given host.

    This is the main way to retrieve all the automatic labels for a host
    as it will run through all the currently implemented label functions
    (self._LABEL_FUNCTIONS), calling each with this host as its argument.

    A label function may return a string (appended as one label), a list
    (each element added as a label), or a falsy value (ignored).  A label
    function that raises is logged and skipped so that one broken detector
    cannot prevent the remaining labels from being collected.

    @return: A flat list of label strings.
    """
    labels = []
    for label_function in self._LABEL_FUNCTIONS:
        try:
            label = label_function(self)
        except Exception as e:
            logging.error('Label function %s failed; ignoring it.',
                          label_function.__name__)
            logging.exception(e)
            continue
        if not label:
            continue
        # isinstance rather than an exact type() comparison, so that
        # subclasses of str / list are not silently dropped.
        if isinstance(label, str):
            labels.append(label)
        elif isinstance(label, list):
            labels.extend(label)
    return labels
Dan Shi85276d42014-04-08 22:11:45 -07002859
2860
def is_boot_from_usb(self):
    """Check if DUT is boot from USB.

    The root device is obtained with `rootdev -s -d`, and the `removable`
    attribute of that block device under /sys/block is read and parsed as
    an integer.

    @return: True if the removable attribute of the root device is 1.
    """
    root_device = self.run('rootdev -s -d').stdout.strip()
    block_name = os.path.basename(root_device)
    flag_text = self.run('cat /sys/block/%s/removable' %
                         block_name).stdout.strip()
    return int(flag_text) == 1
Helen Zhang17dae2b2014-11-11 09:25:52 -08002870
2871
def read_from_meminfo(self, key):
    """Return a memory figure from /proc/meminfo

    The host's /proc/meminfo is grepped for key and the first run of
    digits in the (stripped) output is taken as the value.

    @param key: meminfo requested

    @return the first number found in the matching output, as an int

    """
    matched_text = self.run('grep %s /proc/meminfo' % key).stdout.strip()
    logging.debug('%s', matched_text)
    first_number = re.search(r'\d+', matched_text)
    return int(first_number.group(0))
Rohit Makasana8a4923c2015-08-13 17:04:26 -07002883
2884
def get_board_type(self):
    """
    Get the DUT's device type from /etc/lsb-release.
    DEVICETYPE can be one of CHROMEBOX, CHROMEBASE, CHROMEBOOK or more.

    The file is grepped for DEVICETYPE (failures ignored) and whatever
    follows the last '=' in the output is returned with surrounding
    whitespace removed.

    @return value of DEVICETYPE param from lsb-release, or '' when grep
            produced no output.
    """
    grep_output = self.run('grep DEVICETYPE /etc/lsb-release',
                           ignore_status=True).stdout
    if not grep_output:
        return ''
    return grep_output.rpartition('=')[2].strip()