blob: bb551d0d11f3e3282ccb02596b2083489de6c860 [file] [log] [blame]
J. Richard Barnette24adbf42012-04-11 15:04:53 -07001# Copyright (c) 2012 The Chromium OS Authors. All rights reserved.
Dale Curtisaa5eedb2011-08-23 16:18:52 -07002# Use of this source code is governed by a BSD-style license that can be
3# found in the LICENSE file.
4
mussa584b4462014-06-20 15:13:28 -07005import ConfigParser
Aviv Keshet74c89a92013-02-04 15:18:30 -08006import functools
Christopher Wiley0ed712b2013-04-09 15:25:12 -07007import httplib
J. Richard Barnette1d78b012012-05-15 13:56:30 -07008import logging
Dan Shi0f466e82013-02-22 15:44:58 -08009import os
Simran Basid5e5e272012-09-24 15:23:59 -070010import re
Christopher Wileyd78249a2013-03-01 13:05:31 -080011import socket
J. Richard Barnette1d78b012012-05-15 13:56:30 -070012import subprocess
J. Richard Barnette134ec2c2012-04-25 12:59:37 -070013import time
J. Richard Barnette1d78b012012-05-15 13:56:30 -070014import xmlrpclib
J. Richard Barnette134ec2c2012-04-25 12:59:37 -070015
mussa584b4462014-06-20 15:13:28 -070016import common
J. Richard Barnette45e93de2012-04-11 17:24:15 -070017from autotest_lib.client.bin import utils
Dan Shi9cb0eec2014-06-03 09:04:50 -070018from autotest_lib.client.common_lib import autotemp
Richard Barnette0c73ffc2012-11-19 15:21:18 -080019from autotest_lib.client.common_lib import error
20from autotest_lib.client.common_lib import global_config
Dan Shi549fb822015-03-24 18:01:11 -070021from autotest_lib.client.common_lib import lsbrelease_utils
J. Richard Barnette45e93de2012-04-11 17:24:15 -070022from autotest_lib.client.common_lib.cros import autoupdater
Richard Barnette03a0c132012-11-05 12:40:35 -080023from autotest_lib.client.common_lib.cros import dev_server
Christopher Wileyd78249a2013-03-01 13:05:31 -080024from autotest_lib.client.common_lib.cros import retry
Gabe Blackb72f4fb2015-01-20 16:47:13 -080025from autotest_lib.client.common_lib.cros.graphite import autotest_es
Gabe Black1e1c41b2015-02-04 23:55:15 -080026from autotest_lib.client.common_lib.cros.graphite import autotest_stats
MK Ryu35d661e2014-09-25 17:44:10 -070027from autotest_lib.client.cros import constants as client_constants
J. Richard Barnette84890bd2014-02-21 11:05:47 -080028from autotest_lib.client.cros import cros_ui
Cheng-Yi Chiangf4104ff2014-12-23 19:39:01 +080029from autotest_lib.client.cros.audio import cras_utils
Katherine Threlkeldab83d392015-06-18 16:45:57 -070030from autotest_lib.client.cros.input_playback import input_playback
MK Ryu35d661e2014-09-25 17:44:10 -070031from autotest_lib.server import autoserv_parser
32from autotest_lib.server import autotest
33from autotest_lib.server import constants
34from autotest_lib.server import crashcollect
Dan Shia1ecd5c2013-06-06 11:21:31 -070035from autotest_lib.server import utils as server_utils
Dan Shi9cb0eec2014-06-03 09:04:50 -070036from autotest_lib.server.cros import provision
Scott Zawalski89c44dd2013-02-26 09:28:02 -050037from autotest_lib.server.cros.dynamic_suite import constants as ds_constants
Simran Basi5e6339a2013-03-21 11:34:32 -070038from autotest_lib.server.cros.dynamic_suite import tools, frontend_wrappers
Dan Shi9cb0eec2014-06-03 09:04:50 -070039from autotest_lib.server.cros.faft.config.config import Config as FAFTConfig
Fang Deng96667ca2013-08-01 17:46:18 -070040from autotest_lib.server.hosts import abstract_ssh
Tom Wai-Hong Tamefe1c7f2014-01-02 14:00:11 +080041from autotest_lib.server.hosts import chameleon_host
Fang Deng5d518f42013-08-02 14:04:32 -070042from autotest_lib.server.hosts import servo_host
Simran Basidcff4252012-11-20 16:13:20 -080043from autotest_lib.site_utils.rpm_control_system import rpm_client
Simran Basid5e5e272012-09-24 15:23:59 -070044
45
beeps32a63082013-08-22 14:02:29 -070046try:
47 import jsonrpclib
48except ImportError:
49 jsonrpclib = None
Fang Deng96667ca2013-08-01 17:46:18 -070050
Fang Dengd1c2b732013-08-20 12:59:46 -070051
class FactoryImageCheckerException(error.AutoservError):
    """Signals that the image being checked is a factory image."""
55
56
def add_label_detector(label_function_list, label_list=None, label=None):
    """Build a decorator that registers a function as a label detector.

    The returned decorator appends the decorated function to
    `label_function_list` and hands the function back unchanged.  When
    `label` is non-empty and `label_list` is not None, `label` is also
    appended to `label_list`.

    @param label_function_list: List of label detecting functions to add
                                the decorated function to.
    @param label_list: List of detectable labels to append `label` to.
                       (Default: None)
    @param label: Label string that is detectable by the decorated
                  function. (Default: None)

    @returns the decorator described above.
    """
    def register(func):
        """Record `func` (and the label, if any) and return `func`.

        @param func: The function to be added as a detector.
        """
        label_function_list.append(func)
        # Nothing more to record without both a label and a list for it.
        if label_list is None or not label:
            return func
        label_list.append(label)
        return func

    return register
75
76
Fang Deng0ca40e22013-08-27 17:47:44 -070077class CrosHost(abstract_ssh.AbstractSSHHost):
J. Richard Barnette45e93de2012-04-11 17:24:15 -070078 """Chromium OS specific subclass of Host."""
79
80 _parser = autoserv_parser.autoserv_parser
Scott Zawalski62bacae2013-03-05 10:40:32 -050081 _AFE = frontend_wrappers.RetryingAFE(timeout_min=5, delay_sec=10)
J. Richard Barnette45e93de2012-04-11 17:24:15 -070082
Richard Barnette03a0c132012-11-05 12:40:35 -080083 # Timeout values (in seconds) associated with various Chrome OS
84 # state changes.
J. Richard Barnette134ec2c2012-04-25 12:59:37 -070085 #
Richard Barnette0c73ffc2012-11-19 15:21:18 -080086 # In general, a good rule of thumb is that the timeout can be up
87 # to twice the typical measured value on the slowest platform.
88 # The times here have not necessarily been empirically tested to
89 # meet this criterion.
J. Richard Barnetteeb69d722012-06-18 17:29:44 -070090 #
91 # SLEEP_TIMEOUT: Time to allow for suspend to memory.
Richard Barnette0c73ffc2012-11-19 15:21:18 -080092 # RESUME_TIMEOUT: Time to allow for resume after suspend, plus
93 # time to restart the network.
J. Richard Barnette84890bd2014-02-21 11:05:47 -080094 # SHUTDOWN_TIMEOUT: Time to allow for shut down.
J. Richard Barnetteeb69d722012-06-18 17:29:44 -070095 # BOOT_TIMEOUT: Time to allow for boot from power off. Among
Richard Barnette0c73ffc2012-11-19 15:21:18 -080096 # other things, this must account for the 30 second dev-mode
J. Richard Barnetted4649c62013-03-06 17:42:27 -080097 # screen delay and time to start the network.
J. Richard Barnetteeb69d722012-06-18 17:29:44 -070098 # USB_BOOT_TIMEOUT: Time to allow for boot from a USB device,
Richard Barnette0c73ffc2012-11-19 15:21:18 -080099 # including the 30 second dev-mode delay and time to start the
J. Richard Barnetted4649c62013-03-06 17:42:27 -0800100 # network.
beepsf079cfb2013-09-18 17:49:51 -0700101 # INSTALL_TIMEOUT: Time to allow for chromeos-install.
J. Richard Barnette84890bd2014-02-21 11:05:47 -0800102 # POWERWASH_BOOT_TIMEOUT: Time to allow for a reboot that
103 # includes powerwash.
J. Richard Barnetteeb69d722012-06-18 17:29:44 -0700104
105 SLEEP_TIMEOUT = 2
J. Richard Barnetted4649c62013-03-06 17:42:27 -0800106 RESUME_TIMEOUT = 10
Tom Wai-Hong Tamfe005c22014-12-03 09:25:44 +0800107 SHUTDOWN_TIMEOUT = 10
J. Richard Barnettefbcc7122013-07-24 18:24:59 -0700108 BOOT_TIMEOUT = 60
J. Richard Barnetteeb69d722012-06-18 17:29:44 -0700109 USB_BOOT_TIMEOUT = 150
J. Richard Barnette7817b052014-08-28 09:47:29 -0700110 INSTALL_TIMEOUT = 480
Dan Shi2c88eed2013-11-12 10:18:38 -0800111 POWERWASH_BOOT_TIMEOUT = 60
Chris Sosab76e0ee2013-05-22 16:55:41 -0700112
Dan Shica503482015-03-30 17:23:25 -0700113 # Minimum OS version that supports server side packaging. Older builds may
114 # not have server side package built or with Autotest code change to support
115 # server-side packaging.
Dan Shiced09e42015-04-17 16:09:34 -0700116 MIN_VERSION_SUPPORT_SSP = global_config.global_config.get_config_value(
117 'AUTOSERV', 'min_version_support_ssp', type=int)
Dan Shica503482015-03-30 17:23:25 -0700118
J. Richard Barnette84890bd2014-02-21 11:05:47 -0800119 # REBOOT_TIMEOUT: How long to wait for a reboot.
120 #
Chris Sosab76e0ee2013-05-22 16:55:41 -0700121 # We have a long timeout to ensure we don't flakily fail due to other
122 # issues. Shorter timeouts are vetted in platform_RebootAfterUpdate.
Simran Basi1160e2c2013-10-04 16:00:24 -0700123 # TODO(sbasi - crbug.com/276094) Restore to 5 mins once the 'host did not
124 # return from reboot' bug is solved.
125 REBOOT_TIMEOUT = 480
Chris Sosab76e0ee2013-05-22 16:55:41 -0700126
Ismail Noorbasha07fdb612013-02-14 14:13:31 -0800127 # _USB_POWER_TIMEOUT: Time to allow for USB to power toggle ON and OFF.
128 # _POWER_CYCLE_TIMEOUT: Time to allow for manual power cycle.
129 _USB_POWER_TIMEOUT = 5
130 _POWER_CYCLE_TIMEOUT = 10
131
beeps32a63082013-08-22 14:02:29 -0700132 _RPC_PROXY_URL = 'http://localhost:%d'
Christopher Wileydd181852013-10-10 19:56:58 -0700133 _RPC_SHUTDOWN_POLLING_PERIOD_SECONDS = 2
Peter Qiu4410db72014-06-05 10:32:41 -0700134 # Set shutdown timeout to account for the time for restarting the UI.
135 _RPC_SHUTDOWN_TIMEOUT_SECONDS = cros_ui.RESTART_UI_TIMEOUT
Richard Barnette0c73ffc2012-11-19 15:21:18 -0800136
Richard Barnette82c35912012-11-20 10:09:10 -0800137 _RPM_RECOVERY_BOARDS = global_config.global_config.get_config_value('CROS',
138 'rpm_recovery_boards', type=str).split(',')
139
140 _MAX_POWER_CYCLE_ATTEMPTS = 6
141 _LAB_MACHINE_FILE = '/mnt/stateful_partition/.labmachine'
Fang Dengdeba14f2014-11-14 11:54:09 -0800142 _RPM_HOSTNAME_REGEX = ('chromeos(\d+)(-row(\d+))?-rack(\d+[a-z]*)'
143 '-host(\d+)')
Katherine Threlkeldab83d392015-06-18 16:45:57 -0700144 _LIGHTSENSOR_FILES = [ "in_illuminance0_input",
145 "in_illuminance_input",
146 "in_illuminance0_raw",
147 "in_illuminance_raw",
148 "illuminance0_input"]
Richard Barnette82c35912012-11-20 10:09:10 -0800149 _LIGHTSENSOR_SEARCH_DIR = '/sys/bus/iio/devices'
150 _LABEL_FUNCTIONS = []
Aviv Keshet74c89a92013-02-04 15:18:30 -0800151 _DETECTABLE_LABELS = []
152 label_decorator = functools.partial(add_label_detector, _LABEL_FUNCTIONS,
153 _DETECTABLE_LABELS)
J. Richard Barnette134ec2c2012-04-25 12:59:37 -0700154
J. Richard Barnetteb6de7e32013-02-14 13:28:04 -0800155 # Constants used in ping_wait_up() and ping_wait_down().
156 #
157 # _PING_WAIT_COUNT is the approximate number of polling
158 # cycles to use when waiting for a host state change.
159 #
160 # _PING_STATUS_DOWN and _PING_STATUS_UP are names used
161 # for arguments to the internal _ping_wait_for_status()
162 # method.
163 _PING_WAIT_COUNT = 40
164 _PING_STATUS_DOWN = False
165 _PING_STATUS_UP = True
166
Ismail Noorbasha07fdb612013-02-14 14:13:31 -0800167 # Allowed values for the power_method argument.
168
169 # POWER_CONTROL_RPM: Passed as default arg for power_off/on/cycle() methods.
170 # POWER_CONTROL_SERVO: Used in set_power() and power_cycle() methods.
171 # POWER_CONTROL_MANUAL: Used in set_power() and power_cycle() methods.
172 POWER_CONTROL_RPM = 'RPM'
173 POWER_CONTROL_SERVO = 'servoj10'
174 POWER_CONTROL_MANUAL = 'manual'
175
176 POWER_CONTROL_VALID_ARGS = (POWER_CONTROL_RPM,
177 POWER_CONTROL_SERVO,
178 POWER_CONTROL_MANUAL)
Richard Barnette0c73ffc2012-11-19 15:21:18 -0800179
Simran Basi5e6339a2013-03-21 11:34:32 -0700180 _RPM_OUTLET_CHANGED = 'outlet_changed'
181
Dan Shi9cb0eec2014-06-03 09:04:50 -0700182 # URL pattern to download firmware image.
183 _FW_IMAGE_URL_PATTERN = global_config.global_config.get_config_value(
184 'CROS', 'firmware_url_pattern', type=str)
beeps687243d2013-07-18 15:29:27 -0700185
MK Ryu35d661e2014-09-25 17:44:10 -0700186 # File that has a list of directories to be collected
187 _LOGS_TO_COLLECT_FILE = os.path.join(
188 common.client_dir, 'common_lib', 'logs_to_collect')
189
190 # Prefix of logging message w.r.t. crash collection
191 _CRASHLOGS_PREFIX = 'collect_crashlogs'
192
193 # Time duration waiting for host up/down check
194 _CHECK_HOST_UP_TIMEOUT_SECS = 15
195
196 # A command that interacts with kernel and hardware (e.g., rm, mkdir, etc)
197 # might not be completely done deep through the hardware when the machine
198 # is powered down right after the command returns.
199 # We should wait for a few seconds to make them done. Fingers crossed.
200 _SAFE_WAIT_SECS = 10
201
202
J. Richard Barnette964fba02012-10-24 17:34:29 -0700203 @staticmethod
beeps46dadc92013-11-07 14:07:10 -0800204 def check_host(host, timeout=10):
205 """
206 Check if the given host is a chrome-os host.
207
208 @param host: An ssh host representing a device.
209 @param timeout: The timeout for the run command.
210
211 @return: True if the host device is chromeos.
212
beeps46dadc92013-11-07 14:07:10 -0800213 """
214 try:
Simran Basi933c8af2015-04-29 14:05:07 -0700215 result = host.run(
216 'grep -q CHROMEOS /etc/lsb-release && '
217 '! test -f /mnt/stateful_partition/.android_tester && '
218 '! grep -q moblab /etc/lsb-release',
219 ignore_status=True, timeout=timeout)
beeps46dadc92013-11-07 14:07:10 -0800220 except (error.AutoservRunError, error.AutoservSSHTimeout):
221 return False
222 return result.exit_status == 0
223
224
225 @staticmethod
Tom Wai-Hong Tamefe1c7f2014-01-02 14:00:11 +0800226 def _extract_arguments(args_dict, key_subset):
227 """Extract options from `args_dict` and return a subset result.
J. Richard Barnette7214e0b2013-02-06 15:20:49 -0800228
229 Take the provided dictionary of argument options and return
Tom Wai-Hong Tamefe1c7f2014-01-02 14:00:11 +0800230 a subset that represent standard arguments needed to construct
231 a test-assistant object (chameleon or servo) for a host. The
232 intent is to provide standard argument processing from
Christopher Wiley644ef3e2015-05-15 13:14:14 -0700233 CrosHost for tests that require a test-assistant board
Tom Wai-Hong Tamefe1c7f2014-01-02 14:00:11 +0800234 to operate.
235
236 @param args_dict Dictionary from which to extract the arguments.
237 @param key_subset Tuple of keys to extract from the args_dict, e.g.
238 ('servo_host', 'servo_port').
239 """
240 result = {}
241 for arg in key_subset:
242 if arg in args_dict:
243 result[arg] = args_dict[arg]
244 return result
245
246
247 @staticmethod
248 def get_chameleon_arguments(args_dict):
249 """Extract chameleon options from `args_dict` and return the result.
250
251 Recommended usage:
252 ~~~~~~~~
253 args_dict = utils.args_to_dict(args)
254 chameleon_args = hosts.CrosHost.get_chameleon_arguments(args_dict)
255 host = hosts.create_host(machine, chameleon_args=chameleon_args)
256 ~~~~~~~~
257
258 @param args_dict Dictionary from which to extract the chameleon
259 arguments.
260 """
261 return CrosHost._extract_arguments(
262 args_dict, ('chameleon_host', 'chameleon_port'))
263
264
265 @staticmethod
266 def get_servo_arguments(args_dict):
267 """Extract servo options from `args_dict` and return the result.
J. Richard Barnette7214e0b2013-02-06 15:20:49 -0800268
269 Recommended usage:
270 ~~~~~~~~
271 args_dict = utils.args_to_dict(args)
Fang Deng0ca40e22013-08-27 17:47:44 -0700272 servo_args = hosts.CrosHost.get_servo_arguments(args_dict)
J. Richard Barnette7214e0b2013-02-06 15:20:49 -0800273 host = hosts.create_host(machine, servo_args=servo_args)
274 ~~~~~~~~
275
276 @param args_dict Dictionary from which to extract the servo
277 arguments.
278 """
Tom Wai-Hong Tamefe1c7f2014-01-02 14:00:11 +0800279 return CrosHost._extract_arguments(
280 args_dict, ('servo_host', 'servo_port'))
J. Richard Barnette134ec2c2012-04-25 12:59:37 -0700281
J. Richard Barnette964fba02012-10-24 17:34:29 -0700282
def _initialize(self, hostname, chameleon_args=None, servo_args=None,
                try_lab_servo=False, ssh_verbosity_flag='', ssh_options='',
                *args, **dargs):
    """Initialize superclasses, |self.chameleon|, and |self.servo|.

    Test-assistant objects (chameleon/servo) are requested through
    chameleon_host.create_chameleon_host and
    servo_host.create_servo_host; see the docstrings of those functions
    for how it is decided whether one is actually created.

    @param hostname: Hostname of the dut.
    @param chameleon_args: A dictionary that contains args for creating
                           a ChameleonHost. See chameleon_host for
                           details.
    @param servo_args: A dictionary that contains args for creating
                       a ServoHost object. See servo_host for details.
    @param try_lab_servo: Boolean, False indicates that ServoHost should
                          not be created for a device in Cros test lab.
                          See servo_host for details.
    @param ssh_verbosity_flag: String, to pass to the ssh command to
                               control verbosity.
    @param ssh_options: String, other ssh options to pass to the ssh
                        command.
    """
    super(CrosHost, self)._initialize(hostname=hostname, *args, **dargs)

    # self.env holds environment variable settings exported for
    # commands run on the host.  LIBC_FATAL_STDERR_ can be useful for
    # diagnosing certain errors that might happen.
    self.env['LIBC_FATAL_STDERR_'] = '1'
    self._rpc_proxy_map = {}
    self._ssh_verbosity_flag = ssh_verbosity_flag
    self._ssh_options = ssh_options

    # Both assistant hosts are created before either assistant object
    # is requested from them.
    # TODO(fdeng): We need to simplify the process of servo and
    # servo_host initialization.  crbug.com/298432
    servo_assistant = servo_host.create_servo_host(
            dut=self.hostname, servo_args=servo_args,
            try_lab_servo=try_lab_servo)
    self._servo_host = servo_assistant
    # TODO(waihong): Do the simplification on Chameleon too.
    chameleon_assistant = chameleon_host.create_chameleon_host(
            dut=self.hostname, chameleon_args=chameleon_args)
    self._chameleon_host = chameleon_assistant

    # The servo host is compared against None, while the chameleon host
    # is tested for truthiness.
    self.servo = (None if servo_assistant is None
                  else servo_assistant.get_servo())
    self.chameleon = (chameleon_assistant.create_chameleon_board()
                      if chameleon_assistant else None)
Fang Deng5d518f42013-08-02 14:04:32 -0700335
336
def get_repair_image_name(self):
    """Build the name of the image used to repair this host.

    The board comes from the AFE, the stable version from the AFE
    'get_stable_version' RPC for that board, and the name template from
    the 'stable_build_pattern' entry in the CROS section of the global
    config.

    @returns the build pattern filled in with (board, stable version).

    @raises AutoservError: if the AFE reports no board for this host.
    """
    board = self._get_board_from_afe()
    if board is None:
        raise error.AutoservError('DUT has no board attribute, '
                                  'cannot be repaired.')
    name_parts = (board,
                  self._AFE.run('get_stable_version', board=board))
    pattern = global_config.global_config.get_config_value(
            'CROS', 'stable_build_pattern')
    return pattern % name_parts
351
352
Scott Zawalski62bacae2013-03-05 10:40:32 -0500353 def _host_in_AFE(self):
354 """Check if the host is an object the AFE knows.
355
356 @returns the host object.
357 """
358 return self._AFE.get_hosts(hostname=self.hostname)
359
360
Chris Sosab76e0ee2013-05-22 16:55:41 -0700361 def lookup_job_repo_url(self):
362 """Looks up the job_repo_url for the host.
363
364 @returns job_repo_url from AFE or None if not found.
365
366 @raises KeyError if the host does not have a job_repo_url
367 """
368 if not self._host_in_AFE():
369 return None
370
371 hosts = self._AFE.get_hosts(hostname=self.hostname)
beepsb5efc532013-06-04 11:29:34 -0700372 if hosts and ds_constants.JOB_REPO_URL in hosts[0].attributes:
373 return hosts[0].attributes[ds_constants.JOB_REPO_URL]
Chris Sosab76e0ee2013-05-22 16:55:41 -0700374
375
Scott Zawalski89c44dd2013-02-26 09:28:02 -0500376 def clear_cros_version_labels_and_job_repo_url(self):
377 """Clear cros_version labels and host attribute job_repo_url."""
Scott Zawalski62bacae2013-03-05 10:40:32 -0500378 if not self._host_in_AFE():
Scott Zawalskieadbf702013-03-14 09:23:06 -0400379 return
380
Scott Zawalski62bacae2013-03-05 10:40:32 -0500381 host_list = [self.hostname]
382 labels = self._AFE.get_labels(
383 name__startswith=ds_constants.VERSION_PREFIX,
384 host__hostname=self.hostname)
Dan Shi0f466e82013-02-22 15:44:58 -0800385
Scott Zawalski62bacae2013-03-05 10:40:32 -0500386 for label in labels:
387 label.remove_hosts(hosts=host_list)
Scott Zawalski89c44dd2013-02-26 09:28:02 -0500388
beepscb6f1e22013-06-28 19:14:10 -0700389 self.update_job_repo_url(None, None)
390
391
def update_job_repo_url(self, devserver_url, image_name):
    """
    Updates the job_repo_url host attribute and asserts its value.

    When either argument is empty or None the attribute is set to None;
    otherwise it is set to the package url built from the two by
    tools.get_package_url.  The value is then read back with
    lookup_job_repo_url() to confirm that the update took effect.

    @param devserver_url: The devserver to use in the job_repo_url.
    @param image_name: The name of the image to use in the job_repo_url.

    @raises AutoservError: If we failed to update the job_repo_url.
    """
    if devserver_url and image_name:
        new_url = tools.get_package_url(devserver_url, image_name)
    else:
        new_url = None

    self._AFE.set_host_attribute(ds_constants.JOB_REPO_URL, new_url,
                                 hostname=self.hostname)

    if self.lookup_job_repo_url() == new_url:
        return
    raise error.AutoservError('Failed to update job_repo_url with %s, '
                              'host %s' % (new_url, self.hostname))
Scott Zawalski89c44dd2013-02-26 09:28:02 -0500409
410
Dan Shie9309262013-06-19 22:50:21 -0700411 def add_cros_version_labels_and_job_repo_url(self, image_name):
Scott Zawalskieadbf702013-03-14 09:23:06 -0400412 """Add cros_version labels and host attribute job_repo_url.
413
414 @param image_name: The name of the image e.g.
415 lumpy-release/R27-3837.0.0
Dan Shi7458bf62013-06-10 12:50:16 -0700416
Scott Zawalskieadbf702013-03-14 09:23:06 -0400417 """
Scott Zawalski62bacae2013-03-05 10:40:32 -0500418 if not self._host_in_AFE():
Scott Zawalskieadbf702013-03-14 09:23:06 -0400419 return
Scott Zawalski62bacae2013-03-05 10:40:32 -0500420
Scott Zawalskieadbf702013-03-14 09:23:06 -0400421 cros_label = '%s%s' % (ds_constants.VERSION_PREFIX, image_name)
Dan Shie9309262013-06-19 22:50:21 -0700422 devserver_url = dev_server.ImageServer.resolve(image_name).url()
Scott Zawalski62bacae2013-03-05 10:40:32 -0500423
MK Ryufb5e3a82015-07-01 12:21:20 -0700424 self._AFE.run('label_add_hosts', id=cros_label, hosts=[self.hostname])
beepscb6f1e22013-06-28 19:14:10 -0700425 self.update_job_repo_url(devserver_url, image_name)
426
427
def verify_job_repo_url(self, tag=''):
    """
    Make sure job_repo_url of this host is valid.

    Eg: The job_repo_url "http://lmn.cd.ab.xyx:8080/static/
    lumpy-release/R29-4279.0.0/autotest/packages" claims to have the
    autotest package for lumpy-release/R29-4279.0.0. This method asks
    the devserver named in that url to stage the 'autotest_packages'
    artifact for the build, and reports how long the staging took as a
    'verify_job_repo_url' gauge.  If the host has no job_repo_url, a
    warning is logged and nothing else happens.

    @param tag: The tag from the server job, in the format
                <job_id>-<user>/<hostname>, or <hostless> for a server
                job.  Not referenced by the body of this method.

    @raises DevServerException: If we could not resolve a devserver.
    @raises AutoservError: If we're unable to save the new job_repo_url as
        a result of choosing a new devserver because the old one failed to
        respond to a health check.
    @raises urllib2.URLError: If the devserver embedded in job_repo_url
                              doesn't respond within the timeout.
    """
    job_repo_url = self.lookup_job_repo_url()
    if not job_repo_url:
        logging.warning('No job repo url set on host %s', self.hostname)
        return

    logging.info('Verifying job repo url %s', job_repo_url)
    url_parts = tools.get_devserver_build_from_package_url(job_repo_url)
    devserver_url, image_name = url_parts

    ds = dev_server.ImageServer(devserver_url)

    logging.info('Staging autotest artifacts for %s on devserver %s',
                 image_name, ds.url())

    staging_began = time.time()
    ds.stage_artifacts(image_name, ['autotest_packages'])
    stage_time = time.time() - staging_began

    # Record how much of the verification time comes from a devserver
    # restage. If we're doing things right we should not see multiple
    # devservers for a given board/build/branch path.
    try:
        parsed_name = server_utils.ParseBuildName(image_name)
    except server_utils.ParseBuildNameException:
        # Without a parseable build name there is no stats key to
        # report under.
        return
    board, build_type, branch = parsed_name[:3]

    # Keep the text between the two characters after the first '/' and
    # the last ':' of the devserver url.
    name_start = devserver_url.find('/') + 2
    name_end = devserver_url.rfind(':')
    devserver = devserver_url[name_start:name_end]
    stats_key = {
        'board': board,
        'build_type': build_type,
        'branch': branch,
        'devserver': devserver.replace('.', '_'),
    }
    gauge = autotest_stats.Gauge('verify_job_repo_url')
    gauge.send(
        '%(board)s.%(build_type)s.%(branch)s.%(devserver)s' % stats_key,
        stage_time)
beepscb6f1e22013-06-28 19:14:10 -0700489
Scott Zawalskieadbf702013-03-14 09:23:06 -0400490
def stage_server_side_package(self, image=None):
    """Stage autotest server-side package on devserver.

    The build to stage is chosen in this order: the build parsed from
    `image` when one is given; otherwise the build named by the host's
    job_repo_url; otherwise the build named by the first version label
    the AFE returns for this host.

    @param image: Full path of an OS image to install or a build name.

    @return: A url to the autotest server-side package, or None when
             the build is older than MIN_VERSION_SUPPORT_SSP (server
             side packaging is then disabled and nothing is staged).

    @raises AutoservError: if no build name can be parsed from `image`,
            or if no image is given and the host has neither a
            job_repo_url attribute nor a version label.
    """
    if image:
        image_name = tools.get_build_from_image(image)
        if not image_name:
            raise error.AutoservError(
                    'Failed to parse build name from %s' % image)
        ds = dev_server.ImageServer.resolve(image_name)
    else:
        job_repo_url = self.lookup_job_repo_url()
        if job_repo_url:
            devserver_url, image_name = (
                tools.get_devserver_build_from_package_url(job_repo_url))
            ds = dev_server.ImageServer(devserver_url)
        else:
            labels = self._AFE.get_labels(
                    name__startswith=ds_constants.VERSION_PREFIX,
                    host__hostname=self.hostname)
            if not labels:
                raise error.AutoservError(
                        'Failed to stage server-side package. The host has '
                        'no job_repo_url attribute or version label.')
            # The build name is the label name minus the version prefix.
            image_name = labels[0].name[len(ds_constants.VERSION_PREFIX):]
            ds = dev_server.ImageServer.resolve(image_name)

    # Get the OS version of the build, for any build older than
    # MIN_VERSION_SUPPORT_SSP, server side packaging is not supported.
    # Names that do not match the pattern are staged without the check.
    match = re.match(r'.*/R\d+-(\d+)\.', image_name)
    if match and int(match.group(1)) < self.MIN_VERSION_SUPPORT_SSP:
        logging.warning('Build %s is older than %s. Server side packaging '
                        'is disabled.', image_name,
                        self.MIN_VERSION_SUPPORT_SSP)
        return None

    ds.stage_artifacts(image_name, ['autotest_server_package'])
    return '%s/static/%s/%s' % (ds.url(), image_name,
                                'autotest_server_package.tar.bz2')
532
533
def _try_stateful_update(self, update_url, force_update, updater):
    """Try to use stateful update to initialize DUT.

    When DUT is already running the same version that machine_install
    tries to install, stateful update is a much faster way to clean up
    the DUT for testing, compared to a full reimage. It is implemented
    by calling autoupdater.run_update, but skipping updating root, as
    updating the kernel is time consuming and not necessary.

    The update is only attempted when the image name looks like a
    release build, updater.check_version() passes, and `force_update`
    is set.

    @param update_url: url of the image.
    @param force_update: Set to True to update the image even if the DUT
                         is running the same version.
    @param updater: ChromiumOSUpdater instance used to update the DUT.
    @returns: True if the DUT was updated with stateful update.

    """
    # TODO(jrbarnette): Yes, I hate this re.match() test case.
    # It's better than the alternative: see crbug.com/360944.
    image_name = autoupdater.url_to_image_name(update_url)
    release_pattern = r'^.*-release/R[0-9]+-[0-9]+\.[0-9]+\.0$'
    if re.match(release_pattern, image_name) is None:
        return False
    if not updater.check_version():
        return False
    if not force_update:
        logging.info('Canceling stateful update because the new and '
                     'old versions are the same.')
        return False

    # Following folders should be rebuilt after stateful update.
    # A marker file is dropped in each one so that the rebuild can be
    # checked once the update is done.
    marker_name = '.test_file_to_be_deleted'
    marker_paths = [os.path.join(folder, marker_name)
                    for folder in ('/var', '/home',
                                   '/mnt/stateful_partition')]
    for marker_path in marker_paths:
        self.run('touch %s' % marker_path)

    updater.run_update(update_root=False)

    # Reboot to complete stateful update.
    self.reboot(timeout=self.REBOOT_TIMEOUT, wait=True)

    # NOTE(review): the probe ends with `; echo $?`, so the status the
    # shell reports is presumably that of `echo`, not of `test`; the
    # `exit_status == 1` comparison below may therefore never trigger.
    # Confirm the intended check (and its polarity) before changing it.
    for marker_path in marker_paths:
        probe = self.run('test -f %s; echo $?' % marker_path,
                         ignore_status=True)
        if probe.exit_status == 1:
            return False
    return True
583
584
def _post_update_processing(self, updater, expected_kernel=None):
    """After the DUT is updated, confirm machine_install succeeded.

    Marks the DUT as a lab machine, restarts the autoreboot job, checks
    the boot expectations and the installed version through `updater`,
    and finally removes any autotest directory already installed on the
    DUT.

    @param updater: ChromiumOSUpdater instance used to update the DUT.
    @param expected_kernel: kernel expected to be active after reboot,
            or `None` to skip rollback checking.

    @raises ChromiumOSError: if the DUT is not running the build that
            was meant to be installed.
    """
    # Touch the lab machine file to leave a marker that
    # distinguishes this image from other test images.
    # Afterwards, we must re-run the autoreboot script because
    # it depends on the _LAB_MACHINE_FILE.
    self.run('touch %s' % self._LAB_MACHINE_FILE)
    self.run('start autoreboot')
    # The two literals are joined by implicit concatenation, so the
    # separating space has to be written out explicitly.
    updater.verify_boot_expectations(
            expected_kernel, rollback_message=
            'Build %s failed to boot on %s; system rolled back to previous '
            'build' % (updater.update_version, self.hostname))
    # Check that we've got the build we meant to install.
    if not updater.check_version_to_confirm_install():
        raise autoupdater.ChromiumOSError(
                'Failed to update %s to build %s; found build '
                '%s instead' % (self.hostname,
                                updater.update_version,
                                self.get_release_version()))

    logging.debug('Cleaning up old autotest directories.')
    try:
        installed_autodir = autotest.Autotest.get_installed_autodir(self)
        self.run('rm -rf ' + installed_autodir)
    except autotest.AutodirNotFoundError:
        logging.debug('No autotest installed directory found.')
617
Dan Shi0f466e82013-02-22 15:44:58 -0800618
def _stage_image_for_update(self, image_name=None):
    """Stage a build on a devserver and return the update_url and devserver.

    The devserver is picked with dev_server.ImageServer.resolve() and the
    download is triggered with synchronous=False.

    @param image_name: a name like lumpy-release/R27-3837.0.0. When it is
            empty, the name returned by get_repair_image_name() is used.
    @returns a tuple with an update URL like:
            http://172.22.50.205:8082/update/lumpy-release/R27-3837.0.0
            and the devserver instance.
    """
    build = image_name or self.get_repair_image_name()

    logging.info('Staging build for AU: %s', build)
    image_server = dev_server.ImageServer.resolve(build)
    image_server.trigger_download(build, synchronous=False)
    update_url = tools.image_url_pattern() % (image_server.url(), build)
    return (update_url, image_server)
Scott Zawalskieadbf702013-03-14 09:23:06 -0400635
636
def stage_image_for_servo(self, image_name=None):
    """Stage the test image of a build and return its URL.

    The 'test_image' artifact is staged on the devserver chosen by
    dev_server.ImageServer.resolve().

    @param image_name: a name like lumpy-release/R27-3837.0.0. When it is
            empty, the name returned by get_repair_image_name() is used.
    @returns the value of the devserver's get_test_image_url() for the
            build.
    """
    build = image_name if image_name else self.get_repair_image_name()
    logging.info('Staging build for servo install: %s', build)
    image_server = dev_server.ImageServer.resolve(build)
    image_server.stage_artifacts(build, ['test_image'])
    test_image_url = image_server.get_test_image_url(build)
    return test_image_url
650
651
def stage_factory_image_for_servo(self, image_name):
    """Stage a factory image on a devserver and return its URL.

    The artifact to stage is read from the 'factory_artifact' option in
    the 'CROS' section of the global config.

    @param image_name: a name like <board>/4262.204.0

    @return: An update URL, eg:
        http://<devserver>/static/canary-channel/\
        <board>/4262.204.0/factory_test/chromiumos_factory_image.bin
        `None` is returned, after logging an error, when image_name
        is empty.

    @raises: ValueError if the factory artifact name is missing from
             the config.

    """
    if not image_name:
        logging.error('Need an image_name to stage a factory image.')
        return None

    artifact_name = global_config.global_config.get_config_value(
            'CROS', 'factory_artifact', type=str, default='')
    if not artifact_name:
        raise ValueError('Cannot retrieve the factory artifact name from '
                         'autotest config, and hence cannot stage factory '
                         'artifacts.')

    logging.info('Staging build for servo install: %s', image_name)
    image_server = dev_server.ImageServer.resolve(image_name)
    image_server.stage_artifacts(image_name, [artifact_name],
                                 archive_url=None)

    url_pattern = tools.factory_image_url_pattern()
    return url_pattern % (image_server.url(), image_name)
684
685
def machine_install(self, update_url=None, force_update=False,
                    local_devserver=False, repair=False,
                    force_full_update=False):
    """Install the DUT.

    Use stateful update if the DUT is already running the same build.
    Stateful update does not update kernel and tends to run much faster
    than a full reimage. If the DUT is running a different build, or it
    failed to do a stateful update, full update, including kernel update,
    will be applied to the DUT.

    Once a host enters machine_install its cros_version label will be
    removed as well as its host attribute job_repo_url (used for
    package install).

    When a full update fails and the devserver that staged the build
    looks unhealthy, the build is staged again and the update retried,
    up to provision.FLAKY_DEVSERVER_ATTEMPTS attempts in total.

    @param update_url: The url to use for the update
            pattern: http://$devserver:###/update/$build
            If update_url is None and repair is True we will install the
            stable image listed in afe_stable_versions table. If the table
            is not setup, global_config value under CROS.stable_cros_version
            will be used instead.
    @param force_update: Force an update even if the version installed
            is the same. Default:False
    @param local_devserver: Used by test_that to allow people to
            use their local devserver. Default: False
    @param repair: Forces update to repair image. Implies force_update.
    @param force_full_update: If True, do not attempt to run stateful
            update, force a full reimage. If False, try stateful update
            first when the dut is already installed with the same version.
    @raises autoupdater.ChromiumOSError
    @raises error.AutoservError if there is neither an update URL nor an
            image given in the command-line options.

    """
    devserver = None
    # Build to re-stage if the devserver turns out to be unhealthy. It
    # must be bound on every path: after a repair install it stays None,
    # which makes _stage_image_for_update() pick the repair image again.
    requested_build = None
    if repair:
        update_url, devserver = self._stage_image_for_update()
        force_update = True

    if not update_url:
        # This is the base case where we have no given update URL i.e.
        # dynamic suites logic etc. This is the most flexible case where we
        # can serve an update from any of our fleet of devservers.
        requested_build = self._parser.options.image
        if not requested_build:
            raise error.AutoservError(
                    'There is no update URL, nor a method to get one.')

        if not requested_build.startswith('http://'):
            logging.debug('Update will be staged for this installation')
            update_url, devserver = self._stage_image_for_update(
                    requested_build)
        else:
            update_url = requested_build

    logging.debug('Update URL is %s', update_url)

    # Remove cros-version and job_repo_url host attribute from host.
    self.clear_cros_version_labels_and_job_repo_url()

    update_complete = False
    updater = autoupdater.ChromiumOSUpdater(
            update_url, host=self, local_devserver=local_devserver)
    if not force_full_update:
        try:
            # If the DUT is already running the same build, try stateful
            # update first as it's much quicker than a full re-image.
            update_complete = self._try_stateful_update(
                    update_url, force_update, updater)
        except Exception as e:
            # A failed stateful update is not fatal; fall through to the
            # full update below.
            logging.exception(e)

    inactive_kernel = None
    if update_complete or (not force_update and updater.check_version()):
        logging.info('Install complete without full update')
    else:
        logging.info('DUT requires full update.')
        self.reboot(timeout=self.REBOOT_TIMEOUT, wait=True)
        num_of_attempts = provision.FLAKY_DEVSERVER_ATTEMPTS

        while num_of_attempts > 0:
            num_of_attempts -= 1
            try:
                updater.run_update()
            except Exception:
                logging.warning('Autoupdate did not complete.')
                # Do additional check for the devserver health. Ideally,
                # the autoupdater.py could raise an exception when it
                # detected network flake but that would require
                # instrumenting the update engine and parsing it log.
                if (num_of_attempts <= 0 or
                        devserver is None or
                        dev_server.DevServer.devserver_healthy(
                                devserver.url())):
                    raise

                logging.warning('Devserver looks unhealthy. Trying another')
                update_url, devserver = self._stage_image_for_update(
                        requested_build)
                logging.debug('New Update URL is %s', update_url)
                updater = autoupdater.ChromiumOSUpdater(
                        update_url, host=self,
                        local_devserver=local_devserver)
            else:
                break

        # Give it some time in case of IO issues.
        time.sleep(10)

        # Figure out active and inactive kernel.
        active_kernel, inactive_kernel = updater.get_kernel_state()

        # Ensure inactive kernel has higher priority than active.
        if (updater.get_kernel_priority(inactive_kernel)
                < updater.get_kernel_priority(active_kernel)):
            raise autoupdater.ChromiumOSError(
                    'Update failed. The priority of the inactive kernel'
                    ' partition is less than that of the active kernel'
                    ' partition.')

        # Updater has returned successfully; reboot the host.
        self.reboot(timeout=self.REBOOT_TIMEOUT, wait=True)

    self._post_update_processing(updater, inactive_kernel)
    self.add_cros_version_labels_and_job_repo_url(
            autoupdater.url_to_image_name(update_url))
J. Richard Barnette45e93de2012-04-11 17:24:15 -0700810
811
def _clear_fw_version_labels(self):
    """Detach this host from its firmware version labels in the AFE.

    The labels are the ones the AFE returns for this hostname whose name
    starts with provision.FW_RW_VERSION_PREFIX.
    """
    stale_labels = self._AFE.get_labels(
            name__startswith=provision.FW_RW_VERSION_PREFIX,
            host__hostname=self.hostname)
    for stale_label in stale_labels:
        stale_label.remove_hosts(hosts=[self.hostname])
819
820
def _add_fw_version_label(self, build):
    """Attach the firmware version label for `build` to this host.

    The label is derived with provision.fw_version_to_label() and the
    host is added to it through the AFE 'label_add_hosts' call.

    @param build: Build of firmware.

    """
    label_id = provision.fw_version_to_label(build)
    target_hosts = [self.hostname]
    self._AFE.run('label_add_hosts', id=label_id, hosts=target_hosts)
Dan Shi9cb0eec2014-06-03 09:04:50 -0700829
830
def firmware_install(self, build=None):
    """Install firmware to the DUT through its servo.

    The 'firmware' artifact of the build is staged on a devserver, the
    firmware tarball is downloaded into a temporary directory, and the
    AP and EC images are extracted from it ("dts/*" is extracted too,
    with failures ignored). The EC and then the BIOS are programmed via
    servo, the DUT is reset through the power state controller, and the
    method sleeps for servo.BOOT_DELAY. The temporary directory is
    always cleaned up.

    Once a host enters firmware_install its fw_version label will be
    removed. After the firmware is updated successfully, a new fw_version
    label will be added to the host.

    @param build: The build version to which we want to provision the
                  firmware of the machine,
                  e.g. 'link-firmware/R22-2695.1.144'. When it is empty,
                  the name returned by get_repair_image_name() is used.

    @raises error.TestError if the host has no servo.

    TODO(dshi): After bug 381718 is fixed, update here with corresponding
                exceptions that could be raised.

    """
    if not self.servo:
        raise error.TestError('Host %s does not have servo.' %
                              self.hostname)

    # TODO(fdeng): use host.get_board() after
    # crbug.com/271834 is fixed.
    board = self._get_board_from_afe()

    # If build is not set, try to install firmware from stable CrOS.
    if not build:
        build = self.get_repair_image_name()

    faft_config = FAFTConfig(board)
    # U-Boot platforms name the AP image after the board; everything
    # else is treated as a Depthcharge platform.
    ap_image = ('image-%s.bin' % board if faft_config.use_u_boot
                else 'image.bin')
    ec_image = 'ec.bin'
    image_server = dev_server.ImageServer.resolve(build)
    image_server.stage_artifacts(build, ['firmware'])

    work_dir = autotemp.tempdir(unique_id='fwimage')
    try:
        tarball_url = self._FW_IMAGE_URL_PATTERN % (image_server.url(),
                                                    build)
        tarball_path = os.path.join(work_dir.name,
                                    os.path.basename(tarball_url))
        download_cmd = 'wget -O %s %s' % (tarball_path, tarball_url)
        server_utils.system(download_cmd, timeout=60)
        extract_images_cmd = ('tar xf %s -C %s %s %s' %
                              (tarball_path, work_dir.name, ap_image,
                               ec_image))
        server_utils.system(extract_images_cmd, timeout=60)
        extract_dts_cmd = ('tar xf %s --wildcards -C %s "dts/*"' %
                           (tarball_path, work_dir.name))
        server_utils.system(extract_dts_cmd, timeout=60,
                            ignore_status=True)

        self._clear_fw_version_labels()
        logging.info('Will re-program EC now')
        self.servo.program_ec(os.path.join(work_dir.name, ec_image))
        logging.info('Will re-program BIOS now')
        self.servo.program_bios(os.path.join(work_dir.name, ap_image))
        self.servo.get_power_state_controller().reset()
        time.sleep(self.servo.BOOT_DELAY)
        self._add_fw_version_label(build)
    finally:
        work_dir.clean()
896
897
def show_update_engine_log(self):
    """Output update engine log by running `cat` on it on the host."""
    log_path = client_constants.UPDATE_ENGINE_LOG
    logging.debug('Dumping %s', log_path)
    self.run('cat %s' % log_path)
Dan Shi10e992b2013-08-30 11:02:59 -0700902
903
def _get_board_from_afe(self):
    """Look up this host's board through its labels in the AFE.

    Delegates to server_utils.get_board_from_afe(). Per the contract
    stated for this method, a host label of the form "board:<board>"
    yields "<board>", and `None` is returned if there is not a single,
    unique label matching the pattern.

    @returns board from label, or `None`.
    """
    board = server_utils.get_board_from_afe(self.hostname, self._AFE)
    return board
Simran Basi833814b2013-01-29 13:13:43 -0800914
915
def get_build(self):
    """Look up the current build of this Host in the AFE.

    Delegates to server_utils.get_build_from_afe(), which works from
    this host's labels in the AFE.

    @returns The current build or None if it could not find it or if there
             were multiple build labels assigned to this host.
    """
    build = server_utils.get_build_from_afe(self.hostname, self._AFE)
    return build
Richard Barnette82c35912012-11-20 10:09:10 -0800925
926
def _install_repair(self):
    """Attempt to repair this host using the update-engine.

    If the host is up, run machine_install(repair=True), which installs
    the stable "repair" version of Chrome OS as defined in the
    afe_stable_versions table. If the table is not setup, global_config
    value under CROS.stable_cros_version will be used instead.

    @raises AutoservRepairMethodNA if the DUT is not reachable.
    @raises ChromiumOSError if the install failed for some reason; the
            error is logged and then re-raised.

    """
    if self.is_up():
        logging.info('Attempting to reimage machine to repair image.')
        try:
            self.machine_install(repair=True)
        except autoupdater.ChromiumOSError as install_error:
            logging.exception(install_error)
            logging.info('Repair via install failed.')
            raise
    else:
        raise error.AutoservRepairMethodNA('DUT unreachable for install.')
Scott Zawalski89c44dd2013-02-26 09:28:02 -0500948
949
def _install_repair_with_powerwash(self):
    """Attempt to powerwash first then repair this host using update-engine.

    update-engine may fail due to a bad image. In such case, powerwash
    may help to cleanup the DUT for update-engine to work again. The
    powerwash is requested by writing "fast safe" to the
    factory_install_reset file on the stateful partition and rebooting.

    @raises AutoservRepairMethodNA if the DUT is not reachable.
    @raises AutoservRepairFailure if the DUT is not up after the
            powerwash reboot.
    @raises ChromiumOSError if the install failed for some reason.

    """
    if not self.is_up():
        raise error.AutoservRepairMethodNA('DUT unreachable for install.')

    logging.info('Attempting to powerwash the DUT.')
    request_powerwash_cmd = ('echo "fast safe" > '
                             '/mnt/stateful_partition/factory_install_reset')
    self.run(request_powerwash_cmd)
    self.reboot(timeout=self.POWERWASH_BOOT_TIMEOUT, wait=True)

    if self.is_up():
        logging.info('Powerwash succeeded.')
        self._install_repair()
        return

    logging.error('Powerwash failed. DUT did not come back after '
                  'reboot.')
    raise error.AutoservRepairFailure(
            'DUT failed to boot from powerwash after %d seconds' %
            self.POWERWASH_BOOT_TIMEOUT)
976
977
def servo_install(self, image_url=None, usb_boot_timeout=USB_BOOT_TIMEOUT,
                  install_timeout=INSTALL_TIMEOUT):
    """
    Re-install the OS on the DUT by:
    1) installing a test image on a USB storage device attached to the Servo
            board,
    2) booting that image in recovery mode, and then
    3) installing the image with chromeos-install.

    Both the USB boot phase and the install phase are measured with an
    autotest_stats timer whose key includes the timeout that was used.

    @param image_url: If specified use as the url to install on the DUT.
            otherwise boot the currently staged image on the USB stick.
    @param usb_boot_timeout: The usb_boot_timeout to use during reimage.
            Factory images need a longer usb_boot_timeout than regular
            cros images.
    @param install_timeout: The timeout to use when installing the chromeos
            image. Factory images need a longer install_timeout.

    @raises AutoservRepairFailure if the DUT does not come up from USB
            within usb_boot_timeout.
    @raises AutoservError if the image fails to boot.

    """
    logging.info('Downloading image to USB, then booting from it. Usb boot '
                 'timeout = %s', usb_boot_timeout)
    usb_boot_timer = autotest_stats.Timer(
            'servo_install.usb_boot_timeout_%s' % usb_boot_timeout)
    usb_boot_timer.start()
    self.servo.install_recovery_image(image_url)
    booted_from_usb = self.wait_up(timeout=usb_boot_timeout)
    if not booted_from_usb:
        raise error.AutoservRepairFailure(
                'DUT failed to boot from USB after %d seconds' %
                usb_boot_timeout)
    usb_boot_timer.stop()

    install_timer = autotest_stats.Timer(
            'servo_install.install_timeout_%s' % install_timeout)
    install_timer.start()
    logging.info('Installing image through chromeos-install.')
    self.run('chromeos-install --yes', timeout=install_timeout)
    self.run('halt')
    install_timer.stop()

    logging.info('Power cycling DUT through servo.')
    self.servo.get_power_state_controller().power_off()
    self.servo.switch_usbkey('off')
    # N.B. The Servo API requires that we use power_on() here
    # for two reasons:
    #  1) After turning on a DUT in recovery mode, you must turn
    #     it off and then on with power_on() once more to
    #     disable recovery mode (this is a Parrot specific
    #     requirement).
    #  2) After power_off(), the only way to turn on is with
    #     power_on() (this is a Storm specific requirement).
    self.servo.get_power_state_controller().power_on()

    logging.info('Waiting for DUT to come back up.')
    rebooted = self.wait_up(timeout=self.BOOT_TIMEOUT)
    if not rebooted:
        raise error.AutoservError('DUT failed to reboot installed '
                                  'test image after %d seconds' %
                                  self.BOOT_TIMEOUT)
1039
1040
def _servo_repair_reinstall(self):
    """Reinstall the DUT utilizing servo and a test image.

    Stages the repair test image with stage_image_for_servo() and hands
    its URL to servo_install(), which re-installs the OS on the DUT by:
    1) installing a test image on a USB storage device attached to the Servo
            board,
    2) booting that image in recovery mode, and then
    3) installing the image with chromeos-install.

    @raises AutoservRepairMethodNA if the device does not have servo
            support.

    """
    if self.servo:
        logging.info('Attempting to recovery servo enabled device with '
                     'servo_repair_reinstall')
        self.servo_install(self.stage_image_for_servo())
        return

    raise error.AutoservRepairMethodNA('Repair Reinstall NA: '
                                       'DUT has no servo support.')
1063
1064
def _servo_repair_power(self):
    """Attempt to repair DUT using an attached Servo.

    Powers the DUT off and back on through the servo's power state
    controller, then waits up to BOOT_TIMEOUT for it to come up.

    @raises AutoservRepairMethodNA if the device does not have servo
            support.
    @raises AutoservRepairFailure if the DUT is not up after the power
            cycle.
    """
    if not self.servo:
        raise error.AutoservRepairMethodNA('Repair Power NA: '
                                           'DUT has no servo support.')

    logging.info('Attempting to recover servo enabled device by '
                 'powering it off and on.')
    self.servo.get_power_state_controller().power_off()
    self.servo.get_power_state_controller().power_on()
    came_back = self.wait_up(self.BOOT_TIMEOUT)
    if not came_back:
        raise error.AutoservRepairFailure(
                'DUT did not boot after long_press.')
Richard Barnette03a0c132012-11-05 12:40:35 -08001086
1087
def _powercycle_to_repair(self):
    """Utilize the RPM Infrastructure to bring the host back up.

    The host is powercycled once; each time it then fails to come up
    within BOOT_TIMEOUT it is powercycled again, until
    _MAX_POWER_CYCLE_ATTEMPTS waits have failed. The repeated cycles
    rely on auto fallback to the last good install.

    @raises AutoservRepairMethodNA if the device does not support remote
            power.
    @raises AutoservRepairFailure if the host never comes back online.

    """
    if not self.has_power():
        raise error.AutoservRepairMethodNA('Device does not support power.')

    logging.info('Attempting repair via RPM powercycle.')
    self.power_cycle()
    failures = 0
    while True:
        if self.wait_up(timeout=self.BOOT_TIMEOUT):
            break
        failures += 1
        if failures >= self._MAX_POWER_CYCLE_ATTEMPTS:
            raise error.AutoservRepairFailure(
                    'Powercycled host %s %d times; device did not come back'
                    ' online.' % (self.hostname, failures))
        self.power_cycle()

    if failures:
        logging.info('Powercycling was successful after %d failures.',
                     failures)
    else:
        logging.info('Powercycling was successful first time.')
1118
1119
def _reboot_repair(self):
    """SSH to this host and reboot.

    @raises AutoservRepairMethodNA if the host is not up within
            _CHECK_HOST_UP_TIMEOUT_SECS.
    """
    reachable = self.is_up(self._CHECK_HOST_UP_TIMEOUT_SECS)
    if not reachable:
        raise error.AutoservRepairMethodNA('DUT unreachable for reboot.')

    logging.info('Attempting repair via SSH reboot.')
    self.reboot(timeout=self.BOOT_TIMEOUT, wait=True)
1126
1127
def check_device(self):
    """Check if a device is ssh-able, and if so, clean and verify it.

    Runs ssh_ping(), cleanup() and verify() in that order; the first
    exception raised stops the sequence and propagates to the caller.

    @raise AutoservSSHTimeout: If the ssh ping times out.
    @raise AutoservSshPermissionDeniedError: If ssh ping fails due to
                                             permissions.
    @raise AutoservSshPingHostError: For other AutoservRunErrors during
                                     ssh_ping.
    @raises AutoservError: As appropriate, during cleanup and verify.
    """
    for step_name in ('ssh_ping', 'cleanup', 'verify'):
        getattr(self, step_name)()
1141
1142
def repair_full(self):
    """Repair a host for repair level NO_PROTECTION.

    This overrides the base class function for repair; it does
    not call back to the parent class, but instead offers a
    simplified implementation based on the capabilities in the
    Chrome OS test lab.

    If the host has a servo host but no servo yet, the servo host is
    repaired first (a failure there is only logged) and the servo is
    fetched from it.

    The repair procedures below are then tried in order, from less
    intrusive to more intrusive. After each one, crash logs are
    collected and `self.check_device()` is run; the first procedure for
    which both the repair and the verifying step succeed ends the
    repair:
      1. SSH to the DUT and reboot.
      2. If there's a servo for the DUT, try to power the DUT off and
         on.
      3. If the DUT can be power-cycled via RPM, try to repair
         by power-cycling.
      4. Try to re-install to a known stable image using
         auto-update.
      5. Powerwash the DUT, then try the auto-update re-install again.
      6. If there's a servo for the DUT, try to re-install via
         the servo.

    The outcome of every procedure is recorded in autotest_stats
    counters, overall and, when the board is known, per board.

    @raises AutoservRepairTotalFailure if the repair process fails to
            fix the DUT; the message lists the error of each procedure.

    """
    # Caution: Deleting shards relies on repair to always reboot the DUT.

    if self._servo_host and not self.servo:
        try:
            self._servo_host.repair_full()
        except Exception as servo_error:
            logging.error('Could not create a healthy servo: %s',
                          servo_error)
        self.servo = self._servo_host.get_servo()

    self.try_collect_crashlogs()

    # TODO(scottz): This should use something similar to label_decorator,
    # but needs to be populated in order so DUTs are repaired with the
    # least amount of effort.
    repair_funcs = [self._reboot_repair,
                    self._servo_repair_power,
                    self._powercycle_to_repair,
                    self._install_repair,
                    self._install_repair_with_powerwash,
                    self._servo_repair_reinstall]
    errors = []
    board = self._get_board_from_afe()

    def count_outcome(func_name, overall_format, board_format):
        """Bump the overall counter and, if known, the per-board one."""
        autotest_stats.Counter(overall_format % func_name).increment()
        if board:
            autotest_stats.Counter(
                    board_format % (func_name, board)).increment()

    for repair_func in repair_funcs:
        func_name = repair_func.__name__
        try:
            repair_func()
            self.try_collect_crashlogs()
            self.check_device()
            count_outcome(func_name, '%s.SUCCEEDED', '%s.%s.SUCCEEDED')
            return
        except error.AutoservRepairMethodNA as e:
            count_outcome(func_name, '%s.RepairNA', '%s.%s.RepairNA')
            logging.warning('Repair function NA: %s', e)
            errors.append(str(e))
        except Exception as e:
            count_outcome(func_name, '%s.FAILED', '%s.%s.FAILED')
            logging.warning('Failed to repair device: %s', e)
            errors.append(str(e))

    autotest_stats.Counter('Full_Repair_Failed').increment()
    if board:
        autotest_stats.Counter(
                'Full_Repair_Failed.%s' % board).increment()
    raise error.AutoservRepairTotalFailure(
            'All attempts at repairing the device failed:\n%s' %
            '\n'.join(errors))
Richard Barnette82c35912012-11-20 10:09:10 -08001242
1243
def try_collect_crashlogs(self, check_host_up=True):
    """
    Collect crash logs from the host when a crashed job left them pending.

    Nothing is done unless _need_crash_logs() reports a crashed job. Any
    exception raised along the way is logged and swallowed, so this
    method never fails its caller.

    @param check_host_up: When True (the default), logs are collected only
            if is_up() succeeds within _CHECK_HOST_UP_TIMEOUT_SECS.
            When False, the reachability check is skipped.
    """
    try:
        pending_job = self._need_crash_logs()
        if not pending_job:
            return
        logging.debug('%s: Job %s was crashed', self._CRASHLOGS_PREFIX,
                      pending_job)
        # Skip collection only when the caller asked for a reachability
        # check and that check failed.
        if check_host_up and not self.is_up(
                self._CHECK_HOST_UP_TIMEOUT_SECS):
            return
        self._collect_crashlogs(pending_job)
        logging.debug('%s: Completed collecting logs for the '
                      'crashed job %s', self._CRASHLOGS_PREFIX,
                      pending_job)
    except Exception as err:
        # Crash-log collection is best effort; it must not turn into a
        # repair failure, so every exception is suppressed here.
        logging.error('%s: Failed while trying to collect crash-logs: %s',
                      self._CRASHLOGS_PREFIX, err)
1267
1268
def _need_crash_logs(self):
    """Look up the need_crash_logs attribute recorded for this host.

    The attribute is queried from the AFE by hostname; at most one match
    is expected.

    @return: The value of the need_crash_logs attribute, or None if the
             host has no such attribute.
    """
    matches = self._AFE.get_host_attribute(
            constants.CRASHLOGS_HOST_ATTRIBUTE, hostname=self.hostname)
    assert len(matches) < 2
    if not matches:
        return None
    return matches[0].value
1279
1280
def _collect_crashlogs(self, job_id):
    """Grab logs from the host on which a job crashed.

    If PRIOR_LOGS_DIR exists on the host, those stashed logs are
    collected. Otherwise, if the lab-machine marker (_LAB_MACHINE_FILE)
    exists, the host was repaired automatically and the normal system
    logs are collected. If neither exists, collection is skipped with a
    warning.

    Whatever the outcome, a marker file holding the job id is written,
    the need_crash_logs host attribute is cleared, and (when prior logs
    were found) PRIOR_LOGS_DIR is removed from the host.

    @param job_id: Id of the job that crashed.
    """
    dest_dir = crashcollect.get_crashinfo_dir(
            self, constants.CRASHLOGS_DEST_DIR_PREFIX)

    found_prior_logs = self.path_exists(client_constants.PRIOR_LOGS_DIR)
    if found_prior_logs:
        self._collect_prior_logs(dest_dir)
    elif self.path_exists(self._LAB_MACHINE_FILE):
        self._collect_system_logs(dest_dir)
    else:
        logging.warning('%s: Host was manually re-installed without '
                        '--lab_preserve_log option. Skip collecting '
                        'crash-logs.', self._CRASHLOGS_PREFIX)

    # Crash collection is a one-time effort: _collect_prior_logs() and
    # _collect_system_logs() handle their own exceptions, so the steps
    # below run even when collection failed. This method is only reached
    # when the host is up (see try_collect_crashlogs()), where failures
    # are assumed to be rare, and it is unclear how often a retry could
    # be made without triggering another repair unnecessarily.
    # Therefore collection is attempted exactly once.

    # Drop the marker as soon as collection is done; it carries the job
    # id for gs_offloader to consume.
    marker_path = os.path.join(dest_dir, constants.CRASHLOGS_MARKER)
    with open(marker_path, 'a') as marker:
        marker.write('%s\n' % job_id)

    # Clear the need_crash_logs attribute.
    logging.debug('%s: Remove attribute need_crash_logs from host %s',
                  self._CRASHLOGS_PREFIX, self.hostname)
    self._AFE.set_host_attribute(constants.CRASHLOGS_HOST_ATTRIBUTE,
                                 None, hostname=self.hostname)

    if not found_prior_logs:
        return
    logging.debug('%s: Remove %s from host %s', self._CRASHLOGS_PREFIX,
                  client_constants.PRIOR_LOGS_DIR, self.hostname)
    self.run('rm -rf %s; sync' % client_constants.PRIOR_LOGS_DIR)
    # Give the removal a few seconds to be flushed all the way down to
    # storage.
    time.sleep(self._SAFE_WAIT_SECS)
1337
1338
def _collect_prior_logs(self, crashlogs_dir):
    """Fetch the logs that were stashed before the host was re-installed.

    Failures are logged and swallowed; this method does not raise for a
    failed collection.

    @param crashlogs_dir: Directory path where crash-logs are stored.
    """
    prior_dir = client_constants.PRIOR_LOGS_DIR
    logging.debug('%s: Found %s, collecting them...',
                  self._CRASHLOGS_PREFIX, prior_dir)
    try:
        self.collect_logs(prior_dir, crashlogs_dir, False)
    except Exception as err:
        logging.error('%s: Failed to collect %s: %s',
                      self._CRASHLOGS_PREFIX, prior_dir, err)
        return
    try:
        logging.debug('%s: %s is collected',
                      self._CRASHLOGS_PREFIX, prior_dir)
    except Exception as err:
        logging.error('%s: Failed to collect %s: %s',
                      self._CRASHLOGS_PREFIX, prior_dir, err)
1355
1356
def _collect_system_logs(self, crashlogs_dir):
    """Fetch the normal system logs from a host.

    The list of sources is read from _LOGS_TO_COLLECT_FILE. Each source
    is handled independently: one that is missing on the host is
    skipped, and a failure on one is logged without stopping the rest.

    @param crashlogs_dir: Directory path where crash-logs are stored.
    """
    logging.debug('%s: Found %s, collecting system logs...',
                  self._CRASHLOGS_PREFIX, self._LAB_MACHINE_FILE)
    log_sources = server_utils.parse_simple_config(
            self._LOGS_TO_COLLECT_FILE)
    for source in log_sources:
        try:
            if not self.path_exists(source):
                continue
            logging.debug('%s: Collecting %s...',
                          self._CRASHLOGS_PREFIX, source)
            target = server_utils.concat_path_except_last(
                    crashlogs_dir, source)
            self.collect_logs(source, target, False)
            logging.debug('%s: %s is collected',
                          self._CRASHLOGS_PREFIX, source)
        except Exception as err:
            logging.error('%s: Failed to collect %s: %s',
                          self._CRASHLOGS_PREFIX, source, err)
1378
1379
def close(self):
    """Disconnect all rpc connections, then run the parent close()."""
    self.rpc_disconnect_all()
    parent = super(CrosHost, self)
    parent.close()
J. Richard Barnette1d78b012012-05-15 13:56:30 -07001383
1384
def get_power_supply_info(self):
    """Get the output of power_supply_info.

    power_supply_info outputs the info of each power supply, e.g.,
    Device: Line Power
      online:                  no
      type:                    Mains
      voltage (V):             0
      current (A):             0
    Device: Battery
      state:                   Discharging
      percentage:              95.9276
      technology:              Li-ion

    Above output shows two devices, Line Power and Battery, with details of
    each device listed. This function parses the output into a dictionary,
    with key being the device name, and value being a dictionary of details
    of the device info.

    Each line is split on its first colon only, so a value that itself
    contains a colon is kept whole. Lines without a colon, and properties
    listed before the first "Device:" line, are ignored.

    @return: The dictionary of power_supply_info, e.g.,
             {'Line Power': {'online': 'yes', 'type': 'main'},
              'Battery': {'vendor': 'xyz', 'percentage': '100'}}
    @raise error.AutoservRunError if power_supply_info tool is not found in
           the DUT. Caller should handle this error to avoid false failure
           on verification.
    """
    output = self.run('power_supply_info').stdout.strip()
    info = {}
    device_name = None
    device_info = {}
    for line in output.split('\n'):
        # partition() cuts at the first ':' only; a plain split(':')
        # would break values that contain colons into extra fields.
        key, colon, value = line.partition(':')
        if not colon:
            continue
        key = key.strip()
        value = value.strip()
        if key == 'Device':
            # A new device starts: store the one collected so far.
            if device_name:
                info[device_name] = device_info
            device_name = value
            device_info = {}
        else:
            device_info[key] = value
    # Store the last device, which has no following "Device:" line.
    if device_name and device_name not in info:
        info[device_name] = device_info
    return info
1429
1430
def get_battery_percentage(self):
    """Read the battery charge level from power_supply_info.

    @return: The battery level as a float, taken from the 'percentage'
             entry of the 'Battery' device. None if that entry is
             missing, is not a number, or power_supply_info fails with
             error.AutoservRunError.
    """
    try:
        supply_info = self.get_power_supply_info()
        logging.info(supply_info)
        battery = supply_info['Battery']
        return float(battery['percentage'])
    except (KeyError, ValueError, error.AutoservRunError):
        return None
1443
1444
def is_ac_connected(self):
    """Check whether the dut reports its power adapter as online.

    @return: True if the 'Line Power' device reports online == 'yes',
             False if it reports anything else, and None if that
             information is missing or power_supply_info fails with
             error.AutoservRunError.
    """
    try:
        line_power = self.get_power_supply_info()['Line Power']
        online_state = line_power['online']
    except (KeyError, error.AutoservRunError):
        return None
    return online_state == 'yes'
Dan Shi49ca0932014-11-14 11:22:27 -08001455
1456
def _cleanup_poweron(self):
    """Special cleanup method to make sure hosts always get power back.

    Does nothing unless the host carries the _RPM_OUTLET_CHANGED
    attribute in the AFE. Otherwise the host is powered on and the
    attribute is cleared.

    If powering on fails, the failure is logged and posted to
    autotest_es, and then:
      - the exception is re-raised when the battery level is known and
        below 50% (a level of 0% counts as known);
      - otherwise it is suppressed, and the attribute is cleared if the
        power adapter is reported as connected.

    @raise rpm_client.RemotePowerException: if power on fails and the
            battery level is known to be below 50%.
    """
    afe = frontend_wrappers.RetryingAFE(timeout_min=5, delay_sec=10)
    hosts = afe.get_hosts(hostname=self.hostname)
    if not hosts or self._RPM_OUTLET_CHANGED not in hosts[0].attributes:
        return
    logging.debug('This host has recently interacted with the RPM'
                  ' Infrastructure. Ensuring power is on.')
    try:
        self.power_on()
        afe.set_host_attribute(self._RPM_OUTLET_CHANGED, None,
                               hostname=self.hostname)
    except rpm_client.RemotePowerException:
        logging.error('Failed to turn Power On for this host after '
                      'cleanup through the RPM Infrastructure.')
        autotest_es.post(
                type_str='RPM_poweron_failure',
                metadata={'hostname': self.hostname})

        battery_percentage = self.get_battery_percentage()
        # Compare against None explicitly: a plain truthiness test would
        # treat a reading of 0.0 as "unknown" and hide the failure on a
        # fully drained battery.
        if battery_percentage is not None and battery_percentage < 50:
            raise
        elif self.is_ac_connected():
            logging.info('The device has power adapter connected and '
                         'charging. No need to try to turn RPM on '
                         'again.')
            afe.set_host_attribute(self._RPM_OUTLET_CHANGED, None,
                                   hostname=self.hostname)
        logging.info('Battery level is now at %s%%. The device may '
                     'still have enough power to run test, so no '
                     'exception will be raised.', battery_percentage)
1489
Simran Basi5e6339a2013-03-21 11:34:32 -07001490
beepsc87ff602013-07-31 21:53:00 -07001491 def _is_factory_image(self):
1492 """Checks if the image on the DUT is a factory image.
1493
1494 @return: True if the image on the DUT is a factory image.
1495 False otherwise.
1496 """
1497 result = self.run('[ -f /root/.factory_test ]', ignore_status=True)
1498 return result.exit_status == 0
1499
1500
def _restart_ui(self):
    """Restart the Chrome UI.

    The chrome session identifier is captured before the ui job is
    stopped and started again, and is then handed to
    cros_ui.wait_for_chrome_ready().

    @raises: FactoryImageCheckerException for factory images, since
             we cannot attempt to restart ui on them.
             error.AutoservRunError for any other type of error that
             occurs while restarting ui.
    """
    on_factory_image = self._is_factory_image()
    if on_factory_image:
        raise FactoryImageCheckerException('Cannot restart ui on factory '
                                           'images')

    # TODO(jrbarnette): The command to stop/start the ui job
    # should live inside cros_ui, too.  However that would seem
    # to imply interface changes to the existing start()/restart()
    # functions, which is a bridge too far (for now).
    session_ident = cros_ui.get_chrome_session_ident(self)
    self.run('stop ui; start ui')
    cros_ui.wait_for_chrome_ready(session_ident, self)
beepsc87ff602013-07-31 21:53:00 -07001520
1521
def get_release_version(self):
    """Get the value of attribute CHROMEOS_RELEASE_VERSION from lsb-release.

    The lsb-release file is read from the DUT and parsed by
    lsbrelease_utils.

    @returns The version string in lsb-release, under attribute
             CHROMEOS_RELEASE_VERSION.
    """
    read_cmd = 'cat "%s"' % client_constants.LSB_RELEASE
    content = self.run(read_cmd).stdout.strip()
    return lsbrelease_utils.get_chromeos_release_version(
            lsb_release_content=content)
1532
1533
def verify_cros_version_label(self):
    """Make sure host's cros-version label match the actual image in dut.

    Remove any cros-version: label that doesn't match that installed in
    the dut. If at least one label had to be removed, the mismatch is
    posted to autotest_es and an error is raised.

    @raise error.AutoservError: If any mismatch between cros-version label
                                and the build installed in dut is found.
    """
    labels = self._AFE.get_labels(
            name__startswith=ds_constants.VERSION_PREFIX,
            host__hostname=self.hostname)
    mismatch_found = False
    if labels:
        # Get CHROMEOS_RELEASE_VERSION from lsb-release, e.g., 6908.0.0.
        # Note that it's different from cros-version label, which has
        # builder and branch info, e.g.,
        # cros-version:peppy-release/R43-6908.0.0
        release_version = self.get_release_version()
        host_list = [self.hostname]
        prefix_len = len(ds_constants.VERSION_PREFIX)
        for label in labels:
            # Remove any cros-version label that does not match
            # release_version.
            build_version = label.name[prefix_len:]
            if not utils.version_match(build_version, release_version):
                # logging.warning, not the deprecated logging.warn
                # alias, to match the rest of this file.
                logging.warning('cros-version label "%s" does not match '
                                'release version %s. Removing the label.',
                                label.name, release_version)
                label.remove_hosts(hosts=host_list)
                mismatch_found = True
    if mismatch_found:
        autotest_es.post(use_http=True,
                         type_str='cros_version_label_mismatch',
                         metadata={'hostname': self.hostname})
        raise error.AutoservError('The host has wrong cros-version label.')
1571
1572
def cleanup(self):
    """Clean up the host after a job.

    Removes the CLEANUP_LOGS_PAUSED_FILE marker, restarts the UI (or
    falls back to the parent cleanup when that fails), restores power
    through the RPM if the host has power control, and finally verifies
    the cros-version label.
    """
    paused_marker = client_constants.CLEANUP_LOGS_PAUSED_FILE
    self.run('rm -f %s' % paused_marker)
    try:
        self._restart_ui()
    except (error.AutotestRunError, error.AutoservRunError,
            FactoryImageCheckerException):
        logging.warning('Unable to restart ui, rebooting device.')
        # Restarting the UI failed, so fall back to the normal Autotest
        # cleanup routines, i.e. reboot the machine.
        super(CrosHost, self).cleanup()
    # Check if the rpm outlet was manipulated.
    rpm_controlled = self.has_power()
    if rpm_controlled:
        self._cleanup_poweron()
    self.verify_cros_version_label()
J. Richard Barnette45e93de2012-04-11 17:24:15 -07001587
1588
def reboot(self, **dargs):
    """
    Reboot the site host.

    The more generic RemoteHost.reboot() performs sync and sleeps for 5
    seconds. This is not necessary for Chrome OS devices as the sync
    should be finished in a short time during the reboot command.

    Defaults filled in when the caller did not supply them:
      - reboot_cmd: a backgrounded 'reboot', followed by 'reboot -f'
        after reboot_timeout seconds (default 10).
      - fastsync: True.
    The 'board' argument is always set from get_board().

    @param dargs: Keyword arguments passed on to the parent reboot().
    """
    if 'reboot_cmd' not in dargs:
        force_delay = dargs.get('reboot_timeout', 10)
        cmd_template = ('((reboot & sleep %d; reboot -f &)'
                        ' </dev/null >/dev/null 2>&1 &)')
        dargs['reboot_cmd'] = cmd_template % force_delay
    # Enable fastsync to avoid running extra sync commands before reboot.
    dargs.setdefault('fastsync', True)

    # For purposes of logging reboot times:
    # Get the board name i.e. 'daisy_spring'
    board_label = self.get_board()

    # Strip everything up to the first ':' (the label prefix) and add
    # the remainder to dargs.
    prefix_end = board_label.find(':') + 1
    dargs['board'] = board_label[prefix_end:]
    super(CrosHost, self).reboot(**dargs)
Yu-Ju Honga2be94a2012-07-31 09:48:52 -07001613
1614
def suspend(self, **dargs):
    """
    Suspend the site host.

    'timeout' is always set to suspend_time (default 60). Unless the
    caller supplies 'suspend_cmd', a command is built that programs the
    rtc0 wake alarm for suspend_time seconds and then calls
    powerd_dbus_suspend in the background.

    @param dargs: Keyword arguments passed on to the parent suspend().
    """
    wake_after = dargs.get('suspend_time', 60)
    dargs['timeout'] = wake_after
    if 'suspend_cmd' not in dargs:
        steps = ['echo 0 > /sys/class/rtc/rtc0/wakealarm',
                 'echo +%d > /sys/class/rtc/rtc0/wakealarm' % wake_after,
                 'powerd_dbus_suspend --delay=0 &']
        chained = ' && '.join(steps)
        dargs['suspend_cmd'] = ('(( %s )'
                                '< /dev/null >/dev/null 2>&1 &)' % chained)
    super(CrosHost, self).suspend(**dargs)
1628
1629
def upstart_status(self, service_name):
    """Check the status of an upstart init script.

    The status command is run with ignore_status=True so that a stopped
    or unknown service yields False rather than an error from a
    non-zero exit status.

    @param service_name: Service to look up.

    @returns True if the service is running, False otherwise.
    """
    status_output = self.run('status %s' % service_name,
                             ignore_status=True).stdout
    return 'start/running' in status_output
1639
1640
def verify_software(self):
    """Verify working software on a Chrome OS system.

    Checks, in order:
      1. No crash-log collection is pending for this host.
      2. All conditions tested by the parent version of this
         function.
      3. Sufficient inodes in /mnt/stateful_partition.
      4. Sufficient space in /mnt/stateful_partition.
      5. Sufficient space in /mnt/stateful_partition/encrypted, when
         that path exists.
      6. The system-services upstart job is running.
      7. update_engine_client answers a status request (skipped on
         factory images).
      8. python on the DUT can import cPickle.
      9. The cros-version labels match the installed image.

    @raise error.AutoservCrashLogCollectRequired: if crash-logs still
            have to be collected from this host.
    @raise error.AutoservError: if system-services is not running.
    """
    # A job crashed on this host: hold off verification until its
    # crash-logs have been collected.
    crash_logs_pending = self._need_crash_logs()
    if crash_logs_pending:
        raise error.AutoservCrashLogCollectRequired(
                'Need to collect crash-logs before verification')

    super(CrosHost, self).verify_software()

    stateful_path = '/mnt/stateful_partition'
    config = global_config.global_config
    required_kilo_inodes = config.get_config_value(
            'SERVER', 'kilo_inodes_required', type=int, default=100)
    self.check_inodes(stateful_path, required_kilo_inodes)
    required_gb = config.get_config_value(
            'SERVER', 'gb_diskspace_required', type=float, default=20.0)
    self.check_diskspace(stateful_path, required_gb)

    encrypted_stateful_path = '/mnt/stateful_partition/encrypted'
    # Not all targets build with encrypted stateful support.
    if self.path_exists(encrypted_stateful_path):
        required_encrypted_gb = config.get_config_value(
                'SERVER', 'gb_encrypted_diskspace_required', type=float,
                default=0.1)
        self.check_diskspace(encrypted_stateful_path,
                             required_encrypted_gb)

    services_running = self.upstart_status('system-services')
    if not services_running:
        raise error.AutoservError('Chrome failed to reach login. '
                                  'System services not running.')

    # Factory images don't run update engine,
    # goofy controls dbus on these DUTs.
    if not self._is_factory_image():
        self.run('update_engine_client --status')
    # Makes sure python is present, loads and can use built in functions.
    # We have seen cases where importing cPickle fails with undefined
    # symbols in cPickle.so.
    self.run('python -c "import cPickle"')

    self.verify_cros_version_label()
1692
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07001693
def verify_hardware(self):
    """Verify hardware system of a Chrome OS system.

    Logs the following hardware conditions; nothing is enforced:
    1. Battery level.
    2. Is power adapter connected.
    """
    logging.info('Battery percentage: %s', self.get_battery_percentage())
    # Query the adapter state once, so that the decision and the logged
    # message are based on the same answer.
    ac_connected = self.is_ac_connected()
    if ac_connected is None:
        logging.info('Can not determine if the device has power adapter '
                     'connected.')
    else:
        logging.info('Device %s power adapter connected and charging.',
                     'has' if ac_connected else 'does not have')
Dan Shi49ca0932014-11-14 11:22:27 -08001708
1709
def make_ssh_command(self, user='root', port=22, opts='', hosts_file=None,
                     connect_timeout=None, alive_interval=None):
    """Override default make_ssh_command to use options tuned for Chrome OS.

    Tuning changes:
      - ConnectTimeout=30; maximum of 30 seconds allowed for an SSH
      connection failure.  Consistency with remote_access.sh.

      - ServerAliveInterval=900; which causes SSH to ping connection every
      900 seconds. In conjunction with ServerAliveCountMax ensures
      that if the connection dies, Autotest will bail out.
      Originally tried 60 secs, but saw frequent job ABORTS where
      the test completed successfully. Later increased from 180 seconds to
      900 seconds to account for tests where the DUT is suspended for
      longer periods of time.

      - ServerAliveCountMax=3; consistency with remote_access.sh.

      - ConnectionAttempts=4; reduce flakiness in connection errors;
      consistency with remote_access.sh.

      - UserKnownHostsFile=/dev/null; we don't care about the keys.
      Host keys change with every new installation, don't waste
      memory/space saving them.

      - SSH protocol forced to 2; needed for ServerAliveInterval.

    @param user User name to use for the ssh connection.
    @param port Port on the target host to use for ssh connection.
    @param opts Additional options to the ssh command.
    @param hosts_file Ignored.
    @param connect_timeout Ignored.
    @param alive_interval Ignored.

    @return The ssh command line, without the target host name.
    """
    segments = [
        '/usr/bin/ssh -a -x %(verbosity)s %(ssh_options)s %(opts)s',
        '-o StrictHostKeyChecking=no',
        '-o UserKnownHostsFile=/dev/null -o BatchMode=yes',
        '-o ConnectTimeout=30 -o ServerAliveInterval=900',
        '-o ServerAliveCountMax=3 -o ConnectionAttempts=4',
        '-o Protocol=2 -l %(user)s -p %(port)d',
    ]
    values = {
        'verbosity': self._ssh_verbosity_flag,
        'ssh_options': self._ssh_options,
        'opts': opts,
        'user': user,
        'port': port,
    }
    return ' '.join(segments) % values
Fang Deng96667ca2013-08-01 17:46:18 -07001752
1753
def _create_ssh_tunnel(self, port, local_port):
    """Start an ssh process that forwards local_port to port on the host.

    @param port: remote port on the host.
    @param local_port: local forwarding port.

    @return: the tunnel process.
    """
    # Chrome OS on the target closes down most external ports
    # for security.  We could open the port, but doing that
    # would conflict with security tests that check that only
    # expected ports are open.  So, to get to the port on the
    # target we use an ssh tunnel.
    forward_opts = '-n -N -q -L %d:localhost:%d' % (local_port, port)
    tunnel_cmd = '%s %s' % (self.make_ssh_command(opts=forward_opts),
                            self.hostname)
    logging.debug('Full tunnel command: %s', tunnel_cmd)
    process = subprocess.Popen(tunnel_cmd, shell=True, close_fds=True)
    logging.debug('Started ssh tunnel, local = %d'
                  ' remote = %d, pid = %d',
                  local_port, port, process.pid)
    return process
1776
1777
def _setup_rpc(self, port, command_name, remote_pid=None):
    """Sets up a tunnel process and performs rpc connection book keeping.

    This method assumes that xmlrpc and jsonrpc never conflict, since
    we can only either have an xmlrpc or a jsonrpc server listening on
    a remote port. As such, it enforces a single proxy->remote port
    policy, i.e if one starts a jsonrpc proxy/server from port A->B,
    and then tries to start an xmlrpc proxy forwarded to the same port,
    the xmlrpc proxy will override the jsonrpc tunnel process, however:

    1. None of the methods on the xmlrpc proxy will work because
    the server listening on B is jsonrpc.

    2. The xmlrpc client cannot initiate a termination of the JsonRPC
    server, as the only use case currently is goofy, which is tied to
    the factory image. It is much easier to handle a failed xmlrpc
    call on the client than it is to terminate goofy in this scenario,
    as doing the latter might leave the DUT in a hard to recover state.

    With the current implementation newer rpc proxy connections will
    terminate the tunnel processes of older rpc connections tunneling
    to the same remote port. If methods are invoked on the client
    after this has happened they will fail with connection closed errors.

    @param port: The remote forwarding port.
    @param command_name: The name of the remote process, to terminate
                         using pkill.
    @param remote_pid: Recorded in _rpc_proxy_map together with
                       command_name and the tunnel process.

    @return A url that we can use to initiate the rpc connection.
    """
    # Drop whatever connection is already registered for this port.
    self.rpc_disconnect(port)
    forwarded_port = utils.get_unused_port()
    tunnel = self._create_ssh_tunnel(port, forwarded_port)
    bookkeeping = (command_name, tunnel, remote_pid)
    self._rpc_proxy_map[port] = bookkeeping
    return self._RPC_PROXY_URL % forwarded_port
1813
1814
def xmlrpc_connect(self, command, port, command_name=None,
                   ready_test_name=None, timeout_seconds=10,
                   logfile='/dev/null'):
    """Connect to an XMLRPC server on the host.

    The `command` argument should be a simple shell command that
    starts an XMLRPC server on the given `port`.  The command
    must not daemonize, and must terminate cleanly on SIGTERM.
    The command is started in the background on the host, and a
    local XMLRPC client for the server is created and returned
    to the caller.

    Note that the process of creating an XMLRPC client makes no
    attempt to connect to the remote server; the caller is
    responsible for determining whether the server is running
    correctly, and is ready to serve requests.

    Optionally, the caller can pass ready_test_name, a string
    containing the name of a method to call on the proxy.  This
    method should take no parameters and return successfully only
    when the server is ready to process client requests.  When
    ready_test_name is set, xmlrpc_connect will block until the
    proxy is ready, and an exception is raised if the server isn't
    ready by timeout_seconds; in that case the connection is torn
    down again through rpc_disconnect.

    If a server is already running on the remote port, this
    method will kill it and disconnect the tunnel process
    associated with the connection before establishing a new one,
    by consulting the rpc_proxy_map in rpc_disconnect.

    @param command Shell command to start the server.
    @param port Port number on which the server is expected to
                be serving.
    @param command_name String to use as input to `pkill` to
        terminate the XMLRPC server on the host.
    @param ready_test_name String containing the name of a
        method defined on the XMLRPC server.
    @param timeout_seconds Number of seconds to wait
        for the server to become 'ready.'  The exact exception
        type on timeout comes from retry.retry (not visible
        here; TODO confirm).
    @param logfile Logfile to send output when running
        'command' argument.

    @return The XMLRPC client proxy.
    """
    # Clean up any existing state.  If the caller is willing
    # to believe their server is down, we ought to clean up
    # any tunnels we might have sitting around.
    self.rpc_disconnect(port)
    # Start the server on the host.  Redirection in the command
    # below is necessary, because 'ssh' won't terminate until
    # background child processes close stdin, stdout, and
    # stderr.
    launch_cmd = '%s </dev/null >%s 2>&1 & echo $!' % (command, logfile)
    server_pid = self.run(launch_cmd).stdout.rstrip('\n')
    logging.debug('Started XMLRPC server on host %s, pid = %s',
                  self.hostname, server_pid)

    # Tunnel through SSH to be able to reach that remote port.
    tunnel_url = self._setup_rpc(port, command_name, remote_pid=server_pid)
    proxy = xmlrpclib.ServerProxy(tunnel_url, allow_none=True)

    if ready_test_name is not None:
        # retry.retry logs each attempt; calculate delay_sec to
        # keep log spam to a dull roar.
        @retry.retry((socket.error,
                      xmlrpclib.ProtocolError,
                      httplib.BadStatusLine),
                     timeout_min=timeout_seconds / 60.0,
                     delay_sec=min(max(timeout_seconds / 20.0, 0.1), 1))
        def ready_test():
            """ Call proxy.ready_test_name(). """
            getattr(proxy, ready_test_name)()

        server_ready = False
        try:
            logging.info('Waiting %d seconds for XMLRPC server '
                         'to start.', timeout_seconds)
            ready_test()
            server_ready = True
        finally:
            # Runs for every kind of failure, including ones that
            # retry.retry does not catch; the exception still
            # propagates to the caller afterwards.
            if not server_ready:
                logging.error('Failed to start XMLRPC server.')
                self.rpc_disconnect(port)
    logging.info('XMLRPC server started successfully.')
    return proxy
J. Richard Barnette1d78b012012-05-15 13:56:30 -07001899
J. Richard Barnette1d78b012012-05-15 13:56:30 -07001900
def syslog(self, message, tag='autotest'):
    """Log a message to syslog on the host using `logger`.

    `tag` and `message` are each passed to the remote shell as a
    single-quoted word (embedded single quotes are escaped), so
    quotes, `$` and backticks in the text are logged literally
    instead of being interpreted by the shell.  A `--` precedes the
    message so that text starting with `-` is not parsed as an
    option by `logger`.

    @param message String message to log into syslog.
    @param tag String tag prefix for syslog.

    """
    def shell_quote(text):
        """Return `text` as one single-quoted POSIX shell word."""
        return "'%s'" % ('%s' % (text,)).replace("'", "'\\''")

    self.run('logger -t %s -- %s' % (shell_quote(tag),
                                     shell_quote(message)))
1909
1910
def jsonrpc_connect(self, port):
    """Create a jsonrpc client proxy reached through an ssh tunnel.

    This exists to talk to goofy (the default system manager on
    factory images), and leaves most rpc server sanity checking to
    the caller.  Unlike xmlrpc_connect, no remote server is started
    here: the only clients are factory tests, where goofy is built
    into the image and starts when the target boots.

    Several jsonrpc proxies could in theory be forwarded to the same
    remote port as long as an rpc server is listening there, but that
    risks leaking an existing tunnel process, so older tunnels are
    always disconnected through rpc_disconnect.
    NOTE(review): that disconnect is not visible in this method;
    presumably it happens inside _setup_rpc -- confirm.

    @param port: port on the remote host that is serving this proxy.

    @return: The client proxy, or None if jsonrpclib is unavailable.
    """
    if jsonrpclib:
        # No remote command name: there is no server for us to manage.
        rpc_url = self._setup_rpc(port, None)
        client = jsonrpclib.jsonrpc.ServerProxy(rpc_url)
        logging.info('Established a jsonrpc connection through port %s.',
                     port)
        return client

    logging.warning('Jsonrpclib could not be imported. Check that '
                    'site-packages contains jsonrpclib.')
    return None
1941
1942
def rpc_disconnect(self, port):
    """Disconnect from an RPC server on the host.

    Terminates the remote RPC server previously started for
    the given `port`.  Also closes the local ssh tunnel created
    for the connection to the host.  This function does not
    directly alter the state of a previously returned RPC
    client object; however disconnection will cause all
    subsequent calls to methods on the object to fail.

    The local tunnel is torn down and the port is forgotten even
    when stopping the remote server fails, so a failed shutdown
    does not leak the tunnel process.

    This function does nothing if requested to disconnect a port
    that was not previously connected via _setup_rpc.

    @param port Port number passed to a previous call to
                `_setup_rpc()`.

    @exception TestError The remote server was still running after
                         `_RPC_SHUTDOWN_TIMEOUT_SECONDS`.
    """
    if port not in self._rpc_proxy_map:
        return
    remote_name, tunnel_proc, remote_pid = self._rpc_proxy_map[port]
    try:
        if remote_name:
            # We use 'pkill' to find our target process rather than
            # a PID, because the host may have rebooted since
            # connecting, and we don't want to kill an innocent
            # process with the same PID.
            #
            # 'pkill' helpfully exits with status 1 if no target
            # process is found, for which run() will throw an
            # exception.  We don't want that, so we ignore the
            # status.
            self.run("pkill -f '%s'" % remote_name, ignore_status=True)
            if remote_pid:
                logging.info('Waiting for RPC server "%s" shutdown',
                             remote_name)
                start_time = time.time()
                while (time.time() - start_time <
                       self._RPC_SHUTDOWN_TIMEOUT_SECONDS):
                    running_processes = self.run(
                            "pgrep -f '%s'" % remote_name,
                            ignore_status=True).stdout.split()
                    if remote_pid not in running_processes:
                        logging.info('Shut down RPC server.')
                        break
                    time.sleep(self._RPC_SHUTDOWN_POLLING_PERIOD_SECONDS)
                else:
                    # The loop ran out of time without seeing the
                    # server's PID disappear.
                    raise error.TestError(
                            'Failed to shutdown RPC server %s' % remote_name)
    finally:
        # Always release local resources, whether or not the remote
        # side could be stopped.
        if tunnel_proc.poll() is None:
            tunnel_proc.terminate()
            logging.debug('Terminated tunnel, pid %d', tunnel_proc.pid)
        else:
            logging.debug('Tunnel pid %d terminated early, status %d',
                          tunnel_proc.pid, tunnel_proc.returncode)
        del self._rpc_proxy_map[port]
J. Richard Barnette1d78b012012-05-15 13:56:30 -07001997
1998
def rpc_disconnect_all(self):
    """Disconnect all known RPC proxy ports.

    Calls rpc_disconnect() once for every port currently recorded in
    `_rpc_proxy_map`.
    """
    # rpc_disconnect() deletes entries from the map, so iterate over
    # an explicit snapshot of the ports rather than the live dict.
    for port in list(self._rpc_proxy_map):
        self.rpc_disconnect(port)
J. Richard Barnette1d78b012012-05-15 13:56:30 -07002003
2004
def poor_mans_rpc(self, fun):
    """
    Build a shell command that prints the result of a client utils call.

    The command changes into the `bin` directory below the path
    reported by autotest.Autotest.get_installed_autodir() and runs a
    `python -c` one-liner that imports `common` and `utils` and prints
    `utils.<fun>`.  Nothing is executed here; the caller is expected
    to hand the returned string to run() and read its stdout.

    @param fun call expression in the client utils namespace, e.g.
               'get_gpu_family()'.
    @return the shell command string.
    """
    autodir = autotest.Autotest.get_installed_autodir(self)
    pieces = [
        'cd %s/bin; ' % autodir,
        'python -c "import common; import utils;',
        'print utils.%s"' % fun,
    ]
    return ''.join(pieces)
2016
2017
def _ping_check_status(self, status):
    """Ping the host a single time and compare against `status`.

    @param status Expected ping status to compare with.
    @return True iff `status` agrees with the ping result, i.e. both
            are True (host answered) or both are False.

    """
    exit_code = utils.ping(self.hostname, tries=1, deadline=1)
    # An exit code of 0 from ping means the host answered.
    host_answered = (exit_code == 0)
    mismatch = status ^ host_answered
    return not mismatch
2028
2029 def _ping_wait_for_status(self, status, timeout):
2030 """Wait for the host to have a given status (UP or DOWN).
2031
2032 Status is checked by polling. Polling will not last longer
2033 than the number of seconds in `timeout`. The polling
2034 interval will be long enough that only approximately
2035 _PING_WAIT_COUNT polling cycles will be executed, subject
2036 to a maximum interval of about one minute.
2037
2038 @param status Waiting will stop immediately if `ping` of the
2039 host returns this status.
2040 @param timeout Poll for at most this many seconds.
2041 @return True iff the host status from `ping` matched the
2042 requested status at the time of return.
2043
2044 """
2045 # _ping_check_status() takes about 1 second, hence the
2046 # "- 1" in the formula below.
2047 poll_interval = min(int(timeout / self._PING_WAIT_COUNT), 60) - 1
2048 end_time = time.time() + timeout
2049 while time.time() <= end_time:
2050 if self._ping_check_status(status):
2051 return True
2052 if poll_interval > 0:
2053 time.sleep(poll_interval)
2054
2055 # The last thing we did was sleep(poll_interval), so it may
2056 # have been too long since the last `ping`. Check one more
2057 # time, just to be sure.
2058 return self._ping_check_status(status)
2059
def ping_wait_up(self, timeout):
    """Wait until the host answers `ping`.

    N.B. This is not a reliable replacement for `wait_up()`: a host
    that answers ping does not necessarily answer ssh.  Only use it
    when the target DUT can be considered functional even though it
    cannot be reached via ssh.

    @param timeout Minimum time to allow before declaring the
                   host to be non-responsive.
    @return True iff the host answered to ping before the timeout.

    """
    wanted = self._PING_STATUS_UP
    return self._ping_wait_for_status(wanted, timeout)
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07002075
def ping_wait_down(self, timeout):
    """Wait until the host stops answering `ping`.

    This can serve as a slightly faster variant of `wait_down()`,
    since it avoids potentially long ssh timeouts.

    @param timeout Minimum time to allow for the host to become
                   non-responsive.
    @return True iff the host quit answering ping before the
            timeout.

    """
    wanted = self._PING_STATUS_DOWN
    return self._ping_wait_for_status(wanted, timeout)
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07002089
def test_wait_for_sleep(self, sleep_timeout=None):
    """Wait for the client to enter low-power sleep mode.

    "Asleep" is detected by the host no longer answering ping, which
    cannot be told apart from a system that is powered off.  To
    confirm the unit really was asleep, force a resume and then call
    `test_wait_for_resume()`.

    A test is expected to use this as part of a sequence like:

    ~~~~~~~~
        boot_id = host.get_boot_id()
        # trigger sleep on the host
        host.test_wait_for_sleep()
        # trigger resume on the host
        host.test_wait_for_resume(boot_id)
    ~~~~~~~~

    @param sleep_timeout time limit in seconds to allow the host
                         to sleep; defaults to SLEEP_TIMEOUT.

    @exception TestFail The host did not go to sleep within
                        the allowed time.
    """
    limit = self.SLEEP_TIMEOUT if sleep_timeout is None else sleep_timeout

    went_down = self.ping_wait_down(timeout=limit)
    if went_down:
        return
    raise error.TestFail(
            'client failed to sleep after %d seconds' % limit)
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07002120
2121
def test_wait_for_resume(self, old_boot_id, resume_timeout=None):
    """Wait for the client to resume from low-power sleep mode.

    `old_boot_id` should be the value of `get_boot_id()` taken
    before the host went to sleep.  If the boot id is different
    after the host comes back, the host rebooted instead of
    resuming and `TestFail` is raised.

    See @ref test_wait_for_sleep for more on this function's
    usage.

    @param old_boot_id A boot id value obtained before the
                       target host went to sleep.
    @param resume_timeout time limit in seconds to allow the host
                          to come up; defaults to RESUME_TIMEOUT.

    @exception TestFail The host did not respond within the
                        allowed time.
    @exception TestFail The host responded, but the boot id test
                        indicated a reboot rather than a sleep
                        cycle.
    """
    limit = resume_timeout
    if limit is None:
        limit = self.RESUME_TIMEOUT

    if not self.wait_up(timeout=limit):
        raise error.TestFail(
                'client failed to resume from sleep after %d seconds' %
                limit)

    current_boot_id = self.get_boot_id()
    if current_boot_id != old_boot_id:
        logging.error('client rebooted (old boot %s, new boot %s)',
                      old_boot_id, current_boot_id)
        raise error.TestFail(
                'client rebooted, but sleep was expected')
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07002156
2157
def test_wait_for_shutdown(self, shutdown_timeout=None):
    """Wait for the client to shut down.

    "Shut down" is detected by the host no longer answering ping,
    which cannot be told apart from a system that is merely asleep.
    To confirm the unit really was down, force a boot and then call
    test_wait_for_boot().

    A test is expected to use this as part of a sequence like:

    ~~~~~~~~
        boot_id = host.get_boot_id()
        # trigger shutdown on the host
        host.test_wait_for_shutdown()
        # trigger boot on the host
        host.test_wait_for_boot(boot_id)
    ~~~~~~~~

    @param shutdown_timeout time limit in seconds to allow the host
                            to go down; defaults to SHUTDOWN_TIMEOUT.
    @exception TestFail The host did not shut down within the
                        allowed time.
    """
    limit = shutdown_timeout
    if limit is None:
        limit = self.SHUTDOWN_TIMEOUT

    went_down = self.ping_wait_down(timeout=limit)
    if not went_down:
        raise error.TestFail(
                'client failed to shut down after %d seconds' % limit)
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07002187
2188
def test_wait_for_boot(self, old_boot_id=None):
    """Wait for the client to boot from cold power.

    `old_boot_id` should be the value of `get_boot_id()` taken
    before shutting down.  If the boot id is unchanged once the
    host is back, `TestFail` is raised.  The boot id comparison is
    skipped when `old_boot_id` is not given.

    See @ref test_wait_for_shutdown for more on this function's
    usage.

    @param old_boot_id A boot id value obtained before the
                       shut down.

    @exception TestFail The host did not respond within the
                        allowed time.
    @exception TestFail The host responded, but the boot id test
                        indicated that there was no reboot.
    """
    came_up = self.wait_up(timeout=self.REBOOT_TIMEOUT)
    if not came_up:
        raise error.TestFail(
                'client failed to reboot after %d seconds' %
                self.REBOOT_TIMEOUT)

    # Without a reference boot id there is nothing more to verify.
    if not old_boot_id:
        return

    if self.get_boot_id() == old_boot_id:
        logging.error('client not rebooted (boot %s)',
                      old_boot_id)
        raise error.TestFail(
                'client is back up, but did not reboot')
Simran Basid5e5e272012-09-24 15:23:59 -07002219
2220
@staticmethod
def check_for_rpm_support(hostname):
    """Check whether a hostname matches the RPM-powered naming format.

    @param hostname: hostname to check for rpm support.

    @return None if the hostname does not follow the naming format
            defined (by CrosHost._RPM_HOSTNAME_REGEX) for RPM powered
            DUTs in the lab.  If it does follow the format, the regular
            expression MatchObject is returned instead.
    """
    rpm_hostname_pattern = CrosHost._RPM_HOSTNAME_REGEX
    return re.match(rpm_hostname_pattern, hostname)
Simran Basid5e5e272012-09-24 15:23:59 -07002232
2233
def has_power(self):
    """Report whether this host's name marks it as powered by an RPM.

    @return the (truthy) match object from check_for_rpm_support() if
            this host's hostname follows the defined naming format
            for RPM powered DUTs in the CROS lab; None otherwise.
    """
    rpm_match = CrosHost.check_for_rpm_support(self.hostname)
    return rpm_match
Simran Basid5e5e272012-09-24 15:23:59 -07002241
2242
Ismail Noorbasha07fdb612013-02-14 14:13:31 -08002243 def _set_power(self, state, power_method):
2244 """Sets the power to the host via RPM, Servo or manual.
2245
2246 @param state Specifies which power state to set to DUT
2247 @param power_method Specifies which method of power control to
2248 use. By default "RPM" will be used. Valid values
2249 are the strings "RPM", "manual", "servoj10".
2250
2251 """
2252 ACCEPTABLE_STATES = ['ON', 'OFF']
2253
2254 if state.upper() not in ACCEPTABLE_STATES:
2255 raise error.TestError('State must be one of: %s.'
2256 % (ACCEPTABLE_STATES,))
2257
2258 if power_method == self.POWER_CONTROL_SERVO:
2259 logging.info('Setting servo port J10 to %s', state)
2260 self.servo.set('prtctl3_pwren', state.lower())
2261 time.sleep(self._USB_POWER_TIMEOUT)
2262 elif power_method == self.POWER_CONTROL_MANUAL:
2263 logging.info('You have %d seconds to set the AC power to %s.',
2264 self._POWER_CYCLE_TIMEOUT, state)
2265 time.sleep(self._POWER_CYCLE_TIMEOUT)
2266 else:
2267 if not self.has_power():
2268 raise error.TestFail('DUT does not have RPM connected.')
Simran Basi5e6339a2013-03-21 11:34:32 -07002269 afe = frontend_wrappers.RetryingAFE(timeout_min=5, delay_sec=10)
2270 afe.set_host_attribute(self._RPM_OUTLET_CHANGED, True,
2271 hostname=self.hostname)
Simran Basi1df55112013-09-06 11:25:09 -07002272 rpm_client.set_power(self.hostname, state.upper(), timeout_mins=5)
Simran Basid5e5e272012-09-24 15:23:59 -07002273
2274
def power_off(self, power_method=POWER_CONTROL_RPM):
    """Switch power to this host off via RPM, Servo or manual.

    @param power_method Which method of power control to use; RPM
                        by default.  Valid values are the strings
                        "RPM", "manual", "servoj10".

    """
    self._set_power(state='OFF', power_method=power_method)
Simran Basid5e5e272012-09-24 15:23:59 -07002284
2285
def power_on(self, power_method=POWER_CONTROL_RPM):
    """Switch power to this host on via RPM, Servo or manual.

    @param power_method Which method of power control to use; RPM
                        by default.  Valid values are the strings
                        "RPM", "manual", "servoj10".

    """
    self._set_power(state='ON', power_method=power_method)
2295
2296
def power_cycle(self, power_method=POWER_CONTROL_RPM):
    """Cycle power to this host by turning it OFF, then ON.

    For Servo and manual control the cycle is sequenced here: power
    off, wait _POWER_CYCLE_TIMEOUT seconds, power on.  For any other
    method a single 'CYCLE' request is sent through rpm_client.

    @param power_method Which method of power control to use; RPM
                        by default.  Valid values are the strings
                        "RPM", "manual", "servoj10".

    """
    locally_sequenced = (self.POWER_CONTROL_SERVO,
                         self.POWER_CONTROL_MANUAL)
    if power_method not in locally_sequenced:
        rpm_client.set_power(self.hostname, 'CYCLE')
        return

    self.power_off(power_method=power_method)
    time.sleep(self._POWER_CYCLE_TIMEOUT)
    self.power_on(power_method=power_method)
Simran Basic6f1f7a2012-10-16 10:47:46 -07002312
2313
def get_platform(self):
    """Work out the platform label for this host from its firmware id.

    @returns a string representing this host's platform.
    """
    crossystem = utils.Crossystem(self)
    crossystem.init()
    # The fwid generally has the form {platform}.{firmware version},
    # e.g. Alex.X.YYY.Z or Google_Alex.X.YYY.Z, so the part before
    # the first '.' is the platform id.
    fwid = crossystem.fwid()
    platform_id = fwid.split('.')[0]
    # Newer platforms carry a 'Google_' prefix that older ones lack;
    # drop it so both forms give the same label.
    return platform_id.lower().replace('google_', '')
2327
2328
def get_architecture(self):
    """Work out the architecture label for this host.

    The value is whatever utils.Crossystem reports through arch().

    @returns a string representing this host's architecture.
    """
    system_info = utils.Crossystem(self)
    system_info.init()
    architecture = system_info.arch()
    return architecture
2337
2338
def get_chrome_version(self):
    """Get the Chrome version number and milestone as strings.

    Runs client_constants.CHROME_VERSION_COMMAND ("chrome --version")
    on the host and parses its output with
    utils.parse_chrome_version().

    @return A tuple (chrome_ver, milestone) where "chrome_ver" is the
            current Chrome version number as a string (in the form
            "W.X.Y.Z") and "milestone" is the first component of the
            version number (the "W" from "W.X.Y.Z").  If the version
            number cannot be parsed in the "W.X.Y.Z" format, the
            "chrome_ver" will be the full output of "chrome --version"
            and the milestone will be the empty string.

    """
    result = self.run(client_constants.CHROME_VERSION_COMMAND)
    return utils.parse_chrome_version(result.stdout)
2354
@label_decorator()
def get_board(self):
    """Work out the board label for this host from /etc/lsb-release.

    @returns a string representing this host's board:
             ds_constants.BOARD_PREFIX followed by the board name.
    """
    release_info = utils.parse_cmd_output('cat /etc/lsb-release',
                                          run_method=self.run)
    board = release_info['CHROMEOS_RELEASE_BOARD']
    # Lab devices generally report the plain board name, but our own
    # development devices report {board_name}-signed-{key_type}.
    # Board names may also start with 'x86-', which must be kept, so
    # such names retain their first two dash-separated components
    # while all others retain only the first.
    components = board.split('-')
    keep = 2 if 'x86' in board else 1
    label_format = ds_constants.BOARD_PREFIX + '%s'
    return label_format % '-'.join(components[:keep])
Simran Basic6f1f7a2012-10-16 10:47:46 -07002371
2372
@label_decorator('board_freq_mem')
def get_board_with_frequency_and_memory(self):
    """
    Determines the board name with frequency and memory.

    Runs the client utils function
    get_board_with_frequency_and_memory() on the host through
    poor_mans_rpc() and prefixes its stripped output.

    @returns a more detailed string representing the board, prefixed
             with 'board_freq_mem:'. Examples of the board part are
             butterfly_1.1GHz_2GB, link_1.8GHz_4GB, x86-zgb_1.7GHz_2GB
    """
    command = self.poor_mans_rpc('get_board_with_frequency_and_memory()')
    board = self.run(command).stdout
    # Use the bound method: the unbound str.strip(board) form rejects
    # unicode output with a TypeError under Python 2.
    return 'board_freq_mem:%s' % board.strip()
2384
2385
@label_decorator('lightsensor')
def has_lightsensor(self):
    """Determine whether this host has a light sensor.

    Searches _LIGHTSENSOR_SEARCH_DIR on the host (following
    symlinks, at most 4 levels deep) for any path matching one of
    _LIGHTSENSOR_FILES.

    @returns the string 'lightsensor' if this host has a lightsensor or
             None if it does not.
    """
    file_pattern = '|'.join(self._LIGHTSENSOR_FILES)
    search_cmd = "find -L %s -maxdepth 4 | egrep '%s'" % (
        self._LIGHTSENSOR_SEARCH_DIR, file_pattern)
    try:
        # The search follows symlinks and may hit a symlink loop; the
        # command still works in that case but prints a few messages
        # to stderr, hence stderr_tee (like stdout_tee) is None.
        self.run(search_cmd, stdout_tee=None, stderr_tee=None)
    except error.AutoservRunError:
        # egrep exited with a return code of 1, meaning none of the
        # possible lightsensor files existed.
        return None
    return 'lightsensor'
2405
2406
@label_decorator('bluetooth')
def has_bluetooth(self):
    """Determine whether this host has bluetooth.

    Bluetooth is considered present when the directory
    /sys/class/bluetooth/hci0 exists on the host.

    @returns the string 'bluetooth' if this host has bluetooth or
             None if it does not.
    """
    try:
        self.run('test -d /sys/class/bluetooth/hci0')
    except error.AutoservRunError:
        # test exited with a return code of 1, meaning the directory
        # did not exist.
        return None
    # test exited with a return code of 0.
    return 'bluetooth'
2422
2423
@label_decorator('gpu_family')
def get_gpu_family(self):
    """
    Determine GPU family.

    Runs the client utils function get_gpu_family() on the host
    through poor_mans_rpc() and prefixes its stripped output.

    @returns a string representing the gpu family, prefixed with
             'gpu_family:'. Examples of the family part are mali,
             tegra, pinetrail, sandybridge, ivybridge, haswell and
             baytrail.
    """
    command = self.poor_mans_rpc('get_gpu_family()')
    gpu_family = self.run(command).stdout
    # Use the bound method: the unbound str.strip(gpu_family) form
    # rejects unicode output with a TypeError under Python 2.
    return 'gpu_family:%s' % gpu_family.strip()
2434
2435
@label_decorator('graphics')
def get_graphics(self):
    """
    Determine the graphics label for this host.

    The decision is based only on the output of `uname -a`: for now
    ARM boards get graphics:gles while all other boards get
    graphics:gl.  This may change over time, but for robustness
    reasons this should avoid executing code in actual graphics
    libraries (which may not be ready and is tested by
    graphics_GLAPICheck).

    @returns a string representing this host's graphics.
    """
    kernel_info = self.run('uname -a').stdout.lower()
    return 'graphics:gles' if 'arm' in kernel_info else 'graphics:gl'
2451
2452
@label_decorator('ec')
def get_ec(self):
    """
    Determine the type of EC on this host.

    @returns a string representing this host's embedded controller type.
    At present, it only returns "ec:cros", for Chrome OS ECs. Other types
    of EC (or none) return None, since no tests depend on those.
    """
    cmd = 'mosys ec info'
    # For a Chrome OS EC the last field of the output matches our EC
    # version scheme, for example:
    #
    #   stm | stm32f100 | snow_v1.3.139-375eb9f
    #   ti | Unknown-10de | peppy_v1.5.114-5d52788
    #
    # Non-Chrome OS ECs produce output such as:
    #
    #   ENE | KB932 | 00BE107A00
    #   ite | it8518 | 3.08
    #
    # Some systems (Lumpy, for example) have no EC at all.
    regexp = r'^.*\|\s*(\S+_v\d+\.\d+\.\d+-[0-9a-f]+)\s*$'

    ecinfo = self.run(command=cmd, ignore_status=True)
    if ecinfo.exit_status != 0:
        # No EC present
        logging.info("%s exited with status %d", cmd, ecinfo.exit_status)
        return None

    version_match = re.search(regexp, ecinfo.stdout)
    if not version_match:
        # Has an EC, but it's not a Chrome OS EC
        logging.info("%s got: %s", cmd, ecinfo.stdout)
        return None

    logging.info("EC version is %s", version_match.group(1))
    return 'ec:cros'
2490
2491
@label_decorator('accels')
def get_accels(self):
    """
    Determine the type of accelerometers on this host.

    @returns a string representing this host's accelerometer type.
    At present, it only returns "accel:cros-ec", for accelerometers
    attached to a Chrome OS EC, or None, if no accelerometers.
    """
    # Each probe must exit with status 0 for EC accelerometers to be
    # possible: first that ectool exists, then that the EC supports
    # the motionsense command.
    probes = (
        ('which ectool',
         "No ectool cmd found, assuming no EC accelerometers"),
        ('ectool motionsense',
         "EC does not support motionsense command "
         "assuming no EC accelerometers"),
    )
    for probe_cmd, failure_note in probes:
        if self.run(probe_cmd, ignore_status=True).exit_status:
            logging.info(failure_note)
            return None

    # Check that EC motion sensors are active; a first output line of
    # "0" is treated as inactive.
    output = self.run('ectool motionsense active').stdout
    first_line = output.split('\n')[0]
    if first_line == "0":
        logging.info("Motion sense inactive, assuming no EC accelerometers")
        return None

    logging.info("EC accelerometers found")
    return 'accel:cros-ec'
2522
2523
@label_decorator('chameleon')
def has_chameleon(self):
    """Determine whether a Chameleon is connected to this host.

    @returns a list containing two strings ('chameleon' and
             'chameleon:' + label, e.g. 'chameleon:hdmi') if this host
             has a Chameleon, or None if it has not.
    """
    if not self._chameleon_host:
        return None
    specific_label = 'chameleon:' + self.chameleon.get_label()
    return ['chameleon', specific_label]
2536
2537
@label_decorator('audio_loopback_dongle')
def has_loopback_dongle(self):
    """Determine whether an audio loopback dongle is plugged into this host.

    A dongle is assumed when the cras node information reports both a
    'HEADPHONE' node and a 'MIC' node as plugged.

    @returns 'audio_loopback_dongle' when there is an audio loopback
             dongle plugged to this host.
             None when there is no audio loopback dongle plugged to
             this host.
    """
    nodes_info = self.run(command=cras_utils.get_cras_nodes_cmd(),
                          ignore_status=True).stdout
    required_types = ('HEADPHONE', 'MIC')
    # all() stops at the first node type that is not plugged.
    dongle_present = all(
        cras_utils.node_type_is_plugged(node_type, nodes_info)
        for node_type in required_types)
    if dongle_present:
        return 'audio_loopback_dongle'
    return None
2554
2555
@label_decorator('power_supply')
def get_power_supply(self):
    """
    Determine what type of power supply the host has.

    The label is 'power:' followed by the output of `mosys psu type`.

    @returns a string representing this host's power supply.
             'power:battery' when the device has a battery intended for
                    extended use
             'power:AC_primary' when the device has a battery not intended
                    for extended use (for moving the machine, etc)
             'power:AC_only' when the device has no battery at all.
             None when mosys reports the type as 'unknown'.
    """
    psu = self.run(command='mosys psu type', ignore_status=True)
    if psu.exit_status:
        # mosys does not provide the psu command on every platform.
        # When it is missing, assume the device has a battery.
        return 'power:battery'

    psu_type = psu.stdout.strip()
    return None if psu_type == 'unknown' else ('power:%s' % psu_type)
2580
2581
@label_decorator('storage')
def get_storage(self):
    """
    Determine the type of boot device for this host.

    Determine if the internal device is SCSI or dw_mmc device.
    Then check that it is SSD or HDD or eMMC or something else.

    @returns a string representing this host's internal device type.
             'storage:ssd' when internal device is solid state drive
             'storage:hdd' when internal device is hard disk drive
             'storage:mmc' when internal device is mmc drive
             None          When internal device is something else or
                           when we are unable to determine the type
    """
    def stripped_output(cmd):
        """Run `cmd` on the host; return stripped stdout, None on failure."""
        result = self.run(command=cmd, ignore_status=True)
        if result.exit_status:
            logging.info("Fail to run %s", cmd)
            return None
        return result.stdout.strip()

    # The output should be /dev/mmcblk* for SD/eMMC or /dev/sd* for scsi
    rootdev_cmd = ' '.join(['. /usr/sbin/write_gpt.sh;',
                            '. /usr/share/misc/chromeos-common.sh;',
                            'load_base_vars;',
                            'get_fixed_dst_drive'])
    rootdev_str = stripped_output(rootdev_cmd)
    if not rootdev_str:
        # Either the command failed or it printed nothing.
        return None

    rootdev_base = os.path.basename(rootdev_str)

    mmc_pattern = '/dev/mmcblk[0-9]'
    if re.match(mmc_pattern, rootdev_str):
        # Use type to determine if the internal device is eMMC or
        # something else.  We can assume that MMC is always an
        # internal device.
        type_cmd = 'cat /sys/block/%s/device/type' % rootdev_base
        device_type = stripped_output(type_cmd)
        if device_type is None:
            return None
        if device_type == 'MMC':
            return 'storage:mmc'

    scsi_pattern = '/dev/sd[a-z]+'
    # Match against the stripped device path, like the mmc check above,
    # so stray whitespace in the raw output cannot defeat re.match().
    if re.match(scsi_pattern, rootdev_str):
        # Read symlink for /sys/block/sd* to determine if the internal
        # device is connected via ata or usb.
        link_cmd = 'readlink /sys/block/%s' % rootdev_base
        link_str = stripped_output(link_cmd)
        if link_str is None or 'usb' in link_str:
            return None

        # Read rotation to determine if the internal device is ssd or hdd.
        rotate_cmd = 'cat /sys/block/%s/queue/rotational' % rootdev_base
        rotate_str = stripped_output(rotate_cmd)
        if rotate_str is None:
            return None

        rotate_dict = {'0': 'storage:ssd', '1': 'storage:hdd'}
        return rotate_dict.get(rotate_str)

    # All other internal device / error case will always fall here
    return None
2654
2655
@label_decorator('servo')
def get_servo(self):
    """Report whether a servo is attached to this host.

    A host with a working servo attached is expected to carry the
    'servo' label.

    @return: the string 'servo' when self._servo_host is truthy;
             None otherwise.
    """
    if self._servo_host:
        return 'servo'
    return None
2666
2667
@label_decorator('video_labels')
def get_video_labels(self):
    """Run /usr/local/bin/avtest_label_detect to get a list of video labels.

    Sample output of avtest_label_detect:
    Detected label: hw_video_acc_vp8
    Detected label: webcam

    @return: A list of labels detected by tool avtest_label_detect; an
             empty list when running the tool raises AutoservRunError.
    """
    # Only the remote command can raise AutoservRunError, so keep the
    # try body limited to it.
    try:
        result = self.run('/usr/local/bin/avtest_label_detect').stdout
    except error.AutoservRunError:
        # The tool is not installed.
        return []
    # Raw string: '\w' in a plain literal is an invalid escape sequence.
    return re.findall(r'^Detected label: (\w+)$', result, re.M)
2684
2685
@label_decorator('video_glitch_detection')
def is_video_glitch_detection_supported(self):
    """ Determine if a board under test is supported for video glitch
    detection tests.

    The board name (with ds_constants.BOARD_PREFIX removed) is looked up
    among the section names of client/cros/video/device_spec.conf.

    @return: 'video_glitch_detection' if board is supported, None otherwise.
    """
    parser = ConfigParser.SafeConfigParser()
    filename = os.path.join(
            common.autotest_dir, 'client/cros/video/device_spec.conf')

    dut = self.get_board().replace(ds_constants.BOARD_PREFIX, '')

    try:
        parser.read(filename)
        supported_boards = parser.sections()

        return 'video_glitch_detection' if dut in supported_boards else None

    # ConfigParser.Error is the base class of the module's exceptions;
    # the lowercase spelling is not a documented attribute and would raise
    # AttributeError exactly when a parse failure needs handling.
    except ConfigParser.Error:
        # something went wrong while parsing the conf file
        return None
2708
@label_decorator('touch_labels')
def get_touch(self):
    """
    Determine whether board under test has a touchpad or touchscreen.

    Each /dev/input/event* node is probed with evtest; the captured output
    is classified by InputPlayback and matching types are collected.

    @return: A list of some combination of 'touchscreen' and 'touchpad',
             depending on what is present on the device.

    """
    labels = []
    looking_for = ['touchpad', 'touchscreen']
    player = input_playback.InputPlayback()
    input_events = self.run('ls /dev/input/event*').stdout.strip().split()
    filename = '/tmp/touch_labels'
    try:
        for event in input_events:
            # evtest keeps running until interrupted, so let it time out
            # after a second and read whatever it wrote to the file.
            self.run('evtest %s > %s' % (event, filename), timeout=1,
                     ignore_timeout=True)
            properties = self.run('cat %s' % filename).stdout
            input_type = player._determine_input_type(properties)
            if input_type in looking_for:
                labels.append(input_type)
                looking_for.remove(input_type)
            if not looking_for:
                break
    finally:
        # Best-effort cleanup that also runs when a command above raises,
        # so the scratch file is not left behind on the DUT.
        self.run('rm -f %s' % filename, ignore_status=True)

    return labels
2736
Hung-ying Tyana39b0542015-06-30 10:36:42 +08002737
@label_decorator('internal_display')
def has_internal_display(self):
    """Check whether the device under test has an internal display.

    The client-side graphics_utils.has_internal_display() is reused by
    temporarily replacing the client helpers utils.system_output and
    common_lib utils.read_file with versions that run on this host.

    @return: 'internal_display' if one is present; None otherwise.
    """
    from autotest_lib.client.cros.graphics import graphics_utils
    from autotest_lib.client.common_lib import utils as common_utils

    def _remote_system_output(cmd):
        return self.run(cmd).stdout

    def _remote_read_file(remote_path):
        return self.run('cat %s' % remote_path).stdout

    # Hijack the necessary client functions so that we can take advantage
    # of the client lib here.
    # FIXME: find a less hacky way than this
    saved_system_output = utils.system_output
    saved_read_file = common_utils.read_file
    utils.system_output = _remote_system_output
    common_utils.read_file = _remote_read_file
    try:
        if graphics_utils.has_internal_display():
            return 'internal_display'
        return None
    finally:
        # Always put the original client helpers back.
        utils.system_output = saved_system_output
        common_utils.read_file = saved_read_file
2767
2768
def get_labels(self):
    """Return a list of labels for this given host.

    This is the main way to retrieve all the automatic labels for a host
    as it will run through all the currently implemented label functions.

    Each function in self._LABEL_FUNCTIONS is called with this host. A
    string result is appended, a list or tuple result is extended into the
    output, and falsy results are skipped. A function that raises is
    logged and ignored so one bad detector cannot block the others.

    @return: A flat list of label strings.
    """
    labels = []
    for label_function in self._LABEL_FUNCTIONS:
        try:
            label = label_function(self)
        except Exception as e:
            logging.error('Label function %s failed; ignoring it.',
                          label_function.__name__)
            logging.exception(e)
            label = None
        if not label:
            continue
        # isinstance rather than an exact type() comparison, so str/list
        # subclasses (and tuples) are not silently dropped.
        if isinstance(label, str):
            labels.append(label)
        elif isinstance(label, (list, tuple)):
            labels.extend(label)
    return labels
Dan Shi85276d42014-04-08 22:11:45 -07002790
2791
def is_boot_from_usb(self):
    """Tell whether the DUT's root device is flagged as removable.

    The root block device is obtained from `rootdev -s -d`, and its
    /sys/block/<name>/removable flag is read and parsed as an integer.

    @return: True if the removable flag equals 1, False otherwise.
    """
    root_device = self.run('rootdev -s -d').stdout.strip()
    device_name = os.path.basename(root_device)
    flag_output = self.run('cat /sys/block/%s/removable' % device_name).stdout
    return int(flag_output.strip()) == 1
Helen Zhang17dae2b2014-11-11 09:25:52 -08002801
2802
def read_from_meminfo(self, key):
    """Look up a value in the host's /proc/meminfo.

    Runs `grep <key> /proc/meminfo` on the host and parses the first run
    of digits found in the output.

    @param key: meminfo requested; passed to grep as the pattern.

    @return the first number in the matching output, as an int.

    """
    matched_lines = self.run('grep %s /proc/meminfo' % key).stdout.strip()
    logging.debug('%s', matched_lines)
    first_number = re.search(r'\d+', matched_lines)
    return int(first_number.group(0))