blob: bb67a535d951c56c5ac7e5f39f78e457fbd1776d [file] [log] [blame]
J. Richard Barnette24adbf42012-04-11 15:04:53 -07001# Copyright (c) 2012 The Chromium OS Authors. All rights reserved.
Dale Curtisaa5eedb2011-08-23 16:18:52 -07002# Use of this source code is governed by a BSD-style license that can be
3# found in the LICENSE file.
4
mussa584b4462014-06-20 15:13:28 -07005import ConfigParser
Aviv Keshet74c89a92013-02-04 15:18:30 -08006import functools
Christopher Wiley0ed712b2013-04-09 15:25:12 -07007import httplib
J. Richard Barnette1d78b012012-05-15 13:56:30 -07008import logging
Dan Shi0f466e82013-02-22 15:44:58 -08009import os
Simran Basid5e5e272012-09-24 15:23:59 -070010import re
Christopher Wileyd78249a2013-03-01 13:05:31 -080011import socket
J. Richard Barnette1d78b012012-05-15 13:56:30 -070012import subprocess
J. Richard Barnette134ec2c2012-04-25 12:59:37 -070013import time
J. Richard Barnette1d78b012012-05-15 13:56:30 -070014import xmlrpclib
J. Richard Barnette134ec2c2012-04-25 12:59:37 -070015
mussa584b4462014-06-20 15:13:28 -070016import common
J. Richard Barnette45e93de2012-04-11 17:24:15 -070017from autotest_lib.client.bin import utils
Dan Shi9cb0eec2014-06-03 09:04:50 -070018from autotest_lib.client.common_lib import autotemp
Richard Barnette0c73ffc2012-11-19 15:21:18 -080019from autotest_lib.client.common_lib import error
20from autotest_lib.client.common_lib import global_config
Dan Shi549fb822015-03-24 18:01:11 -070021from autotest_lib.client.common_lib import lsbrelease_utils
J. Richard Barnette45e93de2012-04-11 17:24:15 -070022from autotest_lib.client.common_lib.cros import autoupdater
Richard Barnette03a0c132012-11-05 12:40:35 -080023from autotest_lib.client.common_lib.cros import dev_server
Christopher Wileyd78249a2013-03-01 13:05:31 -080024from autotest_lib.client.common_lib.cros import retry
Gabe Blackb72f4fb2015-01-20 16:47:13 -080025from autotest_lib.client.common_lib.cros.graphite import autotest_es
Gabe Black1e1c41b2015-02-04 23:55:15 -080026from autotest_lib.client.common_lib.cros.graphite import autotest_stats
MK Ryu35d661e2014-09-25 17:44:10 -070027from autotest_lib.client.cros import constants as client_constants
J. Richard Barnette84890bd2014-02-21 11:05:47 -080028from autotest_lib.client.cros import cros_ui
Cheng-Yi Chiangf4104ff2014-12-23 19:39:01 +080029from autotest_lib.client.cros.audio import cras_utils
Katherine Threlkeldab83d392015-06-18 16:45:57 -070030from autotest_lib.client.cros.input_playback import input_playback
MK Ryu35d661e2014-09-25 17:44:10 -070031from autotest_lib.server import autoserv_parser
32from autotest_lib.server import autotest
33from autotest_lib.server import constants
34from autotest_lib.server import crashcollect
Dan Shia1ecd5c2013-06-06 11:21:31 -070035from autotest_lib.server import utils as server_utils
Dan Shi9cb0eec2014-06-03 09:04:50 -070036from autotest_lib.server.cros import provision
Scott Zawalski89c44dd2013-02-26 09:28:02 -050037from autotest_lib.server.cros.dynamic_suite import constants as ds_constants
Simran Basi5e6339a2013-03-21 11:34:32 -070038from autotest_lib.server.cros.dynamic_suite import tools, frontend_wrappers
Dan Shi9cb0eec2014-06-03 09:04:50 -070039from autotest_lib.server.cros.faft.config.config import Config as FAFTConfig
Fang Deng96667ca2013-08-01 17:46:18 -070040from autotest_lib.server.hosts import abstract_ssh
Tom Wai-Hong Tamefe1c7f2014-01-02 14:00:11 +080041from autotest_lib.server.hosts import chameleon_host
Fang Deng5d518f42013-08-02 14:04:32 -070042from autotest_lib.server.hosts import servo_host
Simran Basidcff4252012-11-20 16:13:20 -080043from autotest_lib.site_utils.rpm_control_system import rpm_client
Simran Basid5e5e272012-09-24 15:23:59 -070044
45
beeps32a63082013-08-22 14:02:29 -070046try:
47 import jsonrpclib
48except ImportError:
49 jsonrpclib = None
Fang Deng96667ca2013-08-01 17:46:18 -070050
Fang Dengd1c2b732013-08-20 12:59:46 -070051
class FactoryImageCheckerException(error.AutoservError):
    """Error signalling that the image in question is a factory image."""
55
56
def add_label_detector(label_function_list, label_list=None, label=None):
    """Build a decorator that registers label detecting functions.

    The returned decorator appends the function it decorates to
    `label_function_list` and hands the function back unchanged, so
    decorating a function never alters how it behaves when called.

    @param label_function_list: List that collects the decorated label
                                detecting functions.
    @param label_list: List that collects the labels those functions can
                       detect.  (Default: None)
    @param label: Label string detectable by the decorated function.
                  (Default: None)

    @returns: The registering decorator.
    """
    # A label is recorded only when one was supplied and there is a list
    # to hold it; neither condition depends on the decorated function.
    record_label = bool(label) and label_list is not None

    def register(detector):
        """
        @param detector: The function to be added as a detector.

        @returns: `detector`, unmodified.
        """
        label_function_list.append(detector)
        if record_label:
            label_list.append(label)
        return detector

    return register
75
76
Fang Deng0ca40e22013-08-27 17:47:44 -070077class CrosHost(abstract_ssh.AbstractSSHHost):
J. Richard Barnette45e93de2012-04-11 17:24:15 -070078 """Chromium OS specific subclass of Host."""
79
80 _parser = autoserv_parser.autoserv_parser
Scott Zawalski62bacae2013-03-05 10:40:32 -050081 _AFE = frontend_wrappers.RetryingAFE(timeout_min=5, delay_sec=10)
J. Richard Barnette45e93de2012-04-11 17:24:15 -070082
Richard Barnette03a0c132012-11-05 12:40:35 -080083 # Timeout values (in seconds) associated with various Chrome OS
84 # state changes.
J. Richard Barnette134ec2c2012-04-25 12:59:37 -070085 #
Richard Barnette0c73ffc2012-11-19 15:21:18 -080086 # In general, a good rule of thumb is that the timeout can be up
87 # to twice the typical measured value on the slowest platform.
88 # The times here have not necessarily been empirically tested to
89 # meet this criterion.
J. Richard Barnetteeb69d722012-06-18 17:29:44 -070090 #
91 # SLEEP_TIMEOUT: Time to allow for suspend to memory.
Richard Barnette0c73ffc2012-11-19 15:21:18 -080092 # RESUME_TIMEOUT: Time to allow for resume after suspend, plus
    #   time to restart the network.
J. Richard Barnette84890bd2014-02-21 11:05:47 -080094 # SHUTDOWN_TIMEOUT: Time to allow for shut down.
J. Richard Barnetteeb69d722012-06-18 17:29:44 -070095 # BOOT_TIMEOUT: Time to allow for boot from power off. Among
Richard Barnette0c73ffc2012-11-19 15:21:18 -080096 # other things, this must account for the 30 second dev-mode
J. Richard Barnetted4649c62013-03-06 17:42:27 -080097 # screen delay and time to start the network.
J. Richard Barnetteeb69d722012-06-18 17:29:44 -070098 # USB_BOOT_TIMEOUT: Time to allow for boot from a USB device,
Richard Barnette0c73ffc2012-11-19 15:21:18 -080099 # including the 30 second dev-mode delay and time to start the
J. Richard Barnetted4649c62013-03-06 17:42:27 -0800100 # network.
beepsf079cfb2013-09-18 17:49:51 -0700101 # INSTALL_TIMEOUT: Time to allow for chromeos-install.
J. Richard Barnette84890bd2014-02-21 11:05:47 -0800102 # POWERWASH_BOOT_TIMEOUT: Time to allow for a reboot that
103 # includes powerwash.
J. Richard Barnetteeb69d722012-06-18 17:29:44 -0700104
105 SLEEP_TIMEOUT = 2
J. Richard Barnetted4649c62013-03-06 17:42:27 -0800106 RESUME_TIMEOUT = 10
Tom Wai-Hong Tamfe005c22014-12-03 09:25:44 +0800107 SHUTDOWN_TIMEOUT = 10
J. Richard Barnettefbcc7122013-07-24 18:24:59 -0700108 BOOT_TIMEOUT = 60
J. Richard Barnetteeb69d722012-06-18 17:29:44 -0700109 USB_BOOT_TIMEOUT = 150
J. Richard Barnette7817b052014-08-28 09:47:29 -0700110 INSTALL_TIMEOUT = 480
Dan Shi2c88eed2013-11-12 10:18:38 -0800111 POWERWASH_BOOT_TIMEOUT = 60
Chris Sosab76e0ee2013-05-22 16:55:41 -0700112
    # Minimum OS version that supports server-side packaging. Older builds
    # may not have a server-side package built, or may lack the Autotest
    # code changes needed to support server-side packaging.
Dan Shiced09e42015-04-17 16:09:34 -0700116 MIN_VERSION_SUPPORT_SSP = global_config.global_config.get_config_value(
117 'AUTOSERV', 'min_version_support_ssp', type=int)
Dan Shica503482015-03-30 17:23:25 -0700118
J. Richard Barnette84890bd2014-02-21 11:05:47 -0800119 # REBOOT_TIMEOUT: How long to wait for a reboot.
120 #
Chris Sosab76e0ee2013-05-22 16:55:41 -0700121 # We have a long timeout to ensure we don't flakily fail due to other
122 # issues. Shorter timeouts are vetted in platform_RebootAfterUpdate.
Simran Basi1160e2c2013-10-04 16:00:24 -0700123 # TODO(sbasi - crbug.com/276094) Restore to 5 mins once the 'host did not
124 # return from reboot' bug is solved.
125 REBOOT_TIMEOUT = 480
Chris Sosab76e0ee2013-05-22 16:55:41 -0700126
Ismail Noorbasha07fdb612013-02-14 14:13:31 -0800127 # _USB_POWER_TIMEOUT: Time to allow for USB to power toggle ON and OFF.
128 # _POWER_CYCLE_TIMEOUT: Time to allow for manual power cycle.
129 _USB_POWER_TIMEOUT = 5
130 _POWER_CYCLE_TIMEOUT = 10
131
beeps32a63082013-08-22 14:02:29 -0700132 _RPC_PROXY_URL = 'http://localhost:%d'
Christopher Wileydd181852013-10-10 19:56:58 -0700133 _RPC_SHUTDOWN_POLLING_PERIOD_SECONDS = 2
Peter Qiu4410db72014-06-05 10:32:41 -0700134 # Set shutdown timeout to account for the time for restarting the UI.
135 _RPC_SHUTDOWN_TIMEOUT_SECONDS = cros_ui.RESTART_UI_TIMEOUT
Richard Barnette0c73ffc2012-11-19 15:21:18 -0800136
Richard Barnette82c35912012-11-20 10:09:10 -0800137 _RPM_RECOVERY_BOARDS = global_config.global_config.get_config_value('CROS',
138 'rpm_recovery_boards', type=str).split(',')
139
140 _MAX_POWER_CYCLE_ATTEMPTS = 6
141 _LAB_MACHINE_FILE = '/mnt/stateful_partition/.labmachine'
Fang Dengdeba14f2014-11-14 11:54:09 -0800142 _RPM_HOSTNAME_REGEX = ('chromeos(\d+)(-row(\d+))?-rack(\d+[a-z]*)'
143 '-host(\d+)')
Katherine Threlkeldab83d392015-06-18 16:45:57 -0700144 _LIGHTSENSOR_FILES = [ "in_illuminance0_input",
145 "in_illuminance_input",
146 "in_illuminance0_raw",
147 "in_illuminance_raw",
148 "illuminance0_input"]
Richard Barnette82c35912012-11-20 10:09:10 -0800149 _LIGHTSENSOR_SEARCH_DIR = '/sys/bus/iio/devices'
150 _LABEL_FUNCTIONS = []
Aviv Keshet74c89a92013-02-04 15:18:30 -0800151 _DETECTABLE_LABELS = []
152 label_decorator = functools.partial(add_label_detector, _LABEL_FUNCTIONS,
153 _DETECTABLE_LABELS)
J. Richard Barnette134ec2c2012-04-25 12:59:37 -0700154
J. Richard Barnetteb6de7e32013-02-14 13:28:04 -0800155 # Constants used in ping_wait_up() and ping_wait_down().
156 #
157 # _PING_WAIT_COUNT is the approximate number of polling
158 # cycles to use when waiting for a host state change.
159 #
160 # _PING_STATUS_DOWN and _PING_STATUS_UP are names used
161 # for arguments to the internal _ping_wait_for_status()
162 # method.
163 _PING_WAIT_COUNT = 40
164 _PING_STATUS_DOWN = False
165 _PING_STATUS_UP = True
166
Ismail Noorbasha07fdb612013-02-14 14:13:31 -0800167 # Allowed values for the power_method argument.
168
169 # POWER_CONTROL_RPM: Passed as default arg for power_off/on/cycle() methods.
170 # POWER_CONTROL_SERVO: Used in set_power() and power_cycle() methods.
171 # POWER_CONTROL_MANUAL: Used in set_power() and power_cycle() methods.
172 POWER_CONTROL_RPM = 'RPM'
173 POWER_CONTROL_SERVO = 'servoj10'
174 POWER_CONTROL_MANUAL = 'manual'
175
176 POWER_CONTROL_VALID_ARGS = (POWER_CONTROL_RPM,
177 POWER_CONTROL_SERVO,
178 POWER_CONTROL_MANUAL)
Richard Barnette0c73ffc2012-11-19 15:21:18 -0800179
Simran Basi5e6339a2013-03-21 11:34:32 -0700180 _RPM_OUTLET_CHANGED = 'outlet_changed'
181
Dan Shi9cb0eec2014-06-03 09:04:50 -0700182 # URL pattern to download firmware image.
183 _FW_IMAGE_URL_PATTERN = global_config.global_config.get_config_value(
184 'CROS', 'firmware_url_pattern', type=str)
beeps687243d2013-07-18 15:29:27 -0700185
MK Ryu35d661e2014-09-25 17:44:10 -0700186 # File that has a list of directories to be collected
187 _LOGS_TO_COLLECT_FILE = os.path.join(
188 common.client_dir, 'common_lib', 'logs_to_collect')
189
190 # Prefix of logging message w.r.t. crash collection
191 _CRASHLOGS_PREFIX = 'collect_crashlogs'
192
193 # Time duration waiting for host up/down check
194 _CHECK_HOST_UP_TIMEOUT_SECS = 15
195
    # A command that interacts with the kernel and hardware (e.g., rm, mkdir)
    # might not have fully taken effect at the hardware level if the machine
    # is powered down right after the command returns.
    # Wait a few seconds to let such commands finish. Fingers crossed.
200 _SAFE_WAIT_SECS = 10
201
202
@staticmethod
def check_host(host, timeout=10):
    """
    Decide whether `host` is a chrome-os device.

    The probe succeeds only when /etc/lsb-release mentions CHROMEOS, the
    /mnt/stateful_partition/.android_tester marker file is absent, and
    /etc/lsb-release does not mention moblab.

    @param host: An ssh host representing a device.
    @param timeout: The timeout for the run command.

    @return: True if the host device is chromeos; False if the probe
             exits non-zero or the command cannot be run.

    """
    probe_cmd = ('grep -q CHROMEOS /etc/lsb-release && '
                 '! test -f /mnt/stateful_partition/.android_tester && '
                 '! grep -q moblab /etc/lsb-release')
    try:
        outcome = host.run(probe_cmd, ignore_status=True, timeout=timeout)
    except (error.AutoservRunError, error.AutoservSSHTimeout):
        # Failing to run the probe at all counts as "not chromeos".
        return False
    else:
        return outcome.exit_status == 0
223
224
225 @staticmethod
Tom Wai-Hong Tamefe1c7f2014-01-02 14:00:11 +0800226 def _extract_arguments(args_dict, key_subset):
227 """Extract options from `args_dict` and return a subset result.
J. Richard Barnette7214e0b2013-02-06 15:20:49 -0800228
229 Take the provided dictionary of argument options and return
Tom Wai-Hong Tamefe1c7f2014-01-02 14:00:11 +0800230 a subset that represent standard arguments needed to construct
231 a test-assistant object (chameleon or servo) for a host. The
232 intent is to provide standard argument processing from
Christopher Wiley644ef3e2015-05-15 13:14:14 -0700233 CrosHost for tests that require a test-assistant board
Tom Wai-Hong Tamefe1c7f2014-01-02 14:00:11 +0800234 to operate.
235
236 @param args_dict Dictionary from which to extract the arguments.
237 @param key_subset Tuple of keys to extract from the args_dict, e.g.
238 ('servo_host', 'servo_port').
239 """
240 result = {}
241 for arg in key_subset:
242 if arg in args_dict:
243 result[arg] = args_dict[arg]
244 return result
245
246
@staticmethod
def get_chameleon_arguments(args_dict):
    """Pick the chameleon options out of `args_dict`.

    Recommended usage:
    ~~~~~~~~
        args_dict = utils.args_to_dict(args)
        chameleon_args = hosts.CrosHost.get_chameleon_arguments(args_dict)
        host = hosts.create_host(machine, chameleon_args=chameleon_args)
    ~~~~~~~~

    @param args_dict Dictionary from which to extract the chameleon
      arguments.

    @returns Dictionary holding whichever of 'chameleon_host' and
      'chameleon_port' are present in `args_dict`.
    """
    chameleon_keys = ('chameleon_host', 'chameleon_port')
    return CrosHost._extract_arguments(args_dict, chameleon_keys)
263
264
@staticmethod
def get_servo_arguments(args_dict):
    """Pick the servo options out of `args_dict`.

    Recommended usage:
    ~~~~~~~~
        args_dict = utils.args_to_dict(args)
        servo_args = hosts.CrosHost.get_servo_arguments(args_dict)
        host = hosts.create_host(machine, servo_args=servo_args)
    ~~~~~~~~

    @param args_dict Dictionary from which to extract the servo
      arguments.

    @returns Dictionary holding whichever of 'servo_host' and
      'servo_port' are present in `args_dict`.
    """
    servo_keys = ('servo_host', 'servo_port')
    return CrosHost._extract_arguments(args_dict, servo_keys)
J. Richard Barnette134ec2c2012-04-25 12:59:37 -0700281
J. Richard Barnette964fba02012-10-24 17:34:29 -0700282
def _initialize(self, hostname, chameleon_args=None, servo_args=None,
                try_lab_servo=False, ssh_verbosity_flag='', ssh_options='',
                *args, **dargs):
    """Initialize superclasses, |self.chameleon|, and |self.servo|.

    The test-assistant objects (chameleon/servo) are created through
    chameleon_host.create_chameleon_host and servo_host.create_servo_host;
    see the docstrings of those functions for how it is decided whether
    an object is actually created.

    @param hostname: Hostname of the dut.
    @param chameleon_args: A dictionary that contains args for creating
                           a ChameleonHost. See chameleon_host for details.
    @param servo_args: A dictionary that contains args for creating
                       a ServoHost object. See servo_host for details.
    @param try_lab_servo: Boolean, False indicates that ServoHost should
                          not be created for a device in Cros test lab.
                          See servo_host for details.
    @param ssh_verbosity_flag: String, to pass to the ssh command to control
                               verbosity.
    @param ssh_options: String, other ssh options to pass to the ssh
                        command.
    """
    super(CrosHost, self)._initialize(hostname=hostname, *args, **dargs)

    # self.env is a dictionary of environment variable settings
    # to be exported for commands run on the host.
    # LIBC_FATAL_STDERR_ can be useful for diagnosing certain
    # errors that might happen.
    self.env['LIBC_FATAL_STDERR_'] = '1'

    self._rpc_proxy_map = {}
    self._ssh_verbosity_flag = ssh_verbosity_flag
    self._ssh_options = ssh_options

    # TODO(fdeng): We need to simplify the
    # process of servo and servo_host initialization.
    # crbug.com/298432
    self._servo_host = servo_host.create_servo_host(
            dut=self.hostname,
            servo_args=servo_args,
            try_lab_servo=try_lab_servo)
    # TODO(waihong): Do the simplification on Chameleon too.
    self._chameleon_host = chameleon_host.create_chameleon_host(
            dut=self.hostname,
            chameleon_args=chameleon_args)

    # The servo host is compared against None, whereas the chameleon
    # host is tested for truthiness; the two checks are deliberately
    # left distinct.
    self.servo = (None if self._servo_host is None
                  else self._servo_host.get_servo())
    self.chameleon = (self._chameleon_host.create_chameleon_board()
                      if self._chameleon_host else None)
Fang Deng5d518f42013-08-02 14:04:32 -0700335
336
def get_repair_image_name(self):
    """Build the name of the image to use when repairing this DUT.

    The name is the 'stable_build_pattern' value from the CROS section
    of the global config, filled in with the DUT's board and the stable
    version the AFE reports for that board.

    @returns a str of $board-version/$BUILD.

    @raises AutoservError: If the DUT has no board attribute.

    """
    dut_board = self._get_board_from_afe()
    if dut_board is None:
        raise error.AutoservError('DUT has no board attribute, '
                                  'cannot be repaired.')

    version = self._AFE.run('get_stable_version', board=dut_board)
    pattern = global_config.global_config.get_config_value(
            'CROS', 'stable_build_pattern')
    return pattern % (dut_board, version)
351
352
Scott Zawalski62bacae2013-03-05 10:40:32 -0500353 def _host_in_AFE(self):
354 """Check if the host is an object the AFE knows.
355
356 @returns the host object.
357 """
358 return self._AFE.get_hosts(hostname=self.hostname)
359
360
def lookup_job_repo_url(self):
    """Looks up the job_repo_url for the host.

    The AFE is queried once; the attribute is read from the first host
    record it returns.

    @returns job_repo_url from AFE, or None if the AFE does not know
             the host or the host has no job_repo_url attribute.
    """
    # One query is enough: an empty result means the AFE does not know
    # this host, which is the same answer a separate existence check
    # would have produced.
    hosts = self._AFE.get_hosts(hostname=self.hostname)
    if hosts and ds_constants.JOB_REPO_URL in hosts[0].attributes:
        return hosts[0].attributes[ds_constants.JOB_REPO_URL]
    return None
Chris Sosab76e0ee2013-05-22 16:55:41 -0700374
375
def clear_cros_version_labels_and_job_repo_url(self):
    """Clear cros_version labels and host attribute job_repo_url.

    Does nothing when the AFE does not know this host.
    """
    if not self._host_in_AFE():
        return

    dut_names = [self.hostname]
    version_labels = self._AFE.get_labels(
            name__startswith=ds_constants.VERSION_PREFIX,
            host__hostname=self.hostname)
    for version_label in version_labels:
        version_label.remove_hosts(hosts=dut_names)

    # Passing None for both arguments resets job_repo_url to None.
    self.update_job_repo_url(None, None)
390
391
def update_job_repo_url(self, devserver_url, image_name):
    """
    Updates the job_repo_url host attribute and asserts its value.

    When either argument is empty the attribute is set to None.  The
    attribute is read back afterwards to confirm the new value stuck.

    @param devserver_url: The devserver to use in the job_repo_url.
    @param image_name: The name of the image to use in the job_repo_url.

    @raises AutoservError: If we failed to update the job_repo_url.
    """
    have_both = devserver_url and image_name
    repo_url = (tools.get_package_url(devserver_url, image_name)
                if have_both else None)

    self._AFE.set_host_attribute(ds_constants.JOB_REPO_URL, repo_url,
                                 hostname=self.hostname)

    if self.lookup_job_repo_url() == repo_url:
        return
    raise error.AutoservError('Failed to update job_repo_url with %s, '
                              'host %s' % (repo_url, self.hostname))
Scott Zawalski89c44dd2013-02-26 09:28:02 -0500409
410
def add_cros_version_labels_and_job_repo_url(self, image_name):
    """Add cros_version labels and host attribute job_repo_url.

    Does nothing when the AFE does not know this host.  The version
    label is created in the AFE first if it does not exist yet.

    @param image_name: The name of the image e.g.
            lumpy-release/R27-3837.0.0

    """
    if not self._host_in_AFE():
        return

    version_label_name = '%s%s' % (ds_constants.VERSION_PREFIX, image_name)
    devserver_url = dev_server.ImageServer.resolve(image_name).url()

    existing = self._AFE.get_labels(name=version_label_name)
    version_label = (existing[0] if existing
                     else self._AFE.create_label(name=version_label_name))

    version_label.add_hosts([self.hostname])
    self.update_job_repo_url(devserver_url, image_name)
432
433
def verify_job_repo_url(self, tag=''):
    """
    Make sure job_repo_url of this host is valid.

    Eg: The job_repo_url
    "http://lmn.cd.ab.xyx:8080/static/lumpy-release/R29-4279.0.0/autotest/packages"
    claims to have the autotest package for lumpy-release/R29-4279.0.0.
    This method asks the devserver named in that url to stage the
    'autotest_packages' artifact for the build, and reports how long the
    staging took as a stat.  If the host has no job_repo_url, a warning
    is logged and nothing else happens.

    @param tag: The tag from the server job, in the format
                <job_id>-<user>/<hostname>, or <hostless> for a server job.
                Currently unused by this method.

    @raises: Any exception raised while contacting the devserver or
             staging the artifacts is not caught here and propagates to
             the caller.
    """
    job_repo_url = self.lookup_job_repo_url()
    if not job_repo_url:
        logging.warning('No job repo url set on host %s', self.hostname)
        return

    logging.info('Verifying job repo url %s', job_repo_url)
    devserver_url, image_name = tools.get_devserver_build_from_package_url(
            job_repo_url)

    ds = dev_server.ImageServer(devserver_url)

    logging.info('Staging autotest artifacts for %s on devserver %s',
                 image_name, ds.url())

    start_time = time.time()
    ds.stage_artifacts(image_name, ['autotest_packages'])
    stage_time = time.time() - start_time

    # Record how much of the verification time comes from a devserver
    # restage. If we're doing things right we should not see multiple
    # devservers for a given board/build/branch path.
    try:
        board, build_type, branch = server_utils.ParseBuildName(
                image_name)[:3]
    except server_utils.ParseBuildNameException:
        # The stat is best-effort; an unparsable build name just means
        # nothing gets reported.
        return

    # Reduce the devserver url to its host name: drop the scheme, any
    # path, and the port.  Splitting (rather than slicing between the
    # first '/' and the last ':') still gives the host name when the url
    # carries no port or no scheme.
    netloc = devserver_url.split('://', 1)[-1].split('/', 1)[0]
    devserver = netloc.rsplit(':', 1)[0]
    stats_key = {
        'board': board,
        'build_type': build_type,
        'branch': branch,
        # Dots would be read as extra levels in the stat name.
        'devserver': devserver.replace('.', '_'),
    }
    autotest_stats.Gauge('verify_job_repo_url').send(
            '%(board)s.%(build_type)s.%(branch)s.%(devserver)s' % stats_key,
            stage_time)
beepscb6f1e22013-06-28 19:14:10 -0700495
Scott Zawalskieadbf702013-03-14 09:23:06 -0400496
def stage_server_side_package(self, image=None):
    """Stage autotest server-side package on devserver.

    The build to stage is taken from `image` when given; otherwise from
    the host's job_repo_url attribute; otherwise from the host's first
    version label in the AFE.

    @param image: Full path of an OS image to install or a build name.

    @return: A url to the autotest server-side package, or None when the
             build is older than MIN_VERSION_SUPPORT_SSP and server-side
             packaging is therefore disabled.

    @raises AutoservError: If no build name can be parsed from `image`,
            or if the host has neither a job_repo_url attribute nor a
            version label.
    """
    if image:
        image_name = tools.get_build_from_image(image)
        if not image_name:
            raise error.AutoservError(
                    'Failed to parse build name from %s' % image)
        ds = dev_server.ImageServer.resolve(image_name)
    else:
        job_repo_url = self.lookup_job_repo_url()
        if job_repo_url:
            devserver_url, image_name = (
                    tools.get_devserver_build_from_package_url(
                            job_repo_url))
            ds = dev_server.ImageServer(devserver_url)
        else:
            labels = self._AFE.get_labels(
                    name__startswith=ds_constants.VERSION_PREFIX,
                    host__hostname=self.hostname)
            if not labels:
                raise error.AutoservError(
                        'Failed to stage server-side package. The host has '
                        'no job_repo_url attribute or version label.')
            # The build name is the label name minus the version prefix.
            image_name = labels[0].name[len(ds_constants.VERSION_PREFIX):]
            ds = dev_server.ImageServer.resolve(image_name)

    # Get the OS version of the build, for any build older than
    # MIN_VERSION_SUPPORT_SSP, server side packaging is not supported.
    # The captured group is the first number after "R<milestone>-".
    match = re.match(r'.*/R\d+-(\d+)\.', image_name)
    if match and int(match.group(1)) < self.MIN_VERSION_SUPPORT_SSP:
        logging.warning('Build %s is older than %s. Server side packaging '
                        'is disabled.', image_name,
                        self.MIN_VERSION_SUPPORT_SSP)
        return None

    ds.stage_artifacts(image_name, ['autotest_server_package'])
    return '%s/static/%s/%s' % (ds.url(), image_name,
                                'autotest_server_package.tar.bz2')
538
539
def _try_stateful_update(self, update_url, force_update, updater):
    """Try to use stateful update to initialize DUT.

    When DUT is already running the same version that machine_install
    tries to install, stateful update is a much faster way to clean up
    the DUT for testing, compared to a full reimage. It is implemented
    by calling autoupdater.run_update, but skipping updating root, as
    updating the kernel is time consuming and not necessary.

    @param update_url: url of the image.
    @param force_update: Set to True to update the image even if the DUT
        is running the same version.
    @param updater: ChromiumOSUpdater instance used to update the DUT.
    @returns: True if the DUT was updated with stateful update.

    """
    # TODO(jrbarnette): Yes, I hate this re.match() test case.
    # It's better than the alternative: see crbug.com/360944.
    release_pattern = r'^.*-release/R[0-9]+-[0-9]+\.[0-9]+\.0$'
    image_name = autoupdater.url_to_image_name(update_url)
    if re.match(release_pattern, image_name) is None:
        return False
    if not updater.check_version():
        return False
    if not force_update:
        logging.info('Canceling stateful update because the new and '
                     'old versions are the same.')
        return False

    # Following folders should be rebuilt after stateful update.
    # A marker file is dropped into each of them beforehand so that the
    # rebuild can be checked once the update is done.
    marker_name = '.test_file_to_be_deleted'
    marker_paths = [
        os.path.join(folder, marker_name)
        for folder in ('/var', '/home', '/mnt/stateful_partition')
    ]
    for marker in marker_paths:
        self.run('touch %s' % marker)

    updater.run_update(update_root=False)

    # Reboot to complete stateful update.
    self.reboot(timeout=self.REBOOT_TIMEOUT, wait=True)

    # NOTE(review): the command ends in `echo $?`, so its exit status is
    # that of `echo`, not of `test -f`; the comparison with 1 below looks
    # like it can never detect a leftover marker file. The intended
    # polarity is not evident from this code, so behavior is kept as-is;
    # confirm and fix separately.
    for marker in marker_paths:
        outcome = self.run('test -f %s; echo $?' % marker,
                           ignore_status=True)
        if outcome.exit_status == 1:
            return False
    return True
589
590
def _post_update_processing(self, updater, expected_kernel=None):
    """After the DUT is updated, confirm machine_install succeeded.

    Marks the DUT as a lab machine, restarts the autoreboot job, asks
    `updater` to verify the boot expectations and the installed
    version, and finally removes any installed autotest directory.

    @param updater: ChromiumOSUpdater instance used to update the DUT.
    @param expected_kernel: kernel expected to be active after reboot,
                            or `None` to skip rollback checking.

    @raises autoupdater.ChromiumOSError if the version check reports
            that the requested build is not the one installed.

    """
    # Touch the lab machine file to leave a marker that
    # distinguishes this image from other test images.
    # Afterwards, we must re-run the autoreboot script because
    # it depends on the _LAB_MACHINE_FILE.
    self.run('touch %s' % self._LAB_MACHINE_FILE)
    self.run('start autoreboot')

    # The two literals are concatenated by the parser, so the separating
    # space has to live inside one of them ("previous build").
    rollback_message = (
            'Build %s failed to boot on %s; system rolled back to previous '
            'build' % (updater.update_version, self.hostname))
    updater.verify_boot_expectations(
            expected_kernel, rollback_message=rollback_message)

    # Check that we've got the build we meant to install.
    if not updater.check_version_to_confirm_install():
        raise autoupdater.ChromiumOSError(
                'Failed to update %s to build %s; found build '
                '%s instead' % (self.hostname,
                                updater.update_version,
                                self.get_release_version()))

    logging.debug('Cleaning up old autotest directories.')
    try:
        installed_autodir = autotest.Autotest.get_installed_autodir(self)
        self.run('rm -rf ' + installed_autodir)
    except autotest.AutodirNotFoundError:
        logging.debug('No autotest installed directory found.')
623
Dan Shi0f466e82013-02-22 15:44:58 -0800624
def _stage_image_for_update(self, image_name=None):
    """Stage a build on a devserver for an auto-update.

    When no image name is given, the repair image name reported by
    `get_repair_image_name()` is staged instead.

    @param image_name: a name like lumpy-release/R27-3837.0.0
    @returns a tuple `(update_url, devserver)`, where `update_url` looks
             like
             http://172.22.50.205:8082/update/lumpy-release/R27-3837.0.0
             and `devserver` is the devserver instance that was resolved
             for the build.
    """
    build = image_name or self.get_repair_image_name()

    logging.info('Staging build for AU: %s', build)
    image_server = dev_server.ImageServer.resolve(build)
    image_server.trigger_download(build, synchronous=False)

    update_url = tools.image_url_pattern() % (image_server.url(), build)
    return update_url, image_server
Scott Zawalskieadbf702013-03-14 09:23:06 -0400641
642
def stage_image_for_servo(self, image_name=None):
    """Stage a test image on a devserver and return its URL.

    When no image name is given, the repair image name reported by
    `get_repair_image_name()` is staged instead.

    @param image_name: a name like lumpy-release/R27-3837.0.0
    @returns the test image URL reported by the devserver for the
             staged build.
    """
    build = image_name or self.get_repair_image_name()

    logging.info('Staging build for servo install: %s', build)
    image_server = dev_server.ImageServer.resolve(build)
    image_server.stage_artifacts(build, ['test_image'])
    return image_server.get_test_image_url(build)
656
657
def stage_factory_image_for_servo(self, image_name):
    """Stage a factory build on a devserver and return its image URL.

    @param image_name: a name like <board>/4262.204.0

    @return: An update URL, eg:
             http://<devserver>/static/canary-channel/<board>/4262.204.0/
             factory_test/chromiumos_factory_image.bin
             `None` is returned (after logging an error) when no
             image_name is supplied.

    @raises: ValueError if the factory artifact name is missing from
             the config.

    """
    if not image_name:
        logging.error('Need an image_name to stage a factory image.')
        return None

    # The artifact to stage is configurable; an empty value means the
    # config does not name one.
    artifact_name = global_config.global_config.get_config_value(
            'CROS', 'factory_artifact', type=str, default='')
    if not artifact_name:
        raise ValueError('Cannot retrieve the factory artifact name from '
                         'autotest config, and hence cannot stage factory '
                         'artifacts.')

    logging.info('Staging build for servo install: %s', image_name)
    image_server = dev_server.ImageServer.resolve(image_name)
    image_server.stage_artifacts(image_name, [artifact_name],
                                 archive_url=None)

    url_pattern = tools.factory_image_url_pattern()
    return url_pattern % (image_server.url(), image_name)
690
691
def machine_install(self, update_url=None, force_update=False,
                    local_devserver=False, repair=False,
                    force_full_update=False):
    """Install the DUT.

    Use stateful update if the DUT is already running the same build.
    Stateful update does not update kernel and tends to run much faster
    than a full reimage. If the DUT is running a different build, or it
    failed to do a stateful update, full update, including kernel update,
    will be applied to the DUT.

    Once a host enters machine_install its cros_version label will be
    removed as well as its host attribute job_repo_url (used for
    package install).

    @param update_url: The url to use for the update
            pattern: http://$devserver:###/update/$build
            If update_url is None and repair is True we will install the
            stable image listed in afe_stable_versions table. If the table
            is not setup, global_config value under CROS.stable_cros_version
            will be used instead.
    @param force_update: Force an update even if the version installed
            is the same. Default:False
    @param local_devserver: Used by test_that to allow people to
            use their local devserver. Default: False
    @param repair: Forces update to repair image. Implies force_update.
    @param force_full_update: If True, do not attempt to run stateful
            update, force a full reimage. If False, try stateful update
            first when the dut is already installed with the same version.
    @raises autoupdater.ChromiumOSError
    @raises error.AutoservError if there is neither an update URL nor an
            image option from which one can be derived.

    """
    devserver = None
    # Build to re-stage if the devserver turns out to be unhealthy. It
    # stays None in repair mode, in which case _stage_image_for_update()
    # falls back to the repair image. It must be bound here: the retry
    # path below reads it even when the options.image branch is skipped.
    requested_build = None
    if repair:
        update_url, devserver = self._stage_image_for_update()
        force_update = True

    if not update_url and not self._parser.options.image:
        raise error.AutoservError(
                'There is no update URL, nor a method to get one.')

    if not update_url and self._parser.options.image:
        # This is the base case where we have no given update URL i.e.
        # dynamic suites logic etc. This is the most flexible case where we
        # can serve an update from any of our fleet of devservers.
        requested_build = self._parser.options.image
        if not requested_build.startswith('http://'):
            logging.debug('Update will be staged for this installation')
            update_url, devserver = self._stage_image_for_update(
                    requested_build)
        else:
            update_url = requested_build

    logging.debug('Update URL is %s', update_url)

    # Remove cros-version and job_repo_url host attribute from host.
    self.clear_cros_version_labels_and_job_repo_url()

    update_complete = False
    updater = autoupdater.ChromiumOSUpdater(
            update_url, host=self, local_devserver=local_devserver)
    if not force_full_update:
        try:
            # If the DUT is already running the same build, try stateful
            # update first as it's much quicker than a full re-image.
            update_complete = self._try_stateful_update(
                    update_url, force_update, updater)
        except Exception as e:
            # A failed stateful update is not fatal; fall through to the
            # full update below.
            logging.exception(e)

    inactive_kernel = None
    if update_complete or (not force_update and updater.check_version()):
        logging.info('Install complete without full update')
    else:
        logging.info('DUT requires full update.')
        self.reboot(timeout=self.REBOOT_TIMEOUT, wait=True)
        num_of_attempts = provision.FLAKY_DEVSERVER_ATTEMPTS

        while num_of_attempts > 0:
            num_of_attempts -= 1
            try:
                updater.run_update()
            except Exception:
                logging.warning('Autoupdate did not complete.')
                # Do additional check for the devserver health. Ideally,
                # the autoupdater.py could raise an exception when it
                # detected network flake but that would require
                # instrumenting the update engine and parsing it log.
                if (num_of_attempts <= 0 or
                        devserver is None or
                        dev_server.DevServer.devserver_healthy(
                                devserver.url())):
                    raise

                logging.warning('Devserver looks unhealthy. Trying another')
                update_url, devserver = self._stage_image_for_update(
                        requested_build)
                logging.debug('New Update URL is %s', update_url)
                updater = autoupdater.ChromiumOSUpdater(
                        update_url, host=self,
                        local_devserver=local_devserver)
            else:
                break

        # Give it some time in case of IO issues.
        time.sleep(10)

        # Figure out active and inactive kernel.
        active_kernel, inactive_kernel = updater.get_kernel_state()

        # Ensure inactive kernel has higher priority than active.
        if (updater.get_kernel_priority(inactive_kernel)
                < updater.get_kernel_priority(active_kernel)):
            raise autoupdater.ChromiumOSError(
                    'Update failed. The priority of the inactive kernel'
                    ' partition is less than that of the active kernel'
                    ' partition.')

        # Updater has returned successfully; reboot the host.
        self.reboot(timeout=self.REBOOT_TIMEOUT, wait=True)

    self._post_update_processing(updater, inactive_kernel)
    self.add_cros_version_labels_and_job_repo_url(
            autoupdater.url_to_image_name(update_url))
J. Richard Barnette45e93de2012-04-11 17:24:15 -0700816
817
def _clear_fw_version_labels(self):
    """Detach this host from every firmware version label it carries.

    Labels are looked up in the AFE by the firmware RW version prefix
    and restricted to the ones attached to this hostname.
    """
    fw_labels = self._AFE.get_labels(
            name__startswith=provision.FW_RW_VERSION_PREFIX,
            host__hostname=self.hostname)
    for fw_label in fw_labels:
        fw_label.remove_hosts(hosts=[self.hostname])
825
826
def _add_fw_version_label(self, build):
    """Attach the firmware version label for `build` to this host.

    The label is created first if it does not exist yet.

    @param build: Build of firmware.

    """
    label_name = provision.fw_version_to_label(build)
    provision.ensure_label_exists(label_name)
    # The lookup is a prefix match; the first result is the one used.
    matching_labels = self._AFE.get_labels(name__startswith=label_name)
    matching_labels[0].add_hosts([self.hostname])
837
838
def firmware_install(self, build=None):
    """Install firmware to the DUT through its servo.

    The firmware artifacts of `build` are staged on a devserver, the
    firmware tarball is downloaded into a temporary directory, and the
    EC and AP (BIOS) images extracted from it are programmed through
    the servo. The DUT is then reset through the servo power state
    controller.

    Once the images are extracted, the host's fw_version labels are
    removed. After the firmware is updated successfully, a new
    fw_version label is added to the host.

    @param build: The build version to which we want to provision the
                  firmware of the machine,
                  e.g. 'link-firmware/R22-2695.1.144'.
                  When not set, the repair image name of the host is
                  used.

    @raises error.TestError if the host has no servo.

    TODO(dshi): After bug 381718 is fixed, update here with corresponding
                exceptions that could be raised.

    """
    if not self.servo:
        raise error.TestError('Host %s does not have servo.' %
                              self.hostname)

    # TODO(fdeng): use host.get_board() after
    # crbug.com/271834 is fixed.
    board = self._get_board_from_afe()

    # If build is not set, try to install firmware from stable CrOS.
    if not build:
        build = self.get_repair_image_name()

    # U-Boot platforms name the AP image after the board; Depthcharge
    # platforms use a fixed name.
    faft_config = FAFTConfig(board)
    ap_image = ('image-%s.bin' % board) if faft_config.use_u_boot \
            else 'image.bin'
    ec_image = 'ec.bin'

    image_server = dev_server.ImageServer.resolve(build)
    image_server.stage_artifacts(build, ['firmware'])

    workdir = autotemp.tempdir(unique_id='fwimage')
    try:
        tarball_url = self._FW_IMAGE_URL_PATTERN % (image_server.url(),
                                                     build)
        tarball_path = os.path.join(workdir.name,
                                    os.path.basename(tarball_url))

        fetch_cmd = 'wget -O %s %s' % (tarball_path, tarball_url)
        server_utils.system(fetch_cmd, timeout=60)

        extract_cmd = 'tar xf %s -C %s %s %s' % (
                tarball_path, workdir.name, ap_image, ec_image)
        server_utils.system(extract_cmd, timeout=60)

        # Extracting "dts/*" is best effort: a failure here is ignored.
        extract_dts_cmd = 'tar xf %s --wildcards -C %s "dts/*"' % (
                tarball_path, workdir.name)
        server_utils.system(extract_dts_cmd, timeout=60,
                            ignore_status=True)

        self._clear_fw_version_labels()
        logging.info('Will re-program EC now')
        self.servo.program_ec(os.path.join(workdir.name, ec_image))
        logging.info('Will re-program BIOS now')
        self.servo.program_bios(os.path.join(workdir.name, ap_image))
        self.servo.get_power_state_controller().reset()
        time.sleep(self.servo.BOOT_DELAY)
        self._add_fw_version_label(build)
    finally:
        # Always remove the downloaded/extracted files.
        workdir.clean()
904
905
def show_update_engine_log(self):
    """Dump the update engine log by running `cat` on it on the host."""
    log_path = client_constants.UPDATE_ENGINE_LOG
    logging.debug('Dumping %s', log_path)
    self.run('cat %s' % log_path)
Dan Shi10e992b2013-08-30 11:02:59 -0700910
911
def _get_board_from_afe(self):
    """Retrieve this host's board from its labels in the AFE.

    Delegates to `server_utils.get_board_from_afe()`, which per the
    original documentation looks for a host label of the form
    "board:<board>" and yields the "<board>" part, or `None` when there
    is not a single, unique label matching the pattern.

    @returns board from label, or `None`.
    """
    board = server_utils.get_board_from_afe(self.hostname, self._AFE)
    return board
Simran Basi833814b2013-01-29 13:13:43 -0800922
923
def get_build(self):
    """Retrieve the current build for this Host from the AFE.

    Delegates to `server_utils.get_build_from_afe()`, which per the
    original documentation inspects this host's labels in the AFE to
    determine its build.

    @returns The current build or None if it could not find it or if there
             were multiple build labels assigned to this host.
    """
    build = server_utils.get_build_from_afe(self.hostname, self._AFE)
    return build
Richard Barnette82c35912012-11-20 10:09:10 -0800933
934
def _install_repair(self):
    """Attempt to repair this host using the update-engine.

    If the host is up, run `machine_install(repair=True)` to install
    the stable "repair" version of Chrome OS. A failed install is
    logged and re-raised to the caller.

    @raises AutoservRepairMethodNA if the DUT is not reachable.
    @raises ChromiumOSError if the install failed for some reason.

    """
    reachable = self.is_up()
    if not reachable:
        raise error.AutoservRepairMethodNA('DUT unreachable for install.')

    logging.info('Attempting to reimage machine to repair image.')
    try:
        self.machine_install(repair=True)
    except autoupdater.ChromiumOSError as install_error:
        # Record the failure, then let the caller decide what to do.
        logging.exception(install_error)
        logging.info('Repair via install failed.')
        raise
Scott Zawalski89c44dd2013-02-26 09:28:02 -0500956
957
def _install_repair_with_powerwash(self):
    """Powerwash the DUT, then repair it using update-engine.

    update-engine may fail due to a bad image. In such case, powerwash
    may help to cleanup the DUT for update-engine to work again.

    The powerwash is requested by writing "fast safe" to the
    factory_install_reset file on the stateful partition and rebooting.

    @raises AutoservRepairMethodNA if the DUT is not reachable.
    @raises AutoservRepairFailure if the DUT does not come back after
            the powerwash reboot.
    @raises ChromiumOSError if the install failed for some reason.

    """
    if not self.is_up():
        raise error.AutoservRepairMethodNA('DUT unreachable for install.')

    logging.info('Attempting to powerwash the DUT.')
    request_powerwash_cmd = ('echo "fast safe" > '
                             '/mnt/stateful_partition/factory_install_reset')
    self.run(request_powerwash_cmd)
    self.reboot(timeout=self.POWERWASH_BOOT_TIMEOUT, wait=True)

    if self.is_up():
        logging.info('Powerwash succeeded.')
        self._install_repair()
        return

    logging.error('Powerwash failed. DUT did not come back after '
                  'reboot.')
    raise error.AutoservRepairFailure(
            'DUT failed to boot from powerwash after %d seconds' %
            self.POWERWASH_BOOT_TIMEOUT)
984
985
def servo_install(self, image_url=None, usb_boot_timeout=USB_BOOT_TIMEOUT,
                  install_timeout=INSTALL_TIMEOUT):
    """
    Re-install the OS on the DUT by:
    1) installing a test image on a USB storage device attached to the Servo
            board,
    2) booting that image in recovery mode, and then
    3) installing the image with chromeos-install.

    Both the USB boot and the install phase are timed with a stats
    timer keyed by the corresponding timeout value.

    @param image_url: If specified use as the url to install on the DUT.
            otherwise boot the currently staged image on the USB stick.
    @param usb_boot_timeout: The usb_boot_timeout to use during reimage.
            Factory images need a longer usb_boot_timeout than regular
            cros images.
    @param install_timeout: The timeout to use when installing the chromeos
            image. Factory images need a longer install_timeout.

    @raises AutoservRepairFailure if the DUT fails to boot from USB.
    @raises AutoservError if the installed image fails to boot.

    """
    # Phase 1: put the image on the USB stick and boot from it.
    usb_boot_timer_key = ('servo_install.usb_boot_timeout_%s'
                          % usb_boot_timeout)
    logging.info('Downloading image to USB, then booting from it. Usb boot '
                 'timeout = %s', usb_boot_timeout)
    usb_boot_timer = autotest_stats.Timer(usb_boot_timer_key)
    usb_boot_timer.start()
    self.servo.install_recovery_image(image_url)
    booted_from_usb = self.wait_up(timeout=usb_boot_timeout)
    if not booted_from_usb:
        raise error.AutoservRepairFailure(
                'DUT failed to boot from USB after %d seconds' %
                usb_boot_timeout)
    usb_boot_timer.stop()

    # Phase 2: install from the USB image onto the DUT, then halt.
    install_timer_key = ('servo_install.install_timeout_%s'
                         % install_timeout)
    install_timer = autotest_stats.Timer(install_timer_key)
    install_timer.start()
    logging.info('Installing image through chromeos-install.')
    self.run('chromeos-install --yes', timeout=install_timeout)
    self.run('halt')
    install_timer.stop()

    # Phase 3: power cycle into the freshly installed image.
    logging.info('Power cycling DUT through servo.')
    self.servo.get_power_state_controller().power_off()
    self.servo.switch_usbkey('off')
    # N.B. The Servo API requires that we use power_on() here
    # for two reasons:
    #  1) After turning on a DUT in recovery mode, you must turn
    #     it off and then on with power_on() once more to
    #     disable recovery mode (this is a Parrot specific
    #     requirement).
    #  2) After power_off(), the only way to turn on is with
    #     power_on() (this is a Storm specific requirement).
    self.servo.get_power_state_controller().power_on()

    logging.info('Waiting for DUT to come back up.')
    came_back = self.wait_up(timeout=self.BOOT_TIMEOUT)
    if not came_back:
        raise error.AutoservError('DUT failed to reboot installed '
                                  'test image after %d seconds' %
                                  self.BOOT_TIMEOUT)
1047
1048
def _servo_repair_reinstall(self):
    """Reinstall the DUT utilizing servo and a test image.

    Stages the repair test image with `stage_image_for_servo()` and
    hands its URL to `servo_install()`, which re-installs the OS by:
    1) installing a test image on a USB storage device attached to the Servo
            board,
    2) booting that image in recovery mode, and then
    3) installing the image with chromeos-install.

    @raises AutoservRepairMethodNA if the device does not have servo
            support.

    """
    if not self.servo:
        raise error.AutoservRepairMethodNA('Repair Reinstall NA: '
                                           'DUT has no servo support.')

    logging.info('Attempting to recovery servo enabled device with '
                 'servo_repair_reinstall')

    self.servo_install(self.stage_image_for_servo())
1071
1072
def _servo_repair_power(self):
    """Attempt to repair DUT using an attached Servo.

    Powers the DUT off and back on through the servo power state
    controller, then waits for it to come up.

    @raises AutoservRepairMethodNA if the device does not have servo
            support.
    @raises AutoservRepairFailure if the DUT does not come back up
            within BOOT_TIMEOUT.
    """
    if not self.servo:
        raise error.AutoservRepairMethodNA('Repair Power NA: '
                                           'DUT has no servo support.')

    logging.info('Attempting to recover servo enabled device by '
                 'powering it off and on.')
    self.servo.get_power_state_controller().power_off()
    self.servo.get_power_state_controller().power_on()

    if not self.wait_up(self.BOOT_TIMEOUT):
        raise error.AutoservRepairFailure(
                'DUT did not boot after long_press.')
Richard Barnette03a0c132012-11-05 12:40:35 -08001094
1095
def _powercycle_to_repair(self):
    """Utilize the RPM Infrastructure to bring the host back up.

    The host is power cycled and given BOOT_TIMEOUT to come up. If it
    does not, the cycle is repeated until the host is up or the number
    of failed cycles reaches _MAX_POWER_CYCLE_ATTEMPTS; repeated cycles
    are meant to trigger the auto fallback to the last good install.

    @raises AutoservRepairMethodNA if the device does not support remote
            power.
    @raises AutoservRepairFailure if the repair fails for any reason.

    """
    if not self.has_power():
        raise error.AutoservRepairMethodNA('Device does not support power.')

    logging.info('Attempting repair via RPM powercycle.')
    failures = 0
    while True:
        self.power_cycle()
        if self.wait_up(timeout=self.BOOT_TIMEOUT):
            break
        failures += 1
        if failures >= self._MAX_POWER_CYCLE_ATTEMPTS:
            raise error.AutoservRepairFailure(
                    'Powercycled host %s %d times; device did not come back'
                    ' online.' % (self.hostname, failures))

    if failures:
        logging.info('Powercycling was successful after %d failures.',
                     failures)
    else:
        logging.info('Powercycling was successful first time.')
1126
1127
def _reboot_repair(self):
    """SSH to this host and reboot.

    @raises AutoservRepairMethodNA if the DUT is not up within
            _CHECK_HOST_UP_TIMEOUT_SECS.
    """
    reachable = self.is_up(self._CHECK_HOST_UP_TIMEOUT_SECS)
    if not reachable:
        raise error.AutoservRepairMethodNA('DUT unreachable for reboot.')

    logging.info('Attempting repair via SSH reboot.')
    self.reboot(timeout=self.BOOT_TIMEOUT, wait=True)
1134
1135
def check_device(self):
    """Check if a device is ssh-able, and if so, clean and verify it.

    Runs, in order: `ssh_ping()`, `cleanup()` and `verify()`. The first
    step that raises aborts the remaining ones.

    @raise AutoservSSHTimeout: If the ssh ping times out.
    @raise AutoservSshPermissionDeniedError: If ssh ping fails due to
                                             permissions.
    @raise AutoservSshPingHostError: For other AutoservRunErrors during
                                     ssh_ping.
    @raises AutoservError: As appropriate, during cleanup and verify.
    """
    # Reachability first; cleaning and verifying need a live connection.
    self.ssh_ping()

    self.cleanup()

    self.verify()
1149
1150
def repair_full(self):
    """Repair a host for repair level NO_PROTECTION.

    This overrides the base class function for repair; it does
    not call back to the parent class, but instead offers a
    simplified implementation based on the capabilities in the
    Chrome OS test lab.

    It first tries to repair the servo host when one is configured
    but no servo object is available yet.

    This escalates in order through the following procedures and verifies
    the status using `self.check_device()` after each of them. This is done
    until both the repair and the verifying step succeed.

    Escalation order of repair procedures from less intrusive to
    more intrusive repairs:
      1. SSH to the DUT and reboot.
      2. If there's a servo for the DUT, try to power the DUT off and
         on.
      3. If the DUT can be power-cycled via RPM, try to repair
         by power-cycling.
      4. Try to re-install to a known stable image using
         auto-update.
      5. Powerwash the DUT, then try the auto-update re-install again.
      6. If there's a servo for the DUT, try to re-install via
         the servo.

    Every attempt is recorded in stats counters, both overall and per
    board (when the board is known).

    As with the parent method, the last operation performed on
    the DUT must be to call `self.check_device()`.

    @raises AutoservRepairTotalFailure if the repair process fails to
            fix the DUT.

    """
    # Caution: Deleting shards relies on repair to always reboot the DUT.

    if self._servo_host and not self.servo:
        try:
            self._servo_host.repair_full()
        except Exception as e:
            # A broken servo host must not prevent repairing the DUT.
            logging.error('Could not create a healthy servo: %s', e)
        self.servo = self._servo_host.get_servo()

    self.try_collect_crashlogs()

    # TODO(scottz): This should use something similar to label_decorator,
    # but needs to be populated in order so DUTs are repaired with the
    # least amount of effort.
    repair_funcs = (self._reboot_repair,
                    self._servo_repair_power,
                    self._powercycle_to_repair,
                    self._install_repair,
                    self._install_repair_with_powerwash,
                    self._servo_repair_reinstall)
    errors = []
    board = self._get_board_from_afe()

    def _count(method, outcome):
        """Bump the overall and, if known, per-board outcome counters."""
        autotest_stats.Counter(
                '%s.%s' % (method.__name__, outcome)).increment()
        if board:
            autotest_stats.Counter(
                    '%s.%s.%s' % (method.__name__, board,
                                  outcome)).increment()

    for repair_func in repair_funcs:
        try:
            repair_func()
            self.try_collect_crashlogs()
            self.check_device()
            _count(repair_func, 'SUCCEEDED')
            return
        except error.AutoservRepairMethodNA as e:
            _count(repair_func, 'RepairNA')
            logging.warning('Repair function NA: %s', e)
            errors.append(str(e))
        except Exception as e:
            _count(repair_func, 'FAILED')
            logging.warning('Failed to repair device: %s', e)
            errors.append(str(e))

    # Every procedure was either not applicable or failed.
    autotest_stats.Counter('Full_Repair_Failed').increment()
    if board:
        autotest_stats.Counter(
                'Full_Repair_Failed.%s' % board).increment()
    raise error.AutoservRepairTotalFailure(
            'All attempts at repairing the device failed:\n%s' %
            '\n'.join(errors))
Richard Barnette82c35912012-11-20 10:09:10 -08001250
1251
def try_collect_crashlogs(self, check_host_up=True):
    """
    Collect crash logs from the host if a crashed job left them pending.

    Nothing is done when the host carries no need_crash_logs attribute.
    Any failure is logged and swallowed, so this never breaks the caller.

    @param check_host_up: When True (the default), logs are collected only
            if the host answers is_up() within
            _CHECK_HOST_UP_TIMEOUT_SECS. When False the check is skipped.
    """
    try:
        pending_job = self._need_crash_logs()
        if not pending_job:
            return
        logging.debug('%s: Job %s was crashed', self._CRASHLOGS_PREFIX,
                      pending_job)
        if check_host_up and not self.is_up(
                self._CHECK_HOST_UP_TIMEOUT_SECS):
            return
        self._collect_crashlogs(pending_job)
        logging.debug('%s: Completed collecting logs for the '
                      'crashed job %s', self._CRASHLOGS_PREFIX,
                      pending_job)
    except Exception as err:
        # Log collection is best effort: a failure here must not be
        # reported as a repair failure, so everything is suppressed.
        logging.error('%s: Failed while trying to collect crash-logs: %s',
                      self._CRASHLOGS_PREFIX, err)
1275
1276
def _need_crash_logs(self):
    """Look up the need_crash_logs attribute of this host in the AFE.

    @return: Value string of the need_crash_logs attribute, or
             None if the host has no such attribute.
    """
    matches = self._AFE.get_host_attribute(
            constants.CRASHLOGS_HOST_ATTRIBUTE, hostname=self.hostname)
    # At most one attribute entry is expected for a single host.
    assert len(matches) < 2
    if not matches:
        return None
    return matches[0].value
1287
1288
def _collect_crashlogs(self, job_id):
    """Pull logs off a host on which a job crashed.

    Prior logs (PRIOR_LOGS_DIR) are preferred when they exist on the
    host. Otherwise, if the lab-machine marker (_LAB_MACHINE_FILE)
    exists, the normal system logs are collected instead. If neither is
    present, nothing is collected and a warning is logged.

    Whatever happened above, a marker file carrying the job id is then
    written and the need_crash_logs attribute is cleared, so collection
    is attempted only once per crash.

    @param job_id: Id of the job that was crashed.
    """
    dest_dir = crashcollect.get_crashinfo_dir(
            self, constants.CRASHLOGS_DEST_DIR_PREFIX)

    had_prior_logs = False
    if self.path_exists(client_constants.PRIOR_LOGS_DIR):
        had_prior_logs = True
        self._collect_prior_logs(dest_dir)
    elif self.path_exists(self._LAB_MACHINE_FILE):
        self._collect_system_logs(dest_dir)
    else:
        logging.warning('%s: Host was manually re-installed without '
                        '--lab_preserve_log option. Skip collecting '
                        'crash-logs.', self._CRASHLOGS_PREFIX)

    # Crash collection is a one-time effort.
    # _collect_prior_logs() and _collect_system_logs() catch their own
    # exceptions, so the code below runs even when they fail.
    # This method is called only when the host is up (see
    # try_collect_crashlogs()), and the collectors are assumed to fail
    # rarely in that state. It is also unclear how many retries would be
    # reasonable without triggering another repair unnecessarily.
    # Therefore, crash collection is tried exactly once.

    # Drop the marker as soon as collection is done; it records the job
    # id for gs_offloader to consume.
    marker_path = os.path.join(dest_dir, constants.CRASHLOGS_MARKER)
    with open(marker_path, 'a') as marker:
        marker.write('%s\n' % job_id)

    # Clear the need_crash_logs attribute.
    logging.debug('%s: Remove attribute need_crash_logs from host %s',
                  self._CRASHLOGS_PREFIX, self.hostname)
    self._AFE.set_host_attribute(constants.CRASHLOGS_HOST_ATTRIBUTE,
                                 None, hostname=self.hostname)

    if not had_prior_logs:
        return
    logging.debug('%s: Remove %s from host %s', self._CRASHLOGS_PREFIX,
                  client_constants.PRIOR_LOGS_DIR, self.hostname)
    self.run('rm -rf %s; sync' % client_constants.PRIOR_LOGS_DIR)
    # Give the removal a few seconds to settle all the way down to
    # storage.
    time.sleep(self._SAFE_WAIT_SECS)
1345
1346
def _collect_prior_logs(self, crashlogs_dir):
    """Fetch the logs stashed on the host before it was re-installed.

    Failures are logged and not propagated.

    @param crashlogs_dir: Directory path where crash-logs are stored.
    """
    log_tag = self._CRASHLOGS_PREFIX
    prior_dir = client_constants.PRIOR_LOGS_DIR
    logging.debug('%s: Found %s, collecting them...', log_tag, prior_dir)
    try:
        self.collect_logs(prior_dir, crashlogs_dir, False)
        logging.debug('%s: %s is collected', log_tag, prior_dir)
    except Exception as err:
        logging.error('%s: Failed to collect %s: %s',
                      log_tag, prior_dir, err)
1363
1364
def _collect_system_logs(self, crashlogs_dir):
    """Fetch the regular system logs from a host.

    The list of sources is read from _LOGS_TO_COLLECT_FILE. Each source
    is handled independently: a failure on one is logged and the next
    one is still attempted.

    @param crashlogs_dir: Directory path where crash-logs are stored.
    """
    logging.debug('%s: Found %s, collecting system logs...',
                  self._CRASHLOGS_PREFIX, self._LAB_MACHINE_FILE)
    for src in server_utils.parse_simple_config(
            self._LOGS_TO_COLLECT_FILE):
        try:
            if not self.path_exists(src):
                continue
            logging.debug('%s: Collecting %s...',
                          self._CRASHLOGS_PREFIX, src)
            target = server_utils.concat_path_except_last(
                    crashlogs_dir, src)
            self.collect_logs(src, target, False)
            logging.debug('%s: %s is collected',
                          self._CRASHLOGS_PREFIX, src)
        except Exception as err:
            logging.error('%s: Failed to collect %s: %s',
                          self._CRASHLOGS_PREFIX, src, err)
1386
1387
def close(self):
    """Disconnect all rpc connections, then run the parent close()."""
    # Disconnect the rpc connections before delegating to the parent.
    self.rpc_disconnect_all()
    super(CrosHost, self).close()
J. Richard Barnette1d78b012012-05-15 13:56:30 -07001391
1392
def get_power_supply_info(self):
    """Run power_supply_info on the DUT and parse its output.

    power_supply_info prints one section per power supply, e.g.,
    Device: Line Power
      online:                  no
      type:                    Mains
      voltage (V):             0
      current (A):             0
    Device: Battery
      state:                   Discharging
      percentage:              95.9276
      technology:              Li-ion

    Each "Device:" line opens a new section; the "key: value" lines that
    follow belong to that device. Lines that do not split into exactly
    two parts on ':' are ignored.

    @return: Dictionary keyed by device name, whose values are
             dictionaries of that device's details, e.g.,
             {'Line Power': {'online': 'yes', 'type': 'Mains'},
              'Battery': {'vendor': 'xyz', 'percentage': '100'}}
    @raise error.AutoservRunError if power_supply_info tool is not found in
           the DUT. Caller should handle this error to avoid false failure
           on verification.
    """
    output = self.run('power_supply_info').stdout.strip()
    devices = {}
    current_name = None
    current_fields = {}
    for raw_line in output.split('\n'):
        parts = [part.strip() for part in raw_line.split(':')]
        if len(parts) != 2:
            continue
        key, value = parts
        if key != 'Device':
            current_fields[key] = value
            continue
        # A new section starts: file the one collected so far.
        if current_name:
            devices[current_name] = current_fields
        current_name, current_fields = value, {}
    # The last section has no following "Device:" line to flush it.
    if current_name and current_name not in devices:
        devices[current_name] = current_fields
    return devices
1437
1438
def get_battery_percentage(self):
    """Read the battery charge level from power_supply_info.

    @return: The battery level as a float (the 'percentage' field of the
             'Battery' device). None if the information is missing, is
             not a number, or the command failed to run.
    """
    try:
        supply_info = self.get_power_supply_info()
        logging.info(supply_info)
        battery = supply_info['Battery']
        return float(battery['percentage'])
    except (KeyError, ValueError, error.AutoservRunError):
        return None
1451
1452
def is_ac_connected(self):
    """Tell whether power_supply_info reports line power as online.

    @return: True if the 'Line Power' device reports online == 'yes',
             False if it reports anything else, and None if the
             information is missing or the command failed to run.
    """
    try:
        line_power = self.get_power_supply_info()['Line Power']
        return line_power['online'] == 'yes'
    except (KeyError, error.AutoservRunError):
        return None
Dan Shi49ca0932014-11-14 11:22:27 -08001463
1464
def _cleanup_poweron(self):
    """Special cleanup method to make sure hosts always get power back.

    Does nothing unless the AFE host record carries the
    _RPM_OUTLET_CHANGED attribute. Otherwise the outlet is powered on
    and the attribute is cleared.

    If powering on fails, the failure is reported and then:
      - re-raised when the battery level is known and below 50%;
      - otherwise tolerated. When the power adapter is reported as
        connected, the attribute is cleared as well.

    @raise rpm_client.RemotePowerException: If the RPM could not turn
            power on and the battery level is known to be below 50%.
    """
    afe = frontend_wrappers.RetryingAFE(timeout_min=5, delay_sec=10)
    hosts = afe.get_hosts(hostname=self.hostname)
    if not hosts or not (self._RPM_OUTLET_CHANGED in
                         hosts[0].attributes):
        return
    logging.debug('This host has recently interacted with the RPM'
                  ' Infrastructure. Ensuring power is on.')
    try:
        self.power_on()
        afe.set_host_attribute(self._RPM_OUTLET_CHANGED, None,
                               hostname=self.hostname)
    except rpm_client.RemotePowerException:
        logging.error('Failed to turn Power On for this host after '
                      'cleanup through the RPM Infrastructure.')
        autotest_es.post(
                type_str='RPM_poweron_failure',
                metadata={'hostname': self.hostname})

        battery_percentage = self.get_battery_percentage()
        # Compare against None explicitly: a reading of 0.0 is falsy but
        # is the lowest possible level, not an unknown one.
        if battery_percentage is not None and battery_percentage < 50:
            raise
        elif self.is_ac_connected():
            logging.info('The device has power adapter connected and '
                         'charging. No need to try to turn RPM on '
                         'again.')
            afe.set_host_attribute(self._RPM_OUTLET_CHANGED, None,
                                   hostname=self.hostname)
        logging.info('Battery level is now at %s%%. The device may '
                     'still have enough power to run test, so no '
                     'exception will be raised.', battery_percentage)
1497
Simran Basi5e6339a2013-03-21 11:34:32 -07001498
beepsc87ff602013-07-31 21:53:00 -07001499 def _is_factory_image(self):
1500 """Checks if the image on the DUT is a factory image.
1501
1502 @return: True if the image on the DUT is a factory image.
1503 False otherwise.
1504 """
1505 result = self.run('[ -f /root/.factory_test ]', ignore_status=True)
1506 return result.exit_status == 0
1507
1508
def _restart_ui(self):
    """Stop and start the Chrome UI job, then wait for Chrome.

    @raises: FactoryImageCheckerException for factory images, since
             we cannot attempt to restart ui on them.
             error.AutoservRunError for any other type of error that
             occurs while restarting ui.
    """
    on_factory_image = self._is_factory_image()
    if on_factory_image:
        raise FactoryImageCheckerException('Cannot restart ui on factory '
                                           'images')

    # TODO(jrbarnette): The command to stop/start the ui job
    # should live inside cros_ui, too.  However that would seem
    # to imply interface changes to the existing start()/restart()
    # functions, which is a bridge too far (for now).
    # The session ident is captured before the restart and handed to the
    # wait call afterwards.
    session_ident = cros_ui.get_chrome_session_ident(self)
    self.run('stop ui; start ui')
    cros_ui.wait_for_chrome_ready(session_ident, self)
beepsc87ff602013-07-31 21:53:00 -07001528
1529
def get_release_version(self):
    """Read CHROMEOS_RELEASE_VERSION from the DUT's lsb-release file.

    @returns The version string in lsb-release, under attribute
             CHROMEOS_RELEASE_VERSION.
    """
    cat_cmd = 'cat "%s"' % client_constants.LSB_RELEASE
    content = self.run(cat_cmd).stdout.strip()
    return lsbrelease_utils.get_chromeos_release_version(
            lsb_release_content=content)
1540
1541
def verify_cros_version_label(self):
    """Make sure host's cros-version label match the actual image in dut.

    Every cros-version label of this host that does not match the
    release version installed on the dut is removed from the host. If at
    least one label was removed, the mismatch is reported and an error
    is raised.

    @raise error.AutoservError: If any mismatch between cros-version label
                                and the build installed in dut is found.
    """
    labels = self._AFE.get_labels(
            name__startswith=ds_constants.VERSION_PREFIX,
            host__hostname=self.hostname)
    mismatch_found = False
    if labels:
        # Get CHROMEOS_RELEASE_VERSION from lsb-release, e.g., 6908.0.0.
        # Note that it's different from cros-version label, which has
        # builder and branch info, e.g.,
        # cros-version:peppy-release/R43-6908.0.0
        release_version = self.get_release_version()
        host_list = [self.hostname]
        for label in labels:
            # Remove any cros-version label that does not match
            # release_version.
            build_version = label.name[len(ds_constants.VERSION_PREFIX):]
            if not utils.version_match(build_version, release_version):
                logging.warning('cros-version label "%s" does not match '
                                'release version %s. Removing the label.',
                                label.name, release_version)
                label.remove_hosts(hosts=host_list)
                mismatch_found = True
    if mismatch_found:
        autotest_es.post(use_http=True,
                         type_str='cros_version_label_mismatch',
                         metadata={'hostname': self.hostname})
        raise error.AutoservError('The host has wrong cros-version label.')
1579
1580
def cleanup(self):
    """Clean up the DUT after a test.

    Removes the CLEANUP_LOGS_PAUSED_FILE, restarts the UI (falling back
    to the parent cleanup when that fails), restores power if the host
    has power control, and finally verifies the cros-version label.
    """
    self.run('rm -f %s' % client_constants.CLEANUP_LOGS_PAUSED_FILE)
    restart_failures = (error.AutotestRunError, error.AutoservRunError,
                        FactoryImageCheckerException)
    try:
        self._restart_ui()
    except restart_failures:
        logging.warning('Unable to restart ui, rebooting device.')
        # The UI could not be restarted, so fall back to the normal
        # Autotest cleanup routines, i.e. reboot the machine.
        super(CrosHost, self).cleanup()
    # Check if the rpm outlet was manipulated.
    if self.has_power():
        self._cleanup_poweron()
    self.verify_cros_version_label()
J. Richard Barnette45e93de2012-04-11 17:24:15 -07001595
1596
def reboot(self, **dargs):
    """
    Reboot the site host.

    The more generic RemoteHost.reboot() performs sync and sleeps for 5
    seconds.  This is not necessary for Chrome OS devices as the
    sync should be finished in a short time during the reboot
    command.

    Defaults filled in when the caller did not supply them:
      - reboot_cmd: a backgrounded `reboot`, followed by `reboot -f`
        after `reboot_timeout` seconds (10 if not given).
      - fastsync: True.
    The 'board' entry is always set from get_board(), with everything up
    to the first ':' stripped.
    """
    if 'reboot_cmd' not in dargs:
        force_delay = dargs.get('reboot_timeout', 10)
        cmd_template = ('((reboot & sleep %d; reboot -f &)'
                        ' </dev/null >/dev/null 2>&1 &)')
        dargs['reboot_cmd'] = cmd_template % force_delay
    # Enable fastsync to avoid running extra sync commands before reboot.
    dargs.setdefault('fastsync', True)

    # For purposes of logging reboot times:
    # Get the board name i.e. 'daisy_spring'
    board_label = self.get_board()

    # Strip the prefix and add it to dargs.  A label without ':' is used
    # whole.
    dargs['board'] = board_label.split(':', 1)[-1]
    super(CrosHost, self).reboot(**dargs)
Yu-Ju Honga2be94a2012-07-31 09:48:52 -07001621
1622
def suspend(self, **dargs):
    """
    Suspend the site host.

    'timeout' is always set to the suspend time ('suspend_time', 60
    seconds if not given).  Unless the caller supplies 'suspend_cmd', a
    command is built that programs the rtc0 wake alarm for that many
    seconds and then asks powerd to suspend.
    """
    suspend_time = dargs.get('suspend_time', 60)
    dargs['timeout'] = suspend_time
    if 'suspend_cmd' not in dargs:
        steps = [
            'echo 0 > /sys/class/rtc/rtc0/wakealarm',
            'echo +%d > /sys/class/rtc/rtc0/wakealarm' % suspend_time,
            'powerd_dbus_suspend --delay=0 &',
        ]
        chained = ' && '.join(steps)
        dargs['suspend_cmd'] = ('(( %s )'
                                '< /dev/null >/dev/null 2>&1 &)' % chained)
    super(CrosHost, self).suspend(**dargs)
1636
1637
def upstart_status(self, service_name):
    """Check the status of an upstart init script.

    @param service_name: Service to look up.

    @returns True if the service is running, False otherwise.
    """
    # grep exits non-zero when nothing matches.  ignore_status=True keeps
    # that case from surfacing as a run error, so a service that is not
    # running is reported as False, as documented.
    result = self.run('status %s | grep start/running' % service_name,
                      ignore_status=True)
    return result.stdout.strip() != ''
1647
1648
def verify_software(self):
    """Verify working software on a Chrome OS system.

    Checks, in order:
      1. No crash logs are waiting to be collected from this host.
      2. All conditions tested by the parent version of this
         function.
      3. Sufficient inodes and space in /mnt/stateful_partition.
      4. Sufficient space in /mnt/stateful_partition/encrypted, when
         that path exists.
      5. The system-services upstart job is running.
      6. update_engine answers a simple status request (skipped on
         factory images).
      7. python on the DUT can import cPickle.
      8. The cros-version label matches the installed image.

    @raise error.AutoservCrashLogCollectRequired: If crash logs still
            need to be collected from this host.
    @raise error.AutoservError: If system services are not running.
    """
    def server_setting(key, value_type, fallback):
        """Read one option from the SERVER section of global config."""
        return global_config.global_config.get_config_value(
                'SERVER', key, type=value_type, default=fallback)

    # Check if a job was crashed on this host.
    # If yes, avoid verification until crash-logs are collected.
    if self._need_crash_logs():
        raise error.AutoservCrashLogCollectRequired(
                'Need to collect crash-logs before verification')

    super(CrosHost, self).verify_software()

    stateful_path = '/mnt/stateful_partition'
    self.check_inodes(
            stateful_path,
            server_setting('kilo_inodes_required', int, 100))
    self.check_diskspace(
            stateful_path,
            server_setting('gb_diskspace_required', float, 20.0))

    encrypted_path = '/mnt/stateful_partition/encrypted'
    # Not all targets build with encrypted stateful support.
    if self.path_exists(encrypted_path):
        self.check_diskspace(
                encrypted_path,
                server_setting('gb_encrypted_diskspace_required', float,
                               0.1))

    services_running = self.upstart_status('system-services')
    if not services_running:
        raise error.AutoservError('Chrome failed to reach login. '
                                  'System services not running.')

    # Factory images don't run update engine,
    # goofy controls dbus on these DUTs.
    if not self._is_factory_image():
        self.run('update_engine_client --status')
    # Makes sure python is present, loads and can use built in functions.
    # We have seen cases where importing cPickle fails with undefined
    # symbols in cPickle.so.
    self.run('python -c "import cPickle"')

    self.verify_cros_version_label()
1700
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07001701
def verify_hardware(self):
    """Verify hardware system of a Chrome OS system.

    Logs the following hardware conditions (nothing is enforced):
    1. Battery level.
    2. Is power adapter connected.
    """
    logging.info('Battery percentage: %s', self.get_battery_percentage())
    # Query once: each call runs a command on the DUT, and asking twice
    # could yield two different answers for the same log message.
    ac_connected = self.is_ac_connected()
    if ac_connected is None:
        logging.info('Can not determine if the device has power adapter '
                     'connected.')
    else:
        logging.info('Device %s power adapter connected and charging.',
                     'has' if ac_connected else 'does not have')
Dan Shi49ca0932014-11-14 11:22:27 -08001716
1717
def make_ssh_command(self, user='root', port=22, opts='', hosts_file=None,
                     connect_timeout=None, alive_interval=None):
    """Build the ssh command line, with options tuned for Chrome OS.

    Overrides the default make_ssh_command.  Tuning changes:
      - ConnectTimeout=30; maximum of 30 seconds allowed for an SSH
        connection failure.  Consistency with remote_access.sh.

      - ServerAliveInterval=900; which causes SSH to ping connection every
        900 seconds. In conjunction with ServerAliveCountMax ensures
        that if the connection dies, Autotest will bail out.
        Originally tried 60 secs, but saw frequent job ABORTS where
        the test completed successfully. Later increased from 180 seconds
        to 900 seconds to account for tests where the DUT is suspended for
        longer periods of time.

      - ServerAliveCountMax=3; consistency with remote_access.sh.

      - ConnectionAttempts=4; reduce flakiness in connection errors;
        consistency with remote_access.sh.

      - UserKnownHostsFile=/dev/null; we don't care about the keys.
        Host keys change with every new installation, don't waste
        memory/space saving them.

      - SSH protocol forced to 2; needed for ServerAliveInterval.

    @param user User name to use for the ssh connection.
    @param port Port on the target host to use for ssh connection.
    @param opts Additional options to the ssh command.
    @param hosts_file Ignored.
    @param connect_timeout Ignored.
    @param alive_interval Ignored.

    @return The ssh command string, without the target hostname.
    """
    tuned_options = (
        'StrictHostKeyChecking=no',
        'UserKnownHostsFile=/dev/null',
        'BatchMode=yes',
        'ConnectTimeout=30',
        'ServerAliveInterval=900',
        'ServerAliveCountMax=3',
        'ConnectionAttempts=4',
        'Protocol=2',
    )
    prefix = '/usr/bin/ssh -a -x %s %s %s' % (
            self._ssh_verbosity_flag, self._ssh_options, opts)
    option_args = ''.join(' -o %s' % option for option in tuned_options)
    login_args = ' -l %s -p %d' % (user, port)
    return prefix + option_args + login_args
Fang Deng96667ca2013-08-01 17:46:18 -07001760
1761
def _create_ssh_tunnel(self, port, local_port):
    """Start an ssh process forwarding local_port to port on the host.

    @param port: remote port on the host.
    @param local_port: local forwarding port.

    @return: the tunnel process.
    """
    # Chrome OS on the target closes down most external ports
    # for security.  We could open the port, but doing that
    # would conflict with security tests that check that only
    # expected ports are open.  So, to get to the port on the
    # target we use an ssh tunnel.
    forward_opts = '-n -N -q -L %d:localhost:%d' % (local_port, port)
    tunnel_cmd = '%s %s' % (self.make_ssh_command(opts=forward_opts),
                            self.hostname)
    logging.debug('Full tunnel command: %s', tunnel_cmd)
    tunnel = subprocess.Popen(tunnel_cmd, shell=True, close_fds=True)
    logging.debug('Started ssh tunnel, local = %d'
                  ' remote = %d, pid = %d',
                  local_port, port, tunnel.pid)
    return tunnel
1784
1785
def _setup_rpc(self, port, command_name, remote_pid=None):
    """Open a tunnel to a remote rpc port and record the connection.

    This method assumes that xmlrpc and jsonrpc never conflict, since
    we can only either have an xmlrpc or a jsonrpc server listening on
    a remote port. As such, it enforces a single proxy->remote port
    policy, i.e if one starts a jsonrpc proxy/server from port A->B,
    and then tries to start an xmlrpc proxy forwarded to the same port,
    the xmlrpc proxy will override the jsonrpc tunnel process, however:

    1. None of the methods on the xmlrpc proxy will work because
       the server listening on B is jsonrpc.

    2. The xmlrpc client cannot initiate a termination of the JsonRPC
       server, as the only use case currently is goofy, which is tied to
       the factory image. It is much easier to handle a failed xmlrpc
       call on the client than it is to terminate goofy in this scenario,
       as doing the latter might leave the DUT in a hard to recover state.

    With the current implementation newer rpc proxy connections will
    terminate the tunnel processes of older rpc connections tunneling
    to the same remote port. If methods are invoked on the client
    after this has happened they will fail with connection closed errors.

    @param port: The remote forwarding port.
    @param command_name: The name of the remote process, to terminate
                         using pkill.
    @param remote_pid: Pid of the remote server process, if known. It is
                       stored alongside the tunnel in _rpc_proxy_map.

    @return A url that we can use to initiate the rpc connection.
    """
    # Drop whatever connection is already registered for this port.
    self.rpc_disconnect(port)
    forwarded_port = utils.get_unused_port()
    tunnel = self._create_ssh_tunnel(port, forwarded_port)
    self._rpc_proxy_map[port] = (command_name, tunnel, remote_pid)
    return self._RPC_PROXY_URL % forwarded_port
1821
1822
def xmlrpc_connect(self, command, port, command_name=None,
                   ready_test_name=None, timeout_seconds=10,
                   logfile='/dev/null'):
    """Start an XMLRPC server on the host and return a client for it.

    The `command` argument should be a simple shell command that
    starts an XMLRPC server on the given `port`.  The command
    must not daemonize, and must terminate cleanly on SIGTERM.
    The command is started in the background on the host, and a
    local XMLRPC client for the server is created and returned
    to the caller.

    Note that the process of creating an XMLRPC client makes no
    attempt to connect to the remote server; the caller is
    responsible for determining whether the server is running
    correctly, and is ready to serve requests.

    Optionally, the caller can pass ready_test_name, a string
    containing the name of a method to call on the proxy.  This
    method should take no parameters and return successfully only
    when the server is ready to process client requests.  When
    ready_test_name is set, xmlrpc_connect will block until the
    proxy is ready.  If the readiness call does not succeed, the
    connection is torn down again and the error from the retried call
    propagates to the caller.

    If a server is already running on the remote port, this
    method will kill it and disconnect the tunnel process
    associated with the connection before establishing a new one,
    by consulting the rpc_proxy_map in rpc_disconnect.

    @param command Shell command to start the server.
    @param port Port number on which the server is expected to
                be serving.
    @param command_name String to use as input to `pkill` to
        terminate the XMLRPC server on the host.
    @param ready_test_name String containing the name of a
        method defined on the XMLRPC server.
    @param timeout_seconds Number of seconds to wait
        for the server to become 'ready.'
    @param logfile Logfile to send output when running
        'command' argument.

    @return The XMLRPC client proxy.
    """
    # Clean up any existing state.  If the caller is willing
    # to believe their server is down, we ought to clean up
    # any tunnels we might have sitting around.
    self.rpc_disconnect(port)
    # Start the server on the host.  Redirection in the command
    # below is necessary, because 'ssh' won't terminate until
    # background child processes close stdin, stdout, and
    # stderr.
    launch_cmd = '%s </dev/null >%s 2>&1 & echo $!' % (command, logfile)
    server_pid = self.run(launch_cmd).stdout.rstrip('\n')
    logging.debug('Started XMLRPC server on host %s, pid = %s',
                  self.hostname, server_pid)

    # Tunnel through SSH to be able to reach that remote port.
    tunnel_url = self._setup_rpc(port, command_name,
                                 remote_pid=server_pid)
    proxy = xmlrpclib.ServerProxy(tunnel_url, allow_none=True)

    if ready_test_name is not None:
        # retry.retry logs each attempt; calculate delay_sec to
        # keep log spam to a dull roar.
        retriable_errors = (socket.error,
                            xmlrpclib.ProtocolError,
                            httplib.BadStatusLine)

        @retry.retry(retriable_errors,
                     timeout_min=timeout_seconds / 60.0,
                     delay_sec=min(max(timeout_seconds / 20.0, 0.1), 1))
        def ready_test():
            """ Call proxy.ready_test_name(). """
            getattr(proxy, ready_test_name)()

        server_ready = False
        try:
            logging.info('Waiting %d seconds for XMLRPC server '
                         'to start.', timeout_seconds)
            ready_test()
            server_ready = True
        finally:
            # Runs on every exit path; tear the connection down only
            # when the readiness call did not complete.
            if not server_ready:
                logging.error('Failed to start XMLRPC server.')
                self.rpc_disconnect(port)
    logging.info('XMLRPC server started successfully.')
    return proxy
J. Richard Barnette1d78b012012-05-15 13:56:30 -07001907
J. Richard Barnette1d78b012012-05-15 13:56:30 -07001908
def syslog(self, message, tag='autotest'):
    """Logs a message to syslog on host.

    Both `tag` and `message` are shell-quoted before being handed to
    `logger`, so quotes, `$`, backticks and other shell metacharacters
    in either value are logged literally instead of being interpreted
    by the shell that runs the command.

    @param message String message to log into syslog
    @param tag String tag prefix for syslog

    """
    # shlex.quote is the Python 3 spelling; Python 2 only offers
    # pipes.quote.  Import locally so the file's import block is untouched.
    try:
        from shlex import quote
    except ImportError:
        from pipes import quote

    # '%s' % x keeps the original tolerance for non-string arguments.
    quoted_tag = quote('%s' % tag)
    quoted_message = quote('%s' % message)
    self.run('logger -t %s %s' % (quoted_tag, quoted_message))
1917
1918
def jsonrpc_connect(self, port):
    """Return a jsonrpc proxy that talks to the host over an ssh tunnel.

    This method exists to facilitate communication with goofy (which is
    the default system manager on all factory images) and as such, leaves
    most of the rpc server sanity checking to the caller. Unlike
    xmlrpc_connect, no remote server is started here: the only clients
    of this code are factory tests, for which the goofy system manager
    is built in to the image and starts when the target boots.

    Several jsonrpc proxies could in theory be forwarded to the same
    remote port, provided an rpc server is listening there. Doing so
    risks leaking an existing tunnel process, so older tunnels are
    always disconnected through rpc_disconnect.

    @param port: port on the remote host that is serving this proxy.

    @return: The client proxy, or None when jsonrpclib is unavailable.
    """
    if jsonrpclib:
        # Passing None as the remote name: there is no server process
        # of ours to track on the host.
        rpc_url = self._setup_rpc(port, None)
        client = jsonrpclib.jsonrpc.ServerProxy(rpc_url)
        logging.info('Established a jsonrpc connection through port %s.',
                     port)
        return client

    logging.warning('Jsonrpclib could not be imported. Check that '
                    'site-packages contains jsonrpclib.')
    return None
1949
1950
def rpc_disconnect(self, port):
    """Disconnect from an RPC server on the host.

    Terminates the remote RPC server previously started for
    the given `port`.  Also closes the local ssh tunnel created
    for the connection to the host.  This function does not
    directly alter the state of a previously returned RPC
    client object; however disconnection will cause all
    subsequent calls to methods on the object to fail.

    This function does nothing if requested to disconnect a port
    that was not previously connected via _setup_rpc.

    The local tunnel is torn down and the port is forgotten even
    when stopping the remote server fails, so a failed shutdown
    does not leak the tunnel subprocess.

    @param port Port number passed to a previous call to
                `_setup_rpc()`.

    @exception TestError The remote server was still running after
                         `_RPC_SHUTDOWN_TIMEOUT_SECONDS`.
    """
    if port not in self._rpc_proxy_map:
        return
    remote_name, tunnel_proc, remote_pid = self._rpc_proxy_map[port]
    try:
        if remote_name:
            # We use 'pkill' to find our target process rather than
            # a PID, because the host may have rebooted since
            # connecting, and we don't want to kill an innocent
            # process with the same PID.
            #
            # 'pkill' helpfully exits with status 1 if no target
            # process is found, for which run() will throw an
            # exception.  We don't want that, so we ignore the
            # status.
            self.run("pkill -f '%s'" % remote_name, ignore_status=True)
            if remote_pid:
                logging.info('Waiting for RPC server "%s" shutdown',
                             remote_name)
                start_time = time.time()
                while (time.time() - start_time <
                       self._RPC_SHUTDOWN_TIMEOUT_SECONDS):
                    running_processes = self.run(
                            "pgrep -f '%s'" % remote_name,
                            ignore_status=True).stdout.split()
                    if remote_pid not in running_processes:
                        logging.info('Shut down RPC server.')
                        break
                    time.sleep(self._RPC_SHUTDOWN_POLLING_PERIOD_SECONDS)
                else:
                    # The loop ran out of time without seeing the
                    # server's pid disappear.
                    raise error.TestError('Failed to shutdown RPC server %s' %
                                          remote_name)
    finally:
        # Always release local resources, whether or not the remote
        # side shut down cleanly.
        if tunnel_proc.poll() is None:
            tunnel_proc.terminate()
            logging.debug('Terminated tunnel, pid %d', tunnel_proc.pid)
        else:
            logging.debug('Tunnel pid %d terminated early, status %d',
                          tunnel_proc.pid, tunnel_proc.returncode)
        del self._rpc_proxy_map[port]
J. Richard Barnette1d78b012012-05-15 13:56:30 -07002005
2006
def rpc_disconnect_all(self):
    """Disconnect all known RPC proxy ports.

    rpc_disconnect() removes entries from `_rpc_proxy_map`, so the
    ports are copied into a list first; iterating the live mapping
    while it shrinks is only safe where `keys()` returns a copy.
    """
    for port in list(self._rpc_proxy_map):
        self.rpc_disconnect(port)
J. Richard Barnette1d78b012012-05-15 13:56:30 -07002011
2012
def poor_mans_rpc(self, fun):
    """
    Build a shell command that prints the result of a client utils call.

    Nothing is executed here: the returned string changes into the
    installed autotest `bin` directory and runs a `python -c` one-liner
    that imports `common` and `utils` and prints `utils.<fun>`.  The
    caller is expected to run the command and read its stdout.

    @param fun expression in the client utils namespace, e.g.
               'get_gpu_family()'.
    @return shell command string that prints the value of `fun`.
    """
    autodir = autotest.Autotest.get_installed_autodir(self)
    pieces = [
        'cd %s/bin; ' % autodir,
        'python -c "import common; import utils;',
        'print utils.%s"' % fun,
    ]
    return ''.join(pieces)
2024
2025
def _ping_check_status(self, status):
    """Ping the host a single time and compare against `status`.

    @param status Expected ping status to compare with.
    @return True iff `status` and the result of ping are the same
            (i.e. both True or both False).

    """
    # A ping return value of 0 is treated as "the host answered".
    host_answered = (utils.ping(self.hostname, tries=1, deadline=1) == 0)
    mismatch = status ^ host_answered
    return not mismatch
2036
2037 def _ping_wait_for_status(self, status, timeout):
2038 """Wait for the host to have a given status (UP or DOWN).
2039
2040 Status is checked by polling. Polling will not last longer
2041 than the number of seconds in `timeout`. The polling
2042 interval will be long enough that only approximately
2043 _PING_WAIT_COUNT polling cycles will be executed, subject
2044 to a maximum interval of about one minute.
2045
2046 @param status Waiting will stop immediately if `ping` of the
2047 host returns this status.
2048 @param timeout Poll for at most this many seconds.
2049 @return True iff the host status from `ping` matched the
2050 requested status at the time of return.
2051
2052 """
2053 # _ping_check_status() takes about 1 second, hence the
2054 # "- 1" in the formula below.
2055 poll_interval = min(int(timeout / self._PING_WAIT_COUNT), 60) - 1
2056 end_time = time.time() + timeout
2057 while time.time() <= end_time:
2058 if self._ping_check_status(status):
2059 return True
2060 if poll_interval > 0:
2061 time.sleep(poll_interval)
2062
2063 # The last thing we did was sleep(poll_interval), so it may
2064 # have been too long since the last `ping`. Check one more
2065 # time, just to be sure.
2066 return self._ping_check_status(status)
2067
def ping_wait_up(self, timeout):
    """Wait until the host answers `ping`.

    N.B.  This is not a reliable replacement for `wait_up()`: a
    host that answers ping does not necessarily answer ssh.  Use it
    only when the target DUT counts as functional even though it
    cannot be reached via ssh.

    @param timeout Minimum time to allow before declaring the
                   host to be non-responsive.
    @return True iff the host answered to ping before the timeout.

    """
    wanted_status = self._PING_STATUS_UP
    return self._ping_wait_for_status(wanted_status, timeout)
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07002083
def ping_wait_down(self, timeout):
    """Wait until the host stops answering `ping`.

    This can serve as a slightly faster version of `wait_down()`,
    because it avoids potentially long ssh timeouts.

    @param timeout Minimum time to allow for the host to become
                   non-responsive.
    @return True iff the host quit answering ping before the
            timeout.

    """
    wanted_status = self._PING_STATUS_DOWN
    return self._ping_wait_for_status(wanted_status, timeout)
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07002097
def test_wait_for_sleep(self, sleep_timeout=None):
    """Wait for the client to enter low-power sleep mode.

    "Is asleep" is detected by the host no longer answering ping,
    which looks the same as a system that is powered off; to confirm
    that the unit was asleep, force a resume and then call
    `test_wait_for_resume()`.

    A test is expected to call this function as part of a sequence
    like the following:

    ~~~~~~~~
        boot_id = host.get_boot_id()
        # trigger sleep on the host
        host.test_wait_for_sleep()
        # trigger resume on the host
        host.test_wait_for_resume(boot_id)
    ~~~~~~~~

    @param sleep_timeout time limit in seconds to allow the host sleep;
                         `SLEEP_TIMEOUT` is used when None.

    @exception TestFail The host did not go to sleep within
                        the allowed time.
    """
    timeout = self.SLEEP_TIMEOUT if sleep_timeout is None else sleep_timeout
    if self.ping_wait_down(timeout=timeout):
        return

    raise error.TestFail(
        'client failed to sleep after %d seconds' % timeout)
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07002128
2129
def test_wait_for_resume(self, old_boot_id, resume_timeout=None):
    """Wait for the client to resume from low-power sleep mode.

    `old_boot_id` should be the value `get_boot_id()` returned
    before the host entered sleep mode.  A changed boot id means
    the host rebooted instead of resuming, which is reported as a
    `TestFail`.

    See @ref test_wait_for_sleep for more on this function's
    usage.

    @param old_boot_id A boot id value obtained before the
                           target host went to sleep.
    @param resume_timeout time limit in seconds to allow the host up;
                          `RESUME_TIMEOUT` is used when None.

    @exception TestFail The host did not respond within the
                        allowed time.
    @exception TestFail The host responded, but the boot id test
                        indicated a reboot rather than a sleep
                        cycle.
    """
    timeout = resume_timeout
    if timeout is None:
        timeout = self.RESUME_TIMEOUT

    if not self.wait_up(timeout=timeout):
        raise error.TestFail(
            'client failed to resume from sleep after %d seconds' %
            timeout)

    new_boot_id = self.get_boot_id()
    if new_boot_id == old_boot_id:
        return

    logging.error('client rebooted (old boot %s, new boot %s)',
                  old_boot_id, new_boot_id)
    raise error.TestFail(
        'client rebooted, but sleep was expected')
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07002164
2165
def test_wait_for_shutdown(self, shutdown_timeout=None):
    """Wait for the client to shut down.

    "Has shut down" is detected by the host no longer answering
    ping, which looks the same as a system that is merely asleep; to
    confirm that the unit was down, force a boot and then call
    test_wait_for_boot().

    A test is expected to call this function as part of a sequence
    like the following:

    ~~~~~~~~
        boot_id = host.get_boot_id()
        # trigger shutdown on the host
        host.test_wait_for_shutdown()
        # trigger boot on the host
        host.test_wait_for_boot(boot_id)
    ~~~~~~~~

    @param shutdown_timeout time limit in seconds to allow the host
                            down; `SHUTDOWN_TIMEOUT` is used when None.
    @exception TestFail The host did not shut down within the
                        allowed time.
    """
    timeout = shutdown_timeout
    if timeout is None:
        timeout = self.SHUTDOWN_TIMEOUT

    if self.ping_wait_down(timeout=timeout):
        return

    raise error.TestFail(
        'client failed to shut down after %d seconds' %
        timeout)
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07002195
2196
def test_wait_for_boot(self, old_boot_id=None):
    """Wait for the client to boot from cold power.

    `old_boot_id` should be the value `get_boot_id()` returned
    before shutting down.  An unchanged boot id means the host did
    not actually reboot, which is reported as a `TestFail`.  The
    boot id comparison is skipped when `old_boot_id` is not given.

    See @ref test_wait_for_shutdown for more on this function's
    usage.

    @param old_boot_id A boot id value obtained before the
                           shut down.

    @exception TestFail The host did not respond within the
                        allowed time.
    @exception TestFail The host responded, but the boot id test
                        indicated that there was no reboot.
    """
    if not self.wait_up(timeout=self.REBOOT_TIMEOUT):
        raise error.TestFail(
            'client failed to reboot after %d seconds' %
            self.REBOOT_TIMEOUT)

    if not old_boot_id:
        # Nothing to compare against; being back up is good enough.
        return

    if self.get_boot_id() == old_boot_id:
        logging.error('client not rebooted (boot %s)',
                      old_boot_id)
        raise error.TestFail(
            'client is back up, but did not reboot')
Simran Basid5e5e272012-09-24 15:23:59 -07002227
2228
@staticmethod
def check_for_rpm_support(hostname):
    """Tell whether a hostname matches the lab's RPM naming format.

    @param hostname: hostname to check for rpm support.

    @return None if the hostname does not follow the naming format
            defined for RPM powered DUTs in the lab; otherwise the
            regular expression MatchObject for the hostname.
    """
    rpm_hostname_pattern = CrosHost._RPM_HOSTNAME_REGEX
    return re.match(rpm_hostname_pattern, hostname)
Simran Basid5e5e272012-09-24 15:23:59 -07002240
2241
def has_power(self):
    """Tell whether this host is powered by an RPM, judging by its name.

    @return the (truthy) MatchObject from `check_for_rpm_support()` if
            this host's name follows the defined naming format for RPM
            powered DUTs; None otherwise.
    """
    rpm_match = CrosHost.check_for_rpm_support(self.hostname)
    return rpm_match
Simran Basid5e5e272012-09-24 15:23:59 -07002249
2250
Ismail Noorbasha07fdb612013-02-14 14:13:31 -08002251 def _set_power(self, state, power_method):
2252 """Sets the power to the host via RPM, Servo or manual.
2253
2254 @param state Specifies which power state to set to DUT
2255 @param power_method Specifies which method of power control to
2256 use. By default "RPM" will be used. Valid values
2257 are the strings "RPM", "manual", "servoj10".
2258
2259 """
2260 ACCEPTABLE_STATES = ['ON', 'OFF']
2261
2262 if state.upper() not in ACCEPTABLE_STATES:
2263 raise error.TestError('State must be one of: %s.'
2264 % (ACCEPTABLE_STATES,))
2265
2266 if power_method == self.POWER_CONTROL_SERVO:
2267 logging.info('Setting servo port J10 to %s', state)
2268 self.servo.set('prtctl3_pwren', state.lower())
2269 time.sleep(self._USB_POWER_TIMEOUT)
2270 elif power_method == self.POWER_CONTROL_MANUAL:
2271 logging.info('You have %d seconds to set the AC power to %s.',
2272 self._POWER_CYCLE_TIMEOUT, state)
2273 time.sleep(self._POWER_CYCLE_TIMEOUT)
2274 else:
2275 if not self.has_power():
2276 raise error.TestFail('DUT does not have RPM connected.')
Simran Basi5e6339a2013-03-21 11:34:32 -07002277 afe = frontend_wrappers.RetryingAFE(timeout_min=5, delay_sec=10)
2278 afe.set_host_attribute(self._RPM_OUTLET_CHANGED, True,
2279 hostname=self.hostname)
Simran Basi1df55112013-09-06 11:25:09 -07002280 rpm_client.set_power(self.hostname, state.upper(), timeout_mins=5)
Simran Basid5e5e272012-09-24 15:23:59 -07002281
2282
def power_off(self, power_method=POWER_CONTROL_RPM):
    """Cut power to this host via RPM, Servo or manual.

    @param power_method Which method of power control to use;
                        defaults to `POWER_CONTROL_RPM`.  Valid
                        values are the strings "RPM", "manual",
                        "servoj10".

    """
    target_state = 'OFF'
    self._set_power(target_state, power_method)
Simran Basid5e5e272012-09-24 15:23:59 -07002292
2293
def power_on(self, power_method=POWER_CONTROL_RPM):
    """Restore power to this host via RPM, Servo or manual.

    @param power_method Which method of power control to use;
                        defaults to `POWER_CONTROL_RPM`.  Valid
                        values are the strings "RPM", "manual",
                        "servoj10".

    """
    target_state = 'ON'
    self._set_power(target_state, power_method)
2303
2304
def power_cycle(self, power_method=POWER_CONTROL_RPM):
    """Cycle power to this host by turning it OFF, then ON.

    For the servo and manual methods the cycle is sequenced here
    (off, wait `_POWER_CYCLE_TIMEOUT` seconds, on); for any other
    method a single 'CYCLE' request is sent to the RPM.

    @param power_method Which method of power control to use;
                        defaults to `POWER_CONTROL_RPM`.  Valid
                        values are the strings "RPM", "manual",
                        "servoj10".

    """
    locally_sequenced = (self.POWER_CONTROL_SERVO,
                         self.POWER_CONTROL_MANUAL)
    if power_method not in locally_sequenced:
        rpm_client.set_power(self.hostname, 'CYCLE')
        return

    self.power_off(power_method=power_method)
    time.sleep(self._POWER_CYCLE_TIMEOUT)
    self.power_on(power_method=power_method)
Simran Basic6f1f7a2012-10-16 10:47:46 -07002320
2321
def get_platform(self):
    """Work out the platform label for this host from its firmware id.

    @returns a string representing this host's platform.
    """
    crossystem = utils.Crossystem(self)
    crossystem.init()
    # fwid generally looks like {platform}.{firmware version}, for
    # example Alex.X.YYY.Z or Google_Alex.X.YYY.Z; everything before
    # the first dot is the platform id.
    fwid = crossystem.fwid()
    platform_id = fwid.split('.', 1)[0].lower()
    # Newer platforms carry a 'Google_' prefix that older ones lack.
    return platform_id.replace('google_', '')
2335
2336
def get_architecture(self):
    """Work out the architecture label for this host via crossystem.

    @returns a string representing this host's architecture.
    """
    host_crossystem = utils.Crossystem(self)
    host_crossystem.init()
    architecture = host_crossystem.arch()
    return architecture
2345
2346
def get_chrome_version(self):
    """Return the Chrome version number and milestone as strings.

    Runs the Chrome version command on the host and hands its output
    to `utils.parse_chrome_version()`.

    @return A tuple (chrome_ver, milestone) where "chrome_ver" is the
            current Chrome version number as a string (in the form
            "W.X.Y.Z") and "milestone" is the first component of the
            version number (the "W" from "W.X.Y.Z").  If the version
            number cannot be parsed in the "W.X.Y.Z" format, the
            "chrome_ver" will be the full output of "chrome --version"
            and the milestone will be the empty string.

    """
    chrome_output = self.run(client_constants.CHROME_VERSION_COMMAND)
    return utils.parse_chrome_version(chrome_output.stdout)
2362
@label_decorator()
def get_board(self):
    """Work out the board label for this host from /etc/lsb-release.

    @returns a string representing this host's board.
    """
    release_info = utils.parse_cmd_output('cat /etc/lsb-release',
                                          run_method=self.run)
    board = release_info['CHROMEOS_RELEASE_BOARD']
    board_format_string = ds_constants.BOARD_PREFIX + '%s'
    # Lab devices generally report the plain board name, but development
    # devices report {board_name}-signed-{key_type}.  A leading 'x86-'
    # is part of the board name, so two dash-separated fields are kept
    # in that case and one otherwise.
    name_fields = board.split('-')
    kept_fields = 2 if 'x86' in board else 1
    return board_format_string % '-'.join(name_fields[:kept_fields])
Simran Basic6f1f7a2012-10-16 10:47:46 -07002379
2380
@label_decorator('board_freq_mem')
def get_board_with_frequency_and_memory(self):
    """
    Work out the board name together with frequency and memory.

    The value is computed on the host by the client utils function of
    the same name, reached through poor_mans_rpc().

    @returns a more detailed string representing the board. Examples are
    butterfly_1.1GHz_2GB, link_1.8GHz_4GB, x86-zgb_1.7GHz_2GB
    """
    remote_script = self.poor_mans_rpc(
        'get_board_with_frequency_and_memory()')
    board = self.run(remote_script).stdout
    return 'board_freq_mem:%s' % str.strip(board)
2392
2393
@label_decorator('lightsensor')
def has_lightsensor(self):
    """Tell whether this host has a light sensor.

    @returns the string 'lightsensor' if this host has a lightsensor or
    None if it does not.
    """
    file_alternatives = '|'.join(self._LIGHTSENSOR_FILES)
    search_cmd = "find -L %s -maxdepth 4 | egrep '%s'" % (
        self._LIGHTSENSOR_SEARCH_DIR, file_alternatives)
    try:
        # The search follows symlinks.  stderr_tee is None because a
        # symlink loop makes find print a few messages to stderr even
        # though the command still executes correctly.
        self.run(search_cmd, stdout_tee=None, stderr_tee=None)
    except error.AutoservRunError:
        # egrep exited with status 1: none of the possible lightsensor
        # files exist.
        return None
    return 'lightsensor'
2413
2414
@label_decorator('bluetooth')
def has_bluetooth(self):
    """Tell whether this host has bluetooth.

    @returns the string 'bluetooth' if this host has bluetooth or
    None if it does not.
    """
    try:
        self.run('test -d /sys/class/bluetooth/hci0')
    except error.AutoservRunError:
        # 'test' exited non-zero, i.e. the directory does not exist.
        return None
    # 'test' exited with status 0: the hci0 directory is there.
    return 'bluetooth'
2430
2431
@label_decorator('gpu_family')
def get_gpu_family(self):
    """
    Work out the GPU family of this host.

    The value is computed on the host by the client utils function of
    the same name, reached through poor_mans_rpc().

    @returns a string representing the gpu family. Examples are mali, tegra,
    pinetrail, sandybridge, ivybridge, haswell and baytrail.
    """
    remote_script = self.poor_mans_rpc('get_gpu_family()')
    gpu_family = self.run(remote_script).stdout
    return 'gpu_family:%s' % str.strip(gpu_family)
2442
2443
@label_decorator('graphics')
def get_graphics(self):
    """
    Work out the graphics label for this host.

    @returns a string representing this host's graphics. For now ARM boards
    return graphics:gles while all other boards return graphics:gl. This
    may change over time, but for robustness reasons this should avoid
    executing code in actual graphics libraries (which may not be ready and
    is tested by graphics_GLAPICheck).
    """
    kernel_info = self.run('uname -a').stdout.lower()
    return 'graphics:gles' if 'arm' in kernel_info else 'graphics:gl'
2459
2460
@label_decorator('ec')
def get_ec(self):
    """
    Work out the type of EC on this host.

    @returns a string representing this host's embedded controller type.
    At present, it only returns "ec:cros", for Chrome OS ECs. Other types
    of EC (or none) don't return any strings, since no tests depend on
    those.
    """
    cmd = 'mosys ec info'
    # For a Chrome OS EC the last field of the output matches our EC
    # version scheme:
    #
    #   stm | stm32f100 | snow_v1.3.139-375eb9f
    #   ti | Unknown-10de | peppy_v1.5.114-5d52788
    #
    # Non-Chrome OS ECs look like these instead:
    #
    #   ENE | KB932 | 00BE107A00
    #   ite | it8518 | 3.08
    #
    # And some systems don't have ECs at all (Lumpy, for example).
    regexp = r'^.*\|\s*(\S+_v\d+\.\d+\.\d+-[0-9a-f]+)\s*$'

    ecinfo = self.run(command=cmd, ignore_status=True)
    if ecinfo.exit_status != 0:
        # No EC present
        logging.info("%s exited with status %d", cmd, ecinfo.exit_status)
        return None

    version_match = re.search(regexp, ecinfo.stdout)
    if not version_match:
        # Has an EC, but it's not a Chrome OS EC
        logging.info("%s got: %s", cmd, ecinfo.stdout)
        return None

    logging.info("EC version is %s", version_match.group(1))
    return 'ec:cros'
2498
2499
@label_decorator('accels')
def get_accels(self):
    """
    Work out the type of accelerometers on this host.

    @returns a string representing this host's accelerometer type.
    At present, it only returns "accel:cros-ec", for accelerometers
    attached to a Chrome OS EC, or none, if no accelerometers.
    """
    # Each probe must exit with status 0 for the EC accelerometer check
    # to continue: first that ectool exists, then that the EC supports
    # the motionsense command.
    probes = (
        ('which ectool',
         "No ectool cmd found, assuming no EC accelerometers"),
        ('ectool motionsense',
         "EC does not support motionsense command "
         "assuming no EC accelerometers"),
    )
    for probe_cmd, miss_message in probes:
        if self.run(probe_cmd, ignore_status=True).exit_status:
            logging.info(miss_message)
            return None

    # Check that EC motion sensors are active: the first output line
    # is "0" when they are not.
    first_line = self.run('ectool motionsense active').stdout.split('\n')[0]
    if first_line == "0":
        logging.info("Motion sense inactive, assuming no EC accelerometers")
        return None

    logging.info("EC accelerometers found")
    return 'accel:cros-ec'
2530
2531
@label_decorator('chameleon')
def has_chameleon(self):
    """Tell whether a Chameleon is connected to this host.

    @returns a list containing two strings ('chameleon' and
             'chameleon:' + label, e.g. 'chameleon:hdmi') if this host
             has a Chameleon or None if it has not.
    """
    if not self._chameleon_host:
        return None
    specific_label = 'chameleon:' + self.chameleon.get_label()
    return ['chameleon', specific_label]
2544
2545
@label_decorator('audio_loopback_dongle')
def has_loopback_dongle(self):
    """Tell whether an audio loopback dongle is plugged to this host.

    The dongle is considered present when the CRAS node listing shows
    both a HEADPHONE node and a MIC node as plugged.

    @returns 'audio_loopback_dongle' when there is an audio loopback dongle
                                     plugged to this host.
             None                    when there is no audio loopback dongle
                                     plugged to this host.
    """
    nodes_info = self.run(command=cras_utils.get_cras_nodes_cmd(),
                          ignore_status=True).stdout
    both_plugged = all(
        cras_utils.node_type_is_plugged(node_type, nodes_info)
        for node_type in ('HEADPHONE', 'MIC'))
    if both_plugged:
        return 'audio_loopback_dongle'
    return None
2562
2563
@label_decorator('power_supply')
def get_power_supply(self):
    """
    Work out what type of power supply the host has.

    @returns a string representing this host's power supply.
             'power:battery' when the device has a battery intended for
                    extended use
             'power:AC_primary' when the device has a battery not intended
                    for extended use (for moving the machine, etc)
             'power:AC_only' when the device has no battery at all.
             None when mosys reports the type as 'unknown'.
    """
    psu = self.run(command='mosys psu type', ignore_status=True)
    if psu.exit_status:
        # Not every platform ships the mosys psu command.  When it is
        # missing, the device is assumed to have a battery.
        return 'power:battery'

    psu_str = psu.stdout.strip()
    return None if psu_str == 'unknown' else 'power:%s' % psu_str
2588
2589
@label_decorator('storage')
def get_storage(self):
    """
    Determine the type of boot device for this host.

    Determine if the internal device is SCSI or dw_mmc device.
    Then check that it is SSD or HDD or eMMC or something else.

    Both device-name checks are made against the stripped device path,
    so stray whitespace around the command output cannot make a SCSI
    device go unrecognized.

    @returns a string representing this host's internal device type.
             'storage:ssd' when internal device is solid state drive
             'storage:hdd' when internal device is hard disk drive
             'storage:mmc' when internal device is mmc drive
             None          When internal device is something else or
                           when we are unable to determine the type
    """
    # The output should be /dev/mmcblk* for SD/eMMC or /dev/sd* for scsi
    rootdev_cmd = ' '.join(['. /usr/sbin/write_gpt.sh;',
                            '. /usr/share/misc/chromeos-common.sh;',
                            'load_base_vars;',
                            'get_fixed_dst_drive'])
    rootdev = self.run(command=rootdev_cmd, ignore_status=True)
    if rootdev.exit_status:
        logging.info("Fail to run %s", rootdev_cmd)
        return None
    rootdev_str = rootdev.stdout.strip()

    if not rootdev_str:
        return None

    rootdev_base = os.path.basename(rootdev_str)

    mmc_pattern = '/dev/mmcblk[0-9]'
    if re.match(mmc_pattern, rootdev_str):
        # Use type to determine if the internal device is eMMC or something
        # else. We can assume that MMC is always an internal device.
        type_cmd = 'cat /sys/block/%s/device/type' % rootdev_base
        # Named device_type so the builtin `type` is not shadowed.
        device_type = self.run(command=type_cmd, ignore_status=True)
        if device_type.exit_status:
            logging.info("Fail to run %s", type_cmd)
            return None
        type_str = device_type.stdout.strip()

        if type_str == 'MMC':
            return 'storage:mmc'

    scsi_pattern = '/dev/sd[a-z]+'
    if re.match(scsi_pattern, rootdev_str):
        # Read symlink for /sys/block/sd* to determine if the internal
        # device is connected via ata or usb.
        link_cmd = 'readlink /sys/block/%s' % rootdev_base
        link = self.run(command=link_cmd, ignore_status=True)
        if link.exit_status:
            logging.info("Fail to run %s", link_cmd)
            return None
        link_str = link.stdout.strip()
        if 'usb' in link_str:
            return None

        # Read rotation to determine if the internal device is ssd or hdd.
        rotate_cmd = 'cat /sys/block/%s/queue/rotational' % rootdev_base
        rotate = self.run(command=rotate_cmd, ignore_status=True)
        if rotate.exit_status:
            logging.info("Fail to run %s", rotate_cmd)
            return None
        rotate_str = rotate.stdout.strip()

        rotate_dict = {'0': 'storage:ssd', '1': 'storage:hdd'}
        return rotate_dict.get(rotate_str)

    # All other internal device / error case will always fall here
    return None
2662
2663
@label_decorator('servo')
def get_servo(self):
    """Report the servo label for this host.

    The label is produced whenever self._servo_host is truthy.

    @return: string 'servo' if self._servo_host is set. Otherwise,
             returns None.
    """
    if self._servo_host:
        return 'servo'
    return None
2674
2675
@label_decorator('video_labels')
def get_video_labels(self):
    """Run /usr/local/bin/avtest_label_detect to get a list of video labels.

    Sample output of avtest_label_detect:
    Detected label: hw_video_acc_vp8
    Detected label: webcam

    @return: A list of labels detected by tool avtest_label_detect; an
             empty list if running the tool raises AutoservRunError.
    """
    # Only the remote command can raise AutoservRunError, so keep the
    # try body limited to it.
    try:
        result = self.run('/usr/local/bin/avtest_label_detect').stdout
    except error.AutoservRunError:
        # Presumably the tool is not installed on this host.
        return []
    # Raw string so that \w reaches the regex engine unmodified.
    return re.findall(r'^Detected label: (\w+)$', result, re.M)
2692
2693
@label_decorator('video_glitch_detection')
def is_video_glitch_detection_supported(self):
    """Check whether this host's board has a section in device_spec.conf.

    The board name (with ds_constants.BOARD_PREFIX removed) is looked up
    among the section names of client/cros/video/device_spec.conf.

    @return: 'video_glitch_detection' if board is supported, None otherwise.
    """
    board_name = self.get_board().replace(ds_constants.BOARD_PREFIX, '')
    conf_path = os.path.join(
            common.autotest_dir, 'client/cros/video/device_spec.conf')
    conf = ConfigParser.SafeConfigParser()

    try:
        conf.read(conf_path)
        known_boards = conf.sections()
    except ConfigParser.error:
        # something went wrong while parsing the conf file
        return None

    if board_name in known_boards:
        return 'video_glitch_detection'
    return None
2716
@label_decorator('touch_labels')
def get_touch(self):
    """
    Determine whether board under test has a touchpad or touchscreen.

    Each /dev/input/event* node is dumped with evtest into a scratch file
    on the host, and the dump is classified by InputPlayback. The scan
    stops as soon as both device kinds have been seen.

    @return: A list of some combination of 'touchscreen' and 'touchpad',
             depending on what is present on the device.

    """
    labels = []
    looking_for = ['touchpad', 'touchscreen']
    player = input_playback.InputPlayback()
    input_events = self.run('ls /dev/input/event*').stdout.strip().split()
    filename = '/tmp/touch_labels'
    try:
        for event in input_events:
            # evtest does not exit on its own here; give it one second
            # and ignore the timeout.
            self.run('evtest %s > %s' % (event, filename), timeout=1,
                     ignore_timeout=True)
            properties = self.run('cat %s' % filename).stdout
            input_type = player._determine_input_type(properties)
            if input_type in looking_for:
                labels.append(input_type)
                looking_for.remove(input_type)
            if not looking_for:
                break
    finally:
        # Always remove the scratch file, even when a command above
        # raised. Cleanup is best-effort so it never masks that error.
        self.run('rm -f %s' % filename, ignore_status=True)

    return labels
2744
Hung-ying Tyana39b0542015-06-30 10:36:42 +08002745
@label_decorator('internal_display')
def has_internal_display(self):
    """Determine if the device under test is equipped with an internal
    display.

    The client-side graphics_utils check is reused by temporarily pointing
    utils.system_output and common_utils.read_file at this host.

    @return: 'internal_display' if one is present; None otherwise.
    """
    from autotest_lib.client.cros.graphics import graphics_utils
    from autotest_lib.client.common_lib import utils as common_utils

    def _remote_system_output(cmd):
        return self.run(cmd).stdout

    def _remote_read_file(remote_path):
        return self.run('cat %s' % remote_path).stdout

    # Hijack the necessary client functions so that we can take advantage
    # of the client lib here.
    # FIXME: find a less hacky way than this
    saved_system_output = utils.system_output
    saved_read_file = common_utils.read_file
    utils.system_output = _remote_system_output
    common_utils.read_file = _remote_read_file
    try:
        if graphics_utils.has_internal_display():
            return 'internal_display'
        return None
    finally:
        # Put the real client functions back no matter what happened.
        utils.system_output = saved_system_output
        common_utils.read_file = saved_read_file
2775
2776
def get_labels(self):
    """Return a list of labels for this given host.

    This is the main way to retrieve all the automatic labels for a host
    as it will run through all the currently implemented label functions.

    Each function in self._LABEL_FUNCTIONS is called with this host. A
    string result contributes one label and a list result contributes all
    of its items. Falsy results and results of any other type are skipped.
    A function that raises is logged and ignored.

    @return: A flat list of label strings.
    """
    labels = []
    for label_function in self._LABEL_FUNCTIONS:
        try:
            label = label_function(self)
        except Exception:
            # One broken detector must not prevent the others from
            # running; logging.exception records the traceback.
            logging.exception('Label function %s failed; ignoring it.',
                              label_function.__name__)
            continue
        if not label:
            continue
        # isinstance, unlike an exact type() comparison, also accepts
        # subclasses of str and list.
        if isinstance(label, str):
            labels.append(label)
        elif isinstance(label, list):
            labels.extend(label)
    return labels
Dan Shi85276d42014-04-08 22:11:45 -07002798
2799
def is_boot_from_usb(self):
    """Check if DUT is boot from USB.

    Runs 'rootdev -s -d' on the host, then reads the 'removable' sysfs
    attribute of the reported block device.

    @return: True if that attribute reads 1, False otherwise.
    """
    root_device = self.run('rootdev -s -d').stdout.strip()
    block_name = os.path.basename(root_device)
    removable_cmd = 'cat /sys/block/%s/removable' % block_name
    removable_flag = self.run(removable_cmd).stdout.strip()
    return int(removable_flag) == 1
Helen Zhang17dae2b2014-11-11 09:25:52 -08002809
2810
def read_from_meminfo(self, key):
    """Return the memory info from /proc/meminfo

    Greps /proc/meminfo on the host for key and parses the first run of
    digits found in the output.

    @param key: meminfo requested

    @return the first number in the matching output, as an int

    """
    grep_result = self.run('grep %s /proc/meminfo' % key)
    matched_text = grep_result.stdout.strip()
    logging.debug('%s', matched_text)
    first_number = re.search(r'\d+', matched_text)
    return int(first_number.group(0))