blob: 624d49a1b7b3a13d4dc76a7caded8431bc6b5a8e [file] [log] [blame]
J. Richard Barnette24adbf42012-04-11 15:04:53 -07001# Copyright (c) 2012 The Chromium OS Authors. All rights reserved.
Dale Curtisaa5eedb2011-08-23 16:18:52 -07002# Use of this source code is governed by a BSD-style license that can be
3# found in the LICENSE file.
4
mussa584b4462014-06-20 15:13:28 -07005import ConfigParser
Aviv Keshet74c89a92013-02-04 15:18:30 -08006import functools
Christopher Wiley0ed712b2013-04-09 15:25:12 -07007import httplib
J. Richard Barnette1d78b012012-05-15 13:56:30 -07008import logging
Dan Shi0f466e82013-02-22 15:44:58 -08009import os
Simran Basid5e5e272012-09-24 15:23:59 -070010import re
Christopher Wileyd78249a2013-03-01 13:05:31 -080011import socket
J. Richard Barnette1d78b012012-05-15 13:56:30 -070012import subprocess
J. Richard Barnette134ec2c2012-04-25 12:59:37 -070013import time
J. Richard Barnette1d78b012012-05-15 13:56:30 -070014import xmlrpclib
J. Richard Barnette134ec2c2012-04-25 12:59:37 -070015
mussa584b4462014-06-20 15:13:28 -070016import common
J. Richard Barnette45e93de2012-04-11 17:24:15 -070017from autotest_lib.client.bin import utils
Dan Shi9cb0eec2014-06-03 09:04:50 -070018from autotest_lib.client.common_lib import autotemp
Richard Barnette0c73ffc2012-11-19 15:21:18 -080019from autotest_lib.client.common_lib import error
20from autotest_lib.client.common_lib import global_config
Dan Shi549fb822015-03-24 18:01:11 -070021from autotest_lib.client.common_lib import lsbrelease_utils
J. Richard Barnette45e93de2012-04-11 17:24:15 -070022from autotest_lib.client.common_lib.cros import autoupdater
Richard Barnette03a0c132012-11-05 12:40:35 -080023from autotest_lib.client.common_lib.cros import dev_server
Christopher Wileyd78249a2013-03-01 13:05:31 -080024from autotest_lib.client.common_lib.cros import retry
Gabe Blackb72f4fb2015-01-20 16:47:13 -080025from autotest_lib.client.common_lib.cros.graphite import autotest_es
Gabe Black1e1c41b2015-02-04 23:55:15 -080026from autotest_lib.client.common_lib.cros.graphite import autotest_stats
MK Ryu35d661e2014-09-25 17:44:10 -070027from autotest_lib.client.cros import constants as client_constants
J. Richard Barnette84890bd2014-02-21 11:05:47 -080028from autotest_lib.client.cros import cros_ui
Cheng-Yi Chiangf4104ff2014-12-23 19:39:01 +080029from autotest_lib.client.cros.audio import cras_utils
Katherine Threlkeldab83d392015-06-18 16:45:57 -070030from autotest_lib.client.cros.input_playback import input_playback
MK Ryu35d661e2014-09-25 17:44:10 -070031from autotest_lib.server import autoserv_parser
32from autotest_lib.server import autotest
33from autotest_lib.server import constants
34from autotest_lib.server import crashcollect
Dan Shia1ecd5c2013-06-06 11:21:31 -070035from autotest_lib.server import utils as server_utils
Dan Shi9cb0eec2014-06-03 09:04:50 -070036from autotest_lib.server.cros import provision
Scott Zawalski89c44dd2013-02-26 09:28:02 -050037from autotest_lib.server.cros.dynamic_suite import constants as ds_constants
Simran Basi5e6339a2013-03-21 11:34:32 -070038from autotest_lib.server.cros.dynamic_suite import tools, frontend_wrappers
Dan Shi9cb0eec2014-06-03 09:04:50 -070039from autotest_lib.server.cros.faft.config.config import Config as FAFTConfig
Fang Deng96667ca2013-08-01 17:46:18 -070040from autotest_lib.server.hosts import abstract_ssh
Tom Wai-Hong Tamefe1c7f2014-01-02 14:00:11 +080041from autotest_lib.server.hosts import chameleon_host
Fang Deng5d518f42013-08-02 14:04:32 -070042from autotest_lib.server.hosts import servo_host
Simran Basidcff4252012-11-20 16:13:20 -080043from autotest_lib.site_utils.rpm_control_system import rpm_client
Simran Basid5e5e272012-09-24 15:23:59 -070044
45
beeps32a63082013-08-22 14:02:29 -070046try:
47 import jsonrpclib
48except ImportError:
49 jsonrpclib = None
Fang Deng96667ca2013-08-01 17:46:18 -070050
Fang Dengd1c2b732013-08-20 12:59:46 -070051
class FactoryImageCheckerException(error.AutoservError):
    """Exception raised when an image is a factory image."""
55
56
def add_label_detector(label_function_list, label_list=None, label=None):
    """Build a decorator that registers label detection functions.

    The returned decorator appends the decorated function to
    `label_function_list` and hands the function back unchanged.  When
    both a truthy `label` and a `label_list` are supplied, `label` is
    appended to `label_list` as well.

    @param label_function_list: List of label detecting functions to add
                                decorated function to.
    @param label_list: List of detectable labels to add detectable labels to.
                       (Default: None)
    @param label: Label string that is detectable by this detection function
                  (Default: None)
    """
    def _register(detector):
        """
        @param detector: The function to be added as a detector.
        """
        label_function_list.append(detector)
        if not label or label_list is None:
            # Nothing to advertise for this detector.
            return detector
        label_list.append(label)
        return detector
    return _register
75
76
class CrosHost(abstract_ssh.AbstractSSHHost):
    """Chromium OS specific subclass of Host.

    The class-level constants below hold the timeouts, power-control
    method names, RPC settings and file locations shared by the methods
    of this class.
    """

    _parser = autoserv_parser.autoserv_parser
    _AFE = frontend_wrappers.RetryingAFE(timeout_min=5, delay_sec=10)

    # Timeout values (in seconds) associated with various Chrome OS
    # state changes.
    #
    # In general, a good rule of thumb is that the timeout can be up
    # to twice the typical measured value on the slowest platform.
    # The times here have not necessarily been empirically tested to
    # meet this criterion.
    #
    # SLEEP_TIMEOUT:  Time to allow for suspend to memory.
    # RESUME_TIMEOUT: Time to allow for resume after suspend, plus
    #   time to restart the network.
    # SHUTDOWN_TIMEOUT: Time to allow for shut down.
    # BOOT_TIMEOUT: Time to allow for boot from power off.  Among
    #   other things, this must account for the 30 second dev-mode
    #   screen delay and time to start the network.
    # USB_BOOT_TIMEOUT: Time to allow for boot from a USB device,
    #   including the 30 second dev-mode delay and time to start the
    #   network.
    # INSTALL_TIMEOUT: Time to allow for chromeos-install.
    # POWERWASH_BOOT_TIMEOUT: Time to allow for a reboot that
    #   includes powerwash.

    SLEEP_TIMEOUT = 2
    RESUME_TIMEOUT = 10
    SHUTDOWN_TIMEOUT = 10
    BOOT_TIMEOUT = 60
    USB_BOOT_TIMEOUT = 150
    INSTALL_TIMEOUT = 480
    POWERWASH_BOOT_TIMEOUT = 60

    # Minimum OS version that supports server side packaging. Older builds may
    # not have server side package built or with Autotest code change to support
    # server-side packaging.
    MIN_VERSION_SUPPORT_SSP = global_config.global_config.get_config_value(
            'AUTOSERV', 'min_version_support_ssp', type=int)

    # REBOOT_TIMEOUT: How long to wait for a reboot.
    #
    # We have a long timeout to ensure we don't flakily fail due to other
    # issues. Shorter timeouts are vetted in platform_RebootAfterUpdate.
    # TODO(sbasi - crbug.com/276094) Restore to 5 mins once the 'host did not
    # return from reboot' bug is solved.
    REBOOT_TIMEOUT = 480

    # _USB_POWER_TIMEOUT: Time to allow for USB to power toggle ON and OFF.
    # _POWER_CYCLE_TIMEOUT: Time to allow for manual power cycle.
    _USB_POWER_TIMEOUT = 5
    _POWER_CYCLE_TIMEOUT = 10

    _RPC_PROXY_URL = 'http://localhost:%d'
    _RPC_SHUTDOWN_POLLING_PERIOD_SECONDS = 2
    # Set shutdown timeout to account for the time for restarting the UI.
    _RPC_SHUTDOWN_TIMEOUT_SECONDS = cros_ui.RESTART_UI_TIMEOUT

    _RPM_RECOVERY_BOARDS = global_config.global_config.get_config_value('CROS',
            'rpm_recovery_boards', type=str).split(',')

    _MAX_POWER_CYCLE_ATTEMPTS = 6
    _LAB_MACHINE_FILE = '/mnt/stateful_partition/.labmachine'
    # Raw strings keep the regex escapes (\d) out of Python's own string
    # escape processing; the resulting pattern text is unchanged.
    _RPM_HOSTNAME_REGEX = (r'chromeos(\d+)(-row(\d+))?-rack(\d+[a-z]*)'
                           r'-host(\d+)')
    _LIGHTSENSOR_FILES = [ "in_illuminance0_input",
                           "in_illuminance_input",
                           "in_illuminance0_raw",
                           "in_illuminance_raw",
                           "illuminance0_input"]
    _LIGHTSENSOR_SEARCH_DIR = '/sys/bus/iio/devices'
    _LABEL_FUNCTIONS = []
    _DETECTABLE_LABELS = []
    label_decorator = functools.partial(add_label_detector, _LABEL_FUNCTIONS,
                                        _DETECTABLE_LABELS)

    # Constants used in ping_wait_up() and ping_wait_down().
    #
    # _PING_WAIT_COUNT is the approximate number of polling
    # cycles to use when waiting for a host state change.
    #
    # _PING_STATUS_DOWN and _PING_STATUS_UP are names used
    # for arguments to the internal _ping_wait_for_status()
    # method.
    _PING_WAIT_COUNT = 40
    _PING_STATUS_DOWN = False
    _PING_STATUS_UP = True

    # Allowed values for the power_method argument.

    # POWER_CONTROL_RPM: Passed as default arg for power_off/on/cycle() methods.
    # POWER_CONTROL_SERVO: Used in set_power() and power_cycle() methods.
    # POWER_CONTROL_MANUAL: Used in set_power() and power_cycle() methods.
    POWER_CONTROL_RPM = 'RPM'
    POWER_CONTROL_SERVO = 'servoj10'
    POWER_CONTROL_MANUAL = 'manual'

    POWER_CONTROL_VALID_ARGS = (POWER_CONTROL_RPM,
                                POWER_CONTROL_SERVO,
                                POWER_CONTROL_MANUAL)

    _RPM_OUTLET_CHANGED = 'outlet_changed'

    # URL pattern to download firmware image.
    _FW_IMAGE_URL_PATTERN = global_config.global_config.get_config_value(
            'CROS', 'firmware_url_pattern', type=str)

    # File that has a list of directories to be collected
    _LOGS_TO_COLLECT_FILE = os.path.join(
            common.client_dir, 'common_lib', 'logs_to_collect')

    # Prefix of logging message w.r.t. crash collection
    _CRASHLOGS_PREFIX = 'collect_crashlogs'

    # Time duration waiting for host up/down check
    _CHECK_HOST_UP_TIMEOUT_SECS = 15

    # A command that interacts with kernel and hardware (e.g., rm, mkdir, etc)
    # might not be completely done deep through the hardware when the machine
    # is powered down right after the command returns.
    # We should wait for a few seconds to make them done. Fingers crossed.
    _SAFE_WAIT_SECS = 10
201
202
J. Richard Barnette964fba02012-10-24 17:34:29 -0700203 @staticmethod
beeps46dadc92013-11-07 14:07:10 -0800204 def check_host(host, timeout=10):
205 """
206 Check if the given host is a chrome-os host.
207
208 @param host: An ssh host representing a device.
209 @param timeout: The timeout for the run command.
210
211 @return: True if the host device is chromeos.
212
beeps46dadc92013-11-07 14:07:10 -0800213 """
214 try:
Simran Basi933c8af2015-04-29 14:05:07 -0700215 result = host.run(
216 'grep -q CHROMEOS /etc/lsb-release && '
217 '! test -f /mnt/stateful_partition/.android_tester && '
218 '! grep -q moblab /etc/lsb-release',
219 ignore_status=True, timeout=timeout)
beeps46dadc92013-11-07 14:07:10 -0800220 except (error.AutoservRunError, error.AutoservSSHTimeout):
221 return False
222 return result.exit_status == 0
223
224
225 @staticmethod
Tom Wai-Hong Tamefe1c7f2014-01-02 14:00:11 +0800226 def _extract_arguments(args_dict, key_subset):
227 """Extract options from `args_dict` and return a subset result.
J. Richard Barnette7214e0b2013-02-06 15:20:49 -0800228
229 Take the provided dictionary of argument options and return
Tom Wai-Hong Tamefe1c7f2014-01-02 14:00:11 +0800230 a subset that represent standard arguments needed to construct
231 a test-assistant object (chameleon or servo) for a host. The
232 intent is to provide standard argument processing from
Christopher Wiley644ef3e2015-05-15 13:14:14 -0700233 CrosHost for tests that require a test-assistant board
Tom Wai-Hong Tamefe1c7f2014-01-02 14:00:11 +0800234 to operate.
235
236 @param args_dict Dictionary from which to extract the arguments.
237 @param key_subset Tuple of keys to extract from the args_dict, e.g.
238 ('servo_host', 'servo_port').
239 """
240 result = {}
241 for arg in key_subset:
242 if arg in args_dict:
243 result[arg] = args_dict[arg]
244 return result
245
246
247 @staticmethod
248 def get_chameleon_arguments(args_dict):
249 """Extract chameleon options from `args_dict` and return the result.
250
251 Recommended usage:
252 ~~~~~~~~
253 args_dict = utils.args_to_dict(args)
254 chameleon_args = hosts.CrosHost.get_chameleon_arguments(args_dict)
255 host = hosts.create_host(machine, chameleon_args=chameleon_args)
256 ~~~~~~~~
257
258 @param args_dict Dictionary from which to extract the chameleon
259 arguments.
260 """
261 return CrosHost._extract_arguments(
262 args_dict, ('chameleon_host', 'chameleon_port'))
263
264
265 @staticmethod
266 def get_servo_arguments(args_dict):
267 """Extract servo options from `args_dict` and return the result.
J. Richard Barnette7214e0b2013-02-06 15:20:49 -0800268
269 Recommended usage:
270 ~~~~~~~~
271 args_dict = utils.args_to_dict(args)
Fang Deng0ca40e22013-08-27 17:47:44 -0700272 servo_args = hosts.CrosHost.get_servo_arguments(args_dict)
J. Richard Barnette7214e0b2013-02-06 15:20:49 -0800273 host = hosts.create_host(machine, servo_args=servo_args)
274 ~~~~~~~~
275
276 @param args_dict Dictionary from which to extract the servo
277 arguments.
278 """
Tom Wai-Hong Tamefe1c7f2014-01-02 14:00:11 +0800279 return CrosHost._extract_arguments(
280 args_dict, ('servo_host', 'servo_port'))
J. Richard Barnette134ec2c2012-04-25 12:59:37 -0700281
J. Richard Barnette964fba02012-10-24 17:34:29 -0700282
Tom Wai-Hong Tamefe1c7f2014-01-02 14:00:11 +0800283 def _initialize(self, hostname, chameleon_args=None, servo_args=None,
Fang Denge545abb2014-12-30 18:43:47 -0800284 try_lab_servo=False, ssh_verbosity_flag='', ssh_options='',
Fang Dengd1c2b732013-08-20 12:59:46 -0700285 *args, **dargs):
Tom Wai-Hong Tamefe1c7f2014-01-02 14:00:11 +0800286 """Initialize superclasses, |self.chameleon|, and |self.servo|.
J. Richard Barnette67ccb872012-04-19 16:34:56 -0700287
Fang Denge545abb2014-12-30 18:43:47 -0800288 This method will attempt to create the test-assistant object
289 (chameleon/servo) when it is needed by the test. Check
290 the docstring of chameleon_host.create_chameleon_host and
291 servo_host.create_servo_host for how this is determined.
Fang Deng5d518f42013-08-02 14:04:32 -0700292
Fang Denge545abb2014-12-30 18:43:47 -0800293 @param hostname: Hostname of the dut.
294 @param chameleon_args: A dictionary that contains args for creating
295 a ChameleonHost. See chameleon_host for details.
296 @param servo_args: A dictionary that contains args for creating
297 a ServoHost object. See servo_host for details.
298 @param try_lab_servo: Boolean, False indicates that ServoHost should
299 not be created for a device in Cros test lab.
300 See servo_host for details.
301 @param ssh_verbosity_flag: String, to pass to the ssh command to control
302 verbosity.
303 @param ssh_options: String, other ssh options to pass to the ssh
304 command.
J. Richard Barnette67ccb872012-04-19 16:34:56 -0700305 """
Fang Deng0ca40e22013-08-27 17:47:44 -0700306 super(CrosHost, self)._initialize(hostname=hostname,
J. Richard Barnette45e93de2012-04-11 17:24:15 -0700307 *args, **dargs)
J. Richard Barnettef0859852012-08-20 14:55:50 -0700308 # self.env is a dictionary of environment variable settings
309 # to be exported for commands run on the host.
310 # LIBC_FATAL_STDERR_ can be useful for diagnosing certain
311 # errors that might happen.
312 self.env['LIBC_FATAL_STDERR_'] = '1'
beeps32a63082013-08-22 14:02:29 -0700313 self._rpc_proxy_map = {}
Fang Dengd1c2b732013-08-20 12:59:46 -0700314 self._ssh_verbosity_flag = ssh_verbosity_flag
Aviv Keshetc5947fa2013-09-04 14:06:29 -0700315 self._ssh_options = ssh_options
Fang Deng5d518f42013-08-02 14:04:32 -0700316 # TODO(fdeng): We need to simplify the
317 # process of servo and servo_host initialization.
318 # crbug.com/298432
Fang Denge545abb2014-12-30 18:43:47 -0800319 self._servo_host = servo_host.create_servo_host(
320 dut=self.hostname, servo_args=servo_args,
321 try_lab_servo=try_lab_servo)
Tom Wai-Hong Tamefe1c7f2014-01-02 14:00:11 +0800322 # TODO(waihong): Do the simplication on Chameleon too.
Tom Wai-Hong Tam3d6790d2014-04-14 16:15:47 +0800323 self._chameleon_host = chameleon_host.create_chameleon_host(
324 dut=self.hostname, chameleon_args=chameleon_args)
325
Dan Shi4d478522014-02-14 13:46:32 -0800326 if self._servo_host is not None:
327 self.servo = self._servo_host.get_servo()
328 else:
329 self.servo = None
330
Tom Wai-Hong Tam3d6790d2014-04-14 16:15:47 +0800331 if self._chameleon_host:
Tom Wai-Hong Tameaee3402014-01-22 08:52:10 +0800332 self.chameleon = self._chameleon_host.create_chameleon_board()
Tom Wai-Hong Tamefe1c7f2014-01-02 14:00:11 +0800333 else:
Tom Wai-Hong Tam3d6790d2014-04-14 16:15:47 +0800334 self.chameleon = None
Fang Deng5d518f42013-08-02 14:04:32 -0700335
336
Scott Zawalski89c44dd2013-02-26 09:28:02 -0500337 def get_repair_image_name(self):
338 """Generate a image_name from variables in the global config.
339
340 @returns a str of $board-version/$BUILD.
341
342 """
Scott Zawalski89c44dd2013-02-26 09:28:02 -0500343 board = self._get_board_from_afe()
344 if board is None:
345 raise error.AutoservError('DUT has no board attribute, '
346 'cannot be repaired.')
Dan Shi6964fa52014-12-18 11:04:27 -0800347 stable_version = self._AFE.run('get_stable_version', board=board)
348 build_pattern = global_config.global_config.get_config_value(
349 'CROS', 'stable_build_pattern')
Scott Zawalski89c44dd2013-02-26 09:28:02 -0500350 return build_pattern % (board, stable_version)
351
352
Scott Zawalski62bacae2013-03-05 10:40:32 -0500353 def _host_in_AFE(self):
354 """Check if the host is an object the AFE knows.
355
356 @returns the host object.
357 """
358 return self._AFE.get_hosts(hostname=self.hostname)
359
360
Chris Sosab76e0ee2013-05-22 16:55:41 -0700361 def lookup_job_repo_url(self):
362 """Looks up the job_repo_url for the host.
363
364 @returns job_repo_url from AFE or None if not found.
365
366 @raises KeyError if the host does not have a job_repo_url
367 """
368 if not self._host_in_AFE():
369 return None
370
371 hosts = self._AFE.get_hosts(hostname=self.hostname)
beepsb5efc532013-06-04 11:29:34 -0700372 if hosts and ds_constants.JOB_REPO_URL in hosts[0].attributes:
373 return hosts[0].attributes[ds_constants.JOB_REPO_URL]
Chris Sosab76e0ee2013-05-22 16:55:41 -0700374
375
Scott Zawalski89c44dd2013-02-26 09:28:02 -0500376 def clear_cros_version_labels_and_job_repo_url(self):
377 """Clear cros_version labels and host attribute job_repo_url."""
Scott Zawalski62bacae2013-03-05 10:40:32 -0500378 if not self._host_in_AFE():
Scott Zawalskieadbf702013-03-14 09:23:06 -0400379 return
380
Scott Zawalski62bacae2013-03-05 10:40:32 -0500381 host_list = [self.hostname]
382 labels = self._AFE.get_labels(
383 name__startswith=ds_constants.VERSION_PREFIX,
384 host__hostname=self.hostname)
Dan Shi0f466e82013-02-22 15:44:58 -0800385
Scott Zawalski62bacae2013-03-05 10:40:32 -0500386 for label in labels:
387 label.remove_hosts(hosts=host_list)
Scott Zawalski89c44dd2013-02-26 09:28:02 -0500388
beepscb6f1e22013-06-28 19:14:10 -0700389 self.update_job_repo_url(None, None)
390
391
392 def update_job_repo_url(self, devserver_url, image_name):
393 """
394 Updates the job_repo_url host attribute and asserts it's value.
395
396 @param devserver_url: The devserver to use in the job_repo_url.
397 @param image_name: The name of the image to use in the job_repo_url.
398
399 @raises AutoservError: If we failed to update the job_repo_url.
400 """
401 repo_url = None
402 if devserver_url and image_name:
403 repo_url = tools.get_package_url(devserver_url, image_name)
404 self._AFE.set_host_attribute(ds_constants.JOB_REPO_URL, repo_url,
Scott Zawalski62bacae2013-03-05 10:40:32 -0500405 hostname=self.hostname)
beepscb6f1e22013-06-28 19:14:10 -0700406 if self.lookup_job_repo_url() != repo_url:
407 raise error.AutoservError('Failed to update job_repo_url with %s, '
408 'host %s' % (repo_url, self.hostname))
Scott Zawalski89c44dd2013-02-26 09:28:02 -0500409
410
Dan Shie9309262013-06-19 22:50:21 -0700411 def add_cros_version_labels_and_job_repo_url(self, image_name):
Scott Zawalskieadbf702013-03-14 09:23:06 -0400412 """Add cros_version labels and host attribute job_repo_url.
413
414 @param image_name: The name of the image e.g.
415 lumpy-release/R27-3837.0.0
Dan Shi7458bf62013-06-10 12:50:16 -0700416
Scott Zawalskieadbf702013-03-14 09:23:06 -0400417 """
Scott Zawalski62bacae2013-03-05 10:40:32 -0500418 if not self._host_in_AFE():
Scott Zawalskieadbf702013-03-14 09:23:06 -0400419 return
Scott Zawalski62bacae2013-03-05 10:40:32 -0500420
Scott Zawalskieadbf702013-03-14 09:23:06 -0400421 cros_label = '%s%s' % (ds_constants.VERSION_PREFIX, image_name)
Dan Shie9309262013-06-19 22:50:21 -0700422 devserver_url = dev_server.ImageServer.resolve(image_name).url()
Scott Zawalski62bacae2013-03-05 10:40:32 -0500423
424 labels = self._AFE.get_labels(name=cros_label)
425 if labels:
426 label = labels[0]
427 else:
428 label = self._AFE.create_label(name=cros_label)
429
430 label.add_hosts([self.hostname])
beepscb6f1e22013-06-28 19:14:10 -0700431 self.update_job_repo_url(devserver_url, image_name)
432
433
beepsdae65fd2013-07-26 16:24:41 -0700434 def verify_job_repo_url(self, tag=''):
beepscb6f1e22013-06-28 19:14:10 -0700435 """
436 Make sure job_repo_url of this host is valid.
437
joychen03eaad92013-06-26 09:55:21 -0700438 Eg: The job_repo_url "http://lmn.cd.ab.xyx:8080/static/\
beepscb6f1e22013-06-28 19:14:10 -0700439 lumpy-release/R29-4279.0.0/autotest/packages" claims to have the
440 autotest package for lumpy-release/R29-4279.0.0. If this isn't the case,
441 download and extract it. If the devserver embedded in the url is
442 unresponsive, update the job_repo_url of the host after staging it on
443 another devserver.
444
445 @param job_repo_url: A url pointing to the devserver where the autotest
446 package for this build should be staged.
beepsdae65fd2013-07-26 16:24:41 -0700447 @param tag: The tag from the server job, in the format
448 <job_id>-<user>/<hostname>, or <hostless> for a server job.
beepscb6f1e22013-06-28 19:14:10 -0700449
450 @raises DevServerException: If we could not resolve a devserver.
451 @raises AutoservError: If we're unable to save the new job_repo_url as
452 a result of choosing a new devserver because the old one failed to
453 respond to a health check.
beeps0c865032013-07-30 11:37:06 -0700454 @raises urllib2.URLError: If the devserver embedded in job_repo_url
455 doesn't respond within the timeout.
beepscb6f1e22013-06-28 19:14:10 -0700456 """
457 job_repo_url = self.lookup_job_repo_url()
458 if not job_repo_url:
459 logging.warning('No job repo url set on host %s', self.hostname)
460 return
461
462 logging.info('Verifying job repo url %s', job_repo_url)
463 devserver_url, image_name = tools.get_devserver_build_from_package_url(
464 job_repo_url)
465
beeps0c865032013-07-30 11:37:06 -0700466 ds = dev_server.ImageServer(devserver_url)
beepscb6f1e22013-06-28 19:14:10 -0700467
468 logging.info('Staging autotest artifacts for %s on devserver %s',
469 image_name, ds.url())
beeps687243d2013-07-18 15:29:27 -0700470
471 start_time = time.time()
Simran Basi25e7a922014-10-31 11:56:10 -0700472 ds.stage_artifacts(image_name, ['autotest_packages'])
beeps687243d2013-07-18 15:29:27 -0700473 stage_time = time.time() - start_time
474
475 # Record how much of the verification time comes from a devserver
476 # restage. If we're doing things right we should not see multiple
477 # devservers for a given board/build/branch path.
478 try:
J. Richard Barnette3cbd76b2013-11-27 12:11:25 -0800479 board, build_type, branch = server_utils.ParseBuildName(
beeps687243d2013-07-18 15:29:27 -0700480 image_name)[:3]
J. Richard Barnette3cbd76b2013-11-27 12:11:25 -0800481 except server_utils.ParseBuildNameException:
beeps687243d2013-07-18 15:29:27 -0700482 pass
483 else:
beeps0c865032013-07-30 11:37:06 -0700484 devserver = devserver_url[
Chris Sosa65425082013-10-16 13:26:22 -0700485 devserver_url.find('/') + 2:devserver_url.rfind(':')]
beeps687243d2013-07-18 15:29:27 -0700486 stats_key = {
487 'board': board,
488 'build_type': build_type,
489 'branch': branch,
beeps0c865032013-07-30 11:37:06 -0700490 'devserver': devserver.replace('.', '_'),
beeps687243d2013-07-18 15:29:27 -0700491 }
Gabe Black1e1c41b2015-02-04 23:55:15 -0800492 autotest_stats.Gauge('verify_job_repo_url').send(
beeps687243d2013-07-18 15:29:27 -0700493 '%(board)s.%(build_type)s.%(branch)s.%(devserver)s' % stats_key,
494 stage_time)
beepscb6f1e22013-06-28 19:14:10 -0700495
Scott Zawalskieadbf702013-03-14 09:23:06 -0400496
Dan Shicf4d2032015-03-12 15:04:21 -0700497 def stage_server_side_package(self, image=None):
498 """Stage autotest server-side package on devserver.
499
500 @param image: Full path of an OS image to install or a build name.
501
502 @return: A url to the autotest server-side package.
503 """
504 if image:
505 image_name = tools.get_build_from_image(image)
506 if not image_name:
507 raise error.AutoservError(
508 'Failed to parse build name from %s' % image)
509 ds = dev_server.ImageServer.resolve(image_name)
510 else:
511 job_repo_url = self.lookup_job_repo_url()
512 if job_repo_url:
513 devserver_url, image_name = (
514 tools.get_devserver_build_from_package_url(job_repo_url))
515 ds = dev_server.ImageServer(devserver_url)
516 else:
517 labels = self._AFE.get_labels(
518 name__startswith=ds_constants.VERSION_PREFIX,
519 host__hostname=self.hostname)
520 if not labels:
521 raise error.AutoservError(
522 'Failed to stage server-side package. The host has '
523 'no job_report_url attribute or version label.')
524 image_name = labels[0].name[len(ds_constants.VERSION_PREFIX):]
525 ds = dev_server.ImageServer.resolve(image_name)
Dan Shica503482015-03-30 17:23:25 -0700526
527 # Get the OS version of the build, for any build older than
528 # MIN_VERSION_SUPPORT_SSP, server side packaging is not supported.
529 match = re.match('.*/R\d+-(\d+)\.', image_name)
530 if match and int(match.group(1)) < self.MIN_VERSION_SUPPORT_SSP:
531 logging.warn('Build %s is older than %s. Server side packaging is '
532 'disabled.', image_name, self.MIN_VERSION_SUPPORT_SSP)
533 return None
534
Dan Shicf4d2032015-03-12 15:04:21 -0700535 ds.stage_artifacts(image_name, ['autotest_server_package'])
536 return '%s/static/%s/%s' % (ds.url(), image_name,
537 'autotest_server_package.tar.bz2')
538
539
Dan Shi0f466e82013-02-22 15:44:58 -0800540 def _try_stateful_update(self, update_url, force_update, updater):
541 """Try to use stateful update to initialize DUT.
542
543 When DUT is already running the same version that machine_install
544 tries to install, stateful update is a much faster way to clean up
545 the DUT for testing, compared to a full reimage. It is implemeted
546 by calling autoupdater.run_update, but skipping updating root, as
547 updating the kernel is time consuming and not necessary.
548
549 @param update_url: url of the image.
550 @param force_update: Set to True to update the image even if the DUT
551 is running the same version.
552 @param updater: ChromiumOSUpdater instance used to update the DUT.
553 @returns: True if the DUT was updated with stateful update.
554
555 """
J. Richard Barnette3f731032014-04-07 17:42:59 -0700556 # TODO(jrbarnette): Yes, I hate this re.match() test case.
557 # It's better than the alternative: see crbug.com/360944.
558 image_name = autoupdater.url_to_image_name(update_url)
559 release_pattern = r'^.*-release/R[0-9]+-[0-9]+\.[0-9]+\.0$'
560 if not re.match(release_pattern, image_name):
561 return False
Dan Shi0f466e82013-02-22 15:44:58 -0800562 if not updater.check_version():
563 return False
564 if not force_update:
565 logging.info('Canceling stateful update because the new and '
566 'old versions are the same.')
567 return False
568 # Following folders should be rebuilt after stateful update.
569 # A test file is used to confirm each folder gets rebuilt after
570 # the stateful update.
571 folders_to_check = ['/var', '/home', '/mnt/stateful_partition']
572 test_file = '.test_file_to_be_deleted'
573 for folder in folders_to_check:
574 touch_path = os.path.join(folder, test_file)
575 self.run('touch %s' % touch_path)
576
Chris Sosae92399e2015-04-24 11:32:59 -0700577 updater.run_update(update_root=False)
Dan Shi0f466e82013-02-22 15:44:58 -0800578
579 # Reboot to complete stateful update.
Chris Sosab76e0ee2013-05-22 16:55:41 -0700580 self.reboot(timeout=self.REBOOT_TIMEOUT, wait=True)
Dan Shi0f466e82013-02-22 15:44:58 -0800581 check_file_cmd = 'test -f %s; echo $?'
582 for folder in folders_to_check:
583 test_file_path = os.path.join(folder, test_file)
584 result = self.run(check_file_cmd % test_file_path,
585 ignore_status=True)
586 if result.exit_status == 1:
587 return False
588 return True
589
590
J. Richard Barnette7275b612013-06-04 18:13:11 -0700591 def _post_update_processing(self, updater, expected_kernel=None):
Dan Shi0f466e82013-02-22 15:44:58 -0800592 """After the DUT is updated, confirm machine_install succeeded.
593
594 @param updater: ChromiumOSUpdater instance used to update the DUT.
J. Richard Barnette7275b612013-06-04 18:13:11 -0700595 @param expected_kernel: kernel expected to be active after reboot,
596 or `None` to skip rollback checking.
Dan Shi0f466e82013-02-22 15:44:58 -0800597
598 """
J. Richard Barnette7275b612013-06-04 18:13:11 -0700599 # Touch the lab machine file to leave a marker that
600 # distinguishes this image from other test images.
601 # Afterwards, we must re-run the autoreboot script because
602 # it depends on the _LAB_MACHINE_FILE.
Dan Shi0f466e82013-02-22 15:44:58 -0800603 self.run('touch %s' % self._LAB_MACHINE_FILE)
Dan Shi0f466e82013-02-22 15:44:58 -0800604 self.run('start autoreboot')
Chris Sosa65425082013-10-16 13:26:22 -0700605 updater.verify_boot_expectations(
606 expected_kernel, rollback_message=
607 'Build %s failed to boot on %s; system rolled back to previous'
608 'build' % (updater.update_version, self.hostname))
J. Richard Barnette7275b612013-06-04 18:13:11 -0700609 # Check that we've got the build we meant to install.
610 if not updater.check_version_to_confirm_install():
611 raise autoupdater.ChromiumOSError(
612 'Failed to update %s to build %s; found build '
613 '%s instead' % (self.hostname,
Chris Sosa65425082013-10-16 13:26:22 -0700614 updater.update_version,
Dan Shi0942b1d2015-03-31 11:07:00 -0700615 self.get_release_version()))
Dan Shi0f466e82013-02-22 15:44:58 -0800616
Chris Sosae92399e2015-04-24 11:32:59 -0700617 logging.debug('Cleaning up old autotest directories.')
618 try:
619 installed_autodir = autotest.Autotest.get_installed_autodir(self)
620 self.run('rm -rf ' + installed_autodir)
621 except autotest.AutodirNotFoundError:
622 logging.debug('No autotest installed directory found.')
623
Dan Shi0f466e82013-02-22 15:44:58 -0800624
def _stage_image_for_update(self, image_name=None):
    """Stage a build on a devserver for auto-update.

    The devserver is resolved from the build name and asked to start
    downloading the build without waiting for completion
    (`synchronous=False`).

    @param image_name: a name like lumpy-release/R27-3837.0.0; when
            empty or `None`, the repair image name of this host is used.
    @returns a tuple `(update_url, devserver)` where update_url looks
            like:
            http://172.22.50.205:8082/update/lumpy-release/R27-3837.0.0
            and devserver is the instance the build was staged on.
    """
    build = image_name or self.get_repair_image_name()

    logging.info('Staging build for AU: %s', build)
    image_server = dev_server.ImageServer.resolve(build)
    image_server.trigger_download(build, synchronous=False)
    update_url = tools.image_url_pattern() % (image_server.url(), build)
    return update_url, image_server
Scott Zawalskieadbf702013-03-14 09:23:06 -0400641
642
def stage_image_for_servo(self, image_name=None):
    """Stage a test image on a devserver and return its URL.

    @param image_name: a name like lumpy-release/R27-3837.0.0; when
            empty or `None`, the repair image name of this host is used.
    @returns the URL reported by the devserver's
            `get_test_image_url()` for the staged build.
    """
    build = image_name or self.get_repair_image_name()
    logging.info('Staging build for servo install: %s', build)
    image_server = dev_server.ImageServer.resolve(build)
    image_server.stage_artifacts(build, ['test_image'])
    test_image_url = image_server.get_test_image_url(build)
    return test_image_url
656
657
def stage_factory_image_for_servo(self, image_name):
    """Stage a factory image on a devserver and return its URL.

    The artifact to stage is read from the `factory_artifact` entry of
    the CROS section of the autotest global config.

    @param image_name: a name like <board>/4262.204.0

    @return: An update URL, eg:
        http://<devserver>/static/canary-channel/\
        <board>/4262.204.0/factory_test/chromiumos_factory_image.bin
        `None` is returned (after logging an error) when image_name
        is empty.

    @raises: ValueError if the factory artifact name is missing from
             the config.

    """
    if not image_name:
        logging.error('Need an image_name to stage a factory image.')
        return

    artifact_name = global_config.global_config.get_config_value(
            'CROS', 'factory_artifact', type=str, default='')
    if not artifact_name:
        raise ValueError('Cannot retrieve the factory artifact name from '
                         'autotest config, and hence cannot stage factory '
                         'artifacts.')

    logging.info('Staging build for servo install: %s', image_name)
    image_server = dev_server.ImageServer.resolve(image_name)
    image_server.stage_artifacts(
            image_name, [artifact_name], archive_url=None)

    factory_image_url = tools.factory_image_url_pattern() % (
            image_server.url(), image_name)
    return factory_image_url
690
691
def machine_install(self, update_url=None, force_update=False,
                    local_devserver=False, repair=False,
                    force_full_update=False):
    """Install the DUT.

    Use stateful update if the DUT is already running the same build.
    Stateful update does not update kernel and tends to run much faster
    than a full reimage. If the DUT is running a different build, or it
    failed to do a stateful update, full update, including kernel update,
    will be applied to the DUT.

    Once a host enters machine_install its cros_version label will be
    removed as well as its host attribute job_repo_url (used for
    package install).

    When a full update fails and the devserver that staged the build
    looks unhealthy, the build is staged again (which may resolve to a
    different devserver) and the update is retried, up to
    provision.FLAKY_DEVSERVER_ATTEMPTS attempts in total.

    @param update_url: The url to use for the update
            pattern: http://$devserver:###/update/$build
            If update_url is None and repair is True we will install the
            stable image listed in afe_stable_versions table. If the table
            is not setup, global_config value under CROS.stable_cros_version
            will be used instead.
    @param force_update: Force an update even if the version installed
            is the same. Default:False
    @param local_devserver: Used by test_that to allow people to
            use their local devserver. Default: False
    @param repair: Forces update to repair image. Implies force_update.
    @param force_full_update: If True, do not attempt to run stateful
            update, force a full reimage. If False, try stateful update
            first when the dut is already installed with the same version.
    @raises error.AutoservError if there is neither an update URL nor an
            image option to derive one from.
    @raises autoupdater.ChromiumOSError

    """
    devserver = None
    # Build name handed to _stage_image_for_update() when a retry needs
    # to restage. It must be bound on every path: in the repair case it
    # stays None, which makes restaging fall back to the repair image
    # exactly like the initial staging did.
    requested_build = None
    if repair:
        update_url, devserver = self._stage_image_for_update()
        force_update = True

    if not update_url and not self._parser.options.image:
        raise error.AutoservError(
                'There is no update URL, nor a method to get one.')

    if not update_url and self._parser.options.image:
        # This is the base case where we have no given update URL i.e.
        # dynamic suites logic etc. This is the most flexible case where we
        # can serve an update from any of our fleet of devservers.
        requested_build = self._parser.options.image
        if not requested_build.startswith('http://'):
            logging.debug('Update will be staged for this installation')
            update_url, devserver = self._stage_image_for_update(
                    requested_build)
        else:
            update_url = requested_build

    logging.debug('Update URL is %s', update_url)

    # Remove cros-version and job_repo_url host attribute from host.
    self.clear_cros_version_labels_and_job_repo_url()

    update_complete = False
    updater = autoupdater.ChromiumOSUpdater(
            update_url, host=self, local_devserver=local_devserver)
    if not force_full_update:
        try:
            # If the DUT is already running the same build, try stateful
            # update first as it's much quicker than a full re-image.
            update_complete = self._try_stateful_update(
                    update_url, force_update, updater)
        except Exception as e:
            # A failed stateful update is not fatal; fall through to
            # the full update below.
            logging.exception(e)

    inactive_kernel = None
    if update_complete or (not force_update and updater.check_version()):
        logging.info('Install complete without full update')
    else:
        logging.info('DUT requires full update.')
        self.reboot(timeout=self.REBOOT_TIMEOUT, wait=True)
        num_of_attempts = provision.FLAKY_DEVSERVER_ATTEMPTS

        while num_of_attempts > 0:
            num_of_attempts -= 1
            try:
                updater.run_update()
            except Exception:
                logging.warning('Autoupdate did not complete.')
                # Do additional check for the devserver health. Ideally,
                # the autoupdater.py could raise an exception when it
                # detected network flake but that would require
                # instrumenting the update engine and parsing it log.
                if (num_of_attempts <= 0 or
                        devserver is None or
                        dev_server.DevServer.devserver_healthy(
                                devserver.url())):
                    raise

                logging.warning('Devserver looks unhealthy. Trying another')
                update_url, devserver = self._stage_image_for_update(
                        requested_build)
                logging.debug('New Update URL is %s', update_url)
                updater = autoupdater.ChromiumOSUpdater(
                        update_url, host=self,
                        local_devserver=local_devserver)
            else:
                break

        # Give it some time in case of IO issues.
        time.sleep(10)

        # Figure out active and inactive kernel.
        active_kernel, inactive_kernel = updater.get_kernel_state()

        # Ensure inactive kernel has higher priority than active.
        if (updater.get_kernel_priority(inactive_kernel)
                < updater.get_kernel_priority(active_kernel)):
            raise autoupdater.ChromiumOSError(
                    'Update failed. The priority of the inactive kernel'
                    ' partition is less than that of the active kernel'
                    ' partition.')

        # Updater has returned successfully; reboot the host.
        self.reboot(timeout=self.REBOOT_TIMEOUT, wait=True)

    self._post_update_processing(updater, inactive_kernel)
    self.add_cros_version_labels_and_job_repo_url(
            autoupdater.url_to_image_name(update_url))
J. Richard Barnette45e93de2012-04-11 17:24:15 -0700816
817
def _clear_fw_version_labels(self):
    """Detach this host from every firmware version label in the AFE.

    Labels are selected by the provision.FW_VERSION_PREFIX name prefix
    and by this host's hostname.
    """
    fw_labels = self._AFE.get_labels(
            name__startswith=provision.FW_VERSION_PREFIX,
            host__hostname=self.hostname)
    for fw_label in fw_labels:
        fw_label.remove_hosts(hosts=[self.hostname])
825
826
def _add_fw_version_label(self, build):
    """Attach the firmware version label for `build` to this host.

    The label name is derived with provision.fw_version_to_label() and
    created first if needed via provision.ensure_label_exists().

    @param build: Build of firmware.

    """
    label_name = provision.fw_version_to_label(build)
    provision.ensure_label_exists(label_name)
    matching_labels = self._AFE.get_labels(name__startswith=label_name)
    # Only the first label returned by the AFE is used.
    matching_labels[0].add_hosts([self.hostname])
837
838
def firmware_install(self, build=None):
    """Install firmware to the DUT through its servo.

    The firmware artifact of `build` is staged on a devserver, the
    firmware tarball is downloaded into a temporary directory with
    wget, and the AP and EC images are extracted from it. The EC is
    programmed first, then the BIOS, and finally the DUT is reset via
    the servo power state controller.

    Once a host enters firmware_install its fw_version label will be
    removed. After the firmware is updated successfully, a new fw_version
    label will be added to the host.

    @param build: The build version to which we want to provision the
                  firmware of the machine,
                  e.g. 'link-firmware/R22-2695.1.144'. When not set,
                  the repair image name of this host is used.

    @raises error.TestError if the host has no servo.

    TODO(dshi): After bug 381718 is fixed, update here with corresponding
                exceptions that could be raised.

    """
    if not self.servo:
        raise error.TestError('Host %s does not have servo.' %
                              self.hostname)

    # TODO(fdeng): use host.get_board() after
    # crbug.com/271834 is fixed.
    board = self._get_board_from_afe()

    # If build is not set, try to install firmware from stable CrOS.
    if not build:
        build = self.get_repair_image_name()

    faft_config = FAFTConfig(board)
    # U-Boot platforms name the AP image after the board; everything
    # else is treated as a Depthcharge platform.
    ap_image = ('image-%s.bin' % board if faft_config.use_u_boot
                else 'image.bin')
    ec_image = 'ec.bin'
    image_server = dev_server.ImageServer.resolve(build)
    image_server.stage_artifacts(build, ['firmware'])

    work_dir = autotemp.tempdir(unique_id='fwimage')
    try:
        tarball_url = self._FW_IMAGE_URL_PATTERN % (image_server.url(),
                                                    build)
        tarball_path = os.path.join(work_dir.name,
                                    os.path.basename(tarball_url))
        server_utils.system('wget -O %s %s' % (tarball_path, tarball_url),
                            timeout=60)
        server_utils.system('tar xf %s -C %s %s %s' %
                            (tarball_path, work_dir.name, ap_image,
                             ec_image),
                            timeout=60)
        # Extracting "dts/*" runs with ignore_status=True, so a failure
        # of this step does not abort the install.
        server_utils.system('tar xf %s --wildcards -C %s "dts/*"' %
                            (tarball_path, work_dir.name),
                            timeout=60, ignore_status=True)

        self._clear_fw_version_labels()
        logging.info('Will re-program EC now')
        ec_path = os.path.join(work_dir.name, ec_image)
        self.servo.program_ec(ec_path)
        logging.info('Will re-program BIOS now')
        ap_path = os.path.join(work_dir.name, ap_image)
        self.servo.program_bios(ap_path)
        self.servo.get_power_state_controller().reset()
        time.sleep(self.servo.BOOT_DELAY)
        self._add_fw_version_label(build)
    finally:
        work_dir.clean()
904
905
def show_update_engine_log(self):
    """Dump the update engine log of the DUT by running `cat` on it."""
    log_path = client_constants.UPDATE_ENGINE_LOG
    logging.debug('Dumping %s', log_path)
    self.run('cat %s' % log_path)
Dan Shi10e992b2013-08-30 11:02:59 -0700910
911
def _get_board_from_afe(self):
    """Look up this host's board through its AFE labels.

    Delegates to server_utils.get_board_from_afe(). Per the original
    documentation, that looks for a host label of the form
    "board:<board>" and yields the "<board>" part, or `None` when
    there is not a single, unique label matching the pattern.

    @returns board from label, or `None`.
    """
    board = server_utils.get_board_from_afe(self.hostname, self._AFE)
    return board
Simran Basi833814b2013-01-29 13:13:43 -0800922
923
def get_build(self):
    """Look up the current build of this Host through its AFE labels.

    Delegates to server_utils.get_build_from_afe().

    @returns The current build or None if it could not find it or if there
             were multiple build labels assigned to this host.
    """
    build = server_utils.get_build_from_afe(self.hostname, self._AFE)
    return build
Richard Barnette82c35912012-11-20 10:09:10 -0800933
934
Scott Zawalski89c44dd2013-02-26 09:28:02 -0500935 def _install_repair(self):
Chris Sosae92399e2015-04-24 11:32:59 -0700936 """Attempt to repair this host using the update-engine.
Scott Zawalski89c44dd2013-02-26 09:28:02 -0500937
938 If the host is up, try installing the DUT with a stable
Dan Shi6964fa52014-12-18 11:04:27 -0800939 "repair" version of Chrome OS as defined in afe_stable_versions table.
940 If the table is not setup, global_config value under
941 CROS.stable_cros_version will be used instead.
Scott Zawalski89c44dd2013-02-26 09:28:02 -0500942
Scott Zawalski62bacae2013-03-05 10:40:32 -0500943 @raises AutoservRepairMethodNA if the DUT is not reachable.
944 @raises ChromiumOSError if the install failed for some reason.
Scott Zawalski89c44dd2013-02-26 09:28:02 -0500945
946 """
947 if not self.is_up():
Scott Zawalski62bacae2013-03-05 10:40:32 -0500948 raise error.AutoservRepairMethodNA('DUT unreachable for install.')
Scott Zawalski89c44dd2013-02-26 09:28:02 -0500949 logging.info('Attempting to reimage machine to repair image.')
950 try:
Richard Barnette0b023a72015-04-24 16:07:30 +0000951 self.machine_install(repair=True)
Fang Dengd0672f32013-03-18 17:18:09 -0700952 except autoupdater.ChromiumOSError as e:
953 logging.exception(e)
Scott Zawalski89c44dd2013-02-26 09:28:02 -0500954 logging.info('Repair via install failed.')
Scott Zawalski62bacae2013-03-05 10:40:32 -0500955 raise
Scott Zawalski89c44dd2013-02-26 09:28:02 -0500956
957
Dan Shi2c88eed2013-11-12 10:18:38 -0800958 def _install_repair_with_powerwash(self):
Dan Shi9cc48452013-11-12 12:39:26 -0800959 """Attempt to powerwash first then repair this host using update-engine.
Dan Shi2c88eed2013-11-12 10:18:38 -0800960
Dan Shi9cc48452013-11-12 12:39:26 -0800961 update-engine may fail due to a bad image. In such case, powerwash
962 may help to cleanup the DUT for update-engine to work again.
Dan Shi2c88eed2013-11-12 10:18:38 -0800963
964 @raises AutoservRepairMethodNA if the DUT is not reachable.
965 @raises ChromiumOSError if the install failed for some reason.
966
967 """
968 if not self.is_up():
969 raise error.AutoservRepairMethodNA('DUT unreachable for install.')
970
971 logging.info('Attempting to powerwash the DUT.')
972 self.run('echo "fast safe" > '
973 '/mnt/stateful_partition/factory_install_reset')
974 self.reboot(timeout=self.POWERWASH_BOOT_TIMEOUT, wait=True)
975 if not self.is_up():
Dan Shi9cc48452013-11-12 12:39:26 -0800976 logging.error('Powerwash failed. DUT did not come back after '
Dan Shi2c88eed2013-11-12 10:18:38 -0800977 'reboot.')
978 raise error.AutoservRepairFailure(
979 'DUT failed to boot from powerwash after %d seconds' %
980 self.POWERWASH_BOOT_TIMEOUT)
981
982 logging.info('Powerwash succeeded.')
983 self._install_repair()
984
985
def servo_install(self, image_url=None, usb_boot_timeout=USB_BOOT_TIMEOUT,
                  install_timeout=INSTALL_TIMEOUT):
    """
    Re-install the OS on the DUT through its servo.

    The steps are:
    1) install a recovery image on the servo (see `image_url`) and wait
       for the DUT to come up from it,
    2) run `chromeos-install --yes` followed by `halt` on the DUT, and
    3) power the DUT off and on via the servo, with the USB key
       switched off, and wait for it to come back up.

    Both the USB boot phase and the install phase are timed with
    autotest_stats timers.

    @param image_url: If specified use as the url to install on the DUT.
            otherwise boot the currently staged image on the USB stick.
    @param usb_boot_timeout: The usb_boot_timeout to use during reimage.
            Factory images need a longer usb_boot_timeout than regular
            cros images.
    @param install_timeout: The timeout to use when installing the chromeos
            image. Factory images need a longer install_timeout.

    @raises AutoservRepairFailure if the DUT does not come up from USB
            within usb_boot_timeout.
    @raises AutoservError if the image fails to boot.

    """
    logging.info('Downloading image to USB, then booting from it. Usb boot '
                 'timeout = %s', usb_boot_timeout)
    usb_boot_timer = autotest_stats.Timer(
            'servo_install.usb_boot_timeout_%s' % usb_boot_timeout)
    usb_boot_timer.start()
    self.servo.install_recovery_image(image_url)
    booted_from_usb = self.wait_up(timeout=usb_boot_timeout)
    if not booted_from_usb:
        raise error.AutoservRepairFailure(
                'DUT failed to boot from USB after %d seconds' %
                usb_boot_timeout)
    usb_boot_timer.stop()

    install_timer = autotest_stats.Timer(
            'servo_install.install_timeout_%s' % install_timeout)
    install_timer.start()
    logging.info('Installing image through chromeos-install.')
    self.run('chromeos-install --yes', timeout=install_timeout)
    self.run('halt')
    install_timer.stop()

    logging.info('Power cycling DUT through servo.')
    self.servo.get_power_state_controller().power_off()
    self.servo.switch_usbkey('off')
    # N.B. The Servo API requires that we use power_on() here
    # for two reasons:
    #  1) After turning on a DUT in recovery mode, you must turn
    #     it off and then on with power_on() once more to
    #     disable recovery mode (this is a Parrot specific
    #     requirement).
    #  2) After power_off(), the only way to turn on is with
    #     power_on() (this is a Storm specific requirement).
    self.servo.get_power_state_controller().power_on()

    logging.info('Waiting for DUT to come back up.')
    rebooted = self.wait_up(timeout=self.BOOT_TIMEOUT)
    if not rebooted:
        raise error.AutoservError('DUT failed to reboot installed '
                                  'test image after %d seconds' %
                                  self.BOOT_TIMEOUT)
1047
1048
J. Richard Barnettee4af8b92013-05-01 13:16:12 -07001049 def _servo_repair_reinstall(self):
Scott Zawalski62bacae2013-03-05 10:40:32 -05001050 """Reinstall the DUT utilizing servo and a test image.
1051
1052 Re-install the OS on the DUT by:
1053 1) installing a test image on a USB storage device attached to the Servo
1054 board,
1055 2) booting that image in recovery mode, and then
1056 3) installing the image with chromeos-install.
1057
Scott Zawalski62bacae2013-03-05 10:40:32 -05001058 @raises AutoservRepairMethodNA if the device does not have servo
1059 support.
1060
1061 """
1062 if not self.servo:
1063 raise error.AutoservRepairMethodNA('Repair Reinstall NA: '
1064 'DUT has no servo support.')
1065
1066 logging.info('Attempting to recovery servo enabled device with '
1067 'servo_repair_reinstall')
1068
J. Richard Barnettee4af8b92013-05-01 13:16:12 -07001069 image_url = self.stage_image_for_servo()
Scott Zawalski62bacae2013-03-05 10:40:32 -05001070 self.servo_install(image_url)
1071
1072
1073 def _servo_repair_power(self):
1074 """Attempt to repair DUT using an attached Servo.
1075
1076 Attempt to power on the DUT via power_long_press.
1077
1078 @raises AutoservRepairMethodNA if the device does not have servo
1079 support.
1080 @raises AutoservRepairFailure if the repair fails for any reason.
1081 """
1082 if not self.servo:
1083 raise error.AutoservRepairMethodNA('Repair Power NA: '
1084 'DUT has no servo support.')
1085
1086 logging.info('Attempting to recover servo enabled device by '
1087 'powering it off and on.')
1088 self.servo.get_power_state_controller().power_off()
1089 self.servo.get_power_state_controller().power_on()
1090 if self.wait_up(self.BOOT_TIMEOUT):
1091 return
1092
1093 raise error.AutoservRepairFailure('DUT did not boot after long_press.')
Richard Barnette03a0c132012-11-05 12:40:35 -08001094
1095
Richard Barnette82c35912012-11-20 10:09:10 -08001096 def _powercycle_to_repair(self):
1097 """Utilize the RPM Infrastructure to bring the host back up.
1098
1099 If the host is not up/repaired after the first powercycle we utilize
1100 auto fallback to the last good install by powercycling and rebooting the
1101 host 6 times.
Scott Zawalski62bacae2013-03-05 10:40:32 -05001102
1103 @raises AutoservRepairMethodNA if the device does not support remote
1104 power.
1105 @raises AutoservRepairFailure if the repair fails for any reason.
1106
Richard Barnette82c35912012-11-20 10:09:10 -08001107 """
Scott Zawalski62bacae2013-03-05 10:40:32 -05001108 if not self.has_power():
1109 raise error.AutoservRepairMethodNA('Device does not support power.')
1110
Richard Barnette82c35912012-11-20 10:09:10 -08001111 logging.info('Attempting repair via RPM powercycle.')
1112 failed_cycles = 0
1113 self.power_cycle()
1114 while not self.wait_up(timeout=self.BOOT_TIMEOUT):
1115 failed_cycles += 1
1116 if failed_cycles >= self._MAX_POWER_CYCLE_ATTEMPTS:
Scott Zawalski62bacae2013-03-05 10:40:32 -05001117 raise error.AutoservRepairFailure(
1118 'Powercycled host %s %d times; device did not come back'
1119 ' online.' % (self.hostname, failed_cycles))
Richard Barnette82c35912012-11-20 10:09:10 -08001120 self.power_cycle()
1121 if failed_cycles == 0:
1122 logging.info('Powercycling was successful first time.')
1123 else:
1124 logging.info('Powercycling was successful after %d failures.',
1125 failed_cycles)
1126
1127
MK Ryu35d661e2014-09-25 17:44:10 -07001128 def _reboot_repair(self):
1129 """SSH to this host and reboot."""
1130 if not self.is_up(self._CHECK_HOST_UP_TIMEOUT_SECS):
1131 raise error.AutoservRepairMethodNA('DUT unreachable for reboot.')
1132 logging.info('Attempting repair via SSH reboot.')
1133 self.reboot(timeout=self.BOOT_TIMEOUT, wait=True)
1134
1135
def check_device(self):
    """Ping the device over ssh, then clean it up and verify it.

    The three steps run in order; an exception from any step
    propagates and skips the remaining ones.

    @raise AutoservSSHTimeout: If the ssh ping times out.
    @raise AutoservSshPermissionDeniedError: If ssh ping fails due to
                                             permissions.
    @raise AutoservSshPingHostError: For other AutoservRunErrors during
                                     ssh_ping.
    @raises AutoservError: As appropriate, during cleanup and verify.
    """
    for step_name in ('ssh_ping', 'cleanup', 'verify'):
        getattr(self, step_name)()
1148 self.verify()
1149
1150
def repair_full(self):
    """Repair a host for repair level NO_PROTECTION.

    This overrides the base class function for repair; it does
    not call back to the parent class, but instead offers a
    simplified implementation based on the capabilities in the
    Chrome OS test lab.

    If the DUT has a servo host but no servo yet, the servo host is
    repaired first (failures are only logged) and the servo is then
    fetched from it.

    The repair procedures below are tried in order, from less
    intrusive to more intrusive. After each one, crash logs are
    collected and the DUT is checked with `self.check_device()`; the
    first procedure for which both the repair and the check succeed
    ends the repair:
      1. SSH to the DUT and reboot.
      2. If there's a servo for the DUT, try to power the DUT off and
         on.
      3. If the DUT can be power-cycled via RPM, try to repair
         by power-cycling.
      4. Try to re-install to a known stable image using
         auto-update.
      5. Powerwash the DUT, then try the auto-update re-install again.
      6. If there's a servo for the DUT, try to re-install via
         the servo.

    The outcome of every procedure is recorded in autotest_stats
    counters, both overall and per board when the board is known.

    @raises AutoservRepairTotalFailure if the repair process fails to
            fix the DUT.
    @raises ServoHostRepairTotalFailure if the repair process fails to
            fix the servo host if one is attached to the DUT.
    @raises AutoservSshPermissionDeniedError if it is unable
            to ssh to the servo host due to permission error.

    """
    # Caution: Deleting shards relies on repair to always reboot the DUT.

    if self._servo_host and not self.servo:
        try:
            self._servo_host.repair_full()
        except Exception as servo_error:
            logging.error('Could not create a healthy servo: %s',
                          servo_error)
        self.servo = self._servo_host.get_servo()

    self.try_collect_crashlogs()

    # TODO(scottz): This should use something similar to label_decorator,
    # but needs to be populated in order so DUTs are repaired with the
    # least amount of effort.
    repair_steps = [self._reboot_repair,
                    self._servo_repair_power,
                    self._powercycle_to_repair,
                    self._install_repair,
                    self._install_repair_with_powerwash,
                    self._servo_repair_reinstall]
    failure_messages = []
    board = self._get_board_from_afe()

    def record_outcome(step_name, outcome):
        """Bump the overall and, if known, the per-board counter."""
        autotest_stats.Counter(
                '%s.%s' % (step_name, outcome)).increment()
        if board:
            autotest_stats.Counter(
                    '%s.%s.%s' % (step_name, board, outcome)).increment()

    for repair_step in repair_steps:
        try:
            repair_step()
            self.try_collect_crashlogs()
            self.check_device()
            record_outcome(repair_step.__name__, 'SUCCEEDED')
            return
        except error.AutoservRepairMethodNA as not_applicable:
            record_outcome(repair_step.__name__, 'RepairNA')
            logging.warning('Repair function NA: %s', not_applicable)
            failure_messages.append(str(not_applicable))
        except Exception as failure:
            record_outcome(repair_step.__name__, 'FAILED')
            logging.warning('Failed to repair device: %s', failure)
            failure_messages.append(str(failure))

    autotest_stats.Counter('Full_Repair_Failed').increment()
    if board:
        autotest_stats.Counter(
                'Full_Repair_Failed.%s' % board).increment()
    raise error.AutoservRepairTotalFailure(
            'All attempts at repairing the device failed:\n%s' %
            '\n'.join(failure_messages))
Richard Barnette82c35912012-11-20 10:09:10 -08001250
1251
def try_collect_crashlogs(self, check_host_up=True):
    """
    Collect crash logs from the host if a crashed job left them pending.

    The pending crashed job is looked up with _need_crash_logs().  When
    there is one, and either `check_host_up` is False or the host answers
    is_up() within _CHECK_HOST_UP_TIMEOUT_SECS, the logs are gathered
    with _collect_crashlogs().

    Every exception raised along the way is logged and suppressed:
    a failure to collect crash logs must not turn into a repair failure.

    @param check_host_up: Flag for checking host is up. Default is True.
    """
    try:
        crash_job = self._need_crash_logs()
        if crash_job:
            logging.debug('%s: Job %s was crashed', self._CRASHLOGS_PREFIX,
                          crash_job)
            # Short-circuit: is_up() is only probed when the caller asked
            # for the check.
            if not check_host_up or self.is_up(
                    self._CHECK_HOST_UP_TIMEOUT_SECS):
                self._collect_crashlogs(crash_job)
                logging.debug('%s: Completed collecting logs for the '
                              'crashed job %s', self._CRASHLOGS_PREFIX,
                              crash_job)
    except Exception as e:
        # Exception should not result in repair failure.
        # Therefore, suppress all exceptions here.
        logging.error('%s: Failed while trying to collect crash-logs: %s',
                      self._CRASHLOGS_PREFIX, e)
1275
1276
def _need_crash_logs(self):
    """Get the value of need_crash_logs attribute of this host.

    Queries the AFE for the constants.CRASHLOGS_HOST_ATTRIBUTE attribute
    of this hostname.  At most one such attribute is expected; more than
    one trips the assertion below.

    @return: Value string of need_crash_logs attribute
             None if there is no need_crash_logs attribute
    """
    attrs = self._AFE.get_host_attribute(constants.CRASHLOGS_HOST_ATTRIBUTE,
                                         hostname=self.hostname)
    assert len(attrs) < 2
    return attrs[0].value if attrs else None
1287
1288
def _collect_crashlogs(self, job_id):
    """Grab logs from the host where a job was crashed.

    First, check if PRIOR_LOGS_DIR exists in the host.
    If yes, collect them.
    Otherwise, check if a lab-machine marker (_LAB_MACHINE_FILE) exists
    in the host.
    If yes, the host was repaired automatically, and we collect normal
    system logs.

    Whichever branch is taken, a marker file holding the job id is then
    written into the crash-log directory, the need_crash_logs host
    attribute is cleared, and (only if prior logs were found)
    PRIOR_LOGS_DIR is removed from the host.

    @param job_id: Id of the job that was crashed.
    """
    crashlogs_dir = crashcollect.get_crashinfo_dir(self,
            constants.CRASHLOGS_DEST_DIR_PREFIX)
    flag_prior_logs = False

    if self.path_exists(client_constants.PRIOR_LOGS_DIR):
        flag_prior_logs = True
        self._collect_prior_logs(crashlogs_dir)
    elif self.path_exists(self._LAB_MACHINE_FILE):
        self._collect_system_logs(crashlogs_dir)
    else:
        logging.warning('%s: Host was manually re-installed without '
                        '--lab_preserve_log option. Skip collecting '
                        'crash-logs.', self._CRASHLOGS_PREFIX)

    # We make crash collection be one-time effort.
    # _collect_prior_logs() and _collect_system_logs() will not throw
    # any exception, and following codes will be executed even when
    # those methods fail.
    # _collect_crashlogs() is called only when the host is up (refer
    # to try_collect_crashlogs()). We assume _collect_prior_logs() and
    # _collect_system_logs() fail rarely when the host is up.
    # In addition, it is not clear how many times we should try crash
    # collection again while not triggering next repair unnecessarily.
    # Therefore, we try crash collection one time.

    # Create a marker file as soon as log collection is done.
    # Leave the job id to this marker for gs_offloader to consume.
    marker_file = os.path.join(crashlogs_dir, constants.CRASHLOGS_MARKER)
    with open(marker_file, 'a') as f:
        f.write('%s\n' % job_id)

    # Remove need_crash_logs attribute
    logging.debug('%s: Remove attribute need_crash_logs from host %s',
                  self._CRASHLOGS_PREFIX, self.hostname)
    self._AFE.set_host_attribute(constants.CRASHLOGS_HOST_ATTRIBUTE,
                                 None, hostname=self.hostname)

    if flag_prior_logs:
        logging.debug('%s: Remove %s from host %s', self._CRASHLOGS_PREFIX,
                      client_constants.PRIOR_LOGS_DIR, self.hostname)
        self.run('rm -rf %s; sync' % client_constants.PRIOR_LOGS_DIR)
        # Wait for a few seconds to make sure the prior command is
        # done deep through storage.
        time.sleep(self._SAFE_WAIT_SECS)
1345
1346
def _collect_prior_logs(self, crashlogs_dir):
    """Grab prior logs that were stashed before re-installing a host.

    Copies client_constants.PRIOR_LOGS_DIR from the host with
    collect_logs().  Any exception is logged and swallowed, so this
    method does not raise on a failed collection.

    @param crashlogs_dir: Directory path where crash-logs are stored.
    """
    logging.debug('%s: Found %s, collecting them...',
                  self._CRASHLOGS_PREFIX, client_constants.PRIOR_LOGS_DIR)
    try:
        self.collect_logs(client_constants.PRIOR_LOGS_DIR,
                          crashlogs_dir, False)
        logging.debug('%s: %s is collected',
                      self._CRASHLOGS_PREFIX, client_constants.PRIOR_LOGS_DIR)
    except Exception as e:
        logging.error('%s: Failed to collect %s: %s',
                      self._CRASHLOGS_PREFIX, client_constants.PRIOR_LOGS_DIR,
                      e)
1363
1364
def _collect_system_logs(self, crashlogs_dir):
    """Grab normal system logs from a host.

    The list of remote paths comes from parsing _LOGS_TO_COLLECT_FILE.
    Each path that exists on the host is collected on its own; a failure
    on one path is logged and does not stop the remaining ones.

    @param crashlogs_dir: Directory path where crash-logs are stored.
    """
    logging.debug('%s: Found %s, collecting system logs...',
                  self._CRASHLOGS_PREFIX, self._LAB_MACHINE_FILE)
    sources = server_utils.parse_simple_config(self._LOGS_TO_COLLECT_FILE)
    for src in sources:
        try:
            if self.path_exists(src):
                logging.debug('%s: Collecting %s...',
                              self._CRASHLOGS_PREFIX, src)
                dest = server_utils.concat_path_except_last(
                        crashlogs_dir, src)
                self.collect_logs(src, dest, False)
                logging.debug('%s: %s is collected',
                              self._CRASHLOGS_PREFIX, src)
        except Exception as e:
            logging.error('%s: Failed to collect %s: %s',
                          self._CRASHLOGS_PREFIX, src, e)
1386
1387
def close(self):
    """Disconnect all RPC connections, then run the parent close()."""
    self.rpc_disconnect_all()
    super(CrosHost, self).close()
J. Richard Barnette1d78b012012-05-15 13:56:30 -07001391
1392
def get_power_supply_info(self):
    """Get the output of power_supply_info.

    power_supply_info outputs the info of each power supply, e.g.,
    Device: Line Power
      online:                  no
      type:                    Mains
      voltage (V):             0
      current (A):             0
    Device: Battery
      state:                   Discharging
      percentage:              95.9276
      technology:              Li-ion

    Above output shows two devices, Line Power and Battery, with details of
    each device listed. This function parses the output into a dictionary,
    with key being the device name, and value being a dictionary of details
    of the device info.

    Each line is split on its first colon only, so a value that itself
    contains a colon is kept whole.  Lines without any colon are ignored,
    as are detail lines that appear before the first "Device:" line.

    @return:  The dictionary of power_supply_info, e.g.,
              {'Line Power': {'online': 'yes', 'type': 'main'},
               'Battery': {'vendor': 'xyz', 'percentage': '100'}}
    @raise error.AutoservRunError if power_supply_info tool is not found in
           the DUT. Caller should handle this error to avoid false failure
           on verification.
    """
    result = self.run('power_supply_info').stdout.strip()
    info = {}
    device_name = None
    device_info = {}
    for line in result.split('\n'):
        key, separator, value = line.partition(':')
        if not separator:
            continue
        key = key.strip()
        value = value.strip()
        if key == 'Device':
            # A new device section starts: flush the one being built.
            if device_name:
                info[device_name] = device_info
            device_name = value
            device_info = {}
        else:
            device_info[key] = value
    # Flush the last section, which has no following "Device:" line.
    if device_name and device_name not in info:
        info[device_name] = device_info
    return info
1437
1438
def get_battery_percentage(self):
    """Get the battery percentage.

    Reads the 'percentage' entry of the 'Battery' device reported by
    get_power_supply_info() and converts it to a float.

    @return: The percentage of battery level, value range from 0-100. Return
             None if the battery info cannot be retrieved.
    """
    try:
        info = self.get_power_supply_info()
        logging.info(info)
        return float(info['Battery']['percentage'])
    except (KeyError, ValueError, error.AutoservRunError):
        # Missing Battery section, unparsable number, or the tool failed.
        return None
1451
1452
def is_ac_connected(self):
    """Check if the dut has power adapter connected and charging.

    The answer is the 'online' entry of the 'Line Power' device reported
    by get_power_supply_info().

    @return: True if 'online' is 'yes', False for any other value, and
             None if the information cannot be retrieved (no such entry,
             or power_supply_info failed to run).
    """
    try:
        info = self.get_power_supply_info()
        return info['Line Power']['online'] == 'yes'
    except (KeyError, error.AutoservRunError):
        return None
Dan Shi49ca0932014-11-14 11:22:27 -08001463
1464
def _cleanup_poweron(self):
    """Special cleanup method to make sure hosts always get power back.

    Does nothing unless the AFE record of this host carries the
    _RPM_OUTLET_CHANGED attribute.  Otherwise power is turned on and the
    attribute is cleared.

    If power_on() fails with rpm_client.RemotePowerException, the failure
    is logged and posted, and then:
      - the exception is re-raised when the battery level is known and
        below 50;
      - otherwise, if the power adapter is connected, the attribute is
        cleared as well;
      - in both non-raising cases the battery level is logged.

    @raise rpm_client.RemotePowerException: power could not be restored
            and the battery level is known to be below 50.
    """
    afe = frontend_wrappers.RetryingAFE(timeout_min=5, delay_sec=10)
    hosts = afe.get_hosts(hostname=self.hostname)
    if not hosts or not (self._RPM_OUTLET_CHANGED in
                         hosts[0].attributes):
        return
    logging.debug('This host has recently interacted with the RPM'
                  ' Infrastructure. Ensuring power is on.')
    try:
        self.power_on()
        afe.set_host_attribute(self._RPM_OUTLET_CHANGED, None,
                               hostname=self.hostname)
    except rpm_client.RemotePowerException:
        logging.error('Failed to turn Power On for this host after '
                      'cleanup through the RPM Infrastructure.')
        autotest_es.post(
                type_str='RPM_poweron_failure',
                metadata={'hostname': self.hostname})

        battery_percentage = self.get_battery_percentage()
        # Compare against None explicitly: a reading of 0.0 is falsy but
        # is a known (and critically low) battery level.
        if battery_percentage is not None and battery_percentage < 50:
            raise
        elif self.is_ac_connected():
            logging.info('The device has power adapter connected and '
                         'charging. No need to try to turn RPM on '
                         'again.')
            afe.set_host_attribute(self._RPM_OUTLET_CHANGED, None,
                                   hostname=self.hostname)
        logging.info('Battery level is now at %s%%. The device may '
                     'still have enough power to run test, so no '
                     'exception will be raised.', battery_percentage)
1497
Simran Basi5e6339a2013-03-21 11:34:32 -07001498
beepsc87ff602013-07-31 21:53:00 -07001499 def _is_factory_image(self):
1500 """Checks if the image on the DUT is a factory image.
1501
1502 @return: True if the image on the DUT is a factory image.
1503 False otherwise.
1504 """
1505 result = self.run('[ -f /root/.factory_test ]', ignore_status=True)
1506 return result.exit_status == 0
1507
1508
def _restart_ui(self):
    """Restart the Chrome UI.

    The Chrome session identifier is captured before the ui job is
    stopped and started, and is then handed to
    cros_ui.wait_for_chrome_ready().

    @raises: FactoryImageCheckerException for factory images, since
             we cannot attempt to restart ui on them.
             error.AutoservRunError for any other type of error that
             occurs while restarting ui.
    """
    if self._is_factory_image():
        raise FactoryImageCheckerException('Cannot restart ui on factory '
                                           'images')

    # TODO(jrbarnette):  The command to stop/start the ui job
    # should live inside cros_ui, too.  However that would seem
    # to imply interface changes to the existing start()/restart()
    # functions, which is a bridge too far (for now).
    prompt = cros_ui.get_chrome_session_ident(self)
    self.run('stop ui; start ui')
    cros_ui.wait_for_chrome_ready(prompt, self)
beepsc87ff602013-07-31 21:53:00 -07001528
1529
def get_release_version(self):
    """Get the value of attribute CHROMEOS_RELEASE_VERSION from lsb-release.

    The file at client_constants.LSB_RELEASE is read from the host with
    `cat` and its content is parsed by lsbrelease_utils.

    @returns The version string in lsb-release, under attribute
             CHROMEOS_RELEASE_VERSION.
    """
    lsb_release_content = self.run(
            'cat "%s"' % client_constants.LSB_RELEASE).stdout.strip()
    return lsbrelease_utils.get_chromeos_release_version(
            lsb_release_content=lsb_release_content)
1540
1541
def verify_cros_version_label(self):
    """Make sure host's cros-version label match the actual image in dut.

    Remove any cros-version: label that doesn't match that installed in
    the dut.  When at least one label had to be removed, the mismatch is
    posted and an exception is raised.  A host without any cros-version
    label passes without the DUT being queried.

    @raise error.AutoservError: If any mismatch between cros-version label
            and the build installed in dut is found.
    """
    labels = self._AFE.get_labels(
            name__startswith=ds_constants.VERSION_PREFIX,
            host__hostname=self.hostname)
    mismatch_found = False
    if labels:
        # Get CHROMEOS_RELEASE_VERSION from lsb-release, e.g., 6908.0.0.
        # Note that it's different from cros-version label, which has
        # builder and branch info, e.g.,
        # cros-version:peppy-release/R43-6908.0.0
        release_version = self.get_release_version()
        host_list = [self.hostname]
        for label in labels:
            # Remove any cros-version label that does not match
            # release_version.
            build_version = label.name[len(ds_constants.VERSION_PREFIX):]
            if not utils.version_match(build_version, release_version):
                logging.warning('cros-version label "%s" does not match '
                                'release version %s. Removing the label.',
                                label.name, release_version)
                label.remove_hosts(hosts=host_list)
                mismatch_found = True
    if mismatch_found:
        autotest_es.post(use_http=True,
                         type_str='cros_version_label_mismatch',
                         metadata={'hostname': self.hostname})
        raise error.AutoservError('The host has wrong cros-version label.')
1579
1580
def cleanup(self):
    """Clean up the host after a job.

    Steps, in order:
      1. Remove client_constants.CLEANUP_LOGS_PAUSED_FILE from the host.
      2. Restart the UI; if that fails, fall back to the parent class
         cleanup().
      3. If the host has power control (has_power()), make sure power
         is restored via _cleanup_poweron().
      4. Verify the cros-version label, which raises on a mismatch.
    """
    self.run('rm -f %s' % client_constants.CLEANUP_LOGS_PAUSED_FILE)
    try:
        self._restart_ui()
    except (error.AutotestRunError, error.AutoservRunError,
            FactoryImageCheckerException):
        logging.warning('Unable to restart ui, rebooting device.')
        # Since restarting the UI fails fall back to normal Autotest
        # cleanup routines, i.e. reboot the machine.
        super(CrosHost, self).cleanup()
    # Check if the rpm outlet was manipulated.
    if self.has_power():
        self._cleanup_poweron()
    self.verify_cros_version_label()
J. Richard Barnette45e93de2012-04-11 17:24:15 -07001595
1596
def reboot(self, **dargs):
    """
    This function reboots the site host. The more generic
    RemoteHost.reboot() performs sync and sleeps for 5
    seconds. This is not necessary for Chrome OS devices as the
    sync should be finished in a short time during the reboot
    command.

    @param dargs: Keyword arguments forwarded to the parent reboot().
            Defaults filled in here when absent:
              reboot_cmd - a backgrounded `reboot`, followed by
                           `reboot -f` after `reboot_timeout` seconds
                           (default 10);
              fastsync   - True.
            'board' is always overwritten with the board name of this
            host.
    """
    if 'reboot_cmd' not in dargs:
        reboot_timeout = dargs.get('reboot_timeout', 10)
        dargs['reboot_cmd'] = ('((reboot & sleep %d; reboot -f &)'
                               ' </dev/null >/dev/null 2>&1 &)' %
                               reboot_timeout)
    # Enable fastsync to avoid running extra sync commands before reboot.
    if 'fastsync' not in dargs:
        dargs['fastsync'] = True

    # For purposes of logging reboot times:
    # Get the board name i.e. 'daisy_spring'
    board_fullname = self.get_board()

    # Strip the prefix and add it to dargs.
    dargs['board'] = board_fullname[board_fullname.find(':')+1:]
    super(CrosHost, self).reboot(**dargs)
Yu-Ju Honga2be94a2012-07-31 09:48:52 -07001621
1622
def suspend(self, **dargs):
    """
    This function suspends the site host.

    @param dargs: Keyword arguments forwarded to the parent suspend().
            suspend_time - seconds written to the RTC wake alarm
                           (default 60); also stored as 'timeout'.
            suspend_cmd  - when absent, a command is built that resets
                           the RTC wake alarm, arms it for suspend_time
                           seconds and calls powerd_dbus_suspend.
    """
    suspend_time = dargs.get('suspend_time', 60)
    dargs['timeout'] = suspend_time
    if 'suspend_cmd' not in dargs:
        cmd = ' && '.join(['echo 0 > /sys/class/rtc/rtc0/wakealarm',
                           'echo +%d > /sys/class/rtc/rtc0/wakealarm' % suspend_time,
                           'powerd_dbus_suspend --delay=0 &'])
        dargs['suspend_cmd'] = ('(( %s )'
                                '< /dev/null >/dev/null 2>&1 &)' % cmd)
    super(CrosHost, self).suspend(**dargs)
1636
1637
def upstart_status(self, service_name):
    """Check the status of an upstart init script.

    @param service_name: Service to look up.

    @returns True if the service is running, False otherwise.
    """
    # grep exits non-zero when nothing matches; ignore_status lets that
    # case come back as an empty stdout (-> False) instead of raising.
    result = self.run('status %s | grep start/running' % service_name,
                      ignore_status=True)
    return result.stdout.strip() != ''
1647
1648
def verify_software(self):
    """Verify working software on a Chrome OS system.

    Tests for the following conditions:
     1. No crash logs are pending collection for this host.
     2. All conditions tested by the parent version of this
        function.
     3. Sufficient inodes in /mnt/stateful_partition.
     4. Sufficient space in /mnt/stateful_partition.
     5. Sufficient space in /mnt/stateful_partition/encrypted
        (only if that path exists).
     6. The system-services upstart job is running.
     7. update_engine answers a simple status request over DBus
        (skipped on factory images).
     8. python on the DUT can import cPickle.
     9. The cros-version label matches the installed image.

    @raise error.AutoservCrashLogCollectRequired: If crash logs must
            be collected before the host can be verified.
    @raise error.AutoservError: If system services are not running.
    """
    # Check if a job was crashed on this host.
    # If yes, avoid verification until crash-logs are collected.
    if self._need_crash_logs():
        raise error.AutoservCrashLogCollectRequired(
                'Need to collect crash-logs before verification')

    super(CrosHost, self).verify_software()
    self.check_inodes(
        '/mnt/stateful_partition',
        global_config.global_config.get_config_value(
            'SERVER', 'kilo_inodes_required', type=int,
            default=100))
    self.check_diskspace(
        '/mnt/stateful_partition',
        global_config.global_config.get_config_value(
            'SERVER', 'gb_diskspace_required', type=float,
            default=20.0))
    encrypted_stateful_path = '/mnt/stateful_partition/encrypted'
    # Not all targets build with encrypted stateful support.
    if self.path_exists(encrypted_stateful_path):
        self.check_diskspace(
            encrypted_stateful_path,
            global_config.global_config.get_config_value(
                'SERVER', 'gb_encrypted_diskspace_required', type=float,
                default=0.1))

    if not self.upstart_status('system-services'):
        raise error.AutoservError('Chrome failed to reach login. '
                                  'System services not running.')

    # Factory images don't run update engine,
    # goofy controls dbus on these DUTs.
    if not self._is_factory_image():
        self.run('update_engine_client --status')
    # Makes sure python is present, loads and can use built in functions.
    # We have seen cases where importing cPickle fails with undefined
    # symbols in cPickle.so.
    self.run('python -c "import cPickle"')

    self.verify_cros_version_label()
1700
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07001701
def verify_hardware(self):
    """Verify hardware system of a Chrome OS system.

    Check following hardware conditions:
    1. Battery level.
    2. Is power adapter connected.

    Both results are only logged; nothing is raised based on them.
    """
    logging.info('Battery percentage: %s', self.get_battery_percentage())
    # Query once: each call runs a command on the DUT, and two calls
    # could disagree with each other.
    ac_connected = self.is_ac_connected()
    if ac_connected is None:
        logging.info('Can not determine if the device has power adapter '
                     'connected.')
    else:
        logging.info('Device %s power adapter connected and charging.',
                     'has' if ac_connected else 'does not have')
Dan Shi49ca0932014-11-14 11:22:27 -08001716
1717
def make_ssh_command(self, user='root', port=22, opts='', hosts_file=None,
                     connect_timeout=None, alive_interval=None):
    """Override default make_ssh_command to use options tuned for Chrome OS.

    Tuning changes:
      - ConnectTimeout=30; maximum of 30 seconds allowed for an SSH
      connection failure.  Consistency with remote_access.sh.

      - ServerAliveInterval=180; which causes SSH to ping connection every
      180 seconds. In conjunction with ServerAliveCountMax ensures
      that if the connection dies, Autotest will bail out quickly.
      Originally tried 60 secs, but saw frequent job ABORTS where
      the test completed successfully.

      - ServerAliveCountMax=3; consistency with remote_access.sh.

      - ConnectionAttempts=4; reduce flakiness in connection errors;
      consistency with remote_access.sh.

      - UserKnownHostsFile=/dev/null; we don't care about the keys.
      Host keys change with every new installation, don't waste
      memory/space saving them.

      - SSH protocol forced to 2; needed for ServerAliveInterval.

    @param user User name to use for the ssh connection.
    @param port Port on the target host to use for ssh connection.
    @param opts Additional options to the ssh command.
    @param hosts_file Ignored.
    @param connect_timeout Ignored.
    @param alive_interval Ignored.

    @return The ssh command line as a string, without the target
            hostname.
    """
    base_command = ('/usr/bin/ssh -a -x %s %s %s'
                    ' -o StrictHostKeyChecking=no'
                    ' -o UserKnownHostsFile=/dev/null -o BatchMode=yes'
                    ' -o ConnectTimeout=30 -o ServerAliveInterval=180'
                    ' -o ServerAliveCountMax=3 -o ConnectionAttempts=4'
                    ' -o Protocol=2 -l %s -p %d')
    return base_command % (self._ssh_verbosity_flag, self._ssh_options,
                           opts, user, port)
Fang Deng96667ca2013-08-01 17:46:18 -07001758
1759
def _create_ssh_tunnel(self, port, local_port):
    """Create an ssh tunnel from local_port to port.

    The tunnel is an ssh process started through the shell with local
    port forwarding (-L); it is returned without being waited on.

    @param port: remote port on the host.
    @param local_port: local forwarding port.

    @return: the tunnel process.
    """
    # Chrome OS on the target closes down most external ports
    # for security.  We could open the port, but doing that
    # would conflict with security tests that check that only
    # expected ports are open.  So, to get to the port on the
    # target we use an ssh tunnel.
    tunnel_options = '-n -N -q -L %d:localhost:%d' % (local_port, port)
    ssh_cmd = self.make_ssh_command(opts=tunnel_options)
    tunnel_cmd = '%s %s' % (ssh_cmd, self.hostname)
    logging.debug('Full tunnel command: %s', tunnel_cmd)
    tunnel_proc = subprocess.Popen(tunnel_cmd, shell=True, close_fds=True)
    logging.debug('Started ssh tunnel, local = %d'
                  ' remote = %d, pid = %d',
                  local_port, port, tunnel_proc.pid)
    return tunnel_proc
1782
1783
def _setup_rpc(self, port, command_name, remote_pid=None):
    """Sets up a tunnel process and performs rpc connection book keeping.

    This method assumes that xmlrpc and jsonrpc never conflict, since
    we can only either have an xmlrpc or a jsonrpc server listening on
    a remote port. As such, it enforces a single proxy->remote port
    policy, i.e if one starts a jsonrpc proxy/server from port A->B,
    and then tries to start an xmlrpc proxy forwarded to the same port,
    the xmlrpc proxy will override the jsonrpc tunnel process, however:

    1. None of the methods on the xmlrpc proxy will work because
    the server listening on B is jsonrpc.

    2. The xmlrpc client cannot initiate a termination of the JsonRPC
    server, as the only use case currently is goofy, which is tied to
    the factory image. It is much easier to handle a failed xmlrpc
    call on the client than it is to terminate goofy in this scenario,
    as doing the latter might leave the DUT in a hard to recover state.

    With the current implementation newer rpc proxy connections will
    terminate the tunnel processes of older rpc connections tunneling
    to the same remote port. If methods are invoked on the client
    after this has happened they will fail with connection closed errors.

    @param port: The remote forwarding port.
    @param command_name: The name of the remote process, to terminate
                         using pkill.
    @param remote_pid: Recorded in the _rpc_proxy_map entry for `port`
                       together with command_name and the tunnel
                       process.  Defaults to None.

    @return A url that we can use to initiate the rpc connection.
    """
    # Drop whatever connection is already registered for this port.
    self.rpc_disconnect(port)
    local_port = utils.get_unused_port()
    tunnel_proc = self._create_ssh_tunnel(port, local_port)
    self._rpc_proxy_map[port] = (command_name, tunnel_proc, remote_pid)
    return self._RPC_PROXY_URL % local_port
1819
1820
def xmlrpc_connect(self, command, port, command_name=None,
                   ready_test_name=None, timeout_seconds=10,
                   logfile='/dev/null'):
    """Connect to an XMLRPC server on the host.

    The `command` argument should be a simple shell command that
    starts an XMLRPC server on the given `port`.  The command
    must not daemonize, and must terminate cleanly on SIGTERM.
    The command is started in the background on the host, and a
    local XMLRPC client for the server is created and returned
    to the caller.

    Note that the process of creating an XMLRPC client makes no
    attempt to connect to the remote server; the caller is
    responsible for determining whether the server is running
    correctly, and is ready to serve requests.

    Optionally, the caller can pass ready_test_name, a string
    containing the name of a method to call on the proxy.  This
    method should take no parameters and return successfully only
    when the server is ready to process client requests.  When
    ready_test_name is set, xmlrpc_connect will block until the
    proxy is ready.  If the server isn't ready by timeout_seconds,
    the connection is torn down with rpc_disconnect() and the
    exception from the retry wrapper propagates to the caller.
    NOTE(review): older versions of this docstring named that
    exception both TestError and TestFail; confirm against
    retry.retry.

    If a server is already running on the remote port, this
    method will kill it and disconnect the tunnel process
    associated with the connection before establishing a new one,
    by consulting the rpc_proxy_map in rpc_disconnect.

    @param command Shell command to start the server.
    @param port Port number on which the server is expected to
                be serving.
    @param command_name String to use as input to `pkill` to
        terminate the XMLRPC server on the host.
    @param ready_test_name String containing the name of a
        method defined on the XMLRPC server.
    @param timeout_seconds Number of seconds to wait
        for the server to become 'ready.'
    @param logfile Logfile to send output when running
        'command' argument.

    @return The XMLRPC client proxy for the server.
    """
    # Clean up any existing state.  If the caller is willing
    # to believe their server is down, we ought to clean up
    # any tunnels we might have sitting around.
    self.rpc_disconnect(port)
    # Start the server on the host.  Redirection in the command
    # below is necessary, because 'ssh' won't terminate until
    # background child processes close stdin, stdout, and
    # stderr.
    remote_cmd = '%s </dev/null >%s 2>&1 & echo $!' % (command, logfile)
    remote_pid = self.run(remote_cmd).stdout.rstrip('\n')
    logging.debug('Started XMLRPC server on host %s, pid = %s',
                  self.hostname, remote_pid)

    # Tunnel through SSH to be able to reach that remote port.
    rpc_url = self._setup_rpc(port, command_name, remote_pid=remote_pid)
    proxy = xmlrpclib.ServerProxy(rpc_url, allow_none=True)

    if ready_test_name is not None:
        # retry.retry logs each attempt; calculate delay_sec to
        # keep log spam to a dull roar.
        @retry.retry((socket.error,
                      xmlrpclib.ProtocolError,
                      httplib.BadStatusLine),
                     timeout_min=timeout_seconds / 60.0,
                     delay_sec=min(max(timeout_seconds / 20.0, 0.1), 1))
        def ready_test():
            """ Call proxy.ready_test_name(). """
            getattr(proxy, ready_test_name)()
        # The flag lets the finally clause clean up on any failure
        # without catching (and so without altering) the exception.
        successful = False
        try:
            logging.info('Waiting %d seconds for XMLRPC server '
                         'to start.', timeout_seconds)
            ready_test()
            successful = True
        finally:
            if not successful:
                logging.error('Failed to start XMLRPC server.')
                self.rpc_disconnect(port)
    logging.info('XMLRPC server started successfully.')
    return proxy
J. Richard Barnette1d78b012012-05-15 13:56:30 -07001905
J. Richard Barnette1d78b012012-05-15 13:56:30 -07001906
def syslog(self, message, tag='autotest'):
    """Logs a message to syslog on host.

    Both arguments are shell-quoted before being placed on the `logger`
    command line, so quotes, `$`, backticks and similar characters reach
    syslog literally instead of being interpreted by the remote shell.

    @param message String message to log into syslog
    @param tag String tag prefix for syslog

    """
    # shlex.quote on Python 3, pipes.quote on Python 2.
    try:
        from shlex import quote
    except ImportError:
        from pipes import quote
    self.run('logger -t %s %s' % (quote('%s' % tag),
                                  quote('%s' % message)))
1915
1916
def jsonrpc_connect(self, port):
    """Open a jsonrpc client proxy to the host through an ssh tunnel.

    This exists for talking to goofy (the default system manager on
    factory images), and leaves most sanity checking of the rpc server
    to the caller. Unlike xmlrpc_connect, no remote server is started
    here: the only clients are factory tests, where goofy is built in
    to the image and starts when the target boots.

    Several jsonrpc proxies could in principle be forwarded to the same
    remote port, as long as an rpc server is listening there, but that
    risks leaking an existing tunnel process.
    NOTE(review): this method does not call rpc_disconnect itself;
    presumably _setup_rpc tears down any tunnel previously opened for
    the port -- confirm.

    @param port: port on the remote host that is serving this proxy.

    @return: The client proxy, or None when jsonrpclib is unavailable.
    """
    if jsonrpclib:
        make_proxy = jsonrpclib.jsonrpc.ServerProxy
        # _setup_rpc is given None where xmlrpc_connect passes its
        # command name; it supplies the URL the proxy connects to.
        client = make_proxy(self._setup_rpc(port, None))
        logging.info('Established a jsonrpc connection through port %s.',
                     port)
        return client

    logging.warning('Jsonrpclib could not be imported. Check that '
                    'site-packages contains jsonrpclib.')
    return None
1947
1948
def rpc_disconnect(self, port):
    """Disconnect from an RPC server on the host.

    Kills the remote RPC server recorded for `port` (if one was
    recorded), closes the local ssh tunnel used to reach it, and
    forgets the port. RPC client objects handed out earlier are not
    touched directly, but calls made through them will fail once the
    connection is gone.

    Ports that are not in `_rpc_proxy_map` are silently ignored.

    @param port Port number passed to a previous call to
                `_setup_rpc()`.
    @exception TestError The remote server was still running after
                         _RPC_SHUTDOWN_TIMEOUT_SECONDS. In that case
                         the tunnel is left alone and the port stays
                         registered.
    """
    try:
        server_name, tunnel, server_pid = self._rpc_proxy_map[port]
    except KeyError:
        return

    if server_name:
        # The server is located with 'pkill' by name rather than by
        # PID: the host may have rebooted since we connected, and an
        # unrelated process could now own the old PID.
        #
        # 'pkill' exits with status 1 when nothing matched, which
        # would make run() raise; that case is fine here, so the exit
        # status is ignored.
        self.run("pkill -f '%s'" % server_name, ignore_status=True)

    if server_name and server_pid:
        logging.info('Waiting for RPC server "%s" shutdown',
                     server_name)
        began = time.time()
        stopped = False
        while time.time() - began < self._RPC_SHUTDOWN_TIMEOUT_SECONDS:
            listing = self.run("pgrep -f '%s'" % server_name,
                               ignore_status=True)
            if server_pid not in listing.stdout.split():
                stopped = True
                logging.info('Shut down RPC server.')
                break
            time.sleep(self._RPC_SHUTDOWN_POLLING_PERIOD_SECONDS)
        if not stopped:
            raise error.TestError('Failed to shutdown RPC server %s' %
                                  server_name)

    # poll() returning None means the tunnel process is still running.
    if tunnel.poll() is not None:
        logging.debug('Tunnel pid %d terminated early, status %d',
                      tunnel.pid, tunnel.returncode)
    else:
        tunnel.terminate()
        logging.debug('Terminated tunnel, pid %d', tunnel.pid)
    del self._rpc_proxy_map[port]
J. Richard Barnette1d78b012012-05-15 13:56:30 -07002003
2004
def rpc_disconnect_all(self):
    """Disconnect all known RPC proxy ports.

    rpc_disconnect() deletes each port from `_rpc_proxy_map` as it
    finishes, so the loop runs over a snapshot of the keys instead of
    the live mapping (iterating a dict that changes size is an error
    when keys() is a view rather than a list).
    """
    for port in list(self._rpc_proxy_map):
        self.rpc_disconnect(port)
J. Richard Barnette1d78b012012-05-15 13:56:30 -07002009
2010
def poor_mans_rpc(self, fun):
    """
    Builds a shell command that evaluates a client utils expression.

    The command changes into the bin directory below the path reported
    by autotest.Autotest.get_installed_autodir() and has python import
    common and utils and print utils.<fun>. Nothing is executed here;
    the caller is expected to run the returned command on the host and
    read its output.

    @param fun expression in the client utils namespace, e.g.
               'get_gpu_family()'.
    @return the shell command string.
    """
    autodir = autotest.Autotest.get_installed_autodir(self)
    pieces = [
        'cd %s/bin; ' % autodir,
        'python -c "import common; import utils;',
        'print utils.%s"' % fun,
    ]
    return ''.join(pieces)
2022
2023
def _ping_check_status(self, status):
    """Ping the host a single time and compare the outcome to `status`.

    A ping result of 0 is treated as "the host answered".

    @param status The ping outcome to test for.
    @return True iff `status` and the outcome of the ping agree
            (i.e. both True or both False).

    """
    answered = utils.ping(self.hostname, tries=1, deadline=1) == 0
    # XOR is non-zero exactly when the two values disagree.
    disagree = status ^ answered
    return not disagree
2034
def _ping_wait_for_status(self, status, timeout):
    """Poll with `ping` until the host reaches a status (UP or DOWN).

    Polling never starts a new cycle once `timeout` seconds have
    passed. The pause between cycles is sized so that roughly
    _PING_WAIT_COUNT cycles fit into the timeout, and is capped at
    about one minute.

    @param status Stop waiting as soon as `ping` of the host reports
                  this status.
    @param timeout Poll for at most this many seconds.
    @return True iff the status reported by `ping` matched the
            requested status at the time of return.

    """
    # One call to _ping_check_status() takes about a second, so that
    # second is subtracted from the pause between polls.
    pause = min(int(timeout / self._PING_WAIT_COUNT), 60) - 1
    deadline = time.time() + timeout
    while time.time() <= deadline:
        matched = self._ping_check_status(status)
        if matched:
            return True
        if pause > 0:
            time.sleep(pause)

    # The loop may have ended right after a sleep, so the last ping
    # could be stale; take one final reading before answering.
    return self._ping_check_status(status)
2065
def ping_wait_up(self, timeout):
    """Wait until the host answers `ping`.

    N.B. Do not treat this as a reliable replacement for `wait_up()`:
    a host that answers ping is not necessarily reachable over ssh.
    Use it only when the target DUT can be considered functional even
    though ssh to it may not work.

    @param timeout Minimum time to allow before declaring the
                   host to be non-responsive.
    @return True iff the host answered to ping before the timeout.

    """
    wanted = self._PING_STATUS_UP
    return self._ping_wait_for_status(wanted, timeout)
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07002081
def ping_wait_down(self, timeout):
    """Wait until the host stops answering `ping`.

    This can serve as a slightly faster alternative to `wait_down()`,
    since it avoids potentially long ssh timeouts.

    @param timeout Minimum time to allow for the host to become
                   non-responsive.
    @return True iff the host quit answering ping before the
            timeout.

    """
    wanted = self._PING_STATUS_DOWN
    return self._ping_wait_for_status(wanted, timeout)
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07002095
def test_wait_for_sleep(self, sleep_timeout=None):
    """Wait for the client to enter low-power sleep mode.

    "Asleep" is detected by the host no longer answering ping, which
    looks the same as a host that is powered off. To confirm that the
    unit really was asleep, force a resume and then call
    `test_wait_for_resume()`.

    The expected calling sequence in a test is:

    ~~~~~~~~
        boot_id = host.get_boot_id()
        # trigger sleep on the host
        host.test_wait_for_sleep()
        # trigger resume on the host
        host.test_wait_for_resume(boot_id)
    ~~~~~~~~

    @param sleep_timeout time limit in seconds to allow the host sleep;
                         SLEEP_TIMEOUT is used when omitted.

    @exception TestFail The host did not go to sleep within
                        the allowed time.
    """
    limit = self.SLEEP_TIMEOUT if sleep_timeout is None else sleep_timeout

    if self.ping_wait_down(timeout=limit):
        return
    raise error.TestFail(
        'client failed to sleep after %d seconds' % limit)
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07002126
2127
def test_wait_for_resume(self, old_boot_id, resume_timeout=None):
    """Wait for the client to resume from low-power sleep mode.

    Pass as `old_boot_id` the value `get_boot_id()` returned before
    the host went to sleep. If the boot id is different once the host
    is back, the host rebooted instead of resuming and `TestFail` is
    raised.

    See @ref test_wait_for_sleep for more on this function's
    usage.

    @param old_boot_id A boot id value obtained before the
                           target host went to sleep.
    @param resume_timeout time limit in seconds to allow the host up;
                          RESUME_TIMEOUT is used when omitted.

    @exception TestFail The host did not respond within the
                        allowed time.
    @exception TestFail The host responded, but the boot id test
                        indicated a reboot rather than a sleep
                        cycle.
    """
    limit = (self.RESUME_TIMEOUT if resume_timeout is None
             else resume_timeout)

    if not self.wait_up(timeout=limit):
        raise error.TestFail(
            'client failed to resume from sleep after %d seconds' %
            limit)

    current_boot_id = self.get_boot_id()
    if current_boot_id != old_boot_id:
        logging.error('client rebooted (old boot %s, new boot %s)',
                      old_boot_id, current_boot_id)
        raise error.TestFail(
            'client rebooted, but sleep was expected')
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07002162
2163
def test_wait_for_shutdown(self, shutdown_timeout=None):
    """Wait for the client to shut down.

    "Shut down" is detected by the host no longer answering ping,
    which looks the same as a host that is merely asleep. To confirm
    that the unit really was down, force a boot and then call
    test_wait_for_boot().

    The expected calling sequence in a test is:

    ~~~~~~~~
        boot_id = host.get_boot_id()
        # trigger shutdown on the host
        host.test_wait_for_shutdown()
        # trigger boot on the host
        host.test_wait_for_boot(boot_id)
    ~~~~~~~~

    @param shutdown_timeout time limit in seconds to allow the host
                            down; SHUTDOWN_TIMEOUT is used when omitted.
    @exception TestFail The host did not shut down within the
                        allowed time.
    """
    limit = (self.SHUTDOWN_TIMEOUT if shutdown_timeout is None
             else shutdown_timeout)

    if self.ping_wait_down(timeout=limit):
        return
    raise error.TestFail(
        'client failed to shut down after %d seconds' %
        limit)
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07002193
2194
def test_wait_for_boot(self, old_boot_id=None):
    """Wait for the client to boot from cold power.

    Pass as `old_boot_id` the value `get_boot_id()` returned before
    shutting down. If the boot id is unchanged once the host is back,
    no reboot happened and `TestFail` is raised. When `old_boot_id`
    is omitted (or otherwise false), the boot id is not checked.

    The host is given REBOOT_TIMEOUT seconds to come up.

    See @ref test_wait_for_shutdown for more on this function's
    usage.

    @param old_boot_id A boot id value obtained before the
                           shut down.

    @exception TestFail The host did not respond within the
                        allowed time.
    @exception TestFail The host responded, but the boot id test
                        indicated that there was no reboot.
    """
    if not self.wait_up(timeout=self.REBOOT_TIMEOUT):
        raise error.TestFail(
            'client failed to reboot after %d seconds' %
            self.REBOOT_TIMEOUT)

    if not old_boot_id:
        return

    if self.get_boot_id() == old_boot_id:
        logging.error('client not rebooted (boot %s)',
                      old_boot_id)
        raise error.TestFail(
            'client is back up, but did not reboot')
Simran Basid5e5e272012-09-24 15:23:59 -07002225
2226
@staticmethod
def check_for_rpm_support(hostname):
    """For a given hostname, return whether or not it is powered by an RPM.

    The decision is made purely from the name: it is matched against
    CrosHost._RPM_HOSTNAME_REGEX, anchored at the start of the string.

    @param hostname: hostname to check for rpm support.

    @return None if this host does not follow the defined naming format
            for RPM powered DUT's in the lab. If it does follow the format,
            it returns a regular expression MatchObject instead.
    """
    rpm_hostname_pattern = CrosHost._RPM_HOSTNAME_REGEX
    return re.match(rpm_hostname_pattern, hostname)
Simran Basid5e5e272012-09-24 15:23:59 -07002238
2239
def has_power(self):
    """For this host, return whether or not it is powered by an RPM.

    @return the result of check_for_rpm_support() for this host's
            hostname: a true value (a regular expression MatchObject)
            if the hostname follows the naming format for RPM powered
            DUT's, None otherwise.
    """
    rpm_match = CrosHost.check_for_rpm_support(self.hostname)
    return rpm_match
Simran Basid5e5e272012-09-24 15:23:59 -07002247
2248
def _set_power(self, state, power_method):
    """Sets the power to the host via RPM, Servo or manual.

    @param state Specifies which power state to set to DUT; 'ON' or
                 'OFF' in any letter case.
    @param power_method Specifies which method of power control to
                        use. POWER_CONTROL_SERVO and
                        POWER_CONTROL_MANUAL are handled specially;
                        any other value is treated as RPM control.

    @exception TestError `state` is not one of the accepted states.
    @exception TestFail RPM control was requested, but has_power()
                        reports no RPM for this host.

    """
    ACCEPTABLE_STATES = ['ON', 'OFF']

    requested = state.upper()
    if requested not in ACCEPTABLE_STATES:
        raise error.TestError('State must be one of: %s.'
                               % (ACCEPTABLE_STATES,))

    if power_method == self.POWER_CONTROL_SERVO:
        logging.info('Setting servo port J10 to %s', state)
        self.servo.set('prtctl3_pwren', state.lower())
        time.sleep(self._USB_POWER_TIMEOUT)
        return

    if power_method == self.POWER_CONTROL_MANUAL:
        # Nothing is switched here; a person has to do it while we
        # wait.
        logging.info('You have %d seconds to set the AC power to %s.',
                     self._POWER_CYCLE_TIMEOUT, state)
        time.sleep(self._POWER_CYCLE_TIMEOUT)
        return

    if not self.has_power():
        raise error.TestFail('DUT does not have RPM connected.')
    # Record on the AFE host entry that the outlet state was changed
    # before asking the RPM to switch it.
    afe = frontend_wrappers.RetryingAFE(timeout_min=5, delay_sec=10)
    afe.set_host_attribute(self._RPM_OUTLET_CHANGED, True,
                           hostname=self.hostname)
    rpm_client.set_power(self.hostname, requested, timeout_mins=5)
Simran Basid5e5e272012-09-24 15:23:59 -07002279
2280
def power_off(self, power_method=POWER_CONTROL_RPM):
    """Turn off power to this host via RPM, Servo or manual.

    @param power_method Specifies which method of power control to
                        use. Defaults to POWER_CONTROL_RPM; the
                        accepted values are documented as the strings
                        "RPM", "manual", "servoj10".

    """
    target_state = 'OFF'
    self._set_power(target_state, power_method)
Simran Basid5e5e272012-09-24 15:23:59 -07002290
2291
def power_on(self, power_method=POWER_CONTROL_RPM):
    """Turn on power to this host via RPM, Servo or manual.

    @param power_method Specifies which method of power control to
                        use. Defaults to POWER_CONTROL_RPM; the
                        accepted values are documented as the strings
                        "RPM", "manual", "servoj10".

    """
    target_state = 'ON'
    self._set_power(target_state, power_method)
2301
2302
def power_cycle(self, power_method=POWER_CONTROL_RPM):
    """Cycle power to this host by turning it OFF, then ON.

    For servo and manual control the cycle is an explicit power_off(),
    a pause of _POWER_CYCLE_TIMEOUT seconds, and a power_on(). For any
    other method a single 'CYCLE' request is sent to the RPM.

    @param power_method Specifies which method of power control to
                        use. Defaults to POWER_CONTROL_RPM; the
                        accepted values are documented as the strings
                        "RPM", "manual", "servoj10".

    """
    two_step_methods = (self.POWER_CONTROL_SERVO,
                        self.POWER_CONTROL_MANUAL)
    if power_method not in two_step_methods:
        rpm_client.set_power(self.hostname, 'CYCLE')
        return

    self.power_off(power_method=power_method)
    time.sleep(self._POWER_CYCLE_TIMEOUT)
    self.power_on(power_method=power_method)
Simran Basic6f1f7a2012-10-16 10:47:46 -07002318
2319
def get_platform(self):
    """Determine the correct platform label for this host.

    The label is derived from the firmware id reported by crossystem.

    @returns a string representing this host's platform.
    """
    crossystem = utils.Crossystem(self)
    crossystem.init()
    # fwid generally follows the format {platform}.{firmware version},
    # e.g. Alex.X.YYY.Z or Google_Alex.X.YYY.Z; everything before the
    # first '.' is the platform id.
    platform_id = crossystem.fwid().partition('.')[0]
    # Newer platforms carry a 'Google_' prefix that older ones lack;
    # drop it so both produce the same label.
    return platform_id.lower().replace('google_', '')
2333
2334
def get_architecture(self):
    """Determine the correct architecture label for this host.

    @returns a string representing this host's architecture, as
             reported by crossystem.
    """
    system_info = utils.Crossystem(self)
    system_info.init()
    architecture = system_info.arch()
    return architecture
2343
2344
def get_chrome_version(self):
    """Gets the Chrome version number and milestone as strings.

    Runs client_constants.CHROME_VERSION_COMMAND on the host and hands
    its output to utils.parse_chrome_version().

    @return A tuple (chrome_ver, milestone) where "chrome_ver" is the
            current Chrome version number as a string (in the form
            "W.X.Y.Z") and "milestone" is the first component of the
            version number (the "W" from "W.X.Y.Z"). If the version
            number cannot be parsed in the "W.X.Y.Z" format, the
            "chrome_ver" will be the full output of the version
            command and the milestone will be the empty string.

    """
    result = self.run(client_constants.CHROME_VERSION_COMMAND)
    return utils.parse_chrome_version(result.stdout)
2360
@label_decorator()
def get_board(self):
    """Determine the correct board label for this host.

    The board name is read from CHROMEOS_RELEASE_BOARD in
    /etc/lsb-release on the host.

    @returns a string representing this host's board.
    """
    release_info = utils.parse_cmd_output('cat /etc/lsb-release',
                                          run_method=self.run)
    board = release_info['CHROMEOS_RELEASE_BOARD']
    label_format = ds_constants.BOARD_PREFIX + '%s'
    # Lab devices generally report the plain board name, but
    # development devices report {board_name}-signed-{key_type}, so
    # only the leading part is kept. Board names containing 'x86'
    # (e.g. beginning with 'x86-') keep their first two
    # dash-separated parts.
    fields = board.split('-')
    kept = 2 if 'x86' in board else 1
    return label_format % '-'.join(fields[:kept])
Simran Basic6f1f7a2012-10-16 10:47:46 -07002377
2378
@label_decorator('board_freq_mem')
def get_board_with_frequency_and_memory(self):
    """
    Determines the board name with frequency and memory.

    The value comes from running the client utils function
    get_board_with_frequency_and_memory() on the host.

    @returns a more detailed string representing the board, prefixed
    with 'board_freq_mem:'. Examples of the detail part are
    butterfly_1.1GHz_2GB, link_1.8GHz_4GB, x86-zgb_1.7GHz_2GB
    """
    command = self.poor_mans_rpc('get_board_with_frequency_and_memory()')
    output = self.run(command).stdout
    return 'board_freq_mem:%s' % str.strip(output)
2390
2391
@label_decorator('lightsensor')
def has_lightsensor(self):
    """Determine whether this host has a light sensor.

    Searches _LIGHTSENSOR_SEARCH_DIR on the host (following symlinks,
    at most 4 levels deep) for any path matching one of
    _LIGHTSENSOR_FILES.

    @returns the string 'lightsensor' if this host has a lightsensor or
             None if it does not.
    """
    search_dir = self._LIGHTSENSOR_SEARCH_DIR
    name_pattern = '|'.join(self._LIGHTSENSOR_FILES)
    search_cmd = "find -L %s -maxdepth 4 | egrep '%s'" % (
        search_dir, name_pattern)
    try:
        # The search follows symlinks, so it can run into a symlink
        # loop; it still completes correctly with a few messages on
        # stderr, which is why stderr_tee is None.
        self.run(search_cmd, stdout_tee=None, stderr_tee=None)
    except error.AutoservRunError:
        # A failing command is taken to mean egrep exited with 1, i.e.
        # none of the possible lightsensor files exist.
        return None
    return 'lightsensor'
2411
2412
@label_decorator('bluetooth')
def has_bluetooth(self):
    """Determine whether this host has bluetooth.

    The check is whether the directory /sys/class/bluetooth/hci0
    exists on the host.

    @returns the string 'bluetooth' if this host has bluetooth or
             None if it does not.
    """
    try:
        self.run('test -d /sys/class/bluetooth/hci0')
    except error.AutoservRunError:
        # A failing command is taken to mean `test` exited with 1,
        # i.e. the directory does not exist.
        return None
    # `test` exited with a return code of 0.
    return 'bluetooth'
2428
2429
@label_decorator('gpu_family')
def get_gpu_family(self):
    """
    Determine GPU family.

    The value comes from running the client utils function
    get_gpu_family() on the host.

    @returns a string representing the gpu family, prefixed with
    'gpu_family:'. Examples of families are mali, tegra, pinetrail,
    sandybridge, ivybridge, haswell and baytrail.
    """
    command = self.poor_mans_rpc('get_gpu_family()')
    output = self.run(command).stdout
    return 'gpu_family:%s' % str.strip(output)
2440
2441
@label_decorator('graphics')
def get_graphics(self):
    """
    Determine the graphics label for this host.

    @returns a string representing this host's graphics. For now hosts
    whose `uname -a` output mentions 'arm' (in any letter case) return
    graphics:gles while all other hosts return graphics:gl. This may
    change over time, but for robustness reasons this should avoid
    executing code in actual graphics libraries (which may not be
    ready and is tested by graphics_GLAPICheck).
    """
    kernel_info = self.run('uname -a').stdout.lower()
    return 'graphics:gles' if 'arm' in kernel_info else 'graphics:gl'
2457
2458
@label_decorator('ec')
def get_ec(self):
    """
    Determine the type of EC on this host.

    @returns a string representing this host's embedded controller type.
    At present, it only returns "ec:cros", for Chrome OS ECs. Other types
    of EC (or none) return None, since no tests depend on those.
    """
    cmd = 'mosys ec info'
    # Chrome OS ECs report a last field in our EC version scheme:
    #
    #   stm | stm32f100 | snow_v1.3.139-375eb9f
    #   ti | Unknown-10de | peppy_v1.5.114-5d52788
    #
    # Other ECs report something else there:
    #
    #   ENE | KB932 | 00BE107A00
    #   ite | it8518 | 3.08
    #
    # And some systems don't have ECs at all (Lumpy, for example).
    regexp = r'^.*\|\s*(\S+_v\d+\.\d+\.\d+-[0-9a-f]+)\s*$'

    ecinfo = self.run(command=cmd, ignore_status=True)
    if ecinfo.exit_status != 0:
        # No EC present
        logging.info("%s exited with status %d", cmd, ecinfo.exit_status)
        return None

    match = re.search(regexp, ecinfo.stdout)
    if match is None:
        # Has an EC, but it's not a Chrome OS EC
        logging.info("%s got: %s", cmd, ecinfo.stdout)
        return None

    logging.info("EC version is %s", match.group(1))
    return 'ec:cros'
2496
2497
@label_decorator('accels')
def get_accels(self):
    """
    Determine the type of accelerometers on this host.

    @returns a string representing this host's accelerometer type.
    At present, it only returns "accel:cros-ec", for accelerometers
    attached to a Chrome OS EC, or None, if no accelerometers.
    """
    # Without the ectool command there is nothing to query.
    ectool_lookup = self.run('which ectool', ignore_status=True)
    if ectool_lookup.exit_status:
        logging.info("No ectool cmd found, assuming no EC accelerometers")
        return None

    # The EC has to understand the motionsense command.
    motionsense = self.run('ectool motionsense', ignore_status=True)
    if motionsense.exit_status:
        logging.info("EC does not support motionsense command "
                     "assuming no EC accelerometers")
        return None

    # The motion sensors have to be active; a first output line of
    # "0" is read as inactive.
    active_output = self.run('ectool motionsense active').stdout
    first_line = active_output.split('\n')[0]
    if first_line == "0":
        logging.info("Motion sense inactive, assuming no EC accelerometers")
        return None

    logging.info("EC accelerometers found")
    return 'accel:cros-ec'
2528
2529
@label_decorator('chameleon')
def has_chameleon(self):
    """Determine if a Chameleon is connected to this host.

    @returns a list containing two strings ('chameleon' and
             'chameleon:' + label, e.g. 'chameleon:hdmi') if this host
             has a Chameleon or None if it has not.
    """
    if not self._chameleon_host:
        return None
    return ['chameleon', 'chameleon:' + self.chameleon.get_label()]
2542
2543
@label_decorator('audio_loopback_dongle')
def has_loopback_dongle(self):
    """Determine if an audio loopback dongle is plugged to this host.

    A dongle is considered present when the cras node listing from the
    host shows both a HEADPHONE node and a MIC node as plugged.

    @returns 'audio_loopback_dongle' when there is an audio loopback dongle
                                     plugged to this host.
             None                    when there is no audio loopback dongle
                                     plugged to this host.
    """
    # The exit status is ignored; whatever was printed gets parsed.
    listing = self.run(command=cras_utils.get_cras_nodes_cmd(),
                       ignore_status=True)
    nodes_info = listing.stdout
    headphone_plugged = cras_utils.node_type_is_plugged('HEADPHONE',
                                                        nodes_info)
    if headphone_plugged and cras_utils.node_type_is_plugged('MIC',
                                                             nodes_info):
        return 'audio_loopback_dongle'
    return None
2560
2561
@label_decorator('power_supply')
def get_power_supply(self):
    """
    Determine what type of power supply the host has

    The label is 'power:' followed by the output of `mosys psu type`.

    @returns a string representing this host's power supply.
             'power:battery' when the device has a battery intended for
                    extended use
             'power:AC_primary' when the device has a battery not intended
                    for extended use (for moving the machine, etc)
             'power:AC_only' when the device has no battery at all.
             None when mosys reports the type as 'unknown'.
    """
    psu = self.run(command='mosys psu type', ignore_status=True)
    if psu.exit_status:
        # Not every platform ships the mosys psu command. When it is
        # missing the device is assumed to have a battery.
        return 'power:battery'

    psu_type = psu.stdout.strip()
    return None if psu_type == 'unknown' else 'power:%s' % psu_type
2586
2587
@label_decorator('storage')
def get_storage(self):
    """
    Determine the type of boot device for this host.

    Determine if the internal device is SCSI or dw_mmc device.
    Then check that it is SSD or HDD or eMMC or something else.

    @returns a string representing this host's internal device type.
             'storage:ssd' when internal device is solid state drive
             'storage:hdd' when internal device is hard disk drive
             'storage:mmc' when internal device is mmc drive
             None          When internal device is something else or
                           when we are unable to determine the type
    """
    # The output should be /dev/mmcblk* for SD/eMMC or /dev/sd* for scsi
    rootdev_cmd = ' '.join(['. /usr/sbin/write_gpt.sh;',
                            '. /usr/share/misc/chromeos-common.sh;',
                            'load_base_vars;',
                            'get_fixed_dst_drive'])
    rootdev = self.run(command=rootdev_cmd, ignore_status=True)
    if rootdev.exit_status:
        logging.info("Fail to run %s", rootdev_cmd)
        return None

    # Every check below works on the stripped device path, so stray
    # whitespace around the command output cannot defeat the
    # (start-anchored) pattern matches.
    rootdev_str = rootdev.stdout.strip()
    if not rootdev_str:
        return None

    rootdev_base = os.path.basename(rootdev_str)

    if re.match(r'/dev/mmcblk[0-9]', rootdev_str):
        # Use type to determine if the internal device is eMMC or
        # something else. We can assume that MMC is always an internal
        # device.
        type_cmd = 'cat /sys/block/%s/device/type' % rootdev_base
        device_type = self.run(command=type_cmd, ignore_status=True)
        if device_type.exit_status:
            logging.info("Fail to run %s", type_cmd)
            return None

        if device_type.stdout.strip() == 'MMC':
            return 'storage:mmc'

    if re.match(r'/dev/sd[a-z]+', rootdev_str):
        # Read symlink for /sys/block/sd* to determine if the internal
        # device is connected via ata or usb.
        link_cmd = 'readlink /sys/block/%s' % rootdev_base
        link = self.run(command=link_cmd, ignore_status=True)
        if link.exit_status:
            logging.info("Fail to run %s", link_cmd)
            return None
        if 'usb' in link.stdout.strip():
            # A usb-attached disk is not reported as internal storage.
            return None

        # Read rotation to determine if the internal device is ssd or hdd.
        rotate_cmd = 'cat /sys/block/%s/queue/rotational' % rootdev_base
        rotate = self.run(command=rotate_cmd, ignore_status=True)
        if rotate.exit_status:
            logging.info("Fail to run %s", rotate_cmd)
            return None

        # Any value other than '0' or '1' yields None.
        rotate_dict = {'0': 'storage:ssd', '1': 'storage:hdd'}
        return rotate_dict.get(rotate.stdout.strip())

    # All other internal device / error case will always fall here
    return None
2660
2661
@label_decorator('servo')
def get_servo(self):
    """Report the 'servo' label when this host has a servo host set.

    The decision is based solely on the truthiness of self._servo_host.

    @return: The string 'servo' when self._servo_host is truthy, otherwise
             None.
    """
    if self._servo_host:
        return 'servo'
    return None
2672
2673
@label_decorator('video_labels')
def get_video_labels(self):
    """Run /usr/local/bin/avtest_label_detect to get a list of video labels.

    Sample output of avtest_label_detect:
    Detected label: hw_video_acc_vp8
    Detected label: webcam

    @return: A list of labels detected by tool avtest_label_detect; an
             empty list if running the tool raises AutoservRunError.
    """
    # Only the remote command can raise AutoservRunError, so keep the
    # parsing outside of the try body.
    try:
        result = self.run('/usr/local/bin/avtest_label_detect').stdout
    except error.AutoservRunError:
        # Most likely the tool is not installed.
        return []
    # Raw string so that `\w` reaches the regex engine untouched.
    return re.findall(r'^Detected label: (\w+)$', result, re.M)
2690
2691
@label_decorator('video_glitch_detection')
def is_video_glitch_detection_supported(self):
    """Determine if a board under test is supported for video glitch
    detection tests.

    A board is considered supported when its name, with
    ds_constants.BOARD_PREFIX removed, is a section of
    client/cros/video/device_spec.conf.

    @return: 'video_glitch_detection' if board is supported, None otherwise
             (including when the conf file cannot be parsed).
    """
    parser = ConfigParser.SafeConfigParser()
    filename = os.path.join(
            common.autotest_dir, 'client/cros/video/device_spec.conf')

    dut = self.get_board().replace(ds_constants.BOARD_PREFIX, '')

    try:
        parser.read(filename)
    except ConfigParser.Error:
        # ConfigParser.Error is the base class of the module's exceptions;
        # the module has no lowercase `error` attribute.
        # Something went wrong while parsing the conf file.
        return None

    supported_boards = parser.sections()
    return 'video_glitch_detection' if dut in supported_boards else None
2714
@label_decorator('touch_labels')
def get_touch(self):
    """
    Determine whether board under test has a touchpad or touchscreen.

    Each /dev/input/event* node is dumped with evtest into a scratch file
    on the host, and the dump is classified with
    InputPlayback._determine_input_type.

    @return: A list of some combination of 'touchscreen' and 'touchpad',
             depending on what is present on the device.

    """
    labels = []
    looking_for = ['touchpad', 'touchscreen']
    player = input_playback.InputPlayback()
    input_events = self.run('ls /dev/input/event*').stdout.strip().split()
    filename = '/tmp/touch_labels'
    try:
        for event in input_events:
            # NOTE(review): presumably evtest does not exit on its own,
            # hence the one second timeout that is deliberately ignored.
            self.run('evtest %s > %s' % (event, filename), timeout=1,
                     ignore_timeout=True)
            properties = self.run('cat %s' % filename).stdout
            input_type = player._determine_input_type(properties)
            if input_type in looking_for:
                labels.append(input_type)
                looking_for.remove(input_type)
                # Stop as soon as both kinds of device have been found.
                if not looking_for:
                    break
    finally:
        # Best-effort cleanup: runs even if probing raised, and tolerates
        # the scratch file never having been created.
        self.run('rm -f %s' % filename, ignore_status=True)

    return labels
2742
def get_labels(self):
    """Return a list of labels for this given host.

    This is the main way to retrieve all the automatic labels for a host
    as it will run through all the currently implemented label functions.

    Each function in self._LABEL_FUNCTIONS is called with this host. A
    function may return a single label string, a list of labels, or a
    falsy value for "no label". A function that raises is logged and
    skipped so that one failing detector does not lose the other labels.

    @return: A flat list of all labels produced by the label functions.
    """
    labels = []
    for label_function in self._LABEL_FUNCTIONS:
        try:
            label = label_function(self)
        except Exception as e:
            logging.error('Label function %s failed; ignoring it.',
                          label_function.__name__)
            logging.exception(e)
            label = None
        if not label:
            continue
        # isinstance rather than an exact type match, so that subclasses
        # of str and list are not silently dropped.
        if isinstance(label, str):
            labels.append(label)
        elif isinstance(label, list):
            labels.extend(label)
    return labels
Dan Shi85276d42014-04-08 22:11:45 -07002764
2765
def is_boot_from_usb(self):
    """Report whether the DUT's root device is flagged as removable.

    Asks `rootdev -s -d` for the root device, then reads the `removable`
    attribute of that device under /sys/block.

    @return: True if the `removable` attribute reads as 1, False otherwise.
    """
    root_device = self.run('rootdev -s -d').stdout.strip()
    block_name = os.path.basename(root_device)
    removable_flag = self.run(
            'cat /sys/block/%s/removable' % block_name).stdout.strip()
    return int(removable_flag) == 1
Helen Zhang17dae2b2014-11-11 09:25:52 -08002775
2776
def read_from_meminfo(self, key):
    """Look up a value in /proc/meminfo on the host.

    Greps /proc/meminfo for `key` and parses the first run of digits found
    in the output.

    @param key: meminfo requested; used verbatim as the grep pattern.

    @return the first number in the matching output, as an int.

    """
    grep_cmd = 'grep %s /proc/meminfo' % key
    matched_text = self.run(grep_cmd).stdout.strip()
    logging.debug('%s', matched_text)
    first_number = re.search(r'\d+', matched_text)
    return int(first_number.group(0))