blob: 806fc2e5f509e5f61e392ae7d40fde009862a3af [file] [log] [blame]
J. Richard Barnette24adbf42012-04-11 15:04:53 -07001# Copyright (c) 2012 The Chromium OS Authors. All rights reserved.
Dale Curtisaa5eedb2011-08-23 16:18:52 -07002# Use of this source code is governed by a BSD-style license that can be
3# found in the LICENSE file.
4
mussa584b4462014-06-20 15:13:28 -07005import ConfigParser
Aviv Keshet74c89a92013-02-04 15:18:30 -08006import functools
Christopher Wiley0ed712b2013-04-09 15:25:12 -07007import httplib
J. Richard Barnette1d78b012012-05-15 13:56:30 -07008import logging
Dan Shi0f466e82013-02-22 15:44:58 -08009import os
Simran Basid5e5e272012-09-24 15:23:59 -070010import re
Christopher Wileyd78249a2013-03-01 13:05:31 -080011import socket
J. Richard Barnette1d78b012012-05-15 13:56:30 -070012import subprocess
J. Richard Barnette134ec2c2012-04-25 12:59:37 -070013import time
J. Richard Barnette1d78b012012-05-15 13:56:30 -070014import xmlrpclib
J. Richard Barnette134ec2c2012-04-25 12:59:37 -070015
mussa584b4462014-06-20 15:13:28 -070016import common
J. Richard Barnette45e93de2012-04-11 17:24:15 -070017from autotest_lib.client.bin import utils
Richard Barnette0c73ffc2012-11-19 15:21:18 -080018from autotest_lib.client.common_lib import error
19from autotest_lib.client.common_lib import global_config
J. Richard Barnette45e93de2012-04-11 17:24:15 -070020from autotest_lib.client.common_lib.cros import autoupdater
Richard Barnette03a0c132012-11-05 12:40:35 -080021from autotest_lib.client.common_lib.cros import dev_server
Christopher Wileyd78249a2013-03-01 13:05:31 -080022from autotest_lib.client.common_lib.cros import retry
Michael Liangda8c60a2014-06-03 13:24:51 -070023from autotest_lib.client.common_lib.cros.graphite import stats
Richard Barnette82c35912012-11-20 10:09:10 -080024from autotest_lib.client.cros import constants
J. Richard Barnette84890bd2014-02-21 11:05:47 -080025from autotest_lib.client.cros import cros_ui
J. Richard Barnette45e93de2012-04-11 17:24:15 -070026from autotest_lib.server import autoserv_parser
Dan Shia1ecd5c2013-06-06 11:21:31 -070027from autotest_lib.server import utils as server_utils
Scott Zawalski89c44dd2013-02-26 09:28:02 -050028from autotest_lib.server.cros.dynamic_suite import constants as ds_constants
Simran Basi5e6339a2013-03-21 11:34:32 -070029from autotest_lib.server.cros.dynamic_suite import tools, frontend_wrappers
Fang Deng96667ca2013-08-01 17:46:18 -070030from autotest_lib.server.hosts import abstract_ssh
Tom Wai-Hong Tamefe1c7f2014-01-02 14:00:11 +080031from autotest_lib.server.hosts import chameleon_host
Fang Deng5d518f42013-08-02 14:04:32 -070032from autotest_lib.server.hosts import servo_host
Simran Basidcff4252012-11-20 16:13:20 -080033from autotest_lib.site_utils.rpm_control_system import rpm_client
Simran Basid5e5e272012-09-24 15:23:59 -070034
35
beeps32a63082013-08-22 14:02:29 -070036try:
37 import jsonrpclib
38except ImportError:
39 jsonrpclib = None
Fang Deng96667ca2013-08-01 17:46:18 -070040
Fang Dengd1c2b732013-08-20 12:59:46 -070041
class FactoryImageCheckerException(error.AutoservError):
    """Signals that the image being inspected is a factory image."""
45
46
def add_label_detector(label_function_list, label_list=None, label=None):
    """Build a decorator that registers a function as a label detector.

    @param label_function_list: List that every decorated function is
                                appended to.
    @param label_list: Optional list that collects the labels which can
                       be detected. (Default: None)
    @param label: Label string detected by the decorated function; it is
                  recorded in `label_list` only when both are supplied.
                  (Default: None)
    @returns: A decorator that hands back the decorated function unchanged.
    """
    def add_func(func):
        """Register `func` and, when configured, its label.

        @param func: The function to be added as a detector.
        @returns: `func` itself, so the decorated name stays usable.
        """
        label_function_list.append(func)
        # Nothing more to record without both a label and a list for it.
        if not label or label_list is None:
            return func
        label_list.append(label)
        return func

    return add_func
65
66
class CrosHost(abstract_ssh.AbstractSSHHost):
    """Chromium OS specific subclass of Host."""

    # Both objects below are created once, when the class body is executed,
    # and are shared by every CrosHost instance.
    _parser = autoserv_parser.autoserv_parser
    _AFE = frontend_wrappers.RetryingAFE(timeout_min=5, delay_sec=10)

    # Timeout values (in seconds) associated with various Chrome OS
    # state changes.
    #
    # In general, a good rule of thumb is that the timeout can be up
    # to twice the typical measured value on the slowest platform.
    # The times here have not necessarily been empirically tested to
    # meet this criterion.
    #
    # SLEEP_TIMEOUT:  Time to allow for suspend to memory.
    # RESUME_TIMEOUT: Time to allow for resume after suspend, plus
    #   time to restart the network.
    # SHUTDOWN_TIMEOUT: Time to allow for shut down.
    # BOOT_TIMEOUT: Time to allow for boot from power off.  Among
    #   other things, this must account for the 30 second dev-mode
    #   screen delay and time to start the network.
    # USB_BOOT_TIMEOUT: Time to allow for boot from a USB device,
    #   including the 30 second dev-mode delay and time to start the
    #   network.
    # INSTALL_TIMEOUT: Time to allow for chromeos-install.
    # POWERWASH_BOOT_TIMEOUT: Time to allow for a reboot that
    #   includes powerwash.

    SLEEP_TIMEOUT = 2
    RESUME_TIMEOUT = 10
    SHUTDOWN_TIMEOUT = 5
    BOOT_TIMEOUT = 60
    USB_BOOT_TIMEOUT = 150
    INSTALL_TIMEOUT = 240
    POWERWASH_BOOT_TIMEOUT = 60

    # REBOOT_TIMEOUT: How long to wait for a reboot.
    #
    # We have a long timeout to ensure we don't flakily fail due to other
    # issues. Shorter timeouts are vetted in platform_RebootAfterUpdate.
    # TODO(sbasi - crbug.com/276094) Restore to 5 mins once the 'host did not
    # return from reboot' bug is solved.
    REBOOT_TIMEOUT = 480

    # _USB_POWER_TIMEOUT: Time to allow for USB to power toggle ON and OFF.
    # _POWER_CYCLE_TIMEOUT: Time to allow for manual power cycle.
    _USB_POWER_TIMEOUT = 5
    _POWER_CYCLE_TIMEOUT = 10

    # URL template for an RPC proxy; the %d placeholder takes a port number.
    _RPC_PROXY_URL = 'http://localhost:%d'
    _RPC_SHUTDOWN_POLLING_PERIOD_SECONDS = 2
    # Set shutdown timeout to account for the time for restarting the UI.
    _RPC_SHUTDOWN_TIMEOUT_SECONDS = cros_ui.RESTART_UI_TIMEOUT

    # The 'rpm_recovery_boards' value of the CROS config section is read as
    # a string and split on commas into a list.
    _RPM_RECOVERY_BOARDS = global_config.global_config.get_config_value('CROS',
            'rpm_recovery_boards', type=str).split(',')

    _MAX_POWER_CYCLE_ATTEMPTS = 6
    # Marker file touched by _post_update_processing() after an update.
    _LAB_MACHINE_FILE = '/mnt/stateful_partition/.labmachine'
    _RPM_HOSTNAME_REGEX = ('chromeos[0-9]+(-row[0-9]+)?-rack[0-9]+[a-z]*-'
                           'host[0-9]+')
    _LIGHTSENSOR_FILES = ['in_illuminance0_input',
                          'in_illuminance0_raw',
                          'illuminance0_input']
    _LIGHTSENSOR_SEARCH_DIR = '/sys/bus/iio/devices'
    # label_decorator is add_label_detector() with its first two arguments
    # pre-bound to the two lists below, so decorated functions are appended
    # to _LABEL_FUNCTIONS and their labels to _DETECTABLE_LABELS.
    _LABEL_FUNCTIONS = []
    _DETECTABLE_LABELS = []
    label_decorator = functools.partial(add_label_detector, _LABEL_FUNCTIONS,
                                        _DETECTABLE_LABELS)

    # Constants used in ping_wait_up() and ping_wait_down().
    #
    # _PING_WAIT_COUNT is the approximate number of polling
    # cycles to use when waiting for a host state change.
    #
    # _PING_STATUS_DOWN and _PING_STATUS_UP are names used
    # for arguments to the internal _ping_wait_for_status()
    # method.
    _PING_WAIT_COUNT = 40
    _PING_STATUS_DOWN = False
    _PING_STATUS_UP = True

    # Allowed values for the power_method argument.

    # POWER_CONTROL_RPM: Passed as default arg for power_off/on/cycle() methods.
    # POWER_CONTROL_SERVO: Used in set_power() and power_cycle() methods.
    # POWER_CONTROL_MANUAL: Used in set_power() and power_cycle() methods.
    POWER_CONTROL_RPM = 'RPM'
    # NOTE(review): the value is 'servoj10', not 'servo' -- confirm that
    # callers rely on the constant rather than on a literal string.
    POWER_CONTROL_SERVO = 'servoj10'
    POWER_CONTROL_MANUAL = 'manual'

    POWER_CONTROL_VALID_ARGS = (POWER_CONTROL_RPM,
                                POWER_CONTROL_SERVO,
                                POWER_CONTROL_MANUAL)

    _RPM_OUTLET_CHANGED = 'outlet_changed'
163
beeps687243d2013-07-18 15:29:27 -0700164
J. Richard Barnette964fba02012-10-24 17:34:29 -0700165 @staticmethod
beeps46dadc92013-11-07 14:07:10 -0800166 def check_host(host, timeout=10):
167 """
168 Check if the given host is a chrome-os host.
169
170 @param host: An ssh host representing a device.
171 @param timeout: The timeout for the run command.
172
173 @return: True if the host device is chromeos.
174
beeps46dadc92013-11-07 14:07:10 -0800175 """
176 try:
Christopher Wiley1ea80942014-02-26 16:45:08 -0800177 result = host.run('grep -q CHROMEOS /etc/lsb-release && '
178 '! which adb >/dev/null 2>&1',
Christopher Wileyfc3eac02013-11-21 16:24:57 -0800179 ignore_status=True, timeout=timeout)
beeps46dadc92013-11-07 14:07:10 -0800180 except (error.AutoservRunError, error.AutoservSSHTimeout):
181 return False
182 return result.exit_status == 0
183
184
185 @staticmethod
Tom Wai-Hong Tamefe1c7f2014-01-02 14:00:11 +0800186 def _extract_arguments(args_dict, key_subset):
187 """Extract options from `args_dict` and return a subset result.
J. Richard Barnette7214e0b2013-02-06 15:20:49 -0800188
189 Take the provided dictionary of argument options and return
Tom Wai-Hong Tamefe1c7f2014-01-02 14:00:11 +0800190 a subset that represent standard arguments needed to construct
191 a test-assistant object (chameleon or servo) for a host. The
192 intent is to provide standard argument processing from
193 run_remote_tests for tests that require a test-assistant board
194 to operate.
195
196 @param args_dict Dictionary from which to extract the arguments.
197 @param key_subset Tuple of keys to extract from the args_dict, e.g.
198 ('servo_host', 'servo_port').
199 """
200 result = {}
201 for arg in key_subset:
202 if arg in args_dict:
203 result[arg] = args_dict[arg]
204 return result
205
206
207 @staticmethod
208 def get_chameleon_arguments(args_dict):
209 """Extract chameleon options from `args_dict` and return the result.
210
211 Recommended usage:
212 ~~~~~~~~
213 args_dict = utils.args_to_dict(args)
214 chameleon_args = hosts.CrosHost.get_chameleon_arguments(args_dict)
215 host = hosts.create_host(machine, chameleon_args=chameleon_args)
216 ~~~~~~~~
217
218 @param args_dict Dictionary from which to extract the chameleon
219 arguments.
220 """
221 return CrosHost._extract_arguments(
222 args_dict, ('chameleon_host', 'chameleon_port'))
223
224
225 @staticmethod
226 def get_servo_arguments(args_dict):
227 """Extract servo options from `args_dict` and return the result.
J. Richard Barnette7214e0b2013-02-06 15:20:49 -0800228
229 Recommended usage:
230 ~~~~~~~~
231 args_dict = utils.args_to_dict(args)
Fang Deng0ca40e22013-08-27 17:47:44 -0700232 servo_args = hosts.CrosHost.get_servo_arguments(args_dict)
J. Richard Barnette7214e0b2013-02-06 15:20:49 -0800233 host = hosts.create_host(machine, servo_args=servo_args)
234 ~~~~~~~~
235
236 @param args_dict Dictionary from which to extract the servo
237 arguments.
238 """
Tom Wai-Hong Tamefe1c7f2014-01-02 14:00:11 +0800239 return CrosHost._extract_arguments(
240 args_dict, ('servo_host', 'servo_port'))
J. Richard Barnette134ec2c2012-04-25 12:59:37 -0700241
J. Richard Barnette964fba02012-10-24 17:34:29 -0700242
Tom Wai-Hong Tamefe1c7f2014-01-02 14:00:11 +0800243 def _initialize(self, hostname, chameleon_args=None, servo_args=None,
244 ssh_verbosity_flag='', ssh_options='',
Fang Dengd1c2b732013-08-20 12:59:46 -0700245 *args, **dargs):
Tom Wai-Hong Tamefe1c7f2014-01-02 14:00:11 +0800246 """Initialize superclasses, |self.chameleon|, and |self.servo|.
J. Richard Barnette67ccb872012-04-19 16:34:56 -0700247
Tom Wai-Hong Tamefe1c7f2014-01-02 14:00:11 +0800248 This method checks whether a chameleon/servo (aka
249 test-assistant objects) is required by checking whether
250 chameleon_args/servo_args is None. This method will only
251 attempt to create the test-assistant object when it is
252 required by the test.
Fang Deng5d518f42013-08-02 14:04:32 -0700253
Tom Wai-Hong Tamefe1c7f2014-01-02 14:00:11 +0800254 For creating the test-assistant object, there are three
255 possibilities: First, if the host is a lab system known to have
256 a test-assistant board, we connect to that board unconditionally.
J. Richard Barnette67ccb872012-04-19 16:34:56 -0700257 Second, if we're called from a control file that requires
Tom Wai-Hong Tamefe1c7f2014-01-02 14:00:11 +0800258 test-assistant features for testing, it will pass settings from
259 the arguments, like `servo_host`, `servo_port`. If neither of
260 these cases apply, the test-assistant object will be `None`.
J. Richard Barnette67ccb872012-04-19 16:34:56 -0700261
262 """
Fang Deng0ca40e22013-08-27 17:47:44 -0700263 super(CrosHost, self)._initialize(hostname=hostname,
J. Richard Barnette45e93de2012-04-11 17:24:15 -0700264 *args, **dargs)
J. Richard Barnettef0859852012-08-20 14:55:50 -0700265 # self.env is a dictionary of environment variable settings
266 # to be exported for commands run on the host.
267 # LIBC_FATAL_STDERR_ can be useful for diagnosing certain
268 # errors that might happen.
269 self.env['LIBC_FATAL_STDERR_'] = '1'
beeps32a63082013-08-22 14:02:29 -0700270 self._rpc_proxy_map = {}
Fang Dengd1c2b732013-08-20 12:59:46 -0700271 self._ssh_verbosity_flag = ssh_verbosity_flag
Aviv Keshetc5947fa2013-09-04 14:06:29 -0700272 self._ssh_options = ssh_options
Fang Deng5d518f42013-08-02 14:04:32 -0700273 # TODO(fdeng): We need to simplify the
274 # process of servo and servo_host initialization.
275 # crbug.com/298432
Dan Shi4d478522014-02-14 13:46:32 -0800276 self._servo_host = servo_host.create_servo_host(dut=self.hostname,
277 servo_args=servo_args)
Tom Wai-Hong Tamefe1c7f2014-01-02 14:00:11 +0800278 # TODO(waihong): Do the simplication on Chameleon too.
Tom Wai-Hong Tam3d6790d2014-04-14 16:15:47 +0800279 self._chameleon_host = chameleon_host.create_chameleon_host(
280 dut=self.hostname, chameleon_args=chameleon_args)
281
Dan Shi4d478522014-02-14 13:46:32 -0800282 if self._servo_host is not None:
283 self.servo = self._servo_host.get_servo()
284 else:
285 self.servo = None
286
Tom Wai-Hong Tam3d6790d2014-04-14 16:15:47 +0800287 if self._chameleon_host:
Tom Wai-Hong Tameaee3402014-01-22 08:52:10 +0800288 self.chameleon = self._chameleon_host.create_chameleon_board()
Tom Wai-Hong Tamefe1c7f2014-01-02 14:00:11 +0800289 else:
Tom Wai-Hong Tam3d6790d2014-04-14 16:15:47 +0800290 self.chameleon = None
Fang Deng5d518f42013-08-02 14:04:32 -0700291
292
Scott Zawalski89c44dd2013-02-26 09:28:02 -0500293 def get_repair_image_name(self):
294 """Generate a image_name from variables in the global config.
295
296 @returns a str of $board-version/$BUILD.
297
298 """
299 stable_version = global_config.global_config.get_config_value(
300 'CROS', 'stable_cros_version')
301 build_pattern = global_config.global_config.get_config_value(
302 'CROS', 'stable_build_pattern')
303 board = self._get_board_from_afe()
304 if board is None:
305 raise error.AutoservError('DUT has no board attribute, '
306 'cannot be repaired.')
307 return build_pattern % (board, stable_version)
308
309
Scott Zawalski62bacae2013-03-05 10:40:32 -0500310 def _host_in_AFE(self):
311 """Check if the host is an object the AFE knows.
312
313 @returns the host object.
314 """
315 return self._AFE.get_hosts(hostname=self.hostname)
316
317
Chris Sosab76e0ee2013-05-22 16:55:41 -0700318 def lookup_job_repo_url(self):
319 """Looks up the job_repo_url for the host.
320
321 @returns job_repo_url from AFE or None if not found.
322
323 @raises KeyError if the host does not have a job_repo_url
324 """
325 if not self._host_in_AFE():
326 return None
327
328 hosts = self._AFE.get_hosts(hostname=self.hostname)
beepsb5efc532013-06-04 11:29:34 -0700329 if hosts and ds_constants.JOB_REPO_URL in hosts[0].attributes:
330 return hosts[0].attributes[ds_constants.JOB_REPO_URL]
Chris Sosab76e0ee2013-05-22 16:55:41 -0700331
332
Scott Zawalski89c44dd2013-02-26 09:28:02 -0500333 def clear_cros_version_labels_and_job_repo_url(self):
334 """Clear cros_version labels and host attribute job_repo_url."""
Scott Zawalski62bacae2013-03-05 10:40:32 -0500335 if not self._host_in_AFE():
Scott Zawalskieadbf702013-03-14 09:23:06 -0400336 return
337
Scott Zawalski62bacae2013-03-05 10:40:32 -0500338 host_list = [self.hostname]
339 labels = self._AFE.get_labels(
340 name__startswith=ds_constants.VERSION_PREFIX,
341 host__hostname=self.hostname)
Dan Shi0f466e82013-02-22 15:44:58 -0800342
Scott Zawalski62bacae2013-03-05 10:40:32 -0500343 for label in labels:
344 label.remove_hosts(hosts=host_list)
Scott Zawalski89c44dd2013-02-26 09:28:02 -0500345
beepscb6f1e22013-06-28 19:14:10 -0700346 self.update_job_repo_url(None, None)
347
348
349 def update_job_repo_url(self, devserver_url, image_name):
350 """
351 Updates the job_repo_url host attribute and asserts it's value.
352
353 @param devserver_url: The devserver to use in the job_repo_url.
354 @param image_name: The name of the image to use in the job_repo_url.
355
356 @raises AutoservError: If we failed to update the job_repo_url.
357 """
358 repo_url = None
359 if devserver_url and image_name:
360 repo_url = tools.get_package_url(devserver_url, image_name)
361 self._AFE.set_host_attribute(ds_constants.JOB_REPO_URL, repo_url,
Scott Zawalski62bacae2013-03-05 10:40:32 -0500362 hostname=self.hostname)
beepscb6f1e22013-06-28 19:14:10 -0700363 if self.lookup_job_repo_url() != repo_url:
364 raise error.AutoservError('Failed to update job_repo_url with %s, '
365 'host %s' % (repo_url, self.hostname))
Scott Zawalski89c44dd2013-02-26 09:28:02 -0500366
367
Dan Shie9309262013-06-19 22:50:21 -0700368 def add_cros_version_labels_and_job_repo_url(self, image_name):
Scott Zawalskieadbf702013-03-14 09:23:06 -0400369 """Add cros_version labels and host attribute job_repo_url.
370
371 @param image_name: The name of the image e.g.
372 lumpy-release/R27-3837.0.0
Dan Shi7458bf62013-06-10 12:50:16 -0700373
Scott Zawalskieadbf702013-03-14 09:23:06 -0400374 """
Scott Zawalski62bacae2013-03-05 10:40:32 -0500375 if not self._host_in_AFE():
Scott Zawalskieadbf702013-03-14 09:23:06 -0400376 return
Scott Zawalski62bacae2013-03-05 10:40:32 -0500377
Scott Zawalskieadbf702013-03-14 09:23:06 -0400378 cros_label = '%s%s' % (ds_constants.VERSION_PREFIX, image_name)
Dan Shie9309262013-06-19 22:50:21 -0700379 devserver_url = dev_server.ImageServer.resolve(image_name).url()
Scott Zawalski62bacae2013-03-05 10:40:32 -0500380
381 labels = self._AFE.get_labels(name=cros_label)
382 if labels:
383 label = labels[0]
384 else:
385 label = self._AFE.create_label(name=cros_label)
386
387 label.add_hosts([self.hostname])
beepscb6f1e22013-06-28 19:14:10 -0700388 self.update_job_repo_url(devserver_url, image_name)
389
390
beepsdae65fd2013-07-26 16:24:41 -0700391 def verify_job_repo_url(self, tag=''):
beepscb6f1e22013-06-28 19:14:10 -0700392 """
393 Make sure job_repo_url of this host is valid.
394
joychen03eaad92013-06-26 09:55:21 -0700395 Eg: The job_repo_url "http://lmn.cd.ab.xyx:8080/static/\
beepscb6f1e22013-06-28 19:14:10 -0700396 lumpy-release/R29-4279.0.0/autotest/packages" claims to have the
397 autotest package for lumpy-release/R29-4279.0.0. If this isn't the case,
398 download and extract it. If the devserver embedded in the url is
399 unresponsive, update the job_repo_url of the host after staging it on
400 another devserver.
401
402 @param job_repo_url: A url pointing to the devserver where the autotest
403 package for this build should be staged.
beepsdae65fd2013-07-26 16:24:41 -0700404 @param tag: The tag from the server job, in the format
405 <job_id>-<user>/<hostname>, or <hostless> for a server job.
beepscb6f1e22013-06-28 19:14:10 -0700406
407 @raises DevServerException: If we could not resolve a devserver.
408 @raises AutoservError: If we're unable to save the new job_repo_url as
409 a result of choosing a new devserver because the old one failed to
410 respond to a health check.
beeps0c865032013-07-30 11:37:06 -0700411 @raises urllib2.URLError: If the devserver embedded in job_repo_url
412 doesn't respond within the timeout.
beepscb6f1e22013-06-28 19:14:10 -0700413 """
414 job_repo_url = self.lookup_job_repo_url()
415 if not job_repo_url:
416 logging.warning('No job repo url set on host %s', self.hostname)
417 return
418
419 logging.info('Verifying job repo url %s', job_repo_url)
420 devserver_url, image_name = tools.get_devserver_build_from_package_url(
421 job_repo_url)
422
beeps0c865032013-07-30 11:37:06 -0700423 ds = dev_server.ImageServer(devserver_url)
beepscb6f1e22013-06-28 19:14:10 -0700424
425 logging.info('Staging autotest artifacts for %s on devserver %s',
426 image_name, ds.url())
beeps687243d2013-07-18 15:29:27 -0700427
428 start_time = time.time()
beepscb6f1e22013-06-28 19:14:10 -0700429 ds.stage_artifacts(image_name, ['autotest'])
beeps687243d2013-07-18 15:29:27 -0700430 stage_time = time.time() - start_time
431
432 # Record how much of the verification time comes from a devserver
433 # restage. If we're doing things right we should not see multiple
434 # devservers for a given board/build/branch path.
435 try:
J. Richard Barnette3cbd76b2013-11-27 12:11:25 -0800436 board, build_type, branch = server_utils.ParseBuildName(
beeps687243d2013-07-18 15:29:27 -0700437 image_name)[:3]
J. Richard Barnette3cbd76b2013-11-27 12:11:25 -0800438 except server_utils.ParseBuildNameException:
beeps687243d2013-07-18 15:29:27 -0700439 pass
440 else:
beeps0c865032013-07-30 11:37:06 -0700441 devserver = devserver_url[
Chris Sosa65425082013-10-16 13:26:22 -0700442 devserver_url.find('/') + 2:devserver_url.rfind(':')]
beeps687243d2013-07-18 15:29:27 -0700443 stats_key = {
444 'board': board,
445 'build_type': build_type,
446 'branch': branch,
beeps0c865032013-07-30 11:37:06 -0700447 'devserver': devserver.replace('.', '_'),
beeps687243d2013-07-18 15:29:27 -0700448 }
449 stats.Gauge('verify_job_repo_url').send(
450 '%(board)s.%(build_type)s.%(branch)s.%(devserver)s' % stats_key,
451 stage_time)
beepscb6f1e22013-06-28 19:14:10 -0700452
Scott Zawalskieadbf702013-03-14 09:23:06 -0400453
Dan Shi0f466e82013-02-22 15:44:58 -0800454 def _try_stateful_update(self, update_url, force_update, updater):
455 """Try to use stateful update to initialize DUT.
456
457 When DUT is already running the same version that machine_install
458 tries to install, stateful update is a much faster way to clean up
459 the DUT for testing, compared to a full reimage. It is implemeted
460 by calling autoupdater.run_update, but skipping updating root, as
461 updating the kernel is time consuming and not necessary.
462
463 @param update_url: url of the image.
464 @param force_update: Set to True to update the image even if the DUT
465 is running the same version.
466 @param updater: ChromiumOSUpdater instance used to update the DUT.
467 @returns: True if the DUT was updated with stateful update.
468
469 """
J. Richard Barnette3f731032014-04-07 17:42:59 -0700470 # TODO(jrbarnette): Yes, I hate this re.match() test case.
471 # It's better than the alternative: see crbug.com/360944.
472 image_name = autoupdater.url_to_image_name(update_url)
473 release_pattern = r'^.*-release/R[0-9]+-[0-9]+\.[0-9]+\.0$'
474 if not re.match(release_pattern, image_name):
475 return False
Dan Shi0f466e82013-02-22 15:44:58 -0800476 if not updater.check_version():
477 return False
478 if not force_update:
479 logging.info('Canceling stateful update because the new and '
480 'old versions are the same.')
481 return False
482 # Following folders should be rebuilt after stateful update.
483 # A test file is used to confirm each folder gets rebuilt after
484 # the stateful update.
485 folders_to_check = ['/var', '/home', '/mnt/stateful_partition']
486 test_file = '.test_file_to_be_deleted'
487 for folder in folders_to_check:
488 touch_path = os.path.join(folder, test_file)
489 self.run('touch %s' % touch_path)
490
491 if not updater.run_update(force_update=True, update_root=False):
492 return False
493
494 # Reboot to complete stateful update.
Chris Sosab76e0ee2013-05-22 16:55:41 -0700495 self.reboot(timeout=self.REBOOT_TIMEOUT, wait=True)
Dan Shi0f466e82013-02-22 15:44:58 -0800496 check_file_cmd = 'test -f %s; echo $?'
497 for folder in folders_to_check:
498 test_file_path = os.path.join(folder, test_file)
499 result = self.run(check_file_cmd % test_file_path,
500 ignore_status=True)
501 if result.exit_status == 1:
502 return False
503 return True
504
505
J. Richard Barnette7275b612013-06-04 18:13:11 -0700506 def _post_update_processing(self, updater, expected_kernel=None):
Dan Shi0f466e82013-02-22 15:44:58 -0800507 """After the DUT is updated, confirm machine_install succeeded.
508
509 @param updater: ChromiumOSUpdater instance used to update the DUT.
J. Richard Barnette7275b612013-06-04 18:13:11 -0700510 @param expected_kernel: kernel expected to be active after reboot,
511 or `None` to skip rollback checking.
Dan Shi0f466e82013-02-22 15:44:58 -0800512
513 """
J. Richard Barnette7275b612013-06-04 18:13:11 -0700514 # Touch the lab machine file to leave a marker that
515 # distinguishes this image from other test images.
516 # Afterwards, we must re-run the autoreboot script because
517 # it depends on the _LAB_MACHINE_FILE.
Dan Shi0f466e82013-02-22 15:44:58 -0800518 self.run('touch %s' % self._LAB_MACHINE_FILE)
Dan Shi0f466e82013-02-22 15:44:58 -0800519 self.run('start autoreboot')
Chris Sosa65425082013-10-16 13:26:22 -0700520 updater.verify_boot_expectations(
521 expected_kernel, rollback_message=
522 'Build %s failed to boot on %s; system rolled back to previous'
523 'build' % (updater.update_version, self.hostname))
J. Richard Barnette7275b612013-06-04 18:13:11 -0700524 # Check that we've got the build we meant to install.
525 if not updater.check_version_to_confirm_install():
526 raise autoupdater.ChromiumOSError(
527 'Failed to update %s to build %s; found build '
528 '%s instead' % (self.hostname,
Chris Sosa65425082013-10-16 13:26:22 -0700529 updater.update_version,
530 updater.get_build_id()))
Dan Shi0f466e82013-02-22 15:44:58 -0800531
532
J. Richard Barnettee4af8b92013-05-01 13:16:12 -0700533 def _stage_image_for_update(self, image_name=None):
Scott Zawalskieadbf702013-03-14 09:23:06 -0400534 """Stage a build on a devserver and return the update_url.
535
536 @param image_name: a name like lumpy-release/R27-3837.0.0
537 @returns an update URL like:
538 http://172.22.50.205:8082/update/lumpy-release/R27-3837.0.0
539 """
J. Richard Barnettee4af8b92013-05-01 13:16:12 -0700540 if not image_name:
541 image_name = self.get_repair_image_name()
542 logging.info('Staging build for AU: %s', image_name)
Scott Zawalskieadbf702013-03-14 09:23:06 -0400543 devserver = dev_server.ImageServer.resolve(image_name)
544 devserver.trigger_download(image_name, synchronous=False)
545 return tools.image_url_pattern() % (devserver.url(), image_name)
546
547
J. Richard Barnettee4af8b92013-05-01 13:16:12 -0700548 def stage_image_for_servo(self, image_name=None):
549 """Stage a build on a devserver and return the update_url.
550
551 @param image_name: a name like lumpy-release/R27-3837.0.0
552 @returns an update URL like:
553 http://172.22.50.205:8082/update/lumpy-release/R27-3837.0.0
554 """
555 if not image_name:
556 image_name = self.get_repair_image_name()
557 logging.info('Staging build for servo install: %s', image_name)
558 devserver = dev_server.ImageServer.resolve(image_name)
559 devserver.stage_artifacts(image_name, ['test_image'])
560 return devserver.get_test_image_url(image_name)
561
562
beepse539be02013-07-31 21:57:39 -0700563 def stage_factory_image_for_servo(self, image_name):
564 """Stage a build on a devserver and return the update_url.
565
566 @param image_name: a name like <baord>/4262.204.0
beeps12c0a3c2013-09-03 11:58:27 -0700567
beepse539be02013-07-31 21:57:39 -0700568 @return: An update URL, eg:
569 http://<devserver>/static/canary-channel/\
570 <board>/4262.204.0/factory_test/chromiumos_factory_image.bin
beeps12c0a3c2013-09-03 11:58:27 -0700571
572 @raises: ValueError if the factory artifact name is missing from
573 the config.
574
beepse539be02013-07-31 21:57:39 -0700575 """
576 if not image_name:
577 logging.error('Need an image_name to stage a factory image.')
578 return
579
beeps12c0a3c2013-09-03 11:58:27 -0700580 factory_artifact = global_config.global_config.get_config_value(
581 'CROS', 'factory_artifact', type=str, default='')
582 if not factory_artifact:
583 raise ValueError('Cannot retrieve the factory artifact name from '
584 'autotest config, and hence cannot stage factory '
585 'artifacts.')
586
beepse539be02013-07-31 21:57:39 -0700587 logging.info('Staging build for servo install: %s', image_name)
588 devserver = dev_server.ImageServer.resolve(image_name)
589 devserver.stage_artifacts(
590 image_name,
beeps12c0a3c2013-09-03 11:58:27 -0700591 [factory_artifact],
592 archive_url=None)
beepse539be02013-07-31 21:57:39 -0700593
594 return tools.factory_image_url_pattern() % (devserver.url(), image_name)
595
596
def machine_install(self, update_url=None, force_update=False,
                    local_devserver=False, repair=False):
    """Install a build on the DUT.

    A stateful update is tried first: it does not update the kernel and
    tends to be much faster than a full reimage.  If the stateful update
    is not applied, or raises, a full update (kernel included) is run.

    As soon as the updater has been created, the host's cros_version
    labels and its job_repo_url host attribute (used for package install)
    are cleared; they are added back only after a successful update.

    @param update_url: The url to use for the update
            pattern: http://$devserver:###/update/$build
            If update_url is None the image option of the autoserv
            parser is used (staged on a devserver unless it already
            starts with http://).  If that is unset too and repair is
            True, the image chosen by _stage_image_for_update() is
            installed.
    @param force_update: Force an update even if the version installed
            is the same. Default:False
    @param local_devserver: Used by run_remote_test to allow people to
            use their local devserver. Default: False
    @param repair: Whether or not we are in repair mode. This adds special
            cases for repairing a machine like starting update_engine.
            Setting repair to True sets force_update to True as well.
            default: False
    @raises autoupdater.ChromiumOSError

    """
    if update_url:
        logging.debug('update url is set to %s', update_url)
    else:
        logging.debug('update url is not set, resolving...')
        requested_build = self._parser.options.image
        if not requested_build and not repair:
            raise autoupdater.ChromiumOSError(
                    'Update failed. No update URL provided.')

        if requested_build and requested_build.startswith('http://'):
            update_url = requested_build
            logging.debug('update url is retrieved from requested_build'
                          ': %s', update_url)
        else:
            if requested_build:
                # Any build that is not already an http:// url is staged
                # on the devservers defined in global_config.ini.
                update_url = self._stage_image_for_update(requested_build)
            else:
                # Repair mode with no explicit build requested.
                update_url = self._stage_image_for_update()
            logging.debug('Build staged, and update_url is set to: %s',
                          update_url)

    if repair:
        # The system may be in a bad state, so always start from a fresh
        # boot and a freshly restarted update-engine.
        self.reboot(timeout=self.REBOOT_TIMEOUT, wait=True)
        self.run('stop update-engine; start update-engine')
        force_update = True

    updater = autoupdater.ChromiumOSUpdater(
            update_url, host=self, local_devserver=local_devserver)
    updated = False
    # Drop the cros-version labels and job_repo_url attribute up front.
    self.clear_cros_version_labels_and_job_repo_url()

    # Cheap path first: stateful-only update.
    try:
        updated = self._try_stateful_update(
                update_url, force_update, updater)
        if updated:
            logging.info('DUT is updated with stateful update.')
    except Exception as e:
        logging.exception(e)
        logging.warning('Failed to stateful update DUT, force to update.')

    inactive_kernel = None
    if not updated:
        # Full update.  Reboot first in case the system is in a bad state.
        self.reboot(timeout=self.REBOOT_TIMEOUT, wait=True)

        # TODO(sosa): Remove temporary hack to get rid of bricked machines
        # that can't update due to a corrupted policy.
        pre_update_commands = (
                'rm -rf /var/lib/whitelist',
                'touch /var/lib/whitelist',
                'chmod -w /var/lib/whitelist',
                'stop update-engine; start update-engine',
        )
        for command in pre_update_commands:
            self.run(command)

        if updater.run_update(force_update):
            updated = True
            active_kernel, inactive_kernel = updater.get_kernel_state()

            # The freshly written (inactive) kernel must not rank below
            # the currently active one.
            inactive_priority = updater.get_kernel_priority(inactive_kernel)
            active_priority = updater.get_kernel_priority(active_kernel)
            if inactive_priority < active_priority:
                raise autoupdater.ChromiumOSError(
                        'Update failed. The priority of the inactive kernel'
                        ' partition is less than that of the active kernel'
                        ' partition.')

            # Updater has returned successfully; reboot the host.
            self.reboot(timeout=self.REBOOT_TIMEOUT, wait=True)

    if updated:
        self._post_update_processing(updater, inactive_kernel)
        image_name = autoupdater.url_to_image_name(update_url)
        self.add_cros_version_labels_and_job_repo_url(image_name)

    # Clean up any old autotest directories which may be lying around.
    stale_autodirs = global_config.global_config.get_config_value(
            'AUTOSERV', 'client_autodir_paths', type=list)
    for path in stale_autodirs:
        self.run('rm -rf ' + path)
715
716
def show_update_engine_log(self):
    """Dump the update engine log by running `cat` on it on the host."""
    log_path = constants.UPDATE_ENGINE_LOG
    logging.debug('Dumping %s', log_path)
    self.run('cat %s' % log_path)
721
722
def _get_board_from_afe(self):
    """Look up this host's board in its AFE labels.

    The lookup is delegated to server_utils.get_board_from_afe(), which
    is given this host's name and AFE handle.  Per the original contract
    the board comes from a label of the form "board:<board>", and `None`
    is returned unless exactly one such label exists.

    @returns board from label, or `None`.
    """
    board = server_utils.get_board_from_afe(self.hostname, self._AFE)
    return board
Simran Basi833814b2013-01-29 13:13:43 -0800733
734
def get_build(self):
    """Look up the build currently assigned to this host in the AFE.

    The lookup is delegated to server_utils.get_build_from_afe(), which
    is given this host's name and AFE handle.

    @returns The current build or None if it could not find it or if there
             were multiple build labels assigned to this host.
    """
    build = server_utils.get_build_from_afe(self.hostname, self._AFE)
    return build
Richard Barnette82c35912012-11-20 10:09:10 -0800744
745
def _install_repair(self):
    """Attempt to repair this host using update-engine.

    Requires the host to be up; runs machine_install() in repair mode,
    which installs the stable "repair" version of Chrome OS defined in
    the global_config under CROS.stable_cros_version.

    @raises AutoservRepairMethodNA if the DUT is not reachable.
    @raises ChromiumOSError if the install failed for some reason.

    """
    host_reachable = self.is_up()
    if not host_reachable:
        raise error.AutoservRepairMethodNA('DUT unreachable for install.')

    logging.info('Attempting to reimage machine to repair image.')
    try:
        self.machine_install(repair=True)
    except autoupdater.ChromiumOSError as install_error:
        # Record the failure here, then let the caller see the error.
        logging.exception(install_error)
        logging.info('Repair via install failed.')
        raise
Scott Zawalski89c44dd2013-02-26 09:28:02 -0500766
767
def _install_repair_with_powerwash(self):
    """Powerwash the DUT, then repair it through update-engine.

    update-engine may fail due to a bad image. In such case, powerwash
    may help to cleanup the DUT for update-engine to work again.

    @raises AutoservRepairMethodNA if the DUT is not reachable.
    @raises AutoservRepairFailure if the DUT is not up after the
            powerwash reboot.
    @raises ChromiumOSError if the install failed for some reason.

    """
    if not self.is_up():
        raise error.AutoservRepairMethodNA('DUT unreachable for install.')

    logging.info('Attempting to powerwash the DUT.')
    # Writing this reset file requests the powerwash; the reboot that
    # follows is given the (longer) powerwash boot timeout.
    powerwash_request = ('echo "fast safe" > '
                         '/mnt/stateful_partition/factory_install_reset')
    self.run(powerwash_request)
    self.reboot(timeout=self.POWERWASH_BOOT_TIMEOUT, wait=True)

    if self.is_up():
        logging.info('Powerwash succeeded.')
        self._install_repair()
        return

    logging.error('Powerwash failed. DUT did not come back after '
                  'reboot.')
    raise error.AutoservRepairFailure(
            'DUT failed to boot from powerwash after %d seconds' %
            self.POWERWASH_BOOT_TIMEOUT)
794
795
def servo_install(self, image_url=None, usb_boot_timeout=USB_BOOT_TIMEOUT,
                  install_timeout=INSTALL_TIMEOUT):
    """
    Re-install the OS on the DUT by:
    1) installing a test image on a USB storage device attached to the Servo
            board,
    2) booting that image in recovery mode, and then
    3) installing the image with chromeos-install.

    The USB boot and the chromeos-install step are each timed with a
    stats.Timer whose key includes the timeout in use.

    @param image_url: If specified use as the url to install on the DUT.
            otherwise boot the currently staged image on the USB stick.
    @param usb_boot_timeout: The usb_boot_timeout to use during reimage.
            Factory images need a longer usb_boot_timeout than regular
            cros images.
    @param install_timeout: The timeout to use when installing the chromeos
            image. Factory images need a longer install_timeout.

    @raises AutoservRepairFailure if the DUT does not boot from USB.
    @raises AutoservError if the installed image fails to boot.
    """
    # Phase 1: put the image on the USB stick and boot from it.
    usb_timer_key = 'servo_install.usb_boot_timeout_%s' % usb_boot_timeout
    logging.info('Downloading image to USB, then booting from it. Usb boot '
                 'timeout = %s', usb_boot_timeout)
    usb_timer = stats.Timer(usb_timer_key)
    usb_timer.start()
    self.servo.install_recovery_image(image_url)
    booted_from_usb = self.wait_up(timeout=usb_boot_timeout)
    if not booted_from_usb:
        raise error.AutoservRepairFailure(
                'DUT failed to boot from USB after %d seconds' %
                usb_boot_timeout)
    usb_timer.stop()

    # Phase 2: install from the USB image onto the DUT.
    install_timer_key = 'servo_install.install_timeout_%s' % install_timeout
    install_timer = stats.Timer(install_timer_key)
    install_timer.start()
    logging.info('Installing image through chromeos-install.')
    self.run('chromeos-install --yes', timeout=install_timeout)
    install_timer.stop()

    # Phase 3: power cycle into the freshly installed image.
    logging.info('Power cycling DUT through servo.')
    self.servo.power_long_press()
    self.servo.switch_usbkey('off')
    # We *must* use power_on() here; on Parrot it's how we get
    # out of recovery mode.
    power_controller = self.servo.get_power_state_controller()
    power_controller.power_on()

    logging.info('Waiting for DUT to come back up.')
    if self.wait_up(timeout=self.BOOT_TIMEOUT):
        return
    raise error.AutoservError('DUT failed to reboot installed '
                              'test image after %d seconds' %
                              self.BOOT_TIMEOUT)
849
850
def _servo_repair_reinstall(self):
    """Reinstall the DUT utilizing servo and a test image.

    Stages an image with stage_image_for_servo() and hands its url to
    servo_install(), which:
    1) installs a test image on a USB storage device attached to the
       Servo board,
    2) boots that image in recovery mode, and then
    3) installs the image with chromeos-install.

    @raises AutoservRepairMethodNA if the device does not have servo
            support.

    """
    if not self.servo:
        raise error.AutoservRepairMethodNA(
                'Repair Reinstall NA: DUT has no servo support.')

    logging.info('Attempting to recovery servo enabled device with '
                 'servo_repair_reinstall')

    self.servo_install(self.stage_image_for_servo())
873
874
def _servo_repair_power(self):
    """Attempt to repair DUT using an attached Servo.

    Powers the DUT off and back on through the servo's power state
    controller, then waits up to BOOT_TIMEOUT for it to come up.

    @raises AutoservRepairMethodNA if the device does not have servo
            support.
    @raises AutoservRepairFailure if the DUT is not up after the
            power cycle.
    """
    if not self.servo:
        raise error.AutoservRepairMethodNA(
                'Repair Power NA: DUT has no servo support.')

    logging.info('Attempting to recover servo enabled device by '
                 'powering it off and on.')
    # The controller is looked up separately for each call, exactly as
    # before; do not cache it across the two operations.
    self.servo.get_power_state_controller().power_off()
    self.servo.get_power_state_controller().power_on()

    if not self.wait_up(self.BOOT_TIMEOUT):
        raise error.AutoservRepairFailure(
                'DUT did not boot after long_press.')
Richard Barnette03a0c132012-11-05 12:40:35 -0800896
897
def _powercycle_to_repair(self):
    """Utilize the RPM Infrastructure to bring the host back up.

    The host is power cycled and then given BOOT_TIMEOUT to come up.
    Each time it fails to come up it is power cycled again, until
    _MAX_POWER_CYCLE_ATTEMPTS boots have failed.  Repeated power cycling
    relies on the DUT's automatic fallback to the last good install.

    @raises AutoservRepairMethodNA if the device does not support remote
            power.
    @raises AutoservRepairFailure if the repair fails for any reason.

    """
    if not self.has_power():
        raise error.AutoservRepairMethodNA('Device does not support power.')

    logging.info('Attempting repair via RPM powercycle.')
    failures = 0
    while True:
        self.power_cycle()
        if self.wait_up(timeout=self.BOOT_TIMEOUT):
            break
        failures += 1
        if failures >= self._MAX_POWER_CYCLE_ATTEMPTS:
            raise error.AutoservRepairFailure(
                    'Powercycled host %s %d times; device did not come back'
                    ' online.' % (self.hostname, failures))

    if failures:
        logging.info('Powercycling was successful after %d failures.',
                     failures)
    else:
        logging.info('Powercycling was successful first time.')
928
929
def check_device(self):
    """Check if a device is ssh-able, and if so, clean and verify it.

    Runs ssh_ping(), cleanup() and verify() in that order; an exception
    from any step stops the sequence and propagates to the caller.

    @raise AutoservSSHTimeout: If the ssh ping times out.
    @raise AutoservSshPermissionDeniedError: If ssh ping fails due to
                                             permissions.
    @raise AutoservSshPingHostError: For other AutoservRunErrors during
                                     ssh_ping.
    @raises AutoservError: As appropriate, during cleanup and verify.
    """
    # Reachability first: the later steps need a working ssh connection.
    self.ssh_ping()
    # Then clean the device ...
    self.cleanup()
    # ... and finally verify it.
    self.verify()
943
944
def repair_full(self):
    """Repair a host for repair level NO_PROTECTION.

    This overrides the base class function for repair; it does
    not call back to the parent class, but instead offers a
    simplified implementation based on the capabilities in the
    Chrome OS test lab.

    If the host has a servo host but no servo object yet, the servo
    host is repaired first (failures are only logged) and a servo is
    then requested from it.

    The following procedures are then attempted in order; each one is
    followed by `self.check_device()`, and the first procedure for
    which both succeed ends the repair:
      1. If there's a servo for the DUT, try to power the DUT off and
         on.
      2. Try to re-install to a known stable image using
         auto-update.
      3. Try to powerwash the DUT, then re-install using auto-update.
      4. If there's a servo for the DUT, try to re-install via
         the servo.
      5. If the DUT can be power-cycled via RPM, try to repair
         by power-cycling.

    A stats counter is incremented for every outcome (SUCCEEDED,
    RepairNA, FAILED), both overall and per board when the board is
    known.

    @raises AutoservRepairTotalFailure if the repair process fails to
            fix the DUT.
    @raises ServoHostRepairTotalFailure if the repair process fails to
            fix the servo host if one is attached to the DUT.
    @raises AutoservSshPermissionDeniedError if it is unable
            to ssh to the servo host due to permission error.

    """
    if self._servo_host and not self.servo:
        try:
            self._servo_host.repair_full()
        except Exception as e:
            logging.error('Could not create a healthy servo: %s', e)
        self.servo = self._servo_host.get_servo()

    # TODO(scottz): This should use something similar to label_decorator,
    # but needs to be populated in order so DUTs are repaired with the
    # least amount of effort.
    repair_funcs = [
            self._servo_repair_power,
            self._install_repair,
            self._install_repair_with_powerwash,
            self._servo_repair_reinstall,
            self._powercycle_to_repair,
    ]
    errors = []
    board = self._get_board_from_afe()

    def _count_outcome(func_name, outcome):
        """Bump the overall and, if the board is known, per-board counter."""
        stats.Counter('%s.%s' % (func_name, outcome)).increment()
        if board:
            stats.Counter(
                    '%s.%s.%s' % (func_name, board, outcome)).increment()

    for repair_func in repair_funcs:
        try:
            repair_func()
            self.check_device()
            _count_outcome(repair_func.__name__, 'SUCCEEDED')
            return
        except error.AutoservRepairMethodNA as e:
            _count_outcome(repair_func.__name__, 'RepairNA')
            logging.warning('Repair function NA: %s', e)
            errors.append(str(e))
        except Exception as e:
            _count_outcome(repair_func.__name__, 'FAILED')
            logging.warning('Failed to repair device: %s', e)
            errors.append(str(e))

    # Every procedure was either not applicable or failed.
    stats.Counter('Full_Repair_Failed').increment()
    if board:
        stats.Counter('Full_Repair_Failed.%s' % board).increment()
    raise error.AutoservRepairTotalFailure(
            'All attempts at repairing the device failed:\n%s' %
            '\n'.join(errors))
Richard Barnette82c35912012-11-20 10:09:10 -08001033
1034
def close(self):
    """Disconnect all rpc connections, then run the parent's close()."""
    # RPC connections are torn down before the parent class closes.
    self.rpc_disconnect_all()
    super(CrosHost, self).close()
J. Richard Barnette1d78b012012-05-15 13:56:30 -07001038
1039
def _cleanup_poweron(self):
    """Special cleanup method to make sure hosts always get power back.

    Nothing is done unless the AFE knows this host and the host carries
    the _RPM_OUTLET_CHANGED attribute.  Otherwise power is turned on
    (a RemotePowerException is logged, not raised) and the attribute is
    reset to None in the AFE.
    """
    afe = frontend_wrappers.RetryingAFE(timeout_min=5, delay_sec=10)
    hosts = afe.get_hosts(hostname=self.hostname)
    outlet_changed = (bool(hosts) and
                      self._RPM_OUTLET_CHANGED in hosts[0].attributes)
    if not outlet_changed:
        return

    logging.debug('This host has recently interacted with the RPM'
                  ' Infrastructure. Ensuring power is on.')
    try:
        self.power_on()
    except rpm_client.RemotePowerException:
        # If cleanup has completed but there was an issue with the RPM
        # Infrastructure, log an error message rather than fail cleanup
        logging.error('Failed to turn Power On for this host after '
                      'cleanup through the RPM Infrastructure.')
    # NOTE(review): reconstructed as running after the try/except (i.e.
    # whether or not power_on() succeeded) - confirm against the
    # original indentation.
    afe.set_host_attribute(self._RPM_OUTLET_CHANGED, None,
                           hostname=self.hostname)
1058
1059
def _is_factory_image(self):
    """Checks if the image on the DUT is a factory image.

    The check is a shell test for the file /root/.factory_test on the
    DUT; a non-zero exit status is tolerated and means "not factory".

    @return: True if the image on the DUT is a factory image.
             False otherwise.
    """
    probe = self.run('[ -f /root/.factory_test ]', ignore_status=True)
    marker_present = probe.exit_status == 0
    return marker_present
1068
1069
def _restart_ui(self):
    """Restart the Chrome UI.

    The login prompt state is captured before the ui job is restarted
    and is handed to cros_ui.wait_for_chrome_ready() afterwards.

    @raises: FactoryImageCheckerException for factory images, since
             we cannot attempt to restart ui on them.
             error.AutoservRunError for any other type of error that
             occurs while restarting ui.
    """
    on_factory_image = self._is_factory_image()
    if on_factory_image:
        raise FactoryImageCheckerException(
                'Cannot restart ui on factory images')

    # TODO(jrbarnette): The command to stop/start the ui job
    # should live inside cros_ui, too.  However that would seem
    # to imply interface changes to the existing start()/restart()
    # functions, which is a bridge too far (for now).
    login_prompt_state = cros_ui.get_login_prompt_state(self)
    self.run('stop ui; start ui')
    cros_ui.wait_for_chrome_ready(login_prompt_state, self)
beepsc87ff602013-07-31 21:53:00 -07001089
1090
def cleanup(self):
    """Clean up the DUT, preferring a ui restart over a full reboot.

    Removes the CLEANUP_LOGS_PAUSED_FILE marker, then tries to restart
    the ui.  If that is not possible the parent class's cleanup is run
    instead.  Finally, hosts with power support get their power restored
    through _cleanup_poweron().
    """
    remove_marker = 'rm -f %s' % constants.CLEANUP_LOGS_PAUSED_FILE
    self.run(remove_marker)

    ui_restart_errors = (error.AutotestRunError, error.AutoservRunError,
                         FactoryImageCheckerException)
    try:
        self._restart_ui()
    except ui_restart_errors:
        logging.warning('Unable to restart ui, rebooting device.')
        # Since restarting the UI fails fall back to normal Autotest
        # cleanup routines, i.e. reboot the machine.
        super(CrosHost, self).cleanup()

    # Check if the rpm outlet was manipulated.
    if self.has_power():
        self._cleanup_poweron()
J. Richard Barnette45e93de2012-04-11 17:24:15 -07001104
1105
def reboot(self, **dargs):
    """
    This function reboots the site host. The more generic
    RemoteHost.reboot() performs sync and sleeps for 5
    seconds. This is not necessary for Chrome OS devices as the
    sync should be finished in a short time during the reboot
    command.

    Defaults filled in before delegating to the parent class:
      - 'reboot_cmd': a backgrounded `reboot`, followed by `reboot -f`
        after 'reboot_timeout' seconds (10 unless given in dargs).
      - 'fastsync': True.
    'board' is always set from the AFE, for logging reboot times.

    @param dargs: Keyword arguments passed on to the parent's reboot().
    """
    if 'reboot_cmd' not in dargs:
        forced_reboot_delay = dargs.get('reboot_timeout', 10)
        dargs['reboot_cmd'] = ('((reboot & sleep %d; reboot -f &)'
                               ' </dev/null >/dev/null 2>&1 &)' %
                               forced_reboot_delay)

    # Enable fastsync to avoid running extra sync commands before reboot.
    dargs.setdefault('fastsync', True)

    # For purposes of logging reboot times:
    # Get the board name i.e. 'daisy_spring'
    dargs['board'] = self._get_board_from_afe()
    super(CrosHost, self).reboot(**dargs)
Yu-Ju Honga2be94a2012-07-31 09:48:52 -07001127
1128
def suspend(self, **dargs):
    """
    This function suspends the site host.

    'timeout' is always set to the suspend time ('suspend_time' in
    dargs, 60 by default).  Unless the caller supplies 'suspend_cmd', a
    command is built that clears the rtc0 wake alarm, re-arms it for the
    suspend time, and then runs powerd_dbus_suspend in the background.

    @param dargs: Keyword arguments passed on to the parent's suspend().
    """
    suspend_time = dargs.get('suspend_time', 60)
    dargs['timeout'] = suspend_time

    if 'suspend_cmd' not in dargs:
        steps = [
                'echo 0 > /sys/class/rtc/rtc0/wakealarm',
                'echo +%d > /sys/class/rtc/rtc0/wakealarm' % suspend_time,
                'powerd_dbus_suspend --delay=0 &',
        ]
        chained_steps = ' && '.join(steps)
        dargs['suspend_cmd'] = ('(( %s )'
                                '< /dev/null >/dev/null 2>&1 &)' %
                                chained_steps)

    super(CrosHost, self).suspend(**dargs)
1142
1143
def verify_software(self):
    """Verify working software on a Chrome OS system.

    Tests for the following conditions:
     1. All conditions tested by the parent version of this
        function.
     2. Sufficient space in /mnt/stateful_partition.
     3. Sufficient space in /mnt/stateful_partition/encrypted, when
        that path exists.
     4. The system-services job reports start/running.
     5. update_engine answers a simple status request (skipped on
        factory images).
     6. python is present and can import cPickle.

    @raises AutoservError if system-services is not running.

    """
    super(CrosHost, self).verify_software()

    config = global_config.global_config
    stateful_path = '/mnt/stateful_partition'
    stateful_gb_required = config.get_config_value(
            'SERVER', 'gb_diskspace_required', type=float, default=20.0)
    self.check_diskspace(stateful_path, stateful_gb_required)

    encrypted_stateful_path = '/mnt/stateful_partition/encrypted'
    # Not all targets build with encrypted stateful support.
    if self.path_exists(encrypted_stateful_path):
        encrypted_gb_required = config.get_config_value(
                'SERVER', 'gb_encrypted_diskspace_required', type=float,
                default=0.1)
        self.check_diskspace(encrypted_stateful_path,
                             encrypted_gb_required)

    # The job status output must match this text exactly.
    expected_status = 'system-services start/running\n'
    services_status = self.run('status system-services').stdout
    if services_status != expected_status:
        raise error.AutoservError('Chrome failed to reach login. '
                                  'System services not running.')

    # Factory images don't run update engine,
    # goofy controls dbus on these DUTs.
    if not self._is_factory_image():
        self.run('update_engine_client --status')

    # Makes sure python is present, loads and can use built in functions.
    # We have seen cases where importing cPickle fails with undefined
    # symbols in cPickle.so.
    self.run('python -c "import cPickle"')
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07001183
1184
def make_ssh_command(self, user='root', port=22, opts='', hosts_file=None,
                     connect_timeout=None, alive_interval=None):
    """Override default make_ssh_command to use options tuned for Chrome OS.

    Tuning changes:
      - ConnectTimeout=30; maximum of 30 seconds allowed for an SSH
      connection failure.  Consistency with remote_access.sh.

      - ServerAliveInterval=180; which causes SSH to ping connection every
      180 seconds. In conjunction with ServerAliveCountMax ensures
      that if the connection dies, Autotest will bail out quickly.
      Originally tried 60 secs, but saw frequent job ABORTS where
      the test completed successfully.

      - ServerAliveCountMax=3; consistency with remote_access.sh.

      - ConnectionAttempts=4; reduce flakiness in connection errors;
      consistency with remote_access.sh.

      - UserKnownHostsFile=/dev/null; we don't care about the keys.
      Host keys change with every new installation, don't waste
      memory/space saving them.

      - SSH protocol forced to 2; needed for ServerAliveInterval.

    @param user User name to use for the ssh connection.
    @param port Port on the target host to use for ssh connection.
    @param opts Additional options to the ssh command.
    @param hosts_file Ignored.
    @param connect_timeout Ignored.
    @param alive_interval Ignored.

    @returns The ssh command line as a single string.
    """
    tuned_settings = (
            'StrictHostKeyChecking=no',
            'UserKnownHostsFile=/dev/null',
            'BatchMode=yes',
            'ConnectTimeout=30',
            'ServerAliveInterval=180',
            'ServerAliveCountMax=3',
            'ConnectionAttempts=4',
            'Protocol=2',
    )
    tuned_options = ' '.join('-o ' + setting for setting in tuned_settings)
    # Host-specific flags and caller options go ahead of the tuned
    # options; login name and port come last.
    template = ('/usr/bin/ssh -a -x %s %s %s ' + tuned_options +
                ' -l %s -p %d')
    return template % (self._ssh_verbosity_flag, self._ssh_options,
                       opts, user, port)
Fang Deng96667ca2013-08-01 17:46:18 -07001225
1226
def _create_ssh_tunnel(self, port, local_port):
    """Create an ssh tunnel from local_port to port.

    The tunnel is an ssh process started through the shell with -L
    forwarding from local_port to localhost:port on the host.

    @param port: remote port on the host.
    @param local_port: local forwarding port.

    @return: the tunnel process.
    """
    # Chrome OS on the target closes down most external ports
    # for security.  We could open the port, but doing that
    # would conflict with security tests that check that only
    # expected ports are open.  So, to get to the port on the
    # target we use an ssh tunnel.
    forwarding = '-n -N -q -L %d:localhost:%d' % (local_port, port)
    tunnel_cmd = '%s %s' % (self.make_ssh_command(opts=forwarding),
                            self.hostname)
    logging.debug('Full tunnel command: %s', tunnel_cmd)
    tunnel_proc = subprocess.Popen(tunnel_cmd, shell=True, close_fds=True)
    logging.debug('Started ssh tunnel, local = %d'
                  ' remote = %d, pid = %d',
                  local_port, port, tunnel_proc.pid)
    return tunnel_proc
1249
1250
def _setup_rpc(self, port, command_name, remote_pid=None):
    """Open a tunnel to a remote RPC port and record it for later cleanup.

    Only one proxy per remote port is tracked.  xmlrpc and jsonrpc are
    assumed never to conflict, because a remote port can only have one
    kind of server listening on it.  Starting a new proxy for a port
    that already has one replaces the older tunnel process; if, say,
    an xmlrpc proxy replaces a jsonrpc one for the same port:

    1. None of the methods on the xmlrpc proxy will work, because the
       server listening on the port is jsonrpc.

    2. The xmlrpc client cannot initiate a termination of the JsonRPC
       server.  The only current use case is goofy, which is tied to
       the factory image; handling a failed xmlrpc call on the client
       is much easier than terminating goofy, which might leave the
       DUT in a hard to recover state.

    Methods invoked on a client whose tunnel has been replaced fail
    with connection closed errors.

    @param port: The remote forwarding port.
    @param command_name: The name of the remote process, to terminate
                         using pkill.
    @param remote_pid: Pid of the remote server process, stored with
                       the map entry; rpc_disconnect() uses it when
                       waiting for the server to exit.

    @return A url that we can use to initiate the rpc connection.
    """
    # Drop whatever connection was previously registered for this port.
    self.rpc_disconnect(port)
    forwarded_port = utils.get_unused_port()
    tunnel = self._create_ssh_tunnel(port, forwarded_port)
    self._rpc_proxy_map[port] = (command_name, tunnel, remote_pid)
    return self._RPC_PROXY_URL % forwarded_port
1286
1287
def xmlrpc_connect(self, command, port, command_name=None,
                   ready_test_name=None, timeout_seconds=10,
                   logfile='/dev/null'):
    """Start an XMLRPC server on the host and return a client for it.

    `command` should be a simple shell command that starts an XMLRPC
    server on the given `port`.  The command must not daemonize, and
    must terminate cleanly on SIGTERM.  It is started in the
    background on the host, and a local XMLRPC client reaching it
    through an ssh tunnel is created and returned.

    Creating the client makes no attempt to contact the server.  Unless
    `ready_test_name` is given, the caller is responsible for
    determining whether the server is running correctly and is ready
    to serve requests.

    When `ready_test_name` is given, it names a method on the proxy
    that takes no parameters and returns successfully only once the
    server is ready.  The method is retried for up to
    `timeout_seconds`; if it never succeeds the connection is torn
    down with rpc_disconnect() and the failure propagates to the
    caller.

    Any connection already registered for `port` is disconnected (via
    rpc_disconnect and the rpc proxy map) before the new server is
    started.

    @param command Shell command to start the server.
    @param port Port number on which the server is expected to
                be serving.
    @param command_name String to use as input to `pkill` to
                terminate the XMLRPC server on the host.
    @param ready_test_name String containing the name of a
                method defined on the XMLRPC server.
    @param timeout_seconds Number of seconds to wait
                for the server to become 'ready.'
    @param logfile Logfile to send output when running
                'command' argument.

    @return The xmlrpclib.ServerProxy for the new connection.
    """
    # Clean up any existing state.  If the caller is willing to
    # believe their server is down, any tunnel still sitting around
    # for this port ought to go too.
    self.rpc_disconnect(port)

    # Redirecting stdin, stdout and stderr is necessary: 'ssh' won't
    # terminate until background child processes close all three.
    launch_cmd = '%s </dev/null >%s 2>&1 & echo $!' % (command, logfile)
    server_pid = self.run(launch_cmd).stdout.rstrip('\n')
    logging.debug('Started XMLRPC server on host %s, pid = %s',
                  self.hostname, server_pid)

    # Tunnel through SSH to be able to reach that remote port.
    url = self._setup_rpc(port, command_name, remote_pid=server_pid)
    proxy = xmlrpclib.ServerProxy(url, allow_none=True)

    if ready_test_name is not None:
        # retry.retry logs each attempt; the delay is scaled with the
        # timeout (clamped to [0.1, 1] seconds) to limit log spam.
        retry_delay = min(max(timeout_seconds / 20.0, 0.1), 1)

        @retry.retry((socket.error,
                      xmlrpclib.ProtocolError,
                      httplib.BadStatusLine),
                     timeout_min=timeout_seconds / 60.0,
                     delay_sec=retry_delay)
        def ready_test():
            """ Call proxy.ready_test_name(). """
            getattr(proxy, ready_test_name)()

        server_ready = False
        try:
            logging.info('Waiting %d seconds for XMLRPC server '
                         'to start.', timeout_seconds)
            ready_test()
            server_ready = True
        finally:
            # Runs for every kind of failure, then lets it propagate.
            if not server_ready:
                logging.error('Failed to start XMLRPC server.')
                self.rpc_disconnect(port)
    logging.info('XMLRPC server started successfully.')
    return proxy
J. Richard Barnette1d78b012012-05-15 13:56:30 -07001372
J. Richard Barnette1d78b012012-05-15 13:56:30 -07001373
def syslog(self, message, tag='autotest'):
    """Logs a message to syslog on host using the `logger` command.

    Both `tag` and `message` are shell-quoted before being placed on
    the command line, so quotes, `$`, backticks and other shell
    metacharacters are logged literally instead of being interpreted
    by the remote shell.

    @param message String message to log into syslog
    @param tag String tag prefix for syslog

    """
    # Local import keeps this working on both Python 2 (pipes.quote)
    # and Python 3 (shlex.quote) without touching the file's imports.
    try:
        from shlex import quote
    except ImportError:
        from pipes import quote
    # '%s' % (x,) keeps the original "format anything" behavior for
    # arguments that are not already strings.
    quoted_tag = quote('%s' % (tag,))
    quoted_message = quote('%s' % (message,))
    self.run('logger -t %s %s' % (quoted_tag, quoted_message))
1382
1383
def jsonrpc_connect(self, port):
    """Creates a jsonrpc proxy connection through an ssh tunnel.

    This exists to talk to goofy, the default system manager on
    factory images, and leaves most of the rpc server sanity checking
    to the caller.  Unlike xmlrpc_connect, no remote server is
    started: the only clients of this code are factory tests, for
    which goofy is built in to the image and starts when the target
    boots.

    Several jsonrpc proxies could in theory be forwarded to the same
    remote port, but that risks leaking an existing tunnel process,
    so any older tunnel for the port is always disconnected first
    (through rpc_disconnect, called from _setup_rpc).

    @param port: port on the remote host that is serving this proxy.

    @return: The client proxy, or None if jsonrpclib is unavailable.
    """
    if not jsonrpclib:
        logging.warning('Jsonrpclib could not be imported. Check that '
                        'site-packages contains jsonrpclib.')
        return None

    # No command name is registered: there is no remote server for
    # rpc_disconnect() to pkill, only the tunnel to close.
    rpc_url = self._setup_rpc(port, None)
    client = jsonrpclib.jsonrpc.ServerProxy(rpc_url)

    logging.info('Established a jsonrpc connection through port %s.', port)
    return client
1414
1415
def rpc_disconnect(self, port):
    """Disconnect from an RPC server on the host.

    Terminates the remote RPC server previously started for
    the given `port`.  Also closes the local ssh tunnel created
    for the connection to the host.  This function does not
    directly alter the state of a previously returned RPC
    client object; however disconnection will cause all
    subsequent calls to methods on the object to fail.

    This function does nothing if requested to disconnect a port
    that was not previously connected via _setup_rpc.

    The local tunnel is closed and the port's bookkeeping entry is
    removed even when stopping the remote server fails, so a failed
    shutdown does not leave a tunnel process behind.

    @param port Port number passed to a previous call to
                `_setup_rpc()`.

    @exception TestError The remote server was still running after
                         _RPC_SHUTDOWN_TIMEOUT_SECONDS.
    """
    if port not in self._rpc_proxy_map:
        return
    remote_name, tunnel_proc, remote_pid = self._rpc_proxy_map[port]
    try:
        if remote_name:
            # We use 'pkill' to find our target process rather than
            # a PID, because the host may have rebooted since
            # connecting, and we don't want to kill an innocent
            # process with the same PID.
            #
            # 'pkill' helpfully exits with status 1 if no target
            # process is found, for which run() will throw an
            # exception.  We don't want that, so we ignore the
            # status.
            self.run("pkill -f '%s'" % remote_name, ignore_status=True)
            if remote_pid:
                logging.info('Waiting for RPC server "%s" shutdown',
                             remote_name)
                start_time = time.time()
                while (time.time() - start_time <
                       self._RPC_SHUTDOWN_TIMEOUT_SECONDS):
                    running_processes = self.run(
                            "pgrep -f '%s'" % remote_name,
                            ignore_status=True).stdout.split()
                    if remote_pid not in running_processes:
                        logging.info('Shut down RPC server.')
                        break
                    time.sleep(self._RPC_SHUTDOWN_POLLING_PERIOD_SECONDS)
                else:
                    # The loop ran out of time without seeing the
                    # server's pid disappear.
                    raise error.TestError(
                            'Failed to shutdown RPC server %s' %
                            remote_name)
    finally:
        # Always release local resources, whether or not the remote
        # shutdown succeeded.
        if tunnel_proc.poll() is None:
            tunnel_proc.terminate()
            logging.debug('Terminated tunnel, pid %d', tunnel_proc.pid)
        else:
            logging.debug('Tunnel pid %d terminated early, status %d',
                          tunnel_proc.pid, tunnel_proc.returncode)
        del self._rpc_proxy_map[port]
J. Richard Barnette1d78b012012-05-15 13:56:30 -07001470
1471
def rpc_disconnect_all(self):
    """Disconnect all known RPC proxy ports."""
    # rpc_disconnect() deletes entries from the map, so iterate over a
    # snapshot of the ports rather than the live dictionary.
    for port in list(self._rpc_proxy_map):
        self.rpc_disconnect(port)
J. Richard Barnette1d78b012012-05-15 13:56:30 -07001476
1477
def _ping_check_status(self, status):
    """Ping the host once and compare the outcome with `status`.

    @param status Check the ping status against this value.
    @return True iff `status` and the result of ping are the same
            (i.e. both True or both False).

    """
    # A single ping with a one second deadline; an exit value of 0
    # from utils.ping is treated as "host answered".
    answered = utils.ping(self.hostname, tries=1, deadline=1) == 0
    # XOR is true when the two differ, so negate it for "same".
    return not (status ^ answered)
1488
def _ping_wait_for_status(self, status, timeout):
    """Poll with `ping` until the host reaches a status (UP or DOWN).

    Polling lasts no longer than `timeout` seconds.  The interval
    between polls is chosen so that roughly _PING_WAIT_COUNT polling
    cycles are executed, capped at about one minute per cycle.

    @param status Waiting will stop immediately if `ping` of the
                  host returns this status.
    @param timeout Poll for at most this many seconds.
    @return True iff the host status from `ping` matched the
            requested status at the time of return.

    """
    # Each _ping_check_status() call takes about 1 second itself,
    # which is why 1 is subtracted from the interval.
    pause = min(int(timeout / self._PING_WAIT_COUNT), 60) - 1
    deadline = time.time() + timeout
    while time.time() <= deadline:
        if self._ping_check_status(status):
            return True
        if pause > 0:
            time.sleep(pause)

    # The loop may have ended right after a sleep, so the last ping
    # could be stale.  Check one final time before answering.
    return self._ping_check_status(status)
1519
def ping_wait_up(self, timeout):
    """Block until the host answers `ping`, or `timeout` expires.

    N.B. This is not a reliable substitute for `wait_up()`: a host
    that responds to ping will not necessarily respond to ssh.  Use
    it only if the target DUT can be considered functional even when
    it can't be reached via ssh.

    @param timeout Minimum time to allow before declaring the
                   host to be non-responsive.
    @return True iff the host answered to ping before the timeout.

    """
    wanted_status = self._PING_STATUS_UP
    return self._ping_wait_for_status(wanted_status, timeout)
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07001535
def ping_wait_down(self, timeout):
    """Block until the host stops answering `ping`, or `timeout` expires.

    This can be used as a slightly faster version of `wait_down()`,
    because it avoids potentially long ssh timeouts.

    @param timeout Minimum time to allow for the host to become
                   non-responsive.
    @return True iff the host quit answering ping before the
            timeout.

    """
    wanted_status = self._PING_STATUS_DOWN
    return self._ping_wait_for_status(wanted_status, timeout)
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07001549
def test_wait_for_sleep(self, sleep_timeout=None):
    """Wait for the client to enter low-power sleep mode.

    "Asleep" is detected as "no longer answers ping", which cannot be
    told apart from a system that is powered off.  To confirm that
    the unit really was asleep, force a resume and then call
    `test_wait_for_resume()`.

    Expected usage from a test:

    ~~~~~~~~
        boot_id = host.get_boot_id()
        # trigger sleep on the host
        host.test_wait_for_sleep()
        # trigger resume on the host
        host.test_wait_for_resume(boot_id)
    ~~~~~~~~

    @param sleep_timeout time limit in seconds to allow the host sleep.
                         Defaults to SLEEP_TIMEOUT when None.

    @exception TestFail The host did not go to sleep within
                        the allowed time.
    """
    if sleep_timeout is None:
        sleep_timeout = self.SLEEP_TIMEOUT

    went_down = self.ping_wait_down(timeout=sleep_timeout)
    if not went_down:
        raise error.TestFail(
            'client failed to sleep after %d seconds' % sleep_timeout)
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07001580
1581
def test_wait_for_resume(self, old_boot_id, resume_timeout=None):
    """Wait for the client to resume from low-power sleep mode.

    `old_boot_id` should be the value from `get_boot_id()` obtained
    prior to entering sleep mode.  A changed boot id means the host
    rebooted instead of resuming, and is reported as a failure.

    See @ref test_wait_for_sleep for more on this function's
    usage.

    @param old_boot_id A boot id value obtained before the
                       target host went to sleep.
    @param resume_timeout time limit in seconds to allow the host up.
                          Defaults to RESUME_TIMEOUT when None.

    @exception TestFail The host did not respond within the
                        allowed time.
    @exception TestFail The host responded, but the boot id test
                        indicated a reboot rather than a sleep
                        cycle.
    """
    if resume_timeout is None:
        resume_timeout = self.RESUME_TIMEOUT

    if not self.wait_up(timeout=resume_timeout):
        raise error.TestFail(
            'client failed to resume from sleep after %d seconds' %
                resume_timeout)

    # The host is back; make sure it is still the same boot.
    current_boot_id = self.get_boot_id()
    if current_boot_id != old_boot_id:
        raise error.TestFail(
            'client rebooted, but sleep was expected'
            ' (old boot %s, new boot %s)'
                % (old_boot_id, current_boot_id))
1616
1617
def test_wait_for_shutdown(self):
    """Wait for the client to shut down.

    "Shut down" is detected as "no longer answers ping", which cannot
    be told apart from a system that is merely asleep.  To confirm
    that the unit really was down, force a boot and then call
    test_wait_for_boot().

    Expected usage from a test:

    ~~~~~~~~
        boot_id = host.get_boot_id()
        # trigger shutdown on the host
        host.test_wait_for_shutdown()
        # trigger boot on the host
        host.test_wait_for_boot(boot_id)
    ~~~~~~~~

    @exception TestFail The host did not shut down within the
                        allowed time.
    """
    went_down = self.ping_wait_down(timeout=self.SHUTDOWN_TIMEOUT)
    if not went_down:
        raise error.TestFail(
            'client failed to shut down after %d seconds' %
                self.SHUTDOWN_TIMEOUT)
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07001643
1644
def test_wait_for_boot(self, old_boot_id=None):
    """Wait for the client to boot from cold power.

    `old_boot_id` should be the value from `get_boot_id()` obtained
    prior to shutting down.  An unchanged boot id means the host never
    rebooted, and is reported as a failure.  The boot id comparison
    is skipped when `old_boot_id` is not specified.

    See @ref test_wait_for_shutdown for more on this function's
    usage.

    @param old_boot_id A boot id value obtained before the
                       shut down.

    @exception TestFail The host did not respond within the
                        allowed time.
    @exception TestFail The host responded, but the boot id test
                        indicated that there was no reboot.
    """
    if not self.wait_up(timeout=self.REBOOT_TIMEOUT):
        raise error.TestFail(
            'client failed to reboot after %d seconds' %
                self.REBOOT_TIMEOUT)
    # get_boot_id() is only consulted when there is an id to compare.
    if old_boot_id and self.get_boot_id() == old_boot_id:
        raise error.TestFail(
            'client is back up, but did not reboot'
            ' (boot %s)' % old_boot_id)
Simran Basid5e5e272012-09-24 15:23:59 -07001674
1675
@staticmethod
def check_for_rpm_support(hostname):
    """Check whether a hostname follows the RPM-powered naming format.

    @param hostname: hostname to check for rpm support.

    @return None if the hostname does not follow the naming format
            defined for RPM powered DUT's in the lab; otherwise the
            regular expression MatchObject for the hostname.
    """
    rpm_hostname_pattern = CrosHost._RPM_HOSTNAME_REGEX
    return re.match(rpm_hostname_pattern, hostname)
Simran Basid5e5e272012-09-24 15:23:59 -07001687
1688
def has_power(self):
    """Report whether this host is powered by an RPM.

    @return the result of check_for_rpm_support() for this host's
            name: a (truthy) regular expression MatchObject when the
            hostname follows the naming format defined for RPM
            powered DUT's, otherwise None.
    """
    rpm_match = CrosHost.check_for_rpm_support(self.hostname)
    return rpm_match
Simran Basid5e5e272012-09-24 15:23:59 -07001696
1697
def _set_power(self, state, power_method):
    """Sets the power to the host via RPM, Servo or manual.

    @param state Specifies which power state to set to DUT; 'ON' or
                 'OFF' in any letter case.
    @param power_method Specifies which method of power control to
                        use.  Anything other than the servo or
                        manual method is handled as RPM.

    @exception TestError `state` is not 'ON' or 'OFF'.
    @exception TestFail RPM control was requested but has_power()
                        reports no RPM for this host.
    """
    valid_states = ['ON', 'OFF']
    requested = state.upper()

    if requested not in valid_states:
        raise error.TestError('State must be one of: %s.'
                               % (valid_states,))

    if power_method == self.POWER_CONTROL_SERVO:
        logging.info('Setting servo port J10 to %s', state)
        self.servo.set('prtctl3_pwren', state.lower())
        time.sleep(self._USB_POWER_TIMEOUT)
        return

    if power_method == self.POWER_CONTROL_MANUAL:
        # Nothing is switched here; a person has to do it while we
        # wait.
        logging.info('You have %d seconds to set the AC power to %s.',
                     self._POWER_CYCLE_TIMEOUT, state)
        time.sleep(self._POWER_CYCLE_TIMEOUT)
        return

    # Every other method is treated as RPM.
    if not self.has_power():
        raise error.TestFail('DUT does not have RPM connected.')
    afe = frontend_wrappers.RetryingAFE(timeout_min=5, delay_sec=10)
    # Record on the host that its outlet state was changed.
    afe.set_host_attribute(self._RPM_OUTLET_CHANGED, True,
                           hostname=self.hostname)
    rpm_client.set_power(self.hostname, requested, timeout_mins=5)
Simran Basid5e5e272012-09-24 15:23:59 -07001728
1729
def power_off(self, power_method=POWER_CONTROL_RPM):
    """Turn off power to this host via RPM, Servo or manual.

    Delegates to _set_power() with the 'OFF' state.

    @param power_method Specifies which method of power control to
                        use. By default "RPM" will be used. Valid values
                        are the strings "RPM", "manual", "servoj10".

    """
    target_state = 'OFF'
    self._set_power(target_state, power_method)
Simran Basid5e5e272012-09-24 15:23:59 -07001739
1740
def power_on(self, power_method=POWER_CONTROL_RPM):
    """Turn on power to this host via RPM, Servo or manual.

    Delegates to _set_power() with the 'ON' state.

    @param power_method Specifies which method of power control to
                        use. By default "RPM" will be used. Valid values
                        are the strings "RPM", "manual", "servoj10".

    """
    target_state = 'ON'
    self._set_power(target_state, power_method)
1750
1751
def power_cycle(self, power_method=POWER_CONTROL_RPM):
    """Cycle power to this host by turning it OFF, then ON.

    For the servo and manual methods the cycle is performed here as
    power_off(), a pause of _POWER_CYCLE_TIMEOUT seconds, then
    power_on().  Any other method sends a single 'CYCLE' request to
    the RPM client.

    @param power_method Specifies which method of power control to
                        use. By default "RPM" will be used. Valid values
                        are the strings "RPM", "manual", "servoj10".

    """
    locally_sequenced = (self.POWER_CONTROL_SERVO,
                         self.POWER_CONTROL_MANUAL)
    if power_method not in locally_sequenced:
        rpm_client.set_power(self.hostname, 'CYCLE')
        return

    self.power_off(power_method=power_method)
    time.sleep(self._POWER_CYCLE_TIMEOUT)
    self.power_on(power_method=power_method)
Simran Basic6f1f7a2012-10-16 10:47:46 -07001767
1768
def get_platform(self):
    """Determine the correct platform label for this host.

    The platform is derived from the firmware id reported by
    crossystem.

    @returns a string representing this host's platform.
    """
    crossystem = utils.Crossystem(self)
    crossystem.init()
    # fwid generally follows the format {platform}.{firmware version},
    # e.g. Alex.X.YYY.Z or Google_Alex.X.YYY.Z; the part before the
    # first '.' is the platform id.
    firmware_id = crossystem.fwid()
    platform_id = firmware_id.split('.')[0].lower()
    # Newer platforms start with 'Google_' while the older ones do not.
    return platform_id.replace('google_', '')
1782
1783
def get_architecture(self):
    """Determine the correct architecture label for this host.

    The value is whatever crossystem reports as the architecture.

    @returns a string representing this host's architecture.
    """
    host_crossystem = utils.Crossystem(self)
    host_crossystem.init()
    architecture = host_crossystem.arch()
    return architecture
1792
1793
def get_chrome_version(self):
    """Gets the Chrome version number and milestone as strings.

    Runs the Chrome version command (constants.CHROME_VERSION_COMMAND)
    on the host and parses its output with
    utils.parse_chrome_version().

    @return A tuple (chrome_ver, milestone) where "chrome_ver" is the
        current Chrome version number as a string (in the form "W.X.Y.Z")
        and "milestone" is the first component of the version number
        (the "W" from "W.X.Y.Z").  If the version number cannot be parsed
        in the "W.X.Y.Z" format, the "chrome_ver" will be the full output
        of "chrome --version" and the milestone will be the empty string.

    """
    result = self.run(constants.CHROME_VERSION_COMMAND)
    return utils.parse_chrome_version(result.stdout)
1809
@label_decorator()
def get_board(self):
    """Determine the correct board label for this host.

    The board name is read from CHROMEOS_RELEASE_BOARD in
    /etc/lsb-release on the host.

    @returns a string representing this host's board.
    """
    lsb_release = utils.parse_cmd_output('cat /etc/lsb-release',
                                         run_method=self.run)
    release_board = lsb_release['CHROMEOS_RELEASE_BOARD']
    label_format = ds_constants.BOARD_PREFIX + '%s'
    # Devices in the lab generally have the correct board name but our
    # own development devices have {board_name}-signed-{key_type}, so
    # only the leading component is kept.  The board name may also
    # begin with 'x86-', in which case the first two components are
    # needed.
    name_parts = release_board.split('-')
    if 'x86' in release_board:
        kept_parts = name_parts[0:2]
    else:
        kept_parts = name_parts[0:1]
    return label_format % '-'.join(kept_parts)
Simran Basic6f1f7a2012-10-16 10:47:46 -07001826
1827
@label_decorator('lightsensor')
def has_lightsensor(self):
    """Determine whether this host has a light sensor.

    Searches _LIGHTSENSOR_SEARCH_DIR on the host (following symlinks,
    at most four levels deep) for any of the file names listed in
    _LIGHTSENSOR_FILES.

    @returns the string 'lightsensor' if this host has a lightsensor or
             None if it does not.
    """
    file_pattern = '|'.join(self._LIGHTSENSOR_FILES)
    search_cmd = "find -L %s -maxdepth 4 | egrep '%s'" % (
        self._LIGHTSENSOR_SEARCH_DIR, file_pattern)
    try:
        # The search follows symlinks.  stderr_tee is None because a
        # symlink loop makes find print messages to stderr even though
        # the command still executes correctly.
        self.run(search_cmd, stdout_tee=None, stderr_tee=None)
    except error.AutoservRunError:
        # egrep exited with a return code of 1 meaning none of the
        # possible lightsensor files existed.
        return None
    return 'lightsensor'
1847
1848
@label_decorator('bluetooth')
def has_bluetooth(self):
    """Determine whether this host has bluetooth.

    Bluetooth is considered present when /sys/class/bluetooth/hci0
    exists as a directory on the host.

    @returns the string 'bluetooth' if this host has bluetooth or
             None if it does not.
    """
    try:
        self.run('test -d /sys/class/bluetooth/hci0')
    except error.AutoservRunError:
        # test exited with a return code 1 meaning the directory did
        # not exist.
        return None
    # test exited with a return code of 0.
    return 'bluetooth'
1864
1865
@label_decorator('graphics')
def get_graphics(self):
    """
    Determine the graphics label for this host.

    The decision is based only on the machine hardware name reported
    by `uname -m`, so that the host name or kernel version string
    cannot influence the result.

    @returns a string representing this host's graphics. For now ARM boards
    return graphics:gles while all other boards return graphics:gl. This
    may change over time, but for robustness reasons this should avoid
    executing code in actual graphics libraries (which may not be ready and
    is tested by graphics_GLAPICheck).
    """
    # `uname -a` also prints the node name, so a host called e.g.
    # "farm-1" would have matched 'arm'; ask for the machine field only.
    machine = self.run('uname -m').stdout.lower()
    if 'arm' in machine:
        return 'graphics:gles'
    return 'graphics:gl'
1881
1882
@label_decorator('ec')
def get_ec(self):
    """
    Determine the type of EC on this host.

    @returns a string representing this host's embedded controller type.
    At present, it only returns "ec:cros", for Chrome OS ECs. Other types
    of EC (or none) return None, since no tests depend on those.
    """
    cmd = 'mosys ec info'
    # For a Chrome OS EC the last field of the output matches our EC
    # version scheme:
    #
    #   stm | stm32f100 | snow_v1.3.139-375eb9f
    #   ti | Unknown-10de | peppy_v1.5.114-5d52788
    #
    # Non-Chrome OS ECs will look like these:
    #
    #   ENE | KB932 | 00BE107A00
    #   ite | it8518 | 3.08
    #
    # And some systems don't have ECs at all (Lumpy, for example).
    version_pattern = r'^.*\|\s*(\S+_v\d+\.\d+\.\d+-[0-9a-f]+)\s*$'

    ecinfo = self.run(command=cmd, ignore_status=True)
    if ecinfo.exit_status != 0:
        # No EC present
        logging.info("%s exited with status %d", cmd, ecinfo.exit_status)
        return None

    found = re.search(version_pattern, ecinfo.stdout)
    if not found:
        # Has an EC, but it's not a Chrome OS EC
        logging.info("%s got: %s", cmd, ecinfo.stdout)
        return None

    logging.info("EC version is %s", found.group(1))
    return 'ec:cros'
1920
1921
@label_decorator('accels')
def get_accels(self):
    """
    Determine the type of accelerometers on this host.

    Three checks are made in order, and failing any of them means
    "no EC accelerometers": ectool must be installed, the EC must
    accept the motionsense command, and motion sensing must be
    reported as active.

    @returns a string representing this host's accelerometer type.
    At present, it only returns "accel:cros-ec", for accelerometers
    attached to a Chrome OS EC, or None, if no accelerometers.
    """
    # Check to make sure we have ectool
    ectool_lookup = self.run('which ectool', ignore_status=True)
    if ectool_lookup.exit_status:
        logging.info("No ectool cmd found, assuming no EC accelerometers")
        return None

    # Check that the EC supports the motionsense command
    motionsense = self.run('ectool motionsense', ignore_status=True)
    if motionsense.exit_status:
        logging.info("EC does not support motionsense command "
                     "assuming no EC accelerometers")
        return None

    # Check that EC motion sensors are active; only the first output
    # line is examined.
    active_output = self.run('ectool motionsense active').stdout
    first_line = active_output.split('\n')[0]
    if first_line == "0":
        logging.info("Motion sense inactive, assuming no EC accelerometers")
        return None

    logging.info("EC accelerometers found")
    return 'accel:cros-ec'
1952
1953
@label_decorator('chameleon')
def has_chameleon(self):
    """Determine whether a Chameleon is connected to this host.

    The decision is based solely on the truthiness of
    self._chameleon_host.

    @returns the string 'chameleon' if this host has a Chameleon,
             None otherwise.
    """
    return 'chameleon' if self._chameleon_host else None
1965
1966
@label_decorator('storage')
def get_storage(self):
    """
    Determine the type of boot device for this host.

    Determine if the internal device is a SCSI or an MMC block device,
    then check whether it is an SSD, an HDD, eMMC or something else.

    @returns a string representing this host's internal device type.
             'storage:ssd' when internal device is solid state drive
             'storage:hdd' when internal device is hard disk drive
             'storage:mmc' when internal device is mmc drive
             None          when internal device is something else or
                           when we are unable to determine the type
                           (including when any probing command fails)
    """
    def _stripped_output(cmd):
        """Run cmd on the host; return stripped stdout, None on failure."""
        result = self.run(command=cmd, ignore_status=True)
        if result.exit_status:
            logging.info("Fail to run %s", cmd)
            return None
        return result.stdout.strip()

    # The output should be /dev/mmcblk* for SD/eMMC or /dev/sd* for scsi
    rootdev_cmd = ' '.join(['. /usr/sbin/write_gpt.sh;',
                            '. /usr/share/misc/chromeos-common.sh;',
                            'load_base_vars;',
                            'get_fixed_dst_drive'])
    rootdev_str = _stripped_output(rootdev_cmd)
    # Covers both a failed command (None) and empty output ('').
    if not rootdev_str:
        return None

    rootdev_base = os.path.basename(rootdev_str)

    mmc_pattern = '/dev/mmcblk[0-9]'
    if re.match(mmc_pattern, rootdev_str):
        # Use type to determine if the internal device is eMMC or
        # something else. We can assume that MMC is always an internal
        # device.
        type_cmd = 'cat /sys/block/%s/device/type' % rootdev_base
        device_type = _stripped_output(type_cmd)
        if device_type is None:
            return None
        if device_type == 'MMC':
            return 'storage:mmc'

    # Match against the stripped device path, the same string the MMC
    # check above uses (the original matched the raw stdout here).
    scsi_pattern = '/dev/sd[a-z]+'
    if re.match(scsi_pattern, rootdev_str):
        # Read symlink for /sys/block/sd* to determine if the internal
        # device is connected via ata or usb.
        link_cmd = 'readlink /sys/block/%s' % rootdev_base
        link_str = _stripped_output(link_cmd)
        if link_str is None or 'usb' in link_str:
            return None

        # Read rotation to determine if the internal device is ssd or hdd.
        rotate_cmd = 'cat /sys/block/%s/queue/rotational' % rootdev_base
        rotate_str = _stripped_output(rotate_cmd)

        # A failed command yields None, which is not a key and so maps
        # to None just like any unexpected value.
        rotate_dict = {'0': 'storage:ssd', '1': 'storage:hdd'}
        return rotate_dict.get(rotate_str)

    # All other internal device / error case will always fall here
    return None
2039
2040
@label_decorator('servo')
def get_servo(self):
    """Determine if the host has a servo attached.

    The decision is based solely on the truthiness of self._servo_host.

    @return: string 'servo' if the host has a servo attached. Otherwise,
             returns None.
    """
    if self._servo_host:
        return 'servo'
    return None
2051
2052
@label_decorator('video_labels')
def get_video_labels(self):
    """Run /usr/local/bin/avtest_label_detect to get a list of video labels.

    Sample output of avtest_label_detect:
    Detected label: hw_video_acc_vp8
    Detected label: webcam

    @return: A list of labels detected by tool avtest_label_detect; an
             empty list when running the tool raises AutoservRunError.
    """
    # Keep the try body down to the one call that can raise.
    try:
        result = self.run('/usr/local/bin/avtest_label_detect').stdout
    except error.AutoservRunError:
        # The command failed; presumably the tool is not installed.
        return []
    # Raw string so that '\w' reaches the regex engine untouched; re.M
    # lets '^' and '$' anchor on every output line.
    return re.findall(r'^Detected label: (\w+)$', result, re.M)
2069
2070
@label_decorator('video_glitch_detection')
def is_video_glitch_detection_supported(self):
    """Determine if a board under test is supported for video glitch
    detection tests.

    A board is supported when its name, with ds_constants.BOARD_PREFIX
    removed, is a section of client/cros/video/device_spec.conf under the
    autotest directory.

    @return: 'video_glitch_detection' if board is supported, None
             otherwise (including when the conf file cannot be parsed).
    """
    parser = ConfigParser.SafeConfigParser()
    filename = os.path.join(
            common.autotest_dir, 'client/cros/video/device_spec.conf')

    dut = self.get_board().replace(ds_constants.BOARD_PREFIX, '')

    try:
        parser.read(filename)
    except ConfigParser.Error:
        # Something went wrong while parsing the conf file.  The base
        # exception class is spelled `Error`; the module has no `error`
        # attribute, so the original handler itself raised AttributeError.
        return None

    if dut in parser.sections():
        return 'video_glitch_detection'
    return None
2097
2098
def get_labels(self):
    """Return a list of labels for this given host.

    This is the main way to retrieve all the automatic labels for a host
    as it will run through all the currently implemented label functions
    in self._LABEL_FUNCTIONS, calling each one with this host.

    A label function may return a single string, a list of strings, or a
    falsy value (None, '', []) meaning "no label".  Truthy results of any
    other type are ignored.

    @return: A flat list of all labels reported by the label functions.
    """
    labels = []
    for label_function in self._LABEL_FUNCTIONS:
        label = label_function(self)
        if not label:
            continue
        # isinstance rather than an exact type() comparison, so that
        # subclasses of str / list are not silently dropped.
        if isinstance(label, str):
            labels.append(label)
        elif isinstance(label, list):
            labels.extend(label)
    return labels
Dan Shi85276d42014-04-08 22:11:45 -07002114
2115
def is_boot_from_usb(self):
    """Check if the DUT is booted from USB.

    Asks the host for its root device with `rootdev -s -d`, then reads
    the `removable` attribute of that block device from sysfs.

    @return: True if the root device's removable attribute is 1,
             False otherwise.
    """
    root_device = self.run('rootdev -s -d').stdout.strip()
    block_name = os.path.basename(root_device)
    removable_out = self.run('cat /sys/block/%s/removable' % block_name).stdout
    return int(removable_out.strip()) == 1