blob: 21991d0997a2d5546763667fa2c76bf2c121573b [file] [log] [blame]
J. Richard Barnette24adbf42012-04-11 15:04:53 -07001# Copyright (c) 2012 The Chromium OS Authors. All rights reserved.
Dale Curtisaa5eedb2011-08-23 16:18:52 -07002# Use of this source code is governed by a BSD-style license that can be
3# found in the LICENSE file.
4
Aviv Keshet74c89a92013-02-04 15:18:30 -08005import functools
Christopher Wiley0ed712b2013-04-09 15:25:12 -07006import httplib
J. Richard Barnette1d78b012012-05-15 13:56:30 -07007import logging
Dan Shi0f466e82013-02-22 15:44:58 -08008import os
Simran Basid5e5e272012-09-24 15:23:59 -07009import re
Christopher Wileyd78249a2013-03-01 13:05:31 -080010import socket
J. Richard Barnette1d78b012012-05-15 13:56:30 -070011import subprocess
J. Richard Barnette134ec2c2012-04-25 12:59:37 -070012import time
J. Richard Barnette1d78b012012-05-15 13:56:30 -070013import xmlrpclib
J. Richard Barnette134ec2c2012-04-25 12:59:37 -070014
J. Richard Barnette45e93de2012-04-11 17:24:15 -070015from autotest_lib.client.bin import utils
Richard Barnette0c73ffc2012-11-19 15:21:18 -080016from autotest_lib.client.common_lib import error
17from autotest_lib.client.common_lib import global_config
J. Richard Barnette45e93de2012-04-11 17:24:15 -070018from autotest_lib.client.common_lib.cros import autoupdater
Richard Barnette03a0c132012-11-05 12:40:35 -080019from autotest_lib.client.common_lib.cros import dev_server
Christopher Wileyd78249a2013-03-01 13:05:31 -080020from autotest_lib.client.common_lib.cros import retry
Michael Liangda8c60a2014-06-03 13:24:51 -070021from autotest_lib.client.common_lib.cros.graphite import stats
Richard Barnette82c35912012-11-20 10:09:10 -080022from autotest_lib.client.cros import constants
J. Richard Barnette84890bd2014-02-21 11:05:47 -080023from autotest_lib.client.cros import cros_ui
J. Richard Barnette45e93de2012-04-11 17:24:15 -070024from autotest_lib.server import autoserv_parser
Dan Shia1ecd5c2013-06-06 11:21:31 -070025from autotest_lib.server import utils as server_utils
Scott Zawalski89c44dd2013-02-26 09:28:02 -050026from autotest_lib.server.cros.dynamic_suite import constants as ds_constants
Simran Basi5e6339a2013-03-21 11:34:32 -070027from autotest_lib.server.cros.dynamic_suite import tools, frontend_wrappers
Fang Deng96667ca2013-08-01 17:46:18 -070028from autotest_lib.server.hosts import abstract_ssh
Tom Wai-Hong Tamefe1c7f2014-01-02 14:00:11 +080029from autotest_lib.server.hosts import chameleon_host
Fang Deng5d518f42013-08-02 14:04:32 -070030from autotest_lib.server.hosts import servo_host
Simran Basidcff4252012-11-20 16:13:20 -080031from autotest_lib.site_utils.rpm_control_system import rpm_client
Simran Basid5e5e272012-09-24 15:23:59 -070032
33
beeps32a63082013-08-22 14:02:29 -070034try:
35 import jsonrpclib
36except ImportError:
37 jsonrpclib = None
Fang Deng96667ca2013-08-01 17:46:18 -070038
Fang Dengd1c2b732013-08-20 12:59:46 -070039
class FactoryImageCheckerException(error.AutoservError):
    """Signals that the image being checked is a factory image."""
43
44
def add_label_detector(label_function_list, label_list=None, label=None):
    """Build a decorator that registers label-detecting functions.

    The returned decorator appends the decorated function to
    `label_function_list` and hands the function back unchanged.  When
    both a non-empty `label` and a `label_list` were supplied, `label`
    is appended to `label_list` as well.

    @param label_function_list: List that collects the decorated
                                detector functions.
    @param label_list: List that collects detectable label strings, or
                       None to skip label bookkeeping.  (Default: None)
    @param label: Label string detectable by the decorated function.
                  (Default: None)

    @returns The registering decorator.
    """
    def _register(detector):
        """
        @param detector: The function to be recorded as a detector.

        @returns `detector`, unmodified.
        """
        label_function_list.append(detector)
        if label_list is not None and label:
            label_list.append(label)
        return detector

    return _register
63
64
Fang Deng0ca40e22013-08-27 17:47:44 -070065class CrosHost(abstract_ssh.AbstractSSHHost):
J. Richard Barnette45e93de2012-04-11 17:24:15 -070066 """Chromium OS specific subclass of Host."""
67
68 _parser = autoserv_parser.autoserv_parser
Scott Zawalski62bacae2013-03-05 10:40:32 -050069 _AFE = frontend_wrappers.RetryingAFE(timeout_min=5, delay_sec=10)
J. Richard Barnette45e93de2012-04-11 17:24:15 -070070
Richard Barnette03a0c132012-11-05 12:40:35 -080071 # Timeout values (in seconds) associated with various Chrome OS
72 # state changes.
J. Richard Barnette134ec2c2012-04-25 12:59:37 -070073 #
Richard Barnette0c73ffc2012-11-19 15:21:18 -080074 # In general, a good rule of thumb is that the timeout can be up
75 # to twice the typical measured value on the slowest platform.
76 # The times here have not necessarily been empirically tested to
77 # meet this criterion.
J. Richard Barnetteeb69d722012-06-18 17:29:44 -070078 #
79 # SLEEP_TIMEOUT: Time to allow for suspend to memory.
Richard Barnette0c73ffc2012-11-19 15:21:18 -080080 # RESUME_TIMEOUT: Time to allow for resume after suspend, plus
81 # time to restart the network.
J. Richard Barnette84890bd2014-02-21 11:05:47 -080082 # SHUTDOWN_TIMEOUT: Time to allow for shut down.
J. Richard Barnetteeb69d722012-06-18 17:29:44 -070083 # BOOT_TIMEOUT: Time to allow for boot from power off. Among
Richard Barnette0c73ffc2012-11-19 15:21:18 -080084 # other things, this must account for the 30 second dev-mode
J. Richard Barnetted4649c62013-03-06 17:42:27 -080085 # screen delay and time to start the network.
J. Richard Barnetteeb69d722012-06-18 17:29:44 -070086 # USB_BOOT_TIMEOUT: Time to allow for boot from a USB device,
Richard Barnette0c73ffc2012-11-19 15:21:18 -080087 # including the 30 second dev-mode delay and time to start the
J. Richard Barnetted4649c62013-03-06 17:42:27 -080088 # network.
beepsf079cfb2013-09-18 17:49:51 -070089 # INSTALL_TIMEOUT: Time to allow for chromeos-install.
J. Richard Barnette84890bd2014-02-21 11:05:47 -080090 # POWERWASH_BOOT_TIMEOUT: Time to allow for a reboot that
91 # includes powerwash.
J. Richard Barnetteeb69d722012-06-18 17:29:44 -070092
93 SLEEP_TIMEOUT = 2
J. Richard Barnetted4649c62013-03-06 17:42:27 -080094 RESUME_TIMEOUT = 10
Tom Wai-Hong Tam4d169ed2014-02-14 11:05:40 +080095 SHUTDOWN_TIMEOUT = 5
J. Richard Barnettefbcc7122013-07-24 18:24:59 -070096 BOOT_TIMEOUT = 60
J. Richard Barnetteeb69d722012-06-18 17:29:44 -070097 USB_BOOT_TIMEOUT = 150
J. Richard Barnette84890bd2014-02-21 11:05:47 -080098 INSTALL_TIMEOUT = 240
Dan Shi2c88eed2013-11-12 10:18:38 -080099 POWERWASH_BOOT_TIMEOUT = 60
Chris Sosab76e0ee2013-05-22 16:55:41 -0700100
J. Richard Barnette84890bd2014-02-21 11:05:47 -0800101 # REBOOT_TIMEOUT: How long to wait for a reboot.
102 #
Chris Sosab76e0ee2013-05-22 16:55:41 -0700103 # We have a long timeout to ensure we don't flakily fail due to other
104 # issues. Shorter timeouts are vetted in platform_RebootAfterUpdate.
Simran Basi1160e2c2013-10-04 16:00:24 -0700105 # TODO(sbasi - crbug.com/276094) Restore to 5 mins once the 'host did not
106 # return from reboot' bug is solved.
107 REBOOT_TIMEOUT = 480
Chris Sosab76e0ee2013-05-22 16:55:41 -0700108
Ismail Noorbasha07fdb612013-02-14 14:13:31 -0800109 # _USB_POWER_TIMEOUT: Time to allow for USB to power toggle ON and OFF.
110 # _POWER_CYCLE_TIMEOUT: Time to allow for manual power cycle.
111 _USB_POWER_TIMEOUT = 5
112 _POWER_CYCLE_TIMEOUT = 10
113
beeps32a63082013-08-22 14:02:29 -0700114 _RPC_PROXY_URL = 'http://localhost:%d'
Christopher Wileydd181852013-10-10 19:56:58 -0700115 _RPC_SHUTDOWN_POLLING_PERIOD_SECONDS = 2
Peter Qiu4410db72014-06-05 10:32:41 -0700116 # Set shutdown timeout to account for the time for restarting the UI.
117 _RPC_SHUTDOWN_TIMEOUT_SECONDS = cros_ui.RESTART_UI_TIMEOUT
Richard Barnette0c73ffc2012-11-19 15:21:18 -0800118
Richard Barnette82c35912012-11-20 10:09:10 -0800119 _RPM_RECOVERY_BOARDS = global_config.global_config.get_config_value('CROS',
120 'rpm_recovery_boards', type=str).split(',')
121
122 _MAX_POWER_CYCLE_ATTEMPTS = 6
123 _LAB_MACHINE_FILE = '/mnt/stateful_partition/.labmachine'
124 _RPM_HOSTNAME_REGEX = ('chromeos[0-9]+(-row[0-9]+)?-rack[0-9]+[a-z]*-'
125 'host[0-9]+')
126 _LIGHTSENSOR_FILES = ['in_illuminance0_input',
127 'in_illuminance0_raw',
128 'illuminance0_input']
129 _LIGHTSENSOR_SEARCH_DIR = '/sys/bus/iio/devices'
130 _LABEL_FUNCTIONS = []
Aviv Keshet74c89a92013-02-04 15:18:30 -0800131 _DETECTABLE_LABELS = []
132 label_decorator = functools.partial(add_label_detector, _LABEL_FUNCTIONS,
133 _DETECTABLE_LABELS)
J. Richard Barnette134ec2c2012-04-25 12:59:37 -0700134
J. Richard Barnetteb6de7e32013-02-14 13:28:04 -0800135 # Constants used in ping_wait_up() and ping_wait_down().
136 #
137 # _PING_WAIT_COUNT is the approximate number of polling
138 # cycles to use when waiting for a host state change.
139 #
140 # _PING_STATUS_DOWN and _PING_STATUS_UP are names used
141 # for arguments to the internal _ping_wait_for_status()
142 # method.
143 _PING_WAIT_COUNT = 40
144 _PING_STATUS_DOWN = False
145 _PING_STATUS_UP = True
146
Ismail Noorbasha07fdb612013-02-14 14:13:31 -0800147 # Allowed values for the power_method argument.
148
149 # POWER_CONTROL_RPM: Passed as default arg for power_off/on/cycle() methods.
150 # POWER_CONTROL_SERVO: Used in set_power() and power_cycle() methods.
151 # POWER_CONTROL_MANUAL: Used in set_power() and power_cycle() methods.
152 POWER_CONTROL_RPM = 'RPM'
153 POWER_CONTROL_SERVO = 'servoj10'
154 POWER_CONTROL_MANUAL = 'manual'
155
156 POWER_CONTROL_VALID_ARGS = (POWER_CONTROL_RPM,
157 POWER_CONTROL_SERVO,
158 POWER_CONTROL_MANUAL)
Richard Barnette0c73ffc2012-11-19 15:21:18 -0800159
Simran Basi5e6339a2013-03-21 11:34:32 -0700160 _RPM_OUTLET_CHANGED = 'outlet_changed'
161
beeps687243d2013-07-18 15:29:27 -0700162
@staticmethod
def check_host(host, timeout=10):
    """
    Check if the given host is a chrome-os host.

    The probe succeeds when /etc/lsb-release mentions CHROMEOS and no
    `adb` binary is found on the host.

    @param host: An ssh host representing a device.
    @param timeout: The timeout for the run command.

    @return: True if the probe command exits with status 0; False if
             it exits non-zero or the run raises AutoservRunError or
             AutoservSSHTimeout.

    """
    probe_cmd = ('grep -q CHROMEOS /etc/lsb-release && '
                 '! which adb >/dev/null 2>&1')
    try:
        outcome = host.run(probe_cmd, ignore_status=True, timeout=timeout)
    except (error.AutoservRunError, error.AutoservSSHTimeout):
        return False
    else:
        return outcome.exit_status == 0
181
182
@staticmethod
def _extract_arguments(args_dict, key_subset):
    """Return the entries of `args_dict` whose keys are in `key_subset`.

    Used to pull the standard arguments needed to construct a
    test-assistant object (chameleon or servo) out of a larger
    dictionary of argument options.  Keys listed in `key_subset` but
    absent from `args_dict` are simply left out of the result.

    @param args_dict Dictionary from which to extract the arguments.
    @param key_subset Tuple of keys to extract from the args_dict, e.g.
                      ('servo_host', 'servo_port').

    @returns A new dictionary holding only the requested keys that
             were present.
    """
    return dict((key, args_dict[key])
                for key in key_subset if key in args_dict)
203
204
@staticmethod
def get_chameleon_arguments(args_dict):
    """Extract chameleon options from `args_dict` and return the result.

    Recommended usage:
    ~~~~~~~~
        args_dict = utils.args_to_dict(args)
        chameleon_args = hosts.CrosHost.get_chameleon_arguments(args_dict)
        host = hosts.create_host(machine, chameleon_args=chameleon_args)
    ~~~~~~~~

    @param args_dict Dictionary from which to extract the chameleon
      arguments.

    @returns Dictionary with whichever of 'chameleon_host' and
             'chameleon_port' were present in `args_dict`.
    """
    chameleon_keys = ('chameleon_host', 'chameleon_port')
    return CrosHost._extract_arguments(args_dict, chameleon_keys)
221
222
@staticmethod
def get_servo_arguments(args_dict):
    """Extract servo options from `args_dict` and return the result.

    Recommended usage:
    ~~~~~~~~
        args_dict = utils.args_to_dict(args)
        servo_args = hosts.CrosHost.get_servo_arguments(args_dict)
        host = hosts.create_host(machine, servo_args=servo_args)
    ~~~~~~~~

    @param args_dict Dictionary from which to extract the servo
      arguments.

    @returns Dictionary with whichever of 'servo_host' and
             'servo_port' were present in `args_dict`.
    """
    servo_keys = ('servo_host', 'servo_port')
    return CrosHost._extract_arguments(args_dict, servo_keys)
J. Richard Barnette134ec2c2012-04-25 12:59:37 -0700239
J. Richard Barnette964fba02012-10-24 17:34:29 -0700240
def _initialize(self, hostname, chameleon_args=None, servo_args=None,
                ssh_verbosity_flag='', ssh_options='',
                *args, **dargs):
    """Initialize superclasses, |self.chameleon|, and |self.servo|.

    After the superclass initialization, this asks the servo_host and
    chameleon_host factory functions for a host object describing the
    test-assistant board attached to this DUT, passing along
    `servo_args` / `chameleon_args`.  Whether a test-assistant exists
    is decided by those factories; when a factory yields nothing
    usable the corresponding attribute (`self.servo` or
    `self.chameleon`) is set to `None`.

    @param hostname: Name of the DUT; forwarded to the superclass.
    @param chameleon_args: Chameleon settings (e.g. as produced by
                           get_chameleon_arguments()), or None.
    @param servo_args: Servo settings (e.g. as produced by
                       get_servo_arguments()), or None.
    @param ssh_verbosity_flag: Stored as self._ssh_verbosity_flag.
    @param ssh_options: Stored as self._ssh_options.

    """
    super(CrosHost, self)._initialize(hostname=hostname, *args, **dargs)

    # self.env is a dictionary of environment variable settings
    # to be exported for commands run on the host.
    # LIBC_FATAL_STDERR_ can be useful for diagnosing certain
    # errors that might happen.
    self.env['LIBC_FATAL_STDERR_'] = '1'
    self._rpc_proxy_map = {}
    self._ssh_verbosity_flag = ssh_verbosity_flag
    self._ssh_options = ssh_options

    # TODO(fdeng): We need to simplify the
    # process of servo and servo_host initialization.
    # crbug.com/298432
    self._servo_host = servo_host.create_servo_host(
            dut=self.hostname, servo_args=servo_args)
    # TODO(waihong): Do the simplification on Chameleon too.
    self._chameleon_host = chameleon_host.create_chameleon_host(
            dut=self.hostname, chameleon_args=chameleon_args)

    # The servo host is compared against None explicitly, while the
    # chameleon host is tested for truthiness.
    self.servo = (self._servo_host.get_servo()
                  if self._servo_host is not None else None)
    self.chameleon = (self._chameleon_host.create_chameleon_board()
                      if self._chameleon_host else None)
Fang Deng5d518f42013-08-02 14:04:32 -0700289
290
def get_repair_image_name(self):
    """Generate an image_name from variables in the global config.

    Reads CROS.stable_cros_version and CROS.stable_build_pattern from
    the global config and fills the pattern with this host's board
    and the stable version.

    @returns a str of $board-version/$BUILD.

    @raises AutoservError: If no board could be found for the DUT.

    """
    config = global_config.global_config
    stable_version = config.get_config_value('CROS', 'stable_cros_version')
    build_pattern = config.get_config_value('CROS', 'stable_build_pattern')
    board = self._get_board_from_afe()
    if board is not None:
        return build_pattern % (board, stable_version)
    raise error.AutoservError('DUT has no board attribute, '
                              'cannot be repaired.')
306
307
def _host_in_AFE(self):
    """Check if the host is an object the AFE knows.

    @returns the result of the AFE's get_hosts() query for this
             hostname; callers in this class test it for truthiness.
    """
    afe = self._AFE
    return afe.get_hosts(hostname=self.hostname)
314
315
def lookup_job_repo_url(self):
    """Looks up the job_repo_url for the host.

    @returns job_repo_url from AFE, or None if the AFE does not know
             the host or the host has no job_repo_url attribute.

    """
    # A single AFE query answers both "is the host known?" and "what
    # are its attributes?"; asking twice costs an extra RPC and lets
    # the two answers disagree.
    hosts = self._host_in_AFE()
    if not hosts:
        return None

    attributes = hosts[0].attributes
    if ds_constants.JOB_REPO_URL in attributes:
        return attributes[ds_constants.JOB_REPO_URL]
    return None
Chris Sosab76e0ee2013-05-22 16:55:41 -0700329
330
def clear_cros_version_labels_and_job_repo_url(self):
    """Clear cros_version labels and host attribute job_repo_url.

    Does nothing when the AFE does not know this host.  Otherwise the
    host is removed from every label whose name starts with the
    version prefix, and job_repo_url is reset via
    update_job_repo_url(None, None).
    """
    if self._host_in_AFE():
        host_list = [self.hostname]
        version_labels = self._AFE.get_labels(
                name__startswith=ds_constants.VERSION_PREFIX,
                host__hostname=self.hostname)
        for version_label in version_labels:
            version_label.remove_hosts(hosts=host_list)

        self.update_job_repo_url(None, None)
345
346
def update_job_repo_url(self, devserver_url, image_name):
    """
    Updates the job_repo_url host attribute and asserts its value.

    When either argument is empty the attribute is set to None.
    After writing, the attribute is read back through
    lookup_job_repo_url() and compared with what was written.

    @param devserver_url: The devserver to use in the job_repo_url.
    @param image_name: The name of the image to use in the job_repo_url.

    @raises AutoservError: If we failed to update the job_repo_url.
    """
    if devserver_url and image_name:
        repo_url = tools.get_package_url(devserver_url, image_name)
    else:
        repo_url = None

    self._AFE.set_host_attribute(ds_constants.JOB_REPO_URL, repo_url,
                                 hostname=self.hostname)

    stored_url = self.lookup_job_repo_url()
    if stored_url != repo_url:
        raise error.AutoservError('Failed to update job_repo_url with %s, '
                                  'host %s' % (repo_url, self.hostname))
Scott Zawalski89c44dd2013-02-26 09:28:02 -0500364
365
def add_cros_version_labels_and_job_repo_url(self, image_name):
    """Add cros_version labels and host attribute job_repo_url.

    Does nothing when the AFE does not know this host.  Otherwise the
    version label for `image_name` is looked up (and created if the
    AFE has none), this host is added to it, and job_repo_url is
    pointed at the devserver resolved for the image.

    @param image_name: The name of the image e.g.
            lumpy-release/R27-3837.0.0

    """
    if not self._host_in_AFE():
        return

    cros_label = '%s%s' % (ds_constants.VERSION_PREFIX, image_name)
    # The devserver is resolved before any label is touched, so a
    # resolution failure leaves the AFE labels unchanged.
    devserver_url = dev_server.ImageServer.resolve(image_name).url()

    existing = self._AFE.get_labels(name=cros_label)
    label = existing[0] if existing else self._AFE.create_label(
            name=cros_label)

    label.add_hosts([self.hostname])
    self.update_job_repo_url(devserver_url, image_name)
387
388
def verify_job_repo_url(self, tag=''):
    """
    Make sure job_repo_url of this host is valid.

    Eg: The job_repo_url "http://lmn.cd.ab.xyx:8080/static/\
    lumpy-release/R29-4279.0.0/autotest/packages" claims to have the
    autotest package for lumpy-release/R29-4279.0.0.  This method asks
    the devserver embedded in that url to stage the autotest artifacts
    for the build, and reports how long the staging took as a
    'verify_job_repo_url' gauge keyed by board, build type, branch
    and devserver.  If the host has no job_repo_url, a warning is
    logged and nothing else happens.

    @param tag: The tag from the server job, in the format
                <job_id>-<user>/<hostname>, or <hostless> for a server job.
                Not referenced by this method's body.

    NOTE(review): errors from the dev_server and tools calls are not
    caught here and presumably propagate to the caller - confirm the
    exact exception types against those modules.
    """
    job_repo_url = self.lookup_job_repo_url()
    if not job_repo_url:
        logging.warning('No job repo url set on host %s', self.hostname)
        return

    logging.info('Verifying job repo url %s', job_repo_url)
    devserver_url, image_name = tools.get_devserver_build_from_package_url(
            job_repo_url)

    ds = dev_server.ImageServer(devserver_url)

    logging.info('Staging autotest artifacts for %s on devserver %s',
                 image_name, ds.url())

    staging_began = time.time()
    ds.stage_artifacts(image_name, ['autotest'])
    stage_time = time.time() - staging_began

    # Record how much of the verification time comes from a devserver
    # restage. If we're doing things right we should not see multiple
    # devservers for a given board/build/branch path.
    try:
        board, build_type, branch = server_utils.ParseBuildName(
                image_name)[:3]
    except server_utils.ParseBuildNameException:
        # An unparseable build name only costs us the stat.
        return

    # Slice out what sits between the first '/' plus two characters
    # and the last ':' - the host part of a 'scheme://host:port' url.
    host_begin = devserver_url.find('/') + 2
    host_end = devserver_url.rfind(':')
    devserver = devserver_url[host_begin:host_end]

    stats_key = dict(board=board,
                     build_type=build_type,
                     branch=branch,
                     # Dots separate components of the stat name, so
                     # they are replaced inside the host name.
                     devserver=devserver.replace('.', '_'))
    stats.Gauge('verify_job_repo_url').send(
        '%(board)s.%(build_type)s.%(branch)s.%(devserver)s' % stats_key,
        stage_time)
beepscb6f1e22013-06-28 19:14:10 -0700450
Scott Zawalskieadbf702013-03-14 09:23:06 -0400451
def _try_stateful_update(self, update_url, force_update, updater):
    """Try to use stateful update to initialize DUT.

    When DUT is already running the same version that machine_install
    tries to install, stateful update is a much faster way to clean up
    the DUT for testing, compared to a full reimage. It is implemented
    by calling autoupdater.run_update, but skipping updating root, as
    updating the kernel is time consuming and not necessary.

    @param update_url: url of the image.
    @param force_update: Set to True to update the image even if the DUT
        is running the same version.
    @param updater: ChromiumOSUpdater instance used to update the DUT.
    @returns: True if the DUT was updated with stateful update.

    """
    # TODO(jrbarnette): Yes, I hate this re.match() test case.
    # It's better than the alternative: see crbug.com/360944.
    image_name = autoupdater.url_to_image_name(update_url)
    release_pattern = r'^.*-release/R[0-9]+-[0-9]+\.[0-9]+\.0$'
    if re.match(release_pattern, image_name) is None:
        return False
    if not updater.check_version():
        return False
    if not force_update:
        logging.info('Canceling stateful update because the new and '
                     'old versions are the same.')
        return False

    # Following folders should be rebuilt after stateful update.
    # A marker file is dropped into each one so the rebuild can be
    # checked after the reboot.
    marker_name = '.test_file_to_be_deleted'
    marker_paths = [os.path.join(folder, marker_name)
                    for folder in ('/var', '/home',
                                   '/mnt/stateful_partition')]
    for marker in marker_paths:
        self.run('touch %s' % marker)

    if not updater.run_update(force_update=True, update_root=False):
        return False

    # Reboot to complete stateful update.
    self.reboot(timeout=self.REBOOT_TIMEOUT, wait=True)

    # NOTE(review): the command ends in `echo $?`, so the status
    # reported for the whole command is presumably echo's rather than
    # that of `test -f`; if so the comparison below never matches.
    # Confirm the intended check before relying on it.
    check_file_cmd = 'test -f %s; echo $?'
    for marker in marker_paths:
        result = self.run(check_file_cmd % marker, ignore_status=True)
        if result.exit_status == 1:
            return False
    return True
502
503
def _post_update_processing(self, updater, expected_kernel=None):
    """After the DUT is updated, confirm machine_install succeeded.

    @param updater: ChromiumOSUpdater instance used to update the DUT.
    @param expected_kernel: kernel expected to be active after reboot,
        or `None` to skip rollback checking.

    @raises autoupdater.ChromiumOSError: If the build found on the DUT
        is not the one the updater meant to install.

    """
    # Touch the lab machine file to leave a marker that
    # distinguishes this image from other test images.
    # Afterwards, we must re-run the autoreboot script because
    # it depends on the _LAB_MACHINE_FILE.
    self.run('touch %s' % self._LAB_MACHINE_FILE)
    self.run('start autoreboot')

    # Adjacent string literals are joined with no separator, so the
    # first fragment must end with a space to keep "previous build"
    # as two words.
    rollback_message = (
            'Build %s failed to boot on %s; system rolled back to previous '
            'build' % (updater.update_version, self.hostname))
    updater.verify_boot_expectations(
            expected_kernel, rollback_message=rollback_message)

    # Check that we've got the build we meant to install.
    if not updater.check_version_to_confirm_install():
        raise autoupdater.ChromiumOSError(
                'Failed to update %s to build %s; found build '
                '%s instead' % (self.hostname,
                                updater.update_version,
                                updater.get_build_id()))
Dan Shi0f466e82013-02-22 15:44:58 -0800529
530
def _stage_image_for_update(self, image_name=None):
    """Stage a build on a devserver and return the update_url.

    The download is triggered with synchronous=False.

    @param image_name: a name like lumpy-release/R27-3837.0.0; when
                       empty, the repair image name is used instead.
    @returns an update URL like:
        http://172.22.50.205:8082/update/lumpy-release/R27-3837.0.0
    """
    image_name = image_name or self.get_repair_image_name()
    logging.info('Staging build for AU: %s', image_name)
    image_server = dev_server.ImageServer.resolve(image_name)
    image_server.trigger_download(image_name, synchronous=False)
    url_pattern = tools.image_url_pattern()
    return url_pattern % (image_server.url(), image_name)
544
545
def stage_image_for_servo(self, image_name=None):
    """Stage a test image on a devserver and return its URL.

    @param image_name: a name like lumpy-release/R27-3837.0.0; when
                       empty, the repair image name is used instead.
    @returns the URL the devserver reports for the staged test image.
    """
    image_name = image_name or self.get_repair_image_name()
    logging.info('Staging build for servo install: %s', image_name)
    image_server = dev_server.ImageServer.resolve(image_name)
    image_server.stage_artifacts(image_name, ['test_image'])
    return image_server.get_test_image_url(image_name)
559
560
def stage_factory_image_for_servo(self, image_name):
    """Stage a factory build on a devserver and return its URL.

    @param image_name: a name like <board>/4262.204.0

    @return: An update URL, eg:
        http://<devserver>/static/canary-channel/\
        <board>/4262.204.0/factory_test/chromiumos_factory_image.bin
        None (after logging an error) when `image_name` is empty.

    @raises: ValueError if the factory artifact name is missing from
             the config.

    """
    if not image_name:
        logging.error('Need an image_name to stage a factory image.')
        return None

    factory_artifact = global_config.global_config.get_config_value(
            'CROS', 'factory_artifact', type=str, default='')
    if not factory_artifact:
        raise ValueError('Cannot retrieve the factory artifact name from '
                         'autotest config, and hence cannot stage factory '
                         'artifacts.')

    logging.info('Staging build for servo install: %s', image_name)
    image_server = dev_server.ImageServer.resolve(image_name)
    image_server.stage_artifacts(image_name, [factory_artifact],
                                 archive_url=None)

    url_pattern = tools.factory_image_url_pattern()
    return url_pattern % (image_server.url(), image_name)
593
594
def machine_install(self, update_url=None, force_update=False,
                    local_devserver=False, repair=False):
    """Install the DUT.

    Use stateful update if the DUT is already running the same build.
    Stateful update does not update kernel and tends to run much faster
    than a full reimage. If the DUT is running a different build, or it
    failed to do a stateful update, full update, including kernel update,
    will be applied to the DUT.

    Once a host enters machine_install its cros_version label will be
    removed as well as its host attribute job_repo_url (used for
    package install).

    The update URL is resolved in this order: the `update_url` argument,
    then the image given in the parser options (used verbatim when it
    starts with 'http://', otherwise staged on a devserver), then, in
    repair mode only, whatever `_stage_image_for_update()` stages when
    called without a build.

    @param update_url: The url to use for the update
            pattern: http://$devserver:###/update/$build
            If update_url is None and repair is True we will install the
            stable image listed in global_config under
            CROS.stable_cros_version.
    @param force_update: Force an update even if the version installed
            is the same. Default:False
    @param local_devserver: Used by run_remote_test to allow people to
            use their local devserver. Default: False
    @param repair: Whether or not we are in repair mode. This adds special
            cases for repairing a machine like starting update_engine.
            Setting repair to True sets force_update to True as well.
            default: False
    @raises autoupdater.ChromiumOSError if no update URL can be
            determined, or if after a full update the inactive kernel
            has lower priority than the active kernel.

    """
    if update_url:
        logging.debug('update url is set to %s', update_url)
    else:
        logging.debug('update url is not set, resolving...')
        if self._parser.options.image:
            requested_build = self._parser.options.image
            if requested_build.startswith('http://'):
                update_url = requested_build
                logging.debug('update url is retrieved from requested_build'
                              ': %s', update_url)
            else:
                # Try to stage any build that does not start with
                # http:// on the devservers defined in
                # global_config.ini.
                update_url = self._stage_image_for_update(requested_build)
                logging.debug('Build staged, and update_url is set to: %s',
                              update_url)
        elif repair:
            update_url = self._stage_image_for_update()
            logging.debug('Build staged, and update_url is set to: %s',
                          update_url)
        else:
            raise autoupdater.ChromiumOSError(
                    'Update failed. No update URL provided.')

    if repair:
        # In case the system is in a bad state, we always reboot the machine
        # before machine_install.
        self.reboot(timeout=self.REBOOT_TIMEOUT, wait=True)
        self.run('stop update-engine; start update-engine')
        # Repair mode always forces the update (see the docstring).
        force_update = True

    updater = autoupdater.ChromiumOSUpdater(update_url, host=self,
                                            local_devserver=local_devserver)
    updated = False
    # Remove cros-version and job_repo_url host attribute from host.
    self.clear_cros_version_labels_and_job_repo_url()
    # If the DUT is already running the same build, try stateful update
    # first. Stateful update does not update kernel and tends to run much
    # faster than a full reimage.
    try:
        updated = self._try_stateful_update(
                update_url, force_update, updater)
        if updated:
            logging.info('DUT is updated with stateful update.')
    except Exception as e:
        # Best effort only: any failure here is logged and we fall
        # through to the full update below.
        logging.exception(e)
        logging.warning('Failed to stateful update DUT, force to update.')

    # Only set by the full-update path; stays None after a stateful update.
    inactive_kernel = None
    # Do a full update if stateful update is not applicable or failed.
    if not updated:
        # In case the system is in a bad state, we always reboot the
        # machine before machine_install.
        self.reboot(timeout=self.REBOOT_TIMEOUT, wait=True)

        # TODO(sosa): Remove temporary hack to get rid of bricked machines
        # that can't update due to a corrupted policy.
        self.run('rm -rf /var/lib/whitelist')
        self.run('touch /var/lib/whitelist')
        self.run('chmod -w /var/lib/whitelist')
        self.run('stop update-engine; start update-engine')

        if updater.run_update(force_update):
            updated = True
            # Figure out active and inactive kernel.
            active_kernel, inactive_kernel = updater.get_kernel_state()

            # Ensure inactive kernel has higher priority than active.
            if (updater.get_kernel_priority(inactive_kernel)
                    < updater.get_kernel_priority(active_kernel)):
                raise autoupdater.ChromiumOSError(
                        'Update failed. The priority of the inactive kernel'
                        ' partition is less than that of the active kernel'
                        ' partition.')

            # Updater has returned successfully; reboot the host.
            self.reboot(timeout=self.REBOOT_TIMEOUT, wait=True)

    if updated:
        self._post_update_processing(updater, inactive_kernel)
        # Restore the labels/attribute cleared above, now naming the
        # image derived from the update URL.
        image_name = autoupdater.url_to_image_name(update_url)
        self.add_cros_version_labels_and_job_repo_url(image_name)

    # Clean up any old autotest directories which may be lying around.
    for path in global_config.global_config.get_config_value(
            'AUTOSERV', 'client_autodir_paths', type=list):
        self.run('rm -rf ' + path)
713
714
def show_update_engine_log(self):
    """Dump the update engine log by running `cat` on it on the host.

    The log location comes from constants.UPDATE_ENGINE_LOG.
    """
    log_path = constants.UPDATE_ENGINE_LOG
    logging.debug('Dumping %s', log_path)
    self.run('cat %s' % log_path)
719
720
def _get_board_from_afe(self):
    """Retrieve this host's board from its labels in the AFE.

    Looks for a host label of the form "board:<board>", and
    returns the "<board>" part of the label.  `None` is returned
    if there is not a single, unique label matching the pattern.

    @returns board from label, or `None`.
    """
    # The lookup itself lives in server_utils.get_board_from_afe(); this
    # method only supplies the hostname and the AFE handle.
    # NOTE(review): the label format and `None` behaviour described above
    # are the helper's contract, not visible here - confirm against it.
    return server_utils.get_board_from_afe(self.hostname, self._AFE)
Simran Basi833814b2013-01-29 13:13:43 -0800731
732
def get_build(self):
    """Retrieve the current build for this Host from the AFE.

    Looks through this host's labels in the AFE to determine its build.

    @returns The current build or None if it could not find it or if there
             were multiple build labels assigned to this host.
    """
    # The lookup itself lives in server_utils.get_build_from_afe(); this
    # method only supplies the hostname and the AFE handle.
    # NOTE(review): the `None` cases described above are the helper's
    # contract, not visible here - confirm against it.
    return server_utils.get_build_from_afe(self.hostname, self._AFE)
Richard Barnette82c35912012-11-20 10:09:10 -0800742
743
Scott Zawalski89c44dd2013-02-26 09:28:02 -0500744 def _install_repair(self):
745 """Attempt to repair this host using upate-engine.
746
747 If the host is up, try installing the DUT with a stable
748 "repair" version of Chrome OS as defined in the global_config
749 under CROS.stable_cros_version.
750
Scott Zawalski62bacae2013-03-05 10:40:32 -0500751 @raises AutoservRepairMethodNA if the DUT is not reachable.
752 @raises ChromiumOSError if the install failed for some reason.
Scott Zawalski89c44dd2013-02-26 09:28:02 -0500753
754 """
755 if not self.is_up():
Scott Zawalski62bacae2013-03-05 10:40:32 -0500756 raise error.AutoservRepairMethodNA('DUT unreachable for install.')
Scott Zawalski89c44dd2013-02-26 09:28:02 -0500757 logging.info('Attempting to reimage machine to repair image.')
758 try:
759 self.machine_install(repair=True)
Fang Dengd0672f32013-03-18 17:18:09 -0700760 except autoupdater.ChromiumOSError as e:
761 logging.exception(e)
Scott Zawalski89c44dd2013-02-26 09:28:02 -0500762 logging.info('Repair via install failed.')
Scott Zawalski62bacae2013-03-05 10:40:32 -0500763 raise
Scott Zawalski89c44dd2013-02-26 09:28:02 -0500764
765
Dan Shi2c88eed2013-11-12 10:18:38 -0800766 def _install_repair_with_powerwash(self):
Dan Shi9cc48452013-11-12 12:39:26 -0800767 """Attempt to powerwash first then repair this host using update-engine.
Dan Shi2c88eed2013-11-12 10:18:38 -0800768
Dan Shi9cc48452013-11-12 12:39:26 -0800769 update-engine may fail due to a bad image. In such case, powerwash
770 may help to cleanup the DUT for update-engine to work again.
Dan Shi2c88eed2013-11-12 10:18:38 -0800771
772 @raises AutoservRepairMethodNA if the DUT is not reachable.
773 @raises ChromiumOSError if the install failed for some reason.
774
775 """
776 if not self.is_up():
777 raise error.AutoservRepairMethodNA('DUT unreachable for install.')
778
779 logging.info('Attempting to powerwash the DUT.')
780 self.run('echo "fast safe" > '
781 '/mnt/stateful_partition/factory_install_reset')
782 self.reboot(timeout=self.POWERWASH_BOOT_TIMEOUT, wait=True)
783 if not self.is_up():
Dan Shi9cc48452013-11-12 12:39:26 -0800784 logging.error('Powerwash failed. DUT did not come back after '
Dan Shi2c88eed2013-11-12 10:18:38 -0800785 'reboot.')
786 raise error.AutoservRepairFailure(
787 'DUT failed to boot from powerwash after %d seconds' %
788 self.POWERWASH_BOOT_TIMEOUT)
789
790 logging.info('Powerwash succeeded.')
791 self._install_repair()
792
793
def servo_install(self, image_url=None, usb_boot_timeout=USB_BOOT_TIMEOUT,
                  install_timeout=INSTALL_TIMEOUT):
    """Re-install the OS on the DUT through the attached servo.

    The steps are:
    1) installing a test image on a USB storage device attached to the
       Servo board,
    2) booting that image in recovery mode, and then
    3) installing the image with chromeos-install.

    The USB boot phase and the chromeos-install phase are each wrapped in
    a stats.Timer whose key includes the timeout in use.

    @param image_url: If specified use as the url to install on the DUT.
            otherwise boot the currently staged image on the USB stick.
    @param usb_boot_timeout: The usb_boot_timeout to use during reimage.
            Factory images need a longer usb_boot_timeout than regular
            cros images.
    @param install_timeout: The timeout to use when installing the chromeos
            image. Factory images need a longer install_timeout.

    @raises AutoservRepairFailure if the DUT fails to boot from USB.
    @raises AutoservError if the installed image fails to boot.
    """
    boot_stat_name = 'servo_install.usb_boot_timeout_%s' % usb_boot_timeout
    logging.info('Downloading image to USB, then booting from it. Usb boot '
                 'timeout = %s', usb_boot_timeout)
    boot_timer = stats.Timer(boot_stat_name)
    boot_timer.start()
    self.servo.install_recovery_image(image_url)
    booted_from_usb = self.wait_up(timeout=usb_boot_timeout)
    if not booted_from_usb:
        # The boot timer is intentionally left running on this path, as
        # in the original flow.
        raise error.AutoservRepairFailure(
                'DUT failed to boot from USB after %d seconds' %
                usb_boot_timeout)
    boot_timer.stop()

    install_stat_name = 'servo_install.install_timeout_%s' % install_timeout
    install_timer = stats.Timer(install_stat_name)
    install_timer.start()
    logging.info('Installing image through chromeos-install.')
    self.run('chromeos-install --yes', timeout=install_timeout)
    install_timer.stop()

    logging.info('Power cycling DUT through servo.')
    servo = self.servo
    servo.power_long_press()
    servo.switch_usbkey('off')
    # We *must* use power_on() here; on Parrot it's how we get
    # out of recovery mode.
    servo.get_power_state_controller().power_on()

    logging.info('Waiting for DUT to come back up.')
    if self.wait_up(timeout=self.BOOT_TIMEOUT):
        return
    raise error.AutoservError('DUT failed to reboot installed '
                              'test image after %d seconds' %
                              self.BOOT_TIMEOUT)
847
848
J. Richard Barnettee4af8b92013-05-01 13:16:12 -0700849 def _servo_repair_reinstall(self):
Scott Zawalski62bacae2013-03-05 10:40:32 -0500850 """Reinstall the DUT utilizing servo and a test image.
851
852 Re-install the OS on the DUT by:
853 1) installing a test image on a USB storage device attached to the Servo
854 board,
855 2) booting that image in recovery mode, and then
856 3) installing the image with chromeos-install.
857
Scott Zawalski62bacae2013-03-05 10:40:32 -0500858 @raises AutoservRepairMethodNA if the device does not have servo
859 support.
860
861 """
862 if not self.servo:
863 raise error.AutoservRepairMethodNA('Repair Reinstall NA: '
864 'DUT has no servo support.')
865
866 logging.info('Attempting to recovery servo enabled device with '
867 'servo_repair_reinstall')
868
J. Richard Barnettee4af8b92013-05-01 13:16:12 -0700869 image_url = self.stage_image_for_servo()
Scott Zawalski62bacae2013-03-05 10:40:32 -0500870 self.servo_install(image_url)
871
872
873 def _servo_repair_power(self):
874 """Attempt to repair DUT using an attached Servo.
875
876 Attempt to power on the DUT via power_long_press.
877
878 @raises AutoservRepairMethodNA if the device does not have servo
879 support.
880 @raises AutoservRepairFailure if the repair fails for any reason.
881 """
882 if not self.servo:
883 raise error.AutoservRepairMethodNA('Repair Power NA: '
884 'DUT has no servo support.')
885
886 logging.info('Attempting to recover servo enabled device by '
887 'powering it off and on.')
888 self.servo.get_power_state_controller().power_off()
889 self.servo.get_power_state_controller().power_on()
890 if self.wait_up(self.BOOT_TIMEOUT):
891 return
892
893 raise error.AutoservRepairFailure('DUT did not boot after long_press.')
Richard Barnette03a0c132012-11-05 12:40:35 -0800894
895
Richard Barnette82c35912012-11-20 10:09:10 -0800896 def _powercycle_to_repair(self):
897 """Utilize the RPM Infrastructure to bring the host back up.
898
899 If the host is not up/repaired after the first powercycle we utilize
900 auto fallback to the last good install by powercycling and rebooting the
901 host 6 times.
Scott Zawalski62bacae2013-03-05 10:40:32 -0500902
903 @raises AutoservRepairMethodNA if the device does not support remote
904 power.
905 @raises AutoservRepairFailure if the repair fails for any reason.
906
Richard Barnette82c35912012-11-20 10:09:10 -0800907 """
Scott Zawalski62bacae2013-03-05 10:40:32 -0500908 if not self.has_power():
909 raise error.AutoservRepairMethodNA('Device does not support power.')
910
Richard Barnette82c35912012-11-20 10:09:10 -0800911 logging.info('Attempting repair via RPM powercycle.')
912 failed_cycles = 0
913 self.power_cycle()
914 while not self.wait_up(timeout=self.BOOT_TIMEOUT):
915 failed_cycles += 1
916 if failed_cycles >= self._MAX_POWER_CYCLE_ATTEMPTS:
Scott Zawalski62bacae2013-03-05 10:40:32 -0500917 raise error.AutoservRepairFailure(
918 'Powercycled host %s %d times; device did not come back'
919 ' online.' % (self.hostname, failed_cycles))
Richard Barnette82c35912012-11-20 10:09:10 -0800920 self.power_cycle()
921 if failed_cycles == 0:
922 logging.info('Powercycling was successful first time.')
923 else:
924 logging.info('Powercycling was successful after %d failures.',
925 failed_cycles)
926
927
def check_device(self):
    """Check if a device is ssh-able, and if so, clean and verify it.

    The three steps run strictly in sequence; an exception from any one
    of them propagates and skips the steps after it.

    @raise AutoservSSHTimeout: If the ssh ping times out.
    @raise AutoservSshPermissionDeniedError: If ssh ping fails due to
                                             permissions.
    @raise AutoservSshPingHostError: For other AutoservRunErrors during
                                     ssh_ping.
    @raises AutoservError: As appropriate, during cleanup and verify.
    """
    # Reachability first: cleanup() and verify() are only attempted once
    # ssh_ping() has returned without raising.
    self.ssh_ping()
    self.cleanup()
    self.verify()
941
942
def repair_full(self):
    """Repair a host for repair level NO_PROTECTION.

    This overrides the base class function for repair; it does
    not call back to the parent class, but instead offers a
    simplified implementation based on the capabilities in the
    Chrome OS test lab.

    If a servo host is configured but no servo object exists yet, the
    servo host is repaired first (failures there are only logged) and a
    servo is then obtained from it.

    The following procedures are then attempted in order, stopping at
    the first one after which `self.check_device()` succeeds:
      1. If there's a servo for the DUT, power the DUT off and on.
      2. Re-install to a known stable image using auto-update.
      3. Powerwash the DUT, then re-install using auto-update.
      4. If there's a servo for the DUT, re-install via the servo.
      5. If the DUT can be power-cycled via RPM, repair by
         power-cycling.

    Each attempt's outcome (SUCCEEDED, RepairNA or FAILED) is counted in
    stats, both overall and per board when the board is known.

    @raises AutoservRepairTotalFailure if the repair process fails to
            fix the DUT.

    """
    if self._servo_host and not self.servo:
        try:
            self._servo_host.repair_full()
        except Exception as servo_error:
            logging.error('Could not create a healthy servo: %s',
                          servo_error)
        self.servo = self._servo_host.get_servo()

    # TODO(scottz): This should use something similar to label_decorator,
    # but needs to be populated in order so DUTs are repaired with the
    # least amount of effort.
    repair_funcs = [
        self._servo_repair_power,
        self._install_repair,
        self._install_repair_with_powerwash,
        self._servo_repair_reinstall,
        self._powercycle_to_repair,
    ]
    errors = []
    board = self._get_board_from_afe()

    def _count_outcome(func, outcome):
        """Bump the overall and, if known, per-board outcome counters."""
        stats.Counter('%s.%s' % (func.__name__, outcome)).increment()
        if board:
            stats.Counter(
                '%s.%s.%s' % (func.__name__, board, outcome)).increment()

    for repair_func in repair_funcs:
        try:
            repair_func()
            self.check_device()
            # Kept inside the try block so that a failure while counting
            # is handled like any other failure of this attempt.
            _count_outcome(repair_func, 'SUCCEEDED')
            return
        except error.AutoservRepairMethodNA as e:
            _count_outcome(repair_func, 'RepairNA')
            logging.warning('Repair function NA: %s', e)
            errors.append(str(e))
        except Exception as e:
            _count_outcome(repair_func, 'FAILED')
            logging.warning('Failed to repair device: %s', e)
            errors.append(str(e))

    stats.Counter('Full_Repair_Failed').increment()
    if board:
        stats.Counter('Full_Repair_Failed.%s' % board).increment()
    failure_report = '\n'.join(errors)
    raise error.AutoservRepairTotalFailure(
            'All attempts at repairing the device failed:\n%s' %
            failure_report)
Richard Barnette82c35912012-11-20 10:09:10 -08001031
1032
def close(self):
    """Close this host: disconnect RPCs, then run the parent close()."""
    # rpc_disconnect_all() runs before the parent class teardown.
    self.rpc_disconnect_all()
    super(CrosHost, self).close()
J. Richard Barnette1d78b012012-05-15 13:56:30 -07001036
1037
def _cleanup_poweron(self):
    """Special cleanup method to make sure hosts always get power back.

    Does nothing unless the AFE knows this host and the host carries the
    _RPM_OUTLET_CHANGED attribute. Otherwise it powers the host on and
    resets that attribute to None; a RemotePowerException while powering
    on is logged rather than raised.
    """
    afe = frontend_wrappers.RetryingAFE(timeout_min=5, delay_sec=10)
    matching_hosts = afe.get_hosts(hostname=self.hostname)
    if not matching_hosts:
        return
    if self._RPM_OUTLET_CHANGED not in matching_hosts[0].attributes:
        return

    logging.debug('This host has recently interacted with the RPM'
                  ' Infrastructure. Ensuring power is on.')
    try:
        self.power_on()
    except rpm_client.RemotePowerException:
        # If cleanup has completed but there was an issue with the RPM
        # Infrastructure, log an error message rather than fail cleanup
        logging.error('Failed to turn Power On for this host after '
                      'cleanup through the RPM Infrastructure.')
    afe.set_host_attribute(self._RPM_OUTLET_CHANGED, None,
                           hostname=self.hostname)
1056
1057
beepsc87ff602013-07-31 21:53:00 -07001058 def _is_factory_image(self):
1059 """Checks if the image on the DUT is a factory image.
1060
1061 @return: True if the image on the DUT is a factory image.
1062 False otherwise.
1063 """
1064 result = self.run('[ -f /root/.factory_test ]', ignore_status=True)
1065 return result.exit_status == 0
1066
1067
def _restart_ui(self):
    """Restart the Chrome UI.

    The login prompt state is captured before the ui job is bounced and
    is then passed to cros_ui.wait_for_chrome_ready().

    @raises: FactoryImageCheckerException for factory images, since
             we cannot attempt to restart ui on them.
             error.AutoservRunError for any other type of error that
             occurs while restarting ui.
    """
    on_factory_image = self._is_factory_image()
    if on_factory_image:
        raise FactoryImageCheckerException(
                'Cannot restart ui on factory images')

    # TODO(jrbarnette): The command to stop/start the ui job
    # should live inside cros_ui, too.  However that would seem
    # to imply interface changes to the existing start()/restart()
    # functions, which is a bridge too far (for now).
    prompt_before_restart = cros_ui.get_login_prompt_state(self)
    self.run('stop ui; start ui')
    cros_ui.wait_for_chrome_ready(prompt_before_restart, self)
beepsc87ff602013-07-31 21:53:00 -07001087
1088
def cleanup(self):
    """Clean up the host between tests.

    Removes the cleanup-logs-paused marker file, then tries to restart
    the UI. If that fails with one of the handled errors, the parent
    class cleanup() is run instead. Finally, for hosts that report
    has_power(), _cleanup_poweron() is called.
    """
    paused_marker = constants.CLEANUP_LOGS_PAUSED_FILE
    self.run('rm -f %s' % paused_marker)
    try:
        self._restart_ui()
    except (error.AutotestRunError, error.AutoservRunError,
            FactoryImageCheckerException):
        logging.warning('Unable to restart ui, rebooting device.')
        # Since restarting the UI fails fall back to normal Autotest
        # cleanup routines, i.e. reboot the machine.
        super(CrosHost, self).cleanup()

    # Check if the rpm outlet was manipulated.
    if not self.has_power():
        return
    self._cleanup_poweron()
J. Richard Barnette45e93de2012-04-11 17:24:15 -07001102
1103
def reboot(self, **dargs):
    """Reboot the site host.

    The more generic RemoteHost.reboot() performs sync and sleeps for 5
    seconds. This is not necessary for Chrome OS devices as the sync
    should be finished in a short time during the reboot command.

    Unless the caller supplies them, a 'reboot_cmd' (a background
    `reboot`, followed after 'reboot_timeout' seconds, default 10, by
    `reboot -f`) and 'fastsync'=True are filled in. 'board' is always
    set from the AFE before delegating to the parent reboot().

    @param dargs: Keyword arguments forwarded to the parent reboot().
    """
    if 'reboot_cmd' not in dargs:
        force_delay = dargs.get('reboot_timeout', 10)
        command_template = ('((reboot & sleep %d; reboot -f &)'
                            ' </dev/null >/dev/null 2>&1 &)')
        dargs['reboot_cmd'] = command_template % force_delay

    # Enable fastsync to avoid running extra sync commands before reboot.
    dargs.setdefault('fastsync', True)

    # For purposes of logging reboot times:
    # Get the board name i.e. 'daisy_spring'
    dargs['board'] = self._get_board_from_afe()
    super(CrosHost, self).reboot(**dargs)
Yu-Ju Honga2be94a2012-07-31 09:48:52 -07001125
1126
def suspend(self, **dargs):
    """Suspend the site host.

    'suspend_time' (default 60) is used both as the RTC wake alarm
    offset and as the 'timeout' passed on to the parent suspend().
    Unless the caller supplies 'suspend_cmd', a command is built that
    clears the RTC wake alarm, re-arms it and then calls
    powerd_dbus_suspend in the background.

    @param dargs: Keyword arguments forwarded to the parent suspend().
    """
    suspend_time = dargs.get('suspend_time', 60)
    dargs['timeout'] = suspend_time
    if 'suspend_cmd' not in dargs:
        wake_alarm = '/sys/class/rtc/rtc0/wakealarm'
        steps = [
            'echo 0 > ' + wake_alarm,
            ('echo +%d > ' % suspend_time) + wake_alarm,
            'powerd_dbus_suspend --delay=0 &',
        ]
        detached_template = '(( %s )< /dev/null >/dev/null 2>&1 &)'
        dargs['suspend_cmd'] = detached_template % ' && '.join(steps)
    super(CrosHost, self).suspend(**dargs)
1140
1141
def verify_software(self):
    """Verify working software on a Chrome OS system.

    Tests for the following conditions:
     1. All conditions tested by the parent version of this
        function.
     2. Sufficient space in /mnt/stateful_partition.
     3. Sufficient space in /mnt/stateful_partition/encrypted, when
        that path exists.
     4. `status system-services` reports start/running.
     5. update_engine answers a simple status request (skipped on
        factory images).
     6. python on the DUT can import cPickle.

    @raises AutoservError if system-services is not running.
    """
    super(CrosHost, self).verify_software()

    read_config = global_config.global_config.get_config_value
    stateful_path = '/mnt/stateful_partition'
    required_gb = read_config('SERVER', 'gb_diskspace_required',
                              type=float, default=20.0)
    self.check_diskspace(stateful_path, required_gb)

    encrypted_stateful_path = '/mnt/stateful_partition/encrypted'
    # Not all targets build with encrypted stateful support.
    if self.path_exists(encrypted_stateful_path):
        required_encrypted_gb = read_config(
                'SERVER', 'gb_encrypted_diskspace_required', type=float,
                default=0.1)
        self.check_diskspace(encrypted_stateful_path,
                             required_encrypted_gb)

    expected_status = 'system-services start/running\n'
    services_status = self.run('status system-services').stdout
    if services_status != expected_status:
        raise error.AutoservError('Chrome failed to reach login. '
                                  'System services not running.')

    # Factory images don't run update engine,
    # goofy controls dbus on these DUTs.
    if not self._is_factory_image():
        self.run('update_engine_client --status')
    # Makes sure python is present, loads and can use built in functions.
    # We have seen cases where importing cPickle fails with undefined
    # symbols in cPickle.so.
    self.run('python -c "import cPickle"')
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07001181
1182
def make_ssh_command(self, user='root', port=22, opts='', hosts_file=None,
                     connect_timeout=None, alive_interval=None):
    """Override default make_ssh_command to use options tuned for Chrome OS.

    The returned command line always carries these fixed `-o` settings:
      - StrictHostKeyChecking=no and BatchMode=yes.

      - UserKnownHostsFile=/dev/null; we don't care about the keys.
        Host keys change with every new installation, don't waste
        memory/space saving them.

      - ConnectTimeout=30; maximum of 30 seconds allowed for an SSH
        connection failure.  Consistency with remote_access.sh.

      - ServerAliveInterval=180; which causes SSH to ping connection every
        180 seconds. In conjunction with ServerAliveCountMax ensures
        that if the connection dies, Autotest will bail out quickly.
        Originally tried 60 secs, but saw frequent job ABORTS where
        the test completed successfully.

      - ServerAliveCountMax=3; consistency with remote_access.sh.

      - ConnectionAttempts=4; reduce flakiness in connection errors;
        consistency with remote_access.sh.

      - Protocol=2; needed for ServerAliveInterval.

    @param user User name to use for the ssh connection.
    @param port Port on the target host to use for ssh connection.
    @param opts Additional options to the ssh command.
    @param hosts_file Ignored.
    @param connect_timeout Ignored.
    @param alive_interval Ignored.

    @return The ssh command line as a string, without the target host.
    """
    fixed_settings = (
        'StrictHostKeyChecking=no',
        'UserKnownHostsFile=/dev/null',
        'BatchMode=yes',
        'ConnectTimeout=30',
        'ServerAliveInterval=180',
        'ServerAliveCountMax=3',
        'ConnectionAttempts=4',
        'Protocol=2',
    )
    setting_args = ' '.join('-o ' + setting for setting in fixed_settings)
    # Host-level verbosity/options come first, then the caller's opts.
    invocation = '/usr/bin/ssh -a -x %s %s %s' % (
            self._ssh_verbosity_flag, self._ssh_options, opts)
    return '%s %s -l %s -p %d' % (invocation, setting_args, user, port)
Fang Deng96667ca2013-08-01 17:46:18 -07001223
1224
def _create_ssh_tunnel(self, port, local_port):
    """Create an ssh tunnel from local_port to port.

    The tunnel is an ssh process started through the shell with a
    `-L local_port:localhost:port` forward to this host.

    @param port: remote port on the host.
    @param local_port: local forwarding port.

    @return: the tunnel process.
    """
    # Chrome OS on the target closes down most external ports
    # for security.  We could open the port, but doing that
    # would conflict with security tests that check that only
    # expected ports are open.  So, to get to the port on the
    # target we use an ssh tunnel.
    forward_spec = '%d:localhost:%d' % (local_port, port)
    ssh_cmd = self.make_ssh_command(opts='-n -N -q -L ' + forward_spec)
    full_command = '%s %s' % (ssh_cmd, self.hostname)
    logging.debug('Full tunnel command: %s', full_command)
    tunnel = subprocess.Popen(full_command, shell=True, close_fds=True)
    logging.debug('Started ssh tunnel, local = %d'
                  ' remote = %d, pid = %d',
                  local_port, port, tunnel.pid)
    return tunnel
1247
1248
def _setup_rpc(self, port, command_name, remote_pid=None):
    """Open a tunnel to `port` and record it in the rpc proxy map.

    Only one proxy per remote port is kept: this method assumes
    that xmlrpc and jsonrpc never conflict, since only one kind of
    server can listen on a given remote port.  If a jsonrpc proxy
    is forwarded to a port and an xmlrpc proxy is later requested
    for the same port, the xmlrpc proxy overrides the jsonrpc
    tunnel process, however:

    1. None of the methods on the xmlrpc proxy will work, because
       the server listening on the port is jsonrpc.

    2. The xmlrpc client cannot initiate a termination of the
       JsonRPC server; the only use case currently is goofy, which
       is tied to the factory image.  Handling a failed xmlrpc call
       on the client is much easier than terminating goofy, which
       might leave the DUT in a hard to recover state.

    Newer rpc proxy connections therefore terminate the tunnel
    processes of older connections to the same remote port, and
    methods invoked on the older client afterwards fail with
    connection closed errors.

    @param port: The remote forwarding port.
    @param command_name: The name of the remote process, to terminate
                         using pkill.
    @param remote_pid: Pid of the remote server process, stored in
                       the proxy map for use by rpc_disconnect.

    @return A url that we can use to initiate the rpc connection.
    """
    # Tear down whatever was previously registered for this port.
    self.rpc_disconnect(port)
    forwarded_port = utils.get_unused_port()
    tunnel = self._create_ssh_tunnel(port, forwarded_port)
    bookkeeping = (command_name, tunnel, remote_pid)
    self._rpc_proxy_map[port] = bookkeeping
    return self._RPC_PROXY_URL % forwarded_port
1284
1285
def xmlrpc_connect(self, command, port, command_name=None,
                   ready_test_name=None, timeout_seconds=10,
                   logfile='/dev/null'):
    """Start an XMLRPC server on the host and return a client for it.

    `command` should be a simple shell command that starts an
    XMLRPC server on the given `port`.  The command must not
    daemonize, and must terminate cleanly on SIGTERM.  It is
    started in the background on the host, and a local XMLRPC
    client for the server is created and returned to the caller.

    Creating the client does not by itself contact the remote
    server; unless `ready_test_name` is given, the caller is
    responsible for determining whether the server is running
    correctly and is ready to serve requests.

    When `ready_test_name` is set it names a proxy method that
    takes no parameters and returns successfully only once the
    server can process requests.  That method is retried for up to
    `timeout_seconds`; if it never succeeds the connection is torn
    down again with rpc_disconnect and the failure propagates.
    NOTE(review): earlier documentation names both TestError and
    TestFail as the exception raised on timeout - confirm against
    retry.retry.

    Any server and tunnel previously registered for `port` are shut
    down via rpc_disconnect before the new server is started.

    @param command Shell command to start the server.
    @param port Port number on which the server is expected to
                be serving.
    @param command_name String to use as input to `pkill` to
                        terminate the XMLRPC server on the host.
    @param ready_test_name String containing the name of a
                           method defined on the XMLRPC server.
    @param timeout_seconds Number of seconds to wait for the
                           server to become 'ready.'
    @param logfile Logfile to send output when running
                   'command' argument.

    @return The xmlrpclib.ServerProxy for the new connection.
    """
    # If the caller is willing to believe their server is down, any
    # tunnel still sitting around for this port should go too.
    self.rpc_disconnect(port)

    # The redirections are necessary: 'ssh' won't terminate until
    # background child processes close stdin, stdout, and stderr.
    launch_cmd = '%s </dev/null >%s 2>&1 & echo $!' % (command, logfile)
    server_pid = self.run(launch_cmd).stdout.rstrip('\n')
    logging.debug('Started XMLRPC server on host %s, pid = %s',
                  self.hostname, server_pid)

    # Tunnel through SSH to be able to reach that remote port.
    proxy_url = self._setup_rpc(port, command_name, remote_pid=server_pid)
    proxy = xmlrpclib.ServerProxy(proxy_url, allow_none=True)

    if ready_test_name is not None:
        # retry.retry logs each attempt; the delay is scaled with
        # the timeout to keep log spam to a dull roar.
        @retry.retry((socket.error,
                      xmlrpclib.ProtocolError,
                      httplib.BadStatusLine),
                     timeout_min=timeout_seconds / 60.0,
                     delay_sec=min(max(timeout_seconds / 20.0, 0.1), 1))
        def ready_test():
            """ Call proxy.ready_test_name(). """
            getattr(proxy, ready_test_name)()

        server_ready = False
        try:
            logging.info('Waiting %d seconds for XMLRPC server '
                         'to start.', timeout_seconds)
            ready_test()
            server_ready = True
        finally:
            # Runs for every kind of failure; the exception itself
            # keeps propagating after the cleanup.
            if not server_ready:
                logging.error('Failed to start XMLRPC server.')
                self.rpc_disconnect(port)
    logging.info('XMLRPC server started successfully.')
    return proxy
J. Richard Barnette1d78b012012-05-15 13:56:30 -07001370
J. Richard Barnette1d78b012012-05-15 13:56:30 -07001371
def syslog(self, message, tag='autotest'):
    """Write `message` to the host's syslog using `logger`.

    Both values are placed inside double quotes in the command
    line exactly as given; no escaping is applied.

    @param message String message to log into syslog
    @param tag String tag prefix for syslog

    """
    logger_cmd = 'logger -t "%s" "%s"' % (tag, message)
    self.run(logger_cmd)
1380
1381
def jsonrpc_connect(self, port):
    """Return a jsonrpc proxy reached through an ssh tunnel.

    This exists to talk to goofy (the default system manager on
    all factory images), and leaves most of the rpc server sanity
    checking to the caller.  Unlike xmlrpc_connect, no remote
    server is started here: the only clients of this code are
    factory tests, for which goofy is built in to the image and
    starts when the target boots.

    Several jsonrpc proxies could in theory be forwarded to the
    same remote port, but that risks leaking an existing tunnel
    process, so any older tunnel for the port is always
    disconnected first (through rpc_disconnect, via _setup_rpc).

    @param port: port on the remote host that is serving this proxy.

    @return: The client proxy, or None if jsonrpclib is unavailable.
    """
    if jsonrpclib:
        make_proxy = jsonrpclib.jsonrpc.ServerProxy
        # No command name is registered, so rpc_disconnect will not
        # try to kill anything on the host for this port.
        client = make_proxy(self._setup_rpc(port, None))
        logging.info('Established a jsonrpc connection through port %s.',
                     port)
        return client

    logging.warning('Jsonrpclib could not be imported. Check that '
                    'site-packages contains jsonrpclib.')
    return None
1412
1413
def rpc_disconnect(self, port):
    """Shut down the RPC server and tunnel registered for `port`.

    Terminates the remote RPC server previously started for the
    given `port`, and closes the local ssh tunnel created for the
    connection.  A previously returned RPC client object is not
    touched directly; however all subsequent calls to methods on
    it will fail once the connection is gone.

    Nothing happens if `port` was not previously connected via
    _setup_rpc.

    @param port Port number passed to a previous call to
                `_setup_rpc()`.

    @exception TestError The remote server was still running after
                         _RPC_SHUTDOWN_TIMEOUT_SECONDS.  In that
                         case the tunnel and the map entry are
                         left as they were.
    """
    try:
        server_name, tunnel, server_pid = self._rpc_proxy_map[port]
    except KeyError:
        return

    if server_name:
        # The process is looked up by name with 'pkill' rather than
        # by PID, because the host may have rebooted since
        # connecting, and an innocent process could now own the
        # same PID.
        #
        # 'pkill' exits with status 1 if no target process is
        # found, for which run() would throw an exception; the
        # status is therefore ignored.
        self.run("pkill -f '%s'" % server_name, ignore_status=True)
        if server_pid:
            logging.info('Waiting for RPC server "%s" shutdown',
                         server_name)
            began = time.time()
            while True:
                elapsed = time.time() - began
                if elapsed >= self._RPC_SHUTDOWN_TIMEOUT_SECONDS:
                    raise error.TestError(
                            'Failed to shutdown RPC server %s' %
                            server_name)
                live_pids = self.run(
                        "pgrep -f '%s'" % server_name,
                        ignore_status=True).stdout.split()
                if server_pid not in live_pids:
                    logging.info('Shut down RPC server.')
                    break
                time.sleep(self._RPC_SHUTDOWN_POLLING_PERIOD_SECONDS)

    if tunnel.poll() is not None:
        logging.debug('Tunnel pid %d terminated early, status %d',
                      tunnel.pid, tunnel.returncode)
    else:
        tunnel.terminate()
        logging.debug('Terminated tunnel, pid %d', tunnel.pid)
    del self._rpc_proxy_map[port]
J. Richard Barnette1d78b012012-05-15 13:56:30 -07001468
1469
def rpc_disconnect_all(self):
    """Disconnect all known RPC proxy ports.

    rpc_disconnect removes each port's entry from _rpc_proxy_map,
    so the ports are copied into a list first; the loop must not
    iterate the map while it is shrinking.
    """
    for port in list(self._rpc_proxy_map):
        self.rpc_disconnect(port)
J. Richard Barnette1d78b012012-05-15 13:56:30 -07001474
1475
def _ping_check_status(self, status):
    """Ping the host a single time and compare against `status`.

    @param status Check the ping status against this value.
    @return True iff `status` and the result of ping are the same
            (i.e. both True or both False).

    """
    # utils.ping() reporting 0 is treated as "host answered".
    answered = utils.ping(self.hostname, tries=1, deadline=1) == 0
    if status ^ answered:
        return False
    return True
1486
1487 def _ping_wait_for_status(self, status, timeout):
1488 """Wait for the host to have a given status (UP or DOWN).
1489
1490 Status is checked by polling. Polling will not last longer
1491 than the number of seconds in `timeout`. The polling
1492 interval will be long enough that only approximately
1493 _PING_WAIT_COUNT polling cycles will be executed, subject
1494 to a maximum interval of about one minute.
1495
1496 @param status Waiting will stop immediately if `ping` of the
1497 host returns this status.
1498 @param timeout Poll for at most this many seconds.
1499 @return True iff the host status from `ping` matched the
1500 requested status at the time of return.
1501
1502 """
1503 # _ping_check_status() takes about 1 second, hence the
1504 # "- 1" in the formula below.
1505 poll_interval = min(int(timeout / self._PING_WAIT_COUNT), 60) - 1
1506 end_time = time.time() + timeout
1507 while time.time() <= end_time:
1508 if self._ping_check_status(status):
1509 return True
1510 if poll_interval > 0:
1511 time.sleep(poll_interval)
1512
1513 # The last thing we did was sleep(poll_interval), so it may
1514 # have been too long since the last `ping`. Check one more
1515 # time, just to be sure.
1516 return self._ping_check_status(status)
1517
def ping_wait_up(self, timeout):
    """Block until the host answers `ping`, or `timeout` expires.

    N.B. This method is not a reliable substitute for
    `wait_up()`, because a host that responds to ping will not
    necessarily respond to ssh.  Use it only if the target DUT can
    be considered functional even if it can't be reached via ssh.

    @param timeout Minimum time to allow before declaring the
                   host to be non-responsive.
    @return True iff the host answered to ping before the timeout.

    """
    wanted = self._PING_STATUS_UP
    return self._ping_wait_for_status(wanted, timeout)
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07001533
def ping_wait_down(self, timeout):
    """Block until the host stops answering `ping`, or `timeout` expires.

    This function can be used as a slightly faster version of
    `wait_down()`, by avoiding potentially long ssh timeouts.

    @param timeout Minimum time to allow for the host to become
                   non-responsive.
    @return True iff the host quit answering ping before the
            timeout.

    """
    wanted = self._PING_STATUS_DOWN
    return self._ping_wait_for_status(wanted, timeout)
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07001547
def test_wait_for_sleep(self, sleep_timeout=None):
    """Wait until the client stops answering ping after a sleep request.

    A sleeping system cannot be told apart from one that is
    powered off; to confirm that the unit was asleep, it is
    necessary to force resume, and then call
    `test_wait_for_resume()`.

    This function is expected to be called from a test as part
    of a sequence like the following:

    ~~~~~~~~
        boot_id = host.get_boot_id()
        # trigger sleep on the host
        host.test_wait_for_sleep()
        # trigger resume on the host
        host.test_wait_for_resume(boot_id)
    ~~~~~~~~

    @param sleep_timeout time limit in seconds to allow the host
                         sleep; SLEEP_TIMEOUT is used when None.

    @exception TestFail The host did not go to sleep within
                        the allowed time.
    """
    limit = self.SLEEP_TIMEOUT if sleep_timeout is None else sleep_timeout
    if self.ping_wait_down(timeout=limit):
        return
    raise error.TestFail(
            'client failed to sleep after %d seconds' % limit)
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07001578
1579
def test_wait_for_resume(self, old_boot_id, resume_timeout=None):
    """Wait for the client to come back from low-power sleep mode.

    The `old_boot_id` parameter should be the value from
    `get_boot_id()` obtained prior to entering sleep mode.  A
    `TestFail` exception is raised if the boot id changes.

    See @ref test_wait_for_sleep for more on this function's
    usage.

    @param old_boot_id A boot id value obtained before the
                       target host went to sleep.
    @param resume_timeout time limit in seconds to allow the host
                          up; RESUME_TIMEOUT is used when None.

    @exception TestFail The host did not respond within the
                        allowed time.
    @exception TestFail The host responded, but the boot id test
                        indicated a reboot rather than a sleep
                        cycle.
    """
    limit = (self.RESUME_TIMEOUT if resume_timeout is None
             else resume_timeout)

    if not self.wait_up(timeout=limit):
        raise error.TestFail(
                'client failed to resume from sleep after %d seconds' %
                limit)

    # A changed boot id means the host rebooted instead of resuming.
    current_boot_id = self.get_boot_id()
    if current_boot_id != old_boot_id:
        raise error.TestFail(
                'client rebooted, but sleep was expected'
                ' (old boot %s, new boot %s)'
                % (old_boot_id, current_boot_id))
1614
1615
def test_wait_for_shutdown(self):
    """Wait until the client stops answering ping after a shutdown.

    A system that has shut down cannot be told apart from one
    that is merely asleep; to confirm that the unit was down, it
    is necessary to force boot, and then call test_wait_for_boot().

    This function is expected to be called from a test as part
    of a sequence like the following:

    ~~~~~~~~
        boot_id = host.get_boot_id()
        # trigger shutdown on the host
        host.test_wait_for_shutdown()
        # trigger boot on the host
        host.test_wait_for_boot(boot_id)
    ~~~~~~~~

    @exception TestFail The host did not shut down within the
                        allowed time.
    """
    if self.ping_wait_down(timeout=self.SHUTDOWN_TIMEOUT):
        return
    raise error.TestFail(
            'client failed to shut down after %d seconds' %
            self.SHUTDOWN_TIMEOUT)
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07001641
1642
def test_wait_for_boot(self, old_boot_id=None):
    """Wait for the client to come up after a cold boot.

    The `old_boot_id` parameter should be the value from
    `get_boot_id()` obtained prior to shutting down.  A
    `TestFail` exception is raised if the boot id does not
    change.  The boot id test is omitted if `old_boot_id` is not
    specified.

    See @ref test_wait_for_shutdown for more on this function's
    usage.

    @param old_boot_id A boot id value obtained before the
                       shut down.

    @exception TestFail The host did not respond within the
                        allowed time.
    @exception TestFail The host responded, but the boot id test
                        indicated that there was no reboot.
    """
    if not self.wait_up(timeout=self.REBOOT_TIMEOUT):
        raise error.TestFail(
                'client failed to reboot after %d seconds' %
                self.REBOOT_TIMEOUT)

    # The boot id is only fetched when there is one to compare with.
    if old_boot_id and self.get_boot_id() == old_boot_id:
        raise error.TestFail(
                'client is back up, but did not reboot'
                ' (boot %s)' % old_boot_id)
Simran Basid5e5e272012-09-24 15:23:59 -07001672
1673
@staticmethod
def check_for_rpm_support(hostname):
    """Match `hostname` against the naming format of RPM powered DUTs.

    @param hostname: hostname to check for rpm support.

    @return None if this host does not follow the defined naming format
            for RPM powered DUT's in the lab. If it does follow the
            format, the regular expression MatchObject is returned
            instead.
    """
    naming_pattern = CrosHost._RPM_HOSTNAME_REGEX
    return re.match(naming_pattern, hostname)
Simran Basid5e5e272012-09-24 15:23:59 -07001685
1686
def has_power(self):
    """Report whether this host's name matches the RPM naming format.

    @return The result of check_for_rpm_support() for this host's
            hostname: a MatchObject (truthy) when the hostname
            follows the defined naming format, None otherwise.
    """
    rpm_match = CrosHost.check_for_rpm_support(self.hostname)
    return rpm_match
Simran Basid5e5e272012-09-24 15:23:59 -07001694
1695
def _set_power(self, state, power_method):
    """Switch the DUT's power via RPM, Servo or manually.

    @param state Specifies which power state to set to DUT; 'ON'
                 or 'OFF', compared case-insensitively.
    @param power_method Specifies which method of power control to
                        use.  POWER_CONTROL_SERVO and
                        POWER_CONTROL_MANUAL select those methods;
                        any other value goes through the RPM.

    @exception TestError `state` is not an acceptable state.
    @exception TestFail RPM control was requested but has_power()
                        reports no RPM for this host.

    """
    valid_states = ['ON', 'OFF']
    if state.upper() not in valid_states:
        raise error.TestError('State must be one of: %s.'
                               % (valid_states,))

    if power_method == self.POWER_CONTROL_SERVO:
        logging.info('Setting servo port J10 to %s', state)
        self.servo.set('prtctl3_pwren', state.lower())
        time.sleep(self._USB_POWER_TIMEOUT)
        return

    if power_method == self.POWER_CONTROL_MANUAL:
        # Nothing is switched here; the operator is just given
        # time to change the power by hand.
        logging.info('You have %d seconds to set the AC power to %s.',
                     self._POWER_CYCLE_TIMEOUT, state)
        time.sleep(self._POWER_CYCLE_TIMEOUT)
        return

    if not self.has_power():
        raise error.TestFail('DUT does not have RPM connected.')
    # Record on the AFE that the outlet state was changed before
    # asking the RPM to switch it.
    afe = frontend_wrappers.RetryingAFE(timeout_min=5, delay_sec=10)
    afe.set_host_attribute(self._RPM_OUTLET_CHANGED, True,
                           hostname=self.hostname)
    rpm_client.set_power(self.hostname, state.upper(), timeout_mins=5)
Simran Basid5e5e272012-09-24 15:23:59 -07001726
1727
def power_off(self, power_method=POWER_CONTROL_RPM):
    """Cut power to this host via RPM, Servo or manual.

    @param power_method Specifies which method of power control to
                        use. By default "RPM" will be used. Valid values
                        are the strings "RPM", "manual", "servoj10".

    """
    self._set_power(state='OFF', power_method=power_method)
Simran Basid5e5e272012-09-24 15:23:59 -07001737
1738
def power_on(self, power_method=POWER_CONTROL_RPM):
    """Restore power to this host via RPM, Servo or manual.

    @param power_method Specifies which method of power control to
                        use. By default "RPM" will be used. Valid values
                        are the strings "RPM", "manual", "servoj10".

    """
    self._set_power(state='ON', power_method=power_method)
1748
1749
def power_cycle(self, power_method=POWER_CONTROL_RPM):
    """Power this host OFF and back ON again.

    For the servo and manual methods the cycle is performed as
    power_off(), a pause of _POWER_CYCLE_TIMEOUT seconds, then
    power_on().  Any other method sends a single 'CYCLE' request
    to the RPM.

    @param power_method Specifies which method of power control to
                        use. By default "RPM" will be used. Valid values
                        are the strings "RPM", "manual", "servoj10".

    """
    stepwise_methods = (self.POWER_CONTROL_SERVO,
                        self.POWER_CONTROL_MANUAL)
    if power_method not in stepwise_methods:
        rpm_client.set_power(self.hostname, 'CYCLE')
        return

    self.power_off(power_method=power_method)
    time.sleep(self._POWER_CYCLE_TIMEOUT)
    self.power_on(power_method=power_method)
Simran Basic6f1f7a2012-10-16 10:47:46 -07001765
1766
def get_platform(self):
    """Derive this host's platform label from its firmware id.

    @returns a string representing this host's platform.
    """
    crossystem = utils.Crossystem(self)
    crossystem.init()
    # fwid generally follows the format {platform}.{firmware version},
    # for example Alex.X.YYY.Z or Google_Alex.X.YYY.Z; the leading
    # part is used as the platform id.
    fwid = crossystem.fwid()
    leading_part = fwid.split('.')[0]
    # Newer platforms start with 'Google_' while the older ones do not.
    return leading_part.lower().replace('google_', '')
1780
1781
def get_architecture(self):
    """Read this host's architecture label from crossystem.

    @returns a string representing this host's architecture.
    """
    host_crossystem = utils.Crossystem(self)
    host_crossystem.init()
    architecture = host_crossystem.arch()
    return architecture
1790
1791
def get_chrome_version(self):
    """Return the Chrome version number and milestone as strings.

    Runs constants.CHROME_VERSION_COMMAND ("chrome --version") on
    the host and hands its output to utils.parse_chrome_version().

    @return A tuple (chrome_ver, milestone) where "chrome_ver" is the
            current Chrome version number as a string (in the form
            "W.X.Y.Z") and "milestone" is the first component of the
            version number (the "W" from "W.X.Y.Z").  If the version
            number cannot be parsed in the "W.X.Y.Z" format, the
            "chrome_ver" will be the full output of "chrome --version"
            and the milestone will be the empty string.

    """
    result = self.run(constants.CHROME_VERSION_COMMAND)
    return utils.parse_chrome_version(result.stdout)
1807
@label_decorator()
def get_board(self):
    """Build the board label for this host from /etc/lsb-release.

    @returns a string representing this host's board.
    """
    lsb_release = utils.parse_cmd_output('cat /etc/lsb-release',
                                         run_method=self.run)
    board = lsb_release['CHROMEOS_RELEASE_BOARD']
    label_format = ds_constants.BOARD_PREFIX + '%s'
    # Devices in the lab generally have the correct board name but our
    # own development devices have {board_name}-signed-{key_type}.  The
    # board name may also begin with 'x86-' which we need to keep.
    pieces = board.split('-')
    if 'x86' in board:
        return label_format % '-'.join(pieces[0:2])
    return label_format % pieces[0]
Simran Basic6f1f7a2012-10-16 10:47:46 -07001824
1825
@label_decorator('lightsensor')
def has_lightsensor(self):
    """Look for light sensor files on this host.

    @returns the string 'lightsensor' if this host has a lightsensor or
             None if it does not.
    """
    wanted_files = '|'.join(self._LIGHTSENSOR_FILES)
    search_cmd = "find -L %s -maxdepth 4 | egrep '%s'" % (
            self._LIGHTSENSOR_SEARCH_DIR, wanted_files)
    try:
        # The search follows symlinks.  Stderr_tee is set to None as
        # there can be a symlink loop, but the command will still
        # execute correctly with a few messages printed to stderr.
        self.run(search_cmd, stdout_tee=None, stderr_tee=None)
    except error.AutoservRunError:
        # egrep exited with a return code of 1 meaning none of the
        # possible lightsensor files existed.
        return None
    else:
        return 'lightsensor'
1845
1846
@label_decorator('bluetooth')
def has_bluetooth(self):
    """Check for /sys/class/bluetooth/hci0 on this host.

    @returns the string 'bluetooth' if this host has bluetooth or
             None if it does not.
    """
    try:
        self.run('test -d /sys/class/bluetooth/hci0')
    except error.AutoservRunError:
        # test exited with a return code 1 meaning the directory did
        # not exist.
        return None
    else:
        # test exited with a return code of 0.
        return 'bluetooth'
1862
1863
@label_decorator('graphics')
def get_graphics(self):
    """
    Pick the graphics label for this host from `uname -a`.

    @returns a string representing this host's graphics. For now ARM
             boards return graphics:gles while all other boards return
             graphics:gl. This may change over time, but for robustness
             reasons this should avoid executing code in actual graphics
             libraries (which may not be ready and is tested by
             graphics_GLAPICheck).
    """
    kernel_info = self.run('uname -a').stdout.lower()
    return 'graphics:gles' if 'arm' in kernel_info else 'graphics:gl'
1879
1880
@label_decorator('ec')
def get_ec(self):
    """
    Determine the type of EC on this host from `mosys ec info`.

    @returns a string representing this host's embedded controller type.
             At present, it only returns "ec:cros", for Chrome OS ECs.
             Other types of EC (or none) return None, since no tests
             depend on those.
    """
    cmd = 'mosys ec info'
    # The output should look like these, so that the last field should
    # match our EC version scheme:
    #
    #   stm | stm32f100 | snow_v1.3.139-375eb9f
    #   ti | Unknown-10de | peppy_v1.5.114-5d52788
    #
    # Non-Chrome OS ECs will look like these:
    #
    #   ENE | KB932 | 00BE107A00
    #   ite | it8518 | 3.08
    #
    # And some systems don't have ECs at all (Lumpy, for example).
    regexp = r'^.*\|\s*(\S+_v\d+\.\d+\.\d+-[0-9a-f]+)\s*$'

    ecinfo = self.run(command=cmd, ignore_status=True)
    if ecinfo.exit_status != 0:
        # No EC present
        logging.info("%s exited with status %d", cmd, ecinfo.exit_status)
        return None

    version_match = re.search(regexp, ecinfo.stdout)
    if not version_match:
        # Has an EC, but it's not a Chrome OS EC
        logging.info("%s got: %s", cmd, ecinfo.stdout)
        return None

    logging.info("EC version is %s", version_match.group(1))
    return 'ec:cros'
1918
1919
@label_decorator('accels')
def get_accels(self):
    """
    Determine the type of accelerometers on this host using ectool.

    @returns a string representing this host's accelerometer type.
             At present, it only returns "accel:cros-ec", for
             accelerometers attached to a Chrome OS EC, or None, if
             no accelerometers.
    """
    # Check to make sure we have ectool
    if self.run('which ectool', ignore_status=True).exit_status:
        logging.info("No ectool cmd found, assuming no EC accelerometers")
        return None

    # Check that the EC supports the motionsense command
    if self.run('ectool motionsense', ignore_status=True).exit_status:
        logging.info("EC does not support motionsense command "
                     "assuming no EC accelerometers")
        return None

    # Check that EC motion sensors are active; only the first line
    # of the command's output is examined.
    active_output = self.run('ectool motionsense active').stdout
    first_line = active_output.split('\n')[0]
    if first_line == "0":
        logging.info("Motion sense inactive, assuming no EC accelerometers")
        return None

    logging.info("EC accelerometers found")
    return 'accel:cros-ec'
1950
1951
@label_decorator('chameleon')
def has_chameleon(self):
    """Determine whether a Chameleon is connected to this host.

    @returns the string 'chameleon' if `self._chameleon_host` is truthy,
             otherwise None.
    """
    return 'chameleon' if self._chameleon_host else None
1963
1964
@label_decorator('storage')
def get_storage(self):
    """
    Determine the type of boot device for this host.

    Determine if the internal device is a SCSI or an MMC block device,
    then check whether it is an SSD, an HDD, an eMMC or something else.

    @returns a string representing this host's internal device type.
             'storage:ssd' when internal device is solid state drive
             'storage:hdd' when internal device is hard disk drive
             'storage:mmc' when internal device is mmc drive
             None          when internal device is something else or
                           when we are unable to determine the type
    """
    # The output should be /dev/mmcblk* for SD/eMMC or /dev/sd* for scsi
    rootdev_cmd = ' '.join(['. /usr/sbin/write_gpt.sh;',
                            '. /usr/share/misc/chromeos-common.sh;',
                            'load_base_vars;',
                            'get_fixed_dst_drive'])
    rootdev = self.run(command=rootdev_cmd, ignore_status=True)
    if rootdev.exit_status:
        logging.info("Fail to run %s", rootdev_cmd)
        return None
    rootdev_str = rootdev.stdout.strip()

    if not rootdev_str:
        return None

    rootdev_base = os.path.basename(rootdev_str)

    mmc_pattern = r'/dev/mmcblk[0-9]'
    if re.match(mmc_pattern, rootdev_str):
        # Use type to determine if the internal device is eMMC or something
        # else. We can assume that MMC is always an internal device.
        type_cmd = 'cat /sys/block/%s/device/type' % rootdev_base
        # Named type_result so the builtin `type` is not shadowed.
        type_result = self.run(command=type_cmd, ignore_status=True)
        if type_result.exit_status:
            logging.info("Fail to run %s", type_cmd)
            return None
        type_str = type_result.stdout.strip()

        if type_str == 'MMC':
            return 'storage:mmc'

    scsi_pattern = r'/dev/sd[a-z]+'
    # Match against the stripped device path, like the MMC check above;
    # re.match anchors at the start, so leading whitespace in the raw
    # stdout would otherwise make a valid SCSI device fall through.
    if re.match(scsi_pattern, rootdev_str):
        # Read symlink for /sys/block/sd* to determine if the internal
        # device is connected via ata or usb.
        link_cmd = 'readlink /sys/block/%s' % rootdev_base
        link = self.run(command=link_cmd, ignore_status=True)
        if link.exit_status:
            logging.info("Fail to run %s", link_cmd)
            return None
        link_str = link.stdout.strip()
        if 'usb' in link_str:
            return None

        # Read rotation to determine if the internal device is ssd or hdd.
        rotate_cmd = 'cat /sys/block/%s/queue/rotational' % rootdev_base
        rotate = self.run(command=rotate_cmd, ignore_status=True)
        if rotate.exit_status:
            logging.info("Fail to run %s", rotate_cmd)
            return None
        rotate_str = rotate.stdout.strip()

        # Any value other than '0' or '1' yields None.
        rotate_dict = {'0': 'storage:ssd', '1': 'storage:hdd'}
        return rotate_dict.get(rotate_str)

    # All other internal device / error case will always fall here
    return None
2037
2038
@label_decorator('servo')
def get_servo(self):
    """Report whether the host has a servo attached.

    A host with a working servo attached should carry the servo label.

    @return: string 'servo' if `self._servo_host` is truthy. Otherwise,
             returns None.
    """
    if not self._servo_host:
        return None
    return 'servo'
2049
2050
@label_decorator('video_labels')
def get_video_labels(self):
    """Run /usr/local/bin/avtest_label_detect to get a list of video labels.

    Sample output of avtest_label_detect:
    Detected label: hw_video_acc_vp8
    Detected label: webcam

    @return: A list of labels detected by tool avtest_label_detect, or an
             empty list if running the tool raises AutoservRunError.
    """
    # Keep only the remote call inside the try block; it is the only
    # statement expected to raise AutoservRunError.
    try:
        result = self.run('/usr/local/bin/avtest_label_detect').stdout
    except error.AutoservRunError:
        # The run failed; presumably the tool is not installed.
        return []
    # Raw string so that \w reaches the regex engine as written, not as
    # an invalid string escape.
    return re.findall(r'^Detected label: (\w+)$', result, re.M)
2067
2068
def get_labels(self):
    """Return a list of labels for this given host.

    This is the main way to retrieve all the automatic labels for a host
    as it will run through all the currently implemented label functions.

    Each function in `self._LABEL_FUNCTIONS` is called with this host.  A
    string result contributes one label and a list result contributes all
    of its items; falsy results and results of any other type are ignored.

    @return: A list with the collected labels, in the order the label
             functions are listed.
    """
    labels = []
    for label_function in self._LABEL_FUNCTIONS:
        label = label_function(self)
        if not label:
            continue
        # isinstance (rather than an exact type comparison) so that str
        # and list subclasses are not silently dropped.
        if isinstance(label, str):
            labels.append(label)
        elif isinstance(label, list):
            labels.extend(label)
    return labels
Dan Shi85276d42014-04-08 22:11:45 -07002084
2085
def is_boot_from_usb(self):
    """Check whether the DUT booted from a removable device.

    Asks the host for its root device with `rootdev -s -d`, then reads
    that device's `removable` flag from /sys/block.

    @return: True if the `removable` flag of the root device is 1.
    """
    root_device = self.run('rootdev -s -d').stdout.strip()
    device_name = os.path.basename(root_device)
    flag_output = self.run('cat /sys/block/%s/removable' % device_name).stdout
    return int(flag_output.strip()) == 1