blob: c5cb10a6da6cb615a6116fe39c0053387aad5065 [file] [log] [blame]
J. Richard Barnette24adbf42012-04-11 15:04:53 -07001# Copyright (c) 2012 The Chromium OS Authors. All rights reserved.
Dale Curtisaa5eedb2011-08-23 16:18:52 -07002# Use of this source code is governed by a BSD-style license that can be
3# found in the LICENSE file.
4
Aviv Keshet74c89a92013-02-04 15:18:30 -08005import functools
Christopher Wiley0ed712b2013-04-09 15:25:12 -07006import httplib
J. Richard Barnette1d78b012012-05-15 13:56:30 -07007import logging
Dan Shi0f466e82013-02-22 15:44:58 -08008import os
Simran Basid5e5e272012-09-24 15:23:59 -07009import re
Christopher Wileyd78249a2013-03-01 13:05:31 -080010import socket
J. Richard Barnette1d78b012012-05-15 13:56:30 -070011import subprocess
J. Richard Barnette134ec2c2012-04-25 12:59:37 -070012import time
J. Richard Barnette1d78b012012-05-15 13:56:30 -070013import xmlrpclib
J. Richard Barnette134ec2c2012-04-25 12:59:37 -070014
J. Richard Barnette45e93de2012-04-11 17:24:15 -070015from autotest_lib.client.bin import utils
Richard Barnette0c73ffc2012-11-19 15:21:18 -080016from autotest_lib.client.common_lib import error
17from autotest_lib.client.common_lib import global_config
J. Richard Barnette45e93de2012-04-11 17:24:15 -070018from autotest_lib.client.common_lib.cros import autoupdater
Richard Barnette03a0c132012-11-05 12:40:35 -080019from autotest_lib.client.common_lib.cros import dev_server
Christopher Wileyd78249a2013-03-01 13:05:31 -080020from autotest_lib.client.common_lib.cros import retry
Richard Barnette82c35912012-11-20 10:09:10 -080021from autotest_lib.client.cros import constants
J. Richard Barnette84890bd2014-02-21 11:05:47 -080022from autotest_lib.client.cros import cros_ui
J. Richard Barnette45e93de2012-04-11 17:24:15 -070023from autotest_lib.server import autoserv_parser
Dan Shia1ecd5c2013-06-06 11:21:31 -070024from autotest_lib.server import utils as server_utils
Scott Zawalski89c44dd2013-02-26 09:28:02 -050025from autotest_lib.server.cros.dynamic_suite import constants as ds_constants
Simran Basi5e6339a2013-03-21 11:34:32 -070026from autotest_lib.server.cros.dynamic_suite import tools, frontend_wrappers
Fang Deng96667ca2013-08-01 17:46:18 -070027from autotest_lib.server.hosts import abstract_ssh
Tom Wai-Hong Tamefe1c7f2014-01-02 14:00:11 +080028from autotest_lib.server.hosts import chameleon_host
Fang Deng5d518f42013-08-02 14:04:32 -070029from autotest_lib.server.hosts import servo_host
beeps687243d2013-07-18 15:29:27 -070030from autotest_lib.site_utils.graphite import stats
Simran Basidcff4252012-11-20 16:13:20 -080031from autotest_lib.site_utils.rpm_control_system import rpm_client
Simran Basid5e5e272012-09-24 15:23:59 -070032
33
beeps32a63082013-08-22 14:02:29 -070034try:
35 import jsonrpclib
36except ImportError:
37 jsonrpclib = None
Fang Deng96667ca2013-08-01 17:46:18 -070038
Fang Dengd1c2b732013-08-20 12:59:46 -070039
class FactoryImageCheckerException(error.AutoservError):
    """Signals that the image under inspection is a factory image."""
43
44
def add_label_detector(label_function_list, label_list=None, label=None):
    """Build a decorator that registers a function as a label detector.

    The returned decorator appends the decorated function to
    `label_function_list` and hands the function back unchanged.  When
    both a truthy `label` and a `label_list` are supplied, `label` is
    appended to `label_list` as well.

    @param label_function_list: List that collects the decorated
                                label detecting functions.
    @param label_list: List that collects detectable label strings, or
                       None to skip label bookkeeping. (Default: None)
    @param label: Label string detectable by the decorated function.
                  (Default: None)

    @returns: A decorator taking the detector function.
    """
    def register(detector):
        """
        @param detector: The function to be added as a detector.

        @returns: `detector`, unmodified.
        """
        label_function_list.append(detector)
        # Nothing to record unless we have both a label and a place
        # to store it.
        if not label or label_list is None:
            return detector
        label_list.append(label)
        return detector

    return register
63
64
Fang Deng0ca40e22013-08-27 17:47:44 -070065class CrosHost(abstract_ssh.AbstractSSHHost):
J. Richard Barnette45e93de2012-04-11 17:24:15 -070066 """Chromium OS specific subclass of Host."""
67
68 _parser = autoserv_parser.autoserv_parser
Scott Zawalski62bacae2013-03-05 10:40:32 -050069 _AFE = frontend_wrappers.RetryingAFE(timeout_min=5, delay_sec=10)
J. Richard Barnette45e93de2012-04-11 17:24:15 -070070
Richard Barnette03a0c132012-11-05 12:40:35 -080071 # Timeout values (in seconds) associated with various Chrome OS
72 # state changes.
J. Richard Barnette134ec2c2012-04-25 12:59:37 -070073 #
Richard Barnette0c73ffc2012-11-19 15:21:18 -080074 # In general, a good rule of thumb is that the timeout can be up
75 # to twice the typical measured value on the slowest platform.
76 # The times here have not necessarily been empirically tested to
77 # meet this criterion.
J. Richard Barnetteeb69d722012-06-18 17:29:44 -070078 #
79 # SLEEP_TIMEOUT: Time to allow for suspend to memory.
Richard Barnette0c73ffc2012-11-19 15:21:18 -080080 # RESUME_TIMEOUT: Time to allow for resume after suspend, plus
    #   time to restart the network.
J. Richard Barnette84890bd2014-02-21 11:05:47 -080082 # SHUTDOWN_TIMEOUT: Time to allow for shut down.
J. Richard Barnetteeb69d722012-06-18 17:29:44 -070083 # BOOT_TIMEOUT: Time to allow for boot from power off. Among
Richard Barnette0c73ffc2012-11-19 15:21:18 -080084 # other things, this must account for the 30 second dev-mode
J. Richard Barnetted4649c62013-03-06 17:42:27 -080085 # screen delay and time to start the network.
J. Richard Barnetteeb69d722012-06-18 17:29:44 -070086 # USB_BOOT_TIMEOUT: Time to allow for boot from a USB device,
Richard Barnette0c73ffc2012-11-19 15:21:18 -080087 # including the 30 second dev-mode delay and time to start the
J. Richard Barnetted4649c62013-03-06 17:42:27 -080088 # network.
beepsf079cfb2013-09-18 17:49:51 -070089 # INSTALL_TIMEOUT: Time to allow for chromeos-install.
J. Richard Barnette84890bd2014-02-21 11:05:47 -080090 # POWERWASH_BOOT_TIMEOUT: Time to allow for a reboot that
91 # includes powerwash.
J. Richard Barnetteeb69d722012-06-18 17:29:44 -070092
93 SLEEP_TIMEOUT = 2
J. Richard Barnetted4649c62013-03-06 17:42:27 -080094 RESUME_TIMEOUT = 10
Tom Wai-Hong Tam4d169ed2014-02-14 11:05:40 +080095 SHUTDOWN_TIMEOUT = 5
J. Richard Barnettefbcc7122013-07-24 18:24:59 -070096 BOOT_TIMEOUT = 60
J. Richard Barnetteeb69d722012-06-18 17:29:44 -070097 USB_BOOT_TIMEOUT = 150
J. Richard Barnette84890bd2014-02-21 11:05:47 -080098 INSTALL_TIMEOUT = 240
Dan Shi2c88eed2013-11-12 10:18:38 -080099 POWERWASH_BOOT_TIMEOUT = 60
Chris Sosab76e0ee2013-05-22 16:55:41 -0700100
J. Richard Barnette84890bd2014-02-21 11:05:47 -0800101 # REBOOT_TIMEOUT: How long to wait for a reboot.
102 #
Chris Sosab76e0ee2013-05-22 16:55:41 -0700103 # We have a long timeout to ensure we don't flakily fail due to other
104 # issues. Shorter timeouts are vetted in platform_RebootAfterUpdate.
Simran Basi1160e2c2013-10-04 16:00:24 -0700105 # TODO(sbasi - crbug.com/276094) Restore to 5 mins once the 'host did not
106 # return from reboot' bug is solved.
107 REBOOT_TIMEOUT = 480
Chris Sosab76e0ee2013-05-22 16:55:41 -0700108
Ismail Noorbasha07fdb612013-02-14 14:13:31 -0800109 # _USB_POWER_TIMEOUT: Time to allow for USB to power toggle ON and OFF.
110 # _POWER_CYCLE_TIMEOUT: Time to allow for manual power cycle.
111 _USB_POWER_TIMEOUT = 5
112 _POWER_CYCLE_TIMEOUT = 10
113
beeps32a63082013-08-22 14:02:29 -0700114 _RPC_PROXY_URL = 'http://localhost:%d'
Christopher Wileydd181852013-10-10 19:56:58 -0700115 _RPC_SHUTDOWN_POLLING_PERIOD_SECONDS = 2
116 _RPC_SHUTDOWN_TIMEOUT_SECONDS = 20
Richard Barnette0c73ffc2012-11-19 15:21:18 -0800117
Richard Barnette82c35912012-11-20 10:09:10 -0800118 _RPM_RECOVERY_BOARDS = global_config.global_config.get_config_value('CROS',
119 'rpm_recovery_boards', type=str).split(',')
120
121 _MAX_POWER_CYCLE_ATTEMPTS = 6
122 _LAB_MACHINE_FILE = '/mnt/stateful_partition/.labmachine'
123 _RPM_HOSTNAME_REGEX = ('chromeos[0-9]+(-row[0-9]+)?-rack[0-9]+[a-z]*-'
124 'host[0-9]+')
125 _LIGHTSENSOR_FILES = ['in_illuminance0_input',
126 'in_illuminance0_raw',
127 'illuminance0_input']
128 _LIGHTSENSOR_SEARCH_DIR = '/sys/bus/iio/devices'
129 _LABEL_FUNCTIONS = []
Aviv Keshet74c89a92013-02-04 15:18:30 -0800130 _DETECTABLE_LABELS = []
131 label_decorator = functools.partial(add_label_detector, _LABEL_FUNCTIONS,
132 _DETECTABLE_LABELS)
J. Richard Barnette134ec2c2012-04-25 12:59:37 -0700133
J. Richard Barnetteb6de7e32013-02-14 13:28:04 -0800134 # Constants used in ping_wait_up() and ping_wait_down().
135 #
136 # _PING_WAIT_COUNT is the approximate number of polling
137 # cycles to use when waiting for a host state change.
138 #
139 # _PING_STATUS_DOWN and _PING_STATUS_UP are names used
140 # for arguments to the internal _ping_wait_for_status()
141 # method.
142 _PING_WAIT_COUNT = 40
143 _PING_STATUS_DOWN = False
144 _PING_STATUS_UP = True
145
Ismail Noorbasha07fdb612013-02-14 14:13:31 -0800146 # Allowed values for the power_method argument.
147
148 # POWER_CONTROL_RPM: Passed as default arg for power_off/on/cycle() methods.
149 # POWER_CONTROL_SERVO: Used in set_power() and power_cycle() methods.
150 # POWER_CONTROL_MANUAL: Used in set_power() and power_cycle() methods.
151 POWER_CONTROL_RPM = 'RPM'
152 POWER_CONTROL_SERVO = 'servoj10'
153 POWER_CONTROL_MANUAL = 'manual'
154
155 POWER_CONTROL_VALID_ARGS = (POWER_CONTROL_RPM,
156 POWER_CONTROL_SERVO,
157 POWER_CONTROL_MANUAL)
Richard Barnette0c73ffc2012-11-19 15:21:18 -0800158
Simran Basi5e6339a2013-03-21 11:34:32 -0700159 _RPM_OUTLET_CHANGED = 'outlet_changed'
160
beeps687243d2013-07-18 15:29:27 -0700161
J. Richard Barnette964fba02012-10-24 17:34:29 -0700162 @staticmethod
beeps46dadc92013-11-07 14:07:10 -0800163 def check_host(host, timeout=10):
164 """
165 Check if the given host is a chrome-os host.
166
167 @param host: An ssh host representing a device.
168 @param timeout: The timeout for the run command.
169
170 @return: True if the host device is chromeos.
171
beeps46dadc92013-11-07 14:07:10 -0800172 """
173 try:
Christopher Wiley1ea80942014-02-26 16:45:08 -0800174 result = host.run('grep -q CHROMEOS /etc/lsb-release && '
175 '! which adb >/dev/null 2>&1',
Christopher Wileyfc3eac02013-11-21 16:24:57 -0800176 ignore_status=True, timeout=timeout)
beeps46dadc92013-11-07 14:07:10 -0800177 except (error.AutoservRunError, error.AutoservSSHTimeout):
178 return False
179 return result.exit_status == 0
180
181
182 @staticmethod
Tom Wai-Hong Tamefe1c7f2014-01-02 14:00:11 +0800183 def _extract_arguments(args_dict, key_subset):
184 """Extract options from `args_dict` and return a subset result.
J. Richard Barnette7214e0b2013-02-06 15:20:49 -0800185
186 Take the provided dictionary of argument options and return
Tom Wai-Hong Tamefe1c7f2014-01-02 14:00:11 +0800187 a subset that represent standard arguments needed to construct
188 a test-assistant object (chameleon or servo) for a host. The
189 intent is to provide standard argument processing from
190 run_remote_tests for tests that require a test-assistant board
191 to operate.
192
193 @param args_dict Dictionary from which to extract the arguments.
194 @param key_subset Tuple of keys to extract from the args_dict, e.g.
195 ('servo_host', 'servo_port').
196 """
197 result = {}
198 for arg in key_subset:
199 if arg in args_dict:
200 result[arg] = args_dict[arg]
201 return result
202
203
204 @staticmethod
205 def get_chameleon_arguments(args_dict):
206 """Extract chameleon options from `args_dict` and return the result.
207
208 Recommended usage:
209 ~~~~~~~~
210 args_dict = utils.args_to_dict(args)
211 chameleon_args = hosts.CrosHost.get_chameleon_arguments(args_dict)
212 host = hosts.create_host(machine, chameleon_args=chameleon_args)
213 ~~~~~~~~
214
215 @param args_dict Dictionary from which to extract the chameleon
216 arguments.
217 """
218 return CrosHost._extract_arguments(
219 args_dict, ('chameleon_host', 'chameleon_port'))
220
221
222 @staticmethod
223 def get_servo_arguments(args_dict):
224 """Extract servo options from `args_dict` and return the result.
J. Richard Barnette7214e0b2013-02-06 15:20:49 -0800225
226 Recommended usage:
227 ~~~~~~~~
228 args_dict = utils.args_to_dict(args)
Fang Deng0ca40e22013-08-27 17:47:44 -0700229 servo_args = hosts.CrosHost.get_servo_arguments(args_dict)
J. Richard Barnette7214e0b2013-02-06 15:20:49 -0800230 host = hosts.create_host(machine, servo_args=servo_args)
231 ~~~~~~~~
232
233 @param args_dict Dictionary from which to extract the servo
234 arguments.
235 """
Tom Wai-Hong Tamefe1c7f2014-01-02 14:00:11 +0800236 return CrosHost._extract_arguments(
237 args_dict, ('servo_host', 'servo_port'))
J. Richard Barnette134ec2c2012-04-25 12:59:37 -0700238
J. Richard Barnette964fba02012-10-24 17:34:29 -0700239
Tom Wai-Hong Tamefe1c7f2014-01-02 14:00:11 +0800240 def _initialize(self, hostname, chameleon_args=None, servo_args=None,
241 ssh_verbosity_flag='', ssh_options='',
Fang Dengd1c2b732013-08-20 12:59:46 -0700242 *args, **dargs):
Tom Wai-Hong Tamefe1c7f2014-01-02 14:00:11 +0800243 """Initialize superclasses, |self.chameleon|, and |self.servo|.
J. Richard Barnette67ccb872012-04-19 16:34:56 -0700244
Tom Wai-Hong Tamefe1c7f2014-01-02 14:00:11 +0800245 This method checks whether a chameleon/servo (aka
246 test-assistant objects) is required by checking whether
247 chameleon_args/servo_args is None. This method will only
248 attempt to create the test-assistant object when it is
249 required by the test.
Fang Deng5d518f42013-08-02 14:04:32 -0700250
Tom Wai-Hong Tamefe1c7f2014-01-02 14:00:11 +0800251 For creating the test-assistant object, there are three
252 possibilities: First, if the host is a lab system known to have
253 a test-assistant board, we connect to that board unconditionally.
J. Richard Barnette67ccb872012-04-19 16:34:56 -0700254 Second, if we're called from a control file that requires
Tom Wai-Hong Tamefe1c7f2014-01-02 14:00:11 +0800255 test-assistant features for testing, it will pass settings from
256 the arguments, like `servo_host`, `servo_port`. If neither of
257 these cases apply, the test-assistant object will be `None`.
J. Richard Barnette67ccb872012-04-19 16:34:56 -0700258
259 """
Fang Deng0ca40e22013-08-27 17:47:44 -0700260 super(CrosHost, self)._initialize(hostname=hostname,
J. Richard Barnette45e93de2012-04-11 17:24:15 -0700261 *args, **dargs)
J. Richard Barnettef0859852012-08-20 14:55:50 -0700262 # self.env is a dictionary of environment variable settings
263 # to be exported for commands run on the host.
264 # LIBC_FATAL_STDERR_ can be useful for diagnosing certain
265 # errors that might happen.
266 self.env['LIBC_FATAL_STDERR_'] = '1'
beeps32a63082013-08-22 14:02:29 -0700267 self._rpc_proxy_map = {}
Fang Dengd1c2b732013-08-20 12:59:46 -0700268 self._ssh_verbosity_flag = ssh_verbosity_flag
Aviv Keshetc5947fa2013-09-04 14:06:29 -0700269 self._ssh_options = ssh_options
Fang Deng5d518f42013-08-02 14:04:32 -0700270 # TODO(fdeng): We need to simplify the
271 # process of servo and servo_host initialization.
272 # crbug.com/298432
Dan Shi4d478522014-02-14 13:46:32 -0800273 self._servo_host = servo_host.create_servo_host(dut=self.hostname,
274 servo_args=servo_args)
Tom Wai-Hong Tamefe1c7f2014-01-02 14:00:11 +0800275 # TODO(waihong): Do the simplication on Chameleon too.
276 self._chameleon_host = self._create_chameleon_host(chameleon_args)
Dan Shi4d478522014-02-14 13:46:32 -0800277 if self._servo_host is not None:
278 self.servo = self._servo_host.get_servo()
279 else:
280 self.servo = None
281
Tom Wai-Hong Tamefe1c7f2014-01-02 14:00:11 +0800282 if chameleon_args is not None:
Tom Wai-Hong Tameaee3402014-01-22 08:52:10 +0800283 self.chameleon = self._chameleon_host.create_chameleon_board()
Tom Wai-Hong Tamefe1c7f2014-01-02 14:00:11 +0800284
285
286 def _create_chameleon_host(self, chameleon_args):
287 """Create a ChameleonHost object.
288
289 There three possible cases:
290 1) If the DUT is in Cros Lab and has a chameleon board, then create
291 a ChameleonHost object pointing to the board. chameleon_args
292 is ignored.
293 2) If not case 1) and chameleon_args is neither None nor empty, then
294 create a ChameleonHost object using chameleon_args.
295 3) If neither case 1) or 2) applies, return None.
296
297 @param chameleon_args: A dictionary that contains args for creating
298 a ChameleonHost object,
299 e.g. {'chameleon_host': '172.11.11.112',
300 'chameleon_port': 9992}.
301
302 @returns: A ChameleonHost object or None.
303
304 """
305 hostname = chameleon_host.make_chameleon_hostname(self.hostname)
306 if utils.host_is_in_lab_zone(hostname):
307 return chameleon_host.ChameleonHost(chameleon_host=hostname)
308 elif chameleon_args is not None:
309 return chameleon_host.ChameleonHost(**chameleon_args)
310 else:
311 return None
Fang Deng5d518f42013-08-02 14:04:32 -0700312
313
Scott Zawalski89c44dd2013-02-26 09:28:02 -0500314 def get_repair_image_name(self):
315 """Generate a image_name from variables in the global config.
316
317 @returns a str of $board-version/$BUILD.
318
319 """
320 stable_version = global_config.global_config.get_config_value(
321 'CROS', 'stable_cros_version')
322 build_pattern = global_config.global_config.get_config_value(
323 'CROS', 'stable_build_pattern')
324 board = self._get_board_from_afe()
325 if board is None:
326 raise error.AutoservError('DUT has no board attribute, '
327 'cannot be repaired.')
328 return build_pattern % (board, stable_version)
329
330
Scott Zawalski62bacae2013-03-05 10:40:32 -0500331 def _host_in_AFE(self):
332 """Check if the host is an object the AFE knows.
333
334 @returns the host object.
335 """
336 return self._AFE.get_hosts(hostname=self.hostname)
337
338
Chris Sosab76e0ee2013-05-22 16:55:41 -0700339 def lookup_job_repo_url(self):
340 """Looks up the job_repo_url for the host.
341
342 @returns job_repo_url from AFE or None if not found.
343
344 @raises KeyError if the host does not have a job_repo_url
345 """
346 if not self._host_in_AFE():
347 return None
348
349 hosts = self._AFE.get_hosts(hostname=self.hostname)
beepsb5efc532013-06-04 11:29:34 -0700350 if hosts and ds_constants.JOB_REPO_URL in hosts[0].attributes:
351 return hosts[0].attributes[ds_constants.JOB_REPO_URL]
Chris Sosab76e0ee2013-05-22 16:55:41 -0700352
353
Scott Zawalski89c44dd2013-02-26 09:28:02 -0500354 def clear_cros_version_labels_and_job_repo_url(self):
355 """Clear cros_version labels and host attribute job_repo_url."""
Scott Zawalski62bacae2013-03-05 10:40:32 -0500356 if not self._host_in_AFE():
Scott Zawalskieadbf702013-03-14 09:23:06 -0400357 return
358
Scott Zawalski62bacae2013-03-05 10:40:32 -0500359 host_list = [self.hostname]
360 labels = self._AFE.get_labels(
361 name__startswith=ds_constants.VERSION_PREFIX,
362 host__hostname=self.hostname)
Dan Shi0f466e82013-02-22 15:44:58 -0800363
Scott Zawalski62bacae2013-03-05 10:40:32 -0500364 for label in labels:
365 label.remove_hosts(hosts=host_list)
Scott Zawalski89c44dd2013-02-26 09:28:02 -0500366
beepscb6f1e22013-06-28 19:14:10 -0700367 self.update_job_repo_url(None, None)
368
369
370 def update_job_repo_url(self, devserver_url, image_name):
371 """
372 Updates the job_repo_url host attribute and asserts it's value.
373
374 @param devserver_url: The devserver to use in the job_repo_url.
375 @param image_name: The name of the image to use in the job_repo_url.
376
377 @raises AutoservError: If we failed to update the job_repo_url.
378 """
379 repo_url = None
380 if devserver_url and image_name:
381 repo_url = tools.get_package_url(devserver_url, image_name)
382 self._AFE.set_host_attribute(ds_constants.JOB_REPO_URL, repo_url,
Scott Zawalski62bacae2013-03-05 10:40:32 -0500383 hostname=self.hostname)
beepscb6f1e22013-06-28 19:14:10 -0700384 if self.lookup_job_repo_url() != repo_url:
385 raise error.AutoservError('Failed to update job_repo_url with %s, '
386 'host %s' % (repo_url, self.hostname))
Scott Zawalski89c44dd2013-02-26 09:28:02 -0500387
388
Dan Shie9309262013-06-19 22:50:21 -0700389 def add_cros_version_labels_and_job_repo_url(self, image_name):
Scott Zawalskieadbf702013-03-14 09:23:06 -0400390 """Add cros_version labels and host attribute job_repo_url.
391
392 @param image_name: The name of the image e.g.
393 lumpy-release/R27-3837.0.0
Dan Shi7458bf62013-06-10 12:50:16 -0700394
Scott Zawalskieadbf702013-03-14 09:23:06 -0400395 """
Scott Zawalski62bacae2013-03-05 10:40:32 -0500396 if not self._host_in_AFE():
Scott Zawalskieadbf702013-03-14 09:23:06 -0400397 return
Scott Zawalski62bacae2013-03-05 10:40:32 -0500398
Scott Zawalskieadbf702013-03-14 09:23:06 -0400399 cros_label = '%s%s' % (ds_constants.VERSION_PREFIX, image_name)
Dan Shie9309262013-06-19 22:50:21 -0700400 devserver_url = dev_server.ImageServer.resolve(image_name).url()
Scott Zawalski62bacae2013-03-05 10:40:32 -0500401
402 labels = self._AFE.get_labels(name=cros_label)
403 if labels:
404 label = labels[0]
405 else:
406 label = self._AFE.create_label(name=cros_label)
407
408 label.add_hosts([self.hostname])
beepscb6f1e22013-06-28 19:14:10 -0700409 self.update_job_repo_url(devserver_url, image_name)
410
411
beepsdae65fd2013-07-26 16:24:41 -0700412 def verify_job_repo_url(self, tag=''):
beepscb6f1e22013-06-28 19:14:10 -0700413 """
414 Make sure job_repo_url of this host is valid.
415
joychen03eaad92013-06-26 09:55:21 -0700416 Eg: The job_repo_url "http://lmn.cd.ab.xyx:8080/static/\
beepscb6f1e22013-06-28 19:14:10 -0700417 lumpy-release/R29-4279.0.0/autotest/packages" claims to have the
418 autotest package for lumpy-release/R29-4279.0.0. If this isn't the case,
419 download and extract it. If the devserver embedded in the url is
420 unresponsive, update the job_repo_url of the host after staging it on
421 another devserver.
422
423 @param job_repo_url: A url pointing to the devserver where the autotest
424 package for this build should be staged.
beepsdae65fd2013-07-26 16:24:41 -0700425 @param tag: The tag from the server job, in the format
426 <job_id>-<user>/<hostname>, or <hostless> for a server job.
beepscb6f1e22013-06-28 19:14:10 -0700427
428 @raises DevServerException: If we could not resolve a devserver.
429 @raises AutoservError: If we're unable to save the new job_repo_url as
430 a result of choosing a new devserver because the old one failed to
431 respond to a health check.
beeps0c865032013-07-30 11:37:06 -0700432 @raises urllib2.URLError: If the devserver embedded in job_repo_url
433 doesn't respond within the timeout.
beepscb6f1e22013-06-28 19:14:10 -0700434 """
435 job_repo_url = self.lookup_job_repo_url()
436 if not job_repo_url:
437 logging.warning('No job repo url set on host %s', self.hostname)
438 return
439
440 logging.info('Verifying job repo url %s', job_repo_url)
441 devserver_url, image_name = tools.get_devserver_build_from_package_url(
442 job_repo_url)
443
beeps0c865032013-07-30 11:37:06 -0700444 ds = dev_server.ImageServer(devserver_url)
beepscb6f1e22013-06-28 19:14:10 -0700445
446 logging.info('Staging autotest artifacts for %s on devserver %s',
447 image_name, ds.url())
beeps687243d2013-07-18 15:29:27 -0700448
449 start_time = time.time()
beepscb6f1e22013-06-28 19:14:10 -0700450 ds.stage_artifacts(image_name, ['autotest'])
beeps687243d2013-07-18 15:29:27 -0700451 stage_time = time.time() - start_time
452
453 # Record how much of the verification time comes from a devserver
454 # restage. If we're doing things right we should not see multiple
455 # devservers for a given board/build/branch path.
456 try:
J. Richard Barnette3cbd76b2013-11-27 12:11:25 -0800457 board, build_type, branch = server_utils.ParseBuildName(
beeps687243d2013-07-18 15:29:27 -0700458 image_name)[:3]
J. Richard Barnette3cbd76b2013-11-27 12:11:25 -0800459 except server_utils.ParseBuildNameException:
beeps687243d2013-07-18 15:29:27 -0700460 pass
461 else:
beeps0c865032013-07-30 11:37:06 -0700462 devserver = devserver_url[
Chris Sosa65425082013-10-16 13:26:22 -0700463 devserver_url.find('/') + 2:devserver_url.rfind(':')]
beeps687243d2013-07-18 15:29:27 -0700464 stats_key = {
465 'board': board,
466 'build_type': build_type,
467 'branch': branch,
beeps0c865032013-07-30 11:37:06 -0700468 'devserver': devserver.replace('.', '_'),
beeps687243d2013-07-18 15:29:27 -0700469 }
470 stats.Gauge('verify_job_repo_url').send(
471 '%(board)s.%(build_type)s.%(branch)s.%(devserver)s' % stats_key,
472 stage_time)
beepscb6f1e22013-06-28 19:14:10 -0700473
Scott Zawalskieadbf702013-03-14 09:23:06 -0400474
Dan Shi0f466e82013-02-22 15:44:58 -0800475 def _try_stateful_update(self, update_url, force_update, updater):
476 """Try to use stateful update to initialize DUT.
477
478 When DUT is already running the same version that machine_install
479 tries to install, stateful update is a much faster way to clean up
480 the DUT for testing, compared to a full reimage. It is implemeted
481 by calling autoupdater.run_update, but skipping updating root, as
482 updating the kernel is time consuming and not necessary.
483
484 @param update_url: url of the image.
485 @param force_update: Set to True to update the image even if the DUT
486 is running the same version.
487 @param updater: ChromiumOSUpdater instance used to update the DUT.
488 @returns: True if the DUT was updated with stateful update.
489
490 """
J. Richard Barnette3f731032014-04-07 17:42:59 -0700491 # TODO(jrbarnette): Yes, I hate this re.match() test case.
492 # It's better than the alternative: see crbug.com/360944.
493 image_name = autoupdater.url_to_image_name(update_url)
494 release_pattern = r'^.*-release/R[0-9]+-[0-9]+\.[0-9]+\.0$'
495 if not re.match(release_pattern, image_name):
496 return False
Dan Shi0f466e82013-02-22 15:44:58 -0800497 if not updater.check_version():
498 return False
499 if not force_update:
500 logging.info('Canceling stateful update because the new and '
501 'old versions are the same.')
502 return False
503 # Following folders should be rebuilt after stateful update.
504 # A test file is used to confirm each folder gets rebuilt after
505 # the stateful update.
506 folders_to_check = ['/var', '/home', '/mnt/stateful_partition']
507 test_file = '.test_file_to_be_deleted'
508 for folder in folders_to_check:
509 touch_path = os.path.join(folder, test_file)
510 self.run('touch %s' % touch_path)
511
512 if not updater.run_update(force_update=True, update_root=False):
513 return False
514
515 # Reboot to complete stateful update.
Chris Sosab76e0ee2013-05-22 16:55:41 -0700516 self.reboot(timeout=self.REBOOT_TIMEOUT, wait=True)
Dan Shi0f466e82013-02-22 15:44:58 -0800517 check_file_cmd = 'test -f %s; echo $?'
518 for folder in folders_to_check:
519 test_file_path = os.path.join(folder, test_file)
520 result = self.run(check_file_cmd % test_file_path,
521 ignore_status=True)
522 if result.exit_status == 1:
523 return False
524 return True
525
526
J. Richard Barnette7275b612013-06-04 18:13:11 -0700527 def _post_update_processing(self, updater, expected_kernel=None):
Dan Shi0f466e82013-02-22 15:44:58 -0800528 """After the DUT is updated, confirm machine_install succeeded.
529
530 @param updater: ChromiumOSUpdater instance used to update the DUT.
J. Richard Barnette7275b612013-06-04 18:13:11 -0700531 @param expected_kernel: kernel expected to be active after reboot,
532 or `None` to skip rollback checking.
Dan Shi0f466e82013-02-22 15:44:58 -0800533
534 """
J. Richard Barnette7275b612013-06-04 18:13:11 -0700535 # Touch the lab machine file to leave a marker that
536 # distinguishes this image from other test images.
537 # Afterwards, we must re-run the autoreboot script because
538 # it depends on the _LAB_MACHINE_FILE.
Dan Shi0f466e82013-02-22 15:44:58 -0800539 self.run('touch %s' % self._LAB_MACHINE_FILE)
Dan Shi0f466e82013-02-22 15:44:58 -0800540 self.run('start autoreboot')
Chris Sosa65425082013-10-16 13:26:22 -0700541 updater.verify_boot_expectations(
542 expected_kernel, rollback_message=
543 'Build %s failed to boot on %s; system rolled back to previous'
544 'build' % (updater.update_version, self.hostname))
J. Richard Barnette7275b612013-06-04 18:13:11 -0700545 # Check that we've got the build we meant to install.
546 if not updater.check_version_to_confirm_install():
547 raise autoupdater.ChromiumOSError(
548 'Failed to update %s to build %s; found build '
549 '%s instead' % (self.hostname,
Chris Sosa65425082013-10-16 13:26:22 -0700550 updater.update_version,
551 updater.get_build_id()))
Dan Shi0f466e82013-02-22 15:44:58 -0800552
553
J. Richard Barnettee4af8b92013-05-01 13:16:12 -0700554 def _stage_image_for_update(self, image_name=None):
Scott Zawalskieadbf702013-03-14 09:23:06 -0400555 """Stage a build on a devserver and return the update_url.
556
557 @param image_name: a name like lumpy-release/R27-3837.0.0
558 @returns an update URL like:
559 http://172.22.50.205:8082/update/lumpy-release/R27-3837.0.0
560 """
J. Richard Barnettee4af8b92013-05-01 13:16:12 -0700561 if not image_name:
562 image_name = self.get_repair_image_name()
563 logging.info('Staging build for AU: %s', image_name)
Scott Zawalskieadbf702013-03-14 09:23:06 -0400564 devserver = dev_server.ImageServer.resolve(image_name)
565 devserver.trigger_download(image_name, synchronous=False)
566 return tools.image_url_pattern() % (devserver.url(), image_name)
567
568
J. Richard Barnettee4af8b92013-05-01 13:16:12 -0700569 def stage_image_for_servo(self, image_name=None):
570 """Stage a build on a devserver and return the update_url.
571
572 @param image_name: a name like lumpy-release/R27-3837.0.0
573 @returns an update URL like:
574 http://172.22.50.205:8082/update/lumpy-release/R27-3837.0.0
575 """
576 if not image_name:
577 image_name = self.get_repair_image_name()
578 logging.info('Staging build for servo install: %s', image_name)
579 devserver = dev_server.ImageServer.resolve(image_name)
580 devserver.stage_artifacts(image_name, ['test_image'])
581 return devserver.get_test_image_url(image_name)
582
583
beepse539be02013-07-31 21:57:39 -0700584 def stage_factory_image_for_servo(self, image_name):
585 """Stage a build on a devserver and return the update_url.
586
587 @param image_name: a name like <baord>/4262.204.0
beeps12c0a3c2013-09-03 11:58:27 -0700588
beepse539be02013-07-31 21:57:39 -0700589 @return: An update URL, eg:
590 http://<devserver>/static/canary-channel/\
591 <board>/4262.204.0/factory_test/chromiumos_factory_image.bin
beeps12c0a3c2013-09-03 11:58:27 -0700592
593 @raises: ValueError if the factory artifact name is missing from
594 the config.
595
beepse539be02013-07-31 21:57:39 -0700596 """
597 if not image_name:
598 logging.error('Need an image_name to stage a factory image.')
599 return
600
beeps12c0a3c2013-09-03 11:58:27 -0700601 factory_artifact = global_config.global_config.get_config_value(
602 'CROS', 'factory_artifact', type=str, default='')
603 if not factory_artifact:
604 raise ValueError('Cannot retrieve the factory artifact name from '
605 'autotest config, and hence cannot stage factory '
606 'artifacts.')
607
beepse539be02013-07-31 21:57:39 -0700608 logging.info('Staging build for servo install: %s', image_name)
609 devserver = dev_server.ImageServer.resolve(image_name)
610 devserver.stage_artifacts(
611 image_name,
beeps12c0a3c2013-09-03 11:58:27 -0700612 [factory_artifact],
613 archive_url=None)
beepse539be02013-07-31 21:57:39 -0700614
615 return tools.factory_image_url_pattern() % (devserver.url(), image_name)
616
617
def machine_install(self, update_url=None, force_update=False,
                    local_devserver=False, repair=False):
    """Install a build on the DUT, preferring a stateful update.

    A stateful update is attempted first; it does not update the kernel
    and tends to run much faster than a full reimage. When the stateful
    update is not applicable or fails, a full update (including the
    kernel) is applied instead.

    On entry the host's cros-version labels and its job_repo_url host
    attribute are cleared; they are added back only after a successful
    update.

    @param update_url: The url to use for the update
            pattern: http://$devserver:###/update/$build
            When not given, the url is derived from the image passed on
            the autoserv command line, or (if that is unset and repair
            is True) from the image staged by
            _stage_image_for_update() with no argument.
    @param force_update: Force an update even if the version installed
            is the same. Default: False
    @param local_devserver: Passed through to the ChromiumOSUpdater;
            used by run_remote_test to allow people to use their local
            devserver. Default: False
    @param repair: Whether or not we are in repair mode. In repair mode
            the DUT is rebooted and update-engine is restarted before
            updating, and force_update is set to True. Default: False
    @raises autoupdater.ChromiumOSError

    """
    if update_url:
        logging.debug('update url is set to %s', update_url)
    else:
        logging.debug('update url is not set, resolving...')
        requested_build = self._parser.options.image
        if not requested_build and not repair:
            raise autoupdater.ChromiumOSError(
                    'Update failed. No update URL provided.')

        if requested_build and requested_build.startswith('http://'):
            update_url = requested_build
            logging.debug('update url is retrieved from requested_build'
                          ': %s', update_url)
        else:
            if requested_build:
                # Try to stage any build that does not start with
                # http:// on the devservers defined in
                # global_config.ini.
                update_url = self._stage_image_for_update(requested_build)
            else:
                # Repair mode without an explicit image.
                update_url = self._stage_image_for_update()
            logging.debug('Build staged, and update_url is set to: %s',
                          update_url)

    if repair:
        # In case the system is in a bad state, we always reboot the
        # machine before machine_install.
        self.reboot(timeout=self.REBOOT_TIMEOUT, wait=True)
        self.run('stop update-engine; start update-engine')
        force_update = True

    updater = autoupdater.ChromiumOSUpdater(
            update_url, host=self, local_devserver=local_devserver)
    updated = False
    # Remove cros-version and job_repo_url host attribute from host.
    self.clear_cros_version_labels_and_job_repo_url()

    # If the DUT is already running the same build, try stateful update
    # first.
    try:
        updated = self._try_stateful_update(
                update_url, force_update, updater)
        if updated:
            logging.info('DUT is updated with stateful update.')
    except Exception as stateful_error:
        # Best effort only: fall through to the full update below.
        logging.exception(stateful_error)
        logging.warning('Failed to stateful update DUT, force to update.')

    inactive_kernel = None
    # Do a full update if stateful update is not applicable or failed.
    if not updated:
        # In case the system is in a bad state, we always reboot the
        # machine before machine_install.
        self.reboot(timeout=self.REBOOT_TIMEOUT, wait=True)

        # TODO(sosa): Remove temporary hack to get rid of bricked machines
        # that can't update due to a corrupted policy.
        for command in ('rm -rf /var/lib/whitelist',
                        'touch /var/lib/whitelist',
                        'chmod -w /var/lib/whitelist',
                        'stop update-engine; start update-engine'):
            self.run(command)

        if updater.run_update(force_update):
            updated = True
            # Figure out active and inactive kernel.
            active_kernel, inactive_kernel = updater.get_kernel_state()

            # Ensure inactive kernel has higher priority than active.
            inactive_priority = updater.get_kernel_priority(inactive_kernel)
            active_priority = updater.get_kernel_priority(active_kernel)
            if inactive_priority < active_priority:
                raise autoupdater.ChromiumOSError(
                        'Update failed. The priority of the inactive kernel'
                        ' partition is less than that of the active kernel'
                        ' partition.')

            # Updater has returned successfully; reboot the host.
            self.reboot(timeout=self.REBOOT_TIMEOUT, wait=True)

    if updated:
        self._post_update_processing(updater, inactive_kernel)
        image_name = autoupdater.url_to_image_name(update_url)
        self.add_cros_version_labels_and_job_repo_url(image_name)

    # Clean up any old autotest directories which may be lying around.
    stale_paths = global_config.global_config.get_config_value(
            'AUTOSERV', 'client_autodir_paths', type=list)
    for path in stale_paths:
        self.run('rm -rf ' + path)
736
737
def show_update_engine_log(self):
    """Run `cat` on the update engine log file on the host."""
    log_path = constants.UPDATE_ENGINE_LOG
    logging.debug('Dumping %s', log_path)
    self.run('cat %s' % log_path)
742
743
def _get_board_from_afe(self):
    """Look up this host's board via its AFE labels.

    Delegates to server_utils.get_board_from_afe(), which looks for a
    host label of the form "board:<board>" and returns the "<board>"
    part. `None` is returned if there is not a single, unique label
    matching the pattern.

    @returns board from label, or `None`.
    """
    board = server_utils.get_board_from_afe(self.hostname, self._AFE)
    return board
Simran Basi833814b2013-01-29 13:13:43 -0800754
755
def get_build(self):
    """Look up the current build for this host via its AFE labels.

    Delegates to server_utils.get_build_from_afe().

    @returns The current build or None if it could not find it or if there
             were multiple build labels assigned to this host.
    """
    build = server_utils.get_build_from_afe(self.hostname, self._AFE)
    return build
Richard Barnette82c35912012-11-20 10:09:10 -0800765
766
def _install_repair(self):
    """Attempt to repair this host using update-engine.

    If the host is up, reinstall it by calling machine_install() in
    repair mode, which installs the stable "repair" version of Chrome OS
    defined in the global_config under CROS.stable_cros_version.

    @raises AutoservRepairMethodNA if the DUT is not reachable.
    @raises ChromiumOSError if the install failed for some reason.

    """
    dut_reachable = self.is_up()
    if not dut_reachable:
        raise error.AutoservRepairMethodNA('DUT unreachable for install.')

    logging.info('Attempting to reimage machine to repair image.')
    try:
        self.machine_install(repair=True)
    except autoupdater.ChromiumOSError as install_error:
        # Record the failure, then let the caller see the original error.
        logging.exception(install_error)
        logging.info('Repair via install failed.')
        raise
Scott Zawalski89c44dd2013-02-26 09:28:02 -0500788
789
def _install_repair_with_powerwash(self):
    """Powerwash the DUT, then repair it using update-engine.

    update-engine may fail due to a bad image. In such case, powerwash
    may help to cleanup the DUT for update-engine to work again. The
    powerwash is requested by writing "fast safe" to the
    factory_install_reset file on the stateful partition and rebooting.

    @raises AutoservRepairMethodNA if the DUT is not reachable.
    @raises AutoservRepairFailure if the DUT is not up after the
            powerwash reboot.
    @raises ChromiumOSError if the install failed for some reason.

    """
    if not self.is_up():
        raise error.AutoservRepairMethodNA('DUT unreachable for install.')

    logging.info('Attempting to powerwash the DUT.')
    powerwash_request = ('echo "fast safe" > '
                         '/mnt/stateful_partition/factory_install_reset')
    self.run(powerwash_request)
    self.reboot(timeout=self.POWERWASH_BOOT_TIMEOUT, wait=True)

    came_back = self.is_up()
    if not came_back:
        logging.error('Powerwash failed. DUT did not come back after '
                      'reboot.')
        raise error.AutoservRepairFailure(
                'DUT failed to boot from powerwash after %d seconds' %
                self.POWERWASH_BOOT_TIMEOUT)

    logging.info('Powerwash succeeded.')
    self._install_repair()
816
817
def servo_install(self, image_url=None, usb_boot_timeout=USB_BOOT_TIMEOUT,
                  install_timeout=INSTALL_TIMEOUT):
    """Re-install the OS on the DUT through its servo.

    The steps are:
    1) installing a test image on a USB storage device attached to the
       Servo board,
    2) booting that image in recovery mode,
    3) installing the image with chromeos-install, and then
    4) power cycling the DUT through servo and waiting for it to boot.

    The USB boot phase and the chromeos-install phase are each timed
    with a stats.Timer whose key includes the timeout in use.

    @param image_url: If specified use as the url to install on the DUT.
            otherwise boot the currently staged image on the USB stick.
    @param usb_boot_timeout: The usb_boot_timeout to use during reimage.
            Factory images need a longer usb_boot_timeout than regular
            cros images.
    @param install_timeout: The timeout to use when installing the chromeos
            image. Factory images need a longer install_timeout.

    @raises AutoservRepairFailure if the DUT fails to boot from USB.
    @raises AutoservError if the installed image fails to boot.
    """
    usb_boot_timer_key = ('servo_install.usb_boot_timeout_%s'
                          % usb_boot_timeout)
    logging.info('Downloading image to USB, then booting from it. Usb boot '
                 'timeout = %s', usb_boot_timeout)
    usb_boot_timer = stats.Timer(usb_boot_timer_key)
    usb_boot_timer.start()
    self.servo.install_recovery_image(image_url)
    booted_from_usb = self.wait_up(timeout=usb_boot_timeout)
    if not booted_from_usb:
        raise error.AutoservRepairFailure(
                'DUT failed to boot from USB after %d seconds' %
                usb_boot_timeout)
    usb_boot_timer.stop()

    install_timer_key = ('servo_install.install_timeout_%s'
                         % install_timeout)
    install_timer = stats.Timer(install_timer_key)
    install_timer.start()
    logging.info('Installing image through chromeos-install.')
    self.run('chromeos-install --yes', timeout=install_timeout)
    install_timer.stop()

    logging.info('Power cycling DUT through servo.')
    servo = self.servo
    servo.power_long_press()
    servo.switch_usbkey('off')
    # We *must* use power_on() here; on Parrot it's how we get
    # out of recovery mode.
    servo.get_power_state_controller().power_on()

    logging.info('Waiting for DUT to come back up.')
    if self.wait_up(timeout=self.BOOT_TIMEOUT):
        return
    raise error.AutoservError('DUT failed to reboot installed '
                              'test image after %d seconds' %
                              self.BOOT_TIMEOUT)
871
872
def _servo_repair_reinstall(self):
    """Reinstall the DUT utilizing servo and a test image.

    Stages an image with stage_image_for_servo() and hands its url to
    servo_install(), which re-installs the OS on the DUT by:
    1) installing a test image on a USB storage device attached to the
       Servo board,
    2) booting that image in recovery mode, and then
    3) installing the image with chromeos-install.

    @raises AutoservRepairMethodNA if the device does not have servo
            support.

    """
    if self.servo:
        logging.info('Attempting to recovery servo enabled device with '
                     'servo_repair_reinstall')
        self.servo_install(self.stage_image_for_servo())
        return

    raise error.AutoservRepairMethodNA('Repair Reinstall NA: '
                                       'DUT has no servo support.')
895
896
897 def _servo_repair_power(self):
898 """Attempt to repair DUT using an attached Servo.
899
900 Attempt to power on the DUT via power_long_press.
901
902 @raises AutoservRepairMethodNA if the device does not have servo
903 support.
904 @raises AutoservRepairFailure if the repair fails for any reason.
905 """
906 if not self.servo:
907 raise error.AutoservRepairMethodNA('Repair Power NA: '
908 'DUT has no servo support.')
909
910 logging.info('Attempting to recover servo enabled device by '
911 'powering it off and on.')
912 self.servo.get_power_state_controller().power_off()
913 self.servo.get_power_state_controller().power_on()
914 if self.wait_up(self.BOOT_TIMEOUT):
915 return
916
917 raise error.AutoservRepairFailure('DUT did not boot after long_press.')
Richard Barnette03a0c132012-11-05 12:40:35 -0800918
919
Richard Barnette82c35912012-11-20 10:09:10 -0800920 def _powercycle_to_repair(self):
921 """Utilize the RPM Infrastructure to bring the host back up.
922
923 If the host is not up/repaired after the first powercycle we utilize
924 auto fallback to the last good install by powercycling and rebooting the
925 host 6 times.
Scott Zawalski62bacae2013-03-05 10:40:32 -0500926
927 @raises AutoservRepairMethodNA if the device does not support remote
928 power.
929 @raises AutoservRepairFailure if the repair fails for any reason.
930
Richard Barnette82c35912012-11-20 10:09:10 -0800931 """
Scott Zawalski62bacae2013-03-05 10:40:32 -0500932 if not self.has_power():
933 raise error.AutoservRepairMethodNA('Device does not support power.')
934
Richard Barnette82c35912012-11-20 10:09:10 -0800935 logging.info('Attempting repair via RPM powercycle.')
936 failed_cycles = 0
937 self.power_cycle()
938 while not self.wait_up(timeout=self.BOOT_TIMEOUT):
939 failed_cycles += 1
940 if failed_cycles >= self._MAX_POWER_CYCLE_ATTEMPTS:
Scott Zawalski62bacae2013-03-05 10:40:32 -0500941 raise error.AutoservRepairFailure(
942 'Powercycled host %s %d times; device did not come back'
943 ' online.' % (self.hostname, failed_cycles))
Richard Barnette82c35912012-11-20 10:09:10 -0800944 self.power_cycle()
945 if failed_cycles == 0:
946 logging.info('Powercycling was successful first time.')
947 else:
948 logging.info('Powercycling was successful after %d failures.',
949 failed_cycles)
950
951
def repair_full(self):
    """Repair a host for repair level NO_PROTECTION.

    This overrides the base class function for repair; it does
    not call back to the parent class, but instead offers a
    simplified implementation based on the capabilities in the
    Chrome OS test lab.

    If the host has a servo host but no servo object yet, the servo
    host is repaired first (failures are only logged) and a servo is
    obtained from it.

    The following procedures are then attempted in order, stopping at
    the first one after which `self.verify()` passes:
      1. If there's a servo for the DUT, try to power the DUT off and
         on.
      2. Try to re-install to a known stable image using auto-update.
      3. Powerwash the DUT, then try the auto-update re-install again.
      4. If there's a servo for the DUT, try to re-install via
         the servo.
      5. If the DUT can be power-cycled via RPM, try to repair
         by power-cycling.

    Every attempt bumps a stats counter named after the repair function
    and its outcome (SUCCEEDED, RepairNA or FAILED), plus a per-board
    counter when the board is known.

    @raises AutoservRepairTotalFailure if the repair process fails to
            fix the DUT.

    """
    if self._servo_host and not self.servo:
        try:
            self._servo_host.repair_full()
        except Exception as servo_error:
            logging.error('Could not create a healthy servo: %s',
                          servo_error)
        self.servo = self._servo_host.get_servo()

    # TODO(scottz): This should use something similar to label_decorator,
    # but needs to be populated in order so DUTs are repaired with the
    # least amount of effort.
    repair_funcs = [self._servo_repair_power,
                    self._install_repair,
                    self._install_repair_with_powerwash,
                    self._servo_repair_reinstall,
                    self._powercycle_to_repair]
    errors = []
    board = self._get_board_from_afe()

    def _count_outcome(func, overall_key, per_board_key):
        """Bump the overall counter and, if known, the per-board one."""
        stats.Counter(overall_key % func.__name__).increment()
        if board:
            stats.Counter(
                    per_board_key % (func.__name__, board)).increment()

    for repair_func in repair_funcs:
        try:
            repair_func()
            self.verify()
            _count_outcome(repair_func, '%s.SUCCEEDED', '%s.%s.SUCCEEDED')
            return
        except error.AutoservRepairMethodNA as not_applicable:
            _count_outcome(repair_func, '%s.RepairNA', '%s.%s.RepairNA')
            logging.warning('Repair function NA: %s', not_applicable)
            errors.append(str(not_applicable))
        except Exception as failure:
            _count_outcome(repair_func, '%s.FAILED', '%s.%s.FAILED')
            logging.warning('Failed to repair device: %s', failure)
            errors.append(str(failure))

    # Every repair function was either not applicable or failed.
    stats.Counter('Full_Repair_Failed').increment()
    if board:
        stats.Counter(
                'Full_Repair_Failed.%s' % board).increment()
    raise error.AutoservRepairTotalFailure(
            'All attempts at repairing the device failed:\n%s' %
            '\n'.join(errors))
Richard Barnette82c35912012-11-20 10:09:10 -08001040
1041
def close(self):
    """Disconnect all RPC connections, then run the parent's close()."""
    self.rpc_disconnect_all()
    parent = super(CrosHost, self)
    parent.close()
J. Richard Barnette1d78b012012-05-15 13:56:30 -07001045
1046
def _cleanup_poweron(self):
    """Special cleanup method to make sure hosts always get power back.

    Does nothing unless the AFE lists this host with the
    _RPM_OUTLET_CHANGED attribute. Otherwise the host is powered on
    (a RemotePowerException is logged, not raised) and the attribute is
    reset to None in the AFE.
    """
    afe = frontend_wrappers.RetryingAFE(timeout_min=5, delay_sec=10)
    matching_hosts = afe.get_hosts(hostname=self.hostname)
    if (not matching_hosts or
            self._RPM_OUTLET_CHANGED not in matching_hosts[0].attributes):
        return

    logging.debug('This host has recently interacted with the RPM'
                  ' Infrastructure. Ensuring power is on.')
    try:
        self.power_on()
    except rpm_client.RemotePowerException:
        # If cleanup has completed but there was an issue with the RPM
        # Infrastructure, log an error message rather than fail cleanup
        logging.error('Failed to turn Power On for this host after '
                      'cleanup through the RPM Infrastructure.')
    afe.set_host_attribute(self._RPM_OUTLET_CHANGED, None,
                           hostname=self.hostname)
1065
1066
beepsc87ff602013-07-31 21:53:00 -07001067 def _is_factory_image(self):
1068 """Checks if the image on the DUT is a factory image.
1069
1070 @return: True if the image on the DUT is a factory image.
1071 False otherwise.
1072 """
1073 result = self.run('[ -f /root/.factory_test ]', ignore_status=True)
1074 return result.exit_status == 0
1075
1076
def _restart_ui(self):
    """Restart the Chrome UI.

    The login prompt state is captured before the ui job is restarted
    and is then passed to cros_ui.wait_for_chrome_ready().

    @raises: FactoryImageCheckerException for factory images, since
             we cannot attempt to restart ui on them.
             error.AutoservRunError for any other type of error that
             occurs while restarting ui.
    """
    on_factory_image = self._is_factory_image()
    if on_factory_image:
        raise FactoryImageCheckerException('Cannot restart ui on factory '
                                           'images')

    # TODO(jrbarnette): The command to stop/start the ui job
    # should live inside cros_ui, too.  However that would seem
    # to imply interface changes to the existing start()/restart()
    # functions, which is a bridge too far (for now).
    login_prompt_state = cros_ui.get_login_prompt_state(self)
    self.run('stop ui; start ui')
    cros_ui.wait_for_chrome_ready(login_prompt_state, self)
beepsc87ff602013-07-31 21:53:00 -07001096
1097
def cleanup(self):
    """Clean up the DUT after a job.

    Removes the CLEANUP_LOGS_PAUSED_FILE marker and restarts the UI. If
    the UI cannot be restarted, falls back to the parent class cleanup.
    Finally, on hosts with power control, makes sure power is back on
    if the RPM outlet was manipulated.
    """
    paused_marker = constants.CLEANUP_LOGS_PAUSED_FILE
    self.run('rm -f %s' % paused_marker)

    restart_errors = (error.AutotestRunError, error.AutoservRunError,
                      FactoryImageCheckerException)
    try:
        self._restart_ui()
    except restart_errors:
        logging.warning('Unable to restart ui, rebooting device.')
        # Since restarting the UI fails fall back to normal Autotest
        # cleanup routines, i.e. reboot the machine.
        super(CrosHost, self).cleanup()

    # Check if the rpm outlet was manipulated.
    if self.has_power():
        self._cleanup_poweron()
J. Richard Barnette45e93de2012-04-11 17:24:15 -07001111
1112
def reboot(self, **dargs):
    """Reboot the site host with Chrome OS specific defaults.

    The more generic RemoteHost.reboot() performs sync and sleeps for 5
    seconds. This is not necessary for Chrome OS devices as the sync
    should be finished in a short time during the reboot command.

    Unless the caller supplies its own 'reboot_cmd', a background
    command is used that issues `reboot` and then `reboot -f` after
    'reboot_timeout' seconds (10 when not given). 'fastsync' defaults
    to True.

    @param dargs: Keyword arguments forwarded to the parent reboot().
    """
    if 'reboot_cmd' not in dargs:
        force_after_secs = dargs.get('reboot_timeout', 10)
        reboot_template = ('((reboot & sleep %d; reboot -f &)'
                           ' </dev/null >/dev/null 2>&1 &)')
        dargs['reboot_cmd'] = reboot_template % force_after_secs
    # Enable fastsync to avoid running extra sync commands before reboot.
    dargs.setdefault('fastsync', True)
    super(CrosHost, self).reboot(**dargs)
Yu-Ju Honga2be94a2012-07-31 09:48:52 -07001130
1131
def verify_software(self):
    """Verify working software on a Chrome OS system.

    Tests for the following conditions:
     1. All conditions tested by the parent version of this
        function.
     2. Sufficient space in /mnt/stateful_partition.
     3. Sufficient space in /mnt/stateful_partition/encrypted.
     4. update_engine answers a simple status request (skipped on
        factory images).
     5. python on the DUT can import cPickle.

    """
    super(CrosHost, self).verify_software()

    # (path to check, SERVER config key, default requirement in GB)
    diskspace_checks = (
        ('/mnt/stateful_partition',
         'gb_diskspace_required', 20.0),
        ('/mnt/stateful_partition/encrypted',
         'gb_encrypted_diskspace_required', 0.1),
    )
    for path, config_key, default_gb in diskspace_checks:
        required_gb = global_config.global_config.get_config_value(
                'SERVER', config_key, type=float, default=default_gb)
        self.check_diskspace(path, required_gb)

    # Factory images don't run update engine,
    # goofy controls dbus on these DUTs.
    if not self._is_factory_image():
        self.run('update_engine_client --status')
    # Makes sure python is present, loads and can use built in functions.
    # We have seen cases where importing cPickle fails with undefined
    # symbols in cPickle.so.
    self.run('python -c "import cPickle"')
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07001163
1164
def make_ssh_command(self, user='root', port=22, opts='', hosts_file=None,
                     connect_timeout=None, alive_interval=None):
    """Override default make_ssh_command to use options tuned for Chrome OS.

    Tuning changes:
      - ConnectTimeout=30; maximum of 30 seconds allowed for an SSH
      connection failure.  Consistency with remote_access.sh.

      - ServerAliveInterval=180; which causes SSH to ping connection every
      180 seconds. In conjunction with ServerAliveCountMax ensures
      that if the connection dies, Autotest will bail out quickly.
      Originally tried 60 secs, but saw frequent job ABORTS where
      the test completed successfully.

      - ServerAliveCountMax=3; consistency with remote_access.sh.

      - ConnectionAttempts=4; reduce flakiness in connection errors;
      consistency with remote_access.sh.

      - UserKnownHostsFile=/dev/null; we don't care about the keys.
      Host keys change with every new installation, don't waste
      memory/space saving them.

      - SSH protocol forced to 2; needed for ServerAliveInterval.

    @param user User name to use for the ssh connection.
    @param port Port on the target host to use for ssh connection.
    @param opts Additional options to the ssh command.
    @param hosts_file Ignored.
    @param connect_timeout Ignored.
    @param alive_interval Ignored.

    @return The ssh command line as a string, without the target host.
    """
    fixed_options = (
        'StrictHostKeyChecking=no',
        'UserKnownHostsFile=/dev/null',
        'BatchMode=yes',
        'ConnectTimeout=30',
        'ServerAliveInterval=180',
        'ServerAliveCountMax=3',
        'ConnectionAttempts=4',
        'Protocol=2',
    )
    option_args = ' '.join('-o %s' % option for option in fixed_options)
    return '/usr/bin/ssh -a -x %s %s %s %s -l %s -p %d' % (
            self._ssh_verbosity_flag, self._ssh_options, opts,
            option_args, user, port)
Fang Deng96667ca2013-08-01 17:46:18 -07001205
1206
def _create_ssh_tunnel(self, port, local_port):
    """Create an ssh tunnel from local_port to port.

    The tunnel is an ssh process started in the background with -L port
    forwarding; it is not waited on here.

    @param port: remote port on the host.
    @param local_port: local forwarding port.

    @return: the tunnel process.
    """
    # Chrome OS on the target closes down most external ports
    # for security.  We could open the port, but doing that
    # would conflict with security tests that check that only
    # expected ports are open.  So, to get to the port on the
    # target we use an ssh tunnel.
    forward_spec = '-n -N -q -L %d:localhost:%d' % (local_port, port)
    tunnel_cmd = '%s %s' % (self.make_ssh_command(opts=forward_spec),
                            self.hostname)
    logging.debug('Full tunnel command: %s', tunnel_cmd)
    tunnel_proc = subprocess.Popen(tunnel_cmd, shell=True, close_fds=True)
    logging.debug('Started ssh tunnel, local = %d'
                  ' remote = %d, pid = %d',
                  local_port, port, tunnel_proc.pid)
    return tunnel_proc
1229
1230
def _setup_rpc(self, port, command_name, remote_pid=None):
    """Sets up a tunnel process and performs rpc connection book keeping.

    Any existing rpc connection for `port` is disconnected first, then a
    new ssh tunnel is created from an unused local port and recorded in
    the rpc proxy map under `port`.

    This method assumes that xmlrpc and jsonrpc never conflict, since
    we can only either have an xmlrpc or a jsonrpc server listening on
    a remote port. As such, it enforces a single proxy->remote port
    policy, i.e if one starts a jsonrpc proxy/server from port A->B,
    and then tries to start an xmlrpc proxy forwarded to the same port,
    the xmlrpc proxy will override the jsonrpc tunnel process, however:

    1. None of the methods on the xmlrpc proxy will work because
    the server listening on B is jsonrpc.

    2. The xmlrpc client cannot initiate a termination of the JsonRPC
    server, as the only use case currently is goofy, which is tied to
    the factory image. It is much easier to handle a failed xmlrpc
    call on the client than it is to terminate goofy in this scenario,
    as doing the latter might leave the DUT in a hard to recover state.

    With the current implementation newer rpc proxy connections will
    terminate the tunnel processes of older rpc connections tunneling
    to the same remote port. If methods are invoked on the client
    after this has happened they will fail with connection closed errors.

    @param port: The remote forwarding port.
    @param command_name: The name of the remote process, to terminate
                         using pkill.
    @param remote_pid: Recorded in the rpc proxy map next to the
                       command name and tunnel process. Default: None

    @return A url that we can use to initiate the rpc connection.
    """
    self.rpc_disconnect(port)
    forwarding_port = utils.get_unused_port()
    tunnel = self._create_ssh_tunnel(port, forwarding_port)
    proxy_record = (command_name, tunnel, remote_pid)
    self._rpc_proxy_map[port] = proxy_record
    return self._RPC_PROXY_URL % forwarding_port
1266
1267
def xmlrpc_connect(self, command, port, command_name=None,
                   ready_test_name=None, timeout_seconds=10,
                   logfile='/dev/null'):
    """Start an XMLRPC server on the host and return a client for it.

    `command` should be a simple shell command that starts an XMLRPC
    server listening on `port`.  It must not daemonize and must
    terminate cleanly on SIGTERM.  The command is launched in the
    background on the host, an ssh tunnel to `port` is created, and a
    local XMLRPC proxy going through that tunnel is returned.

    Creating the proxy does not by itself contact the server.  Unless
    `ready_test_name` is given, the caller is responsible for deciding
    whether the server is actually up and serving requests.

    When `ready_test_name` is given, it names a no-argument method on
    the proxy that succeeds only once the server is ready.  The method
    is retried for up to `timeout_seconds`; if it never succeeds the
    connection is torn down again with rpc_disconnect and the failure
    propagates to the caller.

    Any connection previously registered for `port` is disconnected
    before the new server is started.

    @param command Shell command to start the server.
    @param port Port number on which the server is expected to
                be serving.
    @param command_name String to use as input to `pkill` to
                        terminate the XMLRPC server on the host.
    @param ready_test_name String containing the name of a
                           method defined on the XMLRPC server.
    @param timeout_seconds Number of seconds to wait for the server
                           to become 'ready'.
    @param logfile Logfile to send output when running
                   'command' argument.

    @return The XMLRPC client proxy.

    """
    # If the caller believes the server is down, any tunnel we still
    # hold for this port is stale; get rid of it first.
    self.rpc_disconnect(port)

    # 'ssh' won't return until background children have closed stdin,
    # stdout and stderr, hence the redirections around the command.
    remote_cmd = '%s </dev/null >%s 2>&1 & echo $!' % (command, logfile)
    remote_pid = self.run(remote_cmd).stdout.rstrip('\n')
    logging.debug('Started XMLRPC server on host %s, pid = %s',
                  self.hostname, remote_pid)

    # The remote port is reached through an ssh tunnel.
    rpc_url = self._setup_rpc(port, command_name, remote_pid=remote_pid)
    proxy = xmlrpclib.ServerProxy(rpc_url, allow_none=True)

    if ready_test_name is not None:
        retriable_errors = (socket.error,
                            xmlrpclib.ProtocolError,
                            httplib.BadStatusLine)
        # retry.retry logs every attempt; scale the delay with the
        # timeout (clamped to [0.1, 1] seconds) to limit log spam.
        retry_delay = min(max(timeout_seconds / 20.0, 0.1), 1)

        @retry.retry(retriable_errors,
                     timeout_min=timeout_seconds / 60.0,
                     delay_sec=retry_delay)
        def ready_test():
            """ Call proxy.ready_test_name(). """
            getattr(proxy, ready_test_name)()

        server_ready = False
        try:
            logging.info('Waiting %d seconds for XMLRPC server '
                         'to start.', timeout_seconds)
            ready_test()
            server_ready = True
        finally:
            # Runs for every kind of failure; the original exception
            # keeps propagating after the cleanup.
            if not server_ready:
                logging.error('Failed to start XMLRPC server.')
                self.rpc_disconnect(port)
    logging.info('XMLRPC server started successfully.')
    return proxy
J. Richard Barnette1d78b012012-05-15 13:56:30 -07001352
J. Richard Barnette1d78b012012-05-15 13:56:30 -07001353
def syslog(self, message, tag='autotest'):
    """Logs a message to syslog on host.

    Runs `logger -t <tag> <message>` on the host.  Both values are
    shell-quoted, so quotes, `$`, backticks and other shell
    metacharacters in them are logged literally instead of being
    interpreted by the remote shell.

    @param message String message to log into syslog
    @param tag String tag prefix for syslog

    """
    # shlex.quote only exists on Python 3; pipes.quote is the
    # Python 2 spelling of the same helper.
    try:
        from shlex import quote as shell_quote
    except ImportError:
        from pipes import quote as shell_quote

    # '%s' % x keeps accepting the same (possibly non-string) values
    # that the previous plain %-formatting accepted.
    quoted_tag = shell_quote('%s' % (tag,))
    quoted_message = shell_quote('%s' % (message,))
    self.run('logger -t %s %s' % (quoted_tag, quoted_message))
1362
1363
def jsonrpc_connect(self, port):
    """Return a jsonrpc proxy that talks to `port` through an ssh tunnel.

    This exists to talk to goofy, the default system manager on
    factory images.  Unlike xmlrpc_connect, no server is started on
    the host: goofy is built in to the image and starts when the
    target boots, so most rpc server sanity checking is left to the
    caller.

    Several proxies could in theory be forwarded to the same remote
    port, but that risks leaking an existing tunnel process, so any
    older tunnel for `port` is always disconnected first.

    @param port: port on the remote host that is serving this proxy.

    @return: The client proxy, or None if jsonrpclib is unavailable.
    """
    if jsonrpclib:
        make_proxy = jsonrpclib.jsonrpc.ServerProxy
        # No command name is registered: there is no remote server
        # process for rpc_disconnect to kill later.
        proxy = make_proxy(self._setup_rpc(port, None))
        logging.info('Established a jsonrpc connection through port %s.',
                     port)
        return proxy

    logging.warning('Jsonrpclib could not be imported. Check that '
                    'site-packages contains jsonrpclib.')
    return None
1394
1395
def rpc_disconnect(self, port):
    """Disconnect from an RPC server on the host.

    Terminates the remote RPC server previously started for
    the given `port`.  Also closes the local ssh tunnel created
    for the connection to the host.  This function does not
    directly alter the state of a previously returned RPC
    client object; however disconnection will cause all
    subsequent calls to methods on the object to fail.

    The local tunnel is terminated and the bookkeeping entry for
    `port` is removed even when stopping the remote server fails,
    so a failed shutdown never leaks the tunnel process.

    This function does nothing if requested to disconnect a port
    that was not previously connected via _setup_rpc.

    @param port Port number passed to a previous call to
                `_setup_rpc()`.

    @exception TestError The remote server was still running after
                         _RPC_SHUTDOWN_TIMEOUT_SECONDS.
    """
    if port not in self._rpc_proxy_map:
        return
    remote_name, tunnel_proc, remote_pid = self._rpc_proxy_map[port]
    try:
        if remote_name:
            # We use 'pkill' to find our target process rather than
            # a PID, because the host may have rebooted since
            # connecting, and we don't want to kill an innocent
            # process with the same PID.
            #
            # 'pkill' helpfully exits with status 1 if no target
            # process is found, for which run() will throw an
            # exception.  We don't want that, so we ignore the
            # status.
            self.run("pkill -f '%s'" % remote_name, ignore_status=True)
            if remote_pid:
                logging.info('Waiting for RPC server "%s" shutdown',
                             remote_name)
                start_time = time.time()
                # Poll until the recorded pid no longer shows up among
                # the processes matching the command name.
                while (time.time() - start_time <
                       self._RPC_SHUTDOWN_TIMEOUT_SECONDS):
                    running_processes = self.run(
                            "pgrep -f '%s'" % remote_name,
                            ignore_status=True).stdout.split()
                    if remote_pid not in running_processes:
                        logging.info('Shut down RPC server.')
                        break
                    time.sleep(self._RPC_SHUTDOWN_POLLING_PERIOD_SECONDS)
                else:
                    # Loop ran out of time without seeing the pid go.
                    raise error.TestError(
                            'Failed to shutdown RPC server %s' %
                            remote_name)
    finally:
        # Local cleanup must happen whether or not the remote side
        # could be stopped; otherwise the ssh tunnel process leaks.
        if tunnel_proc.poll() is None:
            tunnel_proc.terminate()
            logging.debug('Terminated tunnel, pid %d', tunnel_proc.pid)
        else:
            logging.debug('Tunnel pid %d terminated early, status %d',
                          tunnel_proc.pid, tunnel_proc.returncode)
        self._rpc_proxy_map.pop(port, None)
J. Richard Barnette1d78b012012-05-15 13:56:30 -07001450
1451
def rpc_disconnect_all(self):
    """Disconnect all known RPC proxy ports."""
    # rpc_disconnect() removes entries from the map, so iterate over a
    # snapshot of the ports rather than over the live dictionary.
    for port in list(self._rpc_proxy_map):
        self.rpc_disconnect(port)
J. Richard Barnette1d78b012012-05-15 13:56:30 -07001456
1457
def _ping_check_status(self, status):
    """Send a single ping and compare the outcome with `status`.

    @param status The expected ping status.
    @return True iff `status` agrees with whether the ping
            succeeded (both True or both False).

    """
    ping_val = utils.ping(self.hostname, tries=1, deadline=1)
    # A ping result of 0 is treated as "host answered".
    host_answered = (ping_val == 0)
    return not (status ^ host_answered)
1468
1469 def _ping_wait_for_status(self, status, timeout):
1470 """Wait for the host to have a given status (UP or DOWN).
1471
1472 Status is checked by polling. Polling will not last longer
1473 than the number of seconds in `timeout`. The polling
1474 interval will be long enough that only approximately
1475 _PING_WAIT_COUNT polling cycles will be executed, subject
1476 to a maximum interval of about one minute.
1477
1478 @param status Waiting will stop immediately if `ping` of the
1479 host returns this status.
1480 @param timeout Poll for at most this many seconds.
1481 @return True iff the host status from `ping` matched the
1482 requested status at the time of return.
1483
1484 """
1485 # _ping_check_status() takes about 1 second, hence the
1486 # "- 1" in the formula below.
1487 poll_interval = min(int(timeout / self._PING_WAIT_COUNT), 60) - 1
1488 end_time = time.time() + timeout
1489 while time.time() <= end_time:
1490 if self._ping_check_status(status):
1491 return True
1492 if poll_interval > 0:
1493 time.sleep(poll_interval)
1494
1495 # The last thing we did was sleep(poll_interval), so it may
1496 # have been too long since the last `ping`. Check one more
1497 # time, just to be sure.
1498 return self._ping_check_status(status)
1499
def ping_wait_up(self, timeout):
    """Wait until the host answers `ping`.

    N.B. This is not a reliable replacement for `wait_up()`: a host
    that answers ping does not necessarily answer ssh.  Use it only
    when the target DUT can be considered functional even if it
    cannot be reached via ssh.

    @param timeout Minimum time to allow before declaring the
                   host to be non-responsive.
    @return True iff the host answered to ping before the timeout.

    """
    wanted_status = self._PING_STATUS_UP
    return self._ping_wait_for_status(wanted_status, timeout)
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07001515
def ping_wait_down(self, timeout):
    """Wait until the host stops answering `ping`.

    This can serve as a slightly faster alternative to `wait_down()`,
    because it avoids potentially long ssh timeouts.

    @param timeout Minimum time to allow for the host to become
                   non-responsive.
    @return True iff the host quit answering ping before the
            timeout.

    """
    wanted_status = self._PING_STATUS_DOWN
    return self._ping_wait_for_status(wanted_status, timeout)
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07001529
def test_wait_for_sleep(self):
    """Wait for the client to enter low-power sleep mode.

    "Asleep" is detected by the host no longer answering ping, which
    cannot be told apart from a host that is powered off.  To confirm
    that the unit really was asleep, force a resume afterwards and
    call `test_wait_for_resume()`.

    Expected usage from a test:

    ~~~~~~~~
        boot_id = host.get_boot_id()
        # trigger sleep on the host
        host.test_wait_for_sleep()
        # trigger resume on the host
        host.test_wait_for_resume(boot_id)
    ~~~~~~~~

    @exception TestFail The host did not go to sleep within
                        the allowed time.
    """
    went_down = self.ping_wait_down(timeout=self.SLEEP_TIMEOUT)
    if went_down:
        return
    raise error.TestFail(
        'client failed to sleep after %d seconds' %
        self.SLEEP_TIMEOUT)
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07001556
1557
def test_wait_for_resume(self, old_boot_id):
    """Wait for the client to resume from low-power sleep mode.

    `old_boot_id` should be the value of `get_boot_id()` taken before
    the host went to sleep.  A changed boot id means the host rebooted
    instead of resuming, which is reported as a `TestFail`.

    See @ref test_wait_for_sleep for more on this function's
    usage.

    @param old_boot_id A boot id value obtained before the
                       target host went to sleep.

    @exception TestFail The host did not respond within the
                        allowed time.
    @exception TestFail The host responded, but the boot id test
                        indicated a reboot rather than a sleep
                        cycle.
    """
    if not self.wait_up(timeout=self.RESUME_TIMEOUT):
        raise error.TestFail(
            'client failed to resume from sleep after %d seconds' %
            self.RESUME_TIMEOUT)

    # Host is reachable again; make sure it is still the same boot.
    new_boot_id = self.get_boot_id()
    if new_boot_id != old_boot_id:
        raise error.TestFail(
            'client rebooted, but sleep was expected'
            ' (old boot %s, new boot %s)'
            % (old_boot_id, new_boot_id))
1588
1589
def test_wait_for_shutdown(self):
    """Wait for the client to shut down.

    "Shut down" is detected by the host no longer answering ping,
    which cannot be told apart from a host that is merely asleep.  To
    confirm that the unit really was down, force a boot afterwards
    and call test_wait_for_boot().

    Expected usage from a test:

    ~~~~~~~~
        boot_id = host.get_boot_id()
        # trigger shutdown on the host
        host.test_wait_for_shutdown()
        # trigger boot on the host
        host.test_wait_for_boot(boot_id)
    ~~~~~~~~

    @exception TestFail The host did not shut down within the
                        allowed time.
    """
    went_down = self.ping_wait_down(timeout=self.SHUTDOWN_TIMEOUT)
    if went_down:
        return
    raise error.TestFail(
        'client failed to shut down after %d seconds' %
        self.SHUTDOWN_TIMEOUT)
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07001615
1616
def test_wait_for_boot(self, old_boot_id=None):
    """Wait for the client to boot from cold power.

    `old_boot_id` should be the value of `get_boot_id()` taken before
    shutting down.  An unchanged boot id means the host never
    rebooted, which is reported as a `TestFail`.  The boot id check is
    skipped when `old_boot_id` is not specified.

    See @ref test_wait_for_shutdown for more on this function's
    usage.

    @param old_boot_id A boot id value obtained before the
                       shut down.

    @exception TestFail The host did not respond within the
                        allowed time.
    @exception TestFail The host responded, but the boot id test
                        indicated that there was no reboot.
    """
    if not self.wait_up(timeout=self.REBOOT_TIMEOUT):
        raise error.TestFail(
            'client failed to reboot after %d seconds' %
            self.REBOOT_TIMEOUT)

    # Only query the host's boot id when there is one to compare with.
    if old_boot_id and self.get_boot_id() == old_boot_id:
        raise error.TestFail(
            'client is back up, but did not reboot'
            ' (boot %s)' % old_boot_id)
Simran Basid5e5e272012-09-24 15:23:59 -07001646
1647
@staticmethod
def check_for_rpm_support(hostname):
    """Tell whether a hostname belongs to an RPM powered DUT.

    @param hostname: hostname to check for rpm support.

    @return None if the hostname does not follow the naming format
            defined for RPM powered DUT's in the lab; otherwise the
            regular expression MatchObject for the hostname.
    """
    rpm_hostname_pattern = CrosHost._RPM_HOSTNAME_REGEX
    return re.match(rpm_hostname_pattern, hostname)
Simran Basid5e5e272012-09-24 15:23:59 -07001659
1660
def has_power(self):
    """Tell whether this host is powered by an RPM.

    @return The result of check_for_rpm_support() for this host's
            hostname: a true value if the host is in the CROS lab and
            follows the defined naming format, None otherwise.
    """
    rpm_match = CrosHost.check_for_rpm_support(self.hostname)
    return rpm_match
Simran Basid5e5e272012-09-24 15:23:59 -07001668
1669
Ismail Noorbasha07fdb612013-02-14 14:13:31 -08001670 def _set_power(self, state, power_method):
1671 """Sets the power to the host via RPM, Servo or manual.
1672
1673 @param state Specifies which power state to set to DUT
1674 @param power_method Specifies which method of power control to
1675 use. By default "RPM" will be used. Valid values
1676 are the strings "RPM", "manual", "servoj10".
1677
1678 """
1679 ACCEPTABLE_STATES = ['ON', 'OFF']
1680
1681 if state.upper() not in ACCEPTABLE_STATES:
1682 raise error.TestError('State must be one of: %s.'
1683 % (ACCEPTABLE_STATES,))
1684
1685 if power_method == self.POWER_CONTROL_SERVO:
1686 logging.info('Setting servo port J10 to %s', state)
1687 self.servo.set('prtctl3_pwren', state.lower())
1688 time.sleep(self._USB_POWER_TIMEOUT)
1689 elif power_method == self.POWER_CONTROL_MANUAL:
1690 logging.info('You have %d seconds to set the AC power to %s.',
1691 self._POWER_CYCLE_TIMEOUT, state)
1692 time.sleep(self._POWER_CYCLE_TIMEOUT)
1693 else:
1694 if not self.has_power():
1695 raise error.TestFail('DUT does not have RPM connected.')
Simran Basi5e6339a2013-03-21 11:34:32 -07001696 afe = frontend_wrappers.RetryingAFE(timeout_min=5, delay_sec=10)
1697 afe.set_host_attribute(self._RPM_OUTLET_CHANGED, True,
1698 hostname=self.hostname)
Simran Basi1df55112013-09-06 11:25:09 -07001699 rpm_client.set_power(self.hostname, state.upper(), timeout_mins=5)
Simran Basid5e5e272012-09-24 15:23:59 -07001700
1701
def power_off(self, power_method=POWER_CONTROL_RPM):
    """Cut power to this host via RPM, Servo or manual.

    @param power_method Specifies which method of power control to
                        use. By default "RPM" will be used. Valid values
                        are the strings "RPM", "manual", "servoj10".

    """
    target_state = 'OFF'
    self._set_power(target_state, power_method)
Simran Basid5e5e272012-09-24 15:23:59 -07001711
1712
def power_on(self, power_method=POWER_CONTROL_RPM):
    """Restore power to this host via RPM, Servo or manual.

    @param power_method Specifies which method of power control to
                        use. By default "RPM" will be used. Valid values
                        are the strings "RPM", "manual", "servoj10".

    """
    target_state = 'ON'
    self._set_power(target_state, power_method)
1722
1723
def power_cycle(self, power_method=POWER_CONTROL_RPM):
    """Power cycle this host: switch it OFF, then back ON.

    With the servo and manual methods the host is powered off, left
    off for _POWER_CYCLE_TIMEOUT seconds, and powered on again.  For
    any other method a single 'CYCLE' request is sent to the RPM.

    @param power_method Specifies which method of power control to
                        use. By default "RPM" will be used. Valid values
                        are the strings "RPM", "manual", "servoj10".

    """
    two_step_methods = (self.POWER_CONTROL_SERVO,
                        self.POWER_CONTROL_MANUAL)
    if power_method not in two_step_methods:
        rpm_client.set_power(self.hostname, 'CYCLE')
        return

    self.power_off(power_method=power_method)
    time.sleep(self._POWER_CYCLE_TIMEOUT)
    self.power_on(power_method=power_method)
Simran Basic6f1f7a2012-10-16 10:47:46 -07001739
1740
def get_platform(self):
    """Work out the platform label for this host from its firmware id.

    @returns a string representing this host's platform.
    """
    crossystem = utils.Crossystem(self)
    crossystem.init()
    # fwid generally looks like {platform}.{firmware version}, e.g.
    # Alex.X.YYY.Z or Google_Alex.X.YYY.Z; the part before the first
    # dot is used as the platform id.
    firmware_id = crossystem.fwid()
    platform_id = firmware_id.split('.')[0]
    # Newer platforms carry a 'Google_' marker that older ones lack.
    return platform_id.lower().replace('google_', '')
1754
1755
def get_architecture(self):
    """Work out the architecture label for this host.

    @returns a string representing this host's architecture, as
             reported by crossystem.
    """
    system_info = utils.Crossystem(self)
    system_info.init()
    architecture = system_info.arch()
    return architecture
1764
1765
def get_chrome_version(self):
    """Gets the Chrome version number and milestone as strings.

    Runs the Chrome version command ("chrome --version") on the host
    and hands its output to utils.parse_chrome_version().

    @return A tuple (chrome_ver, milestone) where "chrome_ver" is the
            current Chrome version number as a string (in the form
            "W.X.Y.Z") and "milestone" is the first component of the
            version number (the "W" from "W.X.Y.Z").  If the version
            number cannot be parsed in the "W.X.Y.Z" format, the
            "chrome_ver" will be the full output of "chrome --version"
            and the milestone will be the empty string.

    """
    version_result = self.run(constants.CHROME_VERSION_COMMAND)
    return utils.parse_chrome_version(version_result.stdout)
1781
@label_decorator()
def get_board(self):
    """Work out the board label for this host from /etc/lsb-release.

    @returns a string representing this host's board.
    """
    release_info = utils.parse_cmd_output('cat /etc/lsb-release',
                                          run_method=self.run)
    board = release_info['CHROMEOS_RELEASE_BOARD']
    # Lab devices generally report the plain board name, but our own
    # development devices report {board_name}-signed-{key_type}.
    # Boards with 'x86' in the name keep their first two dash
    # separated pieces so that the 'x86-' part is preserved.
    pieces = board.split('-')
    if 'x86' in board:
        kept_pieces = pieces[0:2]
    else:
        kept_pieces = pieces[0:1]
    board_format_string = ds_constants.BOARD_PREFIX + '%s'
    return board_format_string % '-'.join(kept_pieces)
Simran Basic6f1f7a2012-10-16 10:47:46 -07001798
1799
@label_decorator('lightsensor')
def has_lightsensor(self):
    """Check whether this host has a light sensor.

    Searches below _LIGHTSENSOR_SEARCH_DIR on the host for any of the
    file names listed in _LIGHTSENSOR_FILES.

    @returns the string 'lightsensor' if this host has a lightsensor or
             None if it does not.
    """
    file_pattern = '|'.join(self._LIGHTSENSOR_FILES)
    search_cmd = "find -L %s -maxdepth 4 | egrep '%s'" % (
        self._LIGHTSENSOR_SEARCH_DIR, file_pattern)
    try:
        # The search follows symlinks.  stderr_tee is None because a
        # symlink loop makes find print a few messages to stderr even
        # though the command still works correctly.
        self.run(search_cmd, stdout_tee=None, stderr_tee=None)
    except error.AutoservRunError:
        # egrep exited with status 1: none of the candidate
        # lightsensor files exists.
        return None
    return 'lightsensor'
1819
1820
@label_decorator('bluetooth')
def has_bluetooth(self):
    """Check whether this host has a bluetooth adapter.

    The check is whether /sys/class/bluetooth/hci0 exists as a
    directory on the host.

    @returns the string 'bluetooth' if this host has bluetooth or
             None if it does not.
    """
    try:
        self.run('test -d /sys/class/bluetooth/hci0')
    except error.AutoservRunError:
        # 'test' exited with status 1: the directory does not exist.
        return None
    # 'test' exited with status 0.
    return 'bluetooth'
1836
1837
@label_decorator('graphics')
def get_graphics(self):
    """
    Work out the graphics label for this host.

    @returns a string representing this host's graphics. For now ARM boards
             return graphics:gles while all other boards return graphics:gl.
             This may change over time, but for robustness reasons this
             should avoid executing code in actual graphics libraries
             (which may not be ready and is tested by graphics_GLAPICheck).
    """
    kernel_info = self.run('uname -a').stdout.lower()
    return 'graphics:gles' if 'arm' in kernel_info else 'graphics:gl'
1853
1854
@label_decorator('ec')
def get_ec(self):
    """
    Work out which type of EC this host has.

    @returns a string representing this host's embedded controller type.
             At present, it only returns "ec:cros", for Chrome OS ECs.
             Other types of EC (or none) don't return any strings, since
             no tests depend on those.
    """
    cmd = 'mosys ec info'
    # For a Chrome OS EC the last field of the output matches our EC
    # version scheme:
    #
    #   stm | stm32f100 | snow_v1.3.139-375eb9f
    #   ti | Unknown-10de | peppy_v1.5.114-5d52788
    #
    # Other ECs produce output such as:
    #
    #   ENE | KB932 | 00BE107A00
    #   ite | it8518 | 3.08
    #
    # Some systems have no EC at all (Lumpy, for example).
    regexp = r'^.*\|\s*(\S+_v\d+\.\d+\.\d+-[0-9a-f]+)\s*$'

    ecinfo = self.run(command=cmd, ignore_status=True)
    if ecinfo.exit_status != 0:
        # No EC present
        logging.info("%s exited with status %d", cmd, ecinfo.exit_status)
        return None

    version_match = re.search(regexp, ecinfo.stdout)
    if version_match is None:
        # Has an EC, but it's not a Chrome OS EC
        logging.info("%s got: %s", cmd, ecinfo.stdout)
        return None

    logging.info("EC version is %s", version_match.group(1))
    return 'ec:cros'
1892
1893
def get_labels(self):
    """Collect every automatic label that applies to this host.

    Each function in _LABEL_FUNCTIONS is called with this host, in
    order; results that are empty or None are left out.

    @returns a list of labels for this host.
    """
    candidates = (label_function(self)
                  for label_function in self._LABEL_FUNCTIONS)
    return [label for label in candidates if label]