blob: 6a9d7beba5d12113e9121027291d47041ebf7622 [file] [log] [blame]
J. Richard Barnette24adbf42012-04-11 15:04:53 -07001# Copyright (c) 2012 The Chromium OS Authors. All rights reserved.
Dale Curtisaa5eedb2011-08-23 16:18:52 -07002# Use of this source code is governed by a BSD-style license that can be
3# found in the LICENSE file.
4
Aviv Keshet74c89a92013-02-04 15:18:30 -08005import functools
Christopher Wiley0ed712b2013-04-09 15:25:12 -07006import httplib
J. Richard Barnette1d78b012012-05-15 13:56:30 -07007import logging
Dan Shi0f466e82013-02-22 15:44:58 -08008import os
Simran Basid5e5e272012-09-24 15:23:59 -07009import re
Christopher Wileyd78249a2013-03-01 13:05:31 -080010import socket
J. Richard Barnette1d78b012012-05-15 13:56:30 -070011import subprocess
J. Richard Barnette134ec2c2012-04-25 12:59:37 -070012import time
J. Richard Barnette1d78b012012-05-15 13:56:30 -070013import xmlrpclib
J. Richard Barnette134ec2c2012-04-25 12:59:37 -070014
J. Richard Barnette45e93de2012-04-11 17:24:15 -070015from autotest_lib.client.bin import utils
Richard Barnette0c73ffc2012-11-19 15:21:18 -080016from autotest_lib.client.common_lib import error
17from autotest_lib.client.common_lib import global_config
J. Richard Barnette45e93de2012-04-11 17:24:15 -070018from autotest_lib.client.common_lib.cros import autoupdater
Richard Barnette03a0c132012-11-05 12:40:35 -080019from autotest_lib.client.common_lib.cros import dev_server
Christopher Wileyd78249a2013-03-01 13:05:31 -080020from autotest_lib.client.common_lib.cros import retry
Richard Barnette82c35912012-11-20 10:09:10 -080021from autotest_lib.client.cros import constants
J. Richard Barnette45e93de2012-04-11 17:24:15 -070022from autotest_lib.server import autoserv_parser
Chris Sosaf4d43ff2012-10-30 11:21:05 -070023from autotest_lib.server import autotest
Dan Shia1ecd5c2013-06-06 11:21:31 -070024from autotest_lib.server import utils as server_utils
Scott Zawalski89c44dd2013-02-26 09:28:02 -050025from autotest_lib.server.cros.dynamic_suite import constants as ds_constants
Simran Basi5e6339a2013-03-21 11:34:32 -070026from autotest_lib.server.cros.dynamic_suite import tools, frontend_wrappers
J. Richard Barnette75487572013-03-08 12:47:50 -080027from autotest_lib.server.cros.servo import servo
J. Richard Barnette45e93de2012-04-11 17:24:15 -070028from autotest_lib.server.hosts import remote
Simran Basidcff4252012-11-20 16:13:20 -080029from autotest_lib.site_utils.rpm_control_system import rpm_client
Simran Basid5e5e272012-09-24 15:23:59 -070030
31
J. Richard Barnettebe5ebcc2013-02-11 16:03:15 -080032def _make_servo_hostname(hostname):
33 host_parts = hostname.split('.')
34 host_parts[0] = host_parts[0] + '-servo'
35 return '.'.join(host_parts)
36
37
def _get_lab_servo(target_hostname):
    """Instantiate a Servo for |target_hostname| in the lab.

    Assuming that |target_hostname| is a device in the CrOS test
    lab, create and return a Servo object pointed at the servo
    attached to that DUT.  The servo in the test lab is assumed
    to already have servod up and running on it.

    Connecting is best-effort: if the servo host is not in the lab
    zone, or the Servo object cannot be created, None is returned.

    @param target_hostname: device whose servo we want to target.
    @return an appropriately configured Servo instance, or None.
    """
    servo_host = _make_servo_hostname(target_hostname)
    if not utils.host_is_in_lab_zone(servo_host):
        return None
    try:
        return servo.Servo(servo_host=servo_host)
    except Exception:  # pylint: disable=W0703
        # TODO(jrbarnette):  Long-term, if we can't get to
        # a servo in the lab, we want to fail, so we should
        # pass any exceptions along.  Short-term, we're not
        # ready to rely on servo, so we ignore failures.
        #
        # Only Exception is caught, so KeyboardInterrupt and
        # SystemExit still propagate, and the failure is recorded
        # rather than dropped without a trace.
        logging.debug('Unable to connect to lab servo %s; continuing '
                      'without a servo.', servo_host, exc_info=True)
        return None
60
61
def make_ssh_command(user='root', port=22, opts='', hosts_file=None,
                     connect_timeout=None, alive_interval=None):
    """Build the ssh command line used to reach Chrome OS devices.

    Overrides the default make_ssh_command with fixed options:
      - StrictHostKeyChecking=no, UserKnownHostsFile=/dev/null; host
        keys change with every new installation, so they are neither
        checked nor saved.
      - BatchMode=yes.
      - ConnectTimeout=30; at most 30 seconds for a connection
        attempt.  Consistency with remote_access.sh.
      - ServerAliveInterval=180 with ServerAliveCountMax=3; ssh pings
        the connection every 180 seconds so that a dead connection is
        noticed.  60 seconds was tried originally, but caused frequent
        job ABORTS where the test completed successfully.
      - ConnectionAttempts=4; reduces flakiness in connection errors.
        Consistency with remote_access.sh.
      - Protocol=2; needed for ServerAliveInterval.

    @param user User name to use for the ssh connection.
    @param port Port on the target host to use for ssh connection.
    @param opts Additional options to the ssh command.
    @param hosts_file Ignored.
    @param connect_timeout Ignored.
    @param alive_interval Ignored.
    @return the ssh command line, without the target host.
    """
    ssh_settings = (
        'StrictHostKeyChecking=no',
        'UserKnownHostsFile=/dev/null',
        'BatchMode=yes',
        'ConnectTimeout=30',
        'ServerAliveInterval=180',
        'ServerAliveCountMax=3',
        'ConnectionAttempts=4',
        'Protocol=2',
    )
    option_flags = ' '.join('-o ' + setting for setting in ssh_settings)
    template = '/usr/bin/ssh -a -x %s ' + option_flags + ' -l %s -p %d'
    return template % (opts, user, port)
J. Richard Barnette45e93de2012-04-11 17:24:15 -070098
99
J. Richard Barnette7214e0b2013-02-06 15:20:49 -0800100
def add_label_detector(label_function_list, label_list=None, label=None):
    """Build a decorator that registers label detection functions.

    The decorated function is returned unchanged.

    @param label_function_list: List that each decorated function is
                                appended to.
    @param label_list: List that |label| is appended to when both are
                       provided.  (Default: None)
    @param label: Label string that is detectable by the decorated
                  function.  (Default: None)
    @return a decorator performing the registration.
    """
    def _register(detector):
        """
        @param detector: The function to be added as a detector.
        @return |detector| itself.
        """
        label_function_list.append(detector)
        if not label or label_list is None:
            return detector
        label_list.append(label)
        return detector
    return _register
119
120
J. Richard Barnette45e93de2012-04-11 17:24:15 -0700121class SiteHost(remote.RemoteHost):
122 """Chromium OS specific subclass of Host."""
123
124 _parser = autoserv_parser.autoserv_parser
Scott Zawalski62bacae2013-03-05 10:40:32 -0500125 _AFE = frontend_wrappers.RetryingAFE(timeout_min=5, delay_sec=10)
J. Richard Barnette45e93de2012-04-11 17:24:15 -0700126
Richard Barnette0c73ffc2012-11-19 15:21:18 -0800127 # Time to wait for new kernel to be marked successful after
128 # auto update.
Chris Masone163cead2012-05-16 11:49:48 -0700129 _KERNEL_UPDATE_TIMEOUT = 120
J. Richard Barnette45e93de2012-04-11 17:24:15 -0700130
Richard Barnette03a0c132012-11-05 12:40:35 -0800131 # Timeout values (in seconds) associated with various Chrome OS
132 # state changes.
J. Richard Barnette134ec2c2012-04-25 12:59:37 -0700133 #
Richard Barnette0c73ffc2012-11-19 15:21:18 -0800134 # In general, a good rule of thumb is that the timeout can be up
135 # to twice the typical measured value on the slowest platform.
136 # The times here have not necessarily been empirically tested to
137 # meet this criterion.
J. Richard Barnetteeb69d722012-06-18 17:29:44 -0700138 #
139 # SLEEP_TIMEOUT: Time to allow for suspend to memory.
Richard Barnette0c73ffc2012-11-19 15:21:18 -0800140 # RESUME_TIMEOUT: Time to allow for resume after suspend, plus
#   time to restart the network.
J. Richard Barnetteeb69d722012-06-18 17:29:44 -0700142 # BOOT_TIMEOUT: Time to allow for boot from power off. Among
Richard Barnette0c73ffc2012-11-19 15:21:18 -0800143 # other things, this must account for the 30 second dev-mode
J. Richard Barnetted4649c62013-03-06 17:42:27 -0800144 # screen delay and time to start the network.
J. Richard Barnetteeb69d722012-06-18 17:29:44 -0700145 # USB_BOOT_TIMEOUT: Time to allow for boot from a USB device,
Richard Barnette0c73ffc2012-11-19 15:21:18 -0800146 # including the 30 second dev-mode delay and time to start the
J. Richard Barnetted4649c62013-03-06 17:42:27 -0800147 # network.
Richard Barnette0c73ffc2012-11-19 15:21:18 -0800148 # SHUTDOWN_TIMEOUT: Time to allow for shut down.
Chris Sosab76e0ee2013-05-22 16:55:41 -0700149 # REBOOT_TIMEOUT: How long to wait for a reboot.
Richard Barnette03a0c132012-11-05 12:40:35 -0800150 # _INSTALL_TIMEOUT: Time to allow for chromeos-install.
J. Richard Barnetteeb69d722012-06-18 17:29:44 -0700151
152 SLEEP_TIMEOUT = 2
J. Richard Barnetted4649c62013-03-06 17:42:27 -0800153 RESUME_TIMEOUT = 10
J. Richard Barnetteeb69d722012-06-18 17:29:44 -0700154 BOOT_TIMEOUT = 45
155 USB_BOOT_TIMEOUT = 150
Chris Sosab76e0ee2013-05-22 16:55:41 -0700156
157 # We have a long timeout to ensure we don't flakily fail due to other
158 # issues. Shorter timeouts are vetted in platform_RebootAfterUpdate.
159 REBOOT_TIMEOUT = 300
160
Richard Barnette03a0c132012-11-05 12:40:35 -0800161 _INSTALL_TIMEOUT = 240
162
Ismail Noorbasha07fdb612013-02-14 14:13:31 -0800163 # _USB_POWER_TIMEOUT: Time to allow for USB to power toggle ON and OFF.
164 # _POWER_CYCLE_TIMEOUT: Time to allow for manual power cycle.
165 _USB_POWER_TIMEOUT = 5
166 _POWER_CYCLE_TIMEOUT = 10
167
Richard Barnette0c73ffc2012-11-19 15:21:18 -0800168
Richard Barnette82c35912012-11-20 10:09:10 -0800169 _RPM_RECOVERY_BOARDS = global_config.global_config.get_config_value('CROS',
170 'rpm_recovery_boards', type=str).split(',')
171
172 _MAX_POWER_CYCLE_ATTEMPTS = 6
173 _LAB_MACHINE_FILE = '/mnt/stateful_partition/.labmachine'
174 _RPM_HOSTNAME_REGEX = ('chromeos[0-9]+(-row[0-9]+)?-rack[0-9]+[a-z]*-'
175 'host[0-9]+')
176 _LIGHTSENSOR_FILES = ['in_illuminance0_input',
177 'in_illuminance0_raw',
178 'illuminance0_input']
179 _LIGHTSENSOR_SEARCH_DIR = '/sys/bus/iio/devices'
180 _LABEL_FUNCTIONS = []
Aviv Keshet74c89a92013-02-04 15:18:30 -0800181 _DETECTABLE_LABELS = []
182 label_decorator = functools.partial(add_label_detector, _LABEL_FUNCTIONS,
183 _DETECTABLE_LABELS)
J. Richard Barnette134ec2c2012-04-25 12:59:37 -0700184
J. Richard Barnetteb6de7e32013-02-14 13:28:04 -0800185 # Constants used in ping_wait_up() and ping_wait_down().
186 #
187 # _PING_WAIT_COUNT is the approximate number of polling
188 # cycles to use when waiting for a host state change.
189 #
190 # _PING_STATUS_DOWN and _PING_STATUS_UP are names used
191 # for arguments to the internal _ping_wait_for_status()
192 # method.
193 _PING_WAIT_COUNT = 40
194 _PING_STATUS_DOWN = False
195 _PING_STATUS_UP = True
196
Ismail Noorbasha07fdb612013-02-14 14:13:31 -0800197 # Allowed values for the power_method argument.
198
199 # POWER_CONTROL_RPM: Passed as default arg for power_off/on/cycle() methods.
200 # POWER_CONTROL_SERVO: Used in set_power() and power_cycle() methods.
201 # POWER_CONTROL_MANUAL: Used in set_power() and power_cycle() methods.
202 POWER_CONTROL_RPM = 'RPM'
203 POWER_CONTROL_SERVO = 'servoj10'
204 POWER_CONTROL_MANUAL = 'manual'
205
206 POWER_CONTROL_VALID_ARGS = (POWER_CONTROL_RPM,
207 POWER_CONTROL_SERVO,
208 POWER_CONTROL_MANUAL)
Richard Barnette0c73ffc2012-11-19 15:21:18 -0800209
Simran Basi5e6339a2013-03-21 11:34:32 -0700210 _RPM_OUTLET_CHANGED = 'outlet_changed'
211
@staticmethod
def get_servo_arguments(args_dict):
    """Pick the servo-related options out of `args_dict`.

    Returns the subset of `args_dict` holding the standard
    arguments used to construct a servo object for a host
    ('servo_host' and 'servo_port').  Keys that are absent from
    `args_dict` are absent from the result.  The intent is to
    provide standard argument processing from run_remote_tests
    for tests that require a servo to operate.

    Recommended usage:
    ~~~~~~~~
        args_dict = utils.args_to_dict(args)
        servo_args = hosts.SiteHost.get_servo_arguments(args_dict)
        host = hosts.create_host(machine, servo_args=servo_args)
    ~~~~~~~~

    @param args_dict Dictionary from which to extract the servo
      arguments.
    @return a new dictionary with the servo arguments that were found.
    """
    servo_keys = ('servo_host', 'servo_port')
    return dict((key, args_dict[key])
                for key in servo_keys if key in args_dict)
J. Richard Barnette134ec2c2012-04-25 12:59:37 -0700237
J. Richard Barnette964fba02012-10-24 17:34:29 -0700238
def _initialize(self, hostname, servo_args=None, *args, **dargs):
    """Initialize superclasses, and |self.servo|.

    |self.servo| is chosen as follows:  a servo found for the host
    in the lab is always used.  Otherwise, if the caller supplied
    `servo_args` (settings for `servo_host`, `servo_port`, or
    both, typically from a control file that requires servo), a
    servo is created from them.  If neither applies, `self.servo`
    is the (false) result of the lab lookup.

    @param hostname: name of the host to initialize.
    @param servo_args: keyword arguments for servo.Servo, or None.
    """
    super(SiteHost, self)._initialize(hostname=hostname,
                                      *args, **dargs)
    # self.env holds environment variable settings exported for
    # commands run on the host.  LIBC_FATAL_STDERR_ can be useful
    # for diagnosing certain errors that might happen.
    self.env['LIBC_FATAL_STDERR_'] = '1'
    self._xmlrpc_proxy_map = {}
    self.servo = _get_lab_servo(hostname)
    if self.servo or servo_args is None:
        return
    self.servo = servo.Servo(**servo_args)
J. Richard Barnette45e93de2012-04-11 17:24:15 -0700262
263
def get_repair_image_name(self):
    """Build the repair image name from the global config.

    Formats the CROS.stable_build_pattern setting with this host's
    board and the CROS.stable_cros_version setting.

    @returns a str of $board-version/$BUILD.
    @raises AutoservError if the host has no board.

    """
    config = global_config.global_config
    stable_version = config.get_config_value('CROS', 'stable_cros_version')
    build_pattern = config.get_config_value('CROS', 'stable_build_pattern')
    board = self._get_board_from_afe()
    if board is not None:
        return build_pattern % (board, stable_version)
    raise error.AutoservError('DUT has no board attribute, '
                              'cannot be repaired.')
279
280
Scott Zawalski62bacae2013-03-05 10:40:32 -0500281 def _host_in_AFE(self):
282 """Check if the host is an object the AFE knows.
283
284 @returns the host object.
285 """
286 return self._AFE.get_hosts(hostname=self.hostname)
287
288
def lookup_job_repo_url(self):
    """Looks up the job_repo_url for the host.

    @returns job_repo_url from AFE, or None if the AFE does not know
             this host or the host has no job_repo_url attribute.
    """
    # _host_in_AFE() already returns the AFE's records for this
    # host, so use that result instead of issuing a second,
    # identical get_hosts() query.
    hosts = self._host_in_AFE()
    if not hosts:
        return None

    attributes = hosts[0].attributes
    if ds_constants.JOB_REPO_URL in attributes:
        return attributes[ds_constants.JOB_REPO_URL]
    return None
Chris Sosab76e0ee2013-05-22 16:55:41 -0700302
303
def clear_cros_version_labels_and_job_repo_url(self):
    """Clear cros_version labels and host attribute job_repo_url.

    Does nothing when the AFE does not know this host.
    """
    if self._host_in_AFE():
        this_host = [self.hostname]
        version_labels = self._AFE.get_labels(
                name__startswith=ds_constants.VERSION_PREFIX,
                host__hostname=self.hostname)
        for version_label in version_labels:
            version_label.remove_hosts(hosts=this_host)

        # Passing None for both arguments resets job_repo_url to None.
        self.update_job_repo_url(None, None)
318
319
def update_job_repo_url(self, devserver_url, image_name):
    """
    Updates the job_repo_url host attribute and asserts its value.

    The attribute is set to the package url built from the two
    arguments, or to None unless both are given, and is then read
    back to confirm that the AFE stored it.

    @param devserver_url: The devserver to use in the job_repo_url.
    @param image_name: The name of the image to use in the job_repo_url.

    @raises AutoservError: If we failed to update the job_repo_url.
    """
    if devserver_url and image_name:
        repo_url = tools.get_package_url(devserver_url, image_name)
    else:
        repo_url = None
    self._AFE.set_host_attribute(ds_constants.JOB_REPO_URL, repo_url,
                                 hostname=self.hostname)
    stored_url = self.lookup_job_repo_url()
    if stored_url == repo_url:
        return
    raise error.AutoservError('Failed to update job_repo_url with %s, '
                              'host %s' % (repo_url, self.hostname))
Scott Zawalski89c44dd2013-02-26 09:28:02 -0500337
338
def add_cros_version_labels_and_job_repo_url(self, image_name):
    """Add cros_version labels and host attribute job_repo_url.

    Does nothing when the AFE does not know this host.  The version
    label is created in the AFE if it does not exist yet.

    @param image_name: The name of the image e.g.
            lumpy-release/R27-3837.0.0

    """
    if not self._host_in_AFE():
        return

    cros_label = '%s%s' % (ds_constants.VERSION_PREFIX, image_name)
    devserver_url = dev_server.ImageServer.resolve(image_name).url()

    existing = self._AFE.get_labels(name=cros_label)
    if existing:
        version_label = existing[0]
    else:
        version_label = self._AFE.create_label(name=cros_label)
    version_label.add_hosts([self.hostname])

    self.update_job_repo_url(devserver_url, image_name)
360
361
def verify_job_repo_url(self):
    """
    Make sure job_repo_url of this host is valid.

    Eg: The job_repo_url
    "http://lmn.cd.ab.xyx:8080/static/archive/lumpy-release/R29-4279.0.0/autotest/packages"
    claims to have the autotest package for lumpy-release/R29-4279.0.0.
    The autotest artifacts for that build are staged on a resolved
    devserver; if that devserver differs from the one embedded in
    the url, the job_repo_url of the host is updated to point at it.
    A host without a job_repo_url is only logged.

    @raises DevServerException: If we could not resolve a devserver.
    @raises AutoservError: If we're unable to save the new job_repo_url as
        a result of choosing a new devserver because the old one failed to
        respond to a health check.
    """
    job_repo_url = self.lookup_job_repo_url()
    if not job_repo_url:
        logging.warning('No job repo url set on host %s', self.hostname)
        return

    logging.info('Verifying job repo url %s', job_repo_url)
    parsed = tools.get_devserver_build_from_package_url(job_repo_url)
    devserver_url, image_name = parsed

    ds = dev_server.ImageServer.resolve(image_name)

    logging.info('Staging autotest artifacts for %s on devserver %s',
                 image_name, ds.url())
    ds.stage_artifacts(image_name, ['autotest'])

    if ds.url() == devserver_url:
        return
    logging.info('Devserver url changed, new devserver is %s, '
                 'old devserver was %s',
                 ds.url(), devserver_url)
    self.update_job_repo_url(ds.url(), image_name)
Scott Zawalskieadbf702013-03-14 09:23:06 -0400401
402
Dan Shi0f466e82013-02-22 15:44:58 -0800403 def _try_stateful_update(self, update_url, force_update, updater):
404 """Try to use stateful update to initialize DUT.
405
406 When DUT is already running the same version that machine_install
407 tries to install, stateful update is a much faster way to clean up
408 the DUT for testing, compared to a full reimage. It is implemeted
409 by calling autoupdater.run_update, but skipping updating root, as
410 updating the kernel is time consuming and not necessary.
411
412 @param update_url: url of the image.
413 @param force_update: Set to True to update the image even if the DUT
414 is running the same version.
415 @param updater: ChromiumOSUpdater instance used to update the DUT.
416 @returns: True if the DUT was updated with stateful update.
417
418 """
419 if not updater.check_version():
420 return False
421 if not force_update:
422 logging.info('Canceling stateful update because the new and '
423 'old versions are the same.')
424 return False
425 # Following folders should be rebuilt after stateful update.
426 # A test file is used to confirm each folder gets rebuilt after
427 # the stateful update.
428 folders_to_check = ['/var', '/home', '/mnt/stateful_partition']
429 test_file = '.test_file_to_be_deleted'
430 for folder in folders_to_check:
431 touch_path = os.path.join(folder, test_file)
432 self.run('touch %s' % touch_path)
433
434 if not updater.run_update(force_update=True, update_root=False):
435 return False
436
437 # Reboot to complete stateful update.
Chris Sosab76e0ee2013-05-22 16:55:41 -0700438 self.reboot(timeout=self.REBOOT_TIMEOUT, wait=True)
Dan Shi0f466e82013-02-22 15:44:58 -0800439 check_file_cmd = 'test -f %s; echo $?'
440 for folder in folders_to_check:
441 test_file_path = os.path.join(folder, test_file)
442 result = self.run(check_file_cmd % test_file_path,
443 ignore_status=True)
444 if result.exit_status == 1:
445 return False
446 return True
447
448
def _post_update_processing(self, updater, expected_kernel=None):
    """After the DUT is updated, confirm machine_install succeeded.

    Marks the DUT as a lab machine, then checks in order that the
    expected kernel is active (no rollback), that the expected build
    is installed, and that the active kernel gets marked successful
    within _KERNEL_UPDATE_TIMEOUT seconds.

    @param updater: ChromiumOSUpdater instance used to update the DUT.
    @param expected_kernel: kernel expected to be active after reboot,
        or `None` to skip rollback checking.
    @raises autoupdater.ChromiumOSError if any of the checks fails.

    """
    # The lab machine file is a marker that distinguishes this
    # image from other test images.  The autoreboot script depends
    # on that file, so it is started only after the file exists.
    self.run('touch %s' % self._LAB_MACHINE_FILE)
    self.run('start autoreboot')

    # Figure out the newly active kernel.
    booted_kernel, _ = updater.get_kernel_state()

    # Check for rollback due to a bad build.
    rolled_back = expected_kernel and booted_kernel != expected_kernel
    if rolled_back:
        # Print out some information to make it easier to debug
        # the rollback.
        logging.debug('Dumping partition table.')
        self.run('cgpt show $(rootdev -s -d)')
        logging.debug('Dumping crossystem for firmware debugging.')
        self.run('crossystem --all')
        raise autoupdater.ChromiumOSError(
                'Build %s failed to boot on %s; system rolled back '
                'to previous build' % (updater.update_version,
                                       self.hostname))

    # Check that we've got the build we meant to install.
    if not updater.check_version_to_confirm_install():
        raise autoupdater.ChromiumOSError(
                'Failed to update %s to build %s; found build '
                '%s instead' % (self.hostname,
                                updater.update_version,
                                updater.get_build_id()))

    def _kernel_marked_good():
        """Tell whether the booted kernel has been marked successful."""
        return (updater.get_kernel_tries(booted_kernel) == 0
                and updater.get_kernel_success(booted_kernel))

    # Make sure chromeos-setgoodkernel runs.
    try:
        utils.poll_for_condition(
                _kernel_marked_good,
                exception=autoupdater.ChromiumOSError(),
                timeout=self._KERNEL_UPDATE_TIMEOUT, sleep_interval=5)
    except autoupdater.ChromiumOSError:
        # Use the state of system-services to pick which failure
        # to report.
        services_status = self.run('status system-services').stdout
        if services_status == 'system-services start/running\n':
            event = ('update-engine failed to call '
                     'chromeos-setgoodkernel')
        else:
            event = ('Chrome failed to reach login screen')
        raise autoupdater.ChromiumOSError(
                'After update and reboot, %s '
                'within %d seconds' % (event,
                                       self._KERNEL_UPDATE_TIMEOUT))
Dan Shi0f466e82013-02-22 15:44:58 -0800506
507
def _stage_image_for_update(self, image_name=None):
    """Stage a build on a devserver and return the update_url.

    The download on the devserver is triggered with
    synchronous=False.

    @param image_name: a name like lumpy-release/R27-3837.0.0; when
                       empty, the repair image name is used.
    @returns an update URL like:
        http://172.22.50.205:8082/update/lumpy-release/R27-3837.0.0
    """
    image_name = image_name or self.get_repair_image_name()
    logging.info('Staging build for AU: %s', image_name)
    devserver = dev_server.ImageServer.resolve(image_name)
    devserver.trigger_download(image_name, synchronous=False)
    url_pattern = tools.image_url_pattern()
    return url_pattern % (devserver.url(), image_name)
521
522
def stage_image_for_servo(self, image_name=None):
    """Stage a test image on a devserver and return its URL.

    @param image_name: a name like lumpy-release/R27-3837.0.0; when
                       empty, the repair image name is used.
    @returns the URL reported by the devserver's get_test_image_url()
             for the staged image.
    """
    image_name = image_name or self.get_repair_image_name()
    logging.info('Staging build for servo install: %s', image_name)
    devserver = dev_server.ImageServer.resolve(image_name)
    devserver.stage_artifacts(image_name, ['test_image'])
    test_image_url = devserver.get_test_image_url(image_name)
    return test_image_url
536
537
Chris Sosaa3ac2152012-05-23 22:23:13 -0700538 def machine_install(self, update_url=None, force_update=False,
Scott Zawalski89c44dd2013-02-26 09:28:02 -0500539 local_devserver=False, repair=False):
540 """Install the DUT.
541
Dan Shi0f466e82013-02-22 15:44:58 -0800542 Use stateful update if the DUT is already running the same build.
543 Stateful update does not update kernel and tends to run much faster
544 than a full reimage. If the DUT is running a different build, or it
545 failed to do a stateful update, full update, including kernel update,
546 will be applied to the DUT.
547
Scott Zawalskieadbf702013-03-14 09:23:06 -0400548 Once a host enters machine_install its cros_version label will be
549 removed as well as its host attribute job_repo_url (used for
550 package install).
551
Scott Zawalski89c44dd2013-02-26 09:28:02 -0500552 @param update_url: The url to use for the update
553 pattern: http://$devserver:###/update/$build
554 If update_url is None and repair is True we will install the
555 stable image listed in global_config under
556 CROS.stable_cros_version.
557 @param force_update: Force an update even if the version installed
558 is the same. Default:False
559 @param local_devserver: Used by run_remote_test to allow people to
560 use their local devserver. Default: False
561 @param repair: Whether or not we are in repair mode. This adds special
562 cases for repairing a machine like starting update_engine.
563 Setting repair to True sets force_update to True as well.
564 default: False
565 @raises autoupdater.ChromiumOSError
566
567 """
Dan Shi7458bf62013-06-10 12:50:16 -0700568 if update_url:
569 logging.debug('update url is set to %s', update_url)
570 else:
571 logging.debug('update url is not set, resolving...')
J. Richard Barnettee4af8b92013-05-01 13:16:12 -0700572 if self._parser.options.image:
573 requested_build = self._parser.options.image
574 if requested_build.startswith('http://'):
575 update_url = requested_build
Dan Shi7458bf62013-06-10 12:50:16 -0700576 logging.debug('update url is retrieved from requested_build'
577 ': %s', update_url)
J. Richard Barnettee4af8b92013-05-01 13:16:12 -0700578 else:
579 # Try to stage any build that does not start with
580 # http:// on the devservers defined in
581 # global_config.ini.
Dan Shi7458bf62013-06-10 12:50:16 -0700582 update_url = self._stage_image_for_update(requested_build)
583 logging.debug('Build staged, and update_url is set to: %s',
584 update_url)
J. Richard Barnettee4af8b92013-05-01 13:16:12 -0700585 elif repair:
586 update_url = self._stage_image_for_update()
Dan Shi7458bf62013-06-10 12:50:16 -0700587 logging.debug('Build staged, and update_url is set to: %s',
588 update_url)
Scott Zawalskieadbf702013-03-14 09:23:06 -0400589 else:
J. Richard Barnettee4af8b92013-05-01 13:16:12 -0700590 raise autoupdater.ChromiumOSError(
591 'Update failed. No update URL provided.')
Scott Zawalski89c44dd2013-02-26 09:28:02 -0500592
Scott Zawalski89c44dd2013-02-26 09:28:02 -0500593 if repair:
Dan Shi0f466e82013-02-22 15:44:58 -0800594 # In case the system is in a bad state, we always reboot the machine
595 # before machine_install.
Chris Sosab76e0ee2013-05-22 16:55:41 -0700596 self.reboot(timeout=self.REBOOT_TIMEOUT, wait=True)
Scott Zawalski89c44dd2013-02-26 09:28:02 -0500597 self.run('stop update-engine; start update-engine')
598 force_update = True
Dan Shi0f466e82013-02-22 15:44:58 -0800599
Chris Sosaa3ac2152012-05-23 22:23:13 -0700600 updater = autoupdater.ChromiumOSUpdater(update_url, host=self,
Chris Sosa72312602013-04-16 15:01:56 -0700601 local_devserver=local_devserver)
Dan Shi0f466e82013-02-22 15:44:58 -0800602 updated = False
Scott Zawalskieadbf702013-03-14 09:23:06 -0400603 # Remove cros-version and job_repo_url host attribute from host.
604 self.clear_cros_version_labels_and_job_repo_url()
Dan Shi0f466e82013-02-22 15:44:58 -0800605 # If the DUT is already running the same build, try stateful update
606 # first. Stateful update does not update kernel and tends to run much
607 # faster than a full reimage.
608 try:
Chris Sosab76e0ee2013-05-22 16:55:41 -0700609 updated = self._try_stateful_update(
610 update_url, force_update, updater)
Dan Shi0f466e82013-02-22 15:44:58 -0800611 if updated:
612 logging.info('DUT is updated with stateful update.')
613 except Exception as e:
614 logging.exception(e)
615 logging.warn('Failed to stateful update DUT, force to update.')
J. Richard Barnette45e93de2012-04-11 17:24:15 -0700616
Dan Shi0f466e82013-02-22 15:44:58 -0800617 inactive_kernel = None
618 # Do a full update if stateful update is not applicable or failed.
619 if not updated:
620 # In case the system is in a bad state, we always reboot the
621 # machine before machine_install.
Chris Sosab76e0ee2013-05-22 16:55:41 -0700622 self.reboot(timeout=self.REBOOT_TIMEOUT, wait=True)
Chris Sosab7612bc2013-03-21 10:32:37 -0700623
624 # TODO(sosa): Remove temporary hack to get rid of bricked machines
625 # that can't update due to a corrupted policy.
626 self.run('rm -rf /var/lib/whitelist')
627 self.run('touch /var/lib/whitelist')
628 self.run('chmod -w /var/lib/whitelist')
Scott Zawalskib550d5a2013-03-22 09:23:59 -0400629 self.run('stop update-engine; start update-engine')
Chris Sosab7612bc2013-03-21 10:32:37 -0700630
Dan Shi0f466e82013-02-22 15:44:58 -0800631 if updater.run_update(force_update):
632 updated = True
633 # Figure out active and inactive kernel.
634 active_kernel, inactive_kernel = updater.get_kernel_state()
J. Richard Barnette45e93de2012-04-11 17:24:15 -0700635
Dan Shi0f466e82013-02-22 15:44:58 -0800636 # Ensure inactive kernel has higher priority than active.
637 if (updater.get_kernel_priority(inactive_kernel)
638 < updater.get_kernel_priority(active_kernel)):
639 raise autoupdater.ChromiumOSError(
640 'Update failed. The priority of the inactive kernel'
641 ' partition is less than that of the active kernel'
642 ' partition.')
J. Richard Barnette45e93de2012-04-11 17:24:15 -0700643
Dan Shi0f466e82013-02-22 15:44:58 -0800644 update_engine_log = '/var/log/update_engine.log'
645 logging.info('Dumping %s', update_engine_log)
646 self.run('cat %s' % update_engine_log)
647 # Updater has returned successfully; reboot the host.
Chris Sosab76e0ee2013-05-22 16:55:41 -0700648 self.reboot(timeout=self.REBOOT_TIMEOUT, wait=True)
J. Richard Barnette45e93de2012-04-11 17:24:15 -0700649
Dan Shi0f466e82013-02-22 15:44:58 -0800650 if updated:
651 self._post_update_processing(updater, inactive_kernel)
Scott Zawalskieadbf702013-03-14 09:23:06 -0400652 image_name = autoupdater.url_to_image_name(update_url)
Dan Shie9309262013-06-19 22:50:21 -0700653 self.add_cros_version_labels_and_job_repo_url(image_name)
Simran Basi13fa1ba2013-03-04 10:56:47 -0800654
J. Richard Barnette45e93de2012-04-11 17:24:15 -0700655 # Clean up any old autotest directories which may be lying around.
656 for path in global_config.global_config.get_config_value(
657 'AUTOSERV', 'client_autodir_paths', type=list):
658 self.run('rm -rf ' + path)
659
660
def _get_board_from_afe(self):
    """Look up this host's board from its AFE labels.

    The lookup is delegated to `server_utils.get_board_from_afe()`,
    which is given this host's name and AFE handle.  The label of
    interest has the form "board:<board>"; the "<board>" part is
    what gets returned.  `None` is returned when there is not a
    single, unique label matching that pattern.

    @returns board from label, or `None`.
    """
    hostname, afe = self.hostname, self._AFE
    return server_utils.get_board_from_afe(hostname, afe)
Simran Basi833814b2013-01-29 13:13:43 -0800671
672
def get_build(self):
    """Fetch the build currently recorded for this Host in the AFE.

    The lookup is delegated to `server_utils.get_build_from_afe()`,
    which inspects this host's AFE labels.

    @returns The current build, or None if no build could be found or
             if multiple build labels were assigned to this host.
    """
    hostname, afe = self.hostname, self._AFE
    return server_utils.get_build_from_afe(hostname, afe)
Richard Barnette82c35912012-11-20 10:09:10 -0800682
683
Scott Zawalski89c44dd2013-02-26 09:28:02 -0500684 def _install_repair(self):
685 """Attempt to repair this host using upate-engine.
686
687 If the host is up, try installing the DUT with a stable
688 "repair" version of Chrome OS as defined in the global_config
689 under CROS.stable_cros_version.
690
Scott Zawalski62bacae2013-03-05 10:40:32 -0500691 @raises AutoservRepairMethodNA if the DUT is not reachable.
692 @raises ChromiumOSError if the install failed for some reason.
Scott Zawalski89c44dd2013-02-26 09:28:02 -0500693
694 """
695 if not self.is_up():
Scott Zawalski62bacae2013-03-05 10:40:32 -0500696 raise error.AutoservRepairMethodNA('DUT unreachable for install.')
Scott Zawalski89c44dd2013-02-26 09:28:02 -0500697
698 logging.info('Attempting to reimage machine to repair image.')
699 try:
700 self.machine_install(repair=True)
Fang Dengd0672f32013-03-18 17:18:09 -0700701 except autoupdater.ChromiumOSError as e:
702 logging.exception(e)
Scott Zawalski89c44dd2013-02-26 09:28:02 -0500703 logging.info('Repair via install failed.')
Scott Zawalski62bacae2013-03-05 10:40:32 -0500704 raise
Scott Zawalski89c44dd2013-02-26 09:28:02 -0500705
706
def servo_install(self, image_url=None):
    """Re-install the OS on the DUT using the attached Servo.

    The steps are:
      1) install a test image on a USB storage device attached to the
         Servo board,
      2) boot that image in recovery mode, and then
      3) install the image with chromeos-install, power the DUT off,
         switch the USB key off and power the DUT back on.

    @param image_url: If specified use as the url to install on the DUT.
            Otherwise boot the currently staged image on the USB stick.

    @raises AutoservRepairFailure if the DUT fails to boot from USB.
    @raises AutoservError if the installed image fails to boot.
    """
    self.servo.install_recovery_image(image_url)
    booted_from_usb = self.wait_up(timeout=self.USB_BOOT_TIMEOUT)
    if not booted_from_usb:
        raise error.AutoservRepairFailure(
                'DUT failed to boot from USB after %d seconds' %
                self.USB_BOOT_TIMEOUT)

    self.run('chromeos-install --yes', timeout=self._INSTALL_TIMEOUT)

    # Power down, detach the USB key, then power up so that the DUT
    # boots the freshly installed image.
    self.servo.power_long_press()
    self.servo.switch_usbkey('off')
    self.servo.power_short_press()

    booted_installed_image = self.wait_up(timeout=self.BOOT_TIMEOUT)
    if not booted_installed_image:
        raise error.AutoservError('DUT failed to reboot installed '
                                  'test image after %d seconds' %
                                  self.BOOT_TIMEOUT)
734
735
J. Richard Barnettee4af8b92013-05-01 13:16:12 -0700736 def _servo_repair_reinstall(self):
Scott Zawalski62bacae2013-03-05 10:40:32 -0500737 """Reinstall the DUT utilizing servo and a test image.
738
739 Re-install the OS on the DUT by:
740 1) installing a test image on a USB storage device attached to the Servo
741 board,
742 2) booting that image in recovery mode, and then
743 3) installing the image with chromeos-install.
744
Scott Zawalski62bacae2013-03-05 10:40:32 -0500745 @raises AutoservRepairMethodNA if the device does not have servo
746 support.
747
748 """
749 if not self.servo:
750 raise error.AutoservRepairMethodNA('Repair Reinstall NA: '
751 'DUT has no servo support.')
752
753 logging.info('Attempting to recovery servo enabled device with '
754 'servo_repair_reinstall')
755
J. Richard Barnettee4af8b92013-05-01 13:16:12 -0700756 image_url = self.stage_image_for_servo()
Scott Zawalski62bacae2013-03-05 10:40:32 -0500757 self.servo_install(image_url)
758
759
760 def _servo_repair_power(self):
761 """Attempt to repair DUT using an attached Servo.
762
763 Attempt to power on the DUT via power_long_press.
764
765 @raises AutoservRepairMethodNA if the device does not have servo
766 support.
767 @raises AutoservRepairFailure if the repair fails for any reason.
768 """
769 if not self.servo:
770 raise error.AutoservRepairMethodNA('Repair Power NA: '
771 'DUT has no servo support.')
772
773 logging.info('Attempting to recover servo enabled device by '
774 'powering it off and on.')
775 self.servo.get_power_state_controller().power_off()
776 self.servo.get_power_state_controller().power_on()
777 if self.wait_up(self.BOOT_TIMEOUT):
778 return
779
780 raise error.AutoservRepairFailure('DUT did not boot after long_press.')
Richard Barnette03a0c132012-11-05 12:40:35 -0800781
782
Richard Barnette82c35912012-11-20 10:09:10 -0800783 def _powercycle_to_repair(self):
784 """Utilize the RPM Infrastructure to bring the host back up.
785
786 If the host is not up/repaired after the first powercycle we utilize
787 auto fallback to the last good install by powercycling and rebooting the
788 host 6 times.
Scott Zawalski62bacae2013-03-05 10:40:32 -0500789
790 @raises AutoservRepairMethodNA if the device does not support remote
791 power.
792 @raises AutoservRepairFailure if the repair fails for any reason.
793
Richard Barnette82c35912012-11-20 10:09:10 -0800794 """
Scott Zawalski62bacae2013-03-05 10:40:32 -0500795 if not self.has_power():
796 raise error.AutoservRepairMethodNA('Device does not support power.')
797
Richard Barnette82c35912012-11-20 10:09:10 -0800798 logging.info('Attempting repair via RPM powercycle.')
799 failed_cycles = 0
800 self.power_cycle()
801 while not self.wait_up(timeout=self.BOOT_TIMEOUT):
802 failed_cycles += 1
803 if failed_cycles >= self._MAX_POWER_CYCLE_ATTEMPTS:
Scott Zawalski62bacae2013-03-05 10:40:32 -0500804 raise error.AutoservRepairFailure(
805 'Powercycled host %s %d times; device did not come back'
806 ' online.' % (self.hostname, failed_cycles))
Richard Barnette82c35912012-11-20 10:09:10 -0800807 self.power_cycle()
808 if failed_cycles == 0:
809 logging.info('Powercycling was successful first time.')
810 else:
811 logging.info('Powercycling was successful after %d failures.',
812 failed_cycles)
813
814
def repair_full(self):
    """Repair a host for repair level NO_PROTECTION.

    This overrides the base class function for repair; it does
    not call back to the parent class, but instead offers a
    simplified implementation based on the capabilities in the
    Chrome OS test lab.

    The following procedures are attempted in order; the first one
    that completes and is followed by a successful `self.verify()`
    ends the repair:
      1. Re-install to a known stable image using auto-update.
      2. If there's a servo for the DUT, power the DUT off and on.
      3. If there's a servo for the DUT, re-install via the servo.
      4. If the DUT can be power-cycled via RPM, repair by
         power-cycling.

    As with the parent method, the last operation performed on
    the DUT on success is a call to `self.verify()`.

    @raises AutoservRepairTotalFailure if the repair process fails to
            fix the DUT.
    """
    # TODO(scottz): This should use something similar to label_decorator,
    # but needs to be populated in order so DUTs are repaired with the
    # least amount of effort.
    strategies = (
        self._install_repair,
        self._servo_repair_power,
        self._servo_repair_reinstall,
        self._powercycle_to_repair,
    )
    failure_messages = []
    for strategy in strategies:
        try:
            strategy()
            self.verify()
        except Exception as e:
            # Any failure just moves us on to the next strategy; the
            # message is kept for the final summary.
            logging.warning('Failed to repair device: %s', e)
            failure_messages.append(str(e))
        else:
            return

    summary = '\n'.join(failure_messages)
    raise error.AutoservRepairTotalFailure(
            'All attempts at repairing the device failed:\n%s' % summary)
Richard Barnette82c35912012-11-20 10:09:10 -0800860
861
def close(self):
    """Close this host and drop all of its XMLRPC connections.

    The parent class's `close()` runs first; afterwards every
    connection made through `xmlrpc_connect()` is torn down with
    `xmlrpc_disconnect_all()`.
    """
    super(SiteHost, self).close()
    self.xmlrpc_disconnect_all()
865
866
def _cleanup_poweron(self):
    """Special cleanup method to make sure hosts always get power back.

    Nothing is done unless the AFE knows this host and the host
    carries the `_RPM_OUTLET_CHANGED` attribute.  Otherwise power is
    switched on and the attribute is reset to None afterwards, whether
    or not switching the power on succeeded.
    """
    afe = frontend_wrappers.RetryingAFE(timeout_min=5, delay_sec=10)
    matching_hosts = afe.get_hosts(hostname=self.hostname)
    if not matching_hosts:
        return
    if self._RPM_OUTLET_CHANGED not in matching_hosts[0].attributes:
        return

    logging.debug('This host has recently interacted with the RPM'
                  ' Infrastructure. Ensuring power is on.')
    try:
        self.power_on()
    except rpm_client.RemotePowerException:
        # If cleanup has completed but there was an issue with the RPM
        # Infrastructure, log an error message rather than fail cleanup
        logging.error('Failed to turn Power On for this host after '
                      'cleanup through the RPM Infrastructure.')
    afe.set_host_attribute(self._RPM_OUTLET_CHANGED, None,
                           hostname=self.hostname)
885
886
def cleanup(self):
    """Clean up the host after a job by restarting its UI.

    The cleanup-logs-paused marker file is removed, the login prompt
    state is cleared, the UI is restarted and the login prompt is
    waited for.  When any of the UI steps fails, the parent class's
    cleanup is used instead.  Finally, hosts with RPM power control
    have their power state checked by `_cleanup_poweron()`.
    """
    cros_ui_module = 'autotest_lib.client.cros.cros_ui'
    client_at = autotest.Autotest(self)
    self.run('rm -f %s' % constants.CLEANUP_LOGS_PAUSED_FILE)
    try:
        client_at.run_static_method(cros_ui_module,
                                    '_clear_login_prompt_state')
        self.run('restart ui')
        client_at.run_static_method(cros_ui_module,
                                    '_wait_for_login_prompt')
    except (error.AutotestRunError, error.AutoservRunError):
        logging.warning('Unable to restart ui, rebooting device.')
        # Since restarting the UI fails fall back to normal Autotest
        # cleanup routines, i.e. reboot the machine.
        super(SiteHost, self).cleanup()

    # Check if the rpm outlet was manipulated.
    rpm_controlled = self.has_power()
    if rpm_controlled:
        self._cleanup_poweron()
J. Richard Barnette45e93de2012-04-11 17:24:15 -0700904
905
def reboot(self, **dargs):
    """Reboot the site host with Chrome OS specific defaults.

    The more generic RemoteHost.reboot() performs sync and sleeps for
    5 seconds.  This is not necessary for Chrome OS devices as the
    sync should be finished in a short time during the reboot
    command.

    Callers may still pass their own `reboot_cmd` or `fastsync`; the
    defaults below are applied only when those keys are absent.

    @param dargs Keyword arguments forwarded to the parent `reboot()`.
    """
    dargs.setdefault('reboot_cmd',
                     '((reboot & sleep 10; reboot -f &)'
                     ' </dev/null >/dev/null 2>&1 &)')
    # Enable fastsync to avoid running extra sync commands before reboot.
    dargs.setdefault('fastsync', True)
    super(SiteHost, self).reboot(**dargs)
921
922
def verify_software(self):
    """Verify working software on a Chrome OS system.

    Tests for the following conditions:
     1. All conditions tested by the parent version of this
        function.
     2. Sufficient space in /mnt/stateful_partition.
     3. Sufficient space in /mnt/stateful_partition/encrypted.
     4. update_engine answers a simple status request.
     5. python runs on the host and can import cPickle.

    """
    super(SiteHost, self).verify_software()

    # (path to check, SERVER config key, default requirement in GB)
    space_requirements = (
        ('/mnt/stateful_partition',
         'gb_diskspace_required', 20.0),
        ('/mnt/stateful_partition/encrypted',
         'gb_encrypted_diskspace_required', 0.1),
    )
    for path, config_key, default_gb in space_requirements:
        required_gb = global_config.global_config.get_config_value(
                'SERVER', config_key, type=float, default=default_gb)
        self.check_diskspace(path, required_gb)

    self.run('update_engine_client --status')
    # Makes sure python is present, loads and can use built in functions.
    # We have seen cases where importing cPickle fails with undefined
    # symbols in cPickle.so.
    self.run('python -c "import cPickle"')
J. Richard Barnette134ec2c2012-04-25 12:59:37 -0700950
951
def xmlrpc_connect(self, command, port, command_name=None,
                   ready_test_name=None, timeout_seconds=10):
    """Connect to an XMLRPC server on the host.

    The `command` argument should be a simple shell command that
    starts an XMLRPC server on the given `port`.  The command
    must not daemonize, and must terminate cleanly on SIGTERM.
    The command is started in the background on the host, and a
    local XMLRPC client for the server is created and returned
    to the caller.

    Any connection previously made for the same `port` is
    disconnected first.

    Note that the process of creating an XMLRPC client makes no
    attempt to connect to the remote server; the caller is
    responsible for determining whether the server is running
    correctly, and is ready to serve requests.

    Optionally, the caller can pass ready_test_name, a string
    containing the name of a method to call on the proxy.  This
    method should take no parameters and return successfully only
    when the server is ready to process client requests.  When
    ready_test_name is set, xmlrpc_connect will block until the
    proxy is ready.  If the readiness call does not succeed, the
    connection is torn down with `xmlrpc_disconnect()` and the
    exception propagates to the caller.

    @param command Shell command to start the server.
    @param port Port number on which the server is expected to
                be serving.
    @param command_name String to use as input to `pkill` to
        terminate the XMLRPC server on the host.
    @param ready_test_name String containing the name of a
        method defined on the XMLRPC server.
    @param timeout_seconds Number of seconds to wait
        for the server to become 'ready.'  The exception raised
        on timeout comes from `retry.retry`.
        NOTE(review): earlier documentation named both TestError
        and TestFail here; confirm the actual type.
    @returns The `xmlrpclib.ServerProxy` for the tunneled server.

    """
    self.xmlrpc_disconnect(port)

    # Chrome OS on the target closes down most external ports
    # for security.  We could open the port, but doing that
    # would conflict with security tests that check that only
    # expected ports are open.  So, to get to the port on the
    # target we use an ssh tunnel.
    local_port = utils.get_unused_port()
    tunnel_options = '-n -N -q -L %d:localhost:%d' % (local_port, port)
    ssh_cmd = make_ssh_command(opts=tunnel_options)
    tunnel_cmd = '%s %s' % (ssh_cmd, self.hostname)
    logging.debug('Full tunnel command: %s', tunnel_cmd)
    tunnel_proc = subprocess.Popen(tunnel_cmd, shell=True, close_fds=True)
    logging.debug('Started XMLRPC tunnel, local = %d'
                  ' remote = %d, pid = %d',
                  local_port, port, tunnel_proc.pid)

    # Start the server on the host.  Redirection in the command
    # below is necessary, because 'ssh' won't terminate until
    # background child processes close stdin, stdout, and
    # stderr.
    # NOTE(review): if this run() raises, the tunnel started above
    # has not yet been recorded in _xmlrpc_proxy_map, so nothing
    # will terminate it -- confirm whether that matters.
    remote_cmd = '( %s ) </dev/null >/dev/null 2>&1 & echo $!' % command
    remote_pid = self.run(remote_cmd).stdout.rstrip('\n')
    logging.debug('Started XMLRPC server on host %s, pid = %s',
                  self.hostname, remote_pid)

    # Record what xmlrpc_disconnect() needs: the name to pkill on
    # the host, and the local tunnel process.
    self._xmlrpc_proxy_map[port] = (command_name, tunnel_proc)
    rpc_url = 'http://localhost:%d' % local_port
    proxy = xmlrpclib.ServerProxy(rpc_url, allow_none=True)
    if ready_test_name is not None:
        # retry.retry logs each attempt; calculate delay_sec to
        # keep log spam to a dull roar.
        @retry.retry((socket.error,
                      xmlrpclib.ProtocolError,
                      httplib.BadStatusLine),
                     timeout_min=timeout_seconds/60.0,
                     delay_sec=min(max(timeout_seconds/20.0, 0.1), 1))
        def ready_test():
            """ Call proxy.ready_test_name(). """
            getattr(proxy, ready_test_name)()
        # The flag lets the finally clause distinguish failure
        # from success without catching the exception.
        successful = False
        try:
            logging.info('Waiting %d seconds for XMLRPC server '
                         'to start.', timeout_seconds)
            ready_test()
            successful = True
        finally:
            if not successful:
                logging.error('Failed to start XMLRPC server.')
                self.xmlrpc_disconnect(port)
    logging.info('XMLRPC server started successfully.')
    return proxy
J. Richard Barnette1d78b012012-05-15 13:56:30 -07001040
def xmlrpc_disconnect(self, port):
    """Disconnect from an XMLRPC server on the host.

    Terminates the remote XMLRPC server previously started for
    the given `port`.  Also closes the local ssh tunnel created
    for the connection to the host.  This function does not
    directly alter the state of a previously returned XMLRPC
    client object; however disconnection will cause all
    subsequent calls to methods on the object to fail.

    This function does nothing if requested to disconnect a port
    that was not previously connected via `self.xmlrpc_connect()`

    The local tunnel is closed and the port is forgotten even when
    the attempt to stop the remote server raises (for instance
    because the host has become unreachable); the exception is then
    passed on to the caller.

    @param port Port number passed to a previous call to
                `xmlrpc_connect()`
    """
    if port not in self._xmlrpc_proxy_map:
        return
    remote_name, tunnel_proc = self._xmlrpc_proxy_map[port]
    try:
        if remote_name:
            # We use 'pkill' to find our target process rather than
            # a PID, because the host may have rebooted since
            # connecting, and we don't want to kill an innocent
            # process with the same PID.
            #
            # 'pkill' helpfully exits with status 1 if no target
            # process is found, for which run() will throw an
            # exception.  We don't want that, so we ignore the
            # status.
            self.run("pkill -f '%s'" % remote_name, ignore_status=True)
    finally:
        # Local cleanup must not depend on the remote command: without
        # this, a failing run() would leave the ssh tunnel running and
        # the stale entry in the map.
        if tunnel_proc.poll() is None:
            tunnel_proc.terminate()
            logging.debug('Terminated tunnel, pid %d', tunnel_proc.pid)
        else:
            logging.debug('Tunnel pid %d terminated early, status %d',
                          tunnel_proc.pid, tunnel_proc.returncode)
        del self._xmlrpc_proxy_map[port]
1081
1082
def xmlrpc_disconnect_all(self):
    """Disconnect all known XMLRPC proxy ports.

    Each port recorded in `_xmlrpc_proxy_map` is passed to
    `xmlrpc_disconnect()`.
    """
    # xmlrpc_disconnect() deletes entries from the map, so iterate
    # over an explicit snapshot of the ports rather than over the
    # dictionary (or a live view of its keys).
    for port in list(self._xmlrpc_proxy_map):
        self.xmlrpc_disconnect(port)
1087
1088
def _ping_check_status(self, status):
    """Ping the host a single time and compare against `status`.

    The host counts as answering when `utils.ping()` returns 0.

    @param status Check the ping status against this value.
    @return True iff `status` and the result of ping are the same
            (i.e. both True or both False).

    """
    ping_exit_code = utils.ping(self.hostname, tries=1, deadline=1)
    host_answered = (ping_exit_code == 0)
    # XOR is true exactly when the two values disagree.
    return not (status ^ host_answered)
1099
1100 def _ping_wait_for_status(self, status, timeout):
1101 """Wait for the host to have a given status (UP or DOWN).
1102
1103 Status is checked by polling. Polling will not last longer
1104 than the number of seconds in `timeout`. The polling
1105 interval will be long enough that only approximately
1106 _PING_WAIT_COUNT polling cycles will be executed, subject
1107 to a maximum interval of about one minute.
1108
1109 @param status Waiting will stop immediately if `ping` of the
1110 host returns this status.
1111 @param timeout Poll for at most this many seconds.
1112 @return True iff the host status from `ping` matched the
1113 requested status at the time of return.
1114
1115 """
1116 # _ping_check_status() takes about 1 second, hence the
1117 # "- 1" in the formula below.
1118 poll_interval = min(int(timeout / self._PING_WAIT_COUNT), 60) - 1
1119 end_time = time.time() + timeout
1120 while time.time() <= end_time:
1121 if self._ping_check_status(status):
1122 return True
1123 if poll_interval > 0:
1124 time.sleep(poll_interval)
1125
1126 # The last thing we did was sleep(poll_interval), so it may
1127 # have been too long since the last `ping`. Check one more
1128 # time, just to be sure.
1129 return self._ping_check_status(status)
1130
def ping_wait_up(self, timeout):
    """Wait until the host answers `ping`.

    N.B.  This method is not a reliable substitute for
    `wait_up()`, because a host that responds to ping will not
    necessarily respond to ssh.  This method should only be used
    if the target DUT can be considered functional even if it
    can't be reached via ssh.

    @param timeout Minimum time to allow before declaring the
                   host to be non-responsive.
    @return True iff the host answered to ping before the timeout.

    """
    wanted_status = self._PING_STATUS_UP
    return self._ping_wait_for_status(wanted_status, timeout)
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07001146
def ping_wait_down(self, timeout):
    """Wait until the host stops answering `ping`.

    This function can be used as a slightly faster version of
    `wait_down()`, by avoiding potentially long ssh timeouts.

    @param timeout Minimum time to allow for the host to become
                   non-responsive.
    @return True iff the host quit answering ping before the
            timeout.

    """
    wanted_status = self._PING_STATUS_DOWN
    return self._ping_wait_for_status(wanted_status, timeout)
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07001160
def test_wait_for_sleep(self):
    """Wait for the client to enter low-power sleep mode.

    The host is considered asleep once it stops answering ping.
    That check can't distinguish a system that is powered off; to
    confirm that the unit was asleep, it is necessary to force
    resume, and then call `test_wait_for_resume()`.

    This function is expected to be called from a test as part
    of a sequence like the following:

    ~~~~~~~~
        boot_id = host.get_boot_id()
        # trigger sleep on the host
        host.test_wait_for_sleep()
        # trigger resume on the host
        host.test_wait_for_resume(boot_id)
    ~~~~~~~~

    @exception TestFail The host did not go to sleep within
                        the allowed time.
    """
    went_down = self.ping_wait_down(timeout=self.SLEEP_TIMEOUT)
    if went_down:
        return
    raise error.TestFail(
        'client failed to sleep after %d seconds' %
        self.SLEEP_TIMEOUT)
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07001187
1188
def test_wait_for_resume(self, old_boot_id):
    """Wait for the client to resume from low-power sleep mode.

    The `old_boot_id` parameter should be the value from
    `get_boot_id()` obtained prior to entering sleep mode.  A
    `TestFail` exception is raised if the boot id changes.

    See @ref test_wait_for_sleep for more on this function's
    usage.

    @param old_boot_id A boot id value obtained before the
                       target host went to sleep.

    @exception TestFail The host did not respond within the
                        allowed time.
    @exception TestFail The host responded, but the boot id test
                        indicated a reboot rather than a sleep
                        cycle.
    """
    if not self.wait_up(timeout=self.RESUME_TIMEOUT):
        raise error.TestFail(
            'client failed to resume from sleep after %d seconds' %
            self.RESUME_TIMEOUT)

    # A changed boot id means the host rebooted instead of resuming.
    current_boot_id = self.get_boot_id()
    if current_boot_id != old_boot_id:
        raise error.TestFail(
            'client rebooted, but sleep was expected'
            ' (old boot %s, new boot %s)'
                % (old_boot_id, current_boot_id))
1219
1220
def test_wait_for_shutdown(self):
    """Wait for the client to shut down.

    The host is considered shut down once it stops answering ping.
    That check can't distinguish a system that is merely asleep; to
    confirm that the unit was down, it is necessary to force boot,
    and then call test_wait_for_boot().

    This function is expected to be called from a test as part
    of a sequence like the following:

    ~~~~~~~~
        boot_id = host.get_boot_id()
        # trigger shutdown on the host
        host.test_wait_for_shutdown()
        # trigger boot on the host
        host.test_wait_for_boot(boot_id)
    ~~~~~~~~

    @exception TestFail The host did not shut down within the
                        allowed time.
    """
    went_down = self.ping_wait_down(timeout=self.SHUTDOWN_TIMEOUT)
    if went_down:
        return
    raise error.TestFail(
        'client failed to shut down after %d seconds' %
        self.SHUTDOWN_TIMEOUT)
J. Richard Barnette134ec2c2012-04-25 12:59:37 -07001246
1247
def test_wait_for_boot(self, old_boot_id=None):
    """Wait for the client to boot from cold power.

    The `old_boot_id` parameter should be the value from
    `get_boot_id()` obtained prior to shutting down.  A
    `TestFail` exception is raised if the boot id does not
    change.  The boot id test is omitted if `old_boot_id` is not
    specified.

    See @ref test_wait_for_shutdown for more on this function's
    usage.

    @param old_boot_id A boot id value obtained before the
                       shut down.

    @exception TestFail The host did not respond within the
                        allowed time.
    @exception TestFail The host responded, but the boot id test
                        indicated that there was no reboot.
    """
    if not self.wait_up(timeout=self.REBOOT_TIMEOUT):
        raise error.TestFail(
            'client failed to reboot after %d seconds' %
            self.REBOOT_TIMEOUT)

    # The boot id is only fetched when there is something to compare
    # it against.
    if old_boot_id and self.get_boot_id() == old_boot_id:
        raise error.TestFail(
            'client is back up, but did not reboot'
            ' (boot %s)' % old_boot_id)
Simran Basid5e5e272012-09-24 15:23:59 -07001277
1278
@staticmethod
def check_for_rpm_support(hostname):
    """For a given hostname, return whether or not it is powered by an RPM.

    The hostname is matched against `SiteHost._RPM_HOSTNAME_REGEX`.

    @param hostname Name of the host to check.
    @return None if this host does not follow the defined naming format
            for RPM powered DUT's in the lab. If it does follow the format,
            it returns a regular expression MatchObject instead.
    """
    naming_pattern = SiteHost._RPM_HOSTNAME_REGEX
    return re.match(naming_pattern, hostname)
Simran Basid5e5e272012-09-24 15:23:59 -07001288
1289
def has_power(self):
    """Report whether this host is powered by an RPM.

    This simply applies `check_for_rpm_support()` to this host's
    hostname.

    @return A truthy regular expression MatchObject if this host's
            name follows the RPM naming format, or None otherwise.
    """
    rpm_match = SiteHost.check_for_rpm_support(self.hostname)
    return rpm_match
1297
1298
def _set_power(self, state, power_method):
    """Set the power state of the host via RPM, Servo or manual.

    @param state Power state to apply to the DUT; 'ON' or 'OFF',
                 compared case-insensitively.
    @param power_method Specifies which method of power control to
                        use.  `POWER_CONTROL_SERVO` and
                        `POWER_CONTROL_MANUAL` select servo and
                        manual control; any other value is handled
                        through the RPM.

    @exception TestError `state` is not one of the accepted states.
    @exception TestFail RPM control was requested but `has_power()`
                        reports no RPM for this host.
    """
    valid_states = ['ON', 'OFF']
    if state.upper() not in valid_states:
        raise error.TestError('State must be one of: %s.'
                              % (valid_states,))

    if power_method == self.POWER_CONTROL_SERVO:
        logging.info('Setting servo port J10 to %s', state)
        self.servo.set('prtctl3_pwren', state.lower())
        time.sleep(self._USB_POWER_TIMEOUT)
        return

    if power_method == self.POWER_CONTROL_MANUAL:
        # Nothing is switched here; just leave time for a person to
        # change the AC power by hand.
        logging.info('You have %d seconds to set the AC power to %s.',
                     self._POWER_CYCLE_TIMEOUT, state)
        time.sleep(self._POWER_CYCLE_TIMEOUT)
        return

    # Everything else goes through the RPM.
    if not self.has_power():
        raise error.TestFail('DUT does not have RPM connected.')
    # Record on the host that its RPM outlet was changed before
    # actually switching the outlet.
    afe = frontend_wrappers.RetryingAFE(timeout_min=5, delay_sec=10)
    afe.set_host_attribute(self._RPM_OUTLET_CHANGED, True,
                           hostname=self.hostname)
    rpm_client.set_power(self.hostname, state.upper())
Simran Basid5e5e272012-09-24 15:23:59 -07001329
1330
def power_off(self, power_method=POWER_CONTROL_RPM):
    """Switch power to this host off via RPM, Servo or manual.

    Delegates to `_set_power()` with the state 'OFF'.

    @param power_method Specifies which method of power control to
                        use.  By default "RPM" will be used.  Valid
                        values are the strings "RPM", "manual",
                        "servoj10".
    """
    self._set_power('OFF', power_method=power_method)
Simran Basid5e5e272012-09-24 15:23:59 -07001340
1341
def power_on(self, power_method=POWER_CONTROL_RPM):
    """Switch power to this host on via RPM, Servo or manual.

    Delegates to `_set_power()` with the state 'ON'.

    @param power_method Specifies which method of power control to
                        use.  By default "RPM" will be used.  Valid
                        values are the strings "RPM", "manual",
                        "servoj10".
    """
    self._set_power('ON', power_method=power_method)
1351
1352
def power_cycle(self, power_method=POWER_CONTROL_RPM):
    """Power cycle this host: turn it OFF, then back ON.

    For servo and manual control the cycle is done as `power_off()`,
    a pause of `_POWER_CYCLE_TIMEOUT` seconds, then `power_on()`.
    For any other method a single 'CYCLE' request is sent to the
    RPM.

    @param power_method Specifies which method of power control to
                        use.  By default "RPM" will be used.  Valid
                        values are the strings "RPM", "manual",
                        "servoj10".
    """
    stepwise_methods = (self.POWER_CONTROL_SERVO,
                        self.POWER_CONTROL_MANUAL)
    if power_method not in stepwise_methods:
        rpm_client.set_power(self.hostname, 'CYCLE')
        return

    self.power_off(power_method=power_method)
    time.sleep(self._POWER_CYCLE_TIMEOUT)
    self.power_on(power_method=power_method)
Simran Basic6f1f7a2012-10-16 10:47:46 -07001368
1369
def get_platform(self):
    """Work out the platform label for this host from its fwid.

    @returns a string representing this host's platform.
    """
    crossystem = utils.Crossystem(self)
    crossystem.init()
    # The fwid generally looks like {platform}.{firmware version},
    # e.g. Alex.X.YYY.Z or Google_Alex.X.YYY.Z; the part before the
    # first '.' is used as the platform id.
    fwid = crossystem.fwid()
    platform_id = fwid.split('.', 1)[0].lower()
    # Newer platforms carry a 'Google_' prefix that older ones lack;
    # drop it so both produce the same label.
    return platform_id.replace('google_', '')
1383
1384
@label_decorator()
def get_board(self):
    """Work out the board label for this host.

    The board name is read from CHROMEOS_RELEASE_BOARD in the DUT's
    /etc/lsb-release and prefixed with `ds_constants.BOARD_PREFIX`.

    @returns a string representing this host's board.
    """
    release_info = utils.parse_cmd_output('cat /etc/lsb-release',
                                          run_method=self.run)
    board = release_info['CHROMEOS_RELEASE_BOARD']
    board_format_string = ds_constants.BOARD_PREFIX + '%s'
    # Lab devices generally report the plain board name, while
    # development devices report {board_name}-signed-{key_type}.
    # Names containing 'x86' (e.g. an 'x86-' prefix) need their first
    # two dash-separated fields kept; all others only the first.
    fields = board.split('-')
    kept_fields = 2 if 'x86' in board else 1
    return board_format_string % '-'.join(fields[:kept_fields])
Simran Basic6f1f7a2012-10-16 10:47:46 -07001401
1402
@label_decorator('lightsensor')
def has_lightsensor(self):
    """Determine whether this host should get the lightsensor label.

    Searches `_LIGHTSENSOR_SEARCH_DIR` on the DUT for any of the
    names in `_LIGHTSENSOR_FILES`.

    @returns the string 'lightsensor' if this host has a lightsensor or
             None if it does not.
    """
    file_pattern = '|'.join(self._LIGHTSENSOR_FILES)
    search_cmd = "find -L %s -maxdepth 4 | egrep '%s'" % (
            self._LIGHTSENSOR_SEARCH_DIR, file_pattern)
    try:
        # find follows symlinks (-L).  stderr_tee is None because a
        # symlink loop only adds a few messages on stderr; the command
        # still executes correctly.
        self.run(search_cmd, stdout_tee=None, stderr_tee=None)
    except error.AutoservRunError:
        # egrep exited with a return code of 1 meaning none of the
        # possible lightsensor files existed.
        return None
    return 'lightsensor'
1422
1423
@label_decorator('bluetooth')
def has_bluetooth(self):
    """Determine whether this host should get the bluetooth label.

    Checks on the DUT whether the directory
    /sys/class/bluetooth/hci0 exists.

    @returns the string 'bluetooth' if this host has bluetooth or
             None if it does not.
    """
    try:
        self.run('test -d /sys/class/bluetooth/hci0')
    except error.AutoservRunError:
        # test exited with a return code 1 meaning the directory did
        # not exist.
        return None
    # test exited with a return code of 0.
    return 'bluetooth'
1439
1440
def get_labels(self):
    """Collect every automatic label that applies to this host.

    Each function in `_LABEL_FUNCTIONS` is called with this host, in
    order; results that are falsy (e.g. None) are dropped.

    @returns a list of the labels produced by the label functions.
    """
    candidates = [label_function(self)
                  for label_function in self._LABEL_FUNCTIONS]
    return [label for label in candidates if label]