blob: 52f963d259832b07433c8e6a3b9490c95a43ab1c [file] [log] [blame]
Fang Deng5d518f42013-08-02 14:04:32 -07001# Copyright (c) 2013 The Chromium OS Authors. All rights reserved.
2# Use of this source code is governed by a BSD-style license that can be
3# found in the LICENSE file.
4#
5# Expects to be run in an environment with sudo and no interactive password
6# prompt, such as within the Chromium OS development chroot.
7
8
9"""This file provides core logic for servo verify/repair process."""
10
11
Fang Deng5d518f42013-08-02 14:04:32 -070012import logging
Raul E Rangel52ca2e82018-07-03 14:10:14 -060013import os
Ruben Rodriguez Buchillon93084d02020-01-21 15:17:36 -080014import re
15import tarfile
Garry Wangc1288cf2019-12-17 14:58:00 -080016import time
Gregory Nisbet265a52c2019-12-10 20:38:42 -080017import traceback
Dana Goyette4dc0adc2019-05-06 14:51:53 -070018import xmlrpclib
Fang Deng5d518f42013-08-02 14:04:32 -070019
20from autotest_lib.client.bin import utils
Garry Wang79e9af62019-06-12 15:19:19 -070021from autotest_lib.client.common_lib import error
Richard Barnette9a26ad62016-06-10 12:03:08 -070022from autotest_lib.client.common_lib import hosts
Garry Wang7b0e1b72020-03-25 19:08:59 -070023from autotest_lib.client.common_lib import lsbrelease_utils
Fang Deng5d518f42013-08-02 14:04:32 -070024from autotest_lib.client.common_lib.cros import retry
Christopher Wileycef1f902014-06-19 11:11:23 -070025from autotest_lib.client.common_lib.cros.network import ping_runner
Richard Barnette9a26ad62016-06-10 12:03:08 -070026from autotest_lib.server.cros.servo import servo
Richard Barnetted31580e2018-05-14 19:58:00 +000027from autotest_lib.server.hosts import servo_repair
Garry Wangebc015b2019-06-06 17:45:06 -070028from autotest_lib.server.hosts import base_servohost
Garry Wang11b5e872020-03-11 15:14:08 -070029from autotest_lib.server.hosts import servo_constants
Otabek Kasimov4ea636e2020-04-14 23:35:06 -070030from autotest_lib.server.cros.faft.utils import config
Garry Wang11b5e872020-03-11 15:14:08 -070031from autotest_lib.client.common_lib import global_config
Garry Wangd7367482020-02-27 13:52:40 -080032
Otabek Kasimov15963492020-06-23 21:10:51 -070033try:
34 from chromite.lib import metrics
35except ImportError:
36 metrics = utils.metrics_mock
37
Dan Shi3b2adf62015-09-02 17:46:54 -070038_CONFIG = global_config.global_config
Fang Deng5d518f42013-08-02 14:04:32 -070039
Otabek Kasimova7ba91a2020-03-09 08:31:01 -070040
Garry Wangebc015b2019-06-06 17:45:06 -070041class ServoHost(base_servohost.BaseServoHost):
42 """Host class for a servo host(e.g. beaglebone, labstation)
Dana Goyette0b6e6402019-10-04 11:09:24 -070043 that with a servo instance for a specific port.
44
45 @type _servo: servo.Servo | None
46 """
Fang Deng5d518f42013-08-02 14:04:32 -070047
Raul E Rangel52ca2e82018-07-03 14:10:14 -060048 DEFAULT_PORT = int(os.getenv('SERVOD_PORT', '9999'))
Richard Barnette9a26ad62016-06-10 12:03:08 -070049
Dan Shie5b3c512014-08-21 12:12:09 -070050 # Timeout for initializing servo signals.
Wai-Hong Tam37b6ed32017-09-19 15:52:39 -070051 INITIALIZE_SERVO_TIMEOUT_SECS = 60
Richard Barnette9a26ad62016-06-10 12:03:08 -070052
xixuan6cf6d2f2016-01-29 15:29:00 -080053 # Ready test function
54 SERVO_READY_METHOD = 'get_version'
Fang Deng5d518f42013-08-02 14:04:32 -070055
Ruben Rodriguez Buchillon93084d02020-01-21 15:17:36 -080056 # Directory prefix on the servo host where the servod logs are stored.
57 SERVOD_LOG_PREFIX = '/var/log/servod'
58
59 # Exit code to use when symlinks for servod logs are not found.
60 NO_SYMLINKS_CODE = 9
61
62 # Directory in the job's results directory to dump the logs into.
63 LOG_DIR = 'servod'
64
65 # Prefix for joint loglevel files in the logs.
66 JOINT_LOG_PREFIX = 'log'
67
68 # Regex group to extract timestamp from logfile name.
69 TS_GROUP = 'ts'
70
71 # This regex is used to extract the timestamp from servod logs.
72 # files always start with log.
73 TS_RE = (r'log.'
74 # The timestamp is of format %Y-%m-%d--%H-%M-%S.MS
75 r'(?P<%s>\d{4}(\-\d{2}){2}\-(-\d{2}){3}.\d{3})'
76 # The loglevel is optional depending on labstation version.
77 r'(.(INFO|DEBUG|WARNING))?' % TS_GROUP)
78 TS_EXTRACTOR = re.compile(TS_RE)
79
80 # Regex group to extract MCU name from logline in servod logs.
81 MCU_GROUP = 'mcu'
82
83 # Regex group to extract logline from MCU logline in servod logs.
84 LINE_GROUP = 'line'
85
86 # This regex is used to extract the mcu and the line content from an
87 # MCU logline in servod logs. e.g. EC or servo_v4 console logs.
88 # Here is an example log-line:
89 #
90 # 2020-01-23 13:15:12,223 - servo_v4 - EC3PO.Console - DEBUG -
91 # console.py:219:LogConsoleOutput - /dev/pts/9 - cc polarity: cc1
92 #
93 # Here is conceptually how they are formatted:
94 #
95 # <time> - <MCU> - EC3PO.Console - <LVL> - <file:line:func> - <pts> -
96 # <output>
97 #
98 # The log format starts with a timestamp
99 MCU_RE = (r'[\d\-]+ [\d:,]+ '
100 # The mcu that is logging this is next.
101 r'- (?P<%s>\w+) - '
102 # Next, we have more log outputs before the actual line.
103 # Information about the file line, logging function etc.
104 # Anchor on EC3PO Console, LogConsoleOutput and dev/pts.
105 # NOTE: if the log format changes, this regex needs to be
106 # adjusted.
107 r'EC3PO\.Console[\s\-\w\d:.]+LogConsoleOutput - /dev/pts/\d+ - '
108 # Lastly, we get the MCU's console line.
109 r'(?P<%s>.+$)' % (MCU_GROUP, LINE_GROUP))
110 MCU_EXTRACTOR = re.compile(MCU_RE)
111
112 # Suffix to identify compressed logfiles.
113 COMPRESSION_SUFFIX = '.tbz2'
114
Ruben Rodriguez Buchillon5bac3062020-03-25 21:32:58 -0700115 # A suffix to mark servod log directories that came from instance that
116 # ran during this servo_host, but are not the last one running e.g. when
117 # an instance (on purpose, or due to a bug) restarted in the middle of the
118 # run.
119 OLD_LOG_SUFFIX = 'old'
120
Otabek Kasimov15963492020-06-23 21:10:51 -0700121 # States of verifiers
122 # True - verifier run and passed
123 # False - verifier run and failed
124 # None - verifier did not run or dependency failed
125 VERIFY_SUCCESS = True
126 VERIFY_FAILED = False
127 VERIFY_NOT_RUN = None
128
Otabek Kasimovcc9738e2020-02-14 16:17:15 -0800129 def _init_attributes(self):
130 self._servo_state = None
131 self.servo_port = None
132 self.servo_board = None
133 self.servo_model = None
134 self.servo_serial = None
Garry Wang000c6c02020-05-11 21:27:23 -0700135 # The flag that indicate if a servo is connected to a smart usbhub.
136 # TODO(xianuowang@) remove this flag once all usbhubs in the lab
137 # get replaced.
138 self.smart_usbhub = None
Otabek Kasimovcc9738e2020-02-14 16:17:15 -0800139 self._servo = None
140 self._servod_server_proxy = None
Ruben Rodriguez Buchillon5bac3062020-03-25 21:32:58 -0700141 self._initial_instance_ts = None
Ruben Rodriguez Buchillon93084d02020-01-21 15:17:36 -0800142 # Flag to make sure that multiple calls to close do not result in the
143 # logic executing multiple times.
144 self._closed = False
Fang Deng5d518f42013-08-02 14:04:32 -0700145
def _initialize(self, servo_host='localhost',
                servo_port=DEFAULT_PORT, servo_board=None,
                servo_model=None, servo_serial=None, is_in_lab=None,
                *args, **dargs):
    """Initialize a ServoHost instance.

    A ServoHost instance represents a host that controls a servo.

    @param servo_host: Name of the host where the servod process
                       is running.
    @param servo_port: Port the servod process is listening on. Defaults
                       to the SERVOD_PORT environment variable if set,
                       otherwise 9999.
    @param servo_board: Board that the servo is connected to.
    @param servo_model: Model that the servo is connected to.
    @param servo_serial: Serial of the servo, stored on the instance.
    @param is_in_lab: True if the servo host is in Cros Lab. Default is set
                      to None, for which utils.host_is_in_lab_zone will be
                      called to check if the servo host is in Cros lab.
    """
    super(ServoHost, self)._initialize(hostname=servo_host,
                                       is_in_lab=is_in_lab, *args, **dargs)
    self._init_attributes()
    port = int(servo_port)
    self.servo_port = port
    self.servo_board = servo_board
    self.servo_model = servo_model
    self.servo_serial = servo_serial

    # The location of the log files on the servo host for this instance.
    self.remote_log_dir = '%s_%s' % (self.SERVOD_LOG_PREFIX, port)

    # The lock file and the reboot request file share a per-port stem.
    temp_file_stem = self.TEMP_FILE_DIR + str(port)
    # Path of the servo host lock file.
    self._lock_file = temp_file_stem + self.LOCK_FILE_POSTFIX
    # File path to declare a reboot request.
    self._reboot_file = temp_file_stem + self.REBOOT_FILE_POSTFIX

    # Lock the servo host if it's an in-lab labstation to prevent other
    # task to reboot it until current task completes. We also wait and
    # make sure the labstation is up here, in the case of the labstation is
    # in the middle of reboot.
    self._is_locked = False
    if self.wait_up(self.REBOOT_TIMEOUT):
        if self.is_in_lab() and self.is_labstation():
            self._lock()

    self._repair_strategy = servo_repair.create_servo_repair_strategy()
Richard Barnettee519dcd2016-08-15 17:37:17 -0700195
Dana Goyetteafa62fd2020-03-16 13:45:27 -0700196 def __str__(self):
197 return "<%s '%s:%s'>" % (
198 type(self).__name__, self.hostname, self.servo_port)
199
def connect_servo(self):
    """Initialize and setup servo for later use.

    Runs initilize_servo() first and initialize_dut_for_servo() second.
    """
    self.initilize_servo()
    self.initialize_dut_for_servo()
205
206
def initilize_servo(self):
    """Establish a connection to the servod server on this host.

    Initializes `self._servo` and then verifies that all network
    connections are working. This will create an ssh tunnel if
    it's required.
    """
    serial = self.servo_serial
    self._servo = servo.Servo(servo_host=self, servo_serial=serial)
Richard Barnette9a26ad62016-06-10 12:03:08 -0700216
Garry Wang8c8dc972020-06-09 13:41:51 -0700217
def initialize_dut_for_servo(self):
    """This method will do some setup for dut control, e.g. setup
    main servo_v4 device, and also testing the connection between servo
    and DUT. As a side effect of testing the connection, all signals on
    the target servo are reset to default values, and the USB stick is
    set to the neutral (off) position.

    @raises: AutoservVerifyError if `self._servo` is not set yet, or if
             the initialize_dut call is reported as timed out.
    """
    servo_object = self._servo
    if not servo_object:
        raise hosts.AutoservVerifyError('Servo object needs to be'
                                        ' initialized before initialize'
                                        ' DUT.')
    # retry.timeout() hands back a (timed out, result) pair; only the
    # first element matters here.
    timed_out, _unused_result = retry.timeout(
            self._servo.initialize_dut,
            timeout_sec=self.INITIALIZE_SERVO_TIMEOUT_SECS)
    if timed_out:
        raise hosts.AutoservVerifyError('Initialize dut for servo timed'
                                        ' out.')
Richard Barnette9a26ad62016-06-10 12:03:08 -0700235
236
def disconnect_servo(self):
    """Disconnect our servo if it exists.

    If we've previously successfully connected to our servo,
    disconnect any established ssh tunnel, and set `self._servo`
    back to `None`.
    """
    if not self._servo:
        return
    # N.B. This call is safe even without a tunnel:
    # rpc_server_tracker.disconnect() silently ignores
    # unknown ports.
    self.rpc_server_tracker.disconnect(self.servo_port)
    self._servo = None
Fang Deng5d518f42013-08-02 14:04:32 -0700250
Garry Wangc1288cf2019-12-17 14:58:00 -0800251
def _create_servod_server_proxy(self):
    """Create a proxy that can be used to communicate with servod server.

    Goes through rpc_server_tracker when ssh tunnelling is enabled and the
    host is not localhost; otherwise talks to servod directly over http.

    @returns: An xmlrpclib.ServerProxy that is connected to the servod
              server on the host.
    """
    use_tunnel = (servo_constants.ENABLE_SSH_TUNNEL_FOR_SERVO
                  and not self.is_localhost())
    if not use_tunnel:
        remote = 'http://%s:%s' % (self.hostname, self.servo_port)
        return xmlrpclib.ServerProxy(remote)

    return self.rpc_server_tracker.xmlrpc_connect(
            None, self.servo_port,
            ready_test_name=self.SERVO_READY_METHOD,
            timeout_seconds=60,
            request_timeout_seconds=3600,
            server_desc=str(self))
Fang Deng5d518f42013-08-02 14:04:32 -0700269
270
def get_servod_server_proxy(self):
    """Return a cached proxy if exists; otherwise, create a new one.

    @returns: An xmlrpclib.ServerProxy that is connected to the servod
              server on the host.
    """
    # Single-threaded execution, no race
    proxy = self._servod_server_proxy
    if proxy is None:
        proxy = self._create_servod_server_proxy()
        self._servod_server_proxy = proxy
    return proxy
281
282
def verify(self, silent=False):
    """Update the servo host and verify it's in a good state.

    Records the resulting servo state; a failure is only re-raised when
    `_is_critical_error` judges it critical.

    @param silent   If true, suppress logging in `status.log`.
    """
    start_message = ('Beginning verify for servo host %s port %s serial %s'
                     % (self.hostname, self.servo_port, self.servo_serial))
    self.record('INFO', None, None, start_message)
    try:
        self._repair_strategy.verify(self, silent)
        self._servo_state = servo_constants.SERVO_STATE_WORKING
        self.record('INFO', None, None,
                    'ServoHost verify set servo_state as WORKING')
    except Exception as verify_error:
        self._servo_state = self.determine_servo_state()
        state_message = ('ServoHost verify set servo_state as %s'
                         % self._servo_state)
        self.record('INFO', None, None, state_message)
        if self._is_critical_error(verify_error):
            raise
Fang Deng5d518f42013-08-02 14:04:32 -0700303
304
def get_image_name_from_usbkey(self, usbkey_dev):
    """Mount usb drive and check ChromeOS image name on it if there is
    one. This method assumes the image_usbkey_direction is already set
    to servo side.

    @param: usbkey_dev  usbkey dev path(e.g. /dev/sdb).

    @returns: image_name on the usbkey, e.g. nami-release/R82.10138.0.0,
              or empty string if no test image detected, or unexpected
              error occurred.
    """
    logging.info('Checking ChromeOS image name on usbkey.')
    mount_point = '/media/servo_usb/%s' % self.servo_port
    umount = 'umount %s' % mount_point
    # Unmount if there is an existing stale mount.
    self.run(umount, ignore_status=True)
    # Create if the mount point is not existing.
    self.run('mkdir -p %s' % mount_point)
    try:
        # Attempt to mount the usb drive; ChromeOS root fs is in /dev/sdx3.
        mounted = self.run('mount -o ro %s3 %s' % (usbkey_dev, mount_point),
                           ignore_status=True)
        if mounted.exit_status != 0:
            logging.error('Unexpected error occurred on mount usb drive.')
            return ''

        lsb_output = self.run('cat %s/etc/lsb-release' % mount_point,
                              ignore_status=True)
        release_content = lsb_output.stdout.strip()

        if re.search(r'RELEASE_TRACK=.*test', release_content):
            return lsbrelease_utils.get_chromeos_release_builder_path(
                    lsb_release_content=release_content)

        logging.info('The image on usbkey is not a test image')
        return ''
    finally:
        # Runs on every exit path so the drive never stays mounted.
        logging.debug('Image check compeleted, unmounting the usb drive.')
        self.run(umount, ignore_status=True)
345
346
Garry Wang70e5d062020-04-03 18:01:05 -0700347 def _probe_and_validate_usb_dev(self):
348 """This method probe the usb dev path by talking to servo, and then
349 validate the dev path is valid block device to servohost.
350 Possible output:
351 1. Encounter error during probe usb dev, returns empty string.
352 2. probe usb dev completed without error but cannot find usb dev,
353 raise AutoservRepairError.
354 3. probe usb dev find a usb dev path, but failed validation in this
355 method, raise AutoservRepairError.
Garry Wang7b0e1b72020-03-25 19:08:59 -0700356
Garry Wang70e5d062020-04-03 18:01:05 -0700357 @returns: A string of usb dev path(e.g. '/dev/sdb'), or empty string
358 if unexpected error occurred during probe.
359 @raises: AutoservRepairError if servo couldn't probe the usb dev path
360 (servo.probe_host_usb_dev() returns empty string), or the dev path is
361 not valid block device to servohost.
Garry Wang7b0e1b72020-03-25 19:08:59 -0700362 """
363 logging.info('Validating image usbkey on servo.')
Garry Wang7b0e1b72020-03-25 19:08:59 -0700364 try:
Garry Wang70e5d062020-04-03 18:01:05 -0700365 usb_dev = self._servo.probe_host_usb_dev()
Garry Wang7b0e1b72020-03-25 19:08:59 -0700366 except Exception as e:
367 # We don't want any unexpected or transient servo communicating
368 # failure block usb repair, so capture all errors here.
369 logging.error(e, exc_info=True)
370 logging.error('Unexpected error occurred on get usbkey dev path,'
371 ' skipping usbkey validation.')
372 return ''
373
Garry Wang70e5d062020-04-03 18:01:05 -0700374 if usb_dev:
375 # probe_host_usb_dev() sometimes return stale record,
376 # so we need to make sure the path exists in fdisk.
377 validate_cmd = 'fdisk -l | grep %s' % usb_dev
Garry Wang11441182020-06-16 18:34:14 -0700378 try:
379 resp = self.run(validate_cmd, ignore_status=True, timeout=60)
380 if resp.exit_status == 0:
381 return usb_dev
Garry Wang70e5d062020-04-03 18:01:05 -0700382
Garry Wang11441182020-06-16 18:34:14 -0700383 logging.error('%s is reported from "image_usbkey_dev" control'
384 ' but not detected by fdisk!', usb_dev)
385 except error.AutoservRunError as e:
386 if 'Timeout encountered' in str(e):
387 logging.warning('Timeout encountered during fdisk run,'
388 ' skipping usbkey validation.')
389 return ''
390 raise
Garry Wang70e5d062020-04-03 18:01:05 -0700391
392 raise hosts.AutoservRepairError(
393 'No usbkey detected on servo, the usbkey may be either missing'
394 ' or broken. Please replace usbkey on the servo and retry.',
395 'missing usbkey')
396
397
def is_ec_supported(self):
    """Check if ec is supported on the servo_board.

    @returns: The `chrome_ec` value of the firmware config for the board
              and model; False when no board is set or reading the
              config fails.
    """
    if not self.servo_board:
        return False
    try:
        return config.Config(self.servo_board, self.servo_model).chrome_ec
    except Exception as config_error:
        logging.error('Unexpected error when read from firmware'
                      ' configs; %s', str(config_error))
        return False
408
def validate_image_usbkey(self):
    """This method first validate if there is a recover usbkey on servo
    that accessible to servohost, and second check if a ChromeOS image is
    already on the usb drive and return the image_name so we can avoid
    unnecessary download and flash to the recover usbkey on servo.

    Please note that, there is special error handling logic here:
    1. If unexpected error happens, we return empty string. So repair
       actions will not get blocked.
    2. If no working usbkey present on servo, but no errors, we'll raise
       AutoservRepairError here.

    @returns: image_name on the usbkey, e.g. nami-release/R82.10138.0.0,
              or empty string if no test image detected, or unexpected
              error occurred.
    @raises:  AutoservRepairError if the usbkey is not detected on servo.
    """
    dev_path = self._probe_and_validate_usb_dev()
    if not dev_path:
        return ''
    return self.get_image_name_from_usbkey(dev_path)
Garry Wang7b0e1b72020-03-25 19:08:59 -0700431
432
def repair(self, silent=False):
    """Attempt to repair servo host.

    Records the resulting servo state. When the failure is judged
    critical the servo is disconnected, servod is stopped and the
    failure is re-raised.

    @param silent   If true, suppress logging in `status.log`.
    """
    start_message = ('Beginning repair for servo host %s port %s serial %s'
                     % (self.hostname, self.servo_port, self.servo_serial))
    self.record('INFO', None, None, start_message)
    try:
        self._repair_strategy.repair(self, silent)
        self._servo_state = servo_constants.SERVO_STATE_WORKING
        self.record('INFO', None, None,
                    'ServoHost repair set servo_state as WORKING')
        # If target is a labstation then try to withdraw any existing
        # reboot request created by this servo because it passed repair.
        if self.is_labstation():
            self.withdraw_reboot_request()
    except Exception as repair_error:
        self._servo_state = self.determine_servo_state()
        state_message = ('ServoHost repair set servo_state as %s'
                         % self._servo_state)
        self.record('INFO', None, None, state_message)
        if self._is_critical_error(repair_error):
            self.disconnect_servo()
            self.stop_servod()
            raise
459
460
def _is_critical_error(self, error):
    """Decide whether a verify/repair failure is critical.

    @param error: The exception caught during verify or repair.

    @returns: False only for an AutoservVerifyDependencyError whose
              is_critical() is false; True for anything else.
    """
    non_critical = (isinstance(error, hosts.AutoservVerifyDependencyError)
                    and not error.is_critical())
    if not non_critical:
        logging.info('Critical verify failure(s) detected during repair/verify'
                     ' servo. Disconnecting servo and stop servod, all repair '
                     'action and tests that depends on servo will not run.')
        return True

    logging.warning('Non-critical verify failure(s) detected during'
                    ' verify/repair servo, servo connection will'
                    ' still up but may not fully functional.'
                    ' Some repair actions and servo depended'
                    ' tests may not run.')
    return False
Fang Deng5d518f42013-08-02 14:04:32 -0700474
475
def get_servo(self):
    """Return whatever is currently cached in `self._servo`.

    @return: a servo.Servo object.
    @rtype: autotest_lib.server.cros.servo.servo.Servo
    """
    cached_servo = self._servo
    return cached_servo
483
484
def request_reboot(self):
    """Request servohost to be rebooted when it's safe to by touch a file.

    The file touched is `self._reboot_file`; the command's exit status is
    ignored.
    """
    logging.debug('Request to reboot servohost %s has been created by '
                  'servo with port # %s', self.hostname, self.servo_port)
    touch_cmd = 'touch %s' % self._reboot_file
    self.run(touch_cmd, ignore_status=True)
491
492
def withdraw_reboot_request(self):
    """Withdraw a servohost reboot request if exists by remove the flag
    file.

    The file removed is `self._reboot_file`; the command's exit status is
    ignored.
    """
    logging.debug('Withdrawing request to reboot servohost %s that created'
                  ' by servo with port # %s if exists.',
                  self.hostname, self.servo_port)
    remove_cmd = 'rm -f %s' % self._reboot_file
    self.run(remove_cmd, ignore_status=True)
501
502
def start_servod(self, quick_startup=False):
    """Start the servod process on servohost.

    Does nothing when the servohost is localhost.

    @param quick_startup: If true, wait SERVOD_QUICK_STARTUP_TIMEOUT after
                          starting servod instead of SERVOD_STARTUP_TIMEOUT.
    """
    # Skip if running on the localhost.(crbug.com/1038168)
    if self.is_localhost():
        logging.debug("Servohost is a localhost, skipping start servod.")
        return

    # Collect the command pieces and join them with spaces at the end.
    cmd_parts = ['start servod']
    if self.servo_board:
        cmd_parts.append('BOARD=%s' % self.servo_board)
        if self.servo_model:
            cmd_parts.append('MODEL=%s' % self.servo_model)
    else:
        logging.warning('Board for DUT is unknown; starting servod'
                        ' assuming a pre-configured board.')

    cmd_parts.append('PORT=%d' % self.servo_port)
    if self.servo_serial:
        cmd_parts.append('SERIAL=%s' % self.servo_serial)

    # Start servod with dual_v4 if the DUT/servo from designated pools.
    dut_host_info = self.get_dut_host_info()
    if dut_host_info and (dut_host_info.pools &
                          servo_constants.POOLS_SUPPORT_DUAL_V4):
        logging.debug('The DUT is detected in following designated'
                      ' pools %s,starting servod with DUAL_V4 option.',
                      servo_constants.POOLS_SUPPORT_DUAL_V4)
        cmd_parts.append('DUAL_V4=1')

    # Remove the symbolic links from the logs. This helps ensure that
    # a failed servod instantiation does not cause us to grab old logs
    # by mistake.
    self.remove_latest_log_symlinks()
    self.run(' '.join(cmd_parts), timeout=60)

    # There's a lag between when `start servod` completes and when
    # the _ServodConnectionVerifier trigger can actually succeed.
    # The call to time.sleep() below gives time to make sure that
    # the trigger won't fail after we return.

    # Normally servod on servo_v3 and labstation take ~10 seconds to ready,
    # But in the rare case all servo on a labstation are in heavy use they
    # may take ~30 seconds. So the timeout value will double these value,
    # and we'll try quick start up when first time initialize servohost,
    # and use standard start up timeout in repair.
    timeout = (servo_constants.SERVOD_QUICK_STARTUP_TIMEOUT
               if quick_startup
               else servo_constants.SERVOD_STARTUP_TIMEOUT)
    logging.debug('Wait %s seconds for servod process fully up.', timeout)
    time.sleep(timeout)
    # Cache the initial instance timestamp to check against servod restarts
    self._initial_instance_ts = self.get_instance_logs_ts()
Garry Wangc1288cf2019-12-17 14:58:00 -0800558
559
def stop_servod(self):
    """Stop the servod process on servohost.

    Does nothing when the servohost is localhost. Otherwise issues the
    stop command (exit status ignored) and then sleeps for
    SERVOD_TEARDOWN_TIMEOUT.
    """
    # Skip if running on the localhost.(crbug.com/1038168)
    if self.is_localhost():
        logging.debug("Servohost is a localhost, skipping stop servod.")
        return

    logging.debug('Stopping servod on port %s', self.servo_port)
    stop_cmd = 'stop servod PORT=%d' % self.servo_port
    self.run(stop_cmd, timeout=60, ignore_status=True)
    logging.debug('Wait %s seconds for servod process fully teardown.',
                  servo_constants.SERVOD_TEARDOWN_TIMEOUT)
    time.sleep(servo_constants.SERVOD_TEARDOWN_TIMEOUT)
Garry Wangc1288cf2019-12-17 14:58:00 -0800574
575
def restart_servod(self, quick_startup=False):
    """Restart the servod process on servohost.

    Stops servod, then starts it again.

    @param quick_startup: Passed through to start_servod().
    """
    self.stop_servod()
    self.start_servod(quick_startup)
581
Garry Wang11b5e872020-03-11 15:14:08 -0700582
def _process_servodtool_error(self, response):
    """Helper function to handle non-zero servodtool response.

    Matches the response's stdout against the known error patterns and
    logs accordingly.

    @param response: Result object of the failed command; only its
                     `stdout` is inspected.
    """
    output = response.stdout
    if re.search(servo_constants.ERROR_MESSAGE_USB_HUB_NOT_COMPATIBLE,
                 output):
        logging.error('The servo is not plugged on a usb hub that supports'
                      ' power-cycle!')
        # change the flag so we can update this label in later process.
        self.smart_usbhub = False
    elif re.search(servo_constants.ERROR_MESSAGE_DEVICE_NOT_FOUND %
                   self.servo_serial, output):
        logging.error('No servo with serial %s found!', self.servo_serial)
    else:
        logging.error('Unexpected error occurred from usbhub control, please'
                      ' file a bug and inform chrome-fleet-software@ team!')
601
602
603 def _get_servo_usb_devnum(self):
604 """Helper function to collect current usb devnum of servo.
605 """
Otabek Kasimov09192682020-06-01 18:17:44 -0700606 # TODO remove try-except when fix crbug.com/1087964
607 try:
608 cmd = 'servodtool device -s %s usb-path' % self.servo_serial
609 resp = self.run(cmd, ignore_status=True, timeout=30)
610 except Exception as e:
611 # Here we catch only timeout errors.
612 # Other errors is filtered by ignore_status=True
613 logging.debug('Attempt to get servo usb-path failed due to '
614 'timeout; %s', e)
615 return ''
616
Garry Wangffbd2162020-04-17 16:13:48 -0700617 if resp.exit_status != 0:
618 self._process_servodtool_error(resp)
619 return ''
620 usb_path = resp.stdout.strip()
621 logging.info('Usb path of servo %s is %s', self.servo_serial, usb_path)
622
623 resp = self.run('cat %s/devnum' % usb_path,
624 ignore_status=True)
625 if resp.exit_status != 0:
626 self._process_servodtool_error(resp)
627 return ''
628 return resp.stdout.strip()
629
630
def _reset_servo(self):
    """Power-cycle the servo with servodtool and wait for it to return.

    On success the |smart_usbhub| flag is set to True so the label can be
    updated later in the process.

    @returns: bool, True if the power-cycle command succeeded and the wait
              completed; False if the command raised or exited non-zero.
    """
    logging.info('Resetting servo through smart usbhub.')
    # TODO remove try-except when fix crbug.com/1087964
    try:
        power_cycle_cmd = ('servodtool device -s %s power-cycle'
                           % self.servo_serial)
        outcome = self.run(power_cycle_cmd, ignore_status=True, timeout=30)
        if outcome.exit_status != 0:
            self._process_servodtool_error(outcome)
            return False
    except Exception as e:
        # Here we catch only timeout errors.
        # Other errors is filtered by ignore_status=True
        logging.debug('Attempt to reset servo failed due to timeout;'
                      ' %s', e)
        return False

    logging.debug('Wait %s seconds for servo to come back from reset.',
                  servo_constants.SERVO_RESET_TIMEOUT_SECONDS)
    time.sleep(servo_constants.SERVO_RESET_TIMEOUT_SECONDS)
    # change the flag so we can update this label in later process.
    self.smart_usbhub = True
    return True
654
655
def reset_servo(self):
    """Reset (power-cycle) the servo via smart usbhub and report the result.

    Does nothing besides logging when this host is not a labstation.
    Otherwise the usb devnum is sampled before and after the reset, and
    the outcome is logged and recorded as an 'INFO' entry.
    """
    if not self.is_labstation():
        logging.info('Servo reset is not applicable to servo_v3.')
        return

    devnum_before = self._get_servo_usb_devnum()
    logging.info('Servo usb devnum before reset: %s', devnum_before)
    if not self._reset_servo():
        message = ('Failed to reset servo with serial: %s. (Please ignore'
                   ' this error if the DUT is not connected to a smart'
                   ' usbhub).' % self.servo_serial)
        logging.warning(message)
        self.record('INFO', None, None, message)
        return

    devnum_after = self._get_servo_usb_devnum()
    logging.info('Servo usb devnum after reset: %s', devnum_after)
    if devnum_before and devnum_after:
        # Both samples are usable, so a changed devnum confirms the reset.
        if devnum_before != devnum_after:
            message = ('Reset servo with serial %s completed successfully!'
                       % self.servo_serial)
        else:
            message = ('Servo reset completed but devnum is still not '
                       'changed!')
    else:
        message = ('Servo reset completed but unable to verify'
                   ' devnum change!')
    logging.info(message)
    self.record('INFO', None, None, message)
686
687
def _extract_compressed_logs(self, logdir, relevant_files):
    """Unpack the compressed servod logs among |relevant_files|.

    Only files ending in |COMPRESSION_SUFFIX| are touched. Each archive's
    first member is extracted directly into |logdir| under the archive's
    basename minus the suffix, and the archive is then deleted.

    @param logdir: directory to extract the logs into.
    @param relevant_files: list of files in |logdir| to consider.

    @returns: tuple, (tarfiles, files) where
              tarfiles: list of the compressed filenames that have been
                        extracted and deleted
              files: list of the uncompressed files that were generated
    """
    suffix = self.COMPRESSION_SUFFIX
    archives = [path for path in relevant_files if path.endswith(suffix)]
    unpacked = []
    for archive in archives:
        flat_name = os.path.basename(archive)[:-len(suffix)]
        with tarfile.open(archive) as tar:
            # Each tarfile has only one member, as that's the compressed
            # log.
            entry = tar.members[0]
            # Rename the member so only the basename is extracted, and
            # not the directories etc.
            entry.name = flat_name
            unpacked.append(os.path.join(logdir, entry.name))
            tar.extract(entry, logdir)
        # File has been extracted: remove the compressed file.
        os.remove(archive)
    return archives, unpacked
718
def _extract_mcu_logs(self, log_subdir):
    """Extract MCU (EC, Cr50, etc) console output from servod debug logs.

    Using the |MCU_EXTRACTOR| regex, split the MCU console lines out of
    log.DEBUG.txt into individual console logs, e.g. after this method
    you can find an ec.txt and servo_v4.txt in |log_subdir| if those MCUs
    had any console input/output. Output files are opened in append mode
    and named after the lower-cased MCU name.

    @param log_subdir: directory with log.DEBUG.txt main servod debug logs.
    """
    # Extract the MCU for each one. The MCU logs are only in the .DEBUG
    # files
    mcu_lines_file = os.path.join(log_subdir, 'log.DEBUG.txt')
    if not os.path.exists(mcu_lines_file):
        logging.info('No DEBUG logs found to extract MCU logs from.')
        return
    mcu_files = {}
    mcu_file_template = '%s.txt'
    try:
        with open(mcu_lines_file, 'r') as debug_log:
            for line in debug_log:
                match = self.MCU_EXTRACTOR.match(line)
                if not match:
                    continue
                mcu = match.group(self.MCU_GROUP).lower()
                if mcu not in mcu_files:
                    mcu_file = os.path.join(log_subdir,
                                            mcu_file_template % mcu)
                    mcu_files[mcu] = open(mcu_file, 'a')
                mcu_files[mcu].write(match.group(self.LINE_GROUP) + '\n')
    finally:
        # Close every per-MCU file even when reading or writing fails, so
        # no handles are leaked on the error path.
        for fd in mcu_files.values():
            fd.close()
751
752
def remove_latest_log_symlinks(self):
    """Remove the convenience 'latest' symlinks to the servod logs.

    Runs `rm` on everything matching latest* in |remote_log_dir|; a
    non-zero exit status is ignored.
    """
    self.run('rm %s/latest*' % self.remote_log_dir,
             stderr_tee=None, ignore_status=True)
758
def probe_servod_restart(self, instance_ts, outdir):
    """Grab servod logs from previous instances if part of this session.

    If |instance_ts| differs from the timestamp recorded in
    |_initial_instance_ts|, servod is taken to have restarted. The logs of
    every instance between the two timestamps are then collected and
    stored with the |OLD_LOG_SUFFIX| to investigate if necessary.

    It also issues a panicinfo command to servo devices after the restart
    to try and collect reboot information for debugging.

    @param instance_ts: the log timestamp that the current instance uses
    @param outdir: directory to create a subdirectory into to place the
                   servod logs into.
    """
    first_ts = self._initial_instance_ts
    if first_ts is None:
        logging.info('No log timestamp grabbed successfully on servod '
                     'startup. Cannot check device restarts. Ignoring.')
        return
    if instance_ts == first_ts:
        logging.debug('Servod appears to have run without restarting')
        return
    # Servod seems to have restarted (at least once). |first_ts| is the
    # first timestamp, and instance_ts is the current timestamp. Find all
    # timestamps in between them, and grab the logs for each.
    stale_instances = self._find_instance_timestamps_between(first_ts,
                                                             instance_ts)
    logging.info('Servod has restarted %d times between the start and the '
                 'end of this servo_host.', len(stale_instances))
    logging.info('This might be an issue. Will extract all logs from each '
                 'instance.')
    logging.info('Logs that are not the currently running (about to turn '
                 'down) instance are maked with a .%s in their folder.',
                 self.OLD_LOG_SUFFIX)
    for stale_ts in stale_instances:
        self.get_instance_logs(stale_ts, outdir, old=True)
    # Lastly, servod has restarted due to a potential issue. Try to get
    # panic information from servo micro and servo v4 for the current logs.
    # This can only happen if the |_servo| attribute is initialized.
    if not self._servo:
        return
    for mcu in ['servo_micro', 'servo_v4']:
        ctrl = '%s_uart_cmd' % mcu
        if not self._servo.has_control(ctrl):
            continue
        logging.info('Trying to retrieve %r panicinfo into logs', mcu)
        try:
            self._servo.set_nocheck(ctrl, 'panicinfo')
        except error.TestFail as e:
            logging.error('Failed to generate panicinfo for %r '
                          'logs. %s', mcu, str(e))
808
def _find_instance_timestamps_between(self, start_ts, end_ts):
    """Find all log timestamps between [start_ts, end_ts).

    Lists |remote_log_dir|, pulls the timestamp out of every file name
    that matches |TS_EXTRACTOR|, and slices the sorted, de-duplicated
    result.

    @param start_ts: str, earliest log timestamp of interest
    @param end_ts: str, latest log timestamp of interest

    @returns: list, all timestamps between start_ts and end_ts, end_ts
              exclusive, on the servo_host. An empty list on errors
    """
    listing = self.run('ls %s' % self.remote_log_dir,
                       stderr_tee=None, ignore_status=True)
    if listing.exit_status != 0:
        # Here we failed to find anything.
        logging.info('Failed to find remote servod logs. Ignoring.')
        return []
    # Files that fail the match are simply ignored. It might be the
    # 'latest' symlinks or random files.
    matches = [self.TS_EXTRACTOR.match(name)
               for name in listing.stdout.strip().split()]
    known = sorted(set(m.group(self.TS_GROUP) for m in matches if m))
    for ts in (start_ts, end_ts):
        if ts not in known:
            logging.error('Timestamp %r not in servod logs. Cannot query '
                          'for timestamps in between %r and %r', ts,
                          start_ts, end_ts)
            return []
    first = known.index(start_ts)
    last = known.index(end_ts)
    return known[first:last]
843
def get_instance_logs_ts(self):
    """Retrieve the currently running servod instance's log timestamp

    Resolves the latest.DEBUG (or, failing that, latest) symlink in
    |remote_log_dir| and extracts the timestamp from the real file name
    with |TS_EXTRACTOR|.

    @returns: str, timestamp for current instance, or None on failure
    """
    # First, extract the timestamp. This cmd gives the real filename of
    # the latest aka current log file.
    substitutions = {'dir': self.remote_log_dir,
                     'code': self.NO_SYMLINKS_CODE}
    cmd = ('if [ -f %(dir)s/latest.DEBUG ];'
           'then realpath %(dir)s/latest.DEBUG;'
           'elif [ -f %(dir)s/latest ];'
           'then realpath %(dir)s/latest;'
           'else exit %(code)d;'
           'fi' % substitutions)
    res = self.run(cmd, stderr_tee=None, ignore_status=True)
    status = res.exit_status
    if status != 0:
        if status != self.NO_SYMLINKS_CODE:
            logging.warning('Failed to find servod logs on servo host.')
            logging.warning(res.stderr.strip())
        else:
            logging.warning('servod log latest symlinks not found. '
                            'This is likely due to an error starting up '
                            'servod. Ignoring..')
        return None
    fname = os.path.basename(res.stdout.strip())
    # From the fname, ought to extract the timestamp using the TS_EXTRACTOR
    ts_match = self.TS_EXTRACTOR.match(fname)
    if ts_match:
        return ts_match.group(self.TS_GROUP)
    logging.warning('Failed to extract timestamp from servod log file '
                    '%r. Skipping. The servo host is using outdated '
                    'servod logging and needs to be updated.', fname)
    return None
877
def get_instance_logs(self, instance_ts, outdir, old=False):
    """Collect all logs with |instance_ts| and dump into a dir in |outdir|

    The remote log files whose names start with log.|instance_ts| are
    fetched from |remote_log_dir|. For each log level they are glued
    together, oldest rotation first, into a combined log.[level].txt
    file. Finally the MCU console I/O is extracted from the combined logs
    into individual files e.g. servo_v4.txt

    The output directory is created inside |outdir| and is named after
    |LOG_DIR|, the servod port, and the instance timestamp. It is removed
    again if nothing could be retrieved.

    @param instance_ts: log timestamp to grab logfiles for
    @param outdir: directory to create a subdirectory into to place the
                   servod logs into.
    @param old: bool, whether to append |OLD_LOG_SUFFIX| to output dir
    """
    # Create the local results log dir.
    dir_name = '%s_%s.%s' % (self.LOG_DIR, str(self.servo_port),
                             instance_ts)
    log_dir = os.path.join(outdir, dir_name)
    if old:
        log_dir = '%s.%s' % (log_dir, self.OLD_LOG_SUFFIX)
    logging.info('Saving servod logs to %r.', log_dir)
    os.mkdir(log_dir)
    # Now, get all files with that timestamp.
    find_cmd = 'find %s -maxdepth 1 -name "log.%s*"' % (self.remote_log_dir,
                                                        instance_ts)
    found = self.run(find_cmd, stderr_tee=None, ignore_status=True)
    remote_files = found.stdout.strip().split()
    try:
        self.get_file(remote_files, log_dir, try_rsync=False)
        if not os.listdir(log_dir):
            logging.info('No servod logs retrieved. Ignoring, and removing '
                         '%r again.', log_dir)
            os.rmdir(log_dir)
            return
    except error.AutoservRunError as e:
        result = e.result_obj
        if result.exit_status != 0:
            stderr = result.stderr.strip()
            logging.warning("Couldn't retrieve servod logs. Ignoring: %s",
                            stderr or '\n%s' % result)
        # Remove the log_dir as nothing was added to it.
        os.rmdir(log_dir)
        return
    pending = [os.path.join(log_dir, name) for name in os.listdir(log_dir)]
    # TODO(crrev.com/c/1793030): remove no-level case once CL is pushed
    for level_name in ('DEBUG', 'INFO', 'WARNING', ''):
        # Name of the joint file for this loglevel. i.e log.DEBUG
        joint_file = self.JOINT_LOG_PREFIX
        if level_name:
            joint_file = '%s.%s' % (self.JOINT_LOG_PREFIX, level_name)
        # The .txt suffix helps with some online tools to avoid complaints
        # about an unknown filetype.
        joint_path = os.path.join(log_dir, joint_file + '.txt')
        level_files = [path for path in pending if level_name in path]
        if not level_files:
            # TODO(crrev.com/c/1793030): remove no-level case once CL
            # is pushed
            continue
        # Extract compressed logs if any.
        compressed, extracted = self._extract_compressed_logs(log_dir,
                                                              level_files)
        level_files = list(set(level_files) - set(compressed))
        level_files.extend(extracted)

        # Need to sort. As they all share the same timestamp, and
        # loglevel, the index itself is sufficient. The highest index
        # is the oldest file, therefore we need a descending sort.
        def rotation_index(path, level=level_name):
            """Custom sortkey to sort based on rotation number int."""
            if path.endswith(level):
                return 0
            return int(path.split('.')[-1])

        level_files.sort(reverse=True, key=rotation_index)
        oldest, newer_files = level_files[0], level_files[1:]
        # Just rename the first file rather than building from scratch.
        os.rename(oldest, joint_path)
        with open(joint_path, 'a') as joint_f:
            for logfile in newer_files:
                # Transfer the file to the joint file line by line.
                with open(logfile, 'r') as log_f:
                    for line in log_f:
                        joint_f.write(line)
                # File has been written over. Delete safely.
                os.remove(logfile)
        # Drop everything handled for this level from |pending| so it is
        # not analyzed again.
        pending = list(set(pending) - set(level_files) - set(compressed))
    # Lastly, extract MCU logs from the joint logs.
    self._extract_mcu_logs(log_dir)
969
def _lock(self):
    """Lock the servohost by touching its lock file.

    The touch command's exit status is ignored; |_is_locked| is set to
    True once the command has been run.
    """
    lock_path = self._lock_file
    logging.debug('Locking servohost %s by touching %s file',
                  self.hostname, lock_path)
    self.run('touch %s' % lock_path, ignore_status=True)
    self._is_locked = True
Garry Wang79e9af62019-06-12 15:19:19 -0700977
978
def _unlock(self):
    """Unlock the servohost by removing its lock file.

    The rm command's exit status is ignored; |_is_locked| is set to
    False once the command has been run.
    """
    lock_path = self._lock_file
    logging.debug('Unlocking servohost by removing %s file', lock_path)
    self.run('rm %s' % lock_path, ignore_status=True)
    self._is_locked = False
Garry Wang79e9af62019-06-12 15:19:19 -0700986
987
def close(self):
    """Close the associated servo and the host object.

    In order: probe for servod restarts and grab the old logs, close the
    servo, grab the logs of the current servod instance, remove the lock
    file if this host holds the lock, stop servod, and close the parent
    host. Log collection only happens when a log timestamp was found, a
    job is attached, and the host is not localhost. Calling this on an
    already closed host only logs a debug message.
    """
    # NOTE: throughout this method there are multiple attempts to catch
    # all errors. This is WAI as log grabbing should not fail tests.
    # However, the goal is to catch and handle/process all errors, thus
    # we print the traceback and ask for a bug.
    if self._closed:
        logging.debug('ServoHost is already closed.')
        return
    instance_ts = self.get_instance_logs_ts()
    # TODO(crbug.com/1011516): once enabled, remove the check against
    # localhost and instead check against log-rotiation enablement.
    can_grab_logs = (instance_ts is not None and
                     self.job and
                     not self.is_localhost())
    if can_grab_logs:
        # Probe whether there was a servod restart, and grab those old
        # logs as well.
        try:
            self.probe_servod_restart(instance_ts, self.job.resultdir)
        except (error.AutoservRunError, error.TestFail) as e:
            logging.info('Failed to grab servo logs due to: %s. '
                         'This error is forgiven.', str(e))
        except Exception as e:
            logging.error('Unexpected error probing for old logs. %s. '
                          'Forgiven. Please file a bug and fix or catch '
                          'in log probing function', str(e),
                          exc_info=True)
    if self._servo:
        # In some cases when we run as lab-tools, the job object is None.
        servo_outdir = self.job.resultdir if self.job else None
        self._servo.close(servo_outdir)

    if can_grab_logs:
        # Grab current (not old like above) logs after the servo instance
        # was closed out.
        try:
            self.get_instance_logs(instance_ts, self.job.resultdir)
        except error.AutoservRunError as e:
            logging.info('Failed to grab servo logs due to: %s. '
                         'This error is forgiven.', str(e))
        except Exception as e:
            logging.error('Unexpected error grabbing servod logs. %s. '
                          'Forgiven. Please file a bug and fix or catch '
                          'in log grabbing function', str(e), exc_info=True)

    if self._is_locked:
        # Remove the lock if the servohost has been locked.
        try:
            self._unlock()
        except error.AutoservSSHTimeout:
            logging.error('Unlock servohost failed due to ssh timeout.'
                          ' It may caused by servohost went down during'
                          ' the task.')
    # We want always stop servod after task to minimum the impact of bad
    # servod process interfere other servods.(see crbug.com/1028665)
    try:
        self.stop_servod()
    except error.AutoservRunError as e:
        logging.info("Failed to stop servod due to:\n%s\n"
                     "This error is forgiven.", str(e))

    super(ServoHost, self).close()
    # Mark closed.
    self._closed = True
Congbin Guoa1f9cba2018-07-03 11:36:59 -07001053
1054
def get_servo_state(self):
    """Return the stored servo state.

    @returns: the value of |_servo_state|, or
              servo_constants.SERVO_STATE_UNKNOWN when it is None.
    """
    state = self._servo_state
    return servo_constants.SERVO_STATE_UNKNOWN if state is None else state
Otabek Kasimovcc9738e2020-02-14 16:17:15 -08001059
def get_verify_state(self, tag):
    """Return the state of servo verifier.

    @param tag: tag of the verifier to look up in the repair strategy.

    @returns: bool or None
    """
    strategy = self._repair_strategy
    return strategy.verifier_is_good(tag)
1066
def determine_servo_state(self):
    """Determine servo state based on the failed verifier.

    The verifiers are checked in a fixed priority order and the state of
    the first one found failing is returned. When none of the checked
    verifiers explains the failure, a counter metric is incremented and
    the generic broken state is returned.

    @returns: servo state value
    """
    ssh = self.get_verify_state('servo_ssh')
    # The next three states are queried but do not influence the result
    # yet.
    disk_space = self.get_verify_state('disk_space')
    start_servod = self.get_verify_state('servod_job')
    create_servo = self.get_verify_state('servod_connection')
    init_servo = self.get_verify_state('servod_control')
    pwr_button = self.get_verify_state('pwr_button')
    lid_open = self.get_verify_state('lid_open')
    ec_board = self.get_verify_state('ec_board')
    ccd_testlab = self.get_verify_state('ccd_testlab')

    if not ssh:
        return servo_constants.SERVO_STATE_NO_SSH

    # Ordered by priority. A ccd_testlab failure comes first as it is one
    # of the reason why servo can not initialized.
    failure_states = (
        (ccd_testlab, servo_constants.SERVO_STATE_CCD_TESTLAB_ISSUE),
        (init_servo, servo_constants.SERVO_STATE_SERVOD_ISSUE),
        (pwr_button, servo_constants.SERVO_STATE_BAD_RIBBON_CABLE),
        (lid_open, servo_constants.SERVO_STATE_LID_OPEN_FAILED),
        (ec_board, servo_constants.SERVO_STATE_EC_BROKEN),
    )
    for verdict, servo_state in failure_states:
        if verdict == self.VERIFY_FAILED:
            return servo_state

    data = {'port': self.servo_port,
            'host': self.hostname,
            'board': self.servo_board or ''}
    counter = metrics.Counter(
            'chromeos/autotest/repair/unknown_servo_state')
    counter.increment(fields=data)
    logging.info('We do not have special state for this failure yet :)')
    return servo_constants.SERVO_STATE_BROKEN
1109
Otabek Kasimovcc9738e2020-02-14 16:17:15 -08001110
def make_servo_hostname(dut_hostname):
    """Given a DUT's hostname, return the hostname of its servo.

    The servo hostname is the DUT hostname with '-servo' appended to its
    first dot-separated component.

    @param dut_hostname: hostname of a DUT.

    @return hostname of the DUT's servo.

    """
    short_name, dot, domain = dut_hostname.partition('.')
    return short_name + '-servo' + dot + domain
1122
1123
def servo_host_is_up(servo_hostname):
    """Given a servo host name, return if it's up or not.

    The host counts as up when at least one of three pings is answered.

    @param servo_hostname: hostname of the servo host.

    @return True if it's up, False otherwise
    """
    # Technically, this duplicates the SSH ping done early in the servo
    # proxy initialization code.  However, this ping ends in a couple
    # seconds when it fails, rather than the 60 seconds it takes to decide
    # that an SSH ping has timed out.  Specifically, that timeout happens
    # when our servo DNS name resolves, but there is no host at that IP.
    logging.info('Pinging servo host at %s', servo_hostname)
    ping_config = ping_runner.PingConfig(servo_hostname,
                                         count=3,
                                         ignore_result=True,
                                         ignore_status=True)
    ping_result = ping_runner.PingRunner().ping(ping_config)
    return ping_result.received > 0
1141
1142
def _map_afe_board_to_servo_board(afe_board):
    """Map a board we get from the AFE to a servo appropriate value.

    Many boards are identical to other boards for servo's purposes.
    This function makes that mapping: a board listed in BOARD_MAP is
    replaced outright, any other board has the first matching entry of
    KNOWN_SUFFIXES stripped.

    @param afe_board string board name received from AFE.
    @return board we expect servo to have.

    """
    KNOWN_SUFFIXES = ['-freon', '_freon', '_moblab', '-cheets']
    BOARD_MAP = {'gizmo': 'panther'}
    if afe_board in BOARD_MAP:
        mapped_board = BOARD_MAP[afe_board]
    else:
        matched_suffix = next(
                (s for s in KNOWN_SUFFIXES if afe_board.endswith(s)), None)
        if matched_suffix is None:
            mapped_board = afe_board
        else:
            mapped_board = afe_board[:-len(matched_suffix)]
    if mapped_board != afe_board:
        logging.info('Mapping AFE board=%s to %s', afe_board, mapped_board)
    return mapped_board
1166
1167
def get_servo_args_for_host(dut_host):
    """Return servo data associated with a given DUT.

    The servo attributes are read from the DUT's host info store. A port
    attribute is converted to int; if that fails, the host attribute is
    dropped so that no servo_args are returned for an invalid port. Board
    (mapped to its servo equivalent) and model are added when the host
    info has them.

    @param dut_host   Instance of `Host` on which to find the servo
                      attributes.
    @return `servo_args` dict with host and an optional port, or None if
            the dict has no servo host entry.
    """
    host_key = servo_constants.SERVO_HOST_ATTR
    port_key = servo_constants.SERVO_PORT_ATTR

    info = dut_host.host_info_store.get()
    servo_args = dict((key, value)
                      for key, value in info.attributes.iteritems()
                      if key in servo_constants.SERVO_ATTR_KEYS)

    if port_key in servo_args:
        try:
            servo_args[port_key] = int(servo_args[port_key])
        except ValueError:
            logging.error('servo port is not an int: %s',
                          servo_args[port_key])
            # Reset servo_args because we don't want to use an invalid port.
            servo_args.pop(host_key, None)

    if info.board:
        servo_args[servo_constants.SERVO_BOARD_ATTR] = (
                _map_afe_board_to_servo_board(info.board))
    if info.model:
        servo_args[servo_constants.SERVO_MODEL_ATTR] = info.model
    if host_key not in servo_args:
        return None
    return servo_args
Richard Barnetteea3e4602016-06-10 12:36:41 -07001195
1196
def _tweak_args_for_ssp_moblab(servo_args):
    """Point a loopback servo host at the SSP host container IP.

    When the servo host in |servo_args| is 'localhost' or '127.0.0.1', it
    is replaced in place with the 'host_container_ip' value from the 'SSP'
    config section (None if unset). Other hosts are left untouched.

    @param servo_args: dict of servo arguments; modified in place.
    """
    host_key = servo_constants.SERVO_HOST_ATTR
    if servo_args[host_key] not in ('localhost', '127.0.0.1'):
        return
    servo_args[host_key] = _CONFIG.get_config_value(
            'SSP', 'host_container_ip', type=str, default=None)
1202
1203
Dan Shi023aae32016-05-25 11:13:01 -07001204def create_servo_host(dut, servo_args, try_lab_servo=False,
Gregory Nisbetde13e2a2019-12-09 22:44:00 -08001205 try_servo_repair=False, dut_host_info=None):
Kevin Cheng5f2ba6c2016-09-28 10:20:05 -07001206 """Create a ServoHost object for a given DUT, if appropriate.
Dan Shi4d478522014-02-14 13:46:32 -08001207
Richard Barnette9a26ad62016-06-10 12:03:08 -07001208 This function attempts to create and verify or repair a `ServoHost`
1209 object for a servo connected to the given `dut`, subject to various
1210 constraints imposed by the parameters:
1211 * When the `servo_args` parameter is not `None`, a servo
1212 host must be created, and must be checked with `repair()`.
1213 * Otherwise, if a servo exists in the lab and `try_lab_servo` is
1214 true:
1215 * If `try_servo_repair` is true, then create a servo host and
1216 check it with `repair()`.
1217 * Otherwise, if the servo responds to `ping` then create a
1218 servo host and check it with `verify()`.
Fang Denge545abb2014-12-30 18:43:47 -08001219
Richard Barnette9a26ad62016-06-10 12:03:08 -07001220 In cases where `servo_args` was not `None`, repair failure
1221 exceptions are passed back to the caller; otherwise, exceptions
Richard Barnette07c2e1d2016-10-26 14:24:28 -07001222 are logged and then discarded. Note that this only happens in cases
1223 where we're called from a test (not special task) control file that
1224 has an explicit dependency on servo. In that case, we require that
1225 repair not write to `status.log`, so as to avoid polluting test
1226 results.
1227
1228 TODO(jrbarnette): The special handling for servo in test control
1229 files is a thorn in my flesh; I dearly hope to see it cut out before
1230 my retirement.
Richard Barnette9a26ad62016-06-10 12:03:08 -07001231
1232 Parameters for a servo host consist of a host name, port number, and
1233 DUT board, and are determined from one of these sources, in order of
1234 priority:
Richard Barnetteea3e4602016-06-10 12:36:41 -07001235 * Servo attributes from the `dut` parameter take precedence over
1236 all other sources of information.
1237 * If a DNS entry for the servo based on the DUT hostname exists in
1238 the CrOS lab network, that hostname is used with the default
Richard Barnette9a26ad62016-06-10 12:03:08 -07001239 port and the DUT's board.
Richard Barnetteea3e4602016-06-10 12:36:41 -07001240 * If no other options are found, the parameters will be taken
Richard Barnette9a26ad62016-06-10 12:03:08 -07001241 from the `servo_args` dict passed in from the caller.
Richard Barnetteea3e4602016-06-10 12:36:41 -07001242
1243 @param dut An instance of `Host` from which to take
1244 servo parameters (if available).
1245 @param servo_args A dictionary with servo parameters to use if
1246 they can't be found from `dut`. If this
1247 argument is supplied, unrepaired exceptions
1248 from `verify()` will be passed back to the
1249 caller.
1250 @param try_lab_servo If not true, servo host creation will be
1251 skipped unless otherwise required by the
1252 caller.
Richard Barnette9a26ad62016-06-10 12:03:08 -07001253 @param try_servo_repair If true, check a servo host with
1254 `repair()` instead of `verify()`.
Dan Shi4d478522014-02-14 13:46:32 -08001255
1256 @returns: A ServoHost object or None. See comments above.
1257
1258 """
Richard Barnette07c2e1d2016-10-26 14:24:28 -07001259 servo_dependency = servo_args is not None
Richard Barnette07c2e1d2016-10-26 14:24:28 -07001260 if dut is not None and (try_lab_servo or servo_dependency):
Prathmesh Prabhub4810232018-09-07 13:24:08 -07001261 servo_args_override = get_servo_args_for_host(dut)
Richard Barnetteea3e4602016-06-10 12:36:41 -07001262 if servo_args_override is not None:
Prathmesh Prabhuefb1b482018-08-28 17:15:05 -07001263 if utils.in_moblab_ssp():
1264 _tweak_args_for_ssp_moblab(servo_args_override)
Prathmesh Prabhu88bf6052018-08-28 16:21:26 -07001265 logging.debug(
1266 'Overriding provided servo_args (%s) with arguments'
1267 ' determined from the host (%s)',
1268 servo_args,
1269 servo_args_override,
1270 )
Richard Barnetteea3e4602016-06-10 12:36:41 -07001271 servo_args = servo_args_override
Prathmesh Prabhucba44292018-08-28 17:44:45 -07001272
Richard Barnetteea3e4602016-06-10 12:36:41 -07001273 if servo_args is None:
Prathmesh Prabhu88bf6052018-08-28 16:21:26 -07001274 logging.debug('No servo_args provided, and failed to find overrides.')
Otabek Kasimova7ba91a2020-03-09 08:31:01 -07001275 if try_lab_servo or servo_dependency:
Otabek Kasimov646812c2020-06-23 20:01:36 -07001276 return None, servo_constants.SERVO_STATE_MISSING_CONFIG
Otabek Kasimova7ba91a2020-03-09 08:31:01 -07001277 else:
1278 # For regular test case which not required the servo
1279 return None, None
1280
Garry Wang11b5e872020-03-11 15:14:08 -07001281 servo_hostname = servo_args.get(servo_constants.SERVO_HOST_ATTR)
1282 servo_port = servo_args.get(servo_constants.SERVO_PORT_ATTR)
Otabek Kasimova7ba91a2020-03-09 08:31:01 -07001283 if not _is_servo_host_information_exist(servo_hostname, servo_port):
1284 logging.debug(
1285 'Servo connection info missed hostname: %s , port: %s',
1286 servo_hostname, servo_port)
Otabek Kasimov646812c2020-06-23 20:01:36 -07001287 return None, servo_constants.SERVO_STATE_MISSING_CONFIG
Otabek Kasimova7ba91a2020-03-09 08:31:01 -07001288 if not is_servo_host_information_valid(servo_hostname, servo_port):
1289 logging.debug(
1290 'Servo connection info is incorrect hostname: %s , port: %s',
1291 servo_hostname, servo_port)
Garry Wang11b5e872020-03-11 15:14:08 -07001292 return None, servo_constants.SERVO_STATE_WRONG_CONFIG
Richard Barnette07c2e1d2016-10-26 14:24:28 -07001293 if (not servo_dependency and not try_servo_repair and
Otabek Kasimova7ba91a2020-03-09 08:31:01 -07001294 not servo_host_is_up(servo_hostname)):
Prathmesh Prabhu88bf6052018-08-28 16:21:26 -07001295 logging.debug('ServoHost is not up.')
Otabek Kasimov646812c2020-06-23 20:01:36 -07001296 return None, servo_constants.SERVO_STATE_NO_SSH
Prathmesh Prabhu88bf6052018-08-28 16:21:26 -07001297
Garry Wangebc015b2019-06-06 17:45:06 -07001298 newhost = ServoHost(**servo_args)
Garry Wangffbd2162020-04-17 16:13:48 -07001299
1300 # Reset servo if the servo is locked, as we check if the servohost is up,
1301 # if the servohost is labstation and if the servohost is in lab inside the
1302 # locking logic. Also check try_servo_repair to make sure we only do this
1303 # in AdminRepair tasks.
1304 if newhost._is_locked and try_servo_repair:
1305 newhost.reset_servo()
1306
Garry Wangcdd27b22020-01-13 14:59:11 -08001307 try:
1308 newhost.restart_servod(quick_startup=True)
1309 except error.AutoservSSHTimeout:
1310 logging.warning("Restart servod failed due ssh connection "
1311 "to servohost timed out. This error is forgiven"
1312 " here, we will retry in servo repair process.")
1313 except error.AutoservRunError as e:
1314 logging.warning("Restart servod failed due to:\n%s\n"
1315 "This error is forgiven here, we will retry"
1316 " in servo repair process.", str(e))
Garry Wangebc015b2019-06-06 17:45:06 -07001317
Gregory Nisbetde13e2a2019-12-09 22:44:00 -08001318 # TODO(gregorynisbet): Clean all of this up.
1319 logging.debug('create_servo_host: attempt to set info store on '
1320 'servo host')
1321 try:
1322 if dut_host_info is None:
1323 logging.debug('create_servo_host: dut_host_info is '
1324 'None, skipping')
1325 else:
1326 newhost.set_dut_host_info(dut_host_info)
1327 logging.debug('create_servo_host: successfully set info '
1328 'store')
1329 except Exception:
1330 logging.error("create_servo_host: (%s)", traceback.format_exc())
1331
Richard Barnette9a26ad62016-06-10 12:03:08 -07001332 # Note that the logic of repair() includes everything done
1333 # by verify(). It's sufficient to call one or the other;
1334 # we don't need both.
Richard Barnette07c2e1d2016-10-26 14:24:28 -07001335 if servo_dependency:
1336 newhost.repair(silent=True)
Otabek Kasimova7ba91a2020-03-09 08:31:01 -07001337 return newhost, newhost.get_servo_state()
Prathmesh Prabhu88bf6052018-08-28 16:21:26 -07001338
1339 if try_servo_repair:
1340 try:
1341 newhost.repair()
1342 except Exception:
1343 logging.exception('servo repair failed for %s', newhost.hostname)
Richard Barnette9a26ad62016-06-10 12:03:08 -07001344 else:
1345 try:
Prathmesh Prabhu88bf6052018-08-28 16:21:26 -07001346 newhost.verify()
Kevin Cheng5f2ba6c2016-09-28 10:20:05 -07001347 except Exception:
Prathmesh Prabhu88bf6052018-08-28 16:21:26 -07001348 logging.exception('servo verify failed for %s', newhost.hostname)
Otabek Kasimova7ba91a2020-03-09 08:31:01 -07001349 return newhost, newhost.get_servo_state()
Otabek Kasimov7267a7a2020-03-04 11:18:45 -08001350
1351
Otabek Kasimova7ba91a2020-03-09 08:31:01 -07001352def _is_servo_host_information_exist(hostname, port):
Otabek Kasimov7267a7a2020-03-04 11:18:45 -08001353 if hostname is None or len(hostname.strip()) == 0:
1354 return False
Otabek Kasimova7ba91a2020-03-09 08:31:01 -07001355 if port is None:
Otabek Kasimov7267a7a2020-03-04 11:18:45 -08001356 return False
Otabek Kasimova7ba91a2020-03-09 08:31:01 -07001357 if not type(port) is int:
1358 try:
1359 int(port)
1360 except ValueError:
1361 return False
1362
Otabek Kasimov7267a7a2020-03-04 11:18:45 -08001363 return True
1364
1365
def is_servo_host_information_valid(hostname, port):
    """Check if provided servo attributes are valid.

    @param hostname Hostname of the servohost.
    @param port servo port number.

    @returns: A bool value to indicate if provided servo attribute valid.
    """
    if not _is_servo_host_information_exist(hostname, port):
        return False
    # Check that the port falls inside the accepted range.
    port_int = int(port)
    if port_int < 1 or port_int > 65000:
        return False
    # The hostname must be at least 5 characters long and contain only
    # letters, digits, '-', '_' or '.'.
    if len(hostname) < 5:
        return False
    # Anchor with \Z rather than $: $ also matches just before a trailing
    # newline, which would let a hostname such as 'host1\n' pass.
    return re.match(r'[a-zA-Z0-9_.-]*\Z', hostname) is not None