blob: 7863ce8c5a4632171f455720f821e88a3627d464 [file] [log] [blame]
Fang Deng5d518f42013-08-02 14:04:32 -07001# Copyright (c) 2013 The Chromium OS Authors. All rights reserved.
2# Use of this source code is governed by a BSD-style license that can be
3# found in the LICENSE file.
4#
5# Expects to be run in an environment with sudo and no interactive password
6# prompt, such as within the Chromium OS development chroot.
7
8
9"""This file provides core logic for servo verify/repair process."""
10
11
Fang Deng5d518f42013-08-02 14:04:32 -070012import logging
Raul E Rangel52ca2e82018-07-03 14:10:14 -060013import os
Ruben Rodriguez Buchillon93084d02020-01-21 15:17:36 -080014import re
15import tarfile
Garry Wangc1288cf2019-12-17 14:58:00 -080016import time
Gregory Nisbet265a52c2019-12-10 20:38:42 -080017import traceback
Dana Goyette4dc0adc2019-05-06 14:51:53 -070018import xmlrpclib
Fang Deng5d518f42013-08-02 14:04:32 -070019
20from autotest_lib.client.bin import utils
Garry Wang79e9af62019-06-12 15:19:19 -070021from autotest_lib.client.common_lib import error
Richard Barnette9a26ad62016-06-10 12:03:08 -070022from autotest_lib.client.common_lib import hosts
Garry Wang7b0e1b72020-03-25 19:08:59 -070023from autotest_lib.client.common_lib import lsbrelease_utils
Fang Deng5d518f42013-08-02 14:04:32 -070024from autotest_lib.client.common_lib.cros import retry
Christopher Wileycef1f902014-06-19 11:11:23 -070025from autotest_lib.client.common_lib.cros.network import ping_runner
Richard Barnette9a26ad62016-06-10 12:03:08 -070026from autotest_lib.server.cros.servo import servo
Richard Barnetted31580e2018-05-14 19:58:00 +000027from autotest_lib.server.hosts import servo_repair
Garry Wangebc015b2019-06-06 17:45:06 -070028from autotest_lib.server.hosts import base_servohost
Garry Wang11b5e872020-03-11 15:14:08 -070029from autotest_lib.server.hosts import servo_constants
30from autotest_lib.client.common_lib import global_config
Garry Wangd7367482020-02-27 13:52:40 -080031
Dan Shi3b2adf62015-09-02 17:46:54 -070032_CONFIG = global_config.global_config
Fang Deng5d518f42013-08-02 14:04:32 -070033
Otabek Kasimova7ba91a2020-03-09 08:31:01 -070034
Garry Wangebc015b2019-06-06 17:45:06 -070035class ServoHost(base_servohost.BaseServoHost):
36 """Host class for a servo host(e.g. beaglebone, labstation)
Dana Goyette0b6e6402019-10-04 11:09:24 -070037 that with a servo instance for a specific port.
38
39 @type _servo: servo.Servo | None
40 """
Fang Deng5d518f42013-08-02 14:04:32 -070041
# Default servod port: taken from the SERVOD_PORT environment variable when
# set, otherwise 9999.
DEFAULT_PORT = int(os.getenv('SERVOD_PORT', '9999'))

# Timeout for initializing servo signals.
INITIALIZE_SERVO_TIMEOUT_SECS = 60

# Ready test function
SERVO_READY_METHOD = 'get_version'

# Directory prefix on the servo host where the servod logs are stored.
SERVOD_LOG_PREFIX = '/var/log/servod'

# Exit code to use when symlinks for servod logs are not found.
NO_SYMLINKS_CODE = 9

# Directory in the job's results directory to dump the logs into.
LOG_DIR = 'servod'

# Prefix for joint loglevel files in the logs.
JOINT_LOG_PREFIX = 'log'

# Regex group to extract timestamp from logfile name.
TS_GROUP = 'ts'

# This regex is used to extract the timestamp from servod logs.
# Files always start with 'log.'; the dots are literal separators, so they
# are escaped to keep the pattern from accepting arbitrary characters.
TS_RE = (r'log\.'
         # The timestamp is of format %Y-%m-%d--%H-%M-%S.MS
         r'(?P<%s>\d{4}(\-\d{2}){2}\-(-\d{2}){3}\.\d{3})'
         # The loglevel is optional depending on labstation version.
         r'(\.(INFO|DEBUG|WARNING))?' % TS_GROUP)
TS_EXTRACTOR = re.compile(TS_RE)

# Regex group to extract MCU name from logline in servod logs.
MCU_GROUP = 'mcu'

# Regex group to extract logline from MCU logline in servod logs.
LINE_GROUP = 'line'

# This regex is used to extract the mcu and the line content from an
# MCU logline in servod logs. e.g. EC or servo_v4 console logs.
# Here is an example log-line:
#
# 2020-01-23 13:15:12,223 - servo_v4 - EC3PO.Console - DEBUG -
# console.py:219:LogConsoleOutput - /dev/pts/9 - cc polarity: cc1
#
# Here is conceptually how they are formatted:
#
#  <time> - <MCU> - EC3PO.Console - <LVL> - <file:line:func> - <pts> -
#  <output>
#
# The log format starts with a timestamp
MCU_RE = (r'[\d\-]+ [\d:,]+ '
          # The mcu that is logging this is next.
          r'- (?P<%s>\w+) - '
          # Next, we have more log outputs before the actual line.
          # Information about the file line, logging function etc.
          # Anchor on EC3PO Console, LogConsoleOutput and dev/pts.
          # NOTE: if the log format changes, this regex needs to be
          # adjusted.
          r'EC3PO\.Console[\s\-\w\d:.]+LogConsoleOutput - /dev/pts/\d+ - '
          # Lastly, we get the MCU's console line.
          r'(?P<%s>.+$)' % (MCU_GROUP, LINE_GROUP))
MCU_EXTRACTOR = re.compile(MCU_RE)

# Suffix to identify compressed logfiles.
COMPRESSION_SUFFIX = '.tbz2'
108
Otabek Kasimovcc9738e2020-02-14 16:17:15 -0800109 def _init_attributes(self):
110 self._servo_state = None
111 self.servo_port = None
112 self.servo_board = None
113 self.servo_model = None
114 self.servo_serial = None
115 self._servo = None
116 self._servod_server_proxy = None
Ruben Rodriguez Buchillon93084d02020-01-21 15:17:36 -0800117 # Flag to make sure that multiple calls to close do not result in the
118 # logic executing multiple times.
119 self._closed = False
Fang Deng5d518f42013-08-02 14:04:32 -0700120
def _initialize(self, servo_host='localhost',
                servo_port=DEFAULT_PORT, servo_board=None,
                servo_model=None, servo_serial=None, is_in_lab=None,
                *args, **dargs):
    """Set up a ServoHost, i.e. a host that controls a servo.

    @param servo_host: Name of the host where the servod process
                       is running.
    @param servo_port: Port the servod process is listening on. Defaults
                       to the SERVOD_PORT environment variable if set,
                       otherwise 9999.
    @param servo_board: Board that the servo is connected to.
    @param servo_model: Model that the servo is connected to.
    @param servo_serial: Serial of the servo; stored as given.
    @param is_in_lab: True if the servo host is in Cros Lab. Default is set
                      to None, for which utils.host_is_in_lab_zone will be
                      called to check if the servo host is in Cros lab.

    """
    super(ServoHost, self)._initialize(hostname=servo_host,
                                       is_in_lab=is_in_lab, *args, **dargs)
    self._init_attributes()
    self.servo_port = int(servo_port)
    self.servo_board = servo_board
    self.servo_model = servo_model
    self.servo_serial = servo_serial

    port_text = str(self.servo_port)
    # The location of the log files on the servo host for this instance.
    self.remote_log_dir = '%s_%s' % (self.SERVOD_LOG_PREFIX,
                                     self.servo_port)
    # Path of the servo host lock file.
    self._lock_file = self.TEMP_FILE_DIR + port_text + self.LOCK_FILE_POSTFIX
    # File path to declare a reboot request.
    self._reboot_file = (self.TEMP_FILE_DIR + port_text
                         + self.REBOOT_FILE_POSTFIX)

    # An in-lab labstation gets locked so that no other task reboots it
    # before the current task completes. Waiting for the host to be up
    # first covers the case where the labstation is mid-reboot.
    self._is_locked = False
    if self.wait_up(self.REBOOT_TIMEOUT):
        if self.is_in_lab() and self.is_labstation():
            self._lock()

    self._repair_strategy = servo_repair.create_servo_repair_strategy()
Richard Barnettee519dcd2016-08-15 17:37:17 -0700170
Dana Goyetteafa62fd2020-03-16 13:45:27 -0700171 def __str__(self):
172 return "<%s '%s:%s'>" % (
173 type(self).__name__, self.hostname, self.servo_port)
174
def connect_servo(self):
    """Create the servo object and initialize the DUT through it.

    A `servo.Servo` bound to this host is stored in `self._servo`, then
    its `initialize_dut` is run under a timeout of
    INITIALIZE_SERVO_TIMEOUT_SECS. Per the original notes, this verifies
    the network connections (creating an ssh tunnel if required) and, as
    a side effect, resets the servo signals to default values and sets
    the USB stick to the neutral (off) position.

    @raises AutoservVerifyError if initialization times out.
    """
    self._servo = servo.Servo(servo_host=self,
                              servo_serial=self.servo_serial)
    timed_out, _ = retry.timeout(
            self._servo.initialize_dut,
            timeout_sec=self.INITIALIZE_SERVO_TIMEOUT_SECS)
    if not timed_out:
        return
    raise hosts.AutoservVerifyError('Servo initialize timed out.')
Richard Barnette9a26ad62016-06-10 12:03:08 -0700194
195
def disconnect_servo(self):
    """Drop the servo connection, if one was made.

    When `self._servo` is set, the rpc server tracker is told to
    disconnect this host's servo port and `self._servo` is reset to
    `None`. Nothing happens when no servo is connected.
    """
    if not self._servo:
        return
    # N.B. This call is safe even without a tunnel:
    # rpc_server_tracker.disconnect() silently ignores
    # unknown ports.
    # NOTE(review): self._servod_server_proxy is not cleared here, so a
    # previously cached proxy is kept after the disconnect -- confirm
    # that is intended.
    self.rpc_server_tracker.disconnect(self.servo_port)
    self._servo = None
Fang Deng5d518f42013-08-02 14:04:32 -0700209
Garry Wangc1288cf2019-12-17 14:58:00 -0800210
def _create_servod_server_proxy(self):
    """Build a new proxy for talking to the servod server.

    A remote host with ssh tunnelling enabled is reached through
    `rpc_server_tracker.xmlrpc_connect`; otherwise a plain
    `xmlrpclib.ServerProxy` on http://hostname:port is used.

    @returns: An xmlrpclib.ServerProxy that is connected to the servod
              server on the host.
    """
    needs_tunnel = (servo_constants.ENABLE_SSH_TUNNEL_FOR_SERVO
                    and not self.is_localhost())
    if not needs_tunnel:
        url = 'http://%s:%s' % (self.hostname, self.servo_port)
        return xmlrpclib.ServerProxy(url)
    return self.rpc_server_tracker.xmlrpc_connect(
            None, self.servo_port,
            ready_test_name=self.SERVO_READY_METHOD,
            timeout_seconds=60,
            request_timeout_seconds=3600,
            server_desc=str(self))
Fang Deng5d518f42013-08-02 14:04:32 -0700228
229
def get_servod_server_proxy(self):
    """Return the servod proxy, creating and caching it on first use.

    @returns: An xmlrpclib.ServerProxy that is connected to the servod
              server on the host.
    """
    proxy = self._servod_server_proxy
    # Single-threaded execution, no race
    if proxy is None:
        proxy = self._create_servod_server_proxy()
        self._servod_server_proxy = proxy
    return proxy
240
241
def verify(self, silent=False):
    """Run the repair strategy's verify step and record the servo state.

    `self._servo_state` becomes WORKING when the step completes and
    BROKEN when it raises. Only failures that `_is_critical_error()`
    reports as critical are re-raised.

    @param silent If true, suppress logging in `status.log`.
    """
    start_msg = ('Beginning verify for servo host %s port %s serial %s'
                 % (self.hostname, self.servo_port, self.servo_serial))
    self.record('INFO', None, None, start_msg)
    try:
        self._repair_strategy.verify(self, silent)
        self._servo_state = servo_constants.SERVO_STATE_WORKING
        self.record('INFO', None, None,
                    'ServoHost verify set servo_state as WORKING')
    except Exception as err:
        self._servo_state = servo_constants.SERVO_STATE_BROKEN
        self.record('INFO', None, None,
                    'ServoHost verify set servo_state as BROKEN')
        if not self._is_critical_error(err):
            return
        raise
Fang Deng5d518f42013-08-02 14:04:32 -0700261
262
def get_image_name_from_usbkey(self, usbkey_dev):
    """Mount the usb drive read-only and read the ChromeOS image name.

    This method assumes the image_usbkey_direction is already set to
    servo side. The drive is always unmounted again before returning.

    @param: usbkey_dev  usbkey dev path(e.g. /dev/sdb).

    @returns: image_name on the usbkey, e.g. nami-release/R82.10138.0.0,
              or empty string if no test image detected, or unexpected
              error occurred.
    @raises   AutoservRepairError if mount usb drive failed with no
              specific device error, which usually means the usbkey is
              not existing or in bad shape.
    """
    mount_point = '/media/servo_usb/%s' % self.servo_port
    umount_cmd = 'umount %s' % mount_point
    # ChromeOS root fs is in /dev/sdx3
    mount_cmd = 'mount -o ro %s3 %s' % (usbkey_dev, mount_point)
    # Clear any stale mount, then make sure the mount point exists.
    self.run(umount_cmd, ignore_status=True)
    self.run('mkdir -p %s' % mount_point)
    try:
        mounted = self.run(mount_cmd, ignore_status=True)
        status = mounted.exit_status
        if status == 32 and 'does not exist' in mounted.stderr:
            # probe_host_usb_dev() sometimes return stale record.
            raise hosts.AutoservRepairError('No usbkey detected on servo,'
                                            ' the usbkey may be either'
                                            ' missing or broken.',
                                            'missing usbkey')
        if status != 0:
            logging.error('Unexpected error occurred on mount usb'
                          ' drive, skipping usbkey validation.')
            return ''

        lsb_release = self.run(
                'cat %s/etc/lsb-release' % mount_point,
                ignore_status=True).stdout.strip()
        if re.search(r'RELEASE_TRACK=.*test', lsb_release):
            return lsbrelease_utils.get_chromeos_release_builder_path(
                    lsb_release_content=lsb_release)
        logging.info('The image on usbkey is not a test image')
        return ''
    finally:
        logging.debug('Usbkey validation compeleted, unmounting the'
                      ' usb drive.')
        self.run(umount_cmd, ignore_status=True)
314
315
def validate_image_usbkey(self):
    """Check that a usbkey on the servo is reachable from the servohost.

    The usb disk path is probed through the servo and, when found, the
    image name on it is read via `get_image_name_from_usbkey()`. Callers
    can use the result to avoid an unnecessary download and flash.

    @returns: image_name on the usbkey, e.g. nami-release/R82.10138.0.0,
              or empty string if no test image detected, or unexpected
              error occurred.
    @raises:  AutoservRepairError if the usbkey is not detected on servo.
    """
    logging.info('Validating image usbkey on servo.')
    try:
        usbkey_dev = self._servo.probe_host_usb_dev()
    except Exception as e:
        # We don't want any unexpected or transient servo communicating
        # failure block usb repair, so capture all errors here.
        logging.error(e, exc_info=True)
        logging.error('Unexpected error occurred on get usbkey dev path,'
                      ' skipping usbkey validation.')
        return ''

    if usbkey_dev:
        return self.get_image_name_from_usbkey(usbkey_dev)
    raise hosts.AutoservRepairError('No usbkey detected on servo, the'
                                    ' usbkey may be either missing or'
                                    ' broken.', 'missing usbkey')
345
346
def repair(self, silent=False):
    """Run the repair strategy's repair step and record the servo state.

    On success the state becomes WORKING and, for a labstation, any
    reboot request made by this servo is withdrawn. On failure the state
    becomes BROKEN; a critical failure also disconnects the servo and
    stops servod before being re-raised.

    @param silent If true, suppress logging in `status.log`.
    """
    start_msg = ('Beginning repair for servo host %s port %s serial %s'
                 % (self.hostname, self.servo_port, self.servo_serial))
    self.record('INFO', None, None, start_msg)
    try:
        self._repair_strategy.repair(self, silent)
        self._servo_state = servo_constants.SERVO_STATE_WORKING
        self.record('INFO', None, None,
                    'ServoHost repair set servo_state as WORKING')
        # If target is a labstation then try to withdraw any existing
        # reboot request created by this servo because it passed repair.
        if self.is_labstation():
            self.withdraw_reboot_request()
    except Exception as err:
        self._servo_state = servo_constants.SERVO_STATE_BROKEN
        self.record('INFO', None, None,
                    'ServoHost repair set servo_state as BROKEN')
        if not self._is_critical_error(err):
            return
        self.disconnect_servo()
        self.stop_servod()
        raise
372
373
def _is_critical_error(self, error):
    """Decide whether a verify/repair failure is critical.

    A failure is non-critical only when it is an
    `AutoservVerifyDependencyError` whose `is_critical()` is false.

    @param error: The exception raised by verify or repair.

    @returns: False for a non-critical failure, True otherwise.
    """
    tolerable = (isinstance(error, hosts.AutoservVerifyDependencyError)
                 and not error.is_critical())
    if not tolerable:
        logging.info('Critical verify failure(s) detected during repair/verify'
                     ' servo. Disconnecting servo and stop servod, all repair '
                     'action and tests that depends on servo will not run.')
        return True
    logging.warning('Non-critical verify failure(s) detected during'
                    ' verify/repair servo, servo connection will'
                    ' still up but may not fully functional.'
                    ' Some repair actions and servo depended'
                    ' tests may not run.')
    return False
Fang Deng5d518f42013-08-02 14:04:32 -0700387
388
def get_servo(self):
    """Return the servo object held by this host.

    The value is whatever `self._servo` currently holds, which is `None`
    when no servo is connected.

    @return: a servo.Servo object.
    @rtype: autotest_lib.server.cros.servo.servo.Servo
    """
    cached_servo = self._servo
    return cached_servo
396
397
def request_reboot(self):
    """Ask for a servohost reboot by touching the reboot flag file.

    The touch command's exit status is ignored.
    """
    logging.debug('Request to reboot servohost %s has been created by '
                  'servo with port # %s', self.hostname, self.servo_port)
    touch_cmd = 'touch %s' % self._reboot_file
    self.run(touch_cmd, ignore_status=True)
404
405
def withdraw_reboot_request(self):
    """Cancel a pending servohost reboot request, if there is one.

    The reboot flag file is removed with `rm -f`; the command's exit
    status is ignored.
    """
    logging.debug('Withdrawing request to reboot servohost %s that created'
                  ' by servo with port # %s if exists.',
                  self.hostname, self.servo_port)
    remove_cmd = 'rm -f %s' % self._reboot_file
    self.run(remove_cmd, ignore_status=True)
414
415
def start_servod(self, quick_startup=False):
    """Start the servod process on servohost.

    Nothing is done when the servohost is the localhost. Otherwise a
    `start servod` command is assembled from the board, model, port and
    serial, run on the host, and followed by a fixed wait for servod to
    come up.

    @param quick_startup: If true, wait the quick startup timeout
                          instead of the standard startup timeout.
    """
    # Skip if running on the localhost.(crbug.com/1038168)
    if self.is_localhost():
        logging.debug("Servohost is a localhost, skipping start servod.")
        return

    cmd_parts = ['start servod']
    if self.servo_board:
        cmd_parts.append('BOARD=%s' % self.servo_board)
        if self.servo_model:
            cmd_parts.append('MODEL=%s' % self.servo_model)
    else:
        logging.warning('Board for DUT is unknown; starting servod'
                        ' assuming a pre-configured board.')

    cmd_parts.append('PORT=%d' % self.servo_port)
    if self.servo_serial:
        cmd_parts.append('SERIAL=%s' % self.servo_serial)

    # Start servod with dual_v4 if the DUT/servo from designated pools.
    dut_host_info = self.get_dut_host_info()
    if dut_host_info and (dut_host_info.pools &
                          servo_constants.POOLS_SUPPORT_DUAL_V4):
        logging.debug('The DUT is detected in following designated'
                      ' pools %s,starting servod with DUAL_V4 option.',
                      servo_constants.POOLS_SUPPORT_DUAL_V4)
        cmd_parts.append('DUAL_V4=1')

    # Remove the symbolic links from the logs. This helps ensure that
    # a failed servod instantiation does not cause us to grab old logs
    # by mistake.
    self.remove_latest_log_symlinks()
    self.run(' '.join(cmd_parts), timeout=60)

    # There's a lag between when `start servod` completes and when
    # the _ServodConnectionVerifier trigger can actually succeed.
    # The call to time.sleep() below gives time to make sure that
    # the trigger won't fail after we return.

    # Normally servod on servo_v3 and labstation take ~10 seconds to ready,
    # But in the rare case all servo on a labstation are in heavy use they
    # may take ~30 seconds. So the timeout value will double these value,
    # and we'll try quick start up when first time initialize servohost,
    # and use standard start up timeout in repair.
    timeout = (servo_constants.SERVOD_QUICK_STARTUP_TIMEOUT
               if quick_startup
               else servo_constants.SERVOD_STARTUP_TIMEOUT)
    logging.debug('Wait %s seconds for servod process fully up.', timeout)
    time.sleep(timeout)
469
470
def stop_servod(self):
    """Stop the servod process on servohost.

    Nothing is done when the servohost is the localhost. Otherwise
    `stop servod` is run for this port (exit status ignored), followed
    by a fixed wait for the process to tear down.
    """
    # Skip if running on the localhost.(crbug.com/1038168)
    if self.is_localhost():
        logging.debug("Servohost is a localhost, skipping stop servod.")
        return

    logging.debug('Stopping servod on port %s', self.servo_port)
    stop_cmd = 'stop servod PORT=%d' % self.servo_port
    self.run(stop_cmd, timeout=60, ignore_status=True)
    teardown_wait = servo_constants.SERVOD_TEARDOWN_TIMEOUT
    logging.debug('Wait %s seconds for servod process fully teardown.',
                  teardown_wait)
    time.sleep(teardown_wait)
Garry Wangc1288cf2019-12-17 14:58:00 -0800485
486
def restart_servod(self, quick_startup=False):
    """Restart servod on the servohost: stop it, then start it again.

    @param quick_startup: Passed through to `start_servod()`.
    """
    for step, step_args in ((self.stop_servod, ()),
                            (self.start_servod, (quick_startup,))):
        step(*step_args)
492
Garry Wang11b5e872020-03-11 15:14:08 -0700493
Ruben Rodriguez Buchillon93084d02020-01-21 15:17:36 -0800494 def _extract_compressed_logs(self, logdir, relevant_files):
495 """Decompress servod logs in |logdir|.
496
497 @param logdir: directory containing compressed servod logs.
498 @param relevant_files: list of files in |logdir| to consider.
499
500 @returns: tuple, (tarfiles, files) where
501 tarfiles: list of the compressed filenames that have been
502 extracted and deleted
503 files: list of the uncompressed files that were generated
504 """
505 # For all tar-files, first extract them to the directory, and
506 # then let the common flow handle them.
507 tarfiles = [cf for cf in relevant_files if
508 cf.endswith(self.COMPRESSION_SUFFIX)]
509 files = []
510 for f in tarfiles:
511 norm_name = os.path.basename(f)[:-len(self.COMPRESSION_SUFFIX)]
512 with tarfile.open(f) as tf:
513 # Each tarfile has only one member, as
514 # that's the compressed log.
515 member = tf.members[0]
516 # Manipulate so that it only extracts the basename, and not
517 # the directories etc.
518 member.name = norm_name
519 files.append(os.path.join(logdir, member.name))
520 tf.extract(member, logdir)
521 # File has been extracted: remove the compressed file.
522 os.remove(f)
523 return tarfiles, files
524
525 def _extract_mcu_logs(self, log_subdir):
526 """Extract MCU (EC, Cr50, etc) console output from servod debug logs.
527
528 Using the MCU_EXTRACTOR regex (above) extract and split out MCU console
529 lines from the logs to generate invidiual console logs e.g. after
530 this method, you can find an ec.txt and servo_v4.txt in |log_dir| if
531 those MCUs had any console input/output.
532
533 @param log_subdir: directory with log.DEBUG.txt main servod debug logs.
534 """
535 # Extract the MCU for each one. The MCU logs are only in the .DEBUG
536 # files
537 mcu_lines_file = os.path.join(log_subdir, 'log.DEBUG.txt')
538 if not os.path.exists(mcu_lines_file):
539 logging.info('No DEBUG logs found to extract MCU logs from.')
540 return
541 mcu_files = {}
542 mcu_file_template = '%s.txt'
543 with open(mcu_lines_file, 'r') as f:
544 for line in f:
545 match = self.MCU_EXTRACTOR.match(line)
546 if match:
547 mcu = match.group(self.MCU_GROUP).lower()
548 line = match.group(self.LINE_GROUP)
549 if mcu not in mcu_files:
550 mcu_file = os.path.join(log_subdir,
551 mcu_file_template % mcu)
552 mcu_files[mcu] = open(mcu_file, 'a')
553 fd = mcu_files[mcu]
554 fd.write(line + '\n')
555 for f in mcu_files:
556 mcu_files[f].close()
557
558
def remove_latest_log_symlinks(self):
    """Delete the 'latest*' convenience symlinks of the servod logs.

    Runs `rm` on <remote_log_dir>/latest* on the servo host; the exit
    status is ignored.
    """
    rm_cmd = 'rm %s/latest*' % self.remote_log_dir
    self.run(rm_cmd, stderr_tee=None, ignore_status=True)
564
def grab_logs(self, outdir):
    """Retrieve logs from servo_host to |outdir|/servod_{port}.{ts}/.

    This method first collects all logs on the servo_host side pertaining
    to this servod instance (port, instantiation). It glues them together
    into combined log.[level].txt files, oldest rotation first, and
    extracts all available MCU console I/O from the logs into individual
    files e.g. servo_v4.txt

    All the output can be found in a directory inside |outdir| that
    this generates based on |LOG_DIR|, the servod port, and the instance
    timestamp on the servo_host side.

    The method returns early, with only a warning, when the 'latest'
    symlinks are missing, when the log file name carries no parseable
    timestamp, or when copying the files from the servo host fails.

    @param outdir: directory to create a subdirectory into to place the
                   servod logs into.
    """
    # First, extract the timestamp. This cmd gives the real filename of
    # the latest aka current log file.
    cmd = ('if [ -f %(dir)s/latest.DEBUG ];'
           'then realpath %(dir)s/latest.DEBUG;'
           'elif [ -f %(dir)s/latest ];'
           'then realpath %(dir)s/latest;'
           'else exit %(code)d;'
           'fi' % {'dir': self.remote_log_dir,
                   'code': self.NO_SYMLINKS_CODE})
    res = self.run(cmd, stderr_tee=None, ignore_status=True)
    if res.exit_status != 0:
        if res.exit_status == self.NO_SYMLINKS_CODE:
            logging.warning('servod log latest symlinks not found. '
                            'This is likely due to an error starting up '
                            'servod. Ignoring..')
        else:
            logging.warning('Failed to find servod logs on servo host.')
            logging.warning(res.stderr.strip())
        return
    fname = os.path.basename(res.stdout.strip())
    # From the fname, ought to extract the timestamp using the TS_EXTRACTOR
    ts_match = self.TS_EXTRACTOR.match(fname)
    if not ts_match:
        logging.warning('Failed to extract timestamp from servod log file '
                        '%r. Skipping. The servo host is using outdated '
                        'servod logging and needs to be updated.', fname)
        return
    instance_ts = ts_match.group(self.TS_GROUP)
    # Create the local results log dir.
    log_dir = os.path.join(outdir, '%s_%s.%s' % (self.LOG_DIR,
                                                 str(self.servo_port),
                                                 instance_ts))
    logging.info('Saving servod logs to %s.', log_dir)
    os.mkdir(log_dir)
    # Now, get all files with that timestamp.
    cmd = 'find %s -maxdepth 1 -name "log.%s*"' % (self.remote_log_dir,
                                                   instance_ts)
    res = self.run(cmd, stderr_tee=None, ignore_status=True)
    files = res.stdout.strip().split()
    try:
        self.get_file(files, log_dir, try_rsync=False)
    except error.AutoservRunError as e:
        result = e.result_obj
        if result.exit_status != 0:
            stderr = result.stderr.strip()
            logging.warning("Couldn't retrieve servod logs. Ignoring: %s",
                            stderr or '\n%s' % result)
        return

    def rotation_index(path):
        """Return the rotation number of a log file; 0 for the live file.

        The number is whatever follows the timestamp (and optional
        loglevel) in the file name. Parsing it this way keeps the
        millisecond part of the timestamp from being mistaken for a
        rotation number when the file name has no loglevel.
        """
        name = os.path.basename(path)
        match = self.TS_EXTRACTOR.match(name)
        if match:
            rotation = name[match.end():].lstrip('.')
        else:
            rotation = name.split('.')[-1]
        return int(rotation) if rotation.isdigit() else 0

    local_files = [os.path.join(log_dir, f) for f in os.listdir(log_dir)]
    # TODO(crrev.com/c/1793030): remove no-level case once CL is pushed
    for level_name in ('DEBUG', 'INFO', 'WARNING', ''):
        # Create the joint files for each loglevel. i.e log.DEBUG
        joint_file = self.JOINT_LOG_PREFIX
        if level_name:
            joint_file = '%s.%s' % (self.JOINT_LOG_PREFIX, level_name)
        # This helps with some online tools to avoid complaints about an
        # unknown filetype.
        joint_file = joint_file + '.txt'
        joint_path = os.path.join(log_dir, joint_file)
        # Match on the file name only, so that a results path that
        # happens to contain a level name cannot select every file.
        files = [f for f in local_files
                 if level_name in os.path.basename(f)]
        if not files:
            # TODO(crrev.com/c/1793030): remove no-level case once CL
            # is pushed
            continue
        # Extract compressed logs if any.
        compressed, extracted = self._extract_compressed_logs(log_dir,
                                                              files)
        files = list(set(files) - set(compressed))
        files.extend(extracted)
        # Need to sort. As they all share the same timestamp, and
        # loglevel, the index itself is sufficient. The highest index
        # is the oldest file, therefore we need a descending sort.
        files.sort(reverse=True, key=rotation_index)
        # Just rename the first file rather than building from scratch.
        os.rename(files[0], joint_path)
        with open(joint_path, 'a') as joint_f:
            for logfile in files[1:]:
                # Transfer the file to the joint file line by line.
                with open(logfile, 'r') as log_f:
                    for line in log_f:
                        joint_f.write(line)
                # File has been written over. Delete safely.
                os.remove(logfile)
        # Need to remove all files from |local_files| so we don't
        # analyze them again.
        local_files = list(set(local_files) - set(files) - set(compressed))
    # Lastly, extract MCU logs from the joint logs.
    self._extract_mcu_logs(log_dir)
674
Garry Wangc1288cf2019-12-17 14:58:00 -0800675
def _lock(self):
    """Mark this servohost as locked by touching its lock file.

    The `touch` command is run on the host with `ignore_status=True`;
    afterwards the host is flagged as locked via `self._is_locked`.
    """
    lock_path = self._lock_file
    logging.debug('Locking servohost %s by touching %s file',
                  self.hostname, lock_path)
    touch_cmd = 'touch %s' % lock_path
    self.run(touch_cmd, ignore_status=True)
    self._is_locked = True
Garry Wang79e9af62019-06-12 15:19:19 -0700683
684
def _unlock(self):
    """Release the servohost lock by deleting its lock file.

    The `rm` command is run on the host with `ignore_status=True`;
    afterwards the locked flag `self._is_locked` is cleared.
    """
    lock_path = self._lock_file
    logging.debug('Unlocking servohost by removing %s file', lock_path)
    remove_cmd = 'rm %s' % lock_path
    self.run(remove_cmd, ignore_status=True)
    self._is_locked = False
Garry Wang79e9af62019-06-12 15:19:19 -0700692
693
def close(self):
    """Close the associated servo and the host object.

    Returns immediately when this host was already closed. Otherwise,
    in order: closes the servo object (if any), grabs the servod logs
    when there is a job and the host is not localhost, removes the
    servohost lock if it is held, stops servod, closes the parent host
    and finally marks this host as closed. Failures to grab logs, to
    unlock (ssh timeout) and to stop servod are logged and forgiven.
    """
    if self._closed:
        logging.debug('ServoHost is already closed.')
        return

    if self._servo:
        # In some cases when we run as lab-tools, the job object is None.
        outdir = self.job.resultdir if self.job else None
        self._servo.close(outdir)

    if self.job and not self.is_localhost():
        # Grab all logs from this servod instance before stopping servod.
        # TODO(crbug.com/1011516): once enabled, remove the check against
        # localhost and instead check against log-rotation enablement.
        try:
            self.grab_logs(self.job.resultdir)
        except error.AutoservRunError as grab_err:
            logging.info('Failed to grab servo logs due to: %s. '
                         'This error is forgiven.', str(grab_err))

    if self._is_locked:
        # The servohost was locked by us, so release the lock.
        try:
            self._unlock()
        except error.AutoservSSHTimeout:
            logging.error('Unlock servohost failed due to ssh timeout.'
                          ' It may caused by servohost went down during'
                          ' the task.')

    # Always stop servod after the task to minimize the chance of a bad
    # servod process interfering with other servods
    # (see crbug.com/1028665).
    try:
        self.stop_servod()
    except error.AutoservRunError as stop_err:
        logging.info("Failed to stop servod due to:\n%s\n"
                     "This error is forgiven.", str(stop_err))

    super(ServoHost, self).close()
    # Mark closed.
    self._closed = True
Congbin Guoa1f9cba2018-07-03 11:36:59 -0700733
734
def get_servo_state(self):
    """Return the recorded servo state.

    @return `self._servo_state` when it has been set, otherwise
            `servo_constants.SERVO_STATE_UNKNOWN`.
    """
    state = self._servo_state
    if state is not None:
        return state
    return servo_constants.SERVO_STATE_UNKNOWN
Otabek Kasimovcc9738e2020-02-14 16:17:15 -0800739
740
def make_servo_hostname(dut_hostname):
    """Derive the servo hostname that corresponds to a DUT hostname.

    The suffix '-servo' is appended to the first dot-separated label of
    the name; any remaining labels are kept unchanged.

    @param dut_hostname: hostname of a DUT.

    @return hostname of the DUT's servo.

    """
    first_label, dot, remainder = dut_hostname.partition('.')
    return first_label + '-servo' + dot + remainder
752
753
def servo_host_is_up(servo_hostname):
    """Report whether a servo host answers to ping.

    @param servo_hostname: hostname of the servo host.

    @return True if at least one of the pings was answered, False
            otherwise.
    """
    # Technically, this duplicates the SSH ping done early in the servo
    # proxy initialization code.  However, this ping ends in a couple
    # of seconds when it fails, rather than the 60 seconds it takes to
    # decide that an SSH ping has timed out.  Specifically, that timeout
    # happens when our servo DNS name resolves, but there is no host at
    # that IP.
    logging.info('Pinging servo host at %s', servo_hostname)
    ping_config = ping_runner.PingConfig(servo_hostname,
                                         count=3,
                                         ignore_result=True,
                                         ignore_status=True)
    ping_result = ping_runner.PingRunner().ping(ping_config)
    return ping_result.received > 0
771
772
def _map_afe_board_to_servo_board(afe_board):
    """Translate an AFE board name into the board name servo expects.

    Many boards are identical to other boards for servo's purposes.
    A board listed in the explicit map is replaced by its mapped name;
    otherwise the first matching known suffix (if any) is stripped.
    A log line is emitted whenever the name changes.

    @param afe_board string board name received from AFE.
    @return board we expect servo to have.

    """
    explicit_map = {'gizmo': 'panther'}
    strippable_suffixes = ('-freon', '_freon', '_moblab', '-cheets')

    if afe_board in explicit_map:
        servo_board = explicit_map[afe_board]
    else:
        # Only the first suffix that matches is removed.
        matched = next((tail for tail in strippable_suffixes
                        if afe_board.endswith(tail)), None)
        if matched is None:
            servo_board = afe_board
        else:
            servo_board = afe_board[:-len(matched)]

    if servo_board != afe_board:
        logging.info('Mapping AFE board=%s to %s', afe_board, servo_board)
    return servo_board
796
797
def get_servo_args_for_host(dut_host):
    """Collect the servo arguments recorded for a DUT.

    The DUT's host info attributes are filtered down to the keys in
    `servo_constants.SERVO_ATTR_KEYS`. A servo port, when present, is
    converted to int; if that conversion fails the servo host entry is
    dropped, which makes this function return None. The servo board
    (mapped from the DUT's board) and the model are added when the host
    info provides them.

    @param dut_host   Instance of `Host` on which to find the servo
                      attributes.
    @return `servo_args` dict with host and an optional port, or None
            when the dict ends up without a servo host entry.
    """
    info = dut_host.host_info_store.get()
    host_key = servo_constants.SERVO_HOST_ATTR
    port_key = servo_constants.SERVO_PORT_ATTR

    servo_args = {}
    for attr_name, attr_value in info.attributes.iteritems():
        if attr_name in servo_constants.SERVO_ATTR_KEYS:
            servo_args[attr_name] = attr_value

    if port_key in servo_args:
        raw_port = servo_args[port_key]
        try:
            servo_args[port_key] = int(raw_port)
        except ValueError:
            logging.error('servo port is not an int: %s', raw_port)
            # Drop the host entry so that the final check below rejects
            # the whole dict: we don't want to use an invalid port.
            servo_args.pop(host_key, None)

    if info.board:
        servo_args[servo_constants.SERVO_BOARD_ATTR] = (
                _map_afe_board_to_servo_board(info.board))
    if info.model:
        servo_args[servo_constants.SERVO_MODEL_ATTR] = info.model

    if host_key not in servo_args:
        return None
    return servo_args
Richard Barnetteea3e4602016-06-10 12:36:41 -0700825
826
def _tweak_args_for_ssp_moblab(servo_args):
    """Redirect a loopback servo host to the SSP host container address.

    When the servo host entry of `servo_args` is 'localhost' or
    '127.0.0.1', it is replaced in place by the 'host_container_ip'
    value of the 'SSP' config section (looked up with a default of
    None). Any other servo host is left untouched.

    @param servo_args: dict of servo arguments; must contain the servo
                       host key. Modified in place.
    """
    host_key = servo_constants.SERVO_HOST_ATTR
    if servo_args[host_key] not in ('localhost', '127.0.0.1'):
        return
    container_ip = _CONFIG.get_config_value(
            'SSP', 'host_container_ip', type=str, default=None)
    servo_args[host_key] = container_ip
832
833
def create_servo_host(dut, servo_args, try_lab_servo=False,
                      try_servo_repair=False, dut_host_info=None):
    """Create a ServoHost object for a given DUT, if appropriate.

    This function attempts to create and verify or repair a `ServoHost`
    object for a servo connected to the given `dut`, subject to various
    constraints imposed by the parameters:
      * When the `servo_args` parameter is not `None`, a servo
        host must be created, and must be checked with `repair()`.
      * Otherwise, if a servo exists in the lab and `try_lab_servo` is
        true:
          * If `try_servo_repair` is true, then create a servo host and
            check it with `repair()`.
          * Otherwise, if the servo responds to `ping` then create a
            servo host and check it with `verify()`.

    In cases where `servo_args` was not `None`, repair failure
    exceptions are passed back to the caller; otherwise, exceptions
    are logged and then discarded.  Note that this only happens in cases
    where we're called from a test (not special task) control file that
    has an explicit dependency on servo.  In that case, we require that
    repair not write to `status.log`, so as to avoid polluting test
    results.

    TODO(jrbarnette):  The special handling for servo in test control
    files is a thorn in my flesh; I dearly hope to see it cut out before
    my retirement.

    Parameters for a servo host consist of a host name, port number, and
    DUT board, and are determined from one of these sources, in order of
    priority:
      * Servo attributes from the `dut` parameter take precedence over
        all other sources of information.
      * If a DNS entry for the servo based on the DUT hostname exists in
        the CrOS lab network, that hostname is used with the default
        port and the DUT's board.
      * If no other options are found, the parameters will be taken
        from the `servo_args` dict passed in from the caller.

    Before a host object is created, the servo host name and port are
    checked: missing information, invalid information, and (when
    neither a servo dependency nor repair was requested) an
    unreachable host each end the call early with no host object and
    a matching servo state.

    @param dut            An instance of `Host` from which to take
                          servo parameters (if available).
    @param servo_args     A dictionary with servo parameters to use if
                          they can't be found from `dut`.  If this
                          argument is supplied, unrepaired exceptions
                          from `repair()` will be passed back to the
                          caller.
    @param try_lab_servo  If not true, servo host creation will be
                          skipped unless otherwise required by the
                          caller.
    @param try_servo_repair  If true, check a servo host with
                          `repair()` instead of `verify()`.
    @param dut_host_info  Optional DUT host info; when not `None` it is
                          handed to the new servo host through
                          `set_dut_host_info()`.  Any exception raised
                          while doing so is logged and ignored.

    @returns: A tuple `(servo_host, servo_state)`.  `servo_host` is a
              ServoHost object, or None when no host was created.
              `servo_state` is the created host's `get_servo_state()`
              value, or one of the `servo_constants.SERVO_STATE_*`
              values explaining why no host was created, or None when
              no servo arguments were found and no servo was requested.

    """
    # A caller that passes explicit servo_args depends on servo.
    servo_dependency = servo_args is not None
    if dut is not None and (try_lab_servo or servo_dependency):
        servo_args_override = get_servo_args_for_host(dut)
        if servo_args_override is not None:
            if utils.in_moblab_ssp():
                _tweak_args_for_ssp_moblab(servo_args_override)
            logging.debug(
                    'Overriding provided servo_args (%s) with arguments'
                    ' determined from the host (%s)',
                    servo_args,
                    servo_args_override,
            )
            servo_args = servo_args_override

    if servo_args is None:
        logging.debug('No servo_args provided, and failed to find overrides.')
        if try_lab_servo or servo_dependency:
            return None, servo_constants.SERVO_STATE_NOT_CONNECTED
        else:
            # For regular test case which not required the servo
            return None, None

    servo_hostname = servo_args.get(servo_constants.SERVO_HOST_ATTR)
    servo_port = servo_args.get(servo_constants.SERVO_PORT_ATTR)
    if not _is_servo_host_information_exist(servo_hostname, servo_port):
        logging.debug(
            'Servo connection info missed hostname: %s , port: %s',
            servo_hostname, servo_port)
        return None, servo_constants.SERVO_STATE_NOT_CONNECTED
    if not is_servo_host_information_valid(servo_hostname, servo_port):
        logging.debug(
            'Servo connection info is incorrect hostname: %s , port: %s',
            servo_hostname, servo_port)
        return None, servo_constants.SERVO_STATE_WRONG_CONFIG
    # The ping check is only used when neither a servo dependency nor a
    # repair attempt was requested.
    if (not servo_dependency and not try_servo_repair and
            not servo_host_is_up(servo_hostname)):
        logging.debug('ServoHost is not up.')
        return None, servo_constants.SERVO_STATE_BROKEN

    newhost = ServoHost(**servo_args)
    # Failures to restart servod are tolerated here; the verify/repair
    # step below gets another chance.
    try:
        newhost.restart_servod(quick_startup=True)
    except error.AutoservSSHTimeout:
        logging.warning("Restart servod failed due ssh connection "
                        "to servohost timed out. This error is forgiven"
                        " here, we will retry in servo repair process.")
    except error.AutoservRunError as e:
        logging.warning("Restart servod failed due to:\n%s\n"
                        "This error is forgiven here, we will retry"
                        " in servo repair process.", str(e))

    # TODO(gregorynisbet): Clean all of this up.
    logging.debug('create_servo_host: attempt to set info store on '
                  'servo host')
    try:
        if dut_host_info is None:
            logging.debug('create_servo_host: dut_host_info is '
                          'None, skipping')
        else:
            newhost.set_dut_host_info(dut_host_info)
            logging.debug('create_servo_host: successfully set info '
                          'store')
    except Exception:
        logging.error("create_servo_host: (%s)", traceback.format_exc())

    # Note that the logic of repair() includes everything done
    # by verify().  It's sufficient to call one or the other;
    # we don't need both.
    if servo_dependency:
        # Exceptions from repair() propagate to the caller in this case.
        newhost.repair(silent=True)
        return newhost, newhost.get_servo_state()

    if try_servo_repair:
        try:
            newhost.repair()
        except Exception:
            logging.exception('servo repair failed for %s', newhost.hostname)
    else:
        try:
            newhost.verify()
        except Exception:
            logging.exception('servo verify failed for %s', newhost.hostname)
    return newhost, newhost.get_servo_state()
Otabek Kasimov7267a7a2020-03-04 11:18:45 -0800972
973
def _is_servo_host_information_exist(hostname, port):
    """Check that servo connection information is present.

    @param hostname: servo host name; must not be None or blank.
    @param port: servo port; must not be None and must be convertible
                 with `int()`.

    @return True if both the host name and the port are present, False
            otherwise.
    """
    if hostname is None or not hostname.strip():
        return False
    if port is None:
        return False
    try:
        int(port)
    except (TypeError, ValueError, OverflowError):
        # TypeError covers values such as lists or dicts, which int()
        # rejects without raising ValueError.
        return False
    return True


def is_servo_host_information_valid(hostname, port):
    """Check that servo connection information is present and sane.

    @param hostname: servo host name; must be at least 5 characters and
                     consist only of letters, digits, '-', '_' and '.'.
    @param port: servo port; its int value must be in the range
                 1..65000 (inclusive).

    @return True if the host name and port pass all checks, False
            otherwise.
    """
    if not _is_servo_host_information_exist(hostname, port):
        return False
    # Check that the port is within the accepted range.
    port_int = int(port)
    if port_int < 1 or port_int > 65000:
        return False
    # The host name may contain only letters, digits, '-', '_' and '.'.
    # \Z (rather than $) anchors at the very end of the string, so a
    # name with a trailing newline is rejected.
    if not re.match(r'[a-zA-Z0-9\-_.]*\Z', hostname) or len(hostname) < 5:
        return False
    return True