blob: 6c6fe6c98495f7cf530bc93dcbcdff7f962e514d [file] [log] [blame]
# Copyright (c) 2013 The Chromium OS Authors. All rights reserved.
# Use of this source code is governed by a BSD-style license that can be
# found in the LICENSE file.
#
# Expects to be run in an environment with sudo and no interactive password
# prompt, such as within the Chromium OS development chroot.


"""This file provides core logic for servo verify/repair process."""


Fang Deng5d518f42013-08-02 14:04:32 -070012import logging
Raul E Rangel52ca2e82018-07-03 14:10:14 -060013import os
Ruben Rodriguez Buchillon93084d02020-01-21 15:17:36 -080014import re
15import tarfile
Garry Wangc1288cf2019-12-17 14:58:00 -080016import time
Gregory Nisbet265a52c2019-12-10 20:38:42 -080017import traceback
Dana Goyette4dc0adc2019-05-06 14:51:53 -070018import xmlrpclib
Fang Deng5d518f42013-08-02 14:04:32 -070019
20from autotest_lib.client.bin import utils
Garry Wang79e9af62019-06-12 15:19:19 -070021from autotest_lib.client.common_lib import error
Richard Barnette9a26ad62016-06-10 12:03:08 -070022from autotest_lib.client.common_lib import hosts
Fang Deng5d518f42013-08-02 14:04:32 -070023from autotest_lib.client.common_lib.cros import retry
Christopher Wileycef1f902014-06-19 11:11:23 -070024from autotest_lib.client.common_lib.cros.network import ping_runner
Richard Barnette9a26ad62016-06-10 12:03:08 -070025from autotest_lib.server.cros.servo import servo
Richard Barnetted31580e2018-05-14 19:58:00 +000026from autotest_lib.server.hosts import servo_repair
Garry Wangebc015b2019-06-06 17:45:06 -070027from autotest_lib.server.hosts import base_servohost
Garry Wang11b5e872020-03-11 15:14:08 -070028from autotest_lib.server.hosts import servo_constants
29from autotest_lib.client.common_lib import global_config
Garry Wangd7367482020-02-27 13:52:40 -080030
# Module-wide handle on the autotest global configuration object.
_CONFIG = global_config.global_config
Fang Deng5d518f42013-08-02 14:04:32 -070032
Otabek Kasimova7ba91a2020-03-09 08:31:01 -070033
Garry Wangebc015b2019-06-06 17:45:06 -070034class ServoHost(base_servohost.BaseServoHost):
35 """Host class for a servo host(e.g. beaglebone, labstation)
    that works with a servo instance for a specific port.
37
38 @type _servo: servo.Servo | None
39 """
Fang Deng5d518f42013-08-02 14:04:32 -070040
# Port servod is assumed to listen on unless the caller overrides it: the
# SERVOD_PORT environment variable when set, otherwise 9999.
DEFAULT_PORT = int(os.getenv('SERVOD_PORT', '9999'))

# Timeout for initializing servo signals.
INITIALIZE_SERVO_TIMEOUT_SECS = 60

# Ready test function
SERVO_READY_METHOD = 'get_version'

# Directory prefix on the servo host where the servod logs are stored.
SERVOD_LOG_PREFIX = '/var/log/servod'

# Exit code to use when symlinks for servod logs are not found.
NO_SYMLINKS_CODE = 9

# Directory in the job's results directory to dump the logs into.
LOG_DIR = 'servod'

# Prefix for joint loglevel files in the logs.
JOINT_LOG_PREFIX = 'log'

# Regex group to extract timestamp from logfile name.
TS_GROUP = 'ts'

# This regex is used to extract the timestamp from servod logs.
# Files always start with 'log.'. Every '.' separator is escaped so that
# it only matches a literal dot rather than any character.
TS_RE = (r'log\.'
         # The timestamp is of format %Y-%m-%d--%H-%M-%S.MS
         r'(?P<%s>\d{4}(\-\d{2}){2}\-(-\d{2}){3}\.\d{3})'
         # The loglevel is optional depending on labstation version.
         r'(\.(INFO|DEBUG|WARNING))?' % TS_GROUP)
TS_EXTRACTOR = re.compile(TS_RE)

# Regex group to extract MCU name from logline in servod logs.
MCU_GROUP = 'mcu'

# Regex group to extract logline from MCU logline in servod logs.
LINE_GROUP = 'line'

# This regex is used to extract the mcu and the line content from an
# MCU logline in servod logs. e.g. EC or servo_v4 console logs.
# Here is an example log-line:
#
# 2020-01-23 13:15:12,223 - servo_v4 - EC3PO.Console - DEBUG -
# console.py:219:LogConsoleOutput - /dev/pts/9 - cc polarity: cc1
#
# Here is conceptually how they are formatted:
#
#  <time> - <MCU> - EC3PO.Console - <LVL> - <file:line:func> - <pts> -
#  <output>
#
# The log format starts with a timestamp
MCU_RE = (r'[\d\-]+ [\d:,]+ '
          # The mcu that is logging this is next.
          r'- (?P<%s>\w+) - '
          # Next, we have more log outputs before the actual line.
          # Information about the file line, logging function etc.
          # Anchor on EC3PO Console, LogConsoleOutput and dev/pts.
          # NOTE: if the log format changes, this regex needs to be
          # adjusted.
          r'EC3PO\.Console[\s\-\w\d:.]+LogConsoleOutput - /dev/pts/\d+ - '
          # Lastly, we get the MCU's console line.
          r'(?P<%s>.+$)' % (MCU_GROUP, LINE_GROUP))
MCU_EXTRACTOR = re.compile(MCU_RE)

# Suffix to identify compressed logfiles.
COMPRESSION_SUFFIX = '.tbz2'

# A suffix to mark servod log directories that came from instances that
# ran during this servo_host, but are not the last one running e.g. when
# an instance (on purpose, or due to a bug) restarted in the middle of the
# run.
OLD_LOG_SUFFIX = 'old'
113
Otabek Kasimovcc9738e2020-02-14 16:17:15 -0800114 def _init_attributes(self):
115 self._servo_state = None
116 self.servo_port = None
117 self.servo_board = None
118 self.servo_model = None
119 self.servo_serial = None
120 self._servo = None
121 self._servod_server_proxy = None
Ruben Rodriguez Buchillonb0ef0f42020-03-25 21:32:58 -0700122 self._initial_instance_ts = None
Ruben Rodriguez Buchillon93084d02020-01-21 15:17:36 -0800123 # Flag to make sure that multiple calls to close do not result in the
124 # logic executing multiple times.
125 self._closed = False
Fang Deng5d518f42013-08-02 14:04:32 -0700126
def _initialize(self, servo_host='localhost',
                servo_port=DEFAULT_PORT, servo_board=None,
                servo_model=None, servo_serial=None, is_in_lab=None,
                *args, **dargs):
    """Initialize a ServoHost instance.

    A ServoHost instance represents a host that controls a servo.

    @param servo_host: Name of the host where the servod process
                       is running.
    @param servo_port: Port the servod process is listening on. Defaults
                       to the SERVOD_PORT environment variable if set,
                       otherwise 9999.
    @param servo_board: Board that the servo is connected to.
    @param servo_model: Model that the servo is connected to.
    @param servo_serial: Serial of the servo; handed to servod as SERIAL=
                         when servod is started by this host.
    @param is_in_lab: True if the servo host is in Cros Lab. Default is set
                      to None, for which utils.host_is_in_lab_zone will be
                      called to check if the servo host is in Cros lab.
    @param args: Extra positional arguments forwarded to the base class.
    @param dargs: Extra keyword arguments forwarded to the base class.
    """
    super(ServoHost, self)._initialize(hostname=servo_host,
                                       is_in_lab=is_in_lab, *args, **dargs)
    # Start from a clean slate, then record what the caller told us.
    self._init_attributes()
    self.servo_port = int(servo_port)
    self.servo_board = servo_board
    self.servo_model = servo_model
    self.servo_serial = servo_serial

    port_text = str(self.servo_port)
    # The location of the log files on the servo host for this instance.
    self.remote_log_dir = '%s_%s' % (self.SERVOD_LOG_PREFIX,
                                     self.servo_port)
    # Path of the servo host lock file.
    self._lock_file = self.TEMP_FILE_DIR + port_text + self.LOCK_FILE_POSTFIX
    # File path to declare a reboot request.
    self._reboot_file = (self.TEMP_FILE_DIR + port_text
                         + self.REBOOT_FILE_POSTFIX)

    # Lock the servo host if it's an in-lab labstation, so that no other
    # task reboots it before the current task completes. Waiting for the
    # host to be up first covers a labstation that is mid-reboot.
    self._is_locked = False
    host_is_up = self.wait_up(self.REBOOT_TIMEOUT)
    if host_is_up and self.is_in_lab() and self.is_labstation():
        self._lock()

    self._repair_strategy = servo_repair.create_servo_repair_strategy()
Richard Barnettee519dcd2016-08-15 17:37:17 -0700176
Dana Goyetteafa62fd2020-03-16 13:45:27 -0700177 def __str__(self):
178 return "<%s '%s:%s'>" % (
179 type(self).__name__, self.hostname, self.servo_port)
180
def connect_servo(self):
    """Establish a connection to the servod server on this host.

    Stores a new servo.Servo in `self._servo` and then runs its
    initialize_dut() under a timeout to verify that all network
    connections are working. This will create an ssh tunnel if it's
    required.

    As a side effect of testing the connection, all signals on the
    target servo are reset to default values, and the USB stick is
    set to the neutral (off) position.

    @raises hosts.AutoservVerifyError: if initialization did not finish
            within INITIALIZE_SERVO_TIMEOUT_SECS.
    """
    new_servo = servo.Servo(servo_host=self,
                            servo_serial=self.servo_serial)
    # Cache the object before initializing it, as the original flow does.
    self._servo = new_servo
    timed_out, _ = retry.timeout(
            new_servo.initialize_dut,
            timeout_sec=self.INITIALIZE_SERVO_TIMEOUT_SECS)
    if not timed_out:
        return
    raise hosts.AutoservVerifyError('Servo initialize timed out.')
Richard Barnette9a26ad62016-06-10 12:03:08 -0700200
201
def disconnect_servo(self):
    """Disconnect our servo if it exists.

    When a servo object is cached, tear down whatever connection the rpc
    server tracker holds for the servo port and reset `self._servo` to
    `None`. Does nothing when no servo is cached.
    """
    if not self._servo:
        return
    # N.B. This call is safe even without a tunnel:
    # rpc_server_tracker.disconnect() silently ignores
    # unknown ports.
    self.rpc_server_tracker.disconnect(self.servo_port)
    self._servo = None
Fang Deng5d518f42013-08-02 14:04:32 -0700215
Garry Wangc1288cf2019-12-17 14:58:00 -0800216
def _create_servod_server_proxy(self):
    """Create a proxy that can be used to communicate with servod server.

    A direct HTTP proxy is used for localhost or when ssh tunnelling is
    disabled; otherwise the connection goes through the rpc server
    tracker.

    @returns: An xmlrpclib.ServerProxy that is connected to the servod
              server on the host.
    """
    needs_tunnel = (servo_constants.ENABLE_SSH_TUNNEL_FOR_SERVO
                    and not self.is_localhost())
    if not needs_tunnel:
        remote = 'http://%s:%s' % (self.hostname, self.servo_port)
        return xmlrpclib.ServerProxy(remote)
    return self.rpc_server_tracker.xmlrpc_connect(
            None, self.servo_port,
            ready_test_name=self.SERVO_READY_METHOD,
            timeout_seconds=60,
            request_timeout_seconds=3600,
            server_desc=str(self))
Fang Deng5d518f42013-08-02 14:04:32 -0700234
235
def get_servod_server_proxy(self):
    """Return the servod proxy, creating and caching it on first use.

    @returns: An xmlrpclib.ServerProxy that is connected to the servod
              server on the host.
    """
    # Single-threaded execution, no race
    proxy = self._servod_server_proxy
    if proxy is None:
        proxy = self._create_servod_server_proxy()
        self._servod_server_proxy = proxy
    return proxy
246
247
def verify(self, silent=False):
    """Update the servo host and verify it's in a good state.

    Records the outcome in `self._servo_state` (WORKING or BROKEN). Only
    failures classified as critical by _is_critical_error() are re-raised.

    @param silent   If true, suppress logging in `status.log`.
    """
    self.record('INFO', None, None,
                'Beginning verify for servo host %s port %s serial %s'
                % (self.hostname, self.servo_port, self.servo_serial))
    try:
        self._repair_strategy.verify(self, silent)
        self._servo_state = servo_constants.SERVO_STATE_WORKING
        self.record('INFO', None, None,
                    'ServoHost verify set servo_state as WORKING')
    except Exception as verify_error:
        self._servo_state = servo_constants.SERVO_STATE_BROKEN
        self.record('INFO', None, None,
                    'ServoHost verify set servo_state as BROKEN')
        if self._is_critical_error(verify_error):
            raise
Fang Deng5d518f42013-08-02 14:04:32 -0700267
268
def repair(self, silent=False):
    """Attempt to repair servo host.

    Records the outcome in `self._servo_state` (WORKING or BROKEN). On a
    critical failure the servo is disconnected, servod is stopped and the
    error is re-raised; non-critical failures are swallowed.

    @param silent   If true, suppress logging in `status.log`.
    """
    self.record('INFO', None, None,
                'Beginning repair for servo host %s port %s serial %s'
                % (self.hostname, self.servo_port, self.servo_serial))
    try:
        self._repair_strategy.repair(self, silent)
        self._servo_state = servo_constants.SERVO_STATE_WORKING
        self.record('INFO', None, None,
                    'ServoHost repair set servo_state as WORKING')
        # If target is a labstation then try to withdraw any existing
        # reboot request created by this servo because it passed repair.
        if self.is_labstation():
            self.withdraw_reboot_request()
    except Exception as repair_error:
        self._servo_state = servo_constants.SERVO_STATE_BROKEN
        self.record('INFO', None, None,
                    'ServoHost repair set servo_state as BROKEN')
        if self._is_critical_error(repair_error):
            self.disconnect_servo()
            self.stop_servod()
            raise
294
295
def _is_critical_error(self, error):
    """Classify a verify/repair failure as critical or not.

    @param error: the exception raised by the verify/repair strategy.

    @returns: False only for an AutoservVerifyDependencyError whose
              is_critical() is false; True for every other exception.
    """
    is_dependency_error = isinstance(error,
                                     hosts.AutoservVerifyDependencyError)
    if not is_dependency_error or error.is_critical():
        logging.info('Critical verify failure(s) detected during repair/verify'
                     ' servo. Disconnecting servo and stop servod, all repair '
                     'action and tests that depends on servo will not run.')
        return True
    logging.warning('Non-critical verify failure(s) detected during'
                    ' verify/repair servo, servo connection will'
                    ' still up but may not fully functional.'
                    ' Some repair actions and servo depended'
                    ' tests may not run.')
    return False
Fang Deng5d518f42013-08-02 14:04:32 -0700309
310
def get_servo(self):
    """Return whatever is currently cached in `self._servo`.

    @return: the cached servo.Servo object, or None if none is cached.
    @rtype: autotest_lib.server.cros.servo.servo.Servo
    """
    cached_servo = self._servo
    return cached_servo
318
319
def request_reboot(self):
    """Ask for the servohost to be rebooted when it is safe to do so.

    The request is made by touching this servo's reboot flag file on the
    servohost; a failing command is ignored.
    """
    logging.debug('Request to reboot servohost %s has been created by '
                  'servo with port # %s', self.hostname, self.servo_port)
    touch_cmd = 'touch %s' % self._reboot_file
    self.run(touch_cmd, ignore_status=True)
326
327
def withdraw_reboot_request(self):
    """Withdraw this servo's servohost reboot request, if one exists.

    The request is withdrawn by removing the reboot flag file; a failing
    command is ignored.
    """
    logging.debug('Withdrawing request to reboot servohost %s that created'
                  ' by servo with port # %s if exists.',
                  self.hostname, self.servo_port)
    remove_cmd = 'rm -f %s' % self._reboot_file
    self.run(remove_cmd, ignore_status=True)
336
337
def start_servod(self, quick_startup=False):
    """Start the servod process on servohost.

    Builds the `start servod` command from the known board, model, port
    and serial, runs it, waits for servod to come up, and caches the log
    timestamp of the freshly started instance.

    @param quick_startup: if True wait only the quick start-up timeout
                          instead of the standard one.
    """
    # Skip if running on the localhost.(crbug.com/1038168)
    if self.is_localhost():
        logging.debug("Servohost is a localhost, skipping start servod.")
        return

    cmd_parts = ['start servod']
    if not self.servo_board:
        logging.warning('Board for DUT is unknown; starting servod'
                        ' assuming a pre-configured board.')
    else:
        cmd_parts.append(' BOARD=%s' % self.servo_board)
        if self.servo_model:
            cmd_parts.append(' MODEL=%s' % self.servo_model)

    cmd_parts.append(' PORT=%d' % self.servo_port)
    if self.servo_serial:
        cmd_parts.append(' SERIAL=%s' % self.servo_serial)

    # Start servod with dual_v4 if the DUT/servo from designated pools.
    dut_host_info = self.get_dut_host_info()
    if dut_host_info and bool(dut_host_info.pools &
                              servo_constants.POOLS_SUPPORT_DUAL_V4):
        logging.debug('The DUT is detected in following designated'
                      ' pools %s,starting servod with DUAL_V4 option.',
                      servo_constants.POOLS_SUPPORT_DUAL_V4)
        cmd_parts.append(' DUAL_V4=1')

    # Remove the symbolic links from the logs. This helps ensure that
    # a failed servod instantiation does not cause us to grab old logs
    # by mistake.
    self.remove_latest_log_symlinks()
    self.run(''.join(cmd_parts), timeout=60)

    # There's a lag between when `start servod` completes and when
    # the _ServodConnectionVerifier trigger can actually succeed.
    # The call to time.sleep() below gives time to make sure that
    # the trigger won't fail after we return.

    # Normally servod on servo_v3 and labstation take ~10 seconds to ready,
    # But in the rare case all servo on a labstation are in heavy use they
    # may take ~30 seconds. So the timeout value will double these value,
    # and we'll try quick start up when first time initialize servohost,
    # and use standard start up timeout in repair.
    timeout = (servo_constants.SERVOD_QUICK_STARTUP_TIMEOUT
               if quick_startup
               else servo_constants.SERVOD_STARTUP_TIMEOUT)
    logging.debug('Wait %s seconds for servod process fully up.', timeout)
    time.sleep(timeout)
    # Cache the initial instance timestamp to check against servod restarts
    self._initial_instance_ts = self.get_instance_logs_ts()
Garry Wangc1288cf2019-12-17 14:58:00 -0800393
394
def stop_servod(self):
    """Stop the servod process on servohost.

    Issues `stop servod` for this servo's port (failures are ignored) and
    then waits for the teardown timeout so that the process is fully gone.
    """
    # Skip if running on the localhost.(crbug.com/1038168)
    if self.is_localhost():
        logging.debug("Servohost is a localhost, skipping stop servod.")
        return

    logging.debug('Stopping servod on port %s', self.servo_port)
    stop_cmd = 'stop servod PORT=%d' % self.servo_port
    self.run(stop_cmd, timeout=60, ignore_status=True)
    teardown_wait = servo_constants.SERVOD_TEARDOWN_TIMEOUT
    logging.debug('Wait %s seconds for servod process fully teardown.',
                  teardown_wait)
    time.sleep(teardown_wait)
Garry Wangc1288cf2019-12-17 14:58:00 -0800409
410
def restart_servod(self, quick_startup=False):
    """Restart servod on the servohost: stop it, then start it again.

    @param quick_startup: forwarded to start_servod().
    """
    self.stop_servod()
    self.start_servod(quick_startup)
416
Garry Wang11b5e872020-03-11 15:14:08 -0700417
Ruben Rodriguez Buchillon93084d02020-01-21 15:17:36 -0800418 def _extract_compressed_logs(self, logdir, relevant_files):
419 """Decompress servod logs in |logdir|.
420
421 @param logdir: directory containing compressed servod logs.
422 @param relevant_files: list of files in |logdir| to consider.
423
424 @returns: tuple, (tarfiles, files) where
425 tarfiles: list of the compressed filenames that have been
426 extracted and deleted
427 files: list of the uncompressed files that were generated
428 """
429 # For all tar-files, first extract them to the directory, and
430 # then let the common flow handle them.
431 tarfiles = [cf for cf in relevant_files if
432 cf.endswith(self.COMPRESSION_SUFFIX)]
433 files = []
434 for f in tarfiles:
435 norm_name = os.path.basename(f)[:-len(self.COMPRESSION_SUFFIX)]
436 with tarfile.open(f) as tf:
437 # Each tarfile has only one member, as
438 # that's the compressed log.
439 member = tf.members[0]
440 # Manipulate so that it only extracts the basename, and not
441 # the directories etc.
442 member.name = norm_name
443 files.append(os.path.join(logdir, member.name))
444 tf.extract(member, logdir)
445 # File has been extracted: remove the compressed file.
446 os.remove(f)
447 return tarfiles, files
448
449 def _extract_mcu_logs(self, log_subdir):
450 """Extract MCU (EC, Cr50, etc) console output from servod debug logs.
451
452 Using the MCU_EXTRACTOR regex (above) extract and split out MCU console
453 lines from the logs to generate invidiual console logs e.g. after
454 this method, you can find an ec.txt and servo_v4.txt in |log_dir| if
455 those MCUs had any console input/output.
456
457 @param log_subdir: directory with log.DEBUG.txt main servod debug logs.
458 """
459 # Extract the MCU for each one. The MCU logs are only in the .DEBUG
460 # files
461 mcu_lines_file = os.path.join(log_subdir, 'log.DEBUG.txt')
462 if not os.path.exists(mcu_lines_file):
463 logging.info('No DEBUG logs found to extract MCU logs from.')
464 return
465 mcu_files = {}
466 mcu_file_template = '%s.txt'
467 with open(mcu_lines_file, 'r') as f:
468 for line in f:
469 match = self.MCU_EXTRACTOR.match(line)
470 if match:
471 mcu = match.group(self.MCU_GROUP).lower()
472 line = match.group(self.LINE_GROUP)
473 if mcu not in mcu_files:
474 mcu_file = os.path.join(log_subdir,
475 mcu_file_template % mcu)
476 mcu_files[mcu] = open(mcu_file, 'a')
477 fd = mcu_files[mcu]
478 fd.write(line + '\n')
479 for f in mcu_files:
480 mcu_files[f].close()
481
482
def remove_latest_log_symlinks(self):
    """Remove the convenience 'latest' symlinks to the servod logs.

    Runs `rm` on everything matching latest* in the remote log directory;
    a failing command is ignored.
    """
    rm_cmd = 'rm ' + '%s/latest*' % self.remote_log_dir
    self.run(rm_cmd, stderr_tee=None, ignore_status=True)
488
def probe_servod_restart(self, instance_ts, outdir):
    """Grab servod logs from previous instances if part of this session.

    If since the last time this host called start_servod() servod crashed
    and restarted, this helper finds those logs as well, and stores them
    with the |OLD_LOG_SUFFIX| to investigate if necessary.

    It also issues a panicinfo command to servo devices after the restart
    to try and collect reboot information for debugging. That step is
    skipped when no servo object is connected.

    @param instance_ts: the log timestamp that the current instance uses
    @param outdir: directory to create a subdirectory into to place the
                   servod logs into.
    """
    if self._initial_instance_ts is None:
        logging.info('No log timestamp grabbed successfully on servod '
                     'startup. Cannot check device restarts. Ignoring.')
        return
    if instance_ts == self._initial_instance_ts:
        logging.debug('Servod appears to have run without restarting')
        return
    # Servod seems to have restarted (at least once). |_initial_instance_ts|
    # is the first timestamp, and instance_ts is the current timestamp. Find
    # all timestamps in between them, and grab the logs for each.
    tss = self._find_instance_timestamps_between(self._initial_instance_ts,
                                                 instance_ts)
    logging.info('Servod has restarted %d times between the start and the '
                 'end of this servo_host.', len(tss))
    logging.info('This might be an issue. Will extract all logs from each '
                 'instance.')
    logging.info('Logs that are not the currently running (about to turn '
                 'down) instance are maked with a .%s in their folder.',
                 self.OLD_LOG_SUFFIX)
    for ts in tss:
        self.get_instance_logs(ts, outdir, old=True)
    # Lastly, servod has restarted due to a potential issue. Try to get
    # panic information from servo micro and servo v4 for the current logs.
    # This is only possible while a servo object is connected: |_servo| is
    # None before connect_servo() and after disconnect_servo().
    if not self._servo:
        logging.info('No servo connection available. Skipping panicinfo '
                     'collection.')
        return
    for mcu in ['servo_micro', 'servo_v4']:
        ctrl = '%s_uart_cmd' % mcu
        if self._servo.has_control(ctrl):
            logging.info('Trying to retrieve %r panicinfo into logs', mcu)
            try:
                self._servo.set_nocheck(ctrl, 'panicinfo')
            except error.TestFail as e:
                logging.error('Failed to generate panicinfo for %r logs. '
                              '%s', mcu, str(e))
535
def grab_logs(self, outdir):
    """Retrieve logs from servo_host to |outdir|/servod_{port}.{ts}/.

    This method grabs all logs since servod was last restarted by this host
    i.e. if servod restarts in the middle of the run (intentionally or not)
    those logs will all be grabbed as well. Nothing is collected when the
    current instance's log timestamp cannot be determined.

    @param outdir: directory to create a subdirectory into to place the
                   servod logs into.
    """
    current_ts = self.get_instance_logs_ts()
    if current_ts is None:
        return
    # Pick up logs of earlier, restarted instances first, then the logs
    # of the instance that is currently running.
    self.probe_servod_restart(current_ts, outdir)
    self.get_instance_logs(current_ts, outdir)
550
551 def _find_instance_timestamps_between(self, start_ts, end_ts):
552 """Find all log timestamps between [start_ts, end_ts).
553
554 @param start_ts: str, earliest log timestamp of interest
555 @param end_ts: str, latest log timestamp of interest
556
557 @returns: list, all timestamps between start_ts and end_ts, end_ts
558 exclusive, on the servo_host. An empty list on errors
559 """
560 # Simply get all timestamp, and then sort and remove
561 cmd = 'ls %s' % self.remote_log_dir
562 res = self.run(cmd, stderr_tee=None, ignore_status=True)
563 if res.exit_status != 0:
564 # Here we failed to find anything.
565 logging.info('Failed to find remote servod logs. Ignoring.')
566 return []
567 logfiles = res.stdout.strip().split()
568 timestamps = set()
569 for logfile in logfiles:
570 ts_match = self.TS_EXTRACTOR.match(logfile)
571 if not ts_match:
572 # Simply ignore files that fail the check. It might be the
573 # 'latest' symlinks or random files.
574 continue
575 timestamps.add(ts_match.group(self.TS_GROUP))
576 # At this point we have all unique timestamps.
577 timestamps = sorted(timestamps)
578 for ts in [start_ts, end_ts]:
579 if ts not in timestamps:
580 logging.error('Timestamp %r not in servod logs. Cannot query '
581 'for timestamps in between %r and %r', ts,
582 start_ts, end_ts)
583 return []
584 return timestamps[timestamps.index(start_ts):timestamps.index(end_ts)]
585
def get_instance_logs_ts(self):
    """Retrieve the currently running servod instance's log timestamp

    Resolves the 'latest.DEBUG' (or, failing that, 'latest') symlink in
    the remote log directory and extracts the timestamp from the name of
    the file it points to.

    @returns: str, timestamp for current instance, or None on failure
    """
    # This cmd gives the real filename of the latest aka current log file.
    cmd = ('if [ -f %(dir)s/latest.DEBUG ];'
           'then realpath %(dir)s/latest.DEBUG;'
           'elif [ -f %(dir)s/latest ];'
           'then realpath %(dir)s/latest;'
           'else exit %(code)d;'
           'fi' % {'dir': self.remote_log_dir,
                   'code': self.NO_SYMLINKS_CODE})
    res = self.run(cmd, stderr_tee=None, ignore_status=True)
    if res.exit_status == 0:
        fname = os.path.basename(res.stdout.strip())
        # From the fname, extract the timestamp using the TS_EXTRACTOR.
        ts_match = self.TS_EXTRACTOR.match(fname)
        if ts_match:
            return ts_match.group(self.TS_GROUP)
        logging.warning('Failed to extract timestamp from servod log file '
                        '%r. Skipping. The servo host is using outdated '
                        'servod logging and needs to be updated.', fname)
        return None
    if res.exit_status == self.NO_SYMLINKS_CODE:
        logging.warning('servod log latest symlinks not found. '
                        'This is likely due to an error starting up '
                        'servod. Ignoring..')
    else:
        logging.warning('Failed to find servod logs on servo host.')
        logging.warning(res.stderr.strip())
    return None
619
def get_instance_logs(self, instance_ts, outdir, old=False):
    """Collect all logs with |instance_ts| and dump into a dir in |outdir|

    This method first collects all logs on the servo_host side pertaining
    to this servod instance (port, instantiation). It glues them together
    into combined log.[level].txt files and extracts all available MCU
    console I/O from the logs into individual files e.g. servo_v4.txt

    All the output can be found in a directory inside |outdir| that
    this generates based on |LOG_DIR|, the servod port, and the instance
    timestamp on the servo_host side.

    If fetching the remote files raises AutoservRunError, a warning is
    logged (when the command exit status is non-zero) and the method
    returns without building the joint logs.

    @param instance_ts: log timestamp to grab logfiles for
    @param outdir: directory to create a subdirectory into to place the
                   servod logs into.
    @param old: bool, whether to append |OLD_LOG_SUFFIX| to output dir
    """
    # Create the local results log dir.
    log_dir = os.path.join(outdir, '%s_%s.%s' % (self.LOG_DIR,
                                                 str(self.servo_port),
                                                 instance_ts))
    if old:
        log_dir = '%s.%s' % (log_dir, self.OLD_LOG_SUFFIX)
    logging.info('Saving servod logs to %s.', log_dir)
    os.mkdir(log_dir)
    # Now, get all files with that timestamp.
    cmd = 'find %s -maxdepth 1 -name "log.%s*"' % (self.remote_log_dir,
                                                   instance_ts)
    res = self.run(cmd, stderr_tee=None, ignore_status=True)
    files = res.stdout.strip().split()
    try:
        self.get_file(files, log_dir, try_rsync=False)
    except error.AutoservRunError as e:
        result = e.result_obj
        if result.exit_status != 0:
            stderr = result.stderr.strip()
            logging.warning("Couldn't retrieve servod logs. Ignoring: %s",
                            stderr or '\n%s' % result)
        return
    local_files = [os.path.join(log_dir, f) for f in os.listdir(log_dir)]
    # TODO(crrev.com/c/1793030): remove no-level case once CL is pushed
    for level_name in ('DEBUG', 'INFO', 'WARNING', ''):
        # Create the joint files for each loglevel. i.e log.DEBUG
        joint_file = self.JOINT_LOG_PREFIX
        if level_name:
            joint_file = '%s.%s' % (self.JOINT_LOG_PREFIX, level_name)
        # This helps with some online tools to avoid complaints about an
        # unknown filetype.
        joint_file = joint_file + '.txt'
        joint_path = os.path.join(log_dir, joint_file)
        # Match the level against the file name only. Matching against
        # the full path would wrongly select every file whenever a
        # directory component of |outdir| happens to contain the level
        # name, and the rotation-number parsing below would then fail.
        files = [f for f in local_files
                 if level_name in os.path.basename(f)]
        if not files:
            # TODO(crrev.com/c/1793030): remove no-level case once CL
            # is pushed
            continue
        # Extract compressed logs if any.
        compressed, extracted = self._extract_compressed_logs(log_dir,
                                                              files)
        files = list(set(files) - set(compressed))
        files.extend(extracted)
        # Need to sort. As they all share the same timestamp, and
        # loglevel, the index itself is sufficient. The highest index
        # is the oldest file, therefore we need a descending sort.
        def sortkey(f, level=level_name):
            """Custom sortkey to sort based on rotation number int."""
            # |level| is bound at definition time so the key never
            # depends on the enclosing loop variable.
            if f.endswith(level):
                return 0
            return int(f.split('.')[-1])

        files.sort(reverse=True, key=sortkey)
        # Just rename the first file rather than building from scratch.
        os.rename(files[0], joint_path)
        with open(joint_path, 'a') as joint_f:
            for logfile in files[1:]:
                # Transfer the file to the joint file line by line.
                with open(logfile, 'r') as log_f:
                    for line in log_f:
                        joint_f.write(line)
                # File has been written over. Delete safely.
                os.remove(logfile)
        # Need to remove all files from |local_files| so we don't
        # analyze them again.
        local_files = list(set(local_files) - set(files) - set(compressed))
    # Lastly, extract MCU logs from the joint logs.
    self._extract_mcu_logs(log_dir)
705
Garry Wangc1288cf2019-12-17 14:58:00 -0800706
def _lock(self):
    """Lock the servohost by touching the lock file on it.

    The touch command is run with its exit status ignored, and the host
    is marked as locked afterwards regardless of the command's status.
    """
    logging.debug('Locking servohost %s by touching %s file',
                  self.hostname, self._lock_file)
    touch_cmd = 'touch %s' % self._lock_file
    self.run(touch_cmd, ignore_status=True)
    self._is_locked = True
Garry Wang79e9af62019-06-12 15:19:19 -0700714
715
def _unlock(self):
    """Unlock the servohost by removing the lock file from it.

    The rm command is run with its exit status ignored, and the host is
    marked as unlocked afterwards regardless of the command's status.
    """
    logging.debug('Unlocking servohost by removing %s file',
                  self._lock_file)
    remove_cmd = 'rm %s' % self._lock_file
    self.run(remove_cmd, ignore_status=True)
    self._is_locked = False
Garry Wang79e9af62019-06-12 15:19:19 -0700723
724
def close(self):
    """Close the associated servo and the host object.

    Does nothing (beyond a debug log) when the host was already closed.
    Otherwise closes the servo, grabs servod logs for non-localhost
    hosts that have a job, releases the lock if held, stops servod, and
    finally closes the underlying host and marks this object closed.
    """
    if self._closed:
        logging.debug('ServoHost is already closed.')
        return

    if self._servo:
        # In some cases when we run as lab-tools, the job object is None,
        # in which case there is no result directory to hand over.
        outdir = self.job.resultdir if self.job else None
        self._servo.close(outdir)

    if self.job and not self.is_localhost():
        # Grab all logs from this servod instance before stopping servod.
        # TODO(crbug.com/1011516): once enabled, remove the check against
        # localhost and instead check against log-rotation enablement.
        try:
            self.grab_logs(self.job.resultdir)
        except error.AutoservRunError as err:
            logging.info('Failed to grab servo logs due to: %s. '
                         'This error is forgiven.', str(err))

    if self._is_locked:
        # Remove the lock if the servohost has been locked.
        try:
            self._unlock()
        except error.AutoservSSHTimeout:
            logging.error('Unlock servohost failed due to ssh timeout.'
                          ' It may caused by servohost went down during'
                          ' the task.')

    # Always stop servod after a task to minimize the chance of a bad
    # servod process interfering with other servods
    # (see crbug.com/1028665).
    try:
        self.stop_servod()
    except error.AutoservRunError as err:
        logging.info("Failed to stop servod due to:\n%s\n"
                     "This error is forgiven.", str(err))

    super(ServoHost, self).close()
    # Mark closed.
    self._closed = True
Congbin Guoa1f9cba2018-07-03 11:36:59 -0700764
765
def get_servo_state(self):
    """Return the servo state recorded on this host.

    @return the value of `_servo_state`, or
            `servo_constants.SERVO_STATE_UNKNOWN` when `_servo_state`
            is None.
    """
    return (servo_constants.SERVO_STATE_UNKNOWN
            if self._servo_state is None else self._servo_state)
Otabek Kasimovcc9738e2020-02-14 16:17:15 -0800770
771
def make_servo_hostname(dut_hostname):
    """Given a DUT's hostname, return the hostname of its servo.

    The servo hostname is the DUT hostname with '-servo' appended to its
    first dot-separated component; any domain part is kept unchanged.

    @param dut_hostname: hostname of a DUT.

    @return hostname of the DUT's servo.

    """
    # Split off only the first label; the remainder (if any) is the
    # domain and is re-joined untouched.
    labels = dut_hostname.split('.', 1)
    labels[0] += '-servo'
    return '.'.join(labels)
783
784
def servo_host_is_up(servo_hostname):
    """Given a servo host name, return if it's up or not.

    @param servo_hostname: hostname of the servo host.

    @return True if at least one ping reply was received, False otherwise
    """
    # Technically, this duplicates the SSH ping done early in the servo
    # proxy initialization code.  However, this ping ends in a couple
    # seconds when it fails, rather than the 60 seconds it takes to decide
    # that an SSH ping has timed out.  Specifically, that timeout happens
    # when our servo DNS name resolves, but there is no host at that IP.
    logging.info('Pinging servo host at %s', servo_hostname)
    config = ping_runner.PingConfig(servo_hostname,
                                    count=3,
                                    ignore_result=True,
                                    ignore_status=True)
    ping_result = ping_runner.PingRunner().ping(config)
    return ping_result.received > 0
802
803
def _map_afe_board_to_servo_board(afe_board):
    """Map a board we get from the AFE to a servo appropriate value.

    Many boards are identical to other boards for servo's purposes.
    This function makes that mapping: an explicitly mapped board name is
    translated directly; otherwise the first matching known suffix is
    stripped from the name.

    @param afe_board string board name received from AFE.
    @return board we expect servo to have.

    """
    known_suffixes = ('-freon', '_freon', '_moblab', '-cheets')
    board_map = {'gizmo': 'panther'}

    if afe_board in board_map:
        servo_board = board_map[afe_board]
    else:
        servo_board = afe_board
        # Only the first suffix (in declaration order) that matches is
        # stripped.
        matching = [s for s in known_suffixes if afe_board.endswith(s)]
        if matching:
            servo_board = afe_board[0:-len(matching[0])]

    if servo_board != afe_board:
        logging.info('Mapping AFE board=%s to %s', afe_board, servo_board)
    return servo_board
827
828
def get_servo_args_for_host(dut_host):
    """Return servo data associated with a given DUT.

    The servo attributes are read from the DUT's host info store. The
    servo port, when present, is converted to an int; if it cannot be
    converted the servo host entry is dropped so that no servo is
    reported for the DUT. The servo board (derived from the DUT board)
    and model are added when the host info provides them.

    @param dut_host   Instance of `Host` on which to find the servo
                      attributes.
    @return `servo_args` dict with host and an optional port, or None
            when no (usable) servo host attribute is available.
    """
    info = dut_host.host_info_store.get()
    # items() is available on both Python 2 and Python 3 mappings,
    # whereas iteritems() only exists on Python 2.
    servo_args = {k: v for k, v in info.attributes.items()
                  if k in servo_constants.SERVO_ATTR_KEYS}

    if servo_constants.SERVO_PORT_ATTR in servo_args:
        try:
            servo_args[servo_constants.SERVO_PORT_ATTR] = int(
                servo_args[servo_constants.SERVO_PORT_ATTR])
        except (TypeError, ValueError):
            # TypeError covers values int() cannot handle at all (e.g.
            # None); ValueError covers non-numeric strings.
            logging.error('servo port is not an int: %s',
                          servo_args[servo_constants.SERVO_PORT_ATTR])
            # Reset servo_args because we don't want to use an invalid port.
            servo_args.pop(servo_constants.SERVO_HOST_ATTR, None)

    if info.board:
        servo_board = _map_afe_board_to_servo_board(info.board)
        servo_args[servo_constants.SERVO_BOARD_ATTR] = servo_board
    if info.model:
        servo_args[servo_constants.SERVO_MODEL_ATTR] = info.model
    return servo_args if servo_constants.SERVO_HOST_ATTR in servo_args else None
Richard Barnetteea3e4602016-06-10 12:36:41 -0700856
857
def _tweak_args_for_ssp_moblab(servo_args):
    """Redirect a loopback servo host to the SSP host container IP.

    When the servo host in |servo_args| is 'localhost' or '127.0.0.1',
    it is replaced in place with the `host_container_ip` value from the
    `SSP` section of the global config (None if that value is not set).

    @param servo_args: dict of servo arguments; modified in place.
    """
    host_key = servo_constants.SERVO_HOST_ATTR
    if servo_args[host_key] not in ('localhost', '127.0.0.1'):
        return
    servo_args[host_key] = _CONFIG.get_config_value(
            'SSP', 'host_container_ip', type=str, default=None)
863
864
def create_servo_host(dut, servo_args, try_lab_servo=False,
                      try_servo_repair=False, dut_host_info=None):
    """Create a ServoHost object for a given DUT, if appropriate.

    This function attempts to create and verify or repair a `ServoHost`
    object for a servo connected to the given `dut`, subject to various
    constraints imposed by the parameters:
      * When the `servo_args` parameter is not `None`, a servo
        host must be created, and must be checked with `repair()`.
      * Otherwise, if a servo exists in the lab and `try_lab_servo` is
        true:
          * If `try_servo_repair` is true, then create a servo host and
            check it with `repair()`.
          * Otherwise, if the servo responds to `ping` then create a
            servo host and check it with `verify()`.

    In cases where `servo_args` was not `None`, repair failure
    exceptions are passed back to the caller; otherwise, exceptions
    are logged and then discarded.  Note that this only happens in cases
    where we're called from a test (not special task) control file that
    has an explicit dependency on servo.  In that case, we require that
    repair not write to `status.log`, so as to avoid polluting test
    results.

    TODO(jrbarnette):  The special handling for servo in test control
    files is a thorn in my flesh; I dearly hope to see it cut out before
    my retirement.

    Parameters for a servo host consist of a host name, port number, and
    DUT board, and are determined from one of these sources, in order of
    priority:
      * Servo attributes from the `dut` parameter take precedence over
        all other sources of information.
      * If a DNS entry for the servo based on the DUT hostname exists in
        the CrOS lab network, that hostname is used with the default
        port and the DUT's board.
      * If no other options are found, the parameters will be taken
        from the `servo_args` dict passed in from the caller.

    @param dut              An instance of `Host` from which to take
                            servo parameters (if available).
    @param servo_args       A dictionary with servo parameters to use if
                            they can't be found from `dut`.  If this
                            argument is supplied, unrepaired exceptions
                            from `verify()` will be passed back to the
                            caller.
    @param try_lab_servo    If not true, servo host creation will be
                            skipped unless otherwise required by the
                            caller.
    @param try_servo_repair If true, check a servo host with
                            `repair()` instead of `verify()`.
    @param dut_host_info    Optional host info of the DUT.  When not
                            `None` it is handed to the new servo host
                            via `set_dut_host_info()`; any exception
                            raised while doing so is logged and ignored.

    @returns: A tuple `(servo_host, servo_state)`.  `servo_host` is a
              ServoHost object or None.  When no host is created,
              `servo_state` is one of the `servo_constants.SERVO_STATE_*`
              values explaining why, or None when no servo was found
              and none was required.  When a host is created,
              `servo_state` is the value of its `get_servo_state()`.

    """
    # A caller that passes servo_args explicitly depends on servo.
    servo_dependency = servo_args is not None
    if dut is not None and (try_lab_servo or servo_dependency):
        servo_args_override = get_servo_args_for_host(dut)
        if servo_args_override is not None:
            if utils.in_moblab_ssp():
                _tweak_args_for_ssp_moblab(servo_args_override)
            logging.debug(
                    'Overriding provided servo_args (%s) with arguments'
                    ' determined from the host (%s)',
                    servo_args,
                    servo_args_override,
            )
            servo_args = servo_args_override

    if servo_args is None:
        logging.debug('No servo_args provided, and failed to find overrides.')
        if try_lab_servo or servo_dependency:
            return None, servo_constants.SERVO_STATE_NOT_CONNECTED
        else:
            # For a regular test case which does not require the servo.
            return None, None

    servo_hostname = servo_args.get(servo_constants.SERVO_HOST_ATTR)
    servo_port = servo_args.get(servo_constants.SERVO_PORT_ATTR)
    if not _is_servo_host_information_exist(servo_hostname, servo_port):
        logging.debug(
            'Servo connection info missed hostname: %s , port: %s',
            servo_hostname, servo_port)
        return None, servo_constants.SERVO_STATE_NOT_CONNECTED
    if not is_servo_host_information_valid(servo_hostname, servo_port):
        logging.debug(
            'Servo connection info is incorrect hostname: %s , port: %s',
            servo_hostname, servo_port)
        return None, servo_constants.SERVO_STATE_WRONG_CONFIG
    # The ping check is only done when neither a servo dependency nor a
    # repair attempt was requested.
    if (not servo_dependency and not try_servo_repair and
            not servo_host_is_up(servo_hostname)):
        logging.debug('ServoHost is not up.')
        return None, servo_constants.SERVO_STATE_BROKEN

    newhost = ServoHost(**servo_args)
    try:
        newhost.restart_servod(quick_startup=True)
    except error.AutoservSSHTimeout:
        logging.warning("Restart servod failed due ssh connection "
                        "to servohost timed out. This error is forgiven"
                        " here, we will retry in servo repair process.")
    except error.AutoservRunError as e:
        logging.warning("Restart servod failed due to:\n%s\n"
                        "This error is forgiven here, we will retry"
                        " in servo repair process.", str(e))

    # TODO(gregorynisbet): Clean all of this up.
    logging.debug('create_servo_host: attempt to set info store on '
                  'servo host')
    try:
        if dut_host_info is None:
            logging.debug('create_servo_host: dut_host_info is '
                          'None, skipping')
        else:
            newhost.set_dut_host_info(dut_host_info)
            logging.debug('create_servo_host: successfully set info '
                          'store')
    except Exception:
        # Best effort only: failures here are logged and ignored.
        logging.error("create_servo_host: (%s)", traceback.format_exc())

    # Note that the logic of repair() includes everything done
    # by verify().  It's sufficient to call one or the other;
    # we don't need both.
    if servo_dependency:
        # Exceptions from repair() propagate to the caller here.
        newhost.repair(silent=True)
        return newhost, newhost.get_servo_state()

    if try_servo_repair:
        try:
            newhost.repair()
        except Exception:
            logging.exception('servo repair failed for %s', newhost.hostname)
    else:
        try:
            newhost.verify()
        except Exception:
            logging.exception('servo verify failed for %s', newhost.hostname)
    return newhost, newhost.get_servo_state()
Otabek Kasimov7267a7a2020-03-04 11:18:45 -08001003
1004
def _is_servo_host_information_exist(hostname, port):
    """Check that servo host connection info is present.

    @param hostname: servo host name; must not be None or blank.
    @param port: servo port; must not be None and must be convertible
                 to an int.

    @return True if both a hostname and an int-convertible port are
            given, False otherwise.
    """
    if hostname is None or not hostname.strip():
        return False
    if port is None:
        return False
    try:
        int(port)
    except (TypeError, ValueError):
        # ValueError: non-numeric string. TypeError: a type int() cannot
        # convert at all (e.g. a list); treat it as missing info rather
        # than crashing the caller.
        return False
    return True
1017
1018
def is_servo_host_information_valid(hostname, port):
    """Check that servo host connection info is present and well formed.

    @param hostname: servo host name; must be at least 5 characters long
                     and consist only of letters, digits, '-', '_' and
                     '.'.
    @param port: servo port; must be convertible to an int in the range
                 1..65000 inclusive.

    @return True if the hostname and port pass all checks, False
            otherwise.
    """
    if not _is_servo_host_information_exist(hostname, port):
        return False
    # Check that the port is within the accepted range.
    port_int = int(port)
    if port_int < 1 or port_int > 65000:
        return False
    # We expect the host to contain only letters, digits, '-', '_' and
    # '.'. A raw string avoids the invalid '\.' escape, and \Z (unlike $)
    # does not accept a trailing newline after the hostname.
    if not re.match(r'[a-zA-Z0-9_.-]*\Z', hostname) or len(hostname) < 5:
        return False
    return True