blob: 137e27e347a7a75b9905d02cafe9fbacf225ccc9 [file] [log] [blame]
Fang Deng5d518f42013-08-02 14:04:32 -07001# Copyright (c) 2013 The Chromium OS Authors. All rights reserved.
2# Use of this source code is governed by a BSD-style license that can be
3# found in the LICENSE file.
4#
5# Expects to be run in an environment with sudo and no interactive password
6# prompt, such as within the Chromium OS development chroot.
7
8
9"""This file provides core logic for servo verify/repair process."""
10
11
Fang Deng5d518f42013-08-02 14:04:32 -070012import logging
Raul E Rangel52ca2e82018-07-03 14:10:14 -060013import os
Ruben Rodriguez Buchillon93084d02020-01-21 15:17:36 -080014import re
15import tarfile
Garry Wangc1288cf2019-12-17 14:58:00 -080016import time
Gregory Nisbet265a52c2019-12-10 20:38:42 -080017import traceback
Dana Goyette4dc0adc2019-05-06 14:51:53 -070018import xmlrpclib
Fang Deng5d518f42013-08-02 14:04:32 -070019
20from autotest_lib.client.bin import utils
Garry Wang79e9af62019-06-12 15:19:19 -070021from autotest_lib.client.common_lib import error
Richard Barnette9a26ad62016-06-10 12:03:08 -070022from autotest_lib.client.common_lib import hosts
Garry Wang7b0e1b72020-03-25 19:08:59 -070023from autotest_lib.client.common_lib import lsbrelease_utils
Fang Deng5d518f42013-08-02 14:04:32 -070024from autotest_lib.client.common_lib.cros import retry
Christopher Wileycef1f902014-06-19 11:11:23 -070025from autotest_lib.client.common_lib.cros.network import ping_runner
Richard Barnette9a26ad62016-06-10 12:03:08 -070026from autotest_lib.server.cros.servo import servo
Richard Barnetted31580e2018-05-14 19:58:00 +000027from autotest_lib.server.hosts import servo_repair
Garry Wangebc015b2019-06-06 17:45:06 -070028from autotest_lib.server.hosts import base_servohost
Garry Wang11b5e872020-03-11 15:14:08 -070029from autotest_lib.server.hosts import servo_constants
Otabek Kasimov4ea636e2020-04-14 23:35:06 -070030from autotest_lib.server.cros.faft.utils import config
Garry Wang11b5e872020-03-11 15:14:08 -070031from autotest_lib.client.common_lib import global_config
Garry Wangd7367482020-02-27 13:52:40 -080032
Otabek Kasimov15963492020-06-23 21:10:51 -070033try:
34 from chromite.lib import metrics
35except ImportError:
36 metrics = utils.metrics_mock
37
Dan Shi3b2adf62015-09-02 17:46:54 -070038_CONFIG = global_config.global_config
Fang Deng5d518f42013-08-02 14:04:32 -070039
Otabek Kasimova7ba91a2020-03-09 08:31:01 -070040
Garry Wangebc015b2019-06-06 17:45:06 -070041class ServoHost(base_servohost.BaseServoHost):
42 """Host class for a servo host(e.g. beaglebone, labstation)
Dana Goyette0b6e6402019-10-04 11:09:24 -070043 that with a servo instance for a specific port.
44
45 @type _servo: servo.Servo | None
46 """
Fang Deng5d518f42013-08-02 14:04:32 -070047
Raul E Rangel52ca2e82018-07-03 14:10:14 -060048 DEFAULT_PORT = int(os.getenv('SERVOD_PORT', '9999'))
Richard Barnette9a26ad62016-06-10 12:03:08 -070049
Dan Shie5b3c512014-08-21 12:12:09 -070050 # Timeout for initializing servo signals.
Wai-Hong Tam37b6ed32017-09-19 15:52:39 -070051 INITIALIZE_SERVO_TIMEOUT_SECS = 60
Richard Barnette9a26ad62016-06-10 12:03:08 -070052
xixuan6cf6d2f2016-01-29 15:29:00 -080053 # Ready test function
54 SERVO_READY_METHOD = 'get_version'
Fang Deng5d518f42013-08-02 14:04:32 -070055
Ruben Rodriguez Buchillon93084d02020-01-21 15:17:36 -080056 # Directory prefix on the servo host where the servod logs are stored.
57 SERVOD_LOG_PREFIX = '/var/log/servod'
58
59 # Exit code to use when symlinks for servod logs are not found.
60 NO_SYMLINKS_CODE = 9
61
62 # Directory in the job's results directory to dump the logs into.
63 LOG_DIR = 'servod'
64
65 # Prefix for joint loglevel files in the logs.
66 JOINT_LOG_PREFIX = 'log'
67
68 # Regex group to extract timestamp from logfile name.
69 TS_GROUP = 'ts'
70
71 # This regex is used to extract the timestamp from servod logs.
72 # files always start with log.
73 TS_RE = (r'log.'
74 # The timestamp is of format %Y-%m-%d--%H-%M-%S.MS
75 r'(?P<%s>\d{4}(\-\d{2}){2}\-(-\d{2}){3}.\d{3})'
76 # The loglevel is optional depending on labstation version.
77 r'(.(INFO|DEBUG|WARNING))?' % TS_GROUP)
78 TS_EXTRACTOR = re.compile(TS_RE)
79
80 # Regex group to extract MCU name from logline in servod logs.
81 MCU_GROUP = 'mcu'
82
83 # Regex group to extract logline from MCU logline in servod logs.
84 LINE_GROUP = 'line'
85
86 # This regex is used to extract the mcu and the line content from an
87 # MCU logline in servod logs. e.g. EC or servo_v4 console logs.
88 # Here is an example log-line:
89 #
90 # 2020-01-23 13:15:12,223 - servo_v4 - EC3PO.Console - DEBUG -
91 # console.py:219:LogConsoleOutput - /dev/pts/9 - cc polarity: cc1
92 #
93 # Here is conceptually how they are formatted:
94 #
95 # <time> - <MCU> - EC3PO.Console - <LVL> - <file:line:func> - <pts> -
96 # <output>
97 #
98 # The log format starts with a timestamp
99 MCU_RE = (r'[\d\-]+ [\d:,]+ '
100 # The mcu that is logging this is next.
101 r'- (?P<%s>\w+) - '
102 # Next, we have more log outputs before the actual line.
103 # Information about the file line, logging function etc.
104 # Anchor on EC3PO Console, LogConsoleOutput and dev/pts.
105 # NOTE: if the log format changes, this regex needs to be
106 # adjusted.
107 r'EC3PO\.Console[\s\-\w\d:.]+LogConsoleOutput - /dev/pts/\d+ - '
108 # Lastly, we get the MCU's console line.
109 r'(?P<%s>.+$)' % (MCU_GROUP, LINE_GROUP))
110 MCU_EXTRACTOR = re.compile(MCU_RE)
111
112 # Suffix to identify compressed logfiles.
113 COMPRESSION_SUFFIX = '.tbz2'
114
Ruben Rodriguez Buchillon5bac3062020-03-25 21:32:58 -0700115 # A suffix to mark servod log directories that came from instance that
116 # ran during this servo_host, but are not the last one running e.g. when
117 # an instance (on purpose, or due to a bug) restarted in the middle of the
118 # run.
119 OLD_LOG_SUFFIX = 'old'
120
Otabek Kasimovc6f30412020-06-30 20:08:12 -0700121 # Mapping servo board with their vid-pid
122 SERVO_VID_PID = {
123 'servo_v4':'18d1:501b',
124 'ccd_cr50':'18d1:5014',
125 'servo_micro':'18d1:501a',
126 'servo_v3':['18d1:5004', '0403:6014'],
127 }
128
Otabek Kasimov15963492020-06-23 21:10:51 -0700129 # States of verifiers
130 # True - verifier run and passed
131 # False - verifier run and failed
132 # None - verifier did not run or dependency failed
133 VERIFY_SUCCESS = True
134 VERIFY_FAILED = False
135 VERIFY_NOT_RUN = None
136
Otabek Kasimovcc9738e2020-02-14 16:17:15 -0800137 def _init_attributes(self):
138 self._servo_state = None
139 self.servo_port = None
140 self.servo_board = None
141 self.servo_model = None
142 self.servo_serial = None
Garry Wang000c6c02020-05-11 21:27:23 -0700143 # The flag that indicate if a servo is connected to a smart usbhub.
144 # TODO(xianuowang@) remove this flag once all usbhubs in the lab
145 # get replaced.
146 self.smart_usbhub = None
Otabek Kasimovcc9738e2020-02-14 16:17:15 -0800147 self._servo = None
148 self._servod_server_proxy = None
Ruben Rodriguez Buchillon5bac3062020-03-25 21:32:58 -0700149 self._initial_instance_ts = None
Ruben Rodriguez Buchillon93084d02020-01-21 15:17:36 -0800150 # Flag to make sure that multiple calls to close do not result in the
151 # logic executing multiple times.
152 self._closed = False
Fang Deng5d518f42013-08-02 14:04:32 -0700153
Richard Barnette17bfc6c2016-08-04 18:41:43 -0700154 def _initialize(self, servo_host='localhost',
Richard Barnettee519dcd2016-08-15 17:37:17 -0700155 servo_port=DEFAULT_PORT, servo_board=None,
Nick Sanders2f3c9852018-10-24 12:10:24 -0700156 servo_model=None, servo_serial=None, is_in_lab=None,
157 *args, **dargs):
Fang Deng5d518f42013-08-02 14:04:32 -0700158 """Initialize a ServoHost instance.
159
160 A ServoHost instance represents a host that controls a servo.
161
162 @param servo_host: Name of the host where the servod process
163 is running.
Raul E Rangel52ca2e82018-07-03 14:10:14 -0600164 @param servo_port: Port the servod process is listening on. Defaults
165 to the SERVOD_PORT environment variable if set,
166 otherwise 9999.
Kevin Cheng5f2ba6c2016-09-28 10:20:05 -0700167 @param servo_board: Board that the servo is connected to.
Nick Sanders2f3c9852018-10-24 12:10:24 -0700168 @param servo_model: Model that the servo is connected to.
Dan Shi4d478522014-02-14 13:46:32 -0800169 @param is_in_lab: True if the servo host is in Cros Lab. Default is set
170 to None, for which utils.host_is_in_lab_zone will be
171 called to check if the servo host is in Cros lab.
Fang Deng5d518f42013-08-02 14:04:32 -0700172
173 """
174 super(ServoHost, self)._initialize(hostname=servo_host,
Garry Wangebc015b2019-06-06 17:45:06 -0700175 is_in_lab=is_in_lab, *args, **dargs)
Otabek Kasimovcc9738e2020-02-14 16:17:15 -0800176 self._init_attributes()
Richard Barnette42f4db92018-08-23 15:05:15 -0700177 self.servo_port = int(servo_port)
Richard Barnettee519dcd2016-08-15 17:37:17 -0700178 self.servo_board = servo_board
Nick Sanders2f3c9852018-10-24 12:10:24 -0700179 self.servo_model = servo_model
Kevin Cheng643ce8a2016-09-15 15:42:12 -0700180 self.servo_serial = servo_serial
Wai-Hong Tam3a8a2552019-11-19 14:28:04 +0800181
Ruben Rodriguez Buchillon93084d02020-01-21 15:17:36 -0800182 # The location of the log files on the servo host for this instance.
183 self.remote_log_dir = '%s_%s' % (self.SERVOD_LOG_PREFIX,
184 self.servo_port)
Garry Wang79e9af62019-06-12 15:19:19 -0700185 # Path of the servo host lock file.
186 self._lock_file = (self.TEMP_FILE_DIR + str(self.servo_port)
187 + self.LOCK_FILE_POSTFIX)
188 # File path to declare a reboot request.
189 self._reboot_file = (self.TEMP_FILE_DIR + str(self.servo_port)
190 + self.REBOOT_FILE_POSTFIX)
191
192 # Lock the servo host if it's an in-lab labstation to prevent other
193 # task to reboot it until current task completes. We also wait and
194 # make sure the labstation is up here, in the case of the labstation is
195 # in the middle of reboot.
Garry Wang7c00b0f2019-06-25 17:28:17 -0700196 self._is_locked = False
Garry Wang42b4d862019-06-25 15:50:49 -0700197 if (self.wait_up(self.REBOOT_TIMEOUT) and self.is_in_lab()
198 and self.is_labstation()):
Garry Wang79e9af62019-06-12 15:19:19 -0700199 self._lock()
Garry Wangebc015b2019-06-06 17:45:06 -0700200
Richard Barnette9a26ad62016-06-10 12:03:08 -0700201 self._repair_strategy = (
202 servo_repair.create_servo_repair_strategy())
Richard Barnettee519dcd2016-08-15 17:37:17 -0700203
Dana Goyetteafa62fd2020-03-16 13:45:27 -0700204 def __str__(self):
205 return "<%s '%s:%s'>" % (
206 type(self).__name__, self.hostname, self.servo_port)
207
Richard Barnette9a26ad62016-06-10 12:03:08 -0700208 def connect_servo(self):
Garry Wang8c8dc972020-06-09 13:41:51 -0700209 """ Initialize and setup servo for later use.
210 """
211 self.initilize_servo()
212 self.initialize_dut_for_servo()
213
214
215 def initilize_servo(self):
Kevin Cheng5f2ba6c2016-09-28 10:20:05 -0700216 """Establish a connection to the servod server on this host.
Richard Barnette9a26ad62016-06-10 12:03:08 -0700217
218 Initializes `self._servo` and then verifies that all network
219 connections are working. This will create an ssh tunnel if
220 it's required.
Garry Wang8c8dc972020-06-09 13:41:51 -0700221 """
222 self._servo = servo.Servo(servo_host=self,
223 servo_serial=self.servo_serial)
Richard Barnette9a26ad62016-06-10 12:03:08 -0700224
Garry Wang8c8dc972020-06-09 13:41:51 -0700225
226 def initialize_dut_for_servo(self):
227 """This method will do some setup for dut control, e.g. setup
228 main servo_v4 device, and also testing the connection between servo
229 and DUT. As a side effect of testing the connection, all signals on
230 the target servo are reset to default values, and the USB stick is
Richard Barnette9a26ad62016-06-10 12:03:08 -0700231 set to the neutral (off) position.
232 """
Garry Wang8c8dc972020-06-09 13:41:51 -0700233 if not self._servo:
234 raise hosts.AutoservVerifyError('Servo object needs to be'
235 ' initialized before initialize'
236 ' DUT.')
Richard Barnette9a26ad62016-06-10 12:03:08 -0700237 timeout, _ = retry.timeout(
Garry Wang8c8dc972020-06-09 13:41:51 -0700238 self._servo.initialize_dut,
239 timeout_sec=self.INITIALIZE_SERVO_TIMEOUT_SECS)
Richard Barnette9a26ad62016-06-10 12:03:08 -0700240 if timeout:
Garry Wang8c8dc972020-06-09 13:41:51 -0700241 raise hosts.AutoservVerifyError('Initialize dut for servo timed'
242 ' out.')
Richard Barnette9a26ad62016-06-10 12:03:08 -0700243
244
245 def disconnect_servo(self):
Kevin Cheng5f2ba6c2016-09-28 10:20:05 -0700246 """Disconnect our servo if it exists.
Richard Barnette9a26ad62016-06-10 12:03:08 -0700247
248 If we've previously successfully connected to our servo,
249 disconnect any established ssh tunnel, and set `self._servo`
250 back to `None`.
251 """
252 if self._servo:
253 # N.B. This call is safe even without a tunnel:
254 # rpc_server_tracker.disconnect() silently ignores
255 # unknown ports.
256 self.rpc_server_tracker.disconnect(self.servo_port)
257 self._servo = None
Fang Deng5d518f42013-08-02 14:04:32 -0700258
Garry Wangc1288cf2019-12-17 14:58:00 -0800259
Wai-Hong Tam3a8a2552019-11-19 14:28:04 +0800260 def _create_servod_server_proxy(self):
261 """Create a proxy that can be used to communicate with servod server.
Fang Deng5d518f42013-08-02 14:04:32 -0700262
263 @returns: An xmlrpclib.ServerProxy that is connected to the servod
264 server on the host.
Fang Deng5d518f42013-08-02 14:04:32 -0700265 """
Garry Wang11b5e872020-03-11 15:14:08 -0700266 if (servo_constants.ENABLE_SSH_TUNNEL_FOR_SERVO
267 and not self.is_localhost()):
Richard Barnette9a26ad62016-06-10 12:03:08 -0700268 return self.rpc_server_tracker.xmlrpc_connect(
269 None, self.servo_port,
270 ready_test_name=self.SERVO_READY_METHOD,
Allen Li2b1a8992018-11-27 14:17:18 -0800271 timeout_seconds=60,
Dana Goyetteafa62fd2020-03-16 13:45:27 -0700272 request_timeout_seconds=3600,
273 server_desc=str(self))
Richard Barnette9a26ad62016-06-10 12:03:08 -0700274 else:
275 remote = 'http://%s:%s' % (self.hostname, self.servo_port)
276 return xmlrpclib.ServerProxy(remote)
Fang Deng5d518f42013-08-02 14:04:32 -0700277
278
Wai-Hong Tam3a8a2552019-11-19 14:28:04 +0800279 def get_servod_server_proxy(self):
280 """Return a cached proxy if exists; otherwise, create a new one.
281
282 @returns: An xmlrpclib.ServerProxy that is connected to the servod
283 server on the host.
284 """
285 # Single-threaded execution, no race
286 if self._servod_server_proxy is None:
287 self._servod_server_proxy = self._create_servod_server_proxy()
288 return self._servod_server_proxy
289
290
Richard Barnette1edbb162016-11-01 11:47:50 -0700291 def verify(self, silent=False):
292 """Update the servo host and verify it's in a good state.
293
294 @param silent If true, suppress logging in `status.log`.
295 """
Richard Barnetteabbdc252018-07-26 16:57:42 -0700296 message = 'Beginning verify for servo host %s port %s serial %s'
297 message %= (self.hostname, self.servo_port, self.servo_serial)
298 self.record('INFO', None, None, message)
Richard Barnette9a26ad62016-06-10 12:03:08 -0700299 try:
Richard Barnette1edbb162016-11-01 11:47:50 -0700300 self._repair_strategy.verify(self, silent)
Garry Wang11b5e872020-03-11 15:14:08 -0700301 self._servo_state = servo_constants.SERVO_STATE_WORKING
302 self.record('INFO', None, None,
303 'ServoHost verify set servo_state as WORKING')
Garry Wang63b8c382020-03-11 22:28:40 -0700304 except Exception as e:
Otabek Kasimovc6f30412020-06-30 20:08:12 -0700305 if self.is_localhost():
306 self._servo_state = self.determine_servo_state()
307 self.record('INFO', None, None,
308 'ServoHost verify set servo_state as %s'
309 % self._servo_state)
Garry Wang63b8c382020-03-11 22:28:40 -0700310 if self._is_critical_error(e):
311 raise
Fang Deng5d518f42013-08-02 14:04:32 -0700312
313
Garry Wang7b0e1b72020-03-25 19:08:59 -0700314 def get_image_name_from_usbkey(self, usbkey_dev):
315 """Mount usb drive and check ChromeOS image name on it if there is
316 one. This method assumes the image_usbkey_direction is already set
317 to servo side.
318
319 @param: usbkey_dev usbkey dev path(e.g. /dev/sdb).
320
321 @returns: image_name on the usbkey, e.g. nami-release/R82.10138.0.0,
322 or empty string if no test image detected, or unexpected
323 error occurred.
Garry Wang7b0e1b72020-03-25 19:08:59 -0700324 """
Garry Wang70e5d062020-04-03 18:01:05 -0700325 logging.info('Checking ChromeOS image name on usbkey.')
Garry Wang7b0e1b72020-03-25 19:08:59 -0700326 usb_mount_path = '/media/servo_usb/%s' % self.servo_port
327 unmount_cmd = 'umount %s' % usb_mount_path
328 # ChromeOS root fs is in /dev/sdx3
329 mount_cmd = 'mount -o ro %s3 %s' % (usbkey_dev, usb_mount_path)
330 # Unmount if there is an existing stale mount.
331 self.run(unmount_cmd, ignore_status=True)
332 # Create if the mount point is not existing.
333 self.run('mkdir -p %s' % usb_mount_path)
334 try:
335 # Attempt to mount the usb drive.
336 mount_result = self.run(mount_cmd, ignore_status=True)
Garry Wang70e5d062020-04-03 18:01:05 -0700337 if mount_result.exit_status != 0:
338 logging.error('Unexpected error occurred on mount usb drive.')
Garry Wang7b0e1b72020-03-25 19:08:59 -0700339 return ''
Garry Wang70e5d062020-04-03 18:01:05 -0700340
341 release_content = self.run(
342 'cat %s/etc/lsb-release' % usb_mount_path,
343 ignore_status=True).stdout.strip()
344
345 if not re.search(r'RELEASE_TRACK=.*test', release_content):
346 logging.info('The image on usbkey is not a test image')
347 return ''
348
349 return lsbrelease_utils.get_chromeos_release_builder_path(
350 lsb_release_content=release_content)
Garry Wang7b0e1b72020-03-25 19:08:59 -0700351 finally:
Garry Wang70e5d062020-04-03 18:01:05 -0700352 logging.debug('Image check compeleted, unmounting the usb drive.')
Garry Wang7b0e1b72020-03-25 19:08:59 -0700353 self.run(unmount_cmd, ignore_status=True)
354
355
Garry Wang70e5d062020-04-03 18:01:05 -0700356 def _probe_and_validate_usb_dev(self):
357 """This method probe the usb dev path by talking to servo, and then
358 validate the dev path is valid block device to servohost.
359 Possible output:
360 1. Encounter error during probe usb dev, returns empty string.
361 2. probe usb dev completed without error but cannot find usb dev,
362 raise AutoservRepairError.
363 3. probe usb dev find a usb dev path, but failed validation in this
364 method, raise AutoservRepairError.
Garry Wang7b0e1b72020-03-25 19:08:59 -0700365
Garry Wang70e5d062020-04-03 18:01:05 -0700366 @returns: A string of usb dev path(e.g. '/dev/sdb'), or empty string
367 if unexpected error occurred during probe.
368 @raises: AutoservRepairError if servo couldn't probe the usb dev path
369 (servo.probe_host_usb_dev() returns empty string), or the dev path is
370 not valid block device to servohost.
Garry Wang7b0e1b72020-03-25 19:08:59 -0700371 """
372 logging.info('Validating image usbkey on servo.')
Garry Wang7b0e1b72020-03-25 19:08:59 -0700373 try:
Garry Wang70e5d062020-04-03 18:01:05 -0700374 usb_dev = self._servo.probe_host_usb_dev()
Garry Wang7b0e1b72020-03-25 19:08:59 -0700375 except Exception as e:
376 # We don't want any unexpected or transient servo communicating
377 # failure block usb repair, so capture all errors here.
378 logging.error(e, exc_info=True)
379 logging.error('Unexpected error occurred on get usbkey dev path,'
380 ' skipping usbkey validation.')
381 return ''
382
Garry Wang70e5d062020-04-03 18:01:05 -0700383 if usb_dev:
384 # probe_host_usb_dev() sometimes return stale record,
385 # so we need to make sure the path exists in fdisk.
386 validate_cmd = 'fdisk -l | grep %s' % usb_dev
Garry Wang11441182020-06-16 18:34:14 -0700387 try:
388 resp = self.run(validate_cmd, ignore_status=True, timeout=60)
389 if resp.exit_status == 0:
390 return usb_dev
Garry Wang70e5d062020-04-03 18:01:05 -0700391
Garry Wang11441182020-06-16 18:34:14 -0700392 logging.error('%s is reported from "image_usbkey_dev" control'
393 ' but not detected by fdisk!', usb_dev)
394 except error.AutoservRunError as e:
395 if 'Timeout encountered' in str(e):
396 logging.warning('Timeout encountered during fdisk run,'
397 ' skipping usbkey validation.')
398 return ''
399 raise
Garry Wang70e5d062020-04-03 18:01:05 -0700400
401 raise hosts.AutoservRepairError(
402 'No usbkey detected on servo, the usbkey may be either missing'
403 ' or broken. Please replace usbkey on the servo and retry.',
404 'missing usbkey')
405
406
Otabek Kasimov4ea636e2020-04-14 23:35:06 -0700407 def is_ec_supported(self):
Garry Wang9b8f2342020-04-17 16:34:09 -0700408 """Check if ec is supported on the servo_board"""
Otabek Kasimov4ea636e2020-04-14 23:35:06 -0700409 if self.servo_board:
410 try:
411 frm_config = config.Config(self.servo_board, self.servo_model)
412 return frm_config.chrome_ec
413 except Exception as e:
414 logging.error('Unexpected error when read from firmware'
415 ' configs; %s', str(e))
416 return False
417
Garry Wang70e5d062020-04-03 18:01:05 -0700418 def validate_image_usbkey(self):
419 """This method first validate if there is a recover usbkey on servo
420 that accessible to servohost, and second check if a ChromeOS image is
421 already on the usb drive and return the image_name so we can avoid
422 unnecessary download and flash to the recover usbkey on servo.
423
424 Please note that, there is special error handling logic here:
425 1. If unexpected error happens, we return empty string. So repair
426 actions will not get blocked.
427 2. If no working usbkey present on servo, but no errors, we'll raise
428 AutoservRepairError here.
429
430 @returns: image_name on the usbkey, e.g. nami-release/R82.10138.0.0,
431 or empty string if no test image detected, or unexpected
432 error occurred.
433 @raises: AutoservRepairError if the usbkey is not detected on servo.
434 """
435 usb_dev = self._probe_and_validate_usb_dev()
436 if usb_dev:
437 return self.get_image_name_from_usbkey(usb_dev)
438 else:
439 return ''
Garry Wang7b0e1b72020-03-25 19:08:59 -0700440
441
Richard Barnette1edbb162016-11-01 11:47:50 -0700442 def repair(self, silent=False):
443 """Attempt to repair servo host.
444
445 @param silent If true, suppress logging in `status.log`.
446 """
Richard Barnetteabbdc252018-07-26 16:57:42 -0700447 message = 'Beginning repair for servo host %s port %s serial %s'
448 message %= (self.hostname, self.servo_port, self.servo_serial)
449 self.record('INFO', None, None, message)
Richard Barnette9a26ad62016-06-10 12:03:08 -0700450 try:
Richard Barnette1edbb162016-11-01 11:47:50 -0700451 self._repair_strategy.repair(self, silent)
Garry Wang11b5e872020-03-11 15:14:08 -0700452 self._servo_state = servo_constants.SERVO_STATE_WORKING
453 self.record('INFO', None, None,
454 'ServoHost repair set servo_state as WORKING')
Garry Wang464ff1e2019-07-18 17:20:34 -0700455 # If target is a labstation then try to withdraw any existing
456 # reboot request created by this servo because it passed repair.
457 if self.is_labstation():
458 self.withdraw_reboot_request()
Garry Wang63b8c382020-03-11 22:28:40 -0700459 except Exception as e:
Otabek Kasimovc6f30412020-06-30 20:08:12 -0700460 if self.is_localhost():
461 self._servo_state = self.determine_servo_state()
462 self.record('INFO', None, None,
463 'ServoHost repair set servo_state as %s'
464 % self._servo_state)
Garry Wang63b8c382020-03-11 22:28:40 -0700465 if self._is_critical_error(e):
466 self.disconnect_servo()
467 self.stop_servod()
468 raise
469
470
471 def _is_critical_error(self, error):
472 if (isinstance(error, hosts.AutoservVerifyDependencyError)
473 and not error.is_critical()):
474 logging.warning('Non-critical verify failure(s) detected during'
475 ' verify/repair servo, servo connection will'
476 ' still up but may not fully functional.'
477 ' Some repair actions and servo depended'
478 ' tests may not run.')
479 return False
480 logging.info('Critical verify failure(s) detected during repair/verify'
481 ' servo. Disconnecting servo and stop servod, all repair '
482 'action and tests that depends on servo will not run.')
483 return True
Fang Deng5d518f42013-08-02 14:04:32 -0700484
485
Dan Shi4d478522014-02-14 13:46:32 -0800486 def get_servo(self):
487 """Get the cached servo.Servo object.
Fang Deng5d518f42013-08-02 14:04:32 -0700488
Dan Shi4d478522014-02-14 13:46:32 -0800489 @return: a servo.Servo object.
Dana Goyette353d1d92019-06-27 10:43:59 -0700490 @rtype: autotest_lib.server.cros.servo.servo.Servo
Fang Deng5d518f42013-08-02 14:04:32 -0700491 """
Dan Shi4d478522014-02-14 13:46:32 -0800492 return self._servo
493
494
Garry Wang79e9af62019-06-12 15:19:19 -0700495 def request_reboot(self):
496 """Request servohost to be rebooted when it's safe to by touch a file.
497 """
498 logging.debug('Request to reboot servohost %s has been created by '
Garry Wang464ff1e2019-07-18 17:20:34 -0700499 'servo with port # %s', self.hostname, self.servo_port)
Garry Wang79e9af62019-06-12 15:19:19 -0700500 self.run('touch %s' % self._reboot_file, ignore_status=True)
501
502
Garry Wang464ff1e2019-07-18 17:20:34 -0700503 def withdraw_reboot_request(self):
504 """Withdraw a servohost reboot request if exists by remove the flag
505 file.
506 """
507 logging.debug('Withdrawing request to reboot servohost %s that created'
508 ' by servo with port # %s if exists.',
509 self.hostname, self.servo_port)
510 self.run('rm -f %s' % self._reboot_file, ignore_status=True)
511
512
Garry Wangc1288cf2019-12-17 14:58:00 -0800513 def start_servod(self, quick_startup=False):
514 """Start the servod process on servohost.
515 """
Garry Wang2ac15ee2019-12-30 19:03:02 -0800516 # Skip if running on the localhost.(crbug.com/1038168)
517 if self.is_localhost():
518 logging.debug("Servohost is a localhost, skipping start servod.")
519 return
520
521 cmd = 'start servod'
Garry Wangc1288cf2019-12-17 14:58:00 -0800522 if self.servo_board:
Garry Wang2ac15ee2019-12-30 19:03:02 -0800523 cmd += ' BOARD=%s' % self.servo_board
Garry Wangc1288cf2019-12-17 14:58:00 -0800524 if self.servo_model:
525 cmd += ' MODEL=%s' % self.servo_model
Garry Wangc1288cf2019-12-17 14:58:00 -0800526 else:
Garry Wang2ac15ee2019-12-30 19:03:02 -0800527 logging.warning('Board for DUT is unknown; starting servod'
528 ' assuming a pre-configured board.')
529
530 cmd += ' PORT=%d' % self.servo_port
531 if self.servo_serial:
532 cmd += ' SERIAL=%s' % self.servo_serial
Garry Wangd7367482020-02-27 13:52:40 -0800533
534 # Start servod with dual_v4 if the DUT/servo from designated pools.
535 dut_host_info = self.get_dut_host_info()
536 if dut_host_info:
Garry Wang11b5e872020-03-11 15:14:08 -0700537 if bool(dut_host_info.pools &
538 servo_constants.POOLS_SUPPORT_DUAL_V4):
Garry Wangd7367482020-02-27 13:52:40 -0800539 logging.debug('The DUT is detected in following designated'
540 ' pools %s,starting servod with DUAL_V4 option.',
Garry Wang11b5e872020-03-11 15:14:08 -0700541 servo_constants.POOLS_SUPPORT_DUAL_V4)
Garry Wangd7367482020-02-27 13:52:40 -0800542 cmd += ' DUAL_V4=1'
543
Ruben Rodriguez Buchillon93084d02020-01-21 15:17:36 -0800544 # Remove the symbolic links from the logs. This helps ensure that
545 # a failed servod instantiation does not cause us to grab old logs
546 # by mistake.
547 self.remove_latest_log_symlinks()
Garry Wangcdd27b22020-01-13 14:59:11 -0800548 self.run(cmd, timeout=60)
Garry Wangc1288cf2019-12-17 14:58:00 -0800549
550 # There's a lag between when `start servod` completes and when
551 # the _ServodConnectionVerifier trigger can actually succeed.
552 # The call to time.sleep() below gives time to make sure that
553 # the trigger won't fail after we return.
554
555 # Normally servod on servo_v3 and labstation take ~10 seconds to ready,
556 # But in the rare case all servo on a labstation are in heavy use they
557 # may take ~30 seconds. So the timeout value will double these value,
558 # and we'll try quick start up when first time initialize servohost,
559 # and use standard start up timeout in repair.
560 if quick_startup:
Garry Wang11b5e872020-03-11 15:14:08 -0700561 timeout = servo_constants.SERVOD_QUICK_STARTUP_TIMEOUT
Garry Wangc1288cf2019-12-17 14:58:00 -0800562 else:
Garry Wang11b5e872020-03-11 15:14:08 -0700563 timeout = servo_constants.SERVOD_STARTUP_TIMEOUT
Garry Wangc1288cf2019-12-17 14:58:00 -0800564 logging.debug('Wait %s seconds for servod process fully up.', timeout)
565 time.sleep(timeout)
Ruben Rodriguez Buchillon5bac3062020-03-25 21:32:58 -0700566 # Cache the initial instance timestamp to check against servod restarts
567 self._initial_instance_ts = self.get_instance_logs_ts()
Garry Wangc1288cf2019-12-17 14:58:00 -0800568
569
570 def stop_servod(self):
571 """Stop the servod process on servohost.
572 """
Garry Wang2ac15ee2019-12-30 19:03:02 -0800573 # Skip if running on the localhost.(crbug.com/1038168)
574 if self.is_localhost():
575 logging.debug("Servohost is a localhost, skipping stop servod.")
576 return
577
Garry Wangc1288cf2019-12-17 14:58:00 -0800578 logging.debug('Stopping servod on port %s', self.servo_port)
Garry Wangcdd27b22020-01-13 14:59:11 -0800579 self.run('stop servod PORT=%d' % self.servo_port,
580 timeout=60, ignore_status=True)
Garry Wangc1288cf2019-12-17 14:58:00 -0800581 logging.debug('Wait %s seconds for servod process fully teardown.',
Garry Wang11b5e872020-03-11 15:14:08 -0700582 servo_constants.SERVOD_TEARDOWN_TIMEOUT)
583 time.sleep(servo_constants.SERVOD_TEARDOWN_TIMEOUT)
Garry Wangc1288cf2019-12-17 14:58:00 -0800584
585
586 def restart_servod(self, quick_startup=False):
587 """Restart the servod process on servohost.
588 """
589 self.stop_servod()
590 self.start_servod(quick_startup)
591
Garry Wang11b5e872020-03-11 15:14:08 -0700592
Garry Wangffbd2162020-04-17 16:13:48 -0700593 def _process_servodtool_error(self, response):
594 """Helper function to handle non-zero servodtool response.
595 """
596 if re.search(servo_constants.ERROR_MESSAGE_USB_HUB_NOT_COMPATIBLE,
Garry Wangad245002020-05-15 15:20:23 -0700597 response.stdout):
Garry Wangffbd2162020-04-17 16:13:48 -0700598 logging.error('The servo is not plugged on a usb hub that supports'
599 ' power-cycle!')
Garry Wang000c6c02020-05-11 21:27:23 -0700600 # change the flag so we can update this label in later process.
601 self.smart_usbhub = False
Garry Wangffbd2162020-04-17 16:13:48 -0700602 return
603
604 if re.search(servo_constants.ERROR_MESSAGE_DEVICE_NOT_FOUND %
605 self.servo_serial, response.stdout):
606 logging.error('No servo with serial %s found!', self.servo_serial)
607 return
608
609 logging.error('Unexpected error occurred from usbhub control, please'
610 ' file a bug and inform chrome-fleet-software@ team!')
611
612
613 def _get_servo_usb_devnum(self):
614 """Helper function to collect current usb devnum of servo.
615 """
Otabek Kasimov09192682020-06-01 18:17:44 -0700616 # TODO remove try-except when fix crbug.com/1087964
617 try:
618 cmd = 'servodtool device -s %s usb-path' % self.servo_serial
619 resp = self.run(cmd, ignore_status=True, timeout=30)
620 except Exception as e:
621 # Here we catch only timeout errors.
622 # Other errors is filtered by ignore_status=True
623 logging.debug('Attempt to get servo usb-path failed due to '
624 'timeout; %s', e)
625 return ''
626
Garry Wangffbd2162020-04-17 16:13:48 -0700627 if resp.exit_status != 0:
628 self._process_servodtool_error(resp)
629 return ''
630 usb_path = resp.stdout.strip()
631 logging.info('Usb path of servo %s is %s', self.servo_serial, usb_path)
632
633 resp = self.run('cat %s/devnum' % usb_path,
634 ignore_status=True)
635 if resp.exit_status != 0:
636 self._process_servodtool_error(resp)
637 return ''
638 return resp.stdout.strip()
639
640
def _reset_servo(self):
    """Power-cycle the servo through the smart usbhub.

    Runs `servodtool device -s <serial> power-cycle` on the servo host
    and, on success, sleeps for SERVO_RESET_TIMEOUT_SECONDS so the servo
    can come back before marking the host as having a smart usbhub.

    @returns: True if the power-cycle command succeeded, False if it
              exited non-zero or raised (e.g. timed out).
    """
    logging.info('Resetting servo through smart usbhub.')
    # TODO remove try-except when fix crbug.com/1087964
    try:
        power_cycle_cmd = ('servodtool device -s %s power-cycle'
                           % self.servo_serial)
        response = self.run(power_cycle_cmd, ignore_status=True,
                            timeout=30)
        if response.exit_status != 0:
            self._process_servodtool_error(response)
            return False
    except Exception as err:
        # Here we catch only timeout errors.
        # Other errors are filtered by ignore_status=True
        logging.debug('Attempt to reset servo failed due to timeout;'
                      ' %s', err)
        return False

    settle_seconds = servo_constants.SERVO_RESET_TIMEOUT_SECONDS
    logging.debug('Wait %s seconds for servo to come back from reset.',
                  settle_seconds)
    time.sleep(settle_seconds)
    # change the flag so we can update this label in later process.
    self.smart_usbhub = True
    return True
664
665
def reset_servo(self):
    """Reset (power-cycle) the servo via smart usbhub.

    Only applies to labstation hosts. The usb devnum of the servo is
    collected before and after the reset; the outcome is logged and
    recorded as an INFO entry through |self.record|.
    """
    if not self.is_labstation():
        logging.info('Servo reset is not applicable to servo_v3.')
        return

    devnum_before = self._get_servo_usb_devnum()
    logging.info('Servo usb devnum before reset: %s', devnum_before)
    if not self._reset_servo():
        message = ('Failed to reset servo with serial: %s. (Please ignore'
                   ' this error if the DUT is not connected to a smart'
                   ' usbhub).' % self.servo_serial)
        logging.warning(message)
        self.record('INFO', None, None, message)
        return

    devnum_after = self._get_servo_usb_devnum()
    logging.info('Servo usb devnum after reset: %s', devnum_after)
    if devnum_before and devnum_after:
        if devnum_before == devnum_after:
            message = ('Servo reset completed but devnum is still not'
                       ' changed!')
        else:
            message = ('Reset servo with serial %s completed successfully!'
                       % self.servo_serial)
    else:
        # At least one devnum lookup failed, so nothing can be compared.
        message = ('Servo reset completed but unable to verify'
                   ' devnum change!')
    logging.info(message)
    self.record('INFO', None, None, message)
696
697
def _extract_compressed_logs(self, logdir, relevant_files):
    """Decompress servod logs in |logdir|.

    @param logdir: directory containing compressed servod logs.
    @param relevant_files: list of files in |logdir| to consider.

    @returns: tuple, (tarfiles, files) where
              tarfiles: list of the compressed filenames that have been
                        processed and deleted
              files: list of the uncompressed files that were generated
    """
    # For all tar-files, first extract them to the directory, and
    # then let the common flow handle them.
    tarfiles = [cf for cf in relevant_files
                if cf.endswith(self.COMPRESSION_SUFFIX)]
    files = []
    for f in tarfiles:
        norm_name = os.path.basename(f)[:-len(self.COMPRESSION_SUFFIX)]
        with tarfile.open(f) as tf:
            # Each tarfile has only one member, as that's the
            # compressed log. next() is the public way to get it and
            # yields None (rather than raising) for an empty archive.
            member = tf.next()
            if member is None:
                logging.warning('Compressed servod log %r is empty. '
                                'Nothing to extract.', f)
            else:
                # Manipulate so that it only extracts the basename, and
                # not the directories etc.
                member.name = norm_name
                tf.extract(member, logdir)
                files.append(os.path.join(logdir, norm_name))
        # Archive has been dealt with: remove the compressed file.
        os.remove(f)
    return tarfiles, files
728
def _extract_mcu_logs(self, log_subdir):
    """Extract MCU (EC, Cr50, etc) console output from servod debug logs.

    Using the MCU_EXTRACTOR regex extract and split out MCU console
    lines from the logs to generate individual console logs e.g. after
    this method, you can find an ec.txt and servo_v4.txt in |log_subdir|
    if those MCUs had any console input/output.

    @param log_subdir: directory with log.DEBUG.txt main servod debug logs.
    """
    # Extract the MCU for each one. The MCU logs are only in the .DEBUG
    # files
    mcu_lines_file = os.path.join(log_subdir, 'log.DEBUG.txt')
    if not os.path.exists(mcu_lines_file):
        logging.info('No DEBUG logs found to extract MCU logs from.')
        return
    # Maps lower-cased MCU name -> open file object for '<mcu>.txt'.
    mcu_files = {}
    mcu_file_template = '%s.txt'
    try:
        with open(mcu_lines_file, 'r') as f:
            for line in f:
                match = self.MCU_EXTRACTOR.match(line)
                if not match:
                    continue
                mcu = match.group(self.MCU_GROUP).lower()
                if mcu not in mcu_files:
                    mcu_file = os.path.join(log_subdir,
                                            mcu_file_template % mcu)
                    mcu_files[mcu] = open(mcu_file, 'a')
                mcu_files[mcu].write(match.group(self.LINE_GROUP) + '\n')
    finally:
        # Close every per-MCU file even if reading or writing failed,
        # so no file handle is leaked.
        for fd in mcu_files.values():
            fd.close()
761
762
def remove_latest_log_symlinks(self):
    """Remove the convenience 'latest*' symlinks in the remote log dir.

    Failures of the `rm` command are ignored.
    """
    self.run('rm %s/latest*' % self.remote_log_dir,
             stderr_tee=None, ignore_status=True)
768
def probe_servod_restart(self, instance_ts, outdir):
    """Grab servod logs from previous instances if part of this session.

    If |instance_ts| differs from the timestamp recorded at servod
    startup, servod restarted in between. In that case the logs of
    every instance found between the two timestamps are collected and
    stored with the |OLD_LOG_SUFFIX|.

    Afterwards a panicinfo command is issued to the servo devices to try
    and collect reboot information for debugging.

    @param instance_ts: the log timestamp that the current instance uses
    @param outdir: directory to create a subdirectory into to place the
                   servod logs into.
    """
    first_ts = self._initial_instance_ts
    if first_ts is None:
        logging.info('No log timestamp grabbed successfully on servod '
                     'startup. Cannot check device restarts. Ignoring.')
        return
    if first_ts == instance_ts:
        logging.debug('Servod appears to have run without restarting')
        return

    # Servod seems to have restarted (at least once). Everything from
    # the first timestamp up to (excluding) the current one belongs to
    # an instance that is no longer running.
    stale_instances = self._find_instance_timestamps_between(first_ts,
                                                             instance_ts)
    logging.info('Servod has restarted %d times between the start and the '
                 'end of this servo_host.', len(stale_instances))
    logging.info('This might be an issue. Will extract all logs from each '
                 'instance.')
    logging.info('Logs that are not the currently running (about to turn '
                 'down) instance are maked with a .%s in their folder.',
                 self.OLD_LOG_SUFFIX)
    for stale_ts in stale_instances:
        self.get_instance_logs(stale_ts, outdir, old=True)

    # Lastly, servod has restarted due to a potential issue. Try to get
    # panic information from servo micro and servo v4 for the current
    # logs. This needs an initialized |_servo| attribute.
    if not self._servo:
        return
    for mcu in ['servo_micro', 'servo_v4']:
        uart_ctrl = '%s_uart_cmd' % mcu
        if not self._servo.has_control(uart_ctrl):
            continue
        logging.info('Trying to retrieve %r panicinfo into logs', mcu)
        try:
            self._servo.set_nocheck(uart_ctrl, 'panicinfo')
        except error.TestFail as e:
            logging.error('Failed to generate panicinfo for %r '
                          'logs. %s', mcu, str(e))
818
def _find_instance_timestamps_between(self, start_ts, end_ts):
    """Find all log timestamps in the range [start_ts, end_ts).

    @param start_ts: str, earliest log timestamp of interest
    @param end_ts: str, latest log timestamp of interest

    @returns: list, sorted timestamps from start_ts (inclusive) to
              end_ts (exclusive) found on the servo_host. An empty list
              on errors or if either boundary is unknown.
    """
    listing = self.run('ls %s' % self.remote_log_dir, stderr_tee=None,
                       ignore_status=True)
    if listing.exit_status != 0:
        # Here we failed to find anything.
        logging.info('Failed to find remote servod logs. Ignoring.')
        return []
    # Entries that fail the extractor (e.g. the 'latest' symlinks or
    # random files) are simply ignored; duplicates collapse in the set.
    matches = [self.TS_EXTRACTOR.match(entry)
               for entry in listing.stdout.strip().split()]
    known = sorted(set(m.group(self.TS_GROUP) for m in matches if m))
    for boundary in [start_ts, end_ts]:
        if boundary not in known:
            logging.error('Timestamp %r not in servod logs. Cannot query '
                          'for timestamps in between %r and %r', boundary,
                          start_ts, end_ts)
            return []
    first = known.index(start_ts)
    last = known.index(end_ts)
    return known[first:last]
853
def get_instance_logs_ts(self):
    """Retrieve the currently running servod instance's log timestamp.

    Resolves the 'latest.DEBUG' (or, failing that, 'latest') symlink in
    the remote log dir and extracts the timestamp from the name of the
    file it points to.

    @returns: str, timestamp for current instance, or None on failure
    """
    # The shell snippet prints the real filename of the latest aka
    # current log file, or exits with NO_SYMLINKS_CODE if neither
    # symlink exists.
    shell_parts = ['if [ -f %(dir)s/latest.DEBUG ]',
                   'then realpath %(dir)s/latest.DEBUG',
                   'elif [ -f %(dir)s/latest ]',
                   'then realpath %(dir)s/latest',
                   'else exit %(code)d',
                   'fi']
    cmd = ';'.join(shell_parts) % {'dir': self.remote_log_dir,
                                   'code': self.NO_SYMLINKS_CODE}
    res = self.run(cmd, stderr_tee=None, ignore_status=True)
    if res.exit_status == self.NO_SYMLINKS_CODE:
        logging.warning('servod log latest symlinks not found. '
                        'This is likely due to an error starting up '
                        'servod. Ignoring..')
        return None
    if res.exit_status != 0:
        logging.warning('Failed to find servod logs on servo host.')
        logging.warning(res.stderr.strip())
        return None
    fname = os.path.basename(res.stdout.strip())
    # From the fname, ought to extract the timestamp using the
    # TS_EXTRACTOR
    ts_match = self.TS_EXTRACTOR.match(fname)
    if ts_match:
        return ts_match.group(self.TS_GROUP)
    logging.warning('Failed to extract timestamp from servod log file '
                    '%r. Skipping. The servo host is using outdated '
                    'servod logging and needs to be updated.', fname)
    return None
887
def get_instance_logs(self, instance_ts, outdir, old=False):
    """Collect all logs with |instance_ts| and dump into a dir in |outdir|

    This method first collects all logs on the servo_host side pertaining
    to this servod instance (port, instantiation). It glues them together
    into combined log.[level].txt files and extracts all available MCU
    console I/O from the logs into individual files e.g. servo_v4.txt

    All the output can be found in a directory inside |outdir| that
    this generates based on |LOG_DIR|, the servod port, and the instance
    timestamp on the servo_host side.

    @param instance_ts: log timestamp to grab logfiles for
    @param outdir: directory to create a subdirectory into to place the
                   servod logs into.
    @param old: bool, whether to append |OLD_LOG_SUFFIX| to output dir
    """
    # Create the local results log dir.
    log_dir = os.path.join(outdir, '%s_%s.%s' % (self.LOG_DIR,
                                                 str(self.servo_port),
                                                 instance_ts))
    if old:
        log_dir = '%s.%s' % (log_dir, self.OLD_LOG_SUFFIX)
    logging.info('Saving servod logs to %r.', log_dir)
    os.mkdir(log_dir)
    # Now, get all files with that timestamp.
    cmd = 'find %s -maxdepth 1 -name "log.%s*"' % (self.remote_log_dir,
                                                   instance_ts)
    res = self.run(cmd, stderr_tee=None, ignore_status=True)
    files = res.stdout.strip().split()
    try:
        self.get_file(files, log_dir, try_rsync=False)
        if not os.listdir(log_dir):
            logging.info('No servod logs retrieved. Ignoring, and removing '
                         '%r again.', log_dir)
            os.rmdir(log_dir)
            return
    except error.AutoservRunError as e:
        result = e.result_obj
        if result.exit_status != 0:
            stderr = result.stderr.strip()
            logging.warning("Couldn't retrieve servod logs. Ignoring: %s",
                            stderr or '\n%s' % result)
        # Remove the log_dir as nothing was added to it.
        os.rmdir(log_dir)
        return
    local_files = [os.path.join(log_dir, f) for f in os.listdir(log_dir)]
    # TODO(crrev.com/c/1793030): remove no-level case once CL is pushed
    for level_name in ('DEBUG', 'INFO', 'WARNING', ''):
        # Create the joint files for each loglevel. i.e log.DEBUG
        joint_file = self.JOINT_LOG_PREFIX
        if level_name:
            joint_file = '%s.%s' % (self.JOINT_LOG_PREFIX, level_name)
        # This helps with some online tools to avoid complaints about an
        # unknown filetype.
        joint_file = joint_file + '.txt'
        joint_path = os.path.join(log_dir, joint_file)
        # Match the level against the file name only, so that a level
        # name occurring in the directory part cannot select a file.
        files = [f for f in local_files
                 if level_name in os.path.basename(f)]
        if not files:
            # TODO(crrev.com/c/1793030): remove no-level case once CL
            # is pushed
            continue
        # Extract compressed logs if any.
        compressed, extracted = self._extract_compressed_logs(log_dir,
                                                              files)
        files = list(set(files) - set(compressed))
        files.extend(extracted)
        # Need to sort. As they all share the same timestamp, and
        # loglevel, the index itself is sufficient. The highest index
        # is the oldest file, therefore we need a descending sort.
        def sortkey(f, level=level_name):
            """Custom sortkey to sort based on rotation number int."""
            # The live (un-rotated) log ends with its level name or,
            # for legacy logs without a level, with the timestamp.
            # (An empty level must not be passed to endswith(): every
            # string ends with '', which would rank all files as 0.)
            if f.endswith(level or instance_ts):
                return 0
            try:
                return int(f.split('.')[-1])
            except ValueError:
                # Not a rotation index; treat like the live log rather
                # than aborting the whole log collection.
                return 0

        files.sort(reverse=True, key=sortkey)
        # Just rename the first file rather than building from scratch.
        os.rename(files[0], joint_path)
        with open(joint_path, 'a') as joint_f:
            for logfile in files[1:]:
                # Transfer the file to the joint file line by line.
                with open(logfile, 'r') as log_f:
                    for line in log_f:
                        joint_f.write(line)
                # File has been written over. Delete safely.
                os.remove(logfile)
        # Need to remove all files from |local_files| so we don't
        # analyze them again.
        local_files = list(set(local_files) - set(files) - set(compressed))
    # Lastly, extract MCU logs from the joint logs.
    self._extract_mcu_logs(log_dir)
979
def _lock(self):
    """Lock the servohost by touching the lock file.

    The host is flagged as locked afterwards; the exit status of the
    `touch` command is ignored.
    """
    lock_path = self._lock_file
    logging.debug('Locking servohost %s by touching %s file',
                  self.hostname, lock_path)
    self.run('touch %s' % lock_path, ignore_status=True)
    self._is_locked = True
Garry Wang79e9af62019-06-12 15:19:19 -0700987
988
def _unlock(self):
    """Unlock the servohost by removing the lock file.

    The host is flagged as unlocked afterwards; the exit status of the
    `rm` command is ignored.
    """
    lock_path = self._lock_file
    logging.debug('Unlocking servohost by removing %s file', lock_path)
    self.run('rm %s' % lock_path, ignore_status=True)
    self._is_locked = False
Garry Wang79e9af62019-06-12 15:19:19 -0700996
997
def close(self):
    """Close the associated servo and the host object.

    In order: probes for servod restarts (collecting the logs of old
    instances), closes the servo, collects the logs of the current
    instance, unlocks the servohost if it was locked, stops servod and
    finally closes the underlying host. Does nothing if already closed.
    """
    # NOTE: throughout this method there are multiple attempts to catch
    # all errors. This is WAI as log grabbing should not fail tests.
    # However, the goal is to catch and handle/process all errors, thus
    # we print the traceback and ask for a bug.
    if self._closed:
        logging.debug('ServoHost is already closed.')
        return

    current_ts = self.get_instance_logs_ts()
    # TODO(crbug.com/1011516): once enabled, remove the check against
    # localhost and instead check against log-rotation enablement.
    can_collect_logs = (current_ts is not None and
                        self.job and
                        not self.is_localhost())

    if can_collect_logs:
        # Probe whether there was a servod restart, and grab those old
        # logs as well.
        try:
            self.probe_servod_restart(current_ts, self.job.resultdir)
        except (error.AutoservRunError, error.TestFail) as e:
            logging.info('Failed to grab servo logs due to: %s. '
                         'This error is forgiven.', str(e))
        except Exception as e:
            logging.error('Unexpected error probing for old logs. %s. '
                          'Forgiven. Please file a bug and fix or catch '
                          'in log probing function', str(e),
                          exc_info=True)

    if self._servo:
        # In some cases when we run as lab-tools, the job object is None.
        servo_outdir = self.job.resultdir if self.job else None
        self._servo.close(servo_outdir)

    if can_collect_logs:
        # Grab current (not old like above) logs after the servo instance
        # was closed out.
        try:
            self.get_instance_logs(current_ts, self.job.resultdir)
        except error.AutoservRunError as e:
            logging.info('Failed to grab servo logs due to: %s. '
                         'This error is forgiven.', str(e))
        except Exception as e:
            logging.error('Unexpected error grabbing servod logs. %s. '
                          'Forgiven. Please file a bug and fix or catch '
                          'in log grabbing function', str(e), exc_info=True)

    if self._is_locked:
        # Remove the lock if the servohost has been locked.
        try:
            self._unlock()
        except error.AutoservSSHTimeout:
            logging.error('Unlock servohost failed due to ssh timeout.'
                          ' It may caused by servohost went down during'
                          ' the task.')

    # We always want to stop servod after the task, to minimize the
    # impact of a bad servod process interfering with other servods.
    # (see crbug.com/1028665)
    try:
        self.stop_servod()
    except error.AutoservRunError as e:
        logging.info("Failed to stop servod due to:\n%s\n"
                     "This error is forgiven.", str(e))

    super(ServoHost, self).close()
    # Mark closed.
    self._closed = True
Congbin Guoa1f9cba2018-07-03 11:36:59 -07001063
1064
def get_servo_state(self):
    """Return the servo state currently stored on this host."""
    current_state = self._servo_state
    return current_state
Otabek Kasimovcc9738e2020-02-14 16:17:15 -08001067
def _get_host_metrics_data(self):
    """Build the fields dict attached to metrics of this host.

    @returns: dict with the servo 'port', the 'host' name and the servo
              'board' ('' when no board is set).
    """
    return dict(port=self.servo_port,
                host=self.hostname,
                board=self.servo_board or '')
1072
def _is_servo_device_connected(self, servo_type, serial):
    """Check if device is connected to the labstation.

    Works for all servo devices connected to the labstation.
    For servo_v3 please use 'self._is_servo_board_present_on_servo_v3'

    @param servo_type: The type of servo device. Expecting value can be
                       servo_v4 or servo_micro.
    @param serial: The serial number of the device to detect it.

    @returns: True if lsusb lists the device, False if it does not (or
              the VID/PID or serial is unknown), None if the check
              itself raised (e.g. timed out).
    """
    vid_pid = self.SERVO_VID_PID.get(servo_type)
    if not (vid_pid and serial):
        # device cannot be detected without VID/PID or serial number
        return False
    logging.debug('Started to detect %s', servo_type)
    try:
        lsusb_cmd = ('lsusb -v -d %s |grep iSerial |grep %s'
                     % (vid_pid, serial))
        result = self.run(lsusb_cmd, ignore_status=True, timeout=30)
        if result.exit_status != 0 or not result.stdout.strip():
            logging.debug('%s device is not detected; %s',
                          servo_type, result)
            return False
        logging.debug('The %s is plugged in to the host.', servo_type)
        return True
    except Exception as e:
        # can be triggered by a timeout while running the command
        metrics.Counter(
            'chromeos/autotest/repair/servo_detection/timeout'
            ).increment(fields=self._get_host_metrics_data())
        logging.error('%s device is not detected; %s', servo_type, str(e))
    return None
1103
def _is_servo_board_present_on_servo_v3(self):
    """Check if servo board is detected on servo_v3.

    Greps the `lsusb` output of the host for any of the VID/PIDs listed
    under 'servo_v3' in |SERVO_VID_PID|.

    @returns: True if a matching usb device is listed, False if not (or
              no VID/PID is known), None if the check itself raised
              (e.g. timed out).
    """
    vid_pids = self.SERVO_VID_PID['servo_v3']
    if not vid_pids:
        # device cannot be detected without VID/PID
        return False
    logging.debug('Started to detect servo board on servo_v3')
    not_detected = 'The servo board is not detected on servo_v3'
    try:
        # `\|` is grep's alternation operator. It is spelled as a raw
        # string because '\|' is not a valid Python escape sequence.
        cmd = 'lsusb | grep "%s"' % r'\|'.join(vid_pids)
        result = self.run(cmd, ignore_status=True, timeout=30)
        if result.exit_status == 0 and result.stdout.strip():
            logging.debug('The servo board is detected on servo_v3')
            return True
        logging.debug('%s; %s', not_detected, result)
        return False
    except Exception as e:
        # can be triggered by a timeout while running the command
        metrics.Counter(
            'chromeos/autotest/repair/servo_detection/timeout'
            ).increment(fields=self._get_host_metrics_data())
        logging.error('%s; %s', not_detected, str(e))
    return None
1127
def get_verify_state(self, tag):
    """Return the state of a servo verifier.

    @param tag: tag of the verifier to look up in the repair strategy.

    @returns: bool or None
    """
    strategy = self._repair_strategy
    return strategy.verifier_is_good(tag)
1134
def determine_servo_state(self):
    """Determine servo state based on the failed verifier.

    The verifiers are inspected in a fixed priority order and the state
    of the first failure found is reported.

    @returns: servo state value (one of the servo_constants.SERVO_STATE_*
              values); SERVO_STATE_BROKEN when no specific state matches.
    """
    # Query every verifier up front, in a fixed order.
    verifier_tags = ('servo_ssh', 'disk_space', 'servod_job',
                     'servod_connection', 'servod_control', 'pwr_button',
                     'lid_open', 'ec_board', 'ccd_testlab')
    verdicts = {}
    for tag in verifier_tags:
        verdicts[tag] = self.get_verify_state(tag)

    if not verdicts['servo_ssh']:
        return servo_constants.SERVO_STATE_NO_SSH

    if verdicts['servod_job'] == self.VERIFY_FAILED:
        # can be caused by the device not being connected to the servo
        # host. A detection result of None (check failed) must not be
        # reported as "not connected", hence the explicit comparison
        # against False.
        if self.is_labstation():
            if not self.servo_serial:
                return servo_constants.SERVO_STATE_WRONG_CONFIG
            connected = self._is_servo_device_connected('servo_v4',
                                                        self.servo_serial)
            if connected == False:
                return servo_constants.SERVO_STATE_NOT_CONNECTED
        elif self._is_servo_board_present_on_servo_v3() == False:
            return servo_constants.SERVO_STATE_NOT_CONNECTED
        return servo_constants.SERVO_STATE_SERVOD_ISSUE

    # Remaining verifiers, highest priority first. A failing ccd_testlab
    # is one of the reasons why servo can not be initialized, so it is
    # checked ahead of servod_control.
    failure_states = (
        ('ccd_testlab', servo_constants.SERVO_STATE_CCD_TESTLAB_ISSUE),
        ('servod_control', servo_constants.SERVO_STATE_SERVOD_ISSUE),
        ('pwr_button', servo_constants.SERVO_STATE_BAD_RIBBON_CABLE),
        ('lid_open', servo_constants.SERVO_STATE_LID_OPEN_FAILED),
        ('ec_board', servo_constants.SERVO_STATE_EC_BROKEN),
    )
    for tag, state in failure_states:
        if verdicts[tag] == self.VERIFY_FAILED:
            return state

    metrics.Counter(
        'chromeos/autotest/repair/unknown_servo_state'
        ).increment(fields=self._get_host_metrics_data())
    logging.info('We do not have special state for this failure yet :)')
    return servo_constants.SERVO_STATE_BROKEN
1187
Otabek Kasimovcc9738e2020-02-14 16:17:15 -08001188
def make_servo_hostname(dut_hostname):
    """Given a DUT's hostname, return the hostname of its servo.

    The servo hostname is the DUT hostname with '-servo' appended to its
    first dot-separated component.

    @param dut_hostname: hostname of a DUT.

    @return hostname of the DUT's servo.

    """
    short_name, dot, domain = dut_hostname.partition('.')
    return short_name + '-servo' + dot + domain
1200
1201
def servo_host_is_up(servo_hostname):
    """Given a servo host name, return if it's up or not.

    @param servo_hostname: hostname of the servo host.

    @return True if at least one ping reply was received, False otherwise
    """
    # Technically, this duplicates the SSH ping done early in the servo
    # proxy initialization code. However, this ping ends in a couple
    # seconds when it fails, rather than the 60 seconds it takes to decide
    # that an SSH ping has timed out. Specifically, that timeout happens
    # when our servo DNS name resolves, but there is no host at that IP.
    logging.info('Pinging servo host at %s', servo_hostname)
    ping_config = ping_runner.PingConfig(servo_hostname,
                                         count=3,
                                         ignore_result=True,
                                         ignore_status=True)
    ping_result = ping_runner.PingRunner().ping(ping_config)
    return ping_result.received > 0
1219
1220
def _map_afe_board_to_servo_board(afe_board):
    """Map a board we get from the AFE to a servo appropriate value.

    Many boards are identical to other boards for servo's purposes.
    This function makes that mapping: explicitly aliased boards are
    translated, otherwise the first matching known suffix is stripped.

    @param afe_board string board name received from AFE.
    @return board we expect servo to have.

    """
    board_aliases = {'gizmo': 'panther'}
    known_suffixes = ('-freon', '_freon', '_moblab', '-cheets')

    if afe_board in board_aliases:
        servo_board = board_aliases[afe_board]
    else:
        # Only the first suffix that matches is removed.
        suffix = next((s for s in known_suffixes if afe_board.endswith(s)),
                      None)
        if suffix is None:
            servo_board = afe_board
        else:
            servo_board = afe_board[:-len(suffix)]

    if servo_board != afe_board:
        logging.info('Mapping AFE board=%s to %s', afe_board, servo_board)
    return servo_board
1244
1245
def get_servo_args_for_host(dut_host):
    """Return servo data associated with a given DUT.

    The servo attributes are taken from the host info of |dut_host|; the
    board (mapped to its servo equivalent) and the model are added when
    the host info provides them.

    @param dut_host   Instance of `Host` on which to find the servo
                      attributes.
    @return `servo_args` dict with host and an optional port, or None if
            no servo host attribute is set or the servo port is not an
            int.
    """
    info = dut_host.host_info_store.get()
    # items() rather than iteritems(): the latter only exists on
    # Python 2 dicts, while items() works on both major versions.
    servo_args = {k: v for k, v in info.attributes.items()
                  if k in servo_constants.SERVO_ATTR_KEYS}

    if servo_constants.SERVO_PORT_ATTR in servo_args:
        try:
            servo_args[servo_constants.SERVO_PORT_ATTR] = int(
                servo_args[servo_constants.SERVO_PORT_ATTR])
        except ValueError:
            logging.error('servo port is not an int: %s',
                          servo_args[servo_constants.SERVO_PORT_ATTR])
            # Reset servo_args because we don't want to use an invalid
            # port. Dropping the host attribute makes the function
            # return None below.
            servo_args.pop(servo_constants.SERVO_HOST_ATTR, None)

    if info.board:
        servo_board = _map_afe_board_to_servo_board(info.board)
        servo_args[servo_constants.SERVO_BOARD_ATTR] = servo_board
    if info.model:
        servo_args[servo_constants.SERVO_MODEL_ATTR] = info.model
    return servo_args if servo_constants.SERVO_HOST_ATTR in servo_args else None
Richard Barnetteea3e4602016-06-10 12:36:41 -07001273
1274
def _tweak_args_for_ssp_moblab(servo_args):
    """Point a loopback servo host at the SSP host container address.

    When the servo host in |servo_args| is 'localhost' or '127.0.0.1',
    it is replaced in place with the 'host_container_ip' value of the
    'SSP' config section (None if that value is not configured).

    @param servo_args: dict of servo arguments; modified in place.
    """
    host_key = servo_constants.SERVO_HOST_ATTR
    if servo_args[host_key] not in ['localhost', '127.0.0.1']:
        return
    servo_args[host_key] = _CONFIG.get_config_value(
            'SSP', 'host_container_ip', type=str, default=None)
1280
1281
Dan Shi023aae32016-05-25 11:13:01 -07001282def create_servo_host(dut, servo_args, try_lab_servo=False,
Gregory Nisbetde13e2a2019-12-09 22:44:00 -08001283 try_servo_repair=False, dut_host_info=None):
Kevin Cheng5f2ba6c2016-09-28 10:20:05 -07001284 """Create a ServoHost object for a given DUT, if appropriate.
Dan Shi4d478522014-02-14 13:46:32 -08001285
Richard Barnette9a26ad62016-06-10 12:03:08 -07001286 This function attempts to create and verify or repair a `ServoHost`
1287 object for a servo connected to the given `dut`, subject to various
1288 constraints imposed by the parameters:
1289 * When the `servo_args` parameter is not `None`, a servo
1290 host must be created, and must be checked with `repair()`.
1291 * Otherwise, if a servo exists in the lab and `try_lab_servo` is
1292 true:
1293 * If `try_servo_repair` is true, then create a servo host and
1294 check it with `repair()`.
1295 * Otherwise, if the servo responds to `ping` then create a
1296 servo host and check it with `verify()`.
Fang Denge545abb2014-12-30 18:43:47 -08001297
Richard Barnette9a26ad62016-06-10 12:03:08 -07001298 In cases where `servo_args` was not `None`, repair failure
1299 exceptions are passed back to the caller; otherwise, exceptions
Richard Barnette07c2e1d2016-10-26 14:24:28 -07001300 are logged and then discarded. Note that this only happens in cases
1301 where we're called from a test (not special task) control file that
1302 has an explicit dependency on servo. In that case, we require that
1303 repair not write to `status.log`, so as to avoid polluting test
1304 results.
1305
1306 TODO(jrbarnette): The special handling for servo in test control
1307 files is a thorn in my flesh; I dearly hope to see it cut out before
1308 my retirement.
Richard Barnette9a26ad62016-06-10 12:03:08 -07001309
1310 Parameters for a servo host consist of a host name, port number, and
1311 DUT board, and are determined from one of these sources, in order of
1312 priority:
Richard Barnetteea3e4602016-06-10 12:36:41 -07001313 * Servo attributes from the `dut` parameter take precedence over
1314 all other sources of information.
1315 * If a DNS entry for the servo based on the DUT hostname exists in
1316 the CrOS lab network, that hostname is used with the default
Richard Barnette9a26ad62016-06-10 12:03:08 -07001317 port and the DUT's board.
Richard Barnetteea3e4602016-06-10 12:36:41 -07001318 * If no other options are found, the parameters will be taken
Richard Barnette9a26ad62016-06-10 12:03:08 -07001319 from the `servo_args` dict passed in from the caller.
Richard Barnetteea3e4602016-06-10 12:36:41 -07001320
1321 @param dut An instance of `Host` from which to take
1322 servo parameters (if available).
1323 @param servo_args A dictionary with servo parameters to use if
1324 they can't be found from `dut`. If this
1325 argument is supplied, unrepaired exceptions
1326 from `verify()` will be passed back to the
1327 caller.
1328 @param try_lab_servo If not true, servo host creation will be
1329 skipped unless otherwise required by the
1330 caller.
Richard Barnette9a26ad62016-06-10 12:03:08 -07001331 @param try_servo_repair If true, check a servo host with
1332 `repair()` instead of `verify()`.
Dan Shi4d478522014-02-14 13:46:32 -08001333
1334 @returns: A ServoHost object or None. See comments above.
1335
1336 """
Richard Barnette07c2e1d2016-10-26 14:24:28 -07001337 servo_dependency = servo_args is not None
Richard Barnette07c2e1d2016-10-26 14:24:28 -07001338 if dut is not None and (try_lab_servo or servo_dependency):
Prathmesh Prabhub4810232018-09-07 13:24:08 -07001339 servo_args_override = get_servo_args_for_host(dut)
Richard Barnetteea3e4602016-06-10 12:36:41 -07001340 if servo_args_override is not None:
Prathmesh Prabhuefb1b482018-08-28 17:15:05 -07001341 if utils.in_moblab_ssp():
1342 _tweak_args_for_ssp_moblab(servo_args_override)
Prathmesh Prabhu88bf6052018-08-28 16:21:26 -07001343 logging.debug(
1344 'Overriding provided servo_args (%s) with arguments'
1345 ' determined from the host (%s)',
1346 servo_args,
1347 servo_args_override,
1348 )
Richard Barnetteea3e4602016-06-10 12:36:41 -07001349 servo_args = servo_args_override
Prathmesh Prabhucba44292018-08-28 17:44:45 -07001350
Richard Barnetteea3e4602016-06-10 12:36:41 -07001351 if servo_args is None:
Prathmesh Prabhu88bf6052018-08-28 16:21:26 -07001352 logging.debug('No servo_args provided, and failed to find overrides.')
Otabek Kasimova7ba91a2020-03-09 08:31:01 -07001353 if try_lab_servo or servo_dependency:
Otabek Kasimov646812c2020-06-23 20:01:36 -07001354 return None, servo_constants.SERVO_STATE_MISSING_CONFIG
Otabek Kasimova7ba91a2020-03-09 08:31:01 -07001355 else:
1356 # For regular test case which not required the servo
1357 return None, None
1358
Garry Wang11b5e872020-03-11 15:14:08 -07001359 servo_hostname = servo_args.get(servo_constants.SERVO_HOST_ATTR)
1360 servo_port = servo_args.get(servo_constants.SERVO_PORT_ATTR)
Otabek Kasimova7ba91a2020-03-09 08:31:01 -07001361 if not _is_servo_host_information_exist(servo_hostname, servo_port):
1362 logging.debug(
1363 'Servo connection info missed hostname: %s , port: %s',
1364 servo_hostname, servo_port)
Otabek Kasimov646812c2020-06-23 20:01:36 -07001365 return None, servo_constants.SERVO_STATE_MISSING_CONFIG
Otabek Kasimova7ba91a2020-03-09 08:31:01 -07001366 if not is_servo_host_information_valid(servo_hostname, servo_port):
1367 logging.debug(
1368 'Servo connection info is incorrect hostname: %s , port: %s',
1369 servo_hostname, servo_port)
Garry Wang11b5e872020-03-11 15:14:08 -07001370 return None, servo_constants.SERVO_STATE_WRONG_CONFIG
Richard Barnette07c2e1d2016-10-26 14:24:28 -07001371 if (not servo_dependency and not try_servo_repair and
Otabek Kasimova7ba91a2020-03-09 08:31:01 -07001372 not servo_host_is_up(servo_hostname)):
Prathmesh Prabhu88bf6052018-08-28 16:21:26 -07001373 logging.debug('ServoHost is not up.')
Otabek Kasimov646812c2020-06-23 20:01:36 -07001374 return None, servo_constants.SERVO_STATE_NO_SSH
Prathmesh Prabhu88bf6052018-08-28 16:21:26 -07001375
Garry Wangebc015b2019-06-06 17:45:06 -07001376 newhost = ServoHost(**servo_args)
Garry Wangffbd2162020-04-17 16:13:48 -07001377
1378 # Reset servo if the servo is locked, as we check if the servohost is up,
1379 # if the servohost is labstation and if the servohost is in lab inside the
1380 # locking logic. Also check try_servo_repair to make sure we only do this
1381 # in AdminRepair tasks.
1382 if newhost._is_locked and try_servo_repair:
1383 newhost.reset_servo()
1384
Garry Wangcdd27b22020-01-13 14:59:11 -08001385 try:
1386 newhost.restart_servod(quick_startup=True)
1387 except error.AutoservSSHTimeout:
1388 logging.warning("Restart servod failed due ssh connection "
1389 "to servohost timed out. This error is forgiven"
1390 " here, we will retry in servo repair process.")
1391 except error.AutoservRunError as e:
1392 logging.warning("Restart servod failed due to:\n%s\n"
1393 "This error is forgiven here, we will retry"
1394 " in servo repair process.", str(e))
Garry Wangebc015b2019-06-06 17:45:06 -07001395
Gregory Nisbetde13e2a2019-12-09 22:44:00 -08001396 # TODO(gregorynisbet): Clean all of this up.
1397 logging.debug('create_servo_host: attempt to set info store on '
1398 'servo host')
1399 try:
1400 if dut_host_info is None:
1401 logging.debug('create_servo_host: dut_host_info is '
1402 'None, skipping')
1403 else:
1404 newhost.set_dut_host_info(dut_host_info)
1405 logging.debug('create_servo_host: successfully set info '
1406 'store')
1407 except Exception:
1408 logging.error("create_servo_host: (%s)", traceback.format_exc())
1409
Richard Barnette9a26ad62016-06-10 12:03:08 -07001410 # Note that the logic of repair() includes everything done
1411 # by verify(). It's sufficient to call one or the other;
1412 # we don't need both.
Richard Barnette07c2e1d2016-10-26 14:24:28 -07001413 if servo_dependency:
1414 newhost.repair(silent=True)
Otabek Kasimova7ba91a2020-03-09 08:31:01 -07001415 return newhost, newhost.get_servo_state()
Prathmesh Prabhu88bf6052018-08-28 16:21:26 -07001416
1417 if try_servo_repair:
1418 try:
1419 newhost.repair()
1420 except Exception:
1421 logging.exception('servo repair failed for %s', newhost.hostname)
Richard Barnette9a26ad62016-06-10 12:03:08 -07001422 else:
1423 try:
Prathmesh Prabhu88bf6052018-08-28 16:21:26 -07001424 newhost.verify()
Kevin Cheng5f2ba6c2016-09-28 10:20:05 -07001425 except Exception:
Prathmesh Prabhu88bf6052018-08-28 16:21:26 -07001426 logging.exception('servo verify failed for %s', newhost.hostname)
Otabek Kasimova7ba91a2020-03-09 08:31:01 -07001427 return newhost, newhost.get_servo_state()
Otabek Kasimov7267a7a2020-03-04 11:18:45 -08001428
1429
def _is_servo_host_information_exist(hostname, port):
    """Check if the servo hostname and port are both present.

    "Present" means the hostname is a non-blank string and the port is
    something `int()` can convert to an integer. No range or format
    checking is done here.

    @param hostname Hostname of the servohost; may be None.
    @param port     Servo port number, as an int or as a string holding
                    an integer; may be None.

    @returns: True if both values are present, False otherwise.
    """
    if hostname is None or not hostname.strip():
        return False
    if port is None:
        return False
    try:
        int(port)
    except (TypeError, ValueError, OverflowError):
        # ValueError: a string that is not an integer (e.g. 'abc').
        # TypeError: a type int() cannot convert at all (e.g. a list).
        # OverflowError: a float infinity.
        # In every case the port information is unusable, so report it
        # as missing rather than letting the exception escape.
        return False
    return True
1442
1443
def is_servo_host_information_valid(hostname, port):
    """Check if provided servo attributes are valid.

    The hostname and port must both be present (as judged by
    `_is_servo_host_information_exist()`), the port must be in the
    range 1..65000 inclusive, and the hostname must be at least 5
    characters long and consist only of letters, digits, '-', '_'
    and '.'.

    @param hostname Hostname of the servohost.
    @param port     servo port number.

    @returns: A bool value to indicate if provided servo attribute valid.
    """
    if not _is_servo_host_information_exist(hostname, port):
        return False
    # Check that the port falls inside the accepted range.
    port_int = int(port)
    if port_int < 1 or port_int > 65000:
        return False
    # The hostname may contain only letters, digits, '-', '_' and '.'.
    # The pattern is anchored with \Z rather than $ because $ also
    # matches just before a trailing newline, which would let a
    # hostname such as 'servo1\n' pass validation.
    if len(hostname) < 5 or not re.match(r'[a-zA-Z0-9_.-]*\Z', hostname):
        return False
    return True