blob: ce5d17d5691a6faeae8587f39ed0341f15c080fe [file] [log] [blame]
Derek Beckettf73baca2020-08-19 15:08:47 -07001# Lint as: python2, python3
Fang Deng5d518f42013-08-02 14:04:32 -07002# Copyright (c) 2013 The Chromium OS Authors. All rights reserved.
3# Use of this source code is governed by a BSD-style license that can be
4# found in the LICENSE file.
5#
6# Expects to be run in an environment with sudo and no interactive password
7# prompt, such as within the Chromium OS development chroot.
8
9
10"""This file provides core logic for servo verify/repair process."""
11
12
Derek Beckettf73baca2020-08-19 15:08:47 -070013from __future__ import absolute_import
14from __future__ import division
15from __future__ import print_function
16
Fang Deng5d518f42013-08-02 14:04:32 -070017import logging
Raul E Rangel52ca2e82018-07-03 14:10:14 -060018import os
Ruben Rodriguez Buchillon93084d02020-01-21 15:17:36 -080019import re
20import tarfile
Andrew McRaef0679932020-08-13 09:15:23 +100021import threading
Garry Wang2b5eef92020-08-21 16:23:35 -070022import json
Garry Wangc1288cf2019-12-17 14:58:00 -080023import time
Derek Beckettf73baca2020-08-19 15:08:47 -070024import six
25import six.moves.xmlrpc_client
Fang Deng5d518f42013-08-02 14:04:32 -070026
27from autotest_lib.client.bin import utils
Garry Wang79e9af62019-06-12 15:19:19 -070028from autotest_lib.client.common_lib import error
Richard Barnette9a26ad62016-06-10 12:03:08 -070029from autotest_lib.client.common_lib import hosts
Garry Wang7b0e1b72020-03-25 19:08:59 -070030from autotest_lib.client.common_lib import lsbrelease_utils
Fang Deng5d518f42013-08-02 14:04:32 -070031from autotest_lib.client.common_lib.cros import retry
Garry Wang970fda92021-06-22 18:03:43 -070032from autotest_lib.server import crashcollect
Richard Barnette9a26ad62016-06-10 12:03:08 -070033from autotest_lib.server.cros.servo import servo
Richard Barnetted31580e2018-05-14 19:58:00 +000034from autotest_lib.server.hosts import servo_repair
Garry Wangebc015b2019-06-06 17:45:06 -070035from autotest_lib.server.hosts import base_servohost
Garry Wang11b5e872020-03-11 15:14:08 -070036from autotest_lib.server.hosts import servo_constants
Otabek Kasimov4ea636e2020-04-14 23:35:06 -070037from autotest_lib.server.cros.faft.utils import config
Garry Wang11b5e872020-03-11 15:14:08 -070038from autotest_lib.client.common_lib import global_config
Otabek Kasimov382c3bb2020-10-28 13:22:45 -070039from autotest_lib.server.cros.servo.topology import servo_topology
Garry Wangd7367482020-02-27 13:52:40 -080040
Otabek Kasimov15963492020-06-23 21:10:51 -070041
Dan Shi3b2adf62015-09-02 17:46:54 -070042_CONFIG = global_config.global_config
Fang Deng5d518f42013-08-02 14:04:32 -070043
Otabek Kasimova7ba91a2020-03-09 08:31:01 -070044
Garry Wangebc015b2019-06-06 17:45:06 -070045class ServoHost(base_servohost.BaseServoHost):
46 """Host class for a servo host(e.g. beaglebone, labstation)
Dana Goyette0b6e6402019-10-04 11:09:24 -070047 that with a servo instance for a specific port.
48
49 @type _servo: servo.Servo | None
50 """
Fang Deng5d518f42013-08-02 14:04:32 -070051
# Port servod listens on when the caller does not pass one; taken from the
# SERVOD_PORT environment variable when set, otherwise 9999.
DEFAULT_PORT = int(os.getenv('SERVOD_PORT', '9999'))

# Timeout for initializing servo signals.
INITIALIZE_SERVO_TIMEOUT_SECS = 60

# Default timeout for run terminal command.
DEFAULT_TERMINAL_TIMEOUT = 30

# Ready test function
SERVO_READY_METHOD = 'get_version'

# Directory prefix on the servo host where the servod logs are stored.
SERVOD_LOG_PREFIX = '/var/log/servod'

# Exit code to use when symlinks for servod logs are not found.
NO_SYMLINKS_CODE = 9

# Directory in the job's results directory to dump the logs into.
LOG_DIR = 'servod'

# Prefix for joint loglevel files in the logs.
JOINT_LOG_PREFIX = 'log'

# Regex group to extract timestamp from logfile name.
TS_GROUP = 'ts'

# This regex is used to extract the timestamp from servod logs.
# files always start with log.
# Every '.' below is a literal separator in the file name, so each one is
# escaped; an unescaped '.' would also accept names such as 'logX2020-...'.
TS_RE = (r'log\.'
         # The timestamp is of format %Y-%m-%d--%H-%M-%S.MS
         r'(?P<%s>\d{4}(\-\d{2}){2}\-(-\d{2}){3}\.\d{3})'
         # The loglevel is optional depending on labstation version.
         r'(\.(INFO|DEBUG|WARNING))?' % TS_GROUP)
TS_EXTRACTOR = re.compile(TS_RE)

# Regex group to extract MCU name from logline in servod logs.
MCU_GROUP = 'mcu'

# Regex group to extract logline from MCU logline in servod logs.
LINE_GROUP = 'line'

# This regex is used to extract the mcu and the line content from an
# MCU logline in servod logs. e.g. EC or servo_v4 console logs.
# Here is an example log-line:
#
# 2020-01-23 13:15:12,223 - servo_v4 - EC3PO.Console - DEBUG -
# console.py:219:LogConsoleOutput - /dev/pts/9 - cc polarity: cc1
#
# Here is conceptually how they are formatted:
#
#  <time> - <MCU> - EC3PO.Console - <LVL> - <file:line:func> - <pts> -
#  <output>
#
# The log format starts with a timestamp
MCU_RE = (r'[\d\-]+ [\d:,]+ '
          # The mcu that is logging this is next.
          r'- (?P<%s>\w+) - '
          # Next, we have more log outputs before the actual line.
          # Information about the file line, logging function etc.
          # Anchor on EC3PO Console, LogConsoleOutput and dev/pts.
          # NOTE: if the log format changes, this regex needs to be
          # adjusted.
          r'EC3PO\.Console[\s\-\w\d:.]+LogConsoleOutput - /dev/pts/\d+ - '
          # Lastly, we get the MCU's console line.
          r'(?P<%s>.+$)' % (MCU_GROUP, LINE_GROUP))
MCU_EXTRACTOR = re.compile(MCU_RE)

# Regex to detect timeout messages when USBC pigtail has timeout issue.
# e.g.:  [475635.427072 PD TMOUT RX 1/1]
USBC_PIGTAIL_TIMEOUT_RE = r'\[[\d \.]{1,20}(PD TMOUT RX 1\/1)\]'

# Suffix to identify compressed logfiles.
COMPRESSION_SUFFIX = '.tbz2'

# A suffix to mark servod log directories that came from instance that
# ran during this servo_host, but are not the last one running e.g. when
# an instance (on purpose, or due to a bug) restarted in the middle of the
# run.
OLD_LOG_SUFFIX = 'old'
131
def _init_attributes(self):
    """Give every per-instance attribute its initial value.

    All servo settings and cached objects start out as None; the real
    values are assigned later by the code that uses them.
    """
    # Servo settings supplied by the caller of _initialize().
    self.servo_port = None
    self.servo_board = None
    self.servo_model = None
    self.servo_serial = None
    self.servo_setup = None
    self.servo_recovery = None
    self.servo_fw_channel = None
    self.additional_servod_args = None

    # The flag that indicate if a servo is connected to a smart usbhub.
    # TODO(xianuowang@) remove this flag once all usbhubs in the lab
    # get replaced.
    self.smart_usbhub = None

    # State and objects that are filled in while the host is in use.
    self._servo_state = None
    self._dut_health_profile = None
    self._servo = None
    self._topology = None
    self._initial_instance_ts = None

    # Shared tunnel proxy and the lock that guards its creation.
    self._tunnel_proxy = None
    self._tunnel_proxy_lock = threading.Lock()

    # Per-thread local data
    self._local = threading.local()

    # Flag to make sure that multiple calls to close do not result in the
    # logic executing multiple times.
    self._closed = False
Fang Deng5d518f42013-08-02 14:04:32 -0700157
def _initialize(self,
                servo_host='localhost',
                servo_port=DEFAULT_PORT,
                servo_board=None,
                servo_model=None,
                servo_serial=None,
                servo_setup=None,
                servo_recovery=None,
                servo_fw_channel=None,
                additional_servod_args=None,
                is_in_lab=None,
                *args,
                **dargs):
    """Set up a ServoHost, i.e. a host that controls a servo.

    @param servo_host: Name of the host where the servod process
                       is running.
    @param servo_port: Port the servod process is listening on. Defaults
                       to the SERVOD_PORT environment variable if set,
                       otherwise 9999. Converted with int().
    @param servo_board: Board that the servo is connected to.
    @param servo_model: Model that the servo is connected to.
    @param servo_serial: Serial number of the servo device.
    @param servo_setup: Type of servo setup, e.g. REGULAR or DUAL_V4.
    @param servo_recovery: Stored unchanged in self.servo_recovery.
    @param servo_fw_channel: Stored unchanged in self.servo_fw_channel.
    @param additional_servod_args: Additional args that will append to
                                   servod start command.
    @param is_in_lab: True if the servo host is in Cros Lab. Default is set
                      to None, for which utils.host_is_in_lab_zone will be
                      called to check if the servo host is in Cros lab.
    """
    super(ServoHost, self)._initialize(hostname=servo_host,
                                       is_in_lab=is_in_lab, *args, **dargs)

    # Reset everything first, then record what the caller passed in.
    self._init_attributes()
    self.servo_port = int(servo_port)
    self.servo_board = servo_board
    self.servo_model = servo_model
    self.servo_serial = servo_serial
    self.servo_setup = servo_setup
    self.servo_recovery = servo_recovery
    self.servo_fw_channel = servo_fw_channel
    self.additional_servod_args = additional_servod_args

    # The location of the log files on the servo host for this instance.
    self.remote_log_dir = '%s_%s' % (self.SERVOD_LOG_PREFIX,
                                     self.servo_port)

    port_str = str(self.servo_port)
    # Path of the servo host lock file.
    self._lock_file = self.TEMP_FILE_DIR + port_str + self.LOCK_FILE_POSTFIX
    # File path to declare a reboot request.
    self._reboot_file = (self.TEMP_FILE_DIR + port_str +
                         self.REBOOT_FILE_POSTFIX)

    # Lock the servo host if it's an in-lab labstation to prevent other
    # task to reboot it until current task completes. We also wait and
    # make sure the labstation is up here, in the case of the labstation is
    # in the middle of reboot.
    self._is_locked = False
    host_is_up = self.wait_up(self.REBOOT_TIMEOUT)
    if host_is_up and self.is_in_lab() and self.is_labstation():
        self._lock()
        try:
            self.wait_ready()
        except Exception as e:
            # Readiness problems are only logged; setup continues.
            logging.info(
                    'Unexpected error while ensure labstation'
                    ' readiness; %s', str(e))

    self._repair_strategy = servo_repair.create_servo_repair_strategy()
Richard Barnettee519dcd2016-08-15 17:37:17 -0700230
def __str__(self):
    """Return a short tag of the form <ClassName 'hostname:port'>."""
    class_name = type(self).__name__
    return "<%s '%s:%s'>" % (class_name, self.hostname, self.servo_port)
234
def connect_servo(self):
    """Bring the servo up for later use.

    Runs initialize_servo() first and initialize_dut_for_servo() second.
    """
    self.initialize_servo()
    self.initialize_dut_for_servo()
240
def initialize_servo(self):
    """Create the servo.Servo object for this host and cache it.

    The object is built from this host and its servo serial number and
    stored in `self._servo`.

    NOTE(review): any connection check or ssh tunnel creation would happen
    inside servo.Servo, which is not visible here - confirm.
    """
    servo_obj = servo.Servo(servo_host=self,
                            servo_serial=self.servo_serial)
    self._servo = servo_obj
Richard Barnette9a26ad62016-06-10 12:03:08 -0700250
def initialize_dut_for_servo(self):
    """Run the servo's DUT initialization under a time limit.

    Calls `self._servo.initialize_dut` through retry.timeout with a limit
    of INITIALIZE_SERVO_TIMEOUT_SECS seconds. Per the original notes, this
    sets up the main servo_v4 device and tests the servo/DUT connection,
    which resets all servo signals to their defaults and puts the USB
    stick in the neutral (off) position.

    @raises AutoservVerifyError: if no servo object has been created yet,
                                 or if the initialization timed out.
    """
    if not self._servo:
        raise hosts.AutoservVerifyError('Servo object needs to be'
                                        ' initialized before initialize'
                                        ' DUT.')

    # Only the timed-out flag matters; the call's own result is dropped.
    timed_out, _ = retry.timeout(
            self._servo.initialize_dut,
            timeout_sec=self.INITIALIZE_SERVO_TIMEOUT_SECS)
    if timed_out:
        raise hosts.AutoservVerifyError('Initialize dut for servo timed'
                                        ' out.')
Richard Barnette9a26ad62016-06-10 12:03:08 -0700268
def disconnect_servo(self):
    """Drop the servo object, if there is one.

    When `self._servo` is set, asks the rpc server tracker to disconnect
    this host's servo port and then resets `self._servo` to `None`.
    Does nothing when no servo object exists.
    """
    if not self._servo:
        return

    # N.B. This call is safe even without a tunnel:
    # rpc_server_tracker.disconnect() silently ignores
    # unknown ports.
    self.rpc_server_tracker.disconnect(self.servo_port)
    self._servo = None
Fang Deng5d518f42013-08-02 14:04:32 -0700282
def _maybe_create_servod_ssh_tunnel_proxy(self):
    """Create the shared xmlrpc proxy for ssh tunnel use, at most once.

    The check and the creation both happen while holding
    `self._tunnel_proxy_lock`; an existing proxy is left untouched.
    """
    with self._tunnel_proxy_lock:
        if self._tunnel_proxy is not None:
            return
        tracker = self.rpc_server_tracker
        self._tunnel_proxy = tracker.xmlrpc_connect(
                None,
                self.servo_port,
                ready_test_name=self.SERVO_READY_METHOD,
                timeout_seconds=60,
                request_timeout_seconds=3600,
                server_desc=str(self))
296
def get_servod_server_proxy(self):
    """Return a proxy for the servod server, creating one when needed.

    When ssh tunnelling is enabled and the host is not localhost, a single
    tunnel based proxy is shared. Otherwise each thread gets its own
    ServerProxy that talks http directly to hostname:servo_port.

    @returns: An xmlrpclib.ServerProxy that is connected to the servod
              server on the host.
    """
    use_tunnel = (servo_constants.ENABLE_SSH_TUNNEL_FOR_SERVO
                  and not self.is_localhost())
    if use_tunnel:
        # Check for existing ssh tunnel proxy.
        if self._tunnel_proxy is None:
            self._maybe_create_servod_ssh_tunnel_proxy()
        return self._tunnel_proxy

    # xmlrpc/httplib is not thread-safe, so each thread must have its
    # own separate proxy connection.
    if not hasattr(self._local, "_per_thread_proxy"):
        remote = 'http://%s:%s' % (self.hostname, self.servo_port)
        proxy = six.moves.xmlrpc_client.ServerProxy(remote)
        self._local._per_thread_proxy = proxy
    return self._local._per_thread_proxy
Wai-Hong Tam3a8a2552019-11-19 14:28:04 +0800318
def verify(self, silent=False):
    """Update the servo host and verify it's in a good state.

    On success the servo state becomes SERVO_STATE_WORKING. On failure the
    state is re-determined (unless the host is localhost) and the
    exception is re-raised only when _is_critical_error() says so.

    @param silent   If true, suppress logging in `status.log`.
    """
    start_msg = ('Beginning verify for servo host %s port %s serial %s'
                 % (self.hostname, self.servo_port, self.servo_serial))
    self.record('INFO', None, None, start_msg)
    try:
        self._repair_strategy.verify(self, silent)
        self._servo_state = servo_constants.SERVO_STATE_WORKING
        self.record('INFO', None, None,
                    'ServoHost verify set servo_state as WORKING')
    except Exception as e:
        is_remote = not self.is_localhost()
        if is_remote:
            self._servo_state = self.determine_servo_state()
            self.record('INFO', None, None,
                        'ServoHost verify set servo_state as %s'
                        % self._servo_state)
        # Non-critical failures are swallowed on purpose.
        if self._is_critical_error(e):
            raise
Fang Deng5d518f42013-08-02 14:04:32 -0700340
def _get_default_usbkey_mount_path(self):
    """Return the usbkey mount point, which is keyed by the servo port."""
    mount_path = '/media/servo_usb/%s' % self.servo_port
    return mount_path
Fang Deng5d518f42013-08-02 14:04:32 -0700343
def get_image_name_from_usbkey(self, usbkey_dev):
    """Mount the usb drive and read the name of the ChromeOS image on it.

    This method assumes the image_usbkey_direction is already set to servo
    side. The drive is always unmounted again before returning.

    @param usbkey_dev: usbkey dev path(e.g. /dev/sdb).

    @returns: image_name on the usbkey, e.g. nami-release/R82.10138.0.0,
              or empty string if no test image detected, or unexpected
              error occurred.
    """
    logging.info('Checking ChromeOS image name on usbkey.')
    mount_point = self._get_default_usbkey_mount_path()
    # Unmount if there is an existing stale mount.
    self._unmount_drive(mount_point)
    # ChromeOS root fs is in /dev/sdx3
    rootfs_partition = usbkey_dev + '3'
    try:
        mounted = self._mount_drive(rootfs_partition, mount_point)
        if not mounted:
            logging.debug('Unexpected error occurred on mount usb drive.')
            return ''

        cat_result = self.run('cat %s/etc/lsb-release' % mount_point,
                              ignore_status=True)
        lsb_release = cat_result.stdout.strip()

        # Only test images are of interest.
        if re.search(r'RELEASE_TRACK=.*test', lsb_release):
            return lsbrelease_utils.get_chromeos_release_builder_path(
                    lsb_release_content=lsb_release)

        logging.info('The image on usbkey is not a test image')
        return ''
    finally:
        logging.debug('Image check compeleted, unmounting the usb drive.')
        self._unmount_drive(mount_point)
Garry Wang7b0e1b72020-03-25 19:08:59 -0700379
def _extract_firmware_image_from_usbkey(self, fw_dst):
    """Extract firmware images from the usbkey on servo.

    This method assumes there is already a ChromeOS test image staged on
    servo. The image's root partition is mounted, the
    chromeos-firmwareupdate tool on it is run to unpack the firmware into
    `fw_dst`, and the drive is unmounted again in every case.

    @param fw_dst: the path that we'll copy firmware images to.

    @returns: a json format string of firmware manifest data.
    @raises: AutoservRepairError if the usbkey dev path could not be
             probed or the usbkey could not be mounted.
    """
    usbkey_dev = self._probe_and_validate_usb_dev()
    if not usbkey_dev:
        # Pass a tag like every other AutoservRepairError raised in this
        # file; the one-argument form did not match those call sites.
        raise hosts.AutoservRepairError(
                'Unexpected error occurred when'
                ' probe usbkey dev path, please check logs for detail.',
                'failed to probe usbkey')

    mount_dst = self._get_default_usbkey_mount_path()
    # Unmount if there is an existing stale mount.
    self._unmount_drive(mount_dst)
    # ChromeOS root fs is in /dev/sdx3
    mount_src = usbkey_dev + '3'
    try:
        if not self._mount_drive(mount_src, mount_dst):
            raise hosts.AutoservRepairError('Failed to extract firmware'
                    ' image; Unable to mount %s.' % usbkey_dev,
                    'unable to mount usbkey')
        updater_bin = os.path.join(mount_dst,
                                   'usr/sbin/chromeos-firmwareupdate')
        self.run('%s --unpack %s' % (updater_bin, fw_dst))
        return self.run('%s --manifest' % updater_bin).stdout
    finally:
        self._unmount_drive(mount_dst)
409
def prepare_repair_firmware_image(self, fw_dst=None):
    """Stage firmware images on the servohost for auto repair to consume.

    The destination directory is wiped and re-created, the firmware is
    extracted from the usbkey into it, and the image paths for the DUT's
    model are looked up in the extracted manifest.

    @param fw_dst: the path that we want to store firmware image on
                   the servohost. Defaults to a per-port directory under
                   /tmp/firmware_image.

    @returns: A tuple that containes ec firmware image path and bios
              firmware image path on the servohost, or None if type of
              image is not available based on manifest and dut's model.
    @raises: AutoservRepairError if the model is unknown, the manifest has
             no entry for the model, or neither image is listed.
    """
    model = self.servo_model or self._dut_host_info.model
    if not model:
        raise hosts.AutoservRepairError(
                'Could not determine DUT\'s model.',
                'model infomation unknown')

    fw_dst = fw_dst or '/tmp/firmware_image/%s' % self.servo_port
    # Cleanup and re-create dst path to have a fresh start.
    for shell_cmd in ('rm -rf %s', 'mkdir -p %s'):
        self.run(shell_cmd % fw_dst)

    manifest_json = self._extract_firmware_image_from_usbkey(fw_dst)
    manifest = json.loads(manifest_json)
    # For models that have packed $MODEL_signed variant, we want use the
    # 'signed' variant once we get DVT devices, so try to read manifest
    # from $MODEL_signed first.
    signed_key = '%s_signed' % model
    build = manifest.get(signed_key) or manifest.get(model)
    if not build:
        raise hosts.AutoservRepairError('Could not find firmware manifest'
                ' for model:%s' % model, 'model manifest not found')

    def _image_path(component):
        """Return the image path for one manifest section, or None."""
        try:
            return os.path.join(fw_dst, build[component]['image'])
        except KeyError:
            return None

    ec_image = _image_path('ec')
    bios_image = _image_path('host')
    if not (ec_image or bios_image):
        raise hosts.AutoservRepairError('Could not find any firmware image'
                ' for model:%s' % model, 'cannot find firmware image')
    return ec_image, bios_image
Garry Wang7b0e1b72020-03-25 19:08:59 -0700453
def flash_ap_firmware_via_servo(self, image):
    """Flash AP firmware from the given image with `futility update`.

    This is a short term enhancement for infra repair use. Per the
    original notes, 'futility update' determines the parameters needed
    for flashrom by itself and preserves the GBB, VPD, and HWID during
    the AP firmware update.
    @TODO(xianuowang@) Remove this method once b/148403277 implemented.

    @param image: the firmware image path on servohost.
    """
    flash_cmd = ('futility update -i %s --servo_port=%s'
                 % (image, self.servo_port))
    self.run(flash_cmd, timeout=900)
467
def _probe_and_validate_usb_dev(self):
    """Ask servo for the usbkey dev path and check it on the servohost.

    Possible outcomes:
    1. The probe itself fails, or fdisk times out: an empty string is
       returned so that repair is not blocked.
    2. The probe works but reports no usb dev: AutoservRepairError.
    3. The probe reports a path that fdisk on the servohost rejects:
       AutoservRepairError.

    @returns: A string of usb dev path(e.g. '/dev/sdb'), or empty string
              if unexpected error occurred during probe.
    @raises: AutoservRepairError if servo couldn't probe the usb dev path
             (servo.probe_host_usb_dev() returns empty string), or the dev
             path is not valid block device to servohost.
    """
    logging.info('Validating image usbkey on servo.')
    try:
        dev_path = self._servo.probe_host_usb_dev()
    except Exception as e:
        # We don't want any unexpected or transient servo communicating
        # failure block usb repair, so capture all errors here.
        logging.error(e, exc_info=True)
        logging.error('Unexpected error occurred on get usbkey dev path,'
                      ' skipping usbkey validation.')
        return ''

    if dev_path:
        # probe_host_usb_dev() sometimes return stale record,
        # so we need to make sure the path exists in fdisk.
        fdisk_cmd = 'fdisk -l %s' % dev_path
        try:
            fdisk_result = self.run(fdisk_cmd, ignore_status=True,
                                    timeout=30)
            if fdisk_result.exit_status != 0:
                logging.error('%s is reported from "image_usbkey_dev" control'
                              ' but not detected by fdisk!', dev_path)
            else:
                return dev_path
        except error.AutoservRunError as e:
            timed_out = 'Timeout encountered' in str(e)
            if not timed_out:
                raise
            logging.warning('Timeout encountered during fdisk run,'
                            ' skipping usbkey validation.')
            return ''

    raise hosts.AutoservRepairError(
            'No usbkey detected on servo, the usbkey may be either missing'
            ' or broken. Please replace usbkey on the servo and retry.',
            'missing usbkey')
516
def is_ec_supported(self):
    """Check if ec is supported on the servo_board.

    @returns: the `chrome_ec` value of the firmware config for the board
              and model; False when no board is known or the config
              could not be read.
    """
    if not self.servo_board:
        return False
    try:
        board_config = config.Config(self.servo_board, self.servo_model)
        return board_config.chrome_ec
    except Exception as e:
        logging.error('Unexpected error when read from firmware'
                      ' configs; %s', str(e))
    return False
527
def validate_image_usbkey(self):
    """Validate the recovery usbkey and report the image staged on it.

    First checks that a usbkey on servo is accessible to the servohost,
    then reads the ChromeOS image name from it so that an unnecessary
    download and flash of the usbkey can be avoided.

    Please note the special error handling:
    1. If unexpected error happens, we return empty string. So repair
       actions will not get blocked.
    2. If no working usbkey present on servo, but no errors, an
       AutoservRepairError is raised.

    @returns: image_name on the usbkey, e.g. nami-release/R82.10138.0.0,
              or empty string if no test image detected, or unexpected
              error occurred.
    @raises: AutoservRepairError if the usbkey is not detected on servo.
    """
    usb_dev = self._probe_and_validate_usb_dev()
    if not usb_dev:
        return ''
    return self.get_image_name_from_usbkey(usb_dev)
Garry Wang7b0e1b72020-03-25 19:08:59 -0700550
def repair(self, silent=False):
    """Attempt to repair servo host.

    On success the servo state becomes SERVO_STATE_WORKING and, for a
    labstation, any pending reboot request is withdrawn. On failure the
    state is re-determined (unless the host is localhost); a critical
    failure additionally disconnects servo, stops servod and re-raises.

    @param silent   If true, suppress logging in `status.log`.
    """
    start_msg = ('Beginning repair for servo host %s port %s serial %s'
                 % (self.hostname, self.servo_port, self.servo_serial))
    self.record('INFO', None, None, start_msg)
    try:
        self._repair_strategy.repair(self, silent)
        self._servo_state = servo_constants.SERVO_STATE_WORKING
        self.record('INFO', None, None,
                    'ServoHost repair set servo_state as WORKING')
        # If target is a labstation then try to withdraw any existing
        # reboot request created by this servo because it passed repair.
        if self.is_labstation():
            self.withdraw_reboot_request()
    except Exception as e:
        is_remote = not self.is_localhost()
        if is_remote:
            self._servo_state = self.determine_servo_state()
            self.record('INFO', None, None,
                        'ServoHost repair set servo_state as %s'
                        % self._servo_state)
        if not self._is_critical_error(e):
            # Non-critical failures are swallowed on purpose.
            return
        self.disconnect_servo()
        self.stop_servod()
        raise
578
def _is_critical_error(self, error):
    """Tell whether a verify/repair failure is critical.

    Only an AutoservVerifyDependencyError whose is_critical() is false
    counts as non-critical; any other exception is critical.

    @param error: the exception caught during verify/repair.

    @returns: False for a non-critical failure, True otherwise.
    """
    non_critical = (isinstance(error, hosts.AutoservVerifyDependencyError)
                    and not error.is_critical())
    if not non_critical:
        logging.info(
                'Critical verify failure(s) detected during repair/verify '
                'servo. Disconnecting servo and running `stop servod`, all'
                ' repair actions and tests that depends on servo will not '
                'run.')
        return True

    logging.warning('Non-critical verify failure(s) detected during'
                    ' verify/repair servo, servo connection will'
                    ' still be up but may not be fully functional.'
                    ' Some repair actions and servo dependent'
                    ' tests may not run.')
    return False
Fang Deng5d518f42013-08-02 14:04:32 -0700594
def get_servo(self):
    """Return the servo object cached on this host.

    @return: a servo.Servo object, or None if none has been created.
    @rtype: autotest_lib.server.cros.servo.servo.Servo
    """
    cached_servo = self._servo
    return cached_servo
602
def request_reboot(self):
    """Ask for a servohost reboot by touching this servo's reboot file.

    The touch command runs with ignore_status=True.
    """
    logging.debug('Request to reboot servohost %s has been created by '
                  'servo with port # %s', self.hostname, self.servo_port)
    touch_cmd = 'touch %s' % self._reboot_file
    self.run(touch_cmd, ignore_status=True)
609
def withdraw_reboot_request(self):
    """Withdraw a pending servohost reboot request, if there is one.

    The request is represented by the reboot flag file; it is removed
    with `rm -f` and ignore_status=True, so a missing file is not an
    error.
    """
    logging.debug('Withdrawing request to reboot servohost %s that created'
                  ' by servo with port # %s if exists.',
                  self.hostname, self.servo_port)
    remove_cmd = 'rm -f %s' % self._reboot_file
    self.run(remove_cmd, ignore_status=True)
618
def start_servod(self, quick_startup=False):
    """Start the servod process on the servohost.

    Builds the `start servod` command line from the servo attributes of
    this host, runs it, then sleeps for a startup timeout and caches the
    log timestamp of the new instance in |_initial_instance_ts|.

    @param quick_startup: if True wait SERVOD_QUICK_STARTUP_TIMEOUT after
                          starting servod, otherwise wait
                          SERVOD_STARTUP_TIMEOUT.
    """
    # Skip if running on the localhost.(crbug.com/1038168)
    if self.is_localhost():
        logging.debug("Servohost is a localhost, skipping start servod.")
        return

    # Collect the individual arguments; they are joined with single
    # spaces right before the command is run.
    args = ['start servod']
    if self.servo_board:
        args.append('BOARD=%s' % self.servo_board)
        # MODEL is only passed along together with a known BOARD.
        if self.servo_model:
            args.append('MODEL=%s' % self.servo_model)
    else:
        logging.warning('Board for DUT is unknown; starting servod'
                        ' assuming a pre-configured board.')

    args.append('PORT=%d' % self.servo_port)
    if self.servo_serial:
        args.append('SERIAL=%s' % self.servo_serial)

    # Start servod with dual_v4 based on servo_setup.
    if self.is_dual_setup():
        args.append('DUAL_V4=1')

    # Start servod with CONFIG=cr50.xml which is required for some pools.
    if self._require_cr50_servod_config():
        args.append('CONFIG=cr50.xml')

    if self.servo_recovery == True:
        args.append('REC_MODE=1')

    # Add customized args, if any.
    if self.additional_servod_args:
        args.append(self.additional_servod_args)

    # Remove the symbolic links from the logs. This helps ensure that
    # a failed servod instantiation does not cause us to grab old logs
    # by mistake.
    self.remove_latest_log_symlinks()
    self.run(' '.join(args), timeout=60)

    # There's a lag between when `start servod` completes and when
    # the _ServodConnectionVerifier trigger can actually succeed.
    # The call to time.sleep() below gives time to make sure that
    # the trigger won't fail after we return.

    # Normally servod on servo_v3 and labstation takes ~10 seconds to be
    # ready, but in the rare case that all servos on a labstation are in
    # heavy use it may take ~30 seconds. The timeout values double these
    # numbers; the quick start up is tried when the servohost is first
    # initialized, and the standard timeout is used in repair.
    timeout = (servo_constants.SERVOD_QUICK_STARTUP_TIMEOUT
               if quick_startup
               else servo_constants.SERVOD_STARTUP_TIMEOUT)
    logging.debug('Wait %s seconds for servod process fully up.', timeout)
    time.sleep(timeout)
    # Cache the initial instance timestamp to check against servod restarts
    self._initial_instance_ts = self.get_instance_logs_ts()
Garry Wangc1288cf2019-12-17 14:58:00 -0800679
def stop_servod(self):
    """Stop the servod process on the servohost.

    Runs `stop servod` for this host's servo port (ignoring the exit
    status) and then sleeps SERVOD_TEARDOWN_TIMEOUT seconds.
    """
    # Skip if running on the localhost.(crbug.com/1038168)
    if self.is_localhost():
        logging.debug("Servohost is a localhost, skipping stop servod.")
        return

    logging.debug('Stopping servod on port %s', self.servo_port)
    stop_cmd = 'stop servod PORT=%d' % self.servo_port
    self.run(stop_cmd, timeout=60, ignore_status=True)
    teardown_wait = servo_constants.SERVOD_TEARDOWN_TIMEOUT
    logging.debug('Wait %s seconds for servod process fully teardown.',
                  teardown_wait)
    time.sleep(servo_constants.SERVOD_TEARDOWN_TIMEOUT)
Garry Wangc1288cf2019-12-17 14:58:00 -0800694
def restart_servod(self, quick_startup=False):
    """Restart servod on the servohost: stop it, then start it again.

    @param quick_startup: forwarded unchanged to start_servod().
    """
    # Order matters: the old instance is stopped before the new one is
    # started.
    for step, step_args in ((self.stop_servod, ()),
                            (self.start_servod, (quick_startup,))):
        step(*step_args)
700
def _process_servodtool_error(self, response):
    """Log the reason behind a non-zero servodtool response.

    The stdout of |response| is searched for two known error patterns;
    anything else is reported as an unexpected error.

    @param response: result object of the failed servodtool command; only
                     its |stdout| is inspected here.
    """
    output = response.stdout
    if re.search(servo_constants.ERROR_MESSAGE_USB_HUB_NOT_COMPATIBLE,
                 output):
        logging.error('The servo is not plugged on a usb hub that supports'
                      ' power-cycle!')
        # change the flag so we can update this label in later process.
        self.smart_usbhub = False
    elif re.search(servo_constants.ERROR_MESSAGE_DEVICE_NOT_FOUND %
                   self.servo_serial, output):
        logging.error('No servo with serial %s found!', self.servo_serial)
    else:
        logging.error('Unexpected error occurred from usbhub control, please'
                      ' file a bug and inform chrome-fleet-software@ team!')
719
def get_main_servo_usb_path(self):
    """Ask servodtool for the current usb-path of the main servo.

    The usb-path is the path to the folder where the usb-device was
    enumerated. An empty string ('') is returned when the command raises
    or exits with a non-zero status.

    @returns: string, usb-path to the main servo device.
        e.g.: '/sys/bus/usb/devices/1-6.1.3.1'
    """
    # TODO remove try-except when fix crbug.com/1087964
    try:
        cmd = 'servodtool device -s %s usb-path' % self.servo_serial
        resp = self.run(cmd, ignore_status=True, timeout=30)
    except Exception as e:
        # Only timeout errors are expected here; other command failures
        # are filtered by ignore_status=True.
        logging.debug('Attempt to get servo usb-path failed due to '
                      'timeout; %s', e)
        return ''

    if resp.exit_status == 0:
        usb_path = resp.stdout.strip()
        logging.info('Usb path of servo %s is %s', self.servo_serial,
                     usb_path)
        return usb_path

    self._process_servodtool_error(resp)
    return ''
Garry Wangffbd2162020-04-17 16:13:48 -0700745
def _get_servo_usb_devnum(self):
    """Read the current usb devnum of the main servo.

    @returns: the stripped content of the |devnum| file under the servo's
              usb-path, or '' when the usb-path is unknown or reading the
              file fails.
    """
    usb_path = self.get_main_servo_usb_path()
    if not usb_path:
        return ''
    resp = self.run('cat %s/devnum' % usb_path, ignore_status=True)
    if resp.exit_status == 0:
        return resp.stdout.strip()
    self._process_servodtool_error(resp)
    return ''
756
def reboot_servo_v3_on_need(self):
    """Reboot a servo_v3 host when one of the conditions below holds.

    1. There is an update pending on reboot.
    2. Servo_v3 has been up for more than 96 hours.

    Hosts whose board is not 'beaglebone_servo' are left alone. A failing
    reboot is logged and recorded but never raised to the caller.
    """
    if self.get_board() != 'beaglebone_servo':
        logging.info('Servo reboot is only applicable for servo V3.')
        return

    update_pending_reboot = (self._check_update_status() ==
                             self.UPDATE_STATE.PENDING_REBOOT)
    # check_uptime() is converted from seconds to hours here.
    uptime_hours = float(self.check_uptime()) / 3600
    logging.info('Uptime of servo_v3: %s hour(s)', uptime_hours)
    long_up_time = uptime_hours > 96

    # A pending update takes precedence over long uptime when both apply.
    if update_pending_reboot:
        message = 'Starting reboot servo_v3 because an update is pending.'
        reboot_method = self._post_update_reboot
    elif long_up_time:
        message = 'Starting reboot servo_v3 because uptime > 96 hours.'
        reboot_method = self._servo_host_reboot
    else:
        # Skip reboot if neither condition is met.
        return

    self.record('INFO', None, None, message)
    logging.info(message)
    try:
        reboot_method()
    except Exception as e:
        logging.debug("Fail to reboot servo_v3; %s", e)
        message = ('Servo_v3 reboot failed, please check debug log '
                   'for details.')
    else:
        message = 'Servo_v3 reboot completed successfully.'
    logging.info(message)
    self.record('INFO', None, None, message)
Garry Wangffbd2162020-04-17 16:13:48 -0700793
def _reset_servo(self):
    """Power-cycle the servo with `servodtool device ... power-cycle`.

    After a successful power-cycle this waits
    SERVO_RESET_TIMEOUT_SECONDS and marks |smart_usbhub| as True.

    @returns: True if the power-cycle command succeeded, False if it
              exited non-zero or raised.
    """
    logging.info('Resetting servo through smart usbhub.')
    # TODO remove try-except when fix crbug.com/1087964
    try:
        power_cycle_cmd = ('servodtool device -s %s power-cycle' %
                           self.servo_serial)
        resp = self.run(power_cycle_cmd, ignore_status=True, timeout=30)
        if resp.exit_status != 0:
            self._process_servodtool_error(resp)
            return False
    except Exception as e:
        # Only timeout errors are expected here; other command failures
        # are filtered by ignore_status=True.
        logging.debug('Attempt to reset servo failed due to timeout;'
                      ' %s', e)
        return False

    settle_time = servo_constants.SERVO_RESET_TIMEOUT_SECONDS
    logging.debug('Wait %s seconds for servo to come back from reset.',
                  settle_time)
    time.sleep(servo_constants.SERVO_RESET_TIMEOUT_SECONDS)
    # change the flag so we can update this label in later process.
    self.smart_usbhub = True
    return True
817
def reset_servo(self):
    """Reset (power-cycle) the servo via smart usbhub.

    Only done on labstations. The usb devnum of the servo is read before
    and after the reset, and the outcome of comparing them is logged and
    recorded.
    """
    if not self.is_labstation():
        logging.info('Servo reset is not applicable to servo_v3.')
        return

    pre_reset_devnum = self._get_servo_usb_devnum()
    logging.info('Servo usb devnum before reset: %s', pre_reset_devnum)
    if not self._reset_servo():
        message = ('Failed to reset servo with serial: %s. (Please ignore'
                   ' this error if the DUT is not connected to a smart'
                   ' usbhub).' % self.servo_serial)
        logging.warning(message)
        self.record('INFO', None, None, message)
        return

    post_reset_devnum = self._get_servo_usb_devnum()
    logging.info('Servo usb devnum after reset: %s', post_reset_devnum)
    if pre_reset_devnum and post_reset_devnum:
        if pre_reset_devnum != post_reset_devnum:
            message = ('Reset servo with serial %s completed successfully!'
                       % self.servo_serial)
        else:
            message = ('Servo reset completed but devnum is still not '
                       'changed!')
    else:
        # At least one of the two devnum reads came back empty.
        message = ('Servo reset completed but unable to verify'
                   ' devnum change!')
    logging.info(message)
    self.record('INFO', None, None, message)
848
def _extract_compressed_logs(self, logdir, relevant_files):
    """Decompress the compressed servod logs among |relevant_files|.

    Files ending in |COMPRESSION_SUFFIX| are opened as tar archives; the
    first member of each is extracted flat into |logdir| under the
    archive's own basename minus the suffix, and the archive is deleted.

    @param logdir: directory the logs are extracted into.
    @param relevant_files: list of files in |logdir| to consider.

    @returns: tuple, (tarfiles, files) where
              tarfiles: list of the compressed filenames that have been
                        extracted and deleted
              files: list of the uncompressed files that were generated
    """
    archives = []
    for candidate in relevant_files:
        if candidate.endswith(self.COMPRESSION_SUFFIX):
            archives.append(candidate)

    extracted = []
    for archive in archives:
        archive_base = os.path.basename(archive)
        plain_name = archive_base[:-len(self.COMPRESSION_SUFFIX)]
        with tarfile.open(archive) as tar:
            # Each tarfile has only one member: the compressed log.
            entry = tar.members[0]
            # Rename the member so that only the basename is extracted,
            # without any directories stored in the archive.
            entry.name = plain_name
            extracted.append(os.path.join(logdir, entry.name))
            tar.extract(entry, logdir)
        # File has been extracted: remove the compressed file.
        os.remove(archive)
    return archives, extracted
879
def _extract_mcu_logs(self, log_subdir):
    """Extract MCU (EC, Cr50, etc) console output from servod debug logs.

    Every line of |log_subdir|/log.DEBUG.txt that matches the
    MCU_EXTRACTOR regex is split into the MCU name and the console line,
    and the console line is appended to a per-MCU file, e.g. after this
    method you can find an ec.txt and servo_v4.txt in |log_subdir| if
    those MCUs had any console input/output.

    @param log_subdir: directory with log.DEBUG.txt main servod debug logs.
    """
    # The MCU logs are only in the .DEBUG files.
    mcu_lines_file = os.path.join(log_subdir, 'log.DEBUG.txt')
    if not os.path.exists(mcu_lines_file):
        logging.info('No DEBUG logs found to extract MCU logs from.')
        return
    # Maps lower-cased MCU name -> open file object for its console log.
    mcu_files = {}
    mcu_file_template = '%s.txt'
    try:
        with open(mcu_lines_file, 'r') as f:
            for line in f:
                match = self.MCU_EXTRACTOR.match(line)
                if not match:
                    continue
                mcu = match.group(self.MCU_GROUP).lower()
                if mcu not in mcu_files:
                    mcu_file = os.path.join(log_subdir,
                                            mcu_file_template % mcu)
                    # Append mode: an existing per-MCU file is extended
                    # rather than truncated.
                    mcu_files[mcu] = open(mcu_file, 'a')
                mcu_files[mcu].write(match.group(self.LINE_GROUP) + '\n')
    finally:
        # Close every per-MCU file even if reading, matching or writing
        # raised, so no file handle is leaked.
        for fd in mcu_files.values():
            fd.close()
912
def remove_latest_log_symlinks(self):
    """Remove the convenience 'latest' symlinks of the servod logs.

    Runs `rm` on everything matching 'latest*' inside |remote_log_dir|,
    ignoring the exit status.
    """
    cmd = 'rm %s/latest*' % self.remote_log_dir
    self.run(cmd, stderr_tee=None, ignore_status=True)
918
def probe_servod_restart(self, instance_ts, outdir):
    """Grab servod logs from previous instances if part of this session.

    If servod crashed and restarted since the last time this host called
    start_servod(), this helper finds the logs of those earlier instances
    as well, and stores them with the |OLD_LOG_SUFFIX| to investigate if
    necessary.

    It also issues a panicinfo command to servo devices after the restart
    to try and collect reboot information for debugging.

    @param instance_ts: the log timestamp that the current instance uses
    @param outdir: directory to create a subdirectory into to place the
                   servod logs into.
    """
    first_ts = self._initial_instance_ts
    if first_ts is None:
        logging.info('No log timestamp grabbed successfully on servod '
                     'startup. Cannot check device restarts. Ignoring.')
        return
    if instance_ts == first_ts:
        logging.debug('Servod appears to have run without restarting')
        return

    # Servod seems to have restarted (at least once). |first_ts| is the
    # first timestamp, and instance_ts is the current timestamp. Find
    # all timestamps in between them, and grab the logs for each.
    tss = self._find_instance_timestamps_between(first_ts, instance_ts)
    logging.info('Servod has restarted %d times between the start and the '
                 'end of this servo_host.', len(tss))
    logging.info('This might be an issue. Will extract all logs from each '
                 'instance.')
    logging.info('Logs that are not the currently running (about to turn '
                 'down) instance are maked with a .%s in their folder.',
                 self.OLD_LOG_SUFFIX)
    for ts in tss:
        self.get_instance_logs(ts, outdir, old=True)

    # Lastly, servod has restarted due to a potential issue. Try to get
    # panic information from servo micro and servo v4 for the current logs.
    # This can only happen if the |_servo| attribute is initialized.
    if not self._servo:
        return
    for mcu in ['servo_micro', 'servo_v4', 'servo_v4p1']:
        ctrl = '%s_uart_cmd' % mcu
        if not self._servo.has_control(ctrl):
            continue
        logging.info('Trying to retrieve %r panicinfo into logs', mcu)
        try:
            self._servo.set_nocheck(ctrl, 'panicinfo')
        except error.TestFail as e:
            logging.error('Failed to generate panicinfo for %r '
                          'logs. %s', mcu, str(e))
968
def _find_instance_timestamps_between(self, start_ts, end_ts):
    """Find all log timestamps between [start_ts, end_ts).

    The timestamps are taken from the file names listed in
    |remote_log_dir| using the TS_EXTRACTOR regex.

    @param start_ts: str, earliest log timestamp of interest
    @param end_ts: str, latest log timestamp of interest

    @returns: list, all timestamps between start_ts and end_ts, end_ts
              exclusive, on the servo_host. An empty list on errors
    """
    # Simply list everything, then reduce it to the sorted timestamps.
    listing = self.run('ls %s' % self.remote_log_dir, stderr_tee=None,
                       ignore_status=True)
    if listing.exit_status != 0:
        # Here we failed to find anything.
        logging.info('Failed to find remote servod logs. Ignoring.')
        return []

    # Names that fail the regex are simply ignored. It might be the
    # 'latest' symlinks or random files.
    matches = [self.TS_EXTRACTOR.match(name)
               for name in listing.stdout.strip().split()]
    # The set collapses the several files sharing one timestamp.
    timestamps = sorted({m.group(self.TS_GROUP) for m in matches if m})

    for ts in (start_ts, end_ts):
        if ts not in timestamps:
            logging.error('Timestamp %r not in servod logs. Cannot query '
                          'for timestamps in between %r and %r', ts,
                          start_ts, end_ts)
            return []
    first = timestamps.index(start_ts)
    last = timestamps.index(end_ts)
    return timestamps[first:last]
1003
def get_instance_logs_ts(self):
    """Retrieve the currently running servod instance's log timestamp

    The real file behind the 'latest.DEBUG' (or, failing that, 'latest')
    symlink in |remote_log_dir| is resolved on the servo host, and the
    timestamp is extracted from its basename with TS_EXTRACTOR.

    @returns: str, timestamp for current instance, or None on failure
    """
    # This cmd gives the real filename of the latest aka current log file,
    # or exits with NO_SYMLINKS_CODE when neither symlink exists.
    shell_steps = ('if [ -f %(dir)s/latest.DEBUG ];',
                   'then realpath %(dir)s/latest.DEBUG;',
                   'elif [ -f %(dir)s/latest ];',
                   'then realpath %(dir)s/latest;',
                   'else exit %(code)d;',
                   'fi')
    cmd = ''.join(shell_steps) % {'dir': self.remote_log_dir,
                                  'code': self.NO_SYMLINKS_CODE}
    res = self.run(cmd, stderr_tee=None, ignore_status=True)
    if res.exit_status != 0:
        if res.exit_status == self.NO_SYMLINKS_CODE:
            logging.warning('servod log latest symlinks not found. '
                            'This is likely due to an error starting up '
                            'servod. Ignoring..')
        else:
            logging.warning('Failed to find servod logs on servo host.')
            logging.warning(res.stderr.strip())
        return None

    fname = os.path.basename(res.stdout.strip())
    # The timestamp is embedded in the file name.
    ts_match = self.TS_EXTRACTOR.match(fname)
    if ts_match:
        return ts_match.group(self.TS_GROUP)
    logging.warning('Failed to extract timestamp from servod log file '
                    '%r. Skipping. The servo host is using outdated '
                    'servod logging and needs to be updated.', fname)
    return None
1037
def get_servohost_logs(self, outdir):
    """Collect servohost logs that help debugging servo/servod problems.

    The `dmesg -H` output and /var/log/messages of the servohost are
    saved into a 'servohost_<hostname>' directory inside |outdir|.

    @param outdir: directory in which the servohost log directory is
                   created.
    """
    log_dir = os.path.join(outdir, 'servohost_%s' % self.hostname)
    if os.path.isdir(log_dir):
        # In multi-DUT testing each DUT may have its own servohost
        # instance, which would duplicate the effort when they share the
        # same servohost, so the collection is skipped if the log dir
        # already exists.
        logging.info(
                'Skip dmesg and messages logs collecting as %s'
                ' already exists.', log_dir)
        return

    logging.info('Collecting dmesg and messages from servohost %s',
                 self.hostname)
    os.mkdir(log_dir)
    logging.info('Saving servohost logs to %s.', log_dir)
    # First collect dmesg from the servohost.
    dmesg_path = os.path.join(log_dir, 'dmesg')
    crashcollect.collect_command(self, 'dmesg -H', dmesg_path)
    # Collect messages log from the servohost; a failure is only logged.
    try:
        self.get_file('/var/log/messages', log_dir, try_rsync=False)
    except error.AutoservRunError:
        logging.warning('Failed to collect messages log from servohost.')
1064
def get_instance_logs(self, instance_ts, outdir, old=False):
    """Collect all logs with |instance_ts| and dump into a dir in |outdir|

    This method first collects all logs on the servo_host side pertaining
    to this servod instance (port, instantiation). It glues them together
    into combined log.[level].txt files and extracts all available MCU
    console I/O from the logs into individual files e.g. servo_v4.txt

    All the output can be found in a directory inside |outdir| that
    this generates based on |LOG_DIR|, the servod port, and the instance
    timestamp on the servo_host side.

    @param instance_ts: log timestamp to grab logfiles for
    @param outdir: directory to create a subdirectory into to place the
                   servod logs into.
    @param old: bool, whether to append |OLD_LOG_SUFFIX| to output dir
    """
    # Create the local results log dir.
    log_dir = os.path.join(outdir, '%s_%s.%s' % (self.LOG_DIR,
                                                 str(self.servo_port),
                                                 instance_ts))
    if old:
        log_dir = '%s.%s' % (log_dir, self.OLD_LOG_SUFFIX)
    logging.info('Saving servod logs to %r.', log_dir)
    os.mkdir(log_dir)
    # Now, get all files with that timestamp.
    cmd = 'find %s -maxdepth 1 -name "log.%s*"' % (self.remote_log_dir,
                                                   instance_ts)
    res = self.run(cmd, stderr_tee=None, ignore_status=True)
    files = res.stdout.strip().split()
    try:
        self.get_file(files, log_dir, try_rsync=False)
        if not os.listdir(log_dir):
            logging.info('No servod logs retrieved. Ignoring, and removing '
                         '%r again.', log_dir)
            os.rmdir(log_dir)
            return
    except error.AutoservRunError as e:
        result = e.result_obj
        if result.exit_status != 0:
            stderr = result.stderr.strip()
            logging.warning("Couldn't retrieve servod logs. Ignoring: %s",
                            stderr or '\n%s' % result)
        # Remove the log_dir as nothing was added to it.
        os.rmdir(log_dir)
        return
    local_files = [os.path.join(log_dir, f) for f in os.listdir(log_dir)]
    # TODO(crrev.com/c/1793030): remove no-level case once CL is pushed
    for level_name in ('DEBUG', 'INFO', 'WARNING', ''):
        # Create the joint files for each loglevel. i.e log.DEBUG
        joint_file = self.JOINT_LOG_PREFIX
        if level_name:
            joint_file = '%s.%s' % (self.JOINT_LOG_PREFIX, level_name)
        # This helps with some online tools to avoid complaints about an
        # unknown filetype.
        joint_file = joint_file + '.txt'
        joint_path = os.path.join(log_dir, joint_file)
        # Match the level against the file name only. Matching against the
        # whole path would wrongly select every file whenever |outdir|
        # itself happens to contain the level name.
        files = [f for f in local_files
                 if level_name in os.path.basename(f)]
        if not files:
            # TODO(crrev.com/c/1793030): remove no-level case once CL
            # is pushed
            continue
        # Extract compressed logs if any.
        compressed, extracted = self._extract_compressed_logs(log_dir,
                                                              files)
        files = list(set(files) - set(compressed))
        files.extend(extracted)
        # Need to sort. As they all share the same timestamp, and
        # loglevel, the index itself is sufficient. The highest index
        # is the oldest file, therefore we need a descending sort.
        def sortkey(f, level=level_name):
            """Custom sortkey to sort based on rotation number int."""
            # The file without a rotation number ends in the level name;
            # |level| is bound at definition time to this iteration.
            if f.endswith(level):
                return 0
            return int(f.split('.')[-1])

        files.sort(reverse=True, key=sortkey)
        # Just rename the first file rather than building from scratch.
        os.rename(files[0], joint_path)
        with open(joint_path, 'a') as joint_f:
            for logfile in files[1:]:
                # Transfer the file to the joint file line by line.
                with open(logfile, 'r') as log_f:
                    for line in log_f:
                        joint_f.write(line)
                # File has been written over. Delete safely.
                os.remove(logfile)
        # Need to remove all files from |local_files| so we don't
        # analyze them again.
        local_files = list(set(local_files) - set(files) - set(compressed))
    # Lastly, extract MCU logs from the joint logs.
    self._extract_mcu_logs(log_dir)
1156
def _lock(self):
    """Lock the servohost by touching the lock file.

    |_is_locked| is set to True afterwards; the exit status of the
    `touch` command is ignored.
    """
    logging.debug('Locking servohost %s by touching %s file',
                  self.hostname, self._lock_file)
    touch_cmd = 'touch %s' % self._lock_file
    self.run(touch_cmd, ignore_status=True)
    self._is_locked = True
Garry Wang7c00b0f2019-06-25 17:28:17 -07001163 self._is_locked = True
Garry Wang79e9af62019-06-12 15:19:19 -07001164
def _unlock(self):
    """Unlock the servohost by removing the lock file.

    |_is_locked| is set to False afterwards; the exit status of the `rm`
    command is ignored.
    """
    logging.debug('Unlocking servohost by removing %s file',
                  self._lock_file)
    remove_cmd = 'rm %s' % self._lock_file
    self.run(remove_cmd, ignore_status=True)
    self._is_locked = False
Garry Wang79e9af62019-06-12 15:19:19 -07001172
def close(self):
    """Close the associated servo and the host object.

    In order: collect logs of earlier servod instances, close the servo
    object, collect the servohost logs and the logs of the current servod
    instance, remove the servohost lock, stop servod, and finally close
    the host itself. Calling this on an already closed host is a no-op.
    """
    # NOTE: throughout this method there are multiple attempts to catch
    # all errors. This is WAI as log grabbing should not fail tests.
    # However, the goal is to catch and handle/process all errors, thus
    # we print the traceback and ask for a bug.
    if self._closed:
        logging.debug('ServoHost is already closed.')
        return

    # Only attempt ssh related actions if servohost is sshable. We call
    # check_cached_up_status() first because it's lightweight and returns
    # much faster in the case servohost is down, however, we still want
    # to call is_up() later since check_cached_up_status() is a ping based
    # check and does not guarantee the servohost is sshable.
    servo_host_ready = self.check_cached_up_status() and self.is_up()

    instance_ts = None
    if servo_host_ready:
        instance_ts = self.get_instance_logs_ts()
    else:
        logging.info('Servohost is down, will skip servod log collecting.')
    # TODO(crbug.com/1011516): once enabled, remove the check against
    # localhost and instead check against log-rotation enablement.
    logs_available = (instance_ts is not None and
                      self.job and
                      not self.is_localhost())
    if logs_available:
        # Probe whether there was a servod restart, and grab those old
        # logs as well.
        try:
            self.probe_servod_restart(instance_ts, self.job.resultdir)
        except (error.AutoservRunError, error.TestFail) as e:
            logging.info('Failed to grab servo logs due to: %s. '
                         'This error is forgiven.', str(e))
        except Exception as e:
            logging.error('Unexpected error probing for old logs. %s. '
                          'Forgiven. Please file a bug and fix or catch '
                          'in log probing function', str(e),
                          exc_info=True)

    if self._servo:
        # In some cases when we run as lab-tools, the job object is None.
        outdir = self.job.resultdir if self.job else None
        self._servo.close(outdir)

    if logs_available:
        # Grab current (not old like above) logs after the servo instance
        # was closed out.
        try:
            self.get_servohost_logs(self.job.resultdir)
            self.get_instance_logs(instance_ts, self.job.resultdir)
        except error.AutoservRunError as e:
            logging.info('Failed to grab servo logs due to: %s. '
                         'This error is forgiven.', str(e))
        except Exception as e:
            logging.error('Unexpected error grabbing servod logs. %s. '
                          'Forgiven. Please file a bug and fix or catch '
                          'in log grabbing function', str(e), exc_info=True)

    if self._is_locked and servo_host_ready:
        # Remove the lock if the servohost has been locked.
        try:
            self._unlock()
        except error.AutoservSSHTimeout:
            logging.error('Unlock servohost failed due to ssh timeout.'
                          ' It may caused by servohost went down during'
                          ' the task.')

    # We always want to stop servod after a task to minimize the impact of
    # a bad servod process interfering with other servods.
    # (see crbug.com/1028665)
    if servo_host_ready:
        try:
            self.stop_servod()
        except error.AutoservRunError as e:
            logging.info(
                    "Failed to stop servod due to:\n%s\n"
                    "This error is forgiven.", str(e))

    super(ServoHost, self).close()
    # Mark closed.
    self._closed = True
Congbin Guoa1f9cba2018-07-03 11:36:59 -07001253
def get_servo_state(self):
    """Return the servo state currently recorded on this host.

    @returns: the value stored in `self._servo_state`.
    """
    recorded_state = self._servo_state
    return recorded_state
Otabek Kasimovcc9738e2020-02-14 16:17:15 -08001256
def is_servo_board_present_on_servo_v3(self):
    """Check if servo board is detected on servo_v3.

    Runs `lsusb` on this host and greps its output for the known servo
    board VID:PID pairs.

    @returns: True if lsusb lists one of the VID:PID pairs,
              False if none of them is listed,
              None if the check itself could not be executed
              (any exception from `self.run`, e.g. a timeout).
    """
    logging.debug('Started to detect servo board on servo_v3')
    vid_pids = ['18d1:5004', '0403:6014']
    not_detected = 'The servo board is not detected on servo_v3'
    try:
        # grep (basic regex) needs a literal backslash in front of '|' to
        # treat it as alternation. A raw string keeps that backslash
        # without relying on Python tolerating the invalid escape '\|'.
        cmd = 'lsusb | grep "%s"' % r'\|'.join(vid_pids)
        result = self.run(cmd, ignore_status=True, timeout=30)
        if result.exit_status == 0 and result.stdout.strip():
            logging.debug('The servo board is detected on servo_v3')
            return True
        logging.debug('%s; %s', not_detected, result)
        return False
    except Exception as e:
        # can be triggered by timeout issue due running the script
        logging.error('%s; %s', not_detected, str(e))
        return None
1274
Garry Wangb5cee3e2020-09-16 14:58:13 -07001275 def _require_cr50_servod_config(self):
1276 """Check whether we need start servod with CONFIG=cr50.xml"""
1277 dut_host_info = self.get_dut_host_info()
1278 if not dut_host_info:
1279 return False
1280 for pool in dut_host_info.pools:
1281 if pool.startswith(servo_constants.CR50_CONFIG_POOL_PREFIX):
1282 return True
1283 return False
1284
def get_verifier_state(self, tag):
    """Look up the state of a servo verifier in the repair strategy.

    @param tag  Tag of the verifier to look up.

    @returns: bool or None, as reported by the repair strategy's
              `verifier_is_good(tag)`.
    """
    strategy = self._repair_strategy
    return strategy.verifier_is_good(tag)
1291
def get_repair_strategy_node(self, tag):
    """Fetch the verifier/repair node registered under the given tag.

    @param tag  Tag of the node to look up in the repair strategy.

    @returns: _DependencyNode or None, as reported by the repair
              strategy's `node_by_tag(tag)`.
    """
    strategy = self._repair_strategy
    return strategy.node_by_tag(tag)
1298
def determine_servo_state(self):
    """Translate verifier results into a single servo state value.

    The verifiers are inspected in a fixed priority order and the state
    that belongs to the first failed one is returned.

    @returns: one of the servo_constants.SERVO_STATE_* values;
              SERVO_STATE_BROKEN when no inspected verifier explains
              the failure.
    """
    state_of = self.get_verifier_state
    node_of = self.get_repair_strategy_node

    def failed(verifier_state):
        return verifier_state == hosts.VERIFY_FAILED

    # All lookups happen up front, in a fixed order, before any decision.
    ssh_state = state_of('servo_ssh')
    root_state = state_of('servo_root_present')
    root_node = node_of('servo_root_present')
    v3_root_state = state_of('servo_v3_root_present')
    fw_state = state_of('servo_fw')
    fw_update_node = node_of('servo_fw_update')
    # The disk space verifier is looked up as well, but its result does
    # not take part in any decision below.
    state_of('servo_disk_space')
    start_servod_state = state_of('start_servod')
    servod_started_state = state_of('servod_started')
    servod_echo_state = state_of('servod_echo')
    connection_state = state_of('servod_connection')
    control_state = state_of('servod_control')
    low_sbu_state = state_of('servo_cr50_low_sbu')
    cr50_off_state = state_of('servo_cr50_off')
    topology_state = state_of('servo_topology')
    dut_state = state_of('servo_dut_connected')
    hub_state = state_of('servo_hub_connected')
    pwr_button_state = state_of('servo_pwr_button')
    lid_open_state = state_of('servo_lid_open')
    ec_board_state = state_of('servo_ec_board')
    cr50_console_state = state_of('servo_cr50_console')
    ccd_testlab_state = state_of('servo_ccd_testlab')

    if not ssh_state:
        return servo_constants.SERVO_STATE_NO_SSH
    if failed(start_servod_state):
        return servo_constants.SERVO_STATE_SERVO_HOST_ISSUE
    if failed(root_state):
        if not self.servo_serial:
            return servo_constants.SERVO_STATE_WRONG_CONFIG
        if hasattr(root_node, 'serial_mismatch'):
            return servo_constants.SERVO_STATE_SERIAL_MISMATCH
        return servo_constants.SERVO_STATE_NOT_CONNECTED
    if failed(v3_root_state):
        # if we cannot find required board on servo_v3
        return servo_constants.SERVO_STATE_NEED_REPLACEMENT
    if failed(fw_state):
        logging.info(fw_update_node)
        if hasattr(fw_update_node, 'servo_updater_issue_detected'):
            return servo_constants.SERVO_STATE_SERVO_UPDATER_ISSUE
        return servo_constants.SERVO_STATE_NEED_REPLACEMENT

    if failed(dut_state):
        return servo_constants.SERVO_STATE_DUT_NOT_CONNECTED
    if failed(hub_state):
        logging.info('Servo HUB not connected')
        return servo_constants.SERVO_STATE_DUT_NOT_CONNECTED

    # Remaining checks need no extra handling: the first row in which any
    # listed verifier failed decides the state. Row order is the priority.
    prioritized_checks = (
            ((low_sbu_state,),
             servo_constants.SERVO_STATE_SBU_LOW_VOLTAGE),
            ((cr50_off_state,),
             servo_constants.SERVO_STATE_CR50_NOT_ENUMERATED),
            ((topology_state,),
             servo_constants.SERVO_STATE_TOPOLOGY_ISSUE),
            ((servod_started_state, servod_echo_state),
             servo_constants.SERVO_STATE_SERVOD_ISSUE),
            # one of the reason why servo can not initialized
            ((cr50_console_state,),
             servo_constants.SERVO_STATE_CR50_CONSOLE_MISSING),
            ((ccd_testlab_state,),
             servo_constants.SERVO_STATE_CCD_TESTLAB_ISSUE),
            ((connection_state, control_state),
             servo_constants.SERVO_STATE_SERVOD_PROXY_ISSUE),
            ((ec_board_state,),
             servo_constants.SERVO_STATE_EC_BROKEN),
            ((pwr_button_state,),
             servo_constants.SERVO_STATE_BAD_RIBBON_CABLE),
            ((lid_open_state,),
             servo_constants.SERVO_STATE_LID_OPEN_FAILED),
    )
    for verifier_states, servo_state in prioritized_checks:
        if any(failed(state) for state in verifier_states):
            return servo_state

    logging.info('We do not have special state for this failure yet :)')
    return servo_constants.SERVO_STATE_BROKEN
1386
def is_servo_topology_supported(self):
    """Check if servo_topology is supported.

    Supported only when the servo host is reachable, is a labstation
    and has a servo serial; the first unmet condition is logged.

    @returns: True if all conditions hold, False otherwise.
    """
    if not self.is_up_fast():
        reason = 'Servo-Host is not reachable.'
    elif not self.is_labstation():
        reason = 'Servo-topology supported only for labstation.'
    elif not self.servo_serial:
        reason = 'Servo-topology required a servo serial.'
    else:
        return True
    logging.info(reason)
    return False
1399
def get_topology(self):
    """Get servo topology.

    A servo_topology.ServoTopology for this host is created on first
    use and stored in `self._topology` for later calls.

    @returns: the object stored in `self._topology`.
    """
    if self._topology:
        return self._topology
    self._topology = servo_topology.ServoTopology(self)
    return self._topology
1405
def is_dual_setup(self):
    """Check whether the servo will run in dual setup.

    Dual setup is used only for servo_v4 when ccd_cr50 and servo_micro
    are used at the same time.

    @returns: True if `self.servo_setup` equals
              servo_constants.SERVO_SETUP_VALUE_DUAL_V4.
    """
    configured_setup = self.servo_setup
    return configured_setup == servo_constants.SERVO_SETUP_VALUE_DUAL_V4
1413
def set_dut_health_profile(self, dut_health_profile):
    """Remember the health profile of the DUT attached to this servo.

    @param dut_health_profile: A DeviceHealthProfile object.
    """
    logging.debug('setting dut_health_profile field to (%s)',
                  dut_health_profile)
    setattr(self, '_dut_health_profile', dut_health_profile)
1421
def get_dut_health_profile(self):
    """Return the DUT health profile stored on this host.

    @return A DeviceHealthProfile object.
    """
    stored_profile = self._dut_health_profile
    return stored_profile
1427
def print_all_servo_of_host(self):
    """Log every servo device the topology reports for this host.

    Best effort: any failure while listing is logged at debug level
    and otherwise ignored.
    """
    try:
        logging.info('\tDevices detected on the host:')
        for servo_device in self.get_topology().get_list_available_servos():
            logging.info('\t%s', servo_device)
    except Exception as err:
        logging.debug('(Not critical) Fail list all servos: %s', err)
1437
Otabek Kasimovcc9738e2020-02-14 16:17:15 -08001438
def make_servo_hostname(dut_hostname):
    """Derive the servo hostname that belongs to a DUT hostname.

    The '-servo' suffix is attached to the first dot-separated label;
    the rest of the name is kept as is.

    @param dut_hostname: hostname of a DUT.

    @return hostname of the DUT's servo.

    """
    first_label, dot, remainder = dut_hostname.partition('.')
    return first_label + '-servo' + dot + remainder
1450
1451
Richard Barnettee519dcd2016-08-15 17:37:17 -07001452def _map_afe_board_to_servo_board(afe_board):
1453 """Map a board we get from the AFE to a servo appropriate value.
1454
1455 Many boards are identical to other boards for servo's purposes.
1456 This function makes that mapping.
1457
1458 @param afe_board string board name received from AFE.
1459 @return board we expect servo to have.
1460
1461 """
1462 KNOWN_SUFFIXES = ['-freon', '_freon', '_moblab', '-cheets']
1463 BOARD_MAP = {'gizmo': 'panther'}
1464 mapped_board = afe_board
1465 if afe_board in BOARD_MAP:
1466 mapped_board = BOARD_MAP[afe_board]
1467 else:
1468 for suffix in KNOWN_SUFFIXES:
1469 if afe_board.endswith(suffix):
1470 mapped_board = afe_board[0:-len(suffix)]
1471 break
1472 if mapped_board != afe_board:
1473 logging.info('Mapping AFE board=%s to %s', afe_board, mapped_board)
1474 return mapped_board
1475
1476
def get_servo_args_for_host(dut_host):
    """Collect the servo data stored in the host info of a DUT.

    @param dut_host   Instance of `Host` on which to find the servo
                      attributes.
    @return `servo_args` dict with host and an optional port, or None
            when the result does not contain a servo host attribute.
    """
    info = dut_host.host_info_store.get()
    servo_args = {}
    for attr_name, attr_value in six.iteritems(info.attributes):
        if attr_name in servo_constants.SERVO_ATTR_KEYS:
            servo_args[attr_name] = attr_value

    # Each rule: (attribute that must hold an int, message logged when
    # it does not, key removed from servo_args in that case).
    # A bad servo port removes the servo HOST attribute, which makes
    # this function return None at the end.
    port_rules = (
            (servo_constants.SERVO_HOST_SSH_PORT_ATTR,
             'servo host port is not an int: %s',
             servo_constants.SERVO_HOST_SSH_PORT_ATTR),
            (servo_constants.SERVO_PORT_ATTR,
             'servo port is not an int: %s',
             servo_constants.SERVO_HOST_ATTR),
    )
    for port_attr, complaint, key_to_drop in port_rules:
        if port_attr not in servo_args:
            continue
        try:
            servo_args[port_attr] = int(servo_args[port_attr])
        except ValueError:
            logging.error(complaint, servo_args[port_attr])
            # Reset servo_args because we don't want to use an invalid port.
            servo_args.pop(key_to_drop, None)

    if info.board:
        servo_args[servo_constants.SERVO_BOARD_ATTR] = (
                _map_afe_board_to_servo_board(info.board))
    if info.model:
        servo_args[servo_constants.SERVO_MODEL_ATTR] = info.model

    if servo_constants.SERVO_HOST_ATTR in servo_args:
        return servo_args
    return None
Richard Barnetteea3e4602016-06-10 12:36:41 -07001514
1515
def _tweak_args_for_ssp_moblab(servo_args):
    """Point a loopback servo host at the SSP host container address.

    When the servo host in `servo_args` is 'localhost' or '127.0.0.1',
    it is replaced in place with the 'host_container_ip' value of the
    'SSP' config section (None if that value is not configured).

    @param servo_args  dict of servo arguments; modified in place.
    """
    host_key = servo_constants.SERVO_HOST_ATTR
    if servo_args[host_key] not in ['localhost', '127.0.0.1']:
        return
    servo_args[host_key] = _CONFIG.get_config_value(
            'SSP', 'host_container_ip', type=str, default=None)
1521
1522
def create_servo_host(dut,
                      servo_args,
                      try_lab_servo=False,
                      try_servo_repair=False,
                      try_servo_recovery=True,
                      dut_host_info=None,
                      dut_health_profile=None):
    """Create a ServoHost object for a given DUT, if appropriate.

    This function attempts to create and verify or repair a `ServoHost`
    object for a servo connected to the given `dut`, subject to various
    constraints imposed by the parameters:
      * When the `servo_args` parameter is not `None`, a servo
        host must be created, and must be checked with `repair()`.
      * Otherwise, if a servo exists in the lab and `try_lab_servo` is
        true:
          * If `try_servo_repair` is true, then create a servo host and
            check it with `repair()`.
          * Otherwise, if the servo responds to `ping` then create a
            servo host and check it with `verify()`.

    In cases where `servo_args` was not `None`, repair failure
    exceptions are passed back to the caller; otherwise, exceptions
    are logged and then discarded.  Note that this only happens in cases
    where we're called from a test (not special task) control file that
    has an explicit dependency on servo.  In that case, we require that
    repair not write to `status.log`, so as to avoid polluting test
    results.

    When `servo_args` itself carries the servo host attribute, the call
    is treated as a local test run: servod is started and the servo is
    initialized directly, and all verify/repair steps are skipped.

    TODO(jrbarnette):  The special handling for servo in test control
    files is a thorn in my flesh; I dearly hope to see it cut out before
    my retirement.

    Parameters for a servo host consist of a host name, port number, and
    DUT board, and are determined from one of these sources, in order of
    priority:
      * Servo attributes from the `dut` parameter take precedence over
        all other sources of information.
      * If a DNS entry for the servo based on the DUT hostname exists in
        the CrOS lab network, that hostname is used with the default
        port and the DUT's board.
      * If no other options are found, the parameters will be taken
        from the `servo_args` dict passed in from the caller.

    @param dut:                 An instance of `Host` from which to take
                                servo parameters (if available).
    @param servo_args:          A dictionary with servo parameters to use if
                                they can't be found from `dut`.  If this
                                argument is supplied, unrepaired exceptions
                                from `verify()` will be passed back to the
                                caller.
    @param try_lab_servo:       If not true, servo host creation will be
                                skipped unless otherwise required by the
                                caller.
    @param try_servo_repair:    If true, check a servo host with
                                `repair()` instead of `verify()`.
    @param try_servo_recovery:  If true, start servod in recovery mode.
                                Default value is True.
    @param dut_host_info:       A HostInfo object of the DUT that connected
                                to this servo.
    @param dut_health_profile:  DUT repair info with history.

    @returns: A tuple `(servo_host, servo_state)`.  `servo_host` is a
              ServoHost object or None (see comments above);
              `servo_state` is a servo_constants.SERVO_STATE_* value, or
              None when no servo was requested and none was configured.

    """
    # We are explicitly looking for if servo_args is None here(which means
    # servo not needed), as servo_args == {} means servo is needed and
    # we expect load servo_args from host_info_store.
    if servo_args is None:
        servo_dependency = False
        local_run = False
    else:
        servo_dependency = True
        # If servo_args pass in directly, then this is a local test run.
        local_run = servo_constants.SERVO_HOST_ATTR in servo_args

    if local_run:
        logging.warning('User input servo_args detected, will attempt'
                        ' to start servod and initialize servo conncetion'
                        ' directly. All servo/servohost verify and repair'
                        ' steps will be skipped.')

    # Loading servo args from host_info_store.
    if dut is not None and (try_lab_servo or servo_dependency):
        servo_args_override = get_servo_args_for_host(dut)
        if servo_args_override is not None:
            if utils.in_moblab_ssp():
                _tweak_args_for_ssp_moblab(servo_args_override)
            logging.debug(
                    'Overriding provided servo_args (%s) with arguments'
                    ' determined from the host (%s)',
                    servo_args,
                    servo_args_override,
            )
            servo_args = servo_args_override

    if not servo_args:
        logging.debug('No servo_args provided, and failed to find overrides.')
        if try_lab_servo or servo_dependency:
            return None, servo_constants.SERVO_STATE_MISSING_CONFIG
        else:
            # For regular test case which not required the servo
            return None, None

    servo_hostname = servo_args.get(servo_constants.SERVO_HOST_ATTR)
    servo_port = servo_args.get(servo_constants.SERVO_PORT_ATTR)
    if not local_run:
        if not _is_servo_host_information_exist(servo_hostname, servo_port):
            logging.debug(
                    'Servo connection info missed hostname: %s , port: %s',
                    servo_hostname, servo_port)
            return None, servo_constants.SERVO_STATE_MISSING_CONFIG
        if not is_servo_host_information_valid(servo_hostname, servo_port):
            logging.debug(
                    'Servo connection info is incorrect hostname: %s , port: %s',
                    servo_hostname, servo_port)
            return None, servo_constants.SERVO_STATE_WRONG_CONFIG

    if try_servo_recovery == True:
        servo_args[servo_constants.SERVO_RECOVERY_MODE] = True

    newhost = ServoHost(**servo_args)
    if local_run:
        try:
            newhost.start_servod()
        except Exception as e:
            # If we failed to start servod here, we can assume the servod
            # either already started or the test is running against a
            # non-standard servohost so the user will be responsible for
            # ensuring servod is running.  Only ordinary errors are
            # forgiven; KeyboardInterrupt/SystemExit still propagate.
            logging.info('[Non-critical] Failed to start servod for local'
                         ' run, assuming it is already running; %s', e)
        try:
            newhost.initialize_servo()
            newhost.initialize_dut_for_servo()
            newhost._servo_state = servo_constants.SERVO_STATE_WORKING
            return newhost, newhost.get_servo_state()
        except Exception as e:
            logging.error('Failed to initialize servo. %s', e)
            return None, servo_constants.SERVO_STATE_BROKEN

    if newhost.use_icmp and not newhost.is_up_fast(count=3):
        # ServoHost has internal check to wait if servo-host is in reboot
        # process. If servo-host still is not available this check will stop
        # further attempts as we do not have any option to recover servo_host.
        return None, servo_constants.SERVO_STATE_NO_SSH

    # Reset or reboot servo device only during AdminRepair tasks.
    if try_servo_repair:
        if newhost._is_locked:
            # Print available servos on the host for debugging.
            newhost.print_all_servo_of_host()
            # Reset servo if the servo is locked, as we check if the servohost
            # is up, if the servohost is labstation and if the servohost is in
            # lab inside the locking logic.
            newhost.reset_servo()
        else:
            try:
                newhost.reboot_servo_v3_on_need()
            except Exception as e:
                logging.info('[Non-critical] Unexpected error while trying to'
                             ' reboot servo_v3, skipping the reboot; %s', e)

    if dut:
        newhost.set_dut_hostname(dut.hostname)
    if dut_host_info:
        newhost.set_dut_host_info(dut_host_info)
    if dut_health_profile and (try_lab_servo or try_servo_repair):
        try:
            if newhost.is_localhost():
                logging.info('Servohost is a localhost, skip device'
                             ' health profile setup...')
            else:
                dut_health_profile.init_profile(newhost)
                newhost.set_dut_health_profile(dut_health_profile)
        except Exception as e:
            logging.info(
                    '[Non-critical] Unexpected error while trying to'
                    ' load device health profile; %s', e)

    # Note that the logic of repair() includes everything done
    # by verify().  It's sufficient to call one or the other;
    # we don't need both.
    if servo_dependency:
        # Exceptions are deliberately not caught here: a test that
        # depends on servo must see the repair failure.
        newhost.repair(silent=True)
        return newhost, newhost.get_servo_state()

    if try_servo_repair:
        try:
            newhost.repair()
        except Exception:
            logging.exception('servo repair failed for %s', newhost.hostname)
    else:
        try:
            newhost.verify()
        except Exception:
            logging.exception('servo verify failed for %s', newhost.hostname)
    return newhost, newhost.get_servo_state()
Otabek Kasimov7267a7a2020-03-04 11:18:45 -08001720
1721
def _is_servo_host_information_exist(hostname, port):
    """Check that both a servo hostname and a servo port were supplied.

    @param hostname  Hostname of the servohost; None, empty and
                     whitespace-only values count as missing.
    @param port      servo port number, as an int or as any value that
                     `int()` can convert.

    @returns: True if the hostname is not blank and the port can be
              converted to an int, False otherwise.
    """
    if hostname is None or len(hostname.strip()) == 0:
        return False
    if port is None:
        return False
    try:
        int(port)
    except (TypeError, ValueError):
        # ValueError: non-numeric string; TypeError: a type int() does
        # not accept at all (e.g. a list).  Either way there is no
        # usable port.
        return False
    return True


def is_servo_host_information_valid(hostname, port):
    """Check if provided servo attributes are valid.

    @param hostname Hostname of the servohost.
    @param port     servo port number.

    @returns: A bool value to indicate if provided servo attribute valid.
    """
    if not _is_servo_host_information_exist(hostname, port):
        return False
    # checking range and correct of the port
    port_int = int(port)
    if port_int < 1 or port_int > 65000:
        return False
    # We expect the host to contain only letters, digits, '-', '_', '.'
    # and ':', and to be at least 5 characters long.  The '-' is placed
    # last in the character class so that it is a literal dash and not
    # a range operator.
    if not re.match(r'[a-zA-Z0-9_.:-]*$', hostname) or len(hostname) < 5:
        return False
    return True