blob: a95be30a936bb522f66fefdcc651c8b98e0dc065 [file] [log] [blame]
Derek Beckettf73baca2020-08-19 15:08:47 -07001# Lint as: python2, python3
Fang Deng5d518f42013-08-02 14:04:32 -07002# Copyright (c) 2013 The Chromium OS Authors. All rights reserved.
3# Use of this source code is governed by a BSD-style license that can be
4# found in the LICENSE file.
5#
6# Expects to be run in an environment with sudo and no interactive password
7# prompt, such as within the Chromium OS development chroot.
8
9
10"""This file provides core logic for servo verify/repair process."""
11
12
Derek Beckettf73baca2020-08-19 15:08:47 -070013from __future__ import absolute_import
14from __future__ import division
15from __future__ import print_function
16
Fang Deng5d518f42013-08-02 14:04:32 -070017import logging
Raul E Rangel52ca2e82018-07-03 14:10:14 -060018import os
Ruben Rodriguez Buchillon93084d02020-01-21 15:17:36 -080019import re
20import tarfile
Andrew McRaef0679932020-08-13 09:15:23 +100021import threading
Garry Wang2b5eef92020-08-21 16:23:35 -070022import json
Garry Wangc1288cf2019-12-17 14:58:00 -080023import time
Derek Beckettf73baca2020-08-19 15:08:47 -070024import six
25import six.moves.xmlrpc_client
Fang Deng5d518f42013-08-02 14:04:32 -070026
27from autotest_lib.client.bin import utils
Garry Wang79e9af62019-06-12 15:19:19 -070028from autotest_lib.client.common_lib import error
Richard Barnette9a26ad62016-06-10 12:03:08 -070029from autotest_lib.client.common_lib import hosts
Garry Wang7b0e1b72020-03-25 19:08:59 -070030from autotest_lib.client.common_lib import lsbrelease_utils
Fang Deng5d518f42013-08-02 14:04:32 -070031from autotest_lib.client.common_lib.cros import retry
Garry Wang970fda92021-06-22 18:03:43 -070032from autotest_lib.server import crashcollect
Derek Beckett3d743402021-08-04 09:25:44 -070033from autotest_lib.server import tauto_warnings
Richard Barnette9a26ad62016-06-10 12:03:08 -070034from autotest_lib.server.cros.servo import servo
Garry Wangebc015b2019-06-06 17:45:06 -070035from autotest_lib.server.hosts import base_servohost
Garry Wang11b5e872020-03-11 15:14:08 -070036from autotest_lib.server.hosts import servo_constants
Otabek Kasimov4ea636e2020-04-14 23:35:06 -070037from autotest_lib.server.cros.faft.utils import config
Garry Wang11b5e872020-03-11 15:14:08 -070038from autotest_lib.client.common_lib import global_config
Otabek Kasimov382c3bb2020-10-28 13:22:45 -070039from autotest_lib.server.cros.servo.topology import servo_topology
Garry Wangd7367482020-02-27 13:52:40 -080040
Otabek Kasimov15963492020-06-23 21:10:51 -070041
# Module-level alias for the `global_config.global_config` object.
_CONFIG = global_config.global_config
Fang Deng5d518f42013-08-02 14:04:32 -070043
Otabek Kasimova7ba91a2020-03-09 08:31:01 -070044
Garry Wangebc015b2019-06-06 17:45:06 -070045class ServoHost(base_servohost.BaseServoHost):
46 """Host class for a servo host(e.g. beaglebone, labstation)
Dana Goyette0b6e6402019-10-04 11:09:24 -070047 that with a servo instance for a specific port.
48
49 @type _servo: servo.Servo | None
50 """
Fang Deng5d518f42013-08-02 14:04:32 -070051
    # Default servod port: taken from the SERVOD_PORT environment variable
    # when it is set, otherwise 9999.
    DEFAULT_PORT = int(os.getenv('SERVOD_PORT', '9999'))

    # Timeout, in seconds, for initializing servo signals.
    INITIALIZE_SERVO_TIMEOUT_SECS = 60

    # Default timeout for running a terminal command.
    DEFAULT_TERMINAL_TIMEOUT = 30

    # Name of the method used as the readiness test when connecting to
    # servod through the rpc server tracker.
    SERVO_READY_METHOD = 'get_version'

    # Directory prefix on the servo host where the servod logs are stored.
    SERVOD_LOG_PREFIX = '/var/log/servod'

    # Exit code to use when symlinks for servod logs are not found.
    NO_SYMLINKS_CODE = 9

    # Directory in the job's results directory to dump the logs into.
    LOG_DIR = 'servod'

    # Prefix for joint loglevel files in the logs.
    JOINT_LOG_PREFIX = 'log'

    # Regex group to extract timestamp from logfile name.
    TS_GROUP = 'ts'

    # This regex is used to extract the timestamp from servod log file
    # names; those file names always start with "log.".
    # NOTE(review): the '.' characters in this pattern are unescaped, so
    # they match any character rather than only a literal dot - confirm
    # whether that leniency is intended before tightening it.
    TS_RE = (r'log.'
             # The timestamp is of format %Y-%m-%d--%H-%M-%S.MS
             r'(?P<%s>\d{4}(\-\d{2}){2}\-(-\d{2}){3}.\d{3})'
             # The loglevel is optional depending on labstation version.
             r'(.(INFO|DEBUG|WARNING))?' % TS_GROUP)
    TS_EXTRACTOR = re.compile(TS_RE)

    # Regex group to extract MCU name from logline in servod logs.
    MCU_GROUP = 'mcu'

    # Regex group to extract logline from MCU logline in servod logs.
    LINE_GROUP = 'line'

    # This regex is used to extract the mcu and the line content from an
    # MCU logline in servod logs. e.g. EC or servo_v4 console logs.
    # Here is an example log-line:
    #
    # 2020-01-23 13:15:12,223 - servo_v4 - EC3PO.Console - DEBUG -
    # console.py:219:LogConsoleOutput - /dev/pts/9 - cc polarity: cc1
    #
    # Here is conceptually how they are formatted:
    #
    #  <time> - <MCU> - EC3PO.Console - <LVL> - <file:line:func> - <pts> -
    #  <output>
    #
    # The log format starts with a timestamp
    MCU_RE = (r'[\d\-]+ [\d:,]+ '
              # The mcu that is logging this is next.
              r'- (?P<%s>\w+) - '
              # Next, we have more log outputs before the actual line.
              # Information about the file line, logging function etc.
              # Anchor on EC3PO Console, LogConsoleOutput and dev/pts.
              # NOTE: if the log format changes, this regex needs to be
              # adjusted.
              r'EC3PO\.Console[\s\-\w\d:.]+LogConsoleOutput - /dev/pts/\d+ - '
              # Lastly, we get the MCU's console line.
              r'(?P<%s>.+$)' % (MCU_GROUP, LINE_GROUP))
    MCU_EXTRACTOR = re.compile(MCU_RE)

    # Regex to detect timeout messages when USBC pigtail has timeout issue.
    # e.g.:  [475635.427072 PD TMOUT RX 1/1]
    USBC_PIGTAIL_TIMEOUT_RE = r'\[[\d \.]{1,20}(PD TMOUT RX 1\/1)\]'

    # Suffix to identify compressed logfiles.
    COMPRESSION_SUFFIX = '.tbz2'

    # A suffix to mark servod log directories that came from an instance
    # that ran during this servo_host, but is not the last one running,
    # e.g. when an instance (on purpose, or due to a bug) restarted in the
    # middle of the run.
    OLD_LOG_SUFFIX = 'old'
131
Otabek Kasimovcc9738e2020-02-14 16:17:15 -0800132 def _init_attributes(self):
133 self._servo_state = None
134 self.servo_port = None
135 self.servo_board = None
136 self.servo_model = None
137 self.servo_serial = None
Garry Wangcb06f3b2020-10-08 20:56:21 -0700138 self.servo_setup = None
Otabek Kasimov1b70e8d2020-12-30 13:51:00 -0800139 self.servo_recovery = None
Otabek Kasimovab4ae222021-03-06 01:38:47 -0800140 self.servo_fw_channel = None
Garry Wang6a680062020-11-03 13:40:29 -0800141 self.additional_servod_args = None
Otabek Kasimov39637412020-11-23 19:09:27 -0800142 self._dut_health_profile = None
Garry Wang000c6c02020-05-11 21:27:23 -0700143 # The flag that indicate if a servo is connected to a smart usbhub.
144 # TODO(xianuowang@) remove this flag once all usbhubs in the lab
145 # get replaced.
146 self.smart_usbhub = None
Otabek Kasimovcc9738e2020-02-14 16:17:15 -0800147 self._servo = None
Otabek Kasimov382c3bb2020-10-28 13:22:45 -0700148 self._topology = None
Andrew McRaef0679932020-08-13 09:15:23 +1000149 self._tunnel_proxy = None
150 self._tunnel_proxy_lock = threading.Lock()
Ruben Rodriguez Buchillon5bac3062020-03-25 21:32:58 -0700151 self._initial_instance_ts = None
Ruben Rodriguez Buchillon93084d02020-01-21 15:17:36 -0800152 # Flag to make sure that multiple calls to close do not result in the
153 # logic executing multiple times.
154 self._closed = False
Andrew McRaef0679932020-08-13 09:15:23 +1000155 # Per-thread local data
156 self._local = threading.local()
Fang Deng5d518f42013-08-02 14:04:32 -0700157
    def _initialize(self,
                    servo_host='localhost',
                    servo_port=DEFAULT_PORT,
                    servo_board=None,
                    servo_model=None,
                    servo_serial=None,
                    servo_setup=None,
                    servo_recovery=None,
                    servo_fw_channel=None,
                    additional_servod_args=None,
                    is_in_lab=None,
                    *args,
                    **dargs):
        """Initialize a ServoHost instance.

        A ServoHost instance represents a host that controls a servo.

        @param servo_host: Name of the host where the servod process
                           is running.
        @param servo_port: Port the servod process is listening on. Defaults
                           to the SERVOD_PORT environment variable if set,
                           otherwise 9999.
        @param servo_board: Board that the servo is connected to.
        @param servo_model: Model that the servo is connected to.
        @param servo_serial: Serial number of the servo device.
        @param servo_setup: Type of servo setup, e.g. REGULAR or DUAL_V4.
        @param servo_recovery: Stored as self.servo_recovery; start_servod
                               adds REC_MODE=1 to its command when this is
                               True.
        @param servo_fw_channel: Stored as self.servo_fw_channel; not
                                 otherwise used by this method.
        @param additional_servod_args: Additional args that will append to
                                       servod start command.
        @param is_in_lab: True if the servo host is in Cros Lab. Default is set
                          to None, for which utils.host_is_in_lab_zone will be
                          called to check if the servo host is in Cros lab.

        """
        super(ServoHost, self)._initialize(hostname=servo_host,
                                           is_in_lab=is_in_lab, *args, **dargs)
        # Reset all attributes first, then overwrite the ones that were
        # passed in.
        self._init_attributes()
        self.servo_port = int(servo_port)
        self.servo_board = servo_board
        self.servo_model = servo_model
        self.servo_serial = servo_serial
        self.servo_setup = servo_setup
        self.servo_recovery = servo_recovery
        self.servo_fw_channel = servo_fw_channel
        self.additional_servod_args = additional_servod_args

        # The location of the log files on the servo host for this instance.
        self.remote_log_dir = '%s_%s' % (self.SERVOD_LOG_PREFIX,
                                         self.servo_port)
        # Path of the servo host lock file.
        self._lock_file = (self.TEMP_FILE_DIR + str(self.servo_port) +
                           self.LOCK_FILE_POSTFIX)
        # File path to declare a reboot request.
        self._reboot_file = (self.TEMP_FILE_DIR + str(self.servo_port) +
                             self.REBOOT_FILE_POSTFIX)

        # Lock the servo host if it's an in-lab labstation to prevent other
        # tasks from rebooting it until the current task completes. We also
        # wait and make sure the labstation is up here, in case the
        # labstation is in the middle of a reboot.
        self._is_locked = False
        if (self.wait_up(self.REBOOT_TIMEOUT) and self.is_in_lab()
                    and self.is_labstation()):
            self._lock()
            try:
                self.wait_ready()
            except Exception as e:
                # Best effort: a readiness failure is only logged and does
                # not abort initialization.
                logging.info(
                        'Unexpected error while ensure labstation'
                        ' readiness; %s', str(e))

        self._repair_strategy = None
Richard Barnettee519dcd2016-08-15 17:37:17 -0700229
Dana Goyetteafa62fd2020-03-16 13:45:27 -0700230 def __str__(self):
231 return "<%s '%s:%s'>" % (
232 type(self).__name__, self.hostname, self.servo_port)
233
Richard Barnette9a26ad62016-06-10 12:03:08 -0700234 def connect_servo(self):
Garry Wang8c8dc972020-06-09 13:41:51 -0700235 """ Initialize and setup servo for later use.
236 """
Greg Edelstonff2665d2021-04-21 14:32:27 -0600237 self.initialize_servo()
Garry Wang8c8dc972020-06-09 13:41:51 -0700238 self.initialize_dut_for_servo()
239
Greg Edelstonff2665d2021-04-21 14:32:27 -0600240 def initialize_servo(self):
Kevin Cheng5f2ba6c2016-09-28 10:20:05 -0700241 """Establish a connection to the servod server on this host.
Richard Barnette9a26ad62016-06-10 12:03:08 -0700242
243 Initializes `self._servo` and then verifies that all network
244 connections are working. This will create an ssh tunnel if
245 it's required.
Garry Wang8c8dc972020-06-09 13:41:51 -0700246 """
247 self._servo = servo.Servo(servo_host=self,
248 servo_serial=self.servo_serial)
Richard Barnette9a26ad62016-06-10 12:03:08 -0700249
Garry Wang8c8dc972020-06-09 13:41:51 -0700250 def initialize_dut_for_servo(self):
251 """This method will do some setup for dut control, e.g. setup
252 main servo_v4 device, and also testing the connection between servo
253 and DUT. As a side effect of testing the connection, all signals on
254 the target servo are reset to default values, and the USB stick is
Richard Barnette9a26ad62016-06-10 12:03:08 -0700255 set to the neutral (off) position.
256 """
Garry Wang8c8dc972020-06-09 13:41:51 -0700257 if not self._servo:
258 raise hosts.AutoservVerifyError('Servo object needs to be'
259 ' initialized before initialize'
260 ' DUT.')
Richard Barnette9a26ad62016-06-10 12:03:08 -0700261 timeout, _ = retry.timeout(
Garry Wang8c8dc972020-06-09 13:41:51 -0700262 self._servo.initialize_dut,
263 timeout_sec=self.INITIALIZE_SERVO_TIMEOUT_SECS)
Richard Barnette9a26ad62016-06-10 12:03:08 -0700264 if timeout:
Garry Wang8c8dc972020-06-09 13:41:51 -0700265 raise hosts.AutoservVerifyError('Initialize dut for servo timed'
266 ' out.')
Richard Barnette9a26ad62016-06-10 12:03:08 -0700267
Richard Barnette9a26ad62016-06-10 12:03:08 -0700268 def disconnect_servo(self):
Kevin Cheng5f2ba6c2016-09-28 10:20:05 -0700269 """Disconnect our servo if it exists.
Richard Barnette9a26ad62016-06-10 12:03:08 -0700270
271 If we've previously successfully connected to our servo,
272 disconnect any established ssh tunnel, and set `self._servo`
273 back to `None`.
274 """
275 if self._servo:
276 # N.B. This call is safe even without a tunnel:
277 # rpc_server_tracker.disconnect() silently ignores
278 # unknown ports.
279 self.rpc_server_tracker.disconnect(self.servo_port)
280 self._servo = None
Fang Deng5d518f42013-08-02 14:04:32 -0700281
Andrew McRaef0679932020-08-13 09:15:23 +1000282 def _maybe_create_servod_ssh_tunnel_proxy(self):
283 """Create a xmlrpc proxy for use with a ssh tunnel.
284 A lock is used to safely create a singleton proxy.
285 """
286 with self._tunnel_proxy_lock:
287 if self._tunnel_proxy is None:
288 self._tunnel_proxy = self.rpc_server_tracker.xmlrpc_connect(
289 None,
290 self.servo_port,
291 ready_test_name=self.SERVO_READY_METHOD,
292 timeout_seconds=60,
293 request_timeout_seconds=3600,
294 server_desc=str(self))
295
Andrew McRaef0679932020-08-13 09:15:23 +1000296 def get_servod_server_proxy(self):
297 """Return a proxy if it exists; otherwise, create a new one.
298 A proxy can either be a ssh tunnel based proxy, or a httplib
299 based proxy.
Fang Deng5d518f42013-08-02 14:04:32 -0700300
301 @returns: An xmlrpclib.ServerProxy that is connected to the servod
302 server on the host.
Fang Deng5d518f42013-08-02 14:04:32 -0700303 """
Garry Wang11b5e872020-03-11 15:14:08 -0700304 if (servo_constants.ENABLE_SSH_TUNNEL_FOR_SERVO
305 and not self.is_localhost()):
Andrew McRaef0679932020-08-13 09:15:23 +1000306 # Check for existing ssh tunnel proxy.
307 if self._tunnel_proxy is None:
308 self._maybe_create_servod_ssh_tunnel_proxy()
309 return self._tunnel_proxy
Richard Barnette9a26ad62016-06-10 12:03:08 -0700310 else:
Andrew McRaef0679932020-08-13 09:15:23 +1000311 # xmlrpc/httplib is not thread-safe, so each thread must have its
312 # own separate proxy connection.
313 if not hasattr(self._local, "_per_thread_proxy"):
314 remote = 'http://%s:%s' % (self.hostname, self.servo_port)
Derek Beckettf73baca2020-08-19 15:08:47 -0700315 self._local._per_thread_proxy = six.moves.xmlrpc_client.ServerProxy(remote)
Andrew McRaef0679932020-08-13 09:15:23 +1000316 return self._local._per_thread_proxy
Wai-Hong Tam3a8a2552019-11-19 14:28:04 +0800317
Richard Barnette1edbb162016-11-01 11:47:50 -0700318 def verify(self, silent=False):
319 """Update the servo host and verify it's in a good state.
320
321 @param silent If true, suppress logging in `status.log`.
322 """
Richard Barnetteabbdc252018-07-26 16:57:42 -0700323 message = 'Beginning verify for servo host %s port %s serial %s'
324 message %= (self.hostname, self.servo_port, self.servo_serial)
325 self.record('INFO', None, None, message)
Derek Beckett3d743402021-08-04 09:25:44 -0700326 tauto_warnings.lab_services_warn_and_error("Verify Servo state")
Fang Deng5d518f42013-08-02 14:04:32 -0700327
Garry Wang2b5eef92020-08-21 16:23:35 -0700328 def _get_default_usbkey_mount_path(self):
329 return '/media/servo_usb/%s' % self.servo_port
Fang Deng5d518f42013-08-02 14:04:32 -0700330
Garry Wang7b0e1b72020-03-25 19:08:59 -0700331 def get_image_name_from_usbkey(self, usbkey_dev):
332 """Mount usb drive and check ChromeOS image name on it if there is
333 one. This method assumes the image_usbkey_direction is already set
334 to servo side.
335
Garry Wang4b980202020-09-24 17:00:17 -0700336 @param usbkey_dev: usbkey dev path(e.g. /dev/sdb).
Garry Wang7b0e1b72020-03-25 19:08:59 -0700337
338 @returns: image_name on the usbkey, e.g. nami-release/R82.10138.0.0,
339 or empty string if no test image detected, or unexpected
340 error occurred.
Garry Wang7b0e1b72020-03-25 19:08:59 -0700341 """
Garry Wang70e5d062020-04-03 18:01:05 -0700342 logging.info('Checking ChromeOS image name on usbkey.')
Garry Wang2b5eef92020-08-21 16:23:35 -0700343 mount_dst = self._get_default_usbkey_mount_path()
Garry Wang7b0e1b72020-03-25 19:08:59 -0700344 # Unmount if there is an existing stale mount.
Garry Wang2b5eef92020-08-21 16:23:35 -0700345 self._unmount_drive(mount_dst)
346 # ChromeOS root fs is in /dev/sdx3
347 mount_src = usbkey_dev + '3'
Garry Wang7b0e1b72020-03-25 19:08:59 -0700348 try:
Garry Wang2b5eef92020-08-21 16:23:35 -0700349 if not self._mount_drive(mount_src, mount_dst):
350 logging.debug('Unexpected error occurred on mount usb drive.')
Garry Wang7b0e1b72020-03-25 19:08:59 -0700351 return ''
Garry Wang70e5d062020-04-03 18:01:05 -0700352
353 release_content = self.run(
Garry Wang2b5eef92020-08-21 16:23:35 -0700354 'cat %s/etc/lsb-release' % mount_dst,
Garry Wang70e5d062020-04-03 18:01:05 -0700355 ignore_status=True).stdout.strip()
356
357 if not re.search(r'RELEASE_TRACK=.*test', release_content):
358 logging.info('The image on usbkey is not a test image')
359 return ''
360
361 return lsbrelease_utils.get_chromeos_release_builder_path(
362 lsb_release_content=release_content)
Garry Wang7b0e1b72020-03-25 19:08:59 -0700363 finally:
Garry Wang70e5d062020-04-03 18:01:05 -0700364 logging.debug('Image check compeleted, unmounting the usb drive.')
Garry Wang2b5eef92020-08-21 16:23:35 -0700365 self._unmount_drive(mount_dst)
Garry Wang7b0e1b72020-03-25 19:08:59 -0700366
Garry Wang2b5eef92020-08-21 16:23:35 -0700367 def _extract_firmware_image_from_usbkey(self, fw_dst):
368 """Extract firmware images from the usbkey on servo, this method
369 assumes there is already a ChromeOS test image staged on servo.
370
Garry Wang4b980202020-09-24 17:00:17 -0700371 @param fw_dst: the path that we'll copy firmware images to.
Garry Wang2b5eef92020-08-21 16:23:35 -0700372
373 @returns: a json format string of firmware manifest data.
374 """
375 usbkey_dev = self._probe_and_validate_usb_dev()
376 if not usbkey_dev:
377 raise hosts.AutoservRepairError('Unexpected error occurred when'
378 ' probe usbkey dev path, please check logs for detail.')
379
380 mount_dst = self._get_default_usbkey_mount_path()
381 # Unmount if there is an existing stale mount.
382 self._unmount_drive(mount_dst)
383 # ChromeOS root fs is in /dev/sdx3
384 mount_src = usbkey_dev + '3'
385 try:
386 if not self._mount_drive(mount_src, mount_dst):
387 raise hosts.AutoservRepairError('Failed to extract firmware'
388 ' image; Unable to mount %s.' % usbkey_dev,
389 'unable to mount usbkey')
390 updater_bin = os.path.join(mount_dst,
391 'usr/sbin/chromeos-firmwareupdate')
392 self.run('%s --unpack %s' % (updater_bin, fw_dst))
393 return self.run('%s --manifest' % updater_bin).stdout
394 finally:
395 self._unmount_drive(mount_dst)
396
397 def prepare_repair_firmware_image(self, fw_dst=None):
398 """Prepare firmware image on the servohost for auto repair process
399 to consume.
400
Garry Wang4b980202020-09-24 17:00:17 -0700401 @param fw_dst: the path that we want to store firmware image on
402 the servohost.
Garry Wang2b5eef92020-08-21 16:23:35 -0700403
404 @returns: A tuple that containes ec firmware image path and bios
405 firmware image path on the servohost, or None if type of
406 image is not available based on manifest and dut's model.
407 """
408 model = self.servo_model or self._dut_host_info.model
409 if not model:
410 raise hosts.AutoservRepairError(
411 'Could not determine DUT\'s model.',
412 'model infomation unknown')
413
414 if not fw_dst:
415 fw_dst = '/tmp/firmware_image/%s' % self.servo_port
416 # Cleanup and re-create dst path to have a fresh start.
417 self.run('rm -rf %s' % fw_dst)
418 self.run('mkdir -p %s' % fw_dst)
419
420 manifest = json.loads(self._extract_firmware_image_from_usbkey(fw_dst))
Garry Wang50b56c12020-09-24 17:26:52 -0700421 # For models that have packed $MODEL_signed variant, we want use the
422 # 'signed' variant once we get DVT devices, so try to read manifest
423 # from $MODEL_signed first.
424 build = manifest.get('%s_signed' % model) or manifest.get(model)
425 if not build:
Garry Wang2b5eef92020-08-21 16:23:35 -0700426 raise hosts.AutoservRepairError('Could not find firmware manifest'
427 ' for model:%s' % model, 'model manifest not found')
428 try:
Garry Wang50b56c12020-09-24 17:26:52 -0700429 ec_image = os.path.join(fw_dst, build['ec']['image'])
Garry Wang2b5eef92020-08-21 16:23:35 -0700430 except KeyError:
431 ec_image = None
432 try:
Garry Wang50b56c12020-09-24 17:26:52 -0700433 bios_image = os.path.join(fw_dst, build['host']['image'])
Garry Wang2b5eef92020-08-21 16:23:35 -0700434 except KeyError:
435 bios_image = None
436 if not ec_image and not bios_image:
437 raise hosts.AutoservRepairError('Could not find any firmware image'
438 ' for model:%s' % model, 'cannot find firmware image')
439 return ec_image, bios_image
Garry Wang7b0e1b72020-03-25 19:08:59 -0700440
Garry Wang4b980202020-09-24 17:00:17 -0700441 def flash_ap_firmware_via_servo(self, image):
442 """Flash AP firmware by use a provided image.
443
444 This is will be a short term enhanment for infra repair use, it use
445 'futility update' which will automatically determine various parameters
446 needed for flashrom, and will preserve the GBB, VPD, and HWID for
447 AP firmware update.
448 @TODO(xianuowang@) Remove this method once b/148403277 implemented.
449
450 @param image: the firmware image path on servohost.
451 """
452 cmd = 'futility update -i %s --servo_port=%s'
453 self.run(cmd % (image, self.servo_port), timeout=900)
454
Garry Wang70e5d062020-04-03 18:01:05 -0700455 def _probe_and_validate_usb_dev(self):
456 """This method probe the usb dev path by talking to servo, and then
457 validate the dev path is valid block device to servohost.
458 Possible output:
459 1. Encounter error during probe usb dev, returns empty string.
460 2. probe usb dev completed without error but cannot find usb dev,
461 raise AutoservRepairError.
462 3. probe usb dev find a usb dev path, but failed validation in this
463 method, raise AutoservRepairError.
Garry Wang7b0e1b72020-03-25 19:08:59 -0700464
Garry Wang70e5d062020-04-03 18:01:05 -0700465 @returns: A string of usb dev path(e.g. '/dev/sdb'), or empty string
466 if unexpected error occurred during probe.
467 @raises: AutoservRepairError if servo couldn't probe the usb dev path
468 (servo.probe_host_usb_dev() returns empty string), or the dev path is
469 not valid block device to servohost.
Garry Wang7b0e1b72020-03-25 19:08:59 -0700470 """
471 logging.info('Validating image usbkey on servo.')
Garry Wang7b0e1b72020-03-25 19:08:59 -0700472 try:
Garry Wang70e5d062020-04-03 18:01:05 -0700473 usb_dev = self._servo.probe_host_usb_dev()
Garry Wang7b0e1b72020-03-25 19:08:59 -0700474 except Exception as e:
475 # We don't want any unexpected or transient servo communicating
476 # failure block usb repair, so capture all errors here.
477 logging.error(e, exc_info=True)
478 logging.error('Unexpected error occurred on get usbkey dev path,'
479 ' skipping usbkey validation.')
480 return ''
481
Garry Wang70e5d062020-04-03 18:01:05 -0700482 if usb_dev:
483 # probe_host_usb_dev() sometimes return stale record,
484 # so we need to make sure the path exists in fdisk.
Otabek Kasimov77bff672020-10-08 15:52:03 -0700485 validate_cmd = 'fdisk -l %s' % usb_dev
Garry Wang11441182020-06-16 18:34:14 -0700486 try:
Otabek Kasimov77bff672020-10-08 15:52:03 -0700487 resp = self.run(validate_cmd, ignore_status=True, timeout=30)
Garry Wang11441182020-06-16 18:34:14 -0700488 if resp.exit_status == 0:
489 return usb_dev
Garry Wang11441182020-06-16 18:34:14 -0700490 logging.error('%s is reported from "image_usbkey_dev" control'
491 ' but not detected by fdisk!', usb_dev)
492 except error.AutoservRunError as e:
493 if 'Timeout encountered' in str(e):
494 logging.warning('Timeout encountered during fdisk run,'
495 ' skipping usbkey validation.')
496 return ''
497 raise
Garry Wang70e5d062020-04-03 18:01:05 -0700498
499 raise hosts.AutoservRepairError(
500 'No usbkey detected on servo, the usbkey may be either missing'
501 ' or broken. Please replace usbkey on the servo and retry.',
502 'missing usbkey')
503
Otabek Kasimov4ea636e2020-04-14 23:35:06 -0700504 def is_ec_supported(self):
Garry Wang9b8f2342020-04-17 16:34:09 -0700505 """Check if ec is supported on the servo_board"""
Otabek Kasimov4ea636e2020-04-14 23:35:06 -0700506 if self.servo_board:
507 try:
508 frm_config = config.Config(self.servo_board, self.servo_model)
509 return frm_config.chrome_ec
510 except Exception as e:
511 logging.error('Unexpected error when read from firmware'
512 ' configs; %s', str(e))
513 return False
514
Garry Wang70e5d062020-04-03 18:01:05 -0700515 def validate_image_usbkey(self):
516 """This method first validate if there is a recover usbkey on servo
517 that accessible to servohost, and second check if a ChromeOS image is
518 already on the usb drive and return the image_name so we can avoid
519 unnecessary download and flash to the recover usbkey on servo.
520
521 Please note that, there is special error handling logic here:
522 1. If unexpected error happens, we return empty string. So repair
523 actions will not get blocked.
524 2. If no working usbkey present on servo, but no errors, we'll raise
525 AutoservRepairError here.
526
527 @returns: image_name on the usbkey, e.g. nami-release/R82.10138.0.0,
528 or empty string if no test image detected, or unexpected
529 error occurred.
530 @raises: AutoservRepairError if the usbkey is not detected on servo.
531 """
532 usb_dev = self._probe_and_validate_usb_dev()
533 if usb_dev:
534 return self.get_image_name_from_usbkey(usb_dev)
535 else:
536 return ''
Garry Wang7b0e1b72020-03-25 19:08:59 -0700537
Richard Barnette1edbb162016-11-01 11:47:50 -0700538 def repair(self, silent=False):
539 """Attempt to repair servo host.
540
541 @param silent If true, suppress logging in `status.log`.
542 """
Richard Barnetteabbdc252018-07-26 16:57:42 -0700543 message = 'Beginning repair for servo host %s port %s serial %s'
544 message %= (self.hostname, self.servo_port, self.servo_serial)
545 self.record('INFO', None, None, message)
Derek Beckett3d743402021-08-04 09:25:44 -0700546 tauto_warnings.lab_services_warn_and_error("Servo repair")
Garry Wang63b8c382020-03-11 22:28:40 -0700547
Garry Wang63b8c382020-03-11 22:28:40 -0700548 def _is_critical_error(self, error):
549 if (isinstance(error, hosts.AutoservVerifyDependencyError)
550 and not error.is_critical()):
551 logging.warning('Non-critical verify failure(s) detected during'
552 ' verify/repair servo, servo connection will'
Evan Benn2c41c262020-10-28 11:34:27 +1100553 ' still be up but may not be fully functional.'
554 ' Some repair actions and servo dependent'
Garry Wang63b8c382020-03-11 22:28:40 -0700555 ' tests may not run.')
556 return False
Evan Benn2c41c262020-10-28 11:34:27 +1100557 logging.info(
558 'Critical verify failure(s) detected during repair/verify '
559 'servo. Disconnecting servo and running `stop servod`, all'
560 ' repair actions and tests that depends on servo will not '
561 'run.')
Garry Wang63b8c382020-03-11 22:28:40 -0700562 return True
Fang Deng5d518f42013-08-02 14:04:32 -0700563
Dan Shi4d478522014-02-14 13:46:32 -0800564 def get_servo(self):
565 """Get the cached servo.Servo object.
Fang Deng5d518f42013-08-02 14:04:32 -0700566
Dan Shi4d478522014-02-14 13:46:32 -0800567 @return: a servo.Servo object.
Dana Goyette353d1d92019-06-27 10:43:59 -0700568 @rtype: autotest_lib.server.cros.servo.servo.Servo
Fang Deng5d518f42013-08-02 14:04:32 -0700569 """
Dan Shi4d478522014-02-14 13:46:32 -0800570 return self._servo
571
Garry Wang79e9af62019-06-12 15:19:19 -0700572 def request_reboot(self):
573 """Request servohost to be rebooted when it's safe to by touch a file.
574 """
575 logging.debug('Request to reboot servohost %s has been created by '
Garry Wang464ff1e2019-07-18 17:20:34 -0700576 'servo with port # %s', self.hostname, self.servo_port)
Garry Wang79e9af62019-06-12 15:19:19 -0700577 self.run('touch %s' % self._reboot_file, ignore_status=True)
578
Garry Wang464ff1e2019-07-18 17:20:34 -0700579 def withdraw_reboot_request(self):
580 """Withdraw a servohost reboot request if exists by remove the flag
581 file.
582 """
583 logging.debug('Withdrawing request to reboot servohost %s that created'
584 ' by servo with port # %s if exists.',
585 self.hostname, self.servo_port)
586 self.run('rm -f %s' % self._reboot_file, ignore_status=True)
587
def start_servod(self, quick_startup=False):
    """Start the servod process on the servohost and wait for it to be up.

    Nothing is done when the servohost is the localhost.

    @param quick_startup: bool, if True wait
            servo_constants.SERVOD_QUICK_STARTUP_TIMEOUT seconds after the
            start command, otherwise servo_constants.SERVOD_STARTUP_TIMEOUT.
    """
    # Skip if running on the localhost.(crbug.com/1038168)
    if self.is_localhost():
        logging.debug("Servohost is a localhost, skipping start servod.")
        return

    # Collect the command pieces in order; they are joined with single
    # spaces right before the command is run.
    pieces = ['start servod']
    if self.servo_board:
        pieces.append('BOARD=%s' % self.servo_board)
        # MODEL is only passed along together with a BOARD.
        if self.servo_model:
            pieces.append('MODEL=%s' % self.servo_model)
    else:
        logging.warning('Board for DUT is unknown; starting servod'
                        ' assuming a pre-configured board.')

    pieces.append('PORT=%d' % self.servo_port)
    if self.servo_serial:
        pieces.append('SERIAL=%s' % self.servo_serial)

    # Start servod with dual_v4 based on servo_setup.
    if self.is_dual_setup():
        pieces.append('DUAL_V4=1')

    # Start servod with CONFIG=cr50.xml which is required for some pools.
    if self._require_cr50_servod_config():
        pieces.append('CONFIG=cr50.xml')

    if self.servo_recovery == True:
        pieces.append('REC_MODE=1')

    # Append customized args, if any.
    if self.additional_servod_args:
        pieces.append(self.additional_servod_args)

    # Drop the 'latest' symlinks first so that a failed servod start
    # cannot make us grab logs of an older instance by mistake.
    self.remove_latest_log_symlinks()
    self.run(' '.join(pieces), timeout=60)

    # There's a lag between when `start servod` completes and when
    # the _ServodConnectionVerifier trigger can actually succeed.
    # The sleep below gives servod time to get ready so that the
    # trigger won't fail after we return.
    #
    # Normally servod on servo_v3 and labstation takes ~10 seconds to be
    # ready, but in the rare case that all servos on a labstation are in
    # heavy use it may take ~30 seconds. The timeouts double these values;
    # the quick one is meant for the first servohost initialization and
    # the standard one for repair.
    wait_seconds = (servo_constants.SERVOD_QUICK_STARTUP_TIMEOUT
                    if quick_startup
                    else servo_constants.SERVOD_STARTUP_TIMEOUT)
    logging.debug('Wait %s seconds for servod process fully up.',
                  wait_seconds)
    time.sleep(wait_seconds)
    # Cache the initial instance timestamp to check against servod restarts
    self._initial_instance_ts = self.get_instance_logs_ts()
Garry Wangc1288cf2019-12-17 14:58:00 -0800648
def stop_servod(self):
    """Stop the servod process on the servohost and wait for its teardown.

    Nothing is done when the servohost is the localhost. The stop command
    is run with ignore_status=True, after which this method sleeps for
    servo_constants.SERVOD_TEARDOWN_TIMEOUT seconds.
    """
    # Skip if running on the localhost.(crbug.com/1038168)
    if self.is_localhost():
        logging.debug("Servohost is a localhost, skipping stop servod.")
        return

    port = self.servo_port
    logging.debug('Stopping servod on port %s', port)
    self.run('stop servod PORT=%d' % port, timeout=60, ignore_status=True)

    teardown_wait = servo_constants.SERVOD_TEARDOWN_TIMEOUT
    logging.debug('Wait %s seconds for servod process fully teardown.',
                  teardown_wait)
    time.sleep(teardown_wait)
Garry Wangc1288cf2019-12-17 14:58:00 -0800663
def restart_servod(self, quick_startup=False):
    """Restart servod on the servohost: stop it, then start it again.

    @param quick_startup: bool, forwarded unchanged to start_servod().
    """
    self.stop_servod()
    self.start_servod(quick_startup)
669
def _process_servodtool_error(self, response):
    """Log the reason behind a non-zero servodtool response.

    The stdout of |response| is searched for the known servodtool error
    messages defined in servo_constants; anything else is logged as an
    unexpected error.

    @param response: result object of the failed command; only its
            stdout attribute is read here.
    """
    output = response.stdout
    if re.search(servo_constants.ERROR_MESSAGE_USB_HUB_NOT_COMPATIBLE,
                 output):
        logging.error('The servo is not plugged on a usb hub that supports'
                      ' power-cycle!')
        # change the flag so we can update this label in later process.
        self.smart_usbhub = False
    elif re.search(servo_constants.ERROR_MESSAGE_DEVICE_NOT_FOUND %
                   self.servo_serial, output):
        logging.error('No servo with serial %s found!', self.servo_serial)
    else:
        logging.error('Unexpected error occurred from usbhub control, please'
                      ' file a bug and inform chrome-fleet-software@ team!')
688
def get_main_servo_usb_path(self):
    """Collect the current usb-path of the main servo device.

    The usb-path is the path to the folder where the usb-device was
    enumerated. It is queried with `servodtool device -s SERIAL usb-path`.

    @returns: string, usb-path to the main servo device,
              e.g.: '/sys/bus/usb/devices/1-6.1.3.1'.
              An empty string ('') if the query raised or exited non-zero.
    """
    # TODO remove try-except when fix crbug.com/1087964
    try:
        query = 'servodtool device -s %s usb-path' % self.servo_serial
        result = self.run(query, ignore_status=True, timeout=30)
    except Exception as e:
        # Only timeout errors are expected to land here, as other
        # failures are filtered by ignore_status=True.
        logging.debug('Attempt to get servo usb-path failed due to '
                      'timeout; %s', e)
        return ''

    if result.exit_status != 0:
        self._process_servodtool_error(result)
        return ''

    path = result.stdout.strip()
    logging.info('Usb path of servo %s is %s', self.servo_serial, path)
    return path
Garry Wangffbd2162020-04-17 16:13:48 -0700714
def _get_servo_usb_devnum(self):
    """Collect the current usb devnum of the servo.

    The devnum is read from the `devnum` file under the usb-path reported
    by get_main_servo_usb_path().

    @returns: string, the stripped content of the devnum file, or an empty
              string ('') if the usb-path is unknown or reading failed.
    """
    servo_usb_path = self.get_main_servo_usb_path()
    if not servo_usb_path:
        return ''
    result = self.run('cat %s/devnum' % servo_usb_path, ignore_status=True)
    if result.exit_status == 0:
        return result.stdout.strip()
    self._process_servodtool_error(result)
    return ''
725
def reboot_servo_v3_on_need(self):
    """Reboot a servo_v3 host if one of the conditions below holds.

    1. There is an update pending on reboot.
    2. The servo_v3 has been up for more than 96 hours.

    Hosts whose board is not 'beaglebone_servo' are left alone. A failing
    reboot is logged and recorded, it is never raised to the caller.
    """
    if self.get_board() != 'beaglebone_servo':
        logging.info('Servo reboot is only applicable for servo V3.')
        return

    pending_update = (self._check_update_status() ==
                      self.UPDATE_STATE.PENDING_REBOOT)
    hours_up = float(self.check_uptime())/3600
    logging.info('Uptime of servo_v3: %s hour(s)', hours_up)
    up_too_long = hours_up > 96

    # Nothing to do when neither condition is met.
    if not pending_update and not up_too_long:
        return

    # A pending update takes precedence over the uptime condition.
    if pending_update:
        message = 'Starting reboot servo_v3 because an update is pending.'
        do_reboot = self._post_update_reboot
    else:
        message = 'Starting reboot servo_v3 because uptime > 96 hours.'
        do_reboot = self._servo_host_reboot
    self.record('INFO', None, None, message)
    logging.info(message)

    try:
        do_reboot()
    except Exception as e:
        logging.debug("Fail to reboot servo_v3; %s", e)
        message = ('Servo_v3 reboot failed, please check debug log '
                   'for details.')
    else:
        message = 'Servo_v3 reboot completed successfully.'
    logging.info(message)
    self.record('INFO', None, None, message)
Garry Wangffbd2162020-04-17 16:13:48 -0700762
def _reset_servo(self):
    """Power-cycle the servo with `servodtool device -s SERIAL power-cycle`.

    After a successful power-cycle this sleeps for
    servo_constants.SERVO_RESET_TIMEOUT_SECONDS and sets
    self.smart_usbhub to True.

    @returns: True if the power-cycle command exited with status 0,
              False if it exited non-zero or raised.
    """
    logging.info('Resetting servo through smart usbhub.')
    # TODO remove try-except when fix crbug.com/1087964
    try:
        power_cycle_cmd = ('servodtool device -s %s power-cycle' %
                           self.servo_serial)
        result = self.run(power_cycle_cmd, ignore_status=True, timeout=30)
        if result.exit_status != 0:
            self._process_servodtool_error(result)
            return False
    except Exception as e:
        # Only timeout errors are expected to land here, as other
        # failures are filtered by ignore_status=True.
        logging.debug('Attempt to reset servo failed due to timeout;'
                      ' %s', e)
        return False

    settle_seconds = servo_constants.SERVO_RESET_TIMEOUT_SECONDS
    logging.debug('Wait %s seconds for servo to come back from reset.',
                  settle_seconds)
    time.sleep(settle_seconds)
    # change the flag so we can update this label in later process.
    self.smart_usbhub = True
    return True
786
def reset_servo(self):
    """Reset (power-cycle) the servo via the smart usbhub.

    Only done when is_labstation() is true. The usb devnum of the servo is
    collected before and after the reset; the outcome is logged and
    recorded as an INFO record.
    """
    if not self.is_labstation():
        logging.info('Servo reset is not applicable to servo_v3.')
        return

    devnum_before = self._get_servo_usb_devnum()
    logging.info('Servo usb devnum before reset: %s', devnum_before)
    if not self._reset_servo():
        message = ('Failed to reset servo with serial: %s. (Please ignore'
                   ' this error if the DUT is not connected to a smart'
                   ' usbhub).' % self.servo_serial)
        logging.warning(message)
        self.record('INFO', None, None, message)
        return

    devnum_after = self._get_servo_usb_devnum()
    logging.info('Servo usb devnum after reset: %s', devnum_after)
    if not devnum_before or not devnum_after:
        # One of the devnums could not be collected.
        message = ('Servo reset completed but unable to verify'
                   ' devnum change!')
    elif devnum_before == devnum_after:
        message = 'Servo reset completed but devnum is still not changed!'
    else:
        message = ('Reset servo with serial %s completed successfully!'
                   % self.servo_serial)
    logging.info(message)
    self.record('INFO', None, None, message)
817
def _extract_compressed_logs(self, logdir, relevant_files):
    """Decompress servod logs in |logdir|.

    Every file in |relevant_files| that ends with |COMPRESSION_SUFFIX| is
    treated as an archive holding a single compressed log. The log is
    extracted directly into |logdir| under the archive's basename without
    the suffix, and the archive is deleted afterwards. An archive without
    any member is logged, deleted, and contributes no extracted file.

    @param logdir: directory containing compressed servod logs.
    @param relevant_files: list of files in |logdir| to consider.

    @returns: tuple, (tarfiles, files) where
              tarfiles: list of the compressed filenames that have been
                        processed and deleted
              files: list of the uncompressed files that were generated
    """
    suffix = self.COMPRESSION_SUFFIX
    # For all tar-files, first extract them to the directory, and
    # then let the common flow handle them.
    tarfiles = [cf for cf in relevant_files if cf.endswith(suffix)]
    files = []
    for archive in tarfiles:
        norm_name = os.path.basename(archive)[:-len(suffix)]
        with tarfile.open(archive) as tf:
            # Each tarfile is expected to have only one member: the
            # compressed log. Use the public getmembers() API and guard
            # against an empty archive instead of indexing blindly.
            members = tf.getmembers()
            if members:
                member = members[0]
                # Rename the member so that only the basename gets
                # extracted, and not the directories etc.
                member.name = norm_name
                tf.extract(member, logdir)
                files.append(os.path.join(logdir, norm_name))
            else:
                logging.warning('Compressed servod log %r is empty. '
                                'Nothing to extract.', archive)
        # Archive has been processed: remove the compressed file.
        os.remove(archive)
    return tarfiles, files
848
def _extract_mcu_logs(self, log_subdir):
    """Extract MCU (EC, Cr50, etc) console output from servod debug logs.

    Every line of |log_subdir|/log.DEBUG.txt that matches the MCU_EXTRACTOR
    regex is split into an MCU name (group MCU_GROUP, lowercased) and a
    console line (group LINE_GROUP). The console line is appended to
    |log_subdir|/<mcu>.txt, e.g. ec.txt or servo_v4.txt, so only MCUs with
    console input/output get a file.

    @param log_subdir: directory with log.DEBUG.txt main servod debug logs.
    """
    # The MCU logs are only in the .DEBUG files.
    mcu_lines_file = os.path.join(log_subdir, 'log.DEBUG.txt')
    if not os.path.exists(mcu_lines_file):
        logging.info('No DEBUG logs found to extract MCU logs from.')
        return
    # Maps the MCU name to its open output file.
    mcu_files = {}
    mcu_file_template = '%s.txt'
    try:
        with open(mcu_lines_file, 'r') as f:
            for line in f:
                match = self.MCU_EXTRACTOR.match(line)
                if not match:
                    continue
                mcu = match.group(self.MCU_GROUP).lower()
                if mcu not in mcu_files:
                    mcu_file = os.path.join(log_subdir,
                                            mcu_file_template % mcu)
                    mcu_files[mcu] = open(mcu_file, 'a')
                mcu_files[mcu].write(match.group(self.LINE_GROUP) + '\n')
    finally:
        # Close every per-MCU file even if reading or writing failed
        # half-way, so that no file handle is leaked.
        for fd in mcu_files.values():
            fd.close()
881
def remove_latest_log_symlinks(self):
    """Remove the convenience 'latest' symlinks of the servod logs.

    Runs `rm` on every entry matching 'latest*' in |remote_log_dir|, with
    ignore_status=True and stderr_tee=None.
    """
    self.run('rm %s/latest*' % self.remote_log_dir,
             stderr_tee=None, ignore_status=True)
887
def probe_servod_restart(self, instance_ts, outdir):
    """Grab servod logs from previous instances if part of this session.

    If |instance_ts| differs from the timestamp cached in
    |_initial_instance_ts|, servod is considered to have restarted. The
    logs of every instance between the two timestamps are then collected
    with get_instance_logs(..., old=True), which marks them with
    |OLD_LOG_SUFFIX|.

    Afterwards, if a servo object is available, a panicinfo command is
    issued on each servo device uart control that exists, to try and get
    reboot information into the current logs.

    @param instance_ts: the log timestamp that the current instance uses
    @param outdir: directory to create a subdirectory into to place the
                   servod logs into.
    """
    first_ts = self._initial_instance_ts
    if first_ts is None:
        logging.info('No log timestamp grabbed successfully on servod '
                     'startup. Cannot check device restarts. Ignoring.')
        return
    if instance_ts == first_ts:
        logging.debug('Servod appears to have run without restarting')
        return

    # Servod seems to have restarted (at least once). Find all timestamps
    # from the first one up to (excluding) the current one, and grab the
    # logs for each.
    old_timestamps = self._find_instance_timestamps_between(first_ts,
                                                            instance_ts)
    logging.info('Servod has restarted %d times between the start and the '
                 'end of this servo_host.', len(old_timestamps))
    logging.info('This might be an issue. Will extract all logs from each '
                 'instance.')
    logging.info('Logs that are not the currently running (about to turn '
                 'down) instance are maked with a .%s in their folder.',
                 self.OLD_LOG_SUFFIX)
    for old_ts in old_timestamps:
        self.get_instance_logs(old_ts, outdir, old=True)

    # Lastly, servod has restarted due to a potential issue. Try to get
    # panic information from the servo devices for the current logs.
    # This can only happen if the |_servo| attribute is initialized.
    if not self._servo:
        return
    for mcu in ['servo_micro', 'servo_v4', 'servo_v4p1']:
        uart_ctrl = '%s_uart_cmd' % mcu
        if not self._servo.has_control(uart_ctrl):
            continue
        logging.info('Trying to retrieve %r panicinfo into logs', mcu)
        try:
            self._servo.set_nocheck(uart_ctrl, 'panicinfo')
        except error.TestFail as e:
            logging.error('Failed to generate panicinfo for %r '
                          'logs. %s', mcu, str(e))
937
def _find_instance_timestamps_between(self, start_ts, end_ts):
    """Find all log timestamps between [start_ts, end_ts).

    The timestamps are extracted with TS_EXTRACTOR from the names listed
    by `ls` in |remote_log_dir|, de-duplicated and sorted.

    @param start_ts: str, earliest log timestamp of interest
    @param end_ts: str, latest log timestamp of interest

    @returns: list, all timestamps between start_ts and end_ts, end_ts
              exclusive, on the servo_host. An empty list on errors, i.e.
              when listing fails or either timestamp is not found.
    """
    listing = self.run('ls %s' % self.remote_log_dir,
                       stderr_tee=None, ignore_status=True)
    if listing.exit_status != 0:
        # Here we failed to find anything.
        logging.info('Failed to find remote servod logs. Ignoring.')
        return []

    # Names failing the extractor are simply ignored. They might be the
    # 'latest' symlinks or random files.
    matches = (self.TS_EXTRACTOR.match(name)
               for name in listing.stdout.strip().split())
    ordered = sorted(set(m.group(self.TS_GROUP) for m in matches if m))

    for ts in (start_ts, end_ts):
        if ts not in ordered:
            logging.error('Timestamp %r not in servod logs. Cannot query '
                          'for timestamps in between %r and %r', ts,
                          start_ts, end_ts)
            return []
    first = ordered.index(start_ts)
    last = ordered.index(end_ts)
    return ordered[first:last]
972
def get_instance_logs_ts(self):
    """Retrieve the currently running servod instance's log timestamp.

    The timestamp is extracted with TS_EXTRACTOR from the name of the file
    that the 'latest.DEBUG' (or, failing that, 'latest') entry in
    |remote_log_dir| resolves to.

    @returns: str, timestamp for current instance, or None on failure
    """
    # This cmd gives the real filename of the latest aka current log file,
    # or exits with NO_SYMLINKS_CODE if neither entry exists.
    realpath_cmd = ('if [ -f %(dir)s/latest.DEBUG ];'
                    'then realpath %(dir)s/latest.DEBUG;'
                    'elif [ -f %(dir)s/latest ];'
                    'then realpath %(dir)s/latest;'
                    'else exit %(code)d;'
                    'fi' % {'dir': self.remote_log_dir,
                            'code': self.NO_SYMLINKS_CODE})
    result = self.run(realpath_cmd, stderr_tee=None, ignore_status=True)
    status = result.exit_status
    if status != 0:
        if status == self.NO_SYMLINKS_CODE:
            logging.warning('servod log latest symlinks not found. '
                            'This is likely due to an error starting up '
                            'servod. Ignoring..')
        else:
            logging.warning('Failed to find servod logs on servo host.')
            logging.warning(result.stderr.strip())
        return None

    log_name = os.path.basename(result.stdout.strip())
    ts_match = self.TS_EXTRACTOR.match(log_name)
    if ts_match:
        return ts_match.group(self.TS_GROUP)
    logging.warning('Failed to extract timestamp from servod log file '
                    '%r. Skipping. The servo host is using outdated '
                    'servod logging and needs to be updated.', log_name)
    return None
1006
def get_servohost_logs(self, outdir):
    """Collect servohost logs that help debugging servo/servod problems.

    The output of `dmesg -H` and a copy of /var/log/messages are placed
    into |outdir|/servohost_<hostname>. Nothing is collected if that
    directory already exists.

    @param outdir: directory to create the servohost log directory in.
    """
    target_dir = os.path.join(outdir, 'servohost_%s' % self.hostname)
    if os.path.isdir(target_dir):
        # In multi-DUTs testing, each DUT may have its own servohost
        # instance. If they share the same servohost, collecting again
        # would be duplicated effort, so skip the collection when the log
        # dir already exists.
        logging.info(
                'Skip dmesg and messages logs collecting as %s'
                ' already exists.', target_dir)
        return

    logging.info('Collecting dmesg and messages from servohost %s',
                 self.hostname)
    os.mkdir(target_dir)
    logging.info('Saving servohost logs to %s.', target_dir)
    # First collect dmesg from the servohost.
    dmesg_path = os.path.join(target_dir, 'dmesg')
    crashcollect.collect_command(self, 'dmesg -H', dmesg_path)
    # Then collect the messages log from the servohost.
    try:
        self.get_file('/var/log/messages', target_dir, try_rsync=False)
    except error.AutoservRunError:
        logging.warning('Failed to collect messages log from servohost.')
1033
def get_instance_logs(self, instance_ts, outdir, old=False):
    """Collect all logs with |instance_ts| and dump into a dir in |outdir|

    This method first collects all logs on the servo_host side pertaining
    to this servod instance (port, instantiation). It glues them together
    into combined log.[level].txt files and extracts all available MCU
    console I/O from the logs into individual files e.g. servo_v4.txt

    All the output can be found in a directory inside |outdir| that
    this generates based on |LOG_DIR|, the servod port, and the instance
    timestamp on the servo_host side. If no log could be retrieved, the
    directory is removed again.

    @param instance_ts: log timestamp to grab logfiles for
    @param outdir: directory to create a subdirectory into to place the
                   servod logs into.
    @param old: bool, whether to append |OLD_LOG_SUFFIX| to output dir
    """
    # Create the local results log dir.
    log_dir = os.path.join(outdir, '%s_%s.%s' % (self.LOG_DIR,
                                                 str(self.servo_port),
                                                 instance_ts))
    if old:
        log_dir = '%s.%s' % (log_dir, self.OLD_LOG_SUFFIX)
    logging.info('Saving servod logs to %r.', log_dir)
    os.mkdir(log_dir)
    # Now, get all files with that timestamp.
    cmd = 'find %s -maxdepth 1 -name "log.%s*"' % (self.remote_log_dir,
                                                   instance_ts)
    res = self.run(cmd, stderr_tee=None, ignore_status=True)
    files = res.stdout.strip().split()
    try:
        self.get_file(files, log_dir, try_rsync=False)
        if not os.listdir(log_dir):
            logging.info('No servod logs retrieved. Ignoring, and removing '
                         '%r again.', log_dir)
            os.rmdir(log_dir)
            return
    except error.AutoservRunError as e:
        result = e.result_obj
        if result.exit_status != 0:
            stderr = result.stderr.strip()
            logging.warning("Couldn't retrieve servod logs. Ignoring: %s",
                            stderr or '\n%s' % result)
        # Remove the log_dir as nothing was added to it.
        os.rmdir(log_dir)
        return
    local_files = [os.path.join(log_dir, f) for f in os.listdir(log_dir)]
    # TODO(crrev.com/c/1793030): remove no-level case once CL is pushed
    for level_name in ('DEBUG', 'INFO', 'WARNING', ''):
        # Create the joint files for each loglevel. i.e log.DEBUG
        joint_file = self.JOINT_LOG_PREFIX
        if level_name:
            joint_file = '%s.%s' % (self.JOINT_LOG_PREFIX, level_name)
        # This helps with some online tools to avoid complaints about an
        # unknown filetype.
        joint_file = joint_file + '.txt'
        joint_path = os.path.join(log_dir, joint_file)
        # Match the level against the file name only. Matching against the
        # whole path would misclassify every file whenever |outdir| itself
        # happens to contain a level name such as 'DEBUG'.
        files = [f for f in local_files
                 if level_name in os.path.basename(f)]
        if not files:
            # TODO(crrev.com/c/1793030): remove no-level case once CL
            # is pushed
            continue
        # Extract compressed logs if any.
        compressed, extracted = self._extract_compressed_logs(log_dir,
                                                              files)
        files = list(set(files) - set(compressed))
        files.extend(extracted)
        # Need to sort. As they all share the same timestamp, and
        # loglevel, the index itself is sufficient. The highest index
        # is the oldest file, therefore we need a descending sort.
        def sortkey(f, level=level_name):
            """Custom sortkey to sort based on rotation number int."""
            # A name ending on the level itself is the unrotated, i.e.
            # newest, file.
            if f.endswith(level):
                return 0
            return int(f.split('.')[-1])

        files.sort(reverse=True, key=sortkey)
        # Just rename the first file rather than building from scratch.
        os.rename(files[0], joint_path)
        with open(joint_path, 'a') as joint_f:
            for logfile in files[1:]:
                # Transfer the file to the joint file line by line.
                with open(logfile, 'r') as log_f:
                    for line in log_f:
                        joint_f.write(line)
                # File has been written over. Delete safely.
                os.remove(logfile)
        # Need to remove all files from |local_files| so we don't
        # analyze them again.
        local_files = list(set(local_files) - set(files) - set(compressed))
    # Lastly, extract MCU logs from the joint logs.
    self._extract_mcu_logs(log_dir)
1125
def _lock(self):
    """Lock the servohost by touching the lock file.

    The touch command is run with ignore_status=True, and |_is_locked| is
    set to True afterwards.
    """
    logging.debug('Locking servohost %s by touching %s file',
                  self.hostname, self._lock_file)
    touch_cmd = 'touch %s' % self._lock_file
    self.run(touch_cmd, ignore_status=True)
    self._is_locked = True
Garry Wang79e9af62019-06-12 15:19:19 -07001133
def _unlock(self):
    """Unlock the servohost by removing the lock file.

    The rm command is run with ignore_status=True, and |_is_locked| is set
    to False afterwards.
    """
    logging.debug('Unlocking servohost by removing %s file',
                  self._lock_file)
    remove_cmd = 'rm %s' % self._lock_file
    self.run(remove_cmd, ignore_status=True)
    self._is_locked = False
Garry Wang79e9af62019-06-12 15:19:19 -07001141
def close(self):
    """Close the associated servo and the host object.

    In order this: probes for servod restarts and grabs the logs of older
    instances, closes the servo object, grabs the servohost logs and the
    logs of the current servod instance, removes the servohost lock, stops
    servod and finally closes the host object itself. All steps that need
    ssh are skipped when the servohost is not reachable.
    """
    # NOTE: throughout this method there are multiple attempts to catch
    # all errors. This is WAI as log grabbing should not fail tests.
    # However, the goal is to catch and handle/process all errors, thus
    # we print the traceback and ask for a bug.
    if self._closed:
        logging.debug('ServoHost is already closed.')
        return

    # Only attempt ssh related actions if the servohost is sshable.
    # check_cached_up_status() is called first because it is lightweight
    # and returns much faster when the servohost is down. is_up() is still
    # needed afterwards, since check_cached_up_status() is a ping based
    # check and does not guarantee that the servohost is sshable.
    host_reachable = self.check_cached_up_status() and self.is_up()

    if not host_reachable:
        logging.info('Servohost is down, will skip servod log collecting.')
        current_ts = None
    else:
        current_ts = self.get_instance_logs_ts()
    # TODO(crbug.com/1011516): once enabled, remove the check against
    # localhost and instead check against log-rotiation enablement.
    can_collect_logs = (current_ts is not None and
                        self.job and
                        not self.is_localhost())

    if can_collect_logs:
        # Probe whether there was a servod restart, and grab those old
        # logs as well.
        try:
            self.probe_servod_restart(current_ts, self.job.resultdir)
        except (error.AutoservRunError, error.TestFail) as e:
            logging.info('Failed to grab servo logs due to: %s. '
                         'This error is forgiven.', str(e))
        except Exception as e:
            logging.error('Unexpected error probing for old logs. %s. '
                          'Forgiven. Please file a bug and fix or catch '
                          'in log probing function', str(e),
                          exc_info=True)

    if self._servo:
        # In some cases when we run as lab-tools, the job object is None.
        servo_outdir = self.job.resultdir if self.job else None
        self._servo.close(servo_outdir)

    if can_collect_logs:
        # Grab current (not old like above) logs after the servo instance
        # was closed out.
        try:
            self.get_servohost_logs(self.job.resultdir)
            self.get_instance_logs(current_ts, self.job.resultdir)
        except error.AutoservRunError as e:
            logging.info('Failed to grab servo logs due to: %s. '
                         'This error is forgiven.', str(e))
        except Exception as e:
            logging.error('Unexpected error grabbing servod logs. %s. '
                          'Forgiven. Please file a bug and fix or catch '
                          'in log grabbing function', str(e), exc_info=True)

    if self._is_locked and host_reachable:
        # Remove the lock if the servohost has been locked.
        try:
            self._unlock()
        except error.AutoservSSHTimeout:
            logging.error('Unlock servohost failed due to ssh timeout.'
                          ' It may caused by servohost went down during'
                          ' the task.')

    # Always stop servod after the task to minimize the impact of a bad
    # servod process interfering with other servods.
    # (see crbug.com/1028665)
    if host_reachable:
        try:
            self.stop_servod()
        except error.AutoservRunError as e:
            logging.info(
                    "Failed to stop servod due to:\n%s\n"
                    "This error is forgiven.", str(e))

    super(ServoHost, self).close()
    # Mark closed.
    self._closed = True
Congbin Guoa1f9cba2018-07-03 11:36:59 -07001222
def get_servo_state(self):
    """Return the servo state stored in |_servo_state|."""
    state = self._servo_state
    return state
Otabek Kasimovcc9738e2020-02-14 16:17:15 -08001225
def is_servo_board_present_on_servo_v3(self):
    """Check if servo board is detected on servo_v3.

    The check greps the output of `lsusb` for the known vid:pid pairs.

    @returns: True if one of the vid:pid pairs is listed by lsusb,
              False if none of them is listed,
              None if running the command raised (e.g. on a timeout).
    """
    logging.debug('Started to detect servo board on servo_v3')
    vid_pids = ['18d1:5004', '0403:6014']
    not_detected = 'The servo board is not detected on servo_v3'
    try:
        # Raw string: '\|' is the alternation operator of grep's basic
        # regular expressions, and is not a valid Python escape sequence.
        cmd = 'lsusb | grep "%s"' % r'\|'.join(vid_pids)
        result = self.run(cmd, ignore_status=True, timeout=30)
        if result.exit_status == 0 and result.stdout.strip():
            logging.debug('The servo board is detected on servo_v3')
            return True
        logging.debug('%s; %s', not_detected, result)
        return False
    except Exception as e:
        # Can be triggered by a timeout while running the command.
        logging.error('%s; %s', not_detected, str(e))
    return None
1243
def _require_cr50_servod_config(self):
    """Check whether servod needs to be started with CONFIG=cr50.xml.

    @returns: True if any pool of the DUT host info starts with
              servo_constants.CR50_CONFIG_POOL_PREFIX, False otherwise,
              including when no DUT host info is available.
    """
    host_info = self.get_dut_host_info()
    if not host_info:
        return False
    return any(pool.startswith(servo_constants.CR50_CONFIG_POOL_PREFIX)
               for pool in host_info.pools)
1253
def get_verifier_state(self, tag):
    """Return the state of the servo verifier identified by `tag`.

    NOTE(review): this implementation never reads `tag`; it only calls
    tauto_warnings.lab_services_warn_and_error(). Presumably that helper
    reports that lab services are unavailable in this build - confirm
    against tauto_warnings. Nothing is returned explicitly, so a caller
    gets None whenever that call returns normally.

    @param tag: tag of the verifier (unused here).

    @returns: bool or None
    """
    feature = "Servo verify state"
    tauto_warnings.lab_services_warn_and_error(feature)
Otabek Kasimov15963492020-06-23 21:10:51 -07001260
def get_repair_strategy_node(self, tag):
    """Return the verifier/repair node registered for this host by tag.

    NOTE(review): this implementation never reads `tag`; it only calls
    tauto_warnings.lab_services_warn_and_error(). Presumably that helper
    reports that lab services are unavailable in this build - confirm
    against tauto_warnings. Nothing is returned explicitly, so a caller
    gets None whenever that call returns normally.

    @param tag: tag of the verifier/repair node (unused here).

    @returns: _DependencyNode or None
    """
    feature = "Servo node"
    tauto_warnings.lab_services_warn_and_error(feature)
Otabek Kasimov044a54b2021-05-06 19:12:18 -07001267
def determine_servo_state(self):
    """Translate verifier results into a single servo state.

    The verifier results are inspected in a fixed priority order and the
    state that belongs to the first failed verifier is returned.

    @returns: servo state value (a servo_constants.SERVO_STATE_* value);
              SERVO_STATE_BROKEN when no specific failure was recognized.
    """
    verifier = self.get_verifier_state
    node = self.get_repair_strategy_node

    # Every result is fetched up front, before any decision is made.
    ssh_state = verifier('servo_ssh')
    root_state = verifier('servo_root_present')
    root_node = node('servo_root_present')
    v3_state = verifier('servo_v3_root_present')
    fw_state = verifier('servo_fw')
    fw_update_node = node('servo_fw_update')
    # Queried like the other verifiers, but no state is derived from it.
    verifier('servo_disk_space')
    start_servod_state = verifier('start_servod')
    servod_started_state = verifier('servod_started')
    servod_echo_state = verifier('servod_echo')
    connection_state = verifier('servod_connection')
    control_state = verifier('servod_control')
    low_sbu_state = verifier('servo_cr50_low_sbu')
    cr50_off_state = verifier('servo_cr50_off')
    topology_state = verifier('servo_topology')
    dut_state = verifier('servo_dut_connected')
    hub_state = verifier('servo_hub_connected')
    pwr_button_state = verifier('servo_pwr_button')
    lid_open_state = verifier('servo_lid_open')
    ec_board_state = verifier('servo_ec_board')
    cr50_console_state = verifier('servo_cr50_console')
    ccd_testlab_state = verifier('servo_ccd_testlab')

    failed = hosts.VERIFY_FAILED

    # Unlike the checks below, ssh is tested for truthiness, not for an
    # explicit VERIFY_FAILED.
    if not ssh_state:
        return servo_constants.SERVO_STATE_NO_SSH
    if start_servod_state == failed:
        return servo_constants.SERVO_STATE_SERVO_HOST_ISSUE
    if root_state == failed:
        if not self.servo_serial:
            return servo_constants.SERVO_STATE_WRONG_CONFIG
        if hasattr(root_node, 'serial_mismatch'):
            return servo_constants.SERVO_STATE_SERIAL_MISMATCH
        return servo_constants.SERVO_STATE_NOT_CONNECTED
    if v3_state == failed:
        # The required board cannot be found on servo_v3.
        return servo_constants.SERVO_STATE_NEED_REPLACEMENT
    if fw_state == failed:
        logging.info(fw_update_node)
        if hasattr(fw_update_node, 'servo_updater_issue_detected'):
            return servo_constants.SERVO_STATE_SERVO_UPDATER_ISSUE
        return servo_constants.SERVO_STATE_NEED_REPLACEMENT
    if dut_state == failed:
        return servo_constants.SERVO_STATE_DUT_NOT_CONNECTED
    if hub_state == failed:
        logging.info('Servo HUB not connected')
        return servo_constants.SERVO_STATE_DUT_NOT_CONNECTED

    # Remaining verifiers map one-to-one onto a state; the order of the
    # rows is the priority order.
    prioritized = (
            (low_sbu_state, servo_constants.SERVO_STATE_SBU_LOW_VOLTAGE),
            (cr50_off_state,
             servo_constants.SERVO_STATE_CR50_NOT_ENUMERATED),
            (topology_state, servo_constants.SERVO_STATE_TOPOLOGY_ISSUE),
            (servod_started_state,
             servo_constants.SERVO_STATE_SERVOD_ISSUE),
            (servod_echo_state, servo_constants.SERVO_STATE_SERVOD_ISSUE),
            # The two cr50/ccd rows are among the reasons why servo can
            # not be initialized, so they outrank the proxy issue.
            (cr50_console_state,
             servo_constants.SERVO_STATE_CR50_CONSOLE_MISSING),
            (ccd_testlab_state,
             servo_constants.SERVO_STATE_CCD_TESTLAB_ISSUE),
            (connection_state,
             servo_constants.SERVO_STATE_SERVOD_PROXY_ISSUE),
            (control_state,
             servo_constants.SERVO_STATE_SERVOD_PROXY_ISSUE),
            (ec_board_state, servo_constants.SERVO_STATE_EC_BROKEN),
            (pwr_button_state,
             servo_constants.SERVO_STATE_BAD_RIBBON_CABLE),
            (lid_open_state, servo_constants.SERVO_STATE_LID_OPEN_FAILED),
    )
    for verifier_result, servo_state in prioritized:
        if verifier_result == failed:
            return servo_state

    logging.info('We do not have special state for this failure yet :)')
    return servo_constants.SERVO_STATE_BROKEN
1355
def is_servo_topology_supported(self):
    """Check if servo_topology is supported.

    @returns: True only when the servo host is reachable, is a
              labstation and has a servo serial; False (with the reason
              logged) as soon as one requirement is not met.
    """
    # Each requirement is evaluated lazily and in order, so a later
    # check never runs once an earlier one has failed.
    requirements = (
            (self.is_up_fast, 'Servo-Host is not reachable.'),
            (self.is_labstation,
             'Servo-topology supported only for labstation.'),
            (lambda: self.servo_serial,
             'Servo-topology required a servo serial.'),
    )
    for is_met, reason in requirements:
        if not is_met():
            logging.info(reason)
            return False
    return True
1368
def get_topology(self):
    """Get servo topology.

    The ServoTopology object is created on first use and then kept in
    `self._topology` for later calls.

    @returns: the ServoTopology instance associated with this host.
    """
    topology = self._topology
    if not topology:
        topology = servo_topology.ServoTopology(self)
        self._topology = topology
    return topology
1374
def is_dual_setup(self):
    """Check whether servo will run in dual setup.

    Dual setup is used only for servo_v4 when ccd_cr50 and servo_micro
    are used at the same time.

    @returns: True when `self.servo_setup` equals
              servo_constants.SERVO_SETUP_VALUE_DUAL_V4.
    """
    configured_setup = self.servo_setup
    return configured_setup == servo_constants.SERVO_SETUP_VALUE_DUAL_V4
1382
def set_dut_health_profile(self, dut_health_profile):
    """Remember the health profile of the DUT attached to this servo.

    @param dut_health_profile: A DeviceHealthProfile object.
    """
    logging.debug(
            'setting dut_health_profile field to (%s)', dut_health_profile)
    self._dut_health_profile = dut_health_profile
1390
def get_dut_health_profile(self):
    """Return the DUT health profile stored on this host.

    @return A DeviceHealthProfile object (whatever was stored in
            `self._dut_health_profile`).
    """
    profile = self._dut_health_profile
    return profile
1396
def print_all_servo_of_host(self):
    """Log all servos detected on the host.

    This is a best-effort debugging aid: any exception raised while
    listing the devices is logged at debug level and not propagated.
    """
    try:
        logging.info('\tDevices detected on the host:')
        topology = self.get_topology()
        for servo_device in topology.get_list_available_servos():
            logging.info('\t%s', servo_device)
    except Exception as e:
        logging.debug('(Not critical) Fail list all servos: %s', e)
1406
Otabek Kasimovcc9738e2020-02-14 16:17:15 -08001407
def make_servo_hostname(dut_hostname):
    """Given a DUT's hostname, return the hostname of its servo.

    The servo hostname is the DUT hostname with '-servo' appended to its
    first dot-separated label; any domain part is kept unchanged.

    @param dut_hostname: hostname of a DUT.

    @return hostname of the DUT's servo.

    """
    first_label, dot, domain = dut_hostname.partition('.')
    return first_label + '-servo' + dot + domain
1419
1420
Richard Barnettee519dcd2016-08-15 17:37:17 -07001421def _map_afe_board_to_servo_board(afe_board):
1422 """Map a board we get from the AFE to a servo appropriate value.
1423
1424 Many boards are identical to other boards for servo's purposes.
1425 This function makes that mapping.
1426
1427 @param afe_board string board name received from AFE.
1428 @return board we expect servo to have.
1429
1430 """
1431 KNOWN_SUFFIXES = ['-freon', '_freon', '_moblab', '-cheets']
1432 BOARD_MAP = {'gizmo': 'panther'}
1433 mapped_board = afe_board
1434 if afe_board in BOARD_MAP:
1435 mapped_board = BOARD_MAP[afe_board]
1436 else:
1437 for suffix in KNOWN_SUFFIXES:
1438 if afe_board.endswith(suffix):
1439 mapped_board = afe_board[0:-len(suffix)]
1440 break
1441 if mapped_board != afe_board:
1442 logging.info('Mapping AFE board=%s to %s', afe_board, mapped_board)
1443 return mapped_board
1444
1445
def get_servo_args_for_host(dut_host):
    """Return servo data associated with a given DUT.

    The result holds the host info attributes whose keys are listed in
    servo_constants.SERVO_ATTR_KEYS, with the ports converted to int,
    plus the servo board and the model when the host info has them.

    @param dut_host   Instance of `Host` on which to find the servo
                      attributes.
    @return `servo_args` dict, or None when the dict would not contain
            a servo host entry.
    """
    info = dut_host.host_info_store.get()
    servo_args = {}
    for key, value in six.iteritems(info.attributes):
        if key in servo_constants.SERVO_ATTR_KEYS:
            servo_args[key] = value

    ssh_port_key = servo_constants.SERVO_HOST_SSH_PORT_ATTR
    if ssh_port_key in servo_args:
        raw_ssh_port = servo_args[ssh_port_key]
        try:
            servo_args[ssh_port_key] = int(raw_ssh_port)
        except ValueError:
            logging.error('servo host port is not an int: %s', raw_ssh_port)
            # An unusable ssh port is dropped; the other args are kept.
            servo_args.pop(ssh_port_key, None)

    servo_port_key = servo_constants.SERVO_PORT_ATTR
    if servo_port_key in servo_args:
        raw_servo_port = servo_args[servo_port_key]
        try:
            servo_args[servo_port_key] = int(raw_servo_port)
        except ValueError:
            logging.error('servo port is not an int: %s', raw_servo_port)
            # Reset servo_args because we don't want to use an invalid
            # port: without the host entry the function returns None.
            servo_args.pop(servo_constants.SERVO_HOST_ATTR, None)

    if info.board:
        servo_args[servo_constants.SERVO_BOARD_ATTR] = (
                _map_afe_board_to_servo_board(info.board))
    if info.model:
        servo_args[servo_constants.SERVO_MODEL_ATTR] = info.model

    if servo_constants.SERVO_HOST_ATTR not in servo_args:
        return None
    return servo_args
Richard Barnetteea3e4602016-06-10 12:36:41 -07001483
1484
def _tweak_args_for_ssp_moblab(servo_args):
    """Redirect a loopback servo host to the SSP host container address.

    When the servo host in `servo_args` is 'localhost' or '127.0.0.1',
    it is replaced in place by the 'host_container_ip' value of the 'SSP'
    section read through _CONFIG (None when that value is not set).

    @param servo_args: dict of servo arguments; must contain the
                       servo_constants.SERVO_HOST_ATTR key.
    """
    host_key = servo_constants.SERVO_HOST_ATTR
    if servo_args[host_key] not in ('localhost', '127.0.0.1'):
        return
    servo_args[host_key] = _CONFIG.get_config_value(
            'SSP', 'host_container_ip', type=str, default=None)
1490
1491
def create_servo_host(dut,
                      servo_args,
                      try_lab_servo=False,
                      try_servo_repair=False,
                      try_servo_recovery=True,
                      dut_host_info=None,
                      dut_health_profile=None):
    """Create a ServoHost object for a given DUT, if appropriate.

    This function attempts to create and verify or repair a `ServoHost`
    object for a servo connected to the given `dut`, subject to various
    constraints imposed by the parameters:
      * When the `servo_args` parameter is not `None`, the caller depends
        on servo: a servo host is created and checked with
        `repair(silent=True)`, and repair exceptions are passed back to
        the caller.
      * When `servo_args` itself names a servo host (a local test run),
        all verify/repair steps are skipped: servod is started on a
        best-effort basis and the servo is initialized directly.
      * Otherwise, if `try_lab_servo` is true:
          * If `try_servo_repair` is true, then create a servo host and
            check it with `repair()`.
          * Otherwise create a servo host and check it with `verify()`.
        In both cases exceptions are logged and then discarded.

    Note that the `repair(silent=True)` case only happens when we're
    called from a test (not special task) control file that has an
    explicit dependency on servo. In that case, we require that repair
    not write to `status.log`, so as to avoid polluting test results.

    TODO(jrbarnette):  The special handling for servo in test control
    files is a thorn in my flesh; I dearly hope to see it cut out before
    my retirement.

    Servo parameters are determined from these sources, in order of
    priority:
      * Servo attributes found for `dut` by get_servo_args_for_host()
        (only looked up when `try_lab_servo` is true or the caller
        depends on servo) replace the `servo_args` passed in.
      * Otherwise the `servo_args` dict passed in from the caller is
        used.

    @param dut:                An instance of `Host` from which to take
                               servo parameters (if available).
    @param servo_args:         A dictionary with servo parameters to use if
                               they can't be found from `dut`.  If this
                               argument is supplied, unrepaired exceptions
                               from `repair()` will be passed back to the
                               caller.  The dictionary that ends up being
                               used may get the recovery-mode key added.
    @param try_lab_servo:      If not true, servo host creation will be
                               skipped unless otherwise required by the
                               caller.
    @param try_servo_repair:   If true, check a servo host with
                               `repair()` instead of `verify()`.
    @param try_servo_recovery: If true, start servod in recovery mode.
                               Default value is True.
    @param dut_host_info:      A HostInfo object of the DUT that connected
                               to this servo.
    @param dut_health_profile: DUT repair info with history.

    @returns: A tuple `(servo_host, servo_state)`.  `servo_host` is a
              ServoHost object or None; `servo_state` is a servo state
              value, or None when no servo host was created because the
              caller does not require one.

    """
    # We are explicitly looking for if servo_args is None here (which means
    # servo not needed), as servo_args == {} means servo is needed and
    # we expect to load servo_args from host_info_store.
    if servo_args is None:
        servo_dependency = False
        local_run = False
    else:
        servo_dependency = True
        # If servo_args pass in directly, then this is a local test run.
        local_run = servo_constants.SERVO_HOST_ATTR in servo_args

    if local_run:
        logging.warning('User input servo_args detected, will attempt'
                        ' to start servod and initialize servo conncetion'
                        ' directly. All servo/servohost verify and repair'
                        ' steps will be skipped.')

    # Loading servo args from host_info_store.
    if dut is not None and (try_lab_servo or servo_dependency):
        servo_args_override = get_servo_args_for_host(dut)
        if servo_args_override is not None:
            if utils.in_moblab_ssp():
                _tweak_args_for_ssp_moblab(servo_args_override)
            logging.debug(
                    'Overriding provided servo_args (%s) with arguments'
                    ' determined from the host (%s)',
                    servo_args,
                    servo_args_override,
            )
            servo_args = servo_args_override

    if not servo_args:
        logging.debug('No servo_args provided, and failed to find overrides.')
        if try_lab_servo or servo_dependency:
            return None, servo_constants.SERVO_STATE_MISSING_CONFIG
        else:
            # For a regular test case which does not require the servo.
            return None, None

    servo_hostname = servo_args.get(servo_constants.SERVO_HOST_ATTR)
    servo_port = servo_args.get(servo_constants.SERVO_PORT_ATTR)
    if not local_run:
        if not _is_servo_host_information_exist(servo_hostname, servo_port):
            logging.debug(
                    'Servo connection info missed hostname: %s , port: %s',
                    servo_hostname, servo_port)
            return None, servo_constants.SERVO_STATE_MISSING_CONFIG
        if not is_servo_host_information_valid(servo_hostname, servo_port):
            logging.debug(
                    'Servo connection info is incorrect hostname: %s , port: %s',
                    servo_hostname, servo_port)
            return None, servo_constants.SERVO_STATE_WRONG_CONFIG

    # The explicit comparison is kept on purpose so that only True (or a
    # value equal to it) enables recovery mode, exactly as before.
    if try_servo_recovery == True:
        servo_args[servo_constants.SERVO_RECOVERY_MODE] = True

    newhost = ServoHost(**servo_args)
    if local_run:
        try:
            newhost.start_servod()
        except Exception as e:
            # If we failed to start servod here, we can assume servod
            # either already started or the test is running against a
            # non-standard servohost, so the user is responsible for
            # ensuring servod is running.  Only Exception is caught so
            # that KeyboardInterrupt/SystemExit still abort the run.
            logging.debug(
                    'Failed to start servod for local run (ignored): %s', e)
        try:
            newhost.initialize_servo()
            newhost.initialize_dut_for_servo()
            newhost._servo_state = servo_constants.SERVO_STATE_WORKING
            return newhost, newhost.get_servo_state()
        except Exception as e:
            logging.error('Failed to initialize servo. %s', e)
            return None, servo_constants.SERVO_STATE_BROKEN

    if newhost.use_icmp and not newhost.is_up_fast(count=3):
        # ServoHost has internal check to wait if servo-host is in reboot
        # process. If servo-host still is not available this check will stop
        # further attempts as we do not have any option to recover servo_host.
        return None, servo_constants.SERVO_STATE_NO_SSH

    # Reset or reboot servo device only during AdminRepair tasks.
    if try_servo_repair:
        if newhost._is_locked:
            # Print available servos on the host for debugging.
            newhost.print_all_servo_of_host()
            # Reset servo if the servo is locked, as we check if the servohost
            # is up, if the servohost is labstation and if the servohost is in
            # lab inside the locking logic.
            newhost.reset_servo()
        else:
            try:
                newhost.reboot_servo_v3_on_need()
            except Exception as e:
                logging.info('[Non-critical] Unexpected error while trying to'
                             ' reboot servo_v3, skipping the reboot; %s', e)

    if dut:
        newhost.set_dut_hostname(dut.hostname)
    if dut_host_info:
        newhost.set_dut_host_info(dut_host_info)
    if dut_health_profile and (try_lab_servo or try_servo_repair):
        try:
            if newhost.is_localhost():
                logging.info('Servohost is a localhost, skip device'
                             ' health profile setup...')
            else:
                dut_health_profile.init_profile(newhost)
                newhost.set_dut_health_profile(dut_health_profile)
        except Exception as e:
            logging.info(
                    '[Non-critical] Unexpected error while trying to'
                    ' load device health profile; %s', e)

    # Note that the logic of repair() includes everything done
    # by verify().  It's sufficient to call one or the other;
    # we don't need both.
    if servo_dependency:
        # Not wrapped in try/except: with an explicit servo dependency
        # repair failures must reach the caller.
        newhost.repair(silent=True)
        return newhost, newhost.get_servo_state()

    if try_servo_repair:
        try:
            newhost.repair()
        except Exception:
            logging.exception('servo repair failed for %s', newhost.hostname)
    else:
        try:
            newhost.verify()
        except Exception:
            logging.exception('servo verify failed for %s', newhost.hostname)
    return newhost, newhost.get_servo_state()
Otabek Kasimov7267a7a2020-03-04 11:18:45 -08001689
1690
def _is_servo_host_information_exist(hostname, port):
    """Check that both a servo hostname and a servo port were provided.

    @param hostname Hostname of the servohost.
    @param port     servo port number; an int or a value int() can convert.

    @returns: True if hostname is a non-blank string and port is an int
              or convertible to one; False otherwise.
    """
    if hostname is None or not hostname.strip():
        return False
    if port is None:
        return False
    if not isinstance(port, int):
        try:
            int(port)
        except (TypeError, ValueError, OverflowError):
            # ValueError: non-numeric string; TypeError: a type int()
            # does not accept at all; OverflowError: infinite float.
            # All of them mean there is no usable port.
            return False
    return True


def is_servo_host_information_valid(hostname, port):
    """Check if provided servo attributes are valid.

    @param hostname Hostname of the servohost.
    @param port     servo port number.

    @returns: A bool value to indicate if provided servo attribute valid.
    """
    if not _is_servo_host_information_exist(hostname, port):
        return False
    # Check the range of the port; 65000 is the upper bound accepted here.
    port_int = int(port)
    if port_int < 1 or port_int > 65000:
        return False
    # We expect the host to contain only letters, digits, '-', '_', '.'
    # and ':', and to be at least 5 characters long.  The pattern is a raw
    # string so that `\.` reaches the regex engine without relying on an
    # invalid string escape.
    if not re.match(r'[a-zA-Z0-9-_\.:]*$', hostname) or len(hostname) < 5:
        return False
    return True