blob: 0fd403f67b61cb5fe186c20c66a1198d462888d5 [file] [log] [blame]
Derek Beckettf73baca2020-08-19 15:08:47 -07001# Lint as: python2, python3
Fang Deng5d518f42013-08-02 14:04:32 -07002# Copyright (c) 2013 The Chromium OS Authors. All rights reserved.
3# Use of this source code is governed by a BSD-style license that can be
4# found in the LICENSE file.
5#
6# Expects to be run in an environment with sudo and no interactive password
7# prompt, such as within the Chromium OS development chroot.
8
9
10"""This file provides core logic for servo verify/repair process."""
11
12
Derek Beckettf73baca2020-08-19 15:08:47 -070013from __future__ import absolute_import
14from __future__ import division
15from __future__ import print_function
16
Fang Deng5d518f42013-08-02 14:04:32 -070017import logging
Raul E Rangel52ca2e82018-07-03 14:10:14 -060018import os
Ruben Rodriguez Buchillon93084d02020-01-21 15:17:36 -080019import re
20import tarfile
Andrew McRaef0679932020-08-13 09:15:23 +100021import threading
Garry Wang2b5eef92020-08-21 16:23:35 -070022import json
Garry Wangc1288cf2019-12-17 14:58:00 -080023import time
Derek Beckettf73baca2020-08-19 15:08:47 -070024import six
25import six.moves.xmlrpc_client
Otabek Kasimov120b6fa2020-07-03 00:15:27 -070026import calendar
Fang Deng5d518f42013-08-02 14:04:32 -070027
28from autotest_lib.client.bin import utils
Garry Wang79e9af62019-06-12 15:19:19 -070029from autotest_lib.client.common_lib import error
Richard Barnette9a26ad62016-06-10 12:03:08 -070030from autotest_lib.client.common_lib import hosts
Garry Wang7b0e1b72020-03-25 19:08:59 -070031from autotest_lib.client.common_lib import lsbrelease_utils
Fang Deng5d518f42013-08-02 14:04:32 -070032from autotest_lib.client.common_lib.cros import retry
Richard Barnette9a26ad62016-06-10 12:03:08 -070033from autotest_lib.server.cros.servo import servo
Richard Barnetted31580e2018-05-14 19:58:00 +000034from autotest_lib.server.hosts import servo_repair
Garry Wangebc015b2019-06-06 17:45:06 -070035from autotest_lib.server.hosts import base_servohost
Garry Wang11b5e872020-03-11 15:14:08 -070036from autotest_lib.server.hosts import servo_constants
Otabek Kasimov4ea636e2020-04-14 23:35:06 -070037from autotest_lib.server.cros.faft.utils import config
Garry Wang11b5e872020-03-11 15:14:08 -070038from autotest_lib.client.common_lib import global_config
Otabek Kasimov8475cce2020-07-14 12:11:31 -070039from autotest_lib.site_utils.admin_audit import servo_updater
Otabek Kasimov382c3bb2020-10-28 13:22:45 -070040from autotest_lib.server.cros.servo.topology import servo_topology
Garry Wangd7367482020-02-27 13:52:40 -080041
Otabek Kasimov15963492020-06-23 21:10:51 -070042try:
Mike Frysinger714c5b02020-09-04 23:22:54 -040043 from autotest_lib.utils.frozen_chromite.lib import metrics
Otabek Kasimov15963492020-06-23 21:10:51 -070044except ImportError:
45 metrics = utils.metrics_mock
46
Dan Shi3b2adf62015-09-02 17:46:54 -070047_CONFIG = global_config.global_config
Fang Deng5d518f42013-08-02 14:04:32 -070048
Otabek Kasimova7ba91a2020-03-09 08:31:01 -070049
Garry Wangebc015b2019-06-06 17:45:06 -070050class ServoHost(base_servohost.BaseServoHost):
51 """Host class for a servo host(e.g. beaglebone, labstation)
Dana Goyette0b6e6402019-10-04 11:09:24 -070052 that with a servo instance for a specific port.
53
54 @type _servo: servo.Servo | None
55 """
Fang Deng5d518f42013-08-02 14:04:32 -070056
Raul E Rangel52ca2e82018-07-03 14:10:14 -060057 DEFAULT_PORT = int(os.getenv('SERVOD_PORT', '9999'))
Richard Barnette9a26ad62016-06-10 12:03:08 -070058
Dan Shie5b3c512014-08-21 12:12:09 -070059 # Timeout for initializing servo signals.
Wai-Hong Tam37b6ed32017-09-19 15:52:39 -070060 INITIALIZE_SERVO_TIMEOUT_SECS = 60
Richard Barnette9a26ad62016-06-10 12:03:08 -070061
Otabek Kasimov545739c2020-08-20 00:24:21 -070062 # Default timeout for run terminal command.
63 DEFAULT_TERMINAL_TIMEOUT = 30
64
xixuan6cf6d2f2016-01-29 15:29:00 -080065 # Ready test function
66 SERVO_READY_METHOD = 'get_version'
Fang Deng5d518f42013-08-02 14:04:32 -070067
Ruben Rodriguez Buchillon93084d02020-01-21 15:17:36 -080068 # Directory prefix on the servo host where the servod logs are stored.
69 SERVOD_LOG_PREFIX = '/var/log/servod'
70
71 # Exit code to use when symlinks for servod logs are not found.
72 NO_SYMLINKS_CODE = 9
73
74 # Directory in the job's results directory to dump the logs into.
75 LOG_DIR = 'servod'
76
77 # Prefix for joint loglevel files in the logs.
78 JOINT_LOG_PREFIX = 'log'
79
80 # Regex group to extract timestamp from logfile name.
81 TS_GROUP = 'ts'
82
83 # This regex is used to extract the timestamp from servod logs.
Garry Wang22f2e842020-09-09 20:19:19 -070084 # files always start with log.
Ruben Rodriguez Buchillon93084d02020-01-21 15:17:36 -080085 TS_RE = (r'log.'
86 # The timestamp is of format %Y-%m-%d--%H-%M-%S.MS
87 r'(?P<%s>\d{4}(\-\d{2}){2}\-(-\d{2}){3}.\d{3})'
88 # The loglevel is optional depending on labstation version.
89 r'(.(INFO|DEBUG|WARNING))?' % TS_GROUP)
90 TS_EXTRACTOR = re.compile(TS_RE)
91
92 # Regex group to extract MCU name from logline in servod logs.
93 MCU_GROUP = 'mcu'
94
95 # Regex group to extract logline from MCU logline in servod logs.
96 LINE_GROUP = 'line'
97
98 # This regex is used to extract the mcu and the line content from an
99 # MCU logline in servod logs. e.g. EC or servo_v4 console logs.
100 # Here is an example log-line:
101 #
102 # 2020-01-23 13:15:12,223 - servo_v4 - EC3PO.Console - DEBUG -
103 # console.py:219:LogConsoleOutput - /dev/pts/9 - cc polarity: cc1
104 #
105 # Here is conceptually how they are formatted:
106 #
107 # <time> - <MCU> - EC3PO.Console - <LVL> - <file:line:func> - <pts> -
108 # <output>
109 #
Garry Wang22f2e842020-09-09 20:19:19 -0700110 # The log format starts with a timestamp
Ruben Rodriguez Buchillon93084d02020-01-21 15:17:36 -0800111 MCU_RE = (r'[\d\-]+ [\d:,]+ '
112 # The mcu that is logging this is next.
113 r'- (?P<%s>\w+) - '
114 # Next, we have more log outputs before the actual line.
115 # Information about the file line, logging function etc.
116 # Anchor on EC3PO Console, LogConsoleOutput and dev/pts.
117 # NOTE: if the log format changes, this regex needs to be
118 # adjusted.
119 r'EC3PO\.Console[\s\-\w\d:.]+LogConsoleOutput - /dev/pts/\d+ - '
120 # Lastly, we get the MCU's console line.
121 r'(?P<%s>.+$)' % (MCU_GROUP, LINE_GROUP))
122 MCU_EXTRACTOR = re.compile(MCU_RE)
123
Otabek Kasimov545739c2020-08-20 00:24:21 -0700124 # Regex to detect timeout messages when USBC pigtail has timeout issue.
125 # e.g.: [475635.427072 PD TMOUT RX 1/1]
126 USBC_PIGTAIL_TIMEOUT_RE = r'\[[\d \.]{1,20}(PD TMOUT RX 1\/1)\]'
127
Ruben Rodriguez Buchillon93084d02020-01-21 15:17:36 -0800128 # Suffix to identify compressed logfiles.
129 COMPRESSION_SUFFIX = '.tbz2'
130
Ruben Rodriguez Buchillon5bac3062020-03-25 21:32:58 -0700131 # A suffix to mark servod log directories that came from instance that
132 # ran during this servo_host, but are not the last one running e.g. when
133 # an instance (on purpose, or due to a bug) restarted in the middle of the
134 # run.
135 OLD_LOG_SUFFIX = 'old'
136
def _init_attributes(self):
    """Reset all per-instance fields of this servo host to their defaults.

    Every servo description field and every cached object starts out as
    None; the tunnel-proxy lock and the thread-local storage are created
    fresh on each call.
    """
    # Fields that simply start out unset.  `smart_usbhub` flags whether the
    # servo is connected to a smart usbhub.
    # TODO(xianuowang@) remove `smart_usbhub` once all usbhubs in the lab
    # get replaced.
    unset_fields = (
        '_servo_state',
        'servo_port',
        'servo_board',
        'servo_model',
        'servo_serial',
        'servo_setup',
        'servo_recovery',
        'servo_fw_channel',
        'additional_servod_args',
        '_dut_health_profile',
        'smart_usbhub',
        '_servo',
        '_topology',
        '_tunnel_proxy',
        '_initial_instance_ts',
    )
    for field_name in unset_fields:
        setattr(self, field_name, None)

    # Guards creation of the tunnel proxy.
    self._tunnel_proxy_lock = threading.Lock()
    # Flag to make sure that multiple calls to close do not result in the
    # logic executing multiple times.
    self._closed = False
    # Per-thread local data.
    self._local = threading.local()
Fang Deng5d518f42013-08-02 14:04:32 -0700162
def _initialize(self,
                servo_host='localhost',
                servo_port=DEFAULT_PORT,
                servo_board=None,
                servo_model=None,
                servo_serial=None,
                servo_setup=None,
                servo_recovery=None,
                servo_fw_channel=None,
                additional_servod_args=None,
                is_in_lab=None,
                *args,
                **dargs):
    """Set up a ServoHost, i.e. a host that controls a servo.

    @param servo_host: Name of the host where the servod process
                       is running.
    @param servo_port: Port the servod process is listening on. Defaults
                       to the SERVOD_PORT environment variable if set,
                       otherwise 9999.
    @param servo_board: Board that the servo is connected to.
    @param servo_model: Model that the servo is connected to.
    @param servo_serial: Serial number of the servo device.
    @param servo_setup: Type of servo setup, e.g. REGULAR or DUAL_V4.
    @param servo_recovery: Stored on the instance unchanged.
                           NOTE(review): meaning is not visible in this
                           method - confirm against the callers.
    @param servo_fw_channel: Stored on the instance unchanged.
                           NOTE(review): presumably the servo firmware
                           channel - confirm against the callers.
    @param additional_servod_args: Additional args that will append to
                                   servod start command.
    @param is_in_lab: True if the servo host is in Cros Lab. Default is set
                      to None, for which utils.host_is_in_lab_zone will be
                      called to check if the servo host is in Cros lab.
    """
    super(ServoHost, self)._initialize(hostname=servo_host,
                                       is_in_lab=is_in_lab, *args, **dargs)
    self._init_attributes()

    # Record the servo description handed in by the caller.
    self.servo_port = int(servo_port)
    self.servo_board = servo_board
    self.servo_model = servo_model
    self.servo_serial = servo_serial
    self.servo_setup = servo_setup
    self.servo_recovery = servo_recovery
    self.servo_fw_channel = servo_fw_channel
    self.additional_servod_args = additional_servod_args

    port_str = str(self.servo_port)
    # The location of the log files on the servo host for this instance.
    self.remote_log_dir = '%s_%s' % (self.SERVOD_LOG_PREFIX,
                                     self.servo_port)
    # Path of the servo host lock file.
    self._lock_file = self.TEMP_FILE_DIR + port_str + self.LOCK_FILE_POSTFIX
    # File path to declare a reboot request.
    self._reboot_file = (self.TEMP_FILE_DIR + port_str +
                         self.REBOOT_FILE_POSTFIX)

    # Lock the servo host if it's an in-lab labstation to prevent other
    # task to reboot it until current task completes. We also wait and
    # make sure the labstation is up here, in the case of the labstation is
    # in the middle of reboot.
    self._is_locked = False
    lock_needed = (self.wait_up(self.REBOOT_TIMEOUT)
                   and self.is_in_lab()
                   and self.is_labstation())
    if lock_needed:
        self._lock()
        try:
            self.wait_ready()
        except Exception as e:
            # Best effort only: a readiness failure is logged, not raised.
            logging.info(
                    'Unexpected error while ensure labstation readiness; %s',
                    str(e))

    self._repair_strategy = servo_repair.create_servo_repair_strategy()
Richard Barnettee519dcd2016-08-15 17:37:17 -0700235
def __str__(self):
    """Return a short description: <ClassName 'hostname:servo_port'>."""
    class_name = type(self).__name__
    return "<%s '%s:%s'>" % (class_name, self.hostname, self.servo_port)
239
def connect_servo(self):
    """Prepare the servo for later use.

    Runs the two setup steps in order: create the servo object, then
    initialize the DUT side through it.
    """
    # Step 1: build the servo object.
    self.initilize_servo()
    # Step 2: set up and test the servo <-> DUT connection.
    self.initialize_dut_for_servo()
245
def initilize_servo(self):
    """Create the servo.Servo object for this host and cache it.

    The object is built with this host as its `servo_host` and with
    `self.servo_serial`, and is stored in `self._servo`.
    NOTE(review): the previous docstring said this also verifies network
    connections and creates an ssh tunnel if required; that would happen
    inside servo.Servo and is not visible here - confirm.
    """
    servo_object = servo.Servo(servo_host=self,
                               servo_serial=self.servo_serial)
    self._servo = servo_object
Richard Barnette9a26ad62016-06-10 12:03:08 -0700255
def initialize_dut_for_servo(self):
    """Run the servo's DUT initialization under a timeout.

    Per the original description this sets up dut control (e.g. the main
    servo_v4 device) and tests the connection between servo and DUT; as a
    side effect all signals on the target servo are reset to default
    values and the USB stick is set to the neutral (off) position.

    @raises AutoservVerifyError: if no servo object has been created yet,
            or if initialization does not finish within
            INITIALIZE_SERVO_TIMEOUT_SECS.
    """
    servo_object = self._servo
    if not servo_object:
        raise hosts.AutoservVerifyError(
                'Servo object needs to be initialized before initialize DUT.')

    timed_out, _result = retry.timeout(
            servo_object.initialize_dut,
            timeout_sec=self.INITIALIZE_SERVO_TIMEOUT_SECS)
    if timed_out:
        raise hosts.AutoservVerifyError(
                'Initialize dut for servo timed out.')
Richard Barnette9a26ad62016-06-10 12:03:08 -0700273
def disconnect_servo(self):
    """Drop the servo connection, if there is one.

    When a servo object is cached, disconnect the rpc server tracker
    entry for our servo port and reset `self._servo` to `None`.
    Does nothing when no servo object is cached.
    """
    if not self._servo:
        return
    # N.B. This call is safe even without a tunnel:
    # rpc_server_tracker.disconnect() silently ignores
    # unknown ports.
    self.rpc_server_tracker.disconnect(self.servo_port)
    self._servo = None
Fang Deng5d518f42013-08-02 14:04:32 -0700287
def _maybe_create_servod_ssh_tunnel_proxy(self):
    """Create the xmlrpc proxy used with a ssh tunnel, at most once.

    The check and the creation both happen while holding
    `self._tunnel_proxy_lock`, so an already existing proxy is kept.
    """
    connect_options = {
        'ready_test_name': self.SERVO_READY_METHOD,
        'timeout_seconds': 60,
        'request_timeout_seconds': 3600,
        'server_desc': str(self),
    }
    with self._tunnel_proxy_lock:
        if self._tunnel_proxy is not None:
            # A proxy already exists; keep it.
            return
        self._tunnel_proxy = self.rpc_server_tracker.xmlrpc_connect(
                None, self.servo_port, **connect_options)
301
def get_servod_server_proxy(self):
    """Return the proxy for talking to servod, creating it on first use.

    Two kinds of proxy exist: a single ssh tunnel based proxy shared by
    the instance, and a plain http based proxy kept per thread.

    @returns: An xmlrpclib.ServerProxy that is connected to the servod
              server on the host.
    """
    use_tunnel = (servo_constants.ENABLE_SSH_TUNNEL_FOR_SERVO
                  and not self.is_localhost())
    if use_tunnel:
        # Reuse the existing ssh tunnel proxy when there is one.
        if self._tunnel_proxy is None:
            self._maybe_create_servod_ssh_tunnel_proxy()
        return self._tunnel_proxy

    # xmlrpc/httplib is not thread-safe, so each thread must have its
    # own separate proxy connection.
    thread_data = self._local
    if not hasattr(thread_data, "_per_thread_proxy"):
        remote = 'http://%s:%s' % (self.hostname, self.servo_port)
        thread_data._per_thread_proxy = (
                six.moves.xmlrpc_client.ServerProxy(remote))
    return thread_data._per_thread_proxy
Wai-Hong Tam3a8a2552019-11-19 14:28:04 +0800323
def verify(self, silent=False):
    """Run the verify strategy for this servo host and record its state.

    On success the servo state becomes SERVO_STATE_WORKING.  On failure
    the state is re-determined (non-localhost only) and the exception is
    re-raised only when `_is_critical_error` reports it as critical.

    @param silent If true, suppress logging in `status.log`.
    """
    self.record(
            'INFO', None, None,
            'Beginning verify for servo host %s port %s serial %s'
            % (self.hostname, self.servo_port, self.servo_serial))
    try:
        self._repair_strategy.verify(self, silent)
        self._servo_state = servo_constants.SERVO_STATE_WORKING
        self.record('INFO', None, None,
                    'ServoHost verify set servo_state as WORKING')
    except Exception as verify_error:
        if not self.is_localhost():
            self._servo_state = self.determine_servo_state()
            state_message = ('ServoHost verify set servo_state as %s'
                             % self._servo_state)
            self.record('INFO', None, None, state_message)
        if self._is_critical_error(verify_error):
            raise
Fang Deng5d518f42013-08-02 14:04:32 -0700345
def _get_default_usbkey_mount_path(self):
    """Return the usbkey mount path for this servo port."""
    port = self.servo_port
    return '/media/servo_usb/%s' % port
Fang Deng5d518f42013-08-02 14:04:32 -0700348
def get_image_name_from_usbkey(self, usbkey_dev):
    """Mount the usbkey and report which ChromeOS test image is on it.

    This method assumes the image_usbkey_direction is already set to
    servo side.  The drive is always unmounted again before returning.

    @param usbkey_dev: usbkey dev path(e.g. /dev/sdb).

    @returns: image_name on the usbkey, e.g. nami-release/R82.10138.0.0,
              or empty string if no test image detected, or unexpected
              error occurred.
    """
    logging.info('Checking ChromeOS image name on usbkey.')
    mount_point = self._get_default_usbkey_mount_path()
    # Unmount if there is an existing stale mount.
    self._unmount_drive(mount_point)
    # ChromeOS root fs is in /dev/sdx3
    rootfs_partition = usbkey_dev + '3'
    try:
        mounted = self._mount_drive(rootfs_partition, mount_point)
        if not mounted:
            logging.debug('Unexpected error occurred on mount usb drive.')
            return ''

        cat_result = self.run('cat %s/etc/lsb-release' % mount_point,
                              ignore_status=True)
        lsb_release = cat_result.stdout.strip()

        # Only images whose release track mentions "test" qualify.
        if re.search(r'RELEASE_TRACK=.*test', lsb_release):
            return lsbrelease_utils.get_chromeos_release_builder_path(
                    lsb_release_content=lsb_release)

        logging.info('The image on usbkey is not a test image')
        return ''
    finally:
        logging.debug('Image check compeleted, unmounting the usb drive.')
        self._unmount_drive(mount_point)
Garry Wang7b0e1b72020-03-25 19:08:59 -0700384
def _extract_firmware_image_from_usbkey(self, fw_dst):
    """Unpack the firmware images found on the servo's usbkey.

    This method assumes there is already a ChromeOS test image staged on
    servo.  The usbkey is mounted, the firmware updater found on it is
    asked to unpack into `fw_dst` and to print its manifest, and the
    usbkey is unmounted again in all cases.

    @param fw_dst: the path that we'll copy firmware images to.

    @returns: a json format string of firmware manifest data.
    @raises AutoservRepairError: if the usbkey dev path could not be
            probed or the usbkey could not be mounted.
    """
    usbkey_dev = self._probe_and_validate_usb_dev()
    if not usbkey_dev:
        raise hosts.AutoservRepairError(
                'Unexpected error occurred when probe usbkey dev path,'
                ' please check logs for detail.')

    mount_point = self._get_default_usbkey_mount_path()
    # Unmount if there is an existing stale mount.
    self._unmount_drive(mount_point)
    # ChromeOS root fs is in /dev/sdx3
    rootfs_partition = usbkey_dev + '3'
    try:
        mounted = self._mount_drive(rootfs_partition, mount_point)
        if not mounted:
            raise hosts.AutoservRepairError(
                    'Failed to extract firmware image; Unable to mount %s.'
                    % usbkey_dev,
                    'unable to mount usbkey')
        updater = os.path.join(mount_point,
                               'usr/sbin/chromeos-firmwareupdate')
        self.run('%s --unpack %s' % (updater, fw_dst))
        manifest_result = self.run('%s --manifest' % updater)
        return manifest_result.stdout
    finally:
        self._unmount_drive(mount_point)
414
def prepare_repair_firmware_image(self, fw_dst=None):
    """Prepare firmware image on the servohost for auto repair process
    to consume.

    The destination directory is wiped and re-created, the firmware
    images are extracted into it from the usbkey, and the image paths
    for the DUT's model are looked up in the extracted manifest.

    @param fw_dst: the path that we want to store firmware image on
                   the servohost.  When empty,
                   /tmp/firmware_image/<servo_port> is used.

    @returns: A tuple that contains ec firmware image path and bios
              firmware image path on the servohost, or None if type of
              image is not available based on manifest and dut's model.
    @raises AutoservRepairError: if the DUT's model cannot be determined,
            the manifest has no entry for the model, or the entry names
            neither an ec nor a bios image.
    """
    # servo_model wins; otherwise fall back to the DUT host info.  The host
    # info may be unset or None, which must end in the repair error below
    # rather than in an AttributeError.
    model = self.servo_model
    if not model:
        dut_host_info = getattr(self, '_dut_host_info', None)
        model = getattr(dut_host_info, 'model', None)
    if not model:
        raise hosts.AutoservRepairError(
                'Could not determine DUT\'s model.',
                'model infomation unknown')

    if not fw_dst:
        fw_dst = '/tmp/firmware_image/%s' % self.servo_port
    # Cleanup and re-create dst path to have a fresh start.
    self.run('rm -rf %s' % fw_dst)
    self.run('mkdir -p %s' % fw_dst)

    manifest = json.loads(self._extract_firmware_image_from_usbkey(fw_dst))
    # For models that have packed $MODEL_signed variant, we want use the
    # 'signed' variant once we get DVT devices, so try to read manifest
    # from $MODEL_signed first.
    build = manifest.get('%s_signed' % model) or manifest.get(model)
    if not build:
        raise hosts.AutoservRepairError('Could not find firmware manifest'
                ' for model:%s' % model, 'model manifest not found')

    def _image_path(target):
        """Return the path of `target`'s image, or None if not listed."""
        try:
            return os.path.join(fw_dst, build[target]['image'])
        except (KeyError, TypeError):
            # Missing key, or a null/non-mapping entry in the manifest:
            # this type of image is simply not available.
            return None

    ec_image = _image_path('ec')
    bios_image = _image_path('host')
    if not ec_image and not bios_image:
        raise hosts.AutoservRepairError('Could not find any firmware image'
                ' for model:%s' % model, 'cannot find firmware image')
    return ec_image, bios_image
Garry Wang7b0e1b72020-03-25 19:08:59 -0700458
def flash_ap_firmware_via_servo(self, image):
    """Flash AP firmware using a provided image.

    This is a short term enhancement for infra repair use. It runs
    'futility update', which will automatically determine various
    parameters needed for flashrom, and will preserve the GBB, VPD, and
    HWID for AP firmware update.
    @TODO(xianuowang@) Remove this method once b/148403277 implemented.

    @param image: the firmware image path on servohost.
    """
    flash_command = ('futility update -i %s --servo_port=%s'
                     % (image, self.servo_port))
    # The command is given up to 900 seconds to finish.
    self.run(flash_command, timeout=900)
472
def _probe_and_validate_usb_dev(self):
    """Ask servo for the usbkey dev path and check it on the servohost.

    Possible outcomes:
        1. An error occurs while probing the usb dev: returns empty
           string.
        2. Probing completes without error but reports no usb dev:
           raises AutoservRepairError.
        3. Probing reports a usb dev path that fdisk on the servohost
           does not accept: raises AutoservRepairError.
        4. The fdisk check times out: returns empty string.

    @returns: A string of usb dev path(e.g. '/dev/sdb'), or empty string
              if unexpected error occurred during probe.
    @raises: AutoservRepairError if servo couldn't probe the usb dev path
             (servo.probe_host_usb_dev() returns empty string), or the
             dev path is not valid block device to servohost.
    """
    logging.info('Validating image usbkey on servo.')
    try:
        probed_dev = self._servo.probe_host_usb_dev()
    except Exception as probe_error:
        # We don't want any unexpected or transient servo communicating
        # failure block usb repair, so capture all errors here.
        logging.error(probe_error, exc_info=True)
        logging.error('Unexpected error occurred on get usbkey dev path,'
                      ' skipping usbkey validation.')
        return ''

    if probed_dev:
        # probe_host_usb_dev() sometimes return stale record,
        # so we need to make sure the path exists in fdisk.
        fdisk_command = 'fdisk -l %s' % probed_dev
        try:
            fdisk_result = self.run(fdisk_command, ignore_status=True,
                                    timeout=30)
            if fdisk_result.exit_status == 0:
                return probed_dev
            logging.error('%s is reported from "image_usbkey_dev" control'
                          ' but not detected by fdisk!', probed_dev)
        except error.AutoservRunError as run_error:
            if 'Timeout encountered' not in str(run_error):
                raise
            logging.warning('Timeout encountered during fdisk run,'
                            ' skipping usbkey validation.')
            return ''

    raise hosts.AutoservRepairError(
            'No usbkey detected on servo, the usbkey may be either missing'
            ' or broken. Please replace usbkey on the servo and retry.',
            'missing usbkey')
521
def is_ec_supported(self):
    """Check if ec is supported on the servo_board.

    @returns: the `chrome_ec` value of the firmware config for
              servo_board/servo_model; False if servo_board is not set
              or reading the config fails.
    """
    if not self.servo_board:
        return False
    try:
        fw_config = config.Config(self.servo_board, self.servo_model)
        return fw_config.chrome_ec
    except Exception as e:
        # Reading the config is best effort; failures count as "no ec".
        logging.error('Unexpected error when read from firmware'
                      ' configs; %s', str(e))
    return False
532
def validate_image_usbkey(self):
    """Validate the recover usbkey on servo and report the image on it.

    First checks that there is a usbkey on servo that is accessible to
    servohost, then checks whether a ChromeOS image is already on the
    usb drive, so an unnecessary download and flash to the usbkey can be
    avoided.

    Please note the special error handling:
        1. If unexpected error happens, we return empty string. So repair
           actions will not get blocked.
        2. If no working usbkey present on servo, but no errors, we'll
           raise AutoservRepairError here.

    @returns: image_name on the usbkey, e.g. nami-release/R82.10138.0.0,
              or empty string if no test image detected, or unexpected
              error occurred.
    @raises:  AutoservRepairError if the usbkey is not detected on servo.
    """
    usbkey_path = self._probe_and_validate_usb_dev()
    if not usbkey_path:
        return ''
    return self.get_image_name_from_usbkey(usbkey_path)
Garry Wang7b0e1b72020-03-25 19:08:59 -0700555
def repair(self, silent=False):
    """Run the repair strategy for this servo host and record its state.

    On success the servo state becomes SERVO_STATE_WORKING and, on a
    labstation, any pending reboot request of this servo is withdrawn.
    On failure the state is re-determined (non-localhost only); a
    critical failure additionally disconnects the servo, stops servod
    and re-raises the exception.

    @param silent If true, suppress logging in `status.log`.
    """
    self.record(
            'INFO', None, None,
            'Beginning repair for servo host %s port %s serial %s'
            % (self.hostname, self.servo_port, self.servo_serial))
    try:
        self._repair_strategy.repair(self, silent)
        self._servo_state = servo_constants.SERVO_STATE_WORKING
        self.record('INFO', None, None,
                    'ServoHost repair set servo_state as WORKING')
        # If target is a labstation then try to withdraw any existing
        # reboot request created by this servo because it passed repair.
        if self.is_labstation():
            self.withdraw_reboot_request()
    except Exception as repair_error:
        if not self.is_localhost():
            self._servo_state = self.determine_servo_state()
            state_message = ('ServoHost repair set servo_state as %s'
                             % self._servo_state)
            self.record('INFO', None, None, state_message)
        if self._is_critical_error(repair_error):
            self.disconnect_servo()
            self.stop_servod()
            raise
583
def _is_critical_error(self, error):
    """Tell whether a verify/repair failure must be treated as critical.

    @param error: the exception raised by the verify/repair strategy.

    @returns: False only for a hosts.AutoservVerifyDependencyError whose
              is_critical() is false; True for every other exception.
    """
    is_dependency_error = isinstance(
            error, hosts.AutoservVerifyDependencyError)
    if not is_dependency_error or error.is_critical():
        logging.info(
                'Critical verify failure(s) detected during repair/verify '
                'servo. Disconnecting servo and running `stop servod`, all'
                ' repair actions and tests that depends on servo will not '
                'run.')
        return True

    logging.warning('Non-critical verify failure(s) detected during'
                    ' verify/repair servo, servo connection will'
                    ' still be up but may not be fully functional.'
                    ' Some repair actions and servo dependent'
                    ' tests may not run.')
    return False
Fang Deng5d518f42013-08-02 14:04:32 -0700599
def get_servo(self):
    """Return the servo object cached on this host.

    @return: a servo.Servo object, or whatever `self._servo` currently
             holds (it is reset to None on disconnect).
    @rtype: autotest_lib.server.cros.servo.servo.Servo
    """
    cached_servo = self._servo
    return cached_servo
607
def request_reboot(self):
    """Ask for the servohost to be rebooted by touching a flag file.

    The flag file path comes from |_reboot_file|; the exit status of the
    touch command is ignored.
    """
    logging.debug('Request to reboot servohost %s has been created by '
                  'servo with port # %s', self.hostname, self.servo_port)
    touch_cmd = 'touch %s' % self._reboot_file
    self.run(touch_cmd, ignore_status=True)
614
def withdraw_reboot_request(self):
    """Cancel a pending servohost reboot request, if there is one.

    The request is a flag file (|_reboot_file|) on the servohost; it is
    deleted with `rm -f` and the exit status of the command is ignored.
    """
    logging.debug('Withdrawing request to reboot servohost %s that created'
                  ' by servo with port # %s if exists.',
                  self.hostname, self.servo_port)
    remove_flag_cmd = 'rm -f %s' % self._reboot_file
    self.run(remove_flag_cmd, ignore_status=True)
623
def start_servod(self, quick_startup=False):
    """Launch servod on the servohost and wait for it to come up.

    Does nothing when the servohost is the localhost (crbug.com/1038168).

    @param quick_startup: bool, when True sleep for
                          SERVOD_QUICK_STARTUP_TIMEOUT after issuing the
                          start command, otherwise for
                          SERVOD_STARTUP_TIMEOUT.
    """
    if self.is_localhost():
        logging.debug("Servohost is a localhost, skipping start servod.")
        return

    # Each entry becomes one space-separated token of the start command.
    cmd_parts = ['start servod']
    if not self.servo_board:
        logging.warning('Board for DUT is unknown; starting servod'
                        ' assuming a pre-configured board.')
    else:
        cmd_parts.append('BOARD=%s' % self.servo_board)
        # MODEL is only passed along together with a known BOARD.
        if self.servo_model:
            cmd_parts.append('MODEL=%s' % self.servo_model)

    cmd_parts.append('PORT=%d' % self.servo_port)
    if self.servo_serial:
        cmd_parts.append('SERIAL=%s' % self.servo_serial)

    # Dual-v4 setups need servod started with DUAL_V4.
    if self.is_dual_setup():
        cmd_parts.append('DUAL_V4=1')

    # Some pools require servod to run with the cr50.xml config.
    if self._require_cr50_servod_config():
        cmd_parts.append('CONFIG=cr50.xml')

    if self.servo_recovery == True:
        cmd_parts.append('REC_MODE=1')

    # Caller-supplied extra arguments go last.
    if self.additional_servod_args:
        cmd_parts.append(self.additional_servod_args)

    # Drop the 'latest' log symlinks first, so that a failed servod
    # start cannot make us pick up logs of an older instance by mistake.
    self.remove_latest_log_symlinks()
    self.run(' '.join(cmd_parts), timeout=60)

    # `start servod` returns before the _ServodConnectionVerifier trigger
    # can succeed, so sleep to give servod time to become ready.
    # Servod on servo_v3 and labstation normally needs ~10 seconds, and
    # ~30 seconds in the rare case that all servos on a labstation are in
    # heavy use; the timeouts double those values. The quick timeout is
    # meant for the first servohost initialization, the standard one for
    # repair.
    timeout = (servo_constants.SERVOD_QUICK_STARTUP_TIMEOUT
               if quick_startup
               else servo_constants.SERVOD_STARTUP_TIMEOUT)
    logging.debug('Wait %s seconds for servod process fully up.', timeout)
    time.sleep(timeout)
    # Remember the timestamp of this instance's logs; it is compared
    # later to detect servod restarts.
    self._initial_instance_ts = self.get_instance_logs_ts()
Garry Wangc1288cf2019-12-17 14:58:00 -0800684
def stop_servod(self):
    """Stop the servod process of this servo's port on the servohost.

    Does nothing when the servohost is the localhost (crbug.com/1038168).
    Otherwise runs `stop servod` (exit status ignored) and then sleeps for
    SERVOD_TEARDOWN_TIMEOUT seconds.
    """
    if self.is_localhost():
        logging.debug("Servohost is a localhost, skipping stop servod.")
        return

    logging.debug('Stopping servod on port %s', self.servo_port)
    stop_cmd = 'stop servod PORT=%d' % self.servo_port
    self.run(stop_cmd, timeout=60, ignore_status=True)

    teardown_wait = servo_constants.SERVOD_TEARDOWN_TIMEOUT
    logging.debug('Wait %s seconds for servod process fully teardown.',
                  teardown_wait)
    time.sleep(teardown_wait)
Garry Wangc1288cf2019-12-17 14:58:00 -0800699
def restart_servod(self, quick_startup=False):
    """Restart servod on the servohost: stop it, then start it again.

    @param quick_startup: bool, forwarded unchanged to start_servod().
    """
    # Stop first; start_servod() is only reached if stop_servod() returns.
    self.stop_servod()
    self.start_servod(quick_startup)
705
def _process_servodtool_error(self, response):
    """Log the reason behind a non-zero servodtool response.

    @param response: command result whose |stdout| is searched for the
                     known servodtool error messages.
    """
    output = response.stdout
    if re.search(servo_constants.ERROR_MESSAGE_USB_HUB_NOT_COMPATIBLE,
                 output):
        logging.error('The servo is not plugged on a usb hub that supports'
                      ' power-cycle!')
        # Flip the flag so the label can be updated later in the process.
        self.smart_usbhub = False
    elif re.search(servo_constants.ERROR_MESSAGE_DEVICE_NOT_FOUND %
                   self.servo_serial, output):
        logging.error('No servo with serial %s found!', self.servo_serial)
    else:
        logging.error('Unexpected error occurred from usbhub control, please'
                      ' file a bug and inform chrome-fleet-software@ team!')
724
def get_main_servo_usb_path(self):
    """Look up the current usb-path of the main servo device.

    The usb-path is the folder where the usb-device was enumerated. It is
    queried with `servodtool device -s <serial> usb-path`.

    @returns: string, usb-path to the main servo device,
              e.g.: '/sys/bus/usb/devices/1-6.1.3.1'.
              An empty string ('') if the lookup failed.
    """
    # TODO remove try-except when fix crbug.com/1087964
    try:
        usb_path_cmd = ('servodtool device -s %s usb-path'
                        % self.servo_serial)
        resp = self.run(usb_path_cmd, ignore_status=True, timeout=30)
    except Exception as e:
        # Only timeout errors are expected here; other command failures
        # are filtered out by ignore_status=True.
        logging.debug('Attempt to get servo usb-path failed due to '
                      'timeout; %s', e)
        return ''

    if resp.exit_status == 0:
        usb_path = resp.stdout.strip()
        logging.info('Usb path of servo %s is %s',
                     self.servo_serial, usb_path)
        return usb_path

    self._process_servodtool_error(resp)
    return ''
Garry Wangffbd2162020-04-17 16:13:48 -0700750
Otabek Kasimov86062d02020-11-17 13:30:22 -0800751 def _get_servo_usb_devnum(self):
752 """Helper function to collect current usb devnum of servo."""
753 usb_path = self.get_main_servo_usb_path()
754 if not usb_path:
755 return ''
756 resp = self.run('cat %s/devnum' % usb_path, ignore_status=True)
Garry Wangffbd2162020-04-17 16:13:48 -0700757 if resp.exit_status != 0:
758 self._process_servodtool_error(resp)
759 return ''
760 return resp.stdout.strip()
761
def reboot_servo_v3_on_need(self):
    """Reboot a servo_v3 when one of the conditions below holds.

    1. There is an update pending on reboot.
    2. Servo_v3 has been up for more than 96 hours.

    Hosts whose board is not 'beaglebone_servo' are left alone. A failed
    reboot is logged and recorded, not raised.
    """
    if self.get_board() != 'beaglebone_servo':
        logging.info('Servo reboot is only applicable for servo V3.')
        return

    update_pending_reboot = (self._check_update_status() ==
                             self.UPDATE_STATE.PENDING_REBOOT)
    uptime_hours = float(self.check_uptime())/3600
    logging.info('Uptime of servo_v3: %s hour(s)', uptime_hours)
    long_up_time = uptime_hours > 96

    # A pending update takes precedence over long uptime.
    if update_pending_reboot:
        message = 'Starting reboot servo_v3 because an update is pending.'
        reboot_method = self._post_update_reboot
    elif long_up_time:
        message = 'Starting reboot servo_v3 because uptime > 96 hours.'
        reboot_method = self._servo_host_reboot
    else:
        # Neither condition is met: nothing to do.
        return

    self.record('INFO', None, None, message)
    logging.info(message)
    try:
        reboot_method()
    except Exception as e:
        logging.debug("Fail to reboot servo_v3; %s", e)
        message = ('Servo_v3 reboot failed, please check debug log '
                   'for details.')
    else:
        message = 'Servo_v3 reboot completed successfully.'
    logging.info(message)
    self.record('INFO', None, None, message)
Garry Wangffbd2162020-04-17 16:13:48 -0700798
799 def _reset_servo(self):
800 logging.info('Resetting servo through smart usbhub.')
Otabek Kasimov09192682020-06-01 18:17:44 -0700801 # TODO remove try-except when fix crbug.com/1087964
802 try:
803 resp = self.run('servodtool device -s %s power-cycle' %
804 self.servo_serial, ignore_status=True,
805 timeout=30)
806 if resp.exit_status != 0:
807 self._process_servodtool_error(resp)
808 return False
809 except Exception as e:
810 # Here we catch only timeout errors.
811 # Other errors is filtered by ignore_status=True
812 logging.debug('Attempt to reset servo failed due to timeout;'
813 ' %s', e)
Garry Wangffbd2162020-04-17 16:13:48 -0700814 return False
815
816 logging.debug('Wait %s seconds for servo to come back from reset.',
817 servo_constants.SERVO_RESET_TIMEOUT_SECONDS)
818 time.sleep(servo_constants.SERVO_RESET_TIMEOUT_SECONDS)
Garry Wang000c6c02020-05-11 21:27:23 -0700819 # change the flag so we can update this label in later process.
820 self.smart_usbhub = True
Garry Wangffbd2162020-04-17 16:13:48 -0700821 return True
822
def reset_servo(self):
    """Reset (power-cycle) the servo via the smart usbhub.

    Only applies to labstations. The usb devnum of the servo is read
    before and after the reset, and the outcome is logged and recorded.
    """
    if not self.is_labstation():
        logging.info('Servo reset is not applicable to servo_v3.')
        return

    devnum_before = self._get_servo_usb_devnum()
    logging.info('Servo usb devnum before reset: %s', devnum_before)
    if not self._reset_servo():
        message = ('Failed to reset servo with serial: %s. (Please ignore'
                   ' this error if the DUT is not connected to a smart'
                   ' usbhub).' % self.servo_serial)
        logging.warning(message)
        self.record('INFO', None, None, message)
        return

    devnum_after = self._get_servo_usb_devnum()
    logging.info('Servo usb devnum after reset: %s', devnum_after)
    if devnum_before and devnum_after:
        # Both readings are available, so they can be compared.
        if devnum_before != devnum_after:
            message = ('Reset servo with serial %s completed successfully!'
                       % self.servo_serial)
        else:
            message = 'Servo reset completed but devnum is still not changed!'
    else:
        message = ('Servo reset completed but unable to verify'
                   ' devnum change!')
    logging.info(message)
    self.record('INFO', None, None, message)
853
Ruben Rodriguez Buchillon93084d02020-01-21 15:17:36 -0800854 def _extract_compressed_logs(self, logdir, relevant_files):
855 """Decompress servod logs in |logdir|.
856
857 @param logdir: directory containing compressed servod logs.
858 @param relevant_files: list of files in |logdir| to consider.
859
860 @returns: tuple, (tarfiles, files) where
861 tarfiles: list of the compressed filenames that have been
862 extracted and deleted
863 files: list of the uncompressed files that were generated
864 """
865 # For all tar-files, first extract them to the directory, and
866 # then let the common flow handle them.
867 tarfiles = [cf for cf in relevant_files if
868 cf.endswith(self.COMPRESSION_SUFFIX)]
869 files = []
870 for f in tarfiles:
871 norm_name = os.path.basename(f)[:-len(self.COMPRESSION_SUFFIX)]
872 with tarfile.open(f) as tf:
873 # Each tarfile has only one member, as
874 # that's the compressed log.
875 member = tf.members[0]
876 # Manipulate so that it only extracts the basename, and not
877 # the directories etc.
878 member.name = norm_name
879 files.append(os.path.join(logdir, member.name))
880 tf.extract(member, logdir)
881 # File has been extracted: remove the compressed file.
882 os.remove(f)
883 return tarfiles, files
884
885 def _extract_mcu_logs(self, log_subdir):
886 """Extract MCU (EC, Cr50, etc) console output from servod debug logs.
887
888 Using the MCU_EXTRACTOR regex (above) extract and split out MCU console
889 lines from the logs to generate invidiual console logs e.g. after
890 this method, you can find an ec.txt and servo_v4.txt in |log_dir| if
891 those MCUs had any console input/output.
892
893 @param log_subdir: directory with log.DEBUG.txt main servod debug logs.
894 """
895 # Extract the MCU for each one. The MCU logs are only in the .DEBUG
896 # files
897 mcu_lines_file = os.path.join(log_subdir, 'log.DEBUG.txt')
898 if not os.path.exists(mcu_lines_file):
899 logging.info('No DEBUG logs found to extract MCU logs from.')
900 return
901 mcu_files = {}
902 mcu_file_template = '%s.txt'
903 with open(mcu_lines_file, 'r') as f:
904 for line in f:
905 match = self.MCU_EXTRACTOR.match(line)
906 if match:
907 mcu = match.group(self.MCU_GROUP).lower()
908 line = match.group(self.LINE_GROUP)
909 if mcu not in mcu_files:
910 mcu_file = os.path.join(log_subdir,
911 mcu_file_template % mcu)
912 mcu_files[mcu] = open(mcu_file, 'a')
913 fd = mcu_files[mcu]
914 fd.write(line + '\n')
915 for f in mcu_files:
916 mcu_files[f].close()
917
def remove_latest_log_symlinks(self):
    """Remove the convenience 'latest' symlinks of the servod logs.

    Runs `rm <remote_log_dir>/latest*` on the servohost; the exit status
    is ignored.
    """
    rm_cmd = 'rm %s/latest*' % self.remote_log_dir
    self.run(rm_cmd, stderr_tee=None, ignore_status=True)
923
def probe_servod_restart(self, instance_ts, outdir):
    """Grab servod logs from previous instances if part of this session.

    If servod crashed and restarted since the last time this host called
    start_servod(), this helper finds the logs of the earlier instances
    as well, and stores them with the |OLD_LOG_SUFFIX| so they can be
    investigated if necessary.

    After a restart it also issues a panicinfo command to the servo
    devices, to try and collect reboot information for debugging.

    @param instance_ts: the log timestamp that the current instance uses
    @param outdir: directory to create a subdirectory into to place the
                   servod logs into.
    """
    initial_ts = self._initial_instance_ts
    if initial_ts is None:
        logging.info('No log timestamp grabbed successfully on servod '
                     'startup. Cannot check device restarts. Ignoring.')
        return
    if instance_ts == initial_ts:
        logging.debug('Servod appears to have run without restarting')
        return

    # Servod seems to have restarted (at least once). |initial_ts| is the
    # first timestamp, and instance_ts is the current timestamp. Find all
    # timestamps in between them, and grab the logs for each.
    restarted_tss = self._find_instance_timestamps_between(initial_ts,
                                                           instance_ts)
    logging.info('Servod has restarted %d times between the start and the '
                 'end of this servo_host.', len(restarted_tss))
    logging.info('This might be an issue. Will extract all logs from each '
                 'instance.')
    logging.info('Logs that are not the currently running (about to turn '
                 'down) instance are maked with a .%s in their folder.',
                 self.OLD_LOG_SUFFIX)
    for old_ts in restarted_tss:
        self.get_instance_logs(old_ts, outdir, old=True)

    # Lastly, servod has restarted due to a potential issue. Try to get
    # panic information from servo micro and servo v4 for the current logs.
    # This can only happen if the |_servo| attribute is initialized.
    if not self._servo:
        return
    for mcu in ('servo_micro', 'servo_v4'):
        ctrl = '%s_uart_cmd' % mcu
        if not self._servo.has_control(ctrl):
            continue
        logging.info('Trying to retrieve %r panicinfo into logs', mcu)
        try:
            self._servo.set_nocheck(ctrl, 'panicinfo')
        except error.TestFail as e:
            logging.error('Failed to generate panicinfo for %r '
                          'logs. %s', mcu, str(e))
973
974 def _find_instance_timestamps_between(self, start_ts, end_ts):
975 """Find all log timestamps between [start_ts, end_ts).
976
977 @param start_ts: str, earliest log timestamp of interest
978 @param end_ts: str, latest log timestamp of interest
979
980 @returns: list, all timestamps between start_ts and end_ts, end_ts
981 exclusive, on the servo_host. An empty list on errors
982 """
983 # Simply get all timestamp, and then sort and remove
984 cmd = 'ls %s' % self.remote_log_dir
985 res = self.run(cmd, stderr_tee=None, ignore_status=True)
986 if res.exit_status != 0:
987 # Here we failed to find anything.
988 logging.info('Failed to find remote servod logs. Ignoring.')
989 return []
990 logfiles = res.stdout.strip().split()
991 timestamps = set()
992 for logfile in logfiles:
993 ts_match = self.TS_EXTRACTOR.match(logfile)
994 if not ts_match:
995 # Simply ignore files that fail the check. It might be the
996 # 'latest' symlinks or random files.
997 continue
998 timestamps.add(ts_match.group(self.TS_GROUP))
999 # At this point we have all unique timestamps.
1000 timestamps = sorted(timestamps)
1001 for ts in [start_ts, end_ts]:
1002 if ts not in timestamps:
1003 logging.error('Timestamp %r not in servod logs. Cannot query '
1004 'for timestamps in between %r and %r', ts,
1005 start_ts, end_ts)
1006 return []
1007 return timestamps[timestamps.index(start_ts):timestamps.index(end_ts)]
1008
def get_instance_logs_ts(self):
    """Retrieve the log timestamp of the currently running servod instance.

    The timestamp is parsed, using TS_EXTRACTOR, from the real filename
    that the 'latest.DEBUG' (or 'latest') symlink in the remote log
    directory points to.

    @returns: str, timestamp for current instance, or None on failure
    """
    # This cmd gives the real filename of the latest aka current log file,
    # or exits with NO_SYMLINKS_CODE if neither symlink exists.
    cmd = ('if [ -f %(dir)s/latest.DEBUG ];'
           'then realpath %(dir)s/latest.DEBUG;'
           'elif [ -f %(dir)s/latest ];'
           'then realpath %(dir)s/latest;'
           'else exit %(code)d;'
           'fi' % {'dir': self.remote_log_dir,
                   'code': self.NO_SYMLINKS_CODE})
    res = self.run(cmd, stderr_tee=None, ignore_status=True)

    if res.exit_status == 0:
        fname = os.path.basename(res.stdout.strip())
        # The timestamp is embedded in the name of the log file.
        ts_match = self.TS_EXTRACTOR.match(fname)
        if ts_match:
            return ts_match.group(self.TS_GROUP)
        logging.warning('Failed to extract timestamp from servod log file '
                        '%r. Skipping. The servo host is using outdated '
                        'servod logging and needs to be updated.', fname)
        return None

    if res.exit_status == self.NO_SYMLINKS_CODE:
        logging.warning('servod log latest symlinks not found. '
                        'This is likely due to an error starting up '
                        'servod. Ignoring..')
    else:
        logging.warning('Failed to find servod logs on servo host.')
        logging.warning(res.stderr.strip())
    return None
1042
def get_instance_logs(self, instance_ts, outdir, old=False):
    """Collect all logs with |instance_ts| and dump into a dir in |outdir|

    This method first collects all logs on the servo_host side pertaining
    to this servod instance (port, instantiation). It glues them together
    into combined log.[level].txt files and extracts all available MCU
    console I/O from the logs into individual files e.g. servo_v4.txt

    All the output can be found in a directory inside |outdir| that
    this generates based on |LOG_DIR|, the servod port, and the instance
    timestamp on the servo_host side.

    If no log file could be retrieved, the freshly created directory is
    removed again and the method returns without producing any output.

    @param instance_ts: log timestamp to grab logfiles for
    @param outdir: directory to create a subdirectory into to place the
                   servod logs into.
    @param old: bool, whether to append |OLD_LOG_SUFFIX| to output dir
    """
    # Create the local results log dir.
    log_dir = os.path.join(outdir, '%s_%s.%s' % (self.LOG_DIR,
                                                 str(self.servo_port),
                                                 instance_ts))
    if old:
        log_dir = '%s.%s' % (log_dir, self.OLD_LOG_SUFFIX)
    logging.info('Saving servod logs to %r.', log_dir)
    os.mkdir(log_dir)
    # Now, get all files with that timestamp.
    cmd = 'find %s -maxdepth 1 -name "log.%s*"' % (self.remote_log_dir,
                                                   instance_ts)
    res = self.run(cmd, stderr_tee=None, ignore_status=True)
    files = res.stdout.strip().split()
    try:
        self.get_file(files, log_dir, try_rsync=False)
        if not os.listdir(log_dir):
            logging.info('No servod logs retrieved. Ignoring, and removing '
                         '%r again.', log_dir)
            os.rmdir(log_dir)
            return
    except error.AutoservRunError as e:
        result = e.result_obj
        if result.exit_status != 0:
            stderr = result.stderr.strip()
            logging.warning("Couldn't retrieve servod logs. Ignoring: %s",
                            stderr or '\n%s' % result)
        # Remove the log_dir as nothing was added to it.
        # NOTE(review): os.rmdir() only removes empty directories; this
        # assumes a failed get_file() leaves no partial files behind --
        # TODO confirm.
        os.rmdir(log_dir)
        return
    # From here on work on the local copies only.
    local_files = [os.path.join(log_dir, f) for f in os.listdir(log_dir)]
    # TODO(crrev.com/c/1793030): remove no-level case once CL is pushed
    # The empty level name comes last: it matches every remaining file.
    for level_name in ('DEBUG', 'INFO', 'WARNING', ''):
        # Create the joint files for each loglevel. i.e log.DEBUG
        joint_file = self.JOINT_LOG_PREFIX
        if level_name:
            joint_file = '%s.%s' % (self.JOINT_LOG_PREFIX, level_name)
        # This helps with some online tools to avoid complaints about an
        # unknown filetype.
        joint_file = joint_file + '.txt'
        joint_path = os.path.join(log_dir, joint_file)
        # Substring match on the full local path of each file.
        files = [f for f in local_files if level_name in f]
        if not files:
            # TODO(crrev.com/c/1793030): remove no-level case once CL
            # is pushed
            continue
        # Extract compressed logs if any.
        compressed, extracted = self._extract_compressed_logs(log_dir,
                                                              files)
        # Swap the (now deleted) archives for the files they contained.
        files = list(set(files) - set(compressed))
        files.extend(extracted)
        # Need to sort. As they all share the same timestamp, and
        # loglevel, the index itself is sufficient. The highest index
        # is the oldest file, therefore we need a descending sort.
        # NOTE(review): the |level| default below is not used by the body,
        # which reads |level_name| from the enclosing scope instead.
        def sortkey(f, level=level_name):
            """Custom sortkey to sort based on rotation number int."""
            # A name ending in the level itself has no rotation number.
            if f.endswith(level_name): return 0
            return int(f.split('.')[-1])

        files.sort(reverse=True, key=sortkey)
        # Just rename the first file rather than building from scratch.
        os.rename(files[0], joint_path)
        with open(joint_path, 'a') as joint_f:
            for logfile in files[1:]:
                # Transfer the file to the joint file line by line.
                with open(logfile, 'r') as log_f:
                    for line in log_f:
                        joint_f.write(line)
                # File has been written over. Delete safely.
                os.remove(logfile)
        # Need to remove all files from |local_files| so we don't
        # analyze them again.
        local_files = list(set(local_files) - set(files) - set(compressed))
    # Lastly, extract MCU logs from the joint logs.
    self._extract_mcu_logs(log_dir)
1134
Garry Wang79e9af62019-06-12 15:19:19 -07001135 def _lock(self):
1136 """lock servohost by touching a file.
1137 """
1138 logging.debug('Locking servohost %s by touching %s file',
1139 self.hostname, self._lock_file)
1140 self.run('touch %s' % self._lock_file, ignore_status=True)
Garry Wang7c00b0f2019-06-25 17:28:17 -07001141 self._is_locked = True
Garry Wang79e9af62019-06-12 15:19:19 -07001142
Garry Wang79e9af62019-06-12 15:19:19 -07001143 def _unlock(self):
1144 """Unlock servohost by removing the lock file.
1145 """
1146 logging.debug('Unlocking servohost by removing %s file',
1147 self._lock_file)
1148 self.run('rm %s' % self._lock_file, ignore_status=True)
Garry Wang7c00b0f2019-06-25 17:28:17 -07001149 self._is_locked = False
Garry Wang79e9af62019-06-12 15:19:19 -07001150
def close(self):
    """Close the associated servo and the host object.

    In order: collect the logs of earlier servod instances (if servod
    restarted), close the servo object, collect the logs of the current
    servod instance, remove the servohost lock, stop servod, and finally
    close the underlying host. Steps that need ssh are skipped when the
    servohost is not up. Calling this again after it completed is a no-op.
    """
    # NOTE: throughout this method there are multiple attempts to catch
    # all errors. This is WAI as log grabbing should not fail tests.
    # However, the goal is to catch and handle/process all errors, thus
    # we print the traceback and ask for a bug.
    if self._closed:
        logging.debug('ServoHost is already closed.')
        return

    # Only attempt ssh related actions if servohost is sshable. We call
    # check_cached_up_status() first because it's lightweight and returns
    # much faster in the case servohost is down, however, we still want
    # to call is_up() later since check_cached_up_status() is a ping based
    # check and does not guarantee the servohost is sshable.
    servo_host_ready = self.check_cached_up_status() and self.is_up()

    if servo_host_ready:
        instance_ts = self.get_instance_logs_ts()
    else:
        logging.info('Servohost is down, will skip servod log collecting.')
        instance_ts = None
    # TODO(crbug.com/1011516): once enabled, remove the check against
    # localhost and instead check against log-rotation enablement.
    # Logs are only collected when a timestamp is known, a job object is
    # present, and the servohost is not the localhost.
    logs_available = (instance_ts is not None and
                      self.job and
                      not self.is_localhost())
    if logs_available:
        # Probe whether there was a servod restart, and grab those old
        # logs as well.
        try:
            self.probe_servod_restart(instance_ts, self.job.resultdir)
        except (error.AutoservRunError, error.TestFail) as e:
            logging.info('Failed to grab servo logs due to: %s. '
                         'This error is forgiven.', str(e))
        except Exception as e:
            logging.error('Unexpected error probing for old logs. %s. '
                          'Forgiven. Please file a bug and fix or catch '
                          'in log probing function', str(e),
                          exc_info=True)
    if self._servo:
        outdir = None if not self.job else self.job.resultdir
        # In some cases when we run as lab-tools, the job object is None.
        self._servo.close(outdir)

    if logs_available:
        # Grab current (not old like above) logs after the servo instance
        # was closed out.
        try:
            self.get_instance_logs(instance_ts, self.job.resultdir)
        except error.AutoservRunError as e:
            logging.info('Failed to grab servo logs due to: %s. '
                         'This error is forgiven.', str(e))
        except Exception as e:
            logging.error('Unexpected error grabbing servod logs. %s. '
                          'Forgiven. Please file a bug and fix or catch '
                          'in log grabbing function', str(e), exc_info=True)

    if self._is_locked and servo_host_ready:
        # Remove the lock if the servohost has been locked.
        try:
            self._unlock()
        except error.AutoservSSHTimeout:
            logging.error('Unlock servohost failed due to ssh timeout.'
                          ' It may caused by servohost went down during'
                          ' the task.')
    # We always want to stop servod after a task, to minimize the impact
    # of a bad servod process interfering with other servods.
    # (see crbug.com/1028665)
    if servo_host_ready:
        try:
            self.stop_servod()
        except error.AutoservRunError as e:
            logging.info(
                    "Failed to stop servod due to:\n%s\n"
                    "This error is forgiven.", str(e))

    super(ServoHost, self).close()
    # Mark closed.
    self._closed = True
Congbin Guoa1f9cba2018-07-03 11:36:59 -07001230
def get_servo_state(self):
    """Return the servo state currently stored on this host object."""
    current_state = self._servo_state
    return current_state
Otabek Kasimovcc9738e2020-02-14 16:17:15 -08001233
Otabek Kasimovc6f30412020-06-30 20:08:12 -07001234 def _get_host_metrics_data(self):
1235 return {'port': self.servo_port,
Otabek Kasimov0ea47362020-07-11 20:55:09 -07001236 'host': self.get_dut_hostname() or self.hostname,
Otabek Kasimovc6f30412020-06-30 20:08:12 -07001237 'board': self.servo_board or ''}
1238
def is_servo_board_present_on_servo_v3(self):
    """Check if servo board is detected on servo_v3.

    Runs `lsusb` on the servohost and greps its output for the vid:pid
    pairs listed below.

    @returns: True if a matching usb device is listed, False if not, and
              None if running the check raised (e.g. the command timed
              out); in that last case a timeout metric is incremented.
    """
    logging.debug('Started to detect servo board on servo_v3')
    vid_pids = ['18d1:5004', '0403:6014']
    not_detected = 'The servo board is not detected on servo_v3'
    try:
        # r'\|' is the alternation operator of grep's basic regex syntax.
        # A raw string is required: '\|' is not a valid Python escape.
        cmd = 'lsusb | grep "%s"' % r'\|'.join(vid_pids)
        result = self.run(cmd, ignore_status=True, timeout=30)
        if result.exit_status == 0 and result.stdout.strip():
            logging.debug('The servo board is detected on servo_v3')
            return True
        logging.debug('%s; %s', not_detected, result)
        return False
    except Exception as e:
        # can be triggered by timeout issue due running the script
        metrics.Counter(
            'chromeos/autotest/repair/servo_detection/timeout'
            ).increment(fields=self._get_host_metrics_data())
        logging.error('%s; %s', not_detected, str(e))
    return None
1259
def _require_cr50_servod_config(self):
    """Check whether we need start servod with CONFIG=cr50.xml.

    @returns: True if any pool listed in the DUT host info starts with
              `servo_constants.CR50_CONFIG_POOL_PREFIX`; False otherwise,
              including when no DUT host info is available.
    """
    dut_host_info = self.get_dut_host_info()
    if not dut_host_info:
        return False
    return any(
            pool.startswith(servo_constants.CR50_CONFIG_POOL_PREFIX)
            for pool in dut_host_info.pools)
1269
def get_verifier_state(self, tag):
    """Return the state of servo verifier.

    @param tag: tag of the verifier to look up; passed unchanged to
                `self._repair_strategy.verifier_is_good()`.

    @returns: bool or None
    """
    return self._repair_strategy.verifier_is_good(tag)
1276
def determine_servo_state(self):
    """Determine servo state based on the failed verifier.

    The verifier results are inspected in a fixed priority order and the
    state that belongs to the first failed verifier is returned. If none
    of the inspected verifiers explains the failure, a metrics counter is
    incremented and the generic broken state is returned.

    @returns: servo state value
    The state detecting based on first fail verifier or collecting of
    them.
    """
    failed = hosts.VERIFY_FAILED

    ssh = self.get_verifier_state('servo_ssh')
    servo_root_present = self.get_verifier_state('servo_root_present')
    servo_v3_present = self.get_verifier_state('servo_v3_root_present')
    servo_fw = self.get_verifier_state('servo_fw')
    start_servod = self.get_verifier_state('servod_started')
    create_servo = self.get_verifier_state('servod_connection')
    init_servo = self.get_verifier_state('servod_control')
    cr50_low_sbu = self.get_verifier_state('servo_cr50_low_sbu')
    cr50_off = self.get_verifier_state('servo_cr50_off')
    servo_topology = self.get_verifier_state('servo_topology')
    dut_connected = self.get_verifier_state('servo_dut_connected')
    hub_connected = self.get_verifier_state('servo_hub_connected')
    pwr_button = self.get_verifier_state('servo_pwr_button')
    lid_open = self.get_verifier_state('servo_lid_open')
    ec_board = self.get_verifier_state('servo_ec_board')
    cr50_console = self.get_verifier_state('servo_cr50_console')
    ccd_testlab = self.get_verifier_state('servo_ccd_testlab')

    # Any falsy ssh result (not only an explicit failure) means no SSH.
    if not ssh:
        return servo_constants.SERVO_STATE_NO_SSH
    if servo_root_present == failed:
        # Without a configured serial the setup itself is wrong;
        # otherwise the servo is simply not found.
        if not self.servo_serial:
            return servo_constants.SERVO_STATE_WRONG_CONFIG
        return servo_constants.SERVO_STATE_NOT_CONNECTED
    if servo_v3_present == failed:
        # if we cannot find required board on servo_v3
        return servo_constants.SERVO_STATE_NEED_REPLACEMENT
    if servo_fw == failed:
        return servo_constants.SERVO_STATE_NEED_REPLACEMENT

    if dut_connected == failed:
        return servo_constants.SERVO_STATE_DUT_NOT_CONNECTED
    if hub_connected == failed:
        logging.info('Servo HUB not connected')
        return servo_constants.SERVO_STATE_DUT_NOT_CONNECTED

    if cr50_low_sbu == failed:
        return servo_constants.SERVO_STATE_SBU_LOW_VOLTAGE
    if cr50_off == failed:
        return servo_constants.SERVO_STATE_CR50_NOT_ENUMERATED

    if servo_topology == failed:
        return servo_constants.SERVO_STATE_TOPOLOGY_ISSUE

    # TODO(otabek@): detect special cases detected by pwr_button
    # Only a counter is recorded here; the state is decided further below.
    if dut_connected == hosts.VERIFY_SUCCESS and pwr_button == failed:
        metrics.Counter(
                'chromeos/autotest/repair/servo_unexpected/pwr_button2'
        ).increment(fields=self._get_host_metrics_data())

    if start_servod == failed:
        return servo_constants.SERVO_STATE_SERVOD_ISSUE

    # one of the reason why servo can not initialized
    if cr50_console == failed:
        return servo_constants.SERVO_STATE_CR50_CONSOLE_MISSING
    if ccd_testlab == failed:
        return servo_constants.SERVO_STATE_CCD_TESTLAB_ISSUE

    if create_servo == failed or init_servo == failed:
        return servo_constants.SERVO_STATE_SERVOD_ISSUE

    if ec_board == failed:
        return servo_constants.SERVO_STATE_EC_BROKEN
    if pwr_button == failed:
        return servo_constants.SERVO_STATE_BAD_RIBBON_CABLE
    if lid_open == failed:
        return servo_constants.SERVO_STATE_LID_OPEN_FAILED

    metrics.Counter(
            'chromeos/autotest/repair/unknown_servo_state'
    ).increment(fields=self._get_host_metrics_data())
    logging.info('We do not have special state for this failure yet :)')
    return servo_constants.SERVO_STATE_BROKEN
1361
def is_servo_topology_supported(self):
    """Check if servo_topology is supported.

    @returns: True only when this host is reachable, is a labstation and
              has a servo serial; False otherwise (the reason is logged).
    """
    if not self.is_up_fast():
        logging.info('Servo-Host is not reachable.')
        return False
    if not self.is_labstation():
        logging.info('Servo-topology supported only for labstation.')
        return False
    if not self.servo_serial:
        logging.info('Servo-topology required a servo serial.')
        return False
    return True
1374
def get_topology(self):
    """Get servo topology.

    The `servo_topology.ServoTopology` object is created on first use
    (whenever `self._topology` is still falsy) and then reused.

    @returns: the topology object stored in `self._topology`.
    """
    if not self._topology:
        self._topology = servo_topology.ServoTopology(self)
    return self._topology
1380
def is_dual_setup(self):
    """Check if servo will run in dual setup.

    Dual setup used only for servo_v4 when used ccd_cr50 and servo_micro
    at the same time.

    @returns: True if `self.servo_setup` equals
              `servo_constants.SERVO_SETUP_VALUE_DUAL_V4`.
    """
    return self.servo_setup == servo_constants.SERVO_SETUP_VALUE_DUAL_V4
1388
def set_dut_health_profile(self, dut_health_profile):
    """Store the health profile of the DUT on this host.

    @param dut_health_profile: A DeviceHealthProfile object.
    """
    logging.debug('setting dut_health_profile field to (%s)',
                  dut_health_profile)
    self._dut_health_profile = dut_health_profile
1396
def get_dut_health_profile(self):
    """Return the DUT health profile stored on this host.

    @return A DeviceHealthProfile object.
    """
    return self._dut_health_profile
1402
Otabek Kasimovcc9738e2020-02-14 16:17:15 -08001403
def make_servo_hostname(dut_hostname):
    """Given a DUT's hostname, return the hostname of its servo.

    '-servo' is appended to the first dot-separated label; any domain
    part is kept unchanged.

    @param dut_hostname: hostname of a DUT.

    @return hostname of the DUT's servo.

    """
    # `separator` is '' when there is no domain part, so nothing is added.
    name, separator, domain = dut_hostname.partition('.')
    return name + '-servo' + separator + domain
1415
1416
def _map_afe_board_to_servo_board(afe_board):
    """Map a board we get from the AFE to a servo appropriate value.

    Many boards are identical to other boards for servo's purposes.
    This function makes that mapping: an explicit entry in the board map
    wins; otherwise the first matching known suffix is stripped.

    @param afe_board string board name received from AFE.
    @return board we expect servo to have.

    """
    KNOWN_SUFFIXES = ('-freon', '_freon', '_moblab', '-cheets')
    BOARD_MAP = {'gizmo': 'panther'}

    mapped_board = BOARD_MAP.get(afe_board)
    if mapped_board is None:
        mapped_board = afe_board
        for suffix in KNOWN_SUFFIXES:
            if afe_board.endswith(suffix):
                mapped_board = afe_board[:-len(suffix)]
                break
    if mapped_board != afe_board:
        logging.info('Mapping AFE board=%s to %s', afe_board, mapped_board)
    return mapped_board
1440
1441
def get_servo_args_for_host(dut_host):
    """Return servo data associated with a given DUT.

    Only attributes whose key is listed in
    `servo_constants.SERVO_ATTR_KEYS` are taken from the host info. Port
    values are converted to int. The board (after AFE-to-servo mapping)
    and the model are added when the host info provides them.

    @param dut_host   Instance of `Host` on which to find the servo
                      attributes.
    @return `servo_args` dict with host and an optional port, or None
            when the resulting dict has no servo host attribute.
    """
    info = dut_host.host_info_store.get()
    servo_args = {k: v for k, v in six.iteritems(info.attributes)
                  if k in servo_constants.SERVO_ATTR_KEYS}

    if servo_constants.SERVO_HOST_SSH_PORT_ATTR in servo_args:
        try:
            servo_args[servo_constants.SERVO_HOST_SSH_PORT_ATTR] = int(
                    servo_args[servo_constants.SERVO_HOST_SSH_PORT_ATTR])
        except ValueError:
            logging.error('servo host port is not an int: %s',
                          servo_args[servo_constants.SERVO_HOST_SSH_PORT_ATTR])
            # Reset servo_args because we don't want to use an invalid port.
            servo_args.pop(servo_constants.SERVO_HOST_SSH_PORT_ATTR, None)

    if servo_constants.SERVO_PORT_ATTR in servo_args:
        try:
            servo_args[servo_constants.SERVO_PORT_ATTR] = int(
                    servo_args[servo_constants.SERVO_PORT_ATTR])
        except ValueError:
            logging.error('servo port is not an int: %s',
                          servo_args[servo_constants.SERVO_PORT_ATTR])
            # Reset servo_args because we don't want to use an invalid port.
            # NOTE(review): this drops the HOST attribute (not the port),
            # so the final check below makes the function return None.
            # This looks like a deliberate way to reject the whole servo
            # configuration -- confirm before changing.
            servo_args.pop(servo_constants.SERVO_HOST_ATTR, None)

    if info.board:
        servo_board = _map_afe_board_to_servo_board(info.board)
        servo_args[servo_constants.SERVO_BOARD_ATTR] = servo_board
    if info.model:
        servo_args[servo_constants.SERVO_MODEL_ATTR] = info.model
    if servo_constants.SERVO_HOST_ATTR not in servo_args:
        return None
    return servo_args
Richard Barnetteea3e4602016-06-10 12:36:41 -07001479
1480
def _tweak_args_for_ssp_moblab(servo_args):
    """Replace a loopback servo host with the configured container IP.

    When the servo host in `servo_args` is 'localhost' or '127.0.0.1', it
    is overwritten in place with the 'host_container_ip' value from the
    'SSP' section of the global config (None when that is not set).

    @param servo_args: dict of servo arguments; it must contain the
                       `servo_constants.SERVO_HOST_ATTR` key and is
                       modified in place.
    """
    servo_host = servo_args[servo_constants.SERVO_HOST_ATTR]
    if servo_host in ('localhost', '127.0.0.1'):
        servo_args[servo_constants.SERVO_HOST_ATTR] = _CONFIG.get_config_value(
                'SSP', 'host_container_ip', type=str, default=None)
1486
1487
def create_servo_host(dut,
                      servo_args,
                      try_lab_servo=False,
                      try_servo_repair=False,
                      try_servo_recovery=False,
                      dut_host_info=None,
                      dut_health_profile=None):
    """Create a ServoHost object for a given DUT, if appropriate.

    This function attempts to create and verify or repair a `ServoHost`
    object for a servo connected to the given `dut`, subject to various
    constraints imposed by the parameters:
      * When the `servo_args` parameter is not `None`, a servo
        host must be created, and must be checked with `repair()`.
      * Otherwise, if a servo exists in the lab and `try_lab_servo` is
        true:
          * If `try_servo_repair` is true, then create a servo host and
            check it with `repair()`.
          * Otherwise, if the servo responds to `ping` then create a
            servo host and check it with `verify()`.

    In cases where `servo_args` was not `None`, repair failure
    exceptions are passed back to the caller; otherwise, exceptions
    are logged and then discarded.  Note that this only happens in cases
    where we're called from a test (not special task) control file that
    has an explicit dependency on servo.  In that case, we require that
    repair not write to `status.log`, so as to avoid polluting test
    results.

    TODO(jrbarnette):  The special handling for servo in test control
    files is a thorn in my flesh; I dearly hope to see it cut out before
    my retirement.

    Parameters for a servo host consist of a host name, port number, and
    DUT board, and are determined from one of these sources, in order of
    priority:
      * Servo attributes from the `dut` parameter take precedence over
        all other sources of information.
      * If a DNS entry for the servo based on the DUT hostname exists in
        the CrOS lab network, that hostname is used with the default
        port and the DUT's board.
      * If no other options are found, the parameters will be taken
        from the `servo_args` dict passed in from the caller.

    @param dut                  An instance of `Host` from which to take
                                servo parameters (if available).
    @param servo_args           A dictionary with servo parameters to use if
                                they can't be found from `dut`.  If this
                                argument is supplied, unrepaired exceptions
                                from `verify()` will be passed back to the
                                caller. The dict is not modified.
    @param try_lab_servo        If not true, servo host creation will be
                                skipped unless otherwise required by the
                                caller.
    @param try_servo_repair     If true, check a servo host with
                                `repair()` instead of `verify()`.
    @param try_servo_recovery   If true, start servod in recovery mode.
    @param dut_host_info:       A HostInfo object of the DUT that connected
                                to this servo.
    @param dut_health_profile:  DUT repair info with history.

    @returns: A tuple `(servo_host, servo_state)`. `servo_host` is a
              ServoHost object or None (see comments above);
              `servo_state` is a servo state value, or None when no servo
              was requested and no servo arguments were available.

    """
    servo_dependency = servo_args is not None
    if dut is not None and (try_lab_servo or servo_dependency):
        servo_args_override = get_servo_args_for_host(dut)
        if servo_args_override is not None:
            if utils.in_moblab_ssp():
                _tweak_args_for_ssp_moblab(servo_args_override)
            logging.debug(
                    'Overriding provided servo_args (%s) with arguments'
                    ' determined from the host (%s)',
                    servo_args,
                    servo_args_override,
            )
            servo_args = servo_args_override

    if servo_args is None:
        logging.debug('No servo_args provided, and failed to find overrides.')
        if try_lab_servo or servo_dependency:
            return None, servo_constants.SERVO_STATE_MISSING_CONFIG
        # For regular test case which not required the servo
        return None, None

    servo_hostname = servo_args.get(servo_constants.SERVO_HOST_ATTR)
    servo_port = servo_args.get(servo_constants.SERVO_PORT_ATTR)
    if not _is_servo_host_information_exist(servo_hostname, servo_port):
        logging.debug(
                'Servo connection info missed hostname: %s , port: %s',
                servo_hostname, servo_port)
        return None, servo_constants.SERVO_STATE_MISSING_CONFIG
    if not is_servo_host_information_valid(servo_hostname, servo_port):
        logging.debug(
                'Servo connection info is incorrect hostname: %s , port: %s',
                servo_hostname, servo_port)
        return None, servo_constants.SERVO_STATE_WRONG_CONFIG

    if try_servo_recovery:
        # Work on a copy so the dict owned by the caller is not mutated.
        servo_args = dict(servo_args)
        servo_args[servo_constants.SERVO_RECOVERY_MODE] = True

    newhost = ServoHost(**servo_args)
    if newhost.use_icmp and not newhost.is_up_fast(count=3):
        # ServoHost has internal check to wait if servo-host is in reboot
        # process. If servo-host still is not available this check will stop
        # further attempts as we do not have any option to recover servo_host.
        return None, servo_constants.SERVO_STATE_NO_SSH

    # Reset or reboot servo device only during AdminRepair tasks.
    if try_servo_repair:
        if newhost._is_locked:
            # Reset servo if the servo is locked, as we check if the servohost
            # is up, if the servohost is labstation and if the servohost is in
            # lab inside the locking logic.
            newhost.reset_servo()
        else:
            try:
                newhost.reboot_servo_v3_on_need()
            except Exception as e:
                logging.info('[Non-critical] Unexpected error while trying to'
                             ' reboot servo_v3, skipping the reboot; %s', e)

    if dut:
        newhost.set_dut_hostname(dut.hostname)
    if dut_host_info:
        newhost.set_dut_host_info(dut_host_info)
    if dut_health_profile and (try_lab_servo or try_servo_repair):
        try:
            if newhost.is_localhost():
                logging.info('Servohost is a localhost, skip device'
                             ' health profile setup...')
            else:
                dut_health_profile.init_profile(newhost)
                newhost.set_dut_health_profile(dut_health_profile)
        except Exception as e:
            logging.info(
                    '[Non-critical] Unexpected error while trying to'
                    ' load device health profile; %s', e)

    # Note that the logic of repair() includes everything done
    # by verify().  It's sufficient to call one or the other;
    # we don't need both.
    if servo_dependency:
        # Exceptions are intentionally not caught here: the caller has an
        # explicit servo dependency and must see repair failures.
        newhost.repair(silent=True)
        return newhost, newhost.get_servo_state()

    if try_servo_repair:
        try:
            newhost.repair()
        except Exception:
            logging.exception('servo repair failed for %s', newhost.hostname)
    else:
        try:
            newhost.verify()
        except Exception:
            logging.exception('servo verify failed for %s', newhost.hostname)
    return newhost, newhost.get_servo_state()
Otabek Kasimov7267a7a2020-03-04 11:18:45 -08001646
1647
def _is_servo_host_information_exist(hostname, port):
    """Check that both a servo hostname and a servo port were provided.

    @param hostname Hostname of the servohost.
    @param port     servo port number (an int or anything `int()` accepts).

    @returns: False if the hostname is None or blank, or if the port is
              None or cannot be converted to int; True otherwise.
    """
    if hostname is None or not hostname.strip():
        return False
    if port is None:
        return False
    if not isinstance(port, int):
        try:
            int(port)
        except (TypeError, ValueError):
            # TypeError covers values int() cannot take at all (e.g. a
            # list); such a port is treated as missing, not as a crash.
            return False
    return True
1660
1661
def is_servo_host_information_valid(hostname, port):
    """Check if provided servo attributes are valid.

    The attributes are valid when both are present, the port is in the
    range 1..65000, and the hostname is at least 5 characters long and
    consists only of letters, digits, '-', '_' and '.'.

    @param hostname Hostname of the servohost.
    @param port     servo port number.

    @returns: A bool value to indicate if provided servo attribute valid.
    """
    if not _is_servo_host_information_exist(hostname, port):
        return False
    # Check that the port is within the accepted range.
    port_int = int(port)
    if not 1 <= port_int <= 65000:
        return False
    # We expect the host to contain only letters, digits, '-', '_' or '.'.
    # `\Z` anchors at the very end of the string; `$` would also accept a
    # hostname that ends with a newline.
    if len(hostname) < 5 or not re.match(r'[a-zA-Z0-9_.-]*\Z', hostname):
        return False
    return True