blob: 6c6c09c0b73b257dff54c509543034cf2ff10eca [file] [log] [blame]
Derek Beckettf73baca2020-08-19 15:08:47 -07001# Lint as: python2, python3
Fang Deng5d518f42013-08-02 14:04:32 -07002# Copyright (c) 2013 The Chromium OS Authors. All rights reserved.
3# Use of this source code is governed by a BSD-style license that can be
4# found in the LICENSE file.
5#
6# Expects to be run in an environment with sudo and no interactive password
7# prompt, such as within the Chromium OS development chroot.
8
9
10"""This file provides core logic for servo verify/repair process."""
11
12
Derek Beckettf73baca2020-08-19 15:08:47 -070013from __future__ import absolute_import
14from __future__ import division
15from __future__ import print_function
16
Fang Deng5d518f42013-08-02 14:04:32 -070017import logging
Raul E Rangel52ca2e82018-07-03 14:10:14 -060018import os
Ruben Rodriguez Buchillon93084d02020-01-21 15:17:36 -080019import re
20import tarfile
Andrew McRaef0679932020-08-13 09:15:23 +100021import threading
Garry Wang2b5eef92020-08-21 16:23:35 -070022import json
Garry Wangc1288cf2019-12-17 14:58:00 -080023import time
Derek Beckettf73baca2020-08-19 15:08:47 -070024import six
25import six.moves.xmlrpc_client
Otabek Kasimov120b6fa2020-07-03 00:15:27 -070026import calendar
Fang Deng5d518f42013-08-02 14:04:32 -070027
28from autotest_lib.client.bin import utils
Garry Wang79e9af62019-06-12 15:19:19 -070029from autotest_lib.client.common_lib import error
Richard Barnette9a26ad62016-06-10 12:03:08 -070030from autotest_lib.client.common_lib import hosts
Garry Wang7b0e1b72020-03-25 19:08:59 -070031from autotest_lib.client.common_lib import lsbrelease_utils
Fang Deng5d518f42013-08-02 14:04:32 -070032from autotest_lib.client.common_lib.cros import retry
Christopher Wileycef1f902014-06-19 11:11:23 -070033from autotest_lib.client.common_lib.cros.network import ping_runner
Richard Barnette9a26ad62016-06-10 12:03:08 -070034from autotest_lib.server.cros.servo import servo
Richard Barnetted31580e2018-05-14 19:58:00 +000035from autotest_lib.server.hosts import servo_repair
Garry Wangebc015b2019-06-06 17:45:06 -070036from autotest_lib.server.hosts import base_servohost
Garry Wang11b5e872020-03-11 15:14:08 -070037from autotest_lib.server.hosts import servo_constants
Otabek Kasimov4ea636e2020-04-14 23:35:06 -070038from autotest_lib.server.cros.faft.utils import config
Garry Wang11b5e872020-03-11 15:14:08 -070039from autotest_lib.client.common_lib import global_config
Otabek Kasimov8475cce2020-07-14 12:11:31 -070040from autotest_lib.site_utils.admin_audit import servo_updater
Otabek Kasimov382c3bb2020-10-28 13:22:45 -070041from autotest_lib.server.cros.servo.topology import servo_topology
Garry Wangd7367482020-02-27 13:52:40 -080042
Otabek Kasimov15963492020-06-23 21:10:51 -070043try:
44 from chromite.lib import metrics
45except ImportError:
46 metrics = utils.metrics_mock
47
Dan Shi3b2adf62015-09-02 17:46:54 -070048_CONFIG = global_config.global_config
Fang Deng5d518f42013-08-02 14:04:32 -070049
Otabek Kasimova7ba91a2020-03-09 08:31:01 -070050
Garry Wangebc015b2019-06-06 17:45:06 -070051class ServoHost(base_servohost.BaseServoHost):
52 """Host class for a servo host(e.g. beaglebone, labstation)
Dana Goyette0b6e6402019-10-04 11:09:24 -070053 that with a servo instance for a specific port.
54
55 @type _servo: servo.Servo | None
56 """
Fang Deng5d518f42013-08-02 14:04:32 -070057
Raul E Rangel52ca2e82018-07-03 14:10:14 -060058 DEFAULT_PORT = int(os.getenv('SERVOD_PORT', '9999'))
Richard Barnette9a26ad62016-06-10 12:03:08 -070059
Dan Shie5b3c512014-08-21 12:12:09 -070060 # Timeout for initializing servo signals.
Wai-Hong Tam37b6ed32017-09-19 15:52:39 -070061 INITIALIZE_SERVO_TIMEOUT_SECS = 60
Richard Barnette9a26ad62016-06-10 12:03:08 -070062
Otabek Kasimov545739c2020-08-20 00:24:21 -070063 # Default timeout for run terminal command.
64 DEFAULT_TERMINAL_TIMEOUT = 30
65
xixuan6cf6d2f2016-01-29 15:29:00 -080066 # Ready test function
67 SERVO_READY_METHOD = 'get_version'
Fang Deng5d518f42013-08-02 14:04:32 -070068
Ruben Rodriguez Buchillon93084d02020-01-21 15:17:36 -080069 # Directory prefix on the servo host where the servod logs are stored.
70 SERVOD_LOG_PREFIX = '/var/log/servod'
71
72 # Exit code to use when symlinks for servod logs are not found.
73 NO_SYMLINKS_CODE = 9
74
75 # Directory in the job's results directory to dump the logs into.
76 LOG_DIR = 'servod'
77
78 # Prefix for joint loglevel files in the logs.
79 JOINT_LOG_PREFIX = 'log'
80
81 # Regex group to extract timestamp from logfile name.
82 TS_GROUP = 'ts'
83
84 # This regex is used to extract the timestamp from servod logs.
Garry Wang22f2e842020-09-09 20:19:19 -070085 # files always start with log.
Ruben Rodriguez Buchillon93084d02020-01-21 15:17:36 -080086 TS_RE = (r'log.'
87 # The timestamp is of format %Y-%m-%d--%H-%M-%S.MS
88 r'(?P<%s>\d{4}(\-\d{2}){2}\-(-\d{2}){3}.\d{3})'
89 # The loglevel is optional depending on labstation version.
90 r'(.(INFO|DEBUG|WARNING))?' % TS_GROUP)
91 TS_EXTRACTOR = re.compile(TS_RE)
92
93 # Regex group to extract MCU name from logline in servod logs.
94 MCU_GROUP = 'mcu'
95
96 # Regex group to extract logline from MCU logline in servod logs.
97 LINE_GROUP = 'line'
98
99 # This regex is used to extract the mcu and the line content from an
100 # MCU logline in servod logs. e.g. EC or servo_v4 console logs.
101 # Here is an example log-line:
102 #
103 # 2020-01-23 13:15:12,223 - servo_v4 - EC3PO.Console - DEBUG -
104 # console.py:219:LogConsoleOutput - /dev/pts/9 - cc polarity: cc1
105 #
106 # Here is conceptually how they are formatted:
107 #
108 # <time> - <MCU> - EC3PO.Console - <LVL> - <file:line:func> - <pts> -
109 # <output>
110 #
Garry Wang22f2e842020-09-09 20:19:19 -0700111 # The log format starts with a timestamp
Ruben Rodriguez Buchillon93084d02020-01-21 15:17:36 -0800112 MCU_RE = (r'[\d\-]+ [\d:,]+ '
113 # The mcu that is logging this is next.
114 r'- (?P<%s>\w+) - '
115 # Next, we have more log outputs before the actual line.
116 # Information about the file line, logging function etc.
117 # Anchor on EC3PO Console, LogConsoleOutput and dev/pts.
118 # NOTE: if the log format changes, this regex needs to be
119 # adjusted.
120 r'EC3PO\.Console[\s\-\w\d:.]+LogConsoleOutput - /dev/pts/\d+ - '
121 # Lastly, we get the MCU's console line.
122 r'(?P<%s>.+$)' % (MCU_GROUP, LINE_GROUP))
123 MCU_EXTRACTOR = re.compile(MCU_RE)
124
Otabek Kasimov545739c2020-08-20 00:24:21 -0700125 # Regex to detect timeout messages when USBC pigtail has timeout issue.
126 # e.g.: [475635.427072 PD TMOUT RX 1/1]
127 USBC_PIGTAIL_TIMEOUT_RE = r'\[[\d \.]{1,20}(PD TMOUT RX 1\/1)\]'
128
Ruben Rodriguez Buchillon93084d02020-01-21 15:17:36 -0800129 # Suffix to identify compressed logfiles.
130 COMPRESSION_SUFFIX = '.tbz2'
131
Ruben Rodriguez Buchillon5bac3062020-03-25 21:32:58 -0700132 # A suffix to mark servod log directories that came from instance that
133 # ran during this servo_host, but are not the last one running e.g. when
134 # an instance (on purpose, or due to a bug) restarted in the middle of the
135 # run.
136 OLD_LOG_SUFFIX = 'old'
137
Otabek Kasimovc6f30412020-06-30 20:08:12 -0700138 # Mapping servo board with their vid-pid
139 SERVO_VID_PID = {
140 'servo_v4':'18d1:501b',
141 'ccd_cr50':'18d1:5014',
142 'servo_micro':'18d1:501a',
143 'servo_v3':['18d1:5004', '0403:6014'],
144 }
145
Otabek Kasimovcc9738e2020-02-14 16:17:15 -0800146 def _init_attributes(self):
147 self._servo_state = None
148 self.servo_port = None
149 self.servo_board = None
150 self.servo_model = None
151 self.servo_serial = None
Garry Wangcb06f3b2020-10-08 20:56:21 -0700152 self.servo_setup = None
Garry Wang6a680062020-11-03 13:40:29 -0800153 self.additional_servod_args = None
Garry Wang000c6c02020-05-11 21:27:23 -0700154 # The flag that indicate if a servo is connected to a smart usbhub.
155 # TODO(xianuowang@) remove this flag once all usbhubs in the lab
156 # get replaced.
157 self.smart_usbhub = None
Otabek Kasimovcc9738e2020-02-14 16:17:15 -0800158 self._servo = None
Otabek Kasimov382c3bb2020-10-28 13:22:45 -0700159 self._topology = None
Andrew McRaef0679932020-08-13 09:15:23 +1000160 self._tunnel_proxy = None
161 self._tunnel_proxy_lock = threading.Lock()
Ruben Rodriguez Buchillon5bac3062020-03-25 21:32:58 -0700162 self._initial_instance_ts = None
Ruben Rodriguez Buchillon93084d02020-01-21 15:17:36 -0800163 # Flag to make sure that multiple calls to close do not result in the
164 # logic executing multiple times.
165 self._closed = False
Andrew McRaef0679932020-08-13 09:15:23 +1000166 # Per-thread local data
167 self._local = threading.local()
Fang Deng5d518f42013-08-02 14:04:32 -0700168
def _initialize(self,
                servo_host='localhost',
                servo_port=DEFAULT_PORT,
                servo_board=None,
                servo_model=None,
                servo_serial=None,
                servo_setup=None,
                additional_servod_args=None,
                is_in_lab=None,
                *args,
                **dargs):
    """Set up a ServoHost, i.e. a host that controls a servo.

    @param servo_host: Name of the host where the servod process
                       is running.
    @param servo_port: Port the servod process is listening on. Defaults
                       to the SERVOD_PORT environment variable if set,
                       otherwise 9999.
    @param servo_board: Board that the servo is connected to.
    @param servo_model: Model that the servo is connected to.
    @param servo_serial: Serial number of the servo device.
    @param servo_setup: Type of servo setup, e.g. REGULAR or DUAL_V4.
    @param additional_servod_args: Additional args that will append to
                                   servod start command.
    @param is_in_lab: True if the servo host is in Cros Lab. Default is set
                      to None, for which utils.host_is_in_lab_zone will be
                      called to check if the servo host is in Cros lab.

    """
    super(ServoHost, self)._initialize(hostname=servo_host,
                                       is_in_lab=is_in_lab, *args, **dargs)
    self._init_attributes()
    self.servo_port = int(servo_port)
    (self.servo_board,
     self.servo_model,
     self.servo_serial,
     self.servo_setup,
     self.additional_servod_args) = (servo_board,
                                     servo_model,
                                     servo_serial,
                                     servo_setup,
                                     additional_servod_args)

    if self.is_servo_topology_supported():
        self._topology = servo_topology.ServoTopology(self)

    # All per-instance paths are keyed by the servod port.
    port_tag = str(self.servo_port)
    # The location of the log files on the servo host for this instance.
    self.remote_log_dir = '%s_%s' % (self.SERVOD_LOG_PREFIX, port_tag)
    # Path of the servo host lock file.
    self._lock_file = self.TEMP_FILE_DIR + port_tag + self.LOCK_FILE_POSTFIX
    # File path to declare a reboot request.
    self._reboot_file = (self.TEMP_FILE_DIR + port_tag +
                         self.REBOOT_FILE_POSTFIX)

    # Lock the servo host if it's an in-lab labstation to prevent other
    # task to reboot it until current task completes. We also wait and
    # make sure the labstation is up here, in the case of the labstation is
    # in the middle of reboot.
    self._is_locked = False
    host_is_up = self.wait_up(self.REBOOT_TIMEOUT)
    if host_is_up and self.is_in_lab() and self.is_labstation():
        self._lock()
        try:
            self.wait_ready()
        except Exception as e:
            # Readiness problems are only logged; setup carries on.
            logging.info(
                    'Unexpected error while ensure labstation'
                    ' readiness; %s', str(e))

    self._repair_strategy = servo_repair.create_servo_repair_strategy()
Richard Barnettee519dcd2016-08-15 17:37:17 -0700240
Dana Goyetteafa62fd2020-03-16 13:45:27 -0700241 def __str__(self):
242 return "<%s '%s:%s'>" % (
243 type(self).__name__, self.hostname, self.servo_port)
244
def connect_servo(self):
    """Bring the servo up for later use.

    Runs the two setup stages in order: first initilize_servo(), then
    initialize_dut_for_servo().
    """
    self.initilize_servo()
    self.initialize_dut_for_servo()
250
def initilize_servo(self):
    """Establish a connection to the servod server on this host.

    Initializes `self._servo` and then verifies that all network
    connections are working.  This will create an ssh tunnel if
    it's required.
    """
    servo_object = servo.Servo(servo_host=self,
                               servo_serial=self.servo_serial)
    self._servo = servo_object
Richard Barnette9a26ad62016-06-10 12:03:08 -0700260
def initialize_dut_for_servo(self):
    """Prepare the servo for controlling the DUT.

    This does some setup for dut control, e.g. setup main servo_v4
    device, and also tests the connection between servo and DUT.  As a
    side effect of testing the connection, all signals on the target
    servo are reset to default values, and the USB stick is set to the
    neutral (off) position.

    @raises AutoservVerifyError: if `self._servo` has not been set up, or
            if the DUT initialization does not complete within
            INITIALIZE_SERVO_TIMEOUT_SECS.
    """
    if not self._servo:
        raise hosts.AutoservVerifyError('Servo object needs to be'
                                        ' initialized before initialize'
                                        ' DUT.')
    timed_out, _ = retry.timeout(
            self._servo.initialize_dut,
            timeout_sec=self.INITIALIZE_SERVO_TIMEOUT_SECS)
    if not timed_out:
        return
    raise hosts.AutoservVerifyError('Initialize dut for servo timed'
                                    ' out.')
Richard Barnette9a26ad62016-06-10 12:03:08 -0700278
def disconnect_servo(self):
    """Disconnect our servo if it exists.

    If we've previously successfully connected to our servo,
    disconnect any established ssh tunnel, and set `self._servo`
    back to `None`.  Does nothing when no servo is cached.
    """
    if not self._servo:
        return
    # N.B. This call is safe even without a tunnel:
    # rpc_server_tracker.disconnect() silently ignores
    # unknown ports.
    self.rpc_server_tracker.disconnect(self.servo_port)
    self._servo = None
Fang Deng5d518f42013-08-02 14:04:32 -0700292
Andrew McRaef0679932020-08-13 09:15:23 +1000293 def _maybe_create_servod_ssh_tunnel_proxy(self):
294 """Create a xmlrpc proxy for use with a ssh tunnel.
295 A lock is used to safely create a singleton proxy.
296 """
297 with self._tunnel_proxy_lock:
298 if self._tunnel_proxy is None:
299 self._tunnel_proxy = self.rpc_server_tracker.xmlrpc_connect(
300 None,
301 self.servo_port,
302 ready_test_name=self.SERVO_READY_METHOD,
303 timeout_seconds=60,
304 request_timeout_seconds=3600,
305 server_desc=str(self))
306
def get_servod_server_proxy(self):
    """Return a proxy if it exists; otherwise, create a new one.

    A proxy can either be a ssh tunnel based proxy, or a httplib
    based proxy.

    @returns: An xmlrpclib.ServerProxy that is connected to the servod
              server on the host.
    """
    if (servo_constants.ENABLE_SSH_TUNNEL_FOR_SERVO
        and not self.is_localhost()):
        # Only create the tunnel proxy when none is cached yet.
        if self._tunnel_proxy is None:
            self._maybe_create_servod_ssh_tunnel_proxy()
        return self._tunnel_proxy

    # xmlrpc/httplib is not thread-safe, so each thread must have its
    # own separate proxy connection.
    try:
        return self._local._per_thread_proxy
    except AttributeError:
        servod_url = 'http://%s:%s' % (self.hostname, self.servo_port)
        self._local._per_thread_proxy = (
                six.moves.xmlrpc_client.ServerProxy(servod_url))
    return self._local._per_thread_proxy
Wai-Hong Tam3a8a2552019-11-19 14:28:04 +0800328
def verify(self, silent=False):
    """Update the servo host and verify it's in a good state.

    On success the servo state is recorded as WORKING and, when a
    topology object exists, the topology is generated.  On any failure
    the servo state is re-determined (unless this is a localhost), and
    the exception is re-raised only when it is a critical error.

    @param silent   If true, suppress logging in `status.log`.
    """
    self.record('INFO', None, None,
                'Beginning verify for servo host %s port %s serial %s'
                % (self.hostname, self.servo_port, self.servo_serial))
    try:
        self._repair_strategy.verify(self, silent)
        self._servo_state = servo_constants.SERVO_STATE_WORKING
        self.record('INFO', None, None,
                    'ServoHost verify set servo_state as WORKING')
        if self._topology:
            self._topology.generate()
    except Exception as failure:
        if not self.is_localhost():
            self._servo_state = self.determine_servo_state()
            state_note = ('ServoHost verify set servo_state as %s'
                          % self._servo_state)
            self.record('INFO', None, None, state_note)
        if not self._is_critical_error(failure):
            return
        raise
Fang Deng5d518f42013-08-02 14:04:32 -0700352
Garry Wang2b5eef92020-08-21 16:23:35 -0700353 def _get_default_usbkey_mount_path(self):
354 return '/media/servo_usb/%s' % self.servo_port
Fang Deng5d518f42013-08-02 14:04:32 -0700355
def get_image_name_from_usbkey(self, usbkey_dev):
    """Mount usb drive and check ChromeOS image name on it if there is
    one. This method assumes the image_usbkey_direction is already set
    to servo side.

    The drive is always unmounted again before returning.

    @param usbkey_dev: usbkey dev path(e.g. /dev/sdb).

    @returns: image_name on the usbkey, e.g. nami-release/R82.10138.0.0,
              or empty string if no test image detected, or unexpected
              error occurred.
    """
    logging.info('Checking ChromeOS image name on usbkey.')
    mount_point = self._get_default_usbkey_mount_path()
    # Unmount if there is an existing stale mount.
    self._unmount_drive(mount_point)
    # ChromeOS root fs is in /dev/sdx3
    rootfs_partition = usbkey_dev + '3'
    try:
        mounted = self._mount_drive(rootfs_partition, mount_point)
        if not mounted:
            logging.debug('Unexpected error occurred on mount usb drive.')
            return ''

        lsb_release = self.run(
                'cat %s/etc/lsb-release' % mount_point,
                ignore_status=True).stdout.strip()

        # Only images whose release track mentions "test" are accepted.
        is_test_image = re.search(r'RELEASE_TRACK=.*test', lsb_release)
        if not is_test_image:
            logging.info('The image on usbkey is not a test image')
            return ''

        return lsbrelease_utils.get_chromeos_release_builder_path(
                lsb_release_content=lsb_release)
    finally:
        logging.debug('Image check compeleted, unmounting the usb drive.')
        self._unmount_drive(mount_point)
Garry Wang7b0e1b72020-03-25 19:08:59 -0700391
Garry Wang2b5eef92020-08-21 16:23:35 -0700392 def _extract_firmware_image_from_usbkey(self, fw_dst):
393 """Extract firmware images from the usbkey on servo, this method
394 assumes there is already a ChromeOS test image staged on servo.
395
Garry Wang4b980202020-09-24 17:00:17 -0700396 @param fw_dst: the path that we'll copy firmware images to.
Garry Wang2b5eef92020-08-21 16:23:35 -0700397
398 @returns: a json format string of firmware manifest data.
399 """
400 usbkey_dev = self._probe_and_validate_usb_dev()
401 if not usbkey_dev:
402 raise hosts.AutoservRepairError('Unexpected error occurred when'
403 ' probe usbkey dev path, please check logs for detail.')
404
405 mount_dst = self._get_default_usbkey_mount_path()
406 # Unmount if there is an existing stale mount.
407 self._unmount_drive(mount_dst)
408 # ChromeOS root fs is in /dev/sdx3
409 mount_src = usbkey_dev + '3'
410 try:
411 if not self._mount_drive(mount_src, mount_dst):
412 raise hosts.AutoservRepairError('Failed to extract firmware'
413 ' image; Unable to mount %s.' % usbkey_dev,
414 'unable to mount usbkey')
415 updater_bin = os.path.join(mount_dst,
416 'usr/sbin/chromeos-firmwareupdate')
417 self.run('%s --unpack %s' % (updater_bin, fw_dst))
418 return self.run('%s --manifest' % updater_bin).stdout
419 finally:
420 self._unmount_drive(mount_dst)
421
def prepare_repair_firmware_image(self, fw_dst=None):
    """Prepare firmware image on the servohost for auto repair process
    to consume.

    @param fw_dst: the path that we want to store firmware image on
                   the servohost. When not given,
                   /tmp/firmware_image/<servo_port> is used. The path is
                   removed and re-created before extraction.

    @returns: A tuple that contains ec firmware image path and bios
              firmware image path on the servohost, or None if type of
              image is not available based on manifest and dut's model.
    @raises: AutoservRepairError if the model is unknown, the manifest
             has no entry for the model, or neither image is listed.
    """
    model = self.servo_model or self._dut_host_info.model
    if not model:
        raise hosts.AutoservRepairError(
                'Could not determine DUT\'s model.',
                'model infomation unknown')

    fw_dst = fw_dst or '/tmp/firmware_image/%s' % self.servo_port
    # Cleanup and re-create dst path to have a fresh start.
    for command_template in ('rm -rf %s', 'mkdir -p %s'):
        self.run(command_template % fw_dst)

    manifest = json.loads(self._extract_firmware_image_from_usbkey(fw_dst))
    # For models that have packed $MODEL_signed variant, we want use the
    # 'signed' variant once we get DVT devices, so try to read manifest
    # from $MODEL_signed first.
    signed_key = '%s_signed' % model
    build = manifest.get(signed_key) or manifest.get(model)
    if not build:
        raise hosts.AutoservRepairError('Could not find firmware manifest'
                ' for model:%s' % model, 'model manifest not found')

    def _image_path(component):
        """Path of the component's image under fw_dst, None if unlisted."""
        try:
            return os.path.join(fw_dst, build[component]['image'])
        except KeyError:
            return None

    ec_image = _image_path('ec')
    bios_image = _image_path('host')
    if not (ec_image or bios_image):
        raise hosts.AutoservRepairError('Could not find any firmware image'
                ' for model:%s' % model, 'cannot find firmware image')
    return ec_image, bios_image
Garry Wang7b0e1b72020-03-25 19:08:59 -0700465
def flash_ap_firmware_via_servo(self, image):
    """Flash AP firmware using a provided image.

    This is a short term enhancement for infra repair use; it uses
    'futility update' which will automatically determine various
    parameters needed for flashrom, and will preserve the GBB, VPD, and
    HWID for AP firmware update.
    @TODO(xianuowang@) Remove this method once b/148403277 implemented.

    @param image: the firmware image path on servohost.
    """
    flash_command = ('futility update -i %s --servo_port=%s'
                     % (image, self.servo_port))
    self.run(flash_command, timeout=900)
479
Garry Wang70e5d062020-04-03 18:01:05 -0700480 def _probe_and_validate_usb_dev(self):
481 """This method probe the usb dev path by talking to servo, and then
482 validate the dev path is valid block device to servohost.
483 Possible output:
484 1. Encounter error during probe usb dev, returns empty string.
485 2. probe usb dev completed without error but cannot find usb dev,
486 raise AutoservRepairError.
487 3. probe usb dev find a usb dev path, but failed validation in this
488 method, raise AutoservRepairError.
Garry Wang7b0e1b72020-03-25 19:08:59 -0700489
Garry Wang70e5d062020-04-03 18:01:05 -0700490 @returns: A string of usb dev path(e.g. '/dev/sdb'), or empty string
491 if unexpected error occurred during probe.
492 @raises: AutoservRepairError if servo couldn't probe the usb dev path
493 (servo.probe_host_usb_dev() returns empty string), or the dev path is
494 not valid block device to servohost.
Garry Wang7b0e1b72020-03-25 19:08:59 -0700495 """
496 logging.info('Validating image usbkey on servo.')
Garry Wang7b0e1b72020-03-25 19:08:59 -0700497 try:
Garry Wang70e5d062020-04-03 18:01:05 -0700498 usb_dev = self._servo.probe_host_usb_dev()
Garry Wang7b0e1b72020-03-25 19:08:59 -0700499 except Exception as e:
500 # We don't want any unexpected or transient servo communicating
501 # failure block usb repair, so capture all errors here.
502 logging.error(e, exc_info=True)
503 logging.error('Unexpected error occurred on get usbkey dev path,'
504 ' skipping usbkey validation.')
505 return ''
506
Garry Wang70e5d062020-04-03 18:01:05 -0700507 if usb_dev:
508 # probe_host_usb_dev() sometimes return stale record,
509 # so we need to make sure the path exists in fdisk.
Otabek Kasimov77bff672020-10-08 15:52:03 -0700510 validate_cmd = 'fdisk -l %s' % usb_dev
Garry Wang11441182020-06-16 18:34:14 -0700511 try:
Otabek Kasimov77bff672020-10-08 15:52:03 -0700512 resp = self.run(validate_cmd, ignore_status=True, timeout=30)
Garry Wang11441182020-06-16 18:34:14 -0700513 if resp.exit_status == 0:
514 return usb_dev
Garry Wang11441182020-06-16 18:34:14 -0700515 logging.error('%s is reported from "image_usbkey_dev" control'
516 ' but not detected by fdisk!', usb_dev)
517 except error.AutoservRunError as e:
518 if 'Timeout encountered' in str(e):
519 logging.warning('Timeout encountered during fdisk run,'
520 ' skipping usbkey validation.')
521 return ''
522 raise
Garry Wang70e5d062020-04-03 18:01:05 -0700523
524 raise hosts.AutoservRepairError(
525 'No usbkey detected on servo, the usbkey may be either missing'
526 ' or broken. Please replace usbkey on the servo and retry.',
527 'missing usbkey')
528
def is_ec_supported(self):
    """Check if ec is supported on the servo_board.

    @returns: the `chrome_ec` value of the firmware config for the
              servo board/model; False when no servo board is set or
              when reading the firmware config fails.
    """
    if not self.servo_board:
        return False
    try:
        return config.Config(self.servo_board, self.servo_model).chrome_ec
    except Exception as e:
        logging.error('Unexpected error when read from firmware'
                      ' configs; %s', str(e))
    return False
539
def validate_image_usbkey(self):
    """Validate the recovery usbkey and report the image staged on it.

    This method first validates that there is a recover usbkey on servo
    that is accessible to servohost, and second checks if a ChromeOS
    image is already on the usb drive and returns the image_name so we
    can avoid unnecessary download and flash to the recover usbkey on
    servo.

    Please note that, there is special error handling logic here:
    1. If unexpected error happens, we return empty string. So repair
       actions will not get blocked.
    2. If no working usbkey present on servo, but no errors, we'll raise
       AutoservRepairError here.

    @returns: image_name on the usbkey, e.g. nami-release/R82.10138.0.0,
              or empty string if no test image detected, or unexpected
              error occurred.
    @raises:  AutoservRepairError if the usbkey is not detected on servo.
    """
    usb_dev = self._probe_and_validate_usb_dev()
    if not usb_dev:
        return ''
    return self.get_image_name_from_usbkey(usb_dev)
Garry Wang7b0e1b72020-03-25 19:08:59 -0700562
def repair(self, silent=False):
    """Attempt to repair servo host.

    On success the servo state is recorded as WORKING, a labstation's
    pending reboot request from this servo is withdrawn, and the
    topology is generated when a topology object exists.  On any failure
    the servo state is re-determined (unless this is a localhost); for a
    critical error the servo is disconnected, servod is stopped and the
    exception is re-raised.

    @param silent   If true, suppress logging in `status.log`.
    """
    self.record('INFO', None, None,
                'Beginning repair for servo host %s port %s serial %s'
                % (self.hostname, self.servo_port, self.servo_serial))
    try:
        self._repair_strategy.repair(self, silent)
        self._servo_state = servo_constants.SERVO_STATE_WORKING
        self.record('INFO', None, None,
                    'ServoHost repair set servo_state as WORKING')
        # If target is a labstation then try to withdraw any existing
        # reboot request created by this servo because it passed repair.
        if self.is_labstation():
            self.withdraw_reboot_request()
        if self._topology:
            self._topology.generate()
    except Exception as failure:
        if not self.is_localhost():
            self._servo_state = self.determine_servo_state()
            state_note = ('ServoHost repair set servo_state as %s'
                          % self._servo_state)
            self.record('INFO', None, None, state_note)
        if not self._is_critical_error(failure):
            return
        self.disconnect_servo()
        self.stop_servod()
        raise
592
def _is_critical_error(self, error):
    """Decide whether a verify/repair failure is critical.

    @param error: the exception raised during verify/repair.

    @returns: False only when the error is an
              AutoservVerifyDependencyError whose is_critical() is
              false; True for every other error.
    """
    non_critical = (isinstance(error, hosts.AutoservVerifyDependencyError)
                    and not error.is_critical())
    if not non_critical:
        logging.info(
                'Critical verify failure(s) detected during repair/verify '
                'servo. Disconnecting servo and running `stop servod`, all'
                ' repair actions and tests that depends on servo will not '
                'run.')
        return True
    logging.warning('Non-critical verify failure(s) detected during'
                    ' verify/repair servo, servo connection will'
                    ' still be up but may not be fully functional.'
                    ' Some repair actions and servo dependent'
                    ' tests may not run.')
    return False
Fang Deng5d518f42013-08-02 14:04:32 -0700608
def get_servo(self):
    """Return the cached servo.Servo object.

    @return: the value currently held in `self._servo`.
    @rtype: autotest_lib.server.cros.servo.servo.Servo
    """
    cached_servo = self._servo
    return cached_servo
616
def request_reboot(self):
    """Request a servohost reboot by touching the reboot flag file.

    The request is only a marker file (self._reboot_file) created on the
    servohost; failures of the touch command are ignored.
    """
    logging.debug('Request to reboot servohost %s has been created by '
                  'servo with port # %s', self.hostname, self.servo_port)
    touch_cmd = 'touch %s' % self._reboot_file
    self.run(touch_cmd, ignore_status=True)
623
def withdraw_reboot_request(self):
    """Withdraw a pending servohost reboot request, if there is one.

    Removes the reboot flag file (self._reboot_file) with `rm -f`, so a
    missing file is not an error; the command status is ignored.
    """
    logging.debug('Withdrawing request to reboot servohost %s that created'
                  ' by servo with port # %s if exists.',
                  self.hostname, self.servo_port)
    remove_cmd = 'rm -f %s' % self._reboot_file
    self.run(remove_cmd, ignore_status=True)
632
def start_servod(self, quick_startup=False):
    """Start the servod process on servohost.

    Builds the `start servod` command from this host's servo settings,
    runs it, sleeps to give servod time to come up and finally caches the
    log timestamp of the new instance in self._initial_instance_ts.
    Nothing is done when the servohost is the localhost.

    @param quick_startup: when true, wait SERVOD_QUICK_STARTUP_TIMEOUT
                          after starting servod instead of
                          SERVOD_STARTUP_TIMEOUT.
    """
    # Skip if running on the localhost.(crbug.com/1038168)
    if self.is_localhost():
        logging.debug("Servohost is a localhost, skipping start servod.")
        return

    # Collect the command pieces and join them with single spaces.
    pieces = ['start servod']
    if not self.servo_board:
        logging.warning('Board for DUT is unknown; starting servod'
                        ' assuming a pre-configured board.')
    else:
        pieces.append('BOARD=%s' % self.servo_board)
        # MODEL is only passed along together with BOARD.
        if self.servo_model:
            pieces.append('MODEL=%s' % self.servo_model)

    pieces.append('PORT=%d' % self.servo_port)
    if self.servo_serial:
        pieces.append('SERIAL=%s' % self.servo_serial)

    # Start servod with dual_v4 based on servo_setup.
    if self.is_dual_setup():
        pieces.append('DUAL_V4=1')

    # Start servod with CONFIG=cr50.xml which required for some pools.
    if self._require_cr50_servod_config():
        pieces.append('CONFIG=cr50.xml')

    # Adding customized args if any.
    if self.additional_servod_args:
        pieces.append(self.additional_servod_args)
    start_cmd = ' '.join(pieces)

    # Remove the symbolic links from the logs. This helps ensure that
    # a failed servod instantiation does not cause us to grab old logs
    # by mistake.
    self.remove_latest_log_symlinks()
    self.run(start_cmd, timeout=60)

    # There's a lag between when `start servod` completes and when
    # the _ServodConnectionVerifier trigger can actually succeed.
    # The call to time.sleep() below gives time to make sure that
    # the trigger won't fail after we return.

    # Normally servod on servo_v3 and labstation take ~10 seconds to ready,
    # But in the rare case all servo on a labstation are in heavy use they
    # may take ~30 seconds. So the timeout value will double these value,
    # and we'll try quick start up when first time initialize servohost,
    # and use standard start up timeout in repair.
    timeout = (servo_constants.SERVOD_QUICK_STARTUP_TIMEOUT
               if quick_startup
               else servo_constants.SERVOD_STARTUP_TIMEOUT)
    logging.debug('Wait %s seconds for servod process fully up.', timeout)
    time.sleep(timeout)
    # Cache the initial instance timestamp to check against servod restarts
    self._initial_instance_ts = self.get_instance_logs_ts()
Garry Wangc1288cf2019-12-17 14:58:00 -0800690
def stop_servod(self):
    """Stop the servod process on servohost.

    Runs `stop servod` for this host's servo port (ignoring the command
    status) and then sleeps SERVOD_TEARDOWN_TIMEOUT seconds so servod can
    finish tearing down. Nothing is done when the servohost is the
    localhost.
    """
    # Skip if running on the localhost.(crbug.com/1038168)
    if self.is_localhost():
        logging.debug("Servohost is a localhost, skipping stop servod.")
        return

    logging.debug('Stopping servod on port %s', self.servo_port)
    stop_cmd = 'stop servod PORT=%d' % self.servo_port
    self.run(stop_cmd, timeout=60, ignore_status=True)
    teardown_wait = servo_constants.SERVOD_TEARDOWN_TIMEOUT
    logging.debug('Wait %s seconds for servod process fully teardown.',
                  teardown_wait)
    time.sleep(teardown_wait)
Garry Wangc1288cf2019-12-17 14:58:00 -0800705
def restart_servod(self, quick_startup=False):
    """Restart servod on the servohost: stop it, then start it again.

    @param quick_startup: forwarded unchanged to start_servod().
    """
    self.stop_servod()
    self.start_servod(quick_startup)
711
def _process_servodtool_error(self, response):
    """Log the reason behind a non-zero servodtool response.

    The response stdout is matched against the known servodtool error
    patterns from servo_constants; anything unrecognized is logged as an
    unexpected error.

    @param response: command result object; only its stdout is inspected.
    """
    if re.search(servo_constants.ERROR_MESSAGE_USB_HUB_NOT_COMPATIBLE,
                 response.stdout):
        logging.error('The servo is not plugged on a usb hub that supports'
                      ' power-cycle!')
        # change the flag so we can update this label in later process.
        self.smart_usbhub = False
    elif re.search(servo_constants.ERROR_MESSAGE_DEVICE_NOT_FOUND %
                   self.servo_serial, response.stdout):
        logging.error('No servo with serial %s found!', self.servo_serial)
    else:
        logging.error('Unexpected error occurred from usbhub control, please'
                      ' file a bug and inform chrome-fleet-software@ team!')
730
Garry Wangffbd2162020-04-17 16:13:48 -0700731 def _get_servo_usb_devnum(self):
732 """Helper function to collect current usb devnum of servo.
733 """
Otabek Kasimov09192682020-06-01 18:17:44 -0700734 # TODO remove try-except when fix crbug.com/1087964
735 try:
736 cmd = 'servodtool device -s %s usb-path' % self.servo_serial
737 resp = self.run(cmd, ignore_status=True, timeout=30)
738 except Exception as e:
739 # Here we catch only timeout errors.
740 # Other errors is filtered by ignore_status=True
741 logging.debug('Attempt to get servo usb-path failed due to '
742 'timeout; %s', e)
743 return ''
744
Garry Wangffbd2162020-04-17 16:13:48 -0700745 if resp.exit_status != 0:
746 self._process_servodtool_error(resp)
747 return ''
748 usb_path = resp.stdout.strip()
749 logging.info('Usb path of servo %s is %s', self.servo_serial, usb_path)
750
751 resp = self.run('cat %s/devnum' % usb_path,
752 ignore_status=True)
753 if resp.exit_status != 0:
754 self._process_servodtool_error(resp)
755 return ''
756 return resp.stdout.strip()
757
def reboot_servo_v3_on_need(self):
    """Reboot a servo_v3 host when one of the conditions below holds.

    1. There is an update pending on reboot.
    2. Servo_v3 has been up for more than 96 hours.

    Hosts whose board is not 'beaglebone_servo' are left alone. A failed
    reboot is logged and recorded but not raised.
    """
    if self.get_board() != 'beaglebone_servo':
        logging.info('Servo reboot is only applicable for servo V3.')
        return

    update_pending_reboot = (self._check_update_status() ==
                             self.UPDATE_STATE.PENDING_REBOOT)
    uptime_hours = float(self.check_uptime())/3600
    logging.info('Uptime of servo_v3: %s hour(s)', uptime_hours)
    long_up_time = uptime_hours > 96

    # Skip reboot if neither condition are met.
    if not update_pending_reboot and not long_up_time:
        return

    # A pending update takes priority over the uptime based reboot.
    if update_pending_reboot:
        reboot_method = self._post_update_reboot
        message = 'Starting reboot servo_v3 because an update is pending.'
    else:
        reboot_method = self._servo_host_reboot
        message = 'Starting reboot servo_v3 because uptime > 96 hours.'
    self.record('INFO', None, None, message)
    logging.info(message)

    try:
        reboot_method()
    except Exception as e:
        logging.debug("Fail to reboot servo_v3; %s", e)
        message = ('Servo_v3 reboot failed, please check debug log '
                   'for details.')
    else:
        message = 'Servo_v3 reboot completed successfully.'
    logging.info(message)
    self.record('INFO', None, None, message)
Garry Wangffbd2162020-04-17 16:13:48 -0700794
795 def _reset_servo(self):
796 logging.info('Resetting servo through smart usbhub.')
Otabek Kasimov09192682020-06-01 18:17:44 -0700797 # TODO remove try-except when fix crbug.com/1087964
798 try:
799 resp = self.run('servodtool device -s %s power-cycle' %
800 self.servo_serial, ignore_status=True,
801 timeout=30)
802 if resp.exit_status != 0:
803 self._process_servodtool_error(resp)
804 return False
805 except Exception as e:
806 # Here we catch only timeout errors.
807 # Other errors is filtered by ignore_status=True
808 logging.debug('Attempt to reset servo failed due to timeout;'
809 ' %s', e)
Garry Wangffbd2162020-04-17 16:13:48 -0700810 return False
811
812 logging.debug('Wait %s seconds for servo to come back from reset.',
813 servo_constants.SERVO_RESET_TIMEOUT_SECONDS)
814 time.sleep(servo_constants.SERVO_RESET_TIMEOUT_SECONDS)
Garry Wang000c6c02020-05-11 21:27:23 -0700815 # change the flag so we can update this label in later process.
816 self.smart_usbhub = True
Garry Wangffbd2162020-04-17 16:13:48 -0700817 return True
818
def reset_servo(self):
    """Reset (power-cycle) the servo via the smart usbhub.

    Only applies to labstation hosts. The usb devnum of the servo is
    collected before and after the reset and compared to report whether
    the reset took effect; the outcome is logged and recorded as INFO.
    """
    if not self.is_labstation():
        logging.info('Servo reset is not applicable to servo_v3.')
        return

    devnum_before = self._get_servo_usb_devnum()
    logging.info('Servo usb devnum before reset: %s', devnum_before)
    if not self._reset_servo():
        message = ('Failed to reset servo with serial: %s. (Please ignore'
                   ' this error if the DUT is not connected to a smart'
                   ' usbhub).' % self.servo_serial)
        logging.warning(message)
        self.record('INFO', None, None, message)
        return

    devnum_after = self._get_servo_usb_devnum()
    logging.info('Servo usb devnum after reset: %s', devnum_after)
    if devnum_before and devnum_after:
        if devnum_before != devnum_after:
            message = ('Reset servo with serial %s completed successfully!'
                       % self.servo_serial)
        else:
            message = ('Servo reset completed but devnum is still not '
                       'changed!')
    else:
        # At least one devnum could not be collected.
        message = ('Servo reset completed but unable to verify'
                   ' devnum change!')
    logging.info(message)
    self.record('INFO', None, None, message)
849
Ruben Rodriguez Buchillon93084d02020-01-21 15:17:36 -0800850 def _extract_compressed_logs(self, logdir, relevant_files):
851 """Decompress servod logs in |logdir|.
852
853 @param logdir: directory containing compressed servod logs.
854 @param relevant_files: list of files in |logdir| to consider.
855
856 @returns: tuple, (tarfiles, files) where
857 tarfiles: list of the compressed filenames that have been
858 extracted and deleted
859 files: list of the uncompressed files that were generated
860 """
861 # For all tar-files, first extract them to the directory, and
862 # then let the common flow handle them.
863 tarfiles = [cf for cf in relevant_files if
864 cf.endswith(self.COMPRESSION_SUFFIX)]
865 files = []
866 for f in tarfiles:
867 norm_name = os.path.basename(f)[:-len(self.COMPRESSION_SUFFIX)]
868 with tarfile.open(f) as tf:
869 # Each tarfile has only one member, as
870 # that's the compressed log.
871 member = tf.members[0]
872 # Manipulate so that it only extracts the basename, and not
873 # the directories etc.
874 member.name = norm_name
875 files.append(os.path.join(logdir, member.name))
876 tf.extract(member, logdir)
877 # File has been extracted: remove the compressed file.
878 os.remove(f)
879 return tarfiles, files
880
881 def _extract_mcu_logs(self, log_subdir):
882 """Extract MCU (EC, Cr50, etc) console output from servod debug logs.
883
884 Using the MCU_EXTRACTOR regex (above) extract and split out MCU console
885 lines from the logs to generate invidiual console logs e.g. after
886 this method, you can find an ec.txt and servo_v4.txt in |log_dir| if
887 those MCUs had any console input/output.
888
889 @param log_subdir: directory with log.DEBUG.txt main servod debug logs.
890 """
891 # Extract the MCU for each one. The MCU logs are only in the .DEBUG
892 # files
893 mcu_lines_file = os.path.join(log_subdir, 'log.DEBUG.txt')
894 if not os.path.exists(mcu_lines_file):
895 logging.info('No DEBUG logs found to extract MCU logs from.')
896 return
897 mcu_files = {}
898 mcu_file_template = '%s.txt'
899 with open(mcu_lines_file, 'r') as f:
900 for line in f:
901 match = self.MCU_EXTRACTOR.match(line)
902 if match:
903 mcu = match.group(self.MCU_GROUP).lower()
904 line = match.group(self.LINE_GROUP)
905 if mcu not in mcu_files:
906 mcu_file = os.path.join(log_subdir,
907 mcu_file_template % mcu)
908 mcu_files[mcu] = open(mcu_file, 'a')
909 fd = mcu_files[mcu]
910 fd.write(line + '\n')
911 for f in mcu_files:
912 mcu_files[f].close()
913
def remove_latest_log_symlinks(self):
    """Remove the convenience 'latest*' symlinks from the servod log dir.

    The `rm` is best effort: its status is ignored and stderr is not teed.
    """
    rm_cmd = 'rm ' + ('%s/latest*' % self.remote_log_dir)
    self.run(rm_cmd, stderr_tee=None, ignore_status=True)
919
def probe_servod_restart(self, instance_ts, outdir):
    """Grab servod logs from previous instances if part of this session.

    If servod restarted since the timestamp cached in
    |_initial_instance_ts|, the logs of every instance between that
    timestamp and |instance_ts| are collected through get_instance_logs()
    with old=True, so they are stored with the |OLD_LOG_SUFFIX|.

    Afterwards, when a servo object is available, a panicinfo command is
    issued to the servo_micro and servo_v4 uart controls that exist, to
    try and collect reboot information for debugging.

    @param instance_ts: the log timestamp that the current instance uses
    @param outdir: directory to create a subdirectory into to place the
                   servod logs into.
    """
    first_ts = self._initial_instance_ts
    if first_ts is None:
        logging.info('No log timestamp grabbed successfully on servod '
                     'startup. Cannot check device restarts. Ignoring.')
        return
    if instance_ts == first_ts:
        logging.debug('Servod appears to have run without restarting')
        return
    # Servod seems to have restarted (at least once). |first_ts| is the
    # first timestamp, and instance_ts is the current timestamp. Find
    # all timestamps in between them, and grab the logs for each.
    tss = self._find_instance_timestamps_between(first_ts, instance_ts)
    logging.info('Servod has restarted %d times between the start and the '
                 'end of this servo_host.', len(tss))
    logging.info('This might be an issue. Will extract all logs from each '
                 'instance.')
    logging.info('Logs that are not the currently running (about to turn '
                 'down) instance are maked with a .%s in their folder.',
                 self.OLD_LOG_SUFFIX)
    for ts in tss:
        self.get_instance_logs(ts, outdir, old=True)
    # Lastly, servod has restarted due to a potential issue. Try to get
    # panic information from servo micro and servo v4 for the current logs.
    # This can only happen if the |_servo| attribute is initialized.
    if not self._servo:
        return
    for mcu in ('servo_micro', 'servo_v4'):
        ctrl = '%s_uart_cmd' % mcu
        if not self._servo.has_control(ctrl):
            continue
        logging.info('Trying to retrieve %r panicinfo into logs', mcu)
        try:
            self._servo.set_nocheck(ctrl, 'panicinfo')
        except error.TestFail as e:
            logging.error('Failed to generate panicinfo for %r '
                          'logs. %s', mcu, str(e))
969
970 def _find_instance_timestamps_between(self, start_ts, end_ts):
971 """Find all log timestamps between [start_ts, end_ts).
972
973 @param start_ts: str, earliest log timestamp of interest
974 @param end_ts: str, latest log timestamp of interest
975
976 @returns: list, all timestamps between start_ts and end_ts, end_ts
977 exclusive, on the servo_host. An empty list on errors
978 """
979 # Simply get all timestamp, and then sort and remove
980 cmd = 'ls %s' % self.remote_log_dir
981 res = self.run(cmd, stderr_tee=None, ignore_status=True)
982 if res.exit_status != 0:
983 # Here we failed to find anything.
984 logging.info('Failed to find remote servod logs. Ignoring.')
985 return []
986 logfiles = res.stdout.strip().split()
987 timestamps = set()
988 for logfile in logfiles:
989 ts_match = self.TS_EXTRACTOR.match(logfile)
990 if not ts_match:
991 # Simply ignore files that fail the check. It might be the
992 # 'latest' symlinks or random files.
993 continue
994 timestamps.add(ts_match.group(self.TS_GROUP))
995 # At this point we have all unique timestamps.
996 timestamps = sorted(timestamps)
997 for ts in [start_ts, end_ts]:
998 if ts not in timestamps:
999 logging.error('Timestamp %r not in servod logs. Cannot query '
1000 'for timestamps in between %r and %r', ts,
1001 start_ts, end_ts)
1002 return []
1003 return timestamps[timestamps.index(start_ts):timestamps.index(end_ts)]
1004
def get_instance_logs_ts(self):
    """Retrieve the currently running servod instance's log timestamp.

    Resolves the 'latest.DEBUG' (or, failing that, 'latest') symlink in
    the remote log directory and extracts the timestamp from the name of
    the file it points at using TS_EXTRACTOR.

    @returns: str, timestamp for current instance, or None on failure
    """
    # First, extract the timestamp. This cmd gives the real filename of
    # the latest aka current log file.
    cmd_template = ('if [ -f %(dir)s/latest.DEBUG ];'
                    'then realpath %(dir)s/latest.DEBUG;'
                    'elif [ -f %(dir)s/latest ];'
                    'then realpath %(dir)s/latest;'
                    'else exit %(code)d;'
                    'fi')
    cmd = cmd_template % {'dir': self.remote_log_dir,
                          'code': self.NO_SYMLINKS_CODE}
    res = self.run(cmd, stderr_tee=None, ignore_status=True)
    if res.exit_status != 0:
        if res.exit_status != self.NO_SYMLINKS_CODE:
            logging.warning('Failed to find servod logs on servo host.')
            logging.warning(res.stderr.strip())
        else:
            logging.warning('servod log latest symlinks not found. '
                            'This is likely due to an error starting up '
                            'servod. Ignoring..')
        return None
    fname = os.path.basename(res.stdout.strip())
    # From the fname, ought to extract the timestamp using the TS_EXTRACTOR
    ts_match = self.TS_EXTRACTOR.match(fname)
    if ts_match:
        return ts_match.group(self.TS_GROUP)
    logging.warning('Failed to extract timestamp from servod log file '
                    '%r. Skipping. The servo host is using outdated '
                    'servod logging and needs to be updated.', fname)
    return None
1038
def get_instance_logs(self, instance_ts, outdir, old=False):
    """Collect all logs with |instance_ts| and dump into a dir in |outdir|

    This method first collects all logs on the servo_host side pertaining
    to this servod instance (port, instantiation). It glues them together
    into combined log.[level].txt files and extracts all available MCU
    console I/O from the logs into individual files e.g. servo_v4.txt

    All the output can be found in a directory inside |outdir| that
    this generates based on |LOG_DIR|, the servod port, and the instance
    timestamp on the servo_host side. If no log could be retrieved the
    directory is removed again.

    @param instance_ts: log timestamp to grab logfiles for
    @param outdir: directory to create a subdirectory into to place the
                   servod logs into.
    @param old: bool, whether to append |OLD_LOG_SUFFIX| to output dir
    """
    # Create the local results log dir.
    log_dir = os.path.join(outdir, '%s_%s.%s' % (self.LOG_DIR,
                                                 str(self.servo_port),
                                                 instance_ts))
    if old:
        log_dir = '%s.%s' % (log_dir, self.OLD_LOG_SUFFIX)
    logging.info('Saving servod logs to %r.', log_dir)
    os.mkdir(log_dir)
    # Now, get all files with that timestamp.
    cmd = 'find %s -maxdepth 1 -name "log.%s*"' % (self.remote_log_dir,
                                                   instance_ts)
    res = self.run(cmd, stderr_tee=None, ignore_status=True)
    files = res.stdout.strip().split()
    try:
        self.get_file(files, log_dir, try_rsync=False)
        if not os.listdir(log_dir):
            logging.info('No servod logs retrieved. Ignoring, and removing '
                         '%r again.', log_dir)
            os.rmdir(log_dir)
            return
    except error.AutoservRunError as e:
        result = e.result_obj
        if result.exit_status != 0:
            stderr = result.stderr.strip()
            logging.warning("Couldn't retrieve servod logs. Ignoring: %s",
                            stderr or '\n%s' % result)
        # Remove the log_dir as nothing was added to it.
        os.rmdir(log_dir)
        return
    local_files = [os.path.join(log_dir, f) for f in os.listdir(log_dir)]
    # TODO(crrev.com/c/1793030): remove no-level case once CL is pushed
    for level_name in ('DEBUG', 'INFO', 'WARNING', ''):
        # Create the joint files for each loglevel. i.e log.DEBUG
        joint_file = self.JOINT_LOG_PREFIX
        if level_name:
            joint_file = '%s.%s' % (self.JOINT_LOG_PREFIX, level_name)
        # This helps with some online tools to avoid complaints about an
        # unknown filetype.
        joint_file = joint_file + '.txt'
        joint_path = os.path.join(log_dir, joint_file)
        # Match the level against the file name only: the directory part
        # of the path is caller controlled and may itself contain a level
        # name, which would put files into the wrong bucket.
        files = [f for f in local_files
                 if level_name in os.path.basename(f)]
        if not files:
            # TODO(crrev.com/c/1793030): remove no-level case once CL
            # is pushed
            continue
        # Extract compressed logs if any.
        compressed, extracted = self._extract_compressed_logs(log_dir,
                                                              files)
        files = list(set(files) - set(compressed))
        files.extend(extracted)
        # Need to sort. As they all share the same timestamp, and
        # loglevel, the index itself is sufficient. The highest index
        # is the oldest file, therefore we need a descending sort.
        def sortkey(f, level=level_name):
            """Custom sortkey to sort based on rotation number int."""
            # The un-rotated (newest) file ends with the level itself.
            if f.endswith(level):
                return 0
            return int(f.split('.')[-1])

        files.sort(reverse=True, key=sortkey)
        # Just rename the first file rather than building from scratch.
        os.rename(files[0], joint_path)
        with open(joint_path, 'a') as joint_f:
            for logfile in files[1:]:
                # Transfer the file to the joint file line by line.
                with open(logfile, 'r') as log_f:
                    for line in log_f:
                        joint_f.write(line)
                # File has been written over. Delete safely.
                os.remove(logfile)
        # Need to remove all files form |local_files| so we don't
        # analyze them again.
        local_files = list(set(local_files) - set(files) - set(compressed))
    # Lastly, extract MCU logs from the joint logs.
    self._extract_mcu_logs(log_dir)
1130
Garry Wang79e9af62019-06-12 15:19:19 -07001131 def _lock(self):
1132 """lock servohost by touching a file.
1133 """
1134 logging.debug('Locking servohost %s by touching %s file',
1135 self.hostname, self._lock_file)
1136 self.run('touch %s' % self._lock_file, ignore_status=True)
Garry Wang7c00b0f2019-06-25 17:28:17 -07001137 self._is_locked = True
Garry Wang79e9af62019-06-12 15:19:19 -07001138
Garry Wang79e9af62019-06-12 15:19:19 -07001139 def _unlock(self):
1140 """Unlock servohost by removing the lock file.
1141 """
1142 logging.debug('Unlocking servohost by removing %s file',
1143 self._lock_file)
1144 self.run('rm %s' % self._lock_file, ignore_status=True)
Garry Wang7c00b0f2019-06-25 17:28:17 -07001145 self._is_locked = False
Garry Wang79e9af62019-06-12 15:19:19 -07001146
def close(self):
    """Close the associated servo and the host object.

    In order: collects logs of earlier servod instances (if servod
    restarted), closes the servo object, collects the logs of the current
    instance, removes the servohost lock, stops servod and finally closes
    the parent host object. Calling it again once closed is a no-op.
    """
    # NOTE: throughout this method there are multiple attempts to catch
    # all errors. This is WAI as log grabbing should not fail tests.
    # However, the goal is to catch and handle/process all errors, thus
    # we print the traceback and ask for a bug.
    if self._closed:
        logging.debug('ServoHost is already closed.')
        return

    # Only attempt ssh related actions if servohost is sshable. We call
    # check_cached_up_status() first because it's lightweighted and return
    # much faster in the case servohost is down, however, we still want
    # to call is_up() later since check_cached_up_status() is ping based
    # check and not guarantee the servohost is sshable.
    servo_host_ready = self.check_cached_up_status() and self.is_up()

    instance_ts = None
    if servo_host_ready:
        instance_ts = self.get_instance_logs_ts()
    else:
        logging.info('Servohost is down, will skip servod log collecting.')
    # TODO(crbug.com/1011516): once enabled, remove the check against
    # localhost and instead check against log-rotiation enablement.
    logs_available = (instance_ts is not None and
                      self.job and
                      not self.is_localhost())
    if logs_available:
        # Probe whether there was a servod restart, and grab those old
        # logs as well.
        try:
            self.probe_servod_restart(instance_ts, self.job.resultdir)
        except (error.AutoservRunError, error.TestFail) as e:
            logging.info('Failed to grab servo logs due to: %s. '
                         'This error is forgiven.', str(e))
        except Exception as e:
            logging.error('Unexpected error probing for old logs. %s. '
                          'Forgiven. Please file a bug and fix or catch '
                          'in log probing function', str(e),
                          exc_info=True)
    if self._servo:
        # In some cases when we run as lab-tools, the job object is None.
        servo_outdir = self.job.resultdir if self.job else None
        self._servo.close(servo_outdir)

    if logs_available:
        # Grab current (not old like above) logs after the servo instance
        # was closed out.
        try:
            self.get_instance_logs(instance_ts, self.job.resultdir)
        except error.AutoservRunError as e:
            logging.info('Failed to grab servo logs due to: %s. '
                         'This error is forgiven.', str(e))
        except Exception as e:
            logging.error('Unexpected error grabbing servod logs. %s. '
                          'Forgiven. Please file a bug and fix or catch '
                          'in log grabbing function', str(e), exc_info=True)

    if self._is_locked and servo_host_ready:
        # Remove the lock if the servohost has been locked.
        try:
            self._unlock()
        except error.AutoservSSHTimeout:
            logging.error('Unlock servohost failed due to ssh timeout.'
                          ' It may caused by servohost went down during'
                          ' the task.')
    # We want always stop servod after task to minimum the impact of bad
    # servod process interfere other servods.(see crbug.com/1028665)
    if servo_host_ready:
        try:
            self.stop_servod()
        except error.AutoservRunError as e:
            logging.info(
                    "Failed to stop servod due to:\n%s\n"
                    "This error is forgiven.", str(e))

    super(ServoHost, self).close()
    # Mark closed.
    self._closed = True
Congbin Guoa1f9cba2018-07-03 11:36:59 -07001226
def get_servo_state(self):
    """Return the servo state currently stored in self._servo_state."""
    current_state = self._servo_state
    return current_state
Otabek Kasimovcc9738e2020-02-14 16:17:15 -08001229
Otabek Kasimovc6f30412020-06-30 20:08:12 -07001230 def _get_host_metrics_data(self):
1231 return {'port': self.servo_port,
Otabek Kasimov0ea47362020-07-11 20:55:09 -07001232 'host': self.get_dut_hostname() or self.hostname,
Otabek Kasimovc6f30412020-06-30 20:08:12 -07001233 'board': self.servo_board or ''}
1234
1235 def _is_servo_device_connected(self, servo_type, serial):
1236 """Check if device is connected to the labstation.
1237
1238 Works for all servo devices connected to the labstation.
1239 For servo_v3 please use 'self._is_servo_board_present_on_servo_v3'
1240
1241 @param servo_type: The type of servo device. Expecting value can be
1242 servo_v4 or servo_micro.
1243 @param serial: The serial number of the device to detect it.
1244 """
1245 vid_pid = self.SERVO_VID_PID.get(servo_type)
1246 if not vid_pid or not serial:
1247 # device cannot detected without VID/PID or serial number
1248 return False
1249 logging.debug('Started to detect %s', servo_type)
1250 try:
1251 cmd = 'lsusb -v -d %s |grep iSerial |grep %s' % (vid_pid, serial)
1252 result = self.run(cmd, ignore_status=True, timeout=30)
1253 if result.exit_status == 0 and result.stdout.strip():
1254 logging.debug('The %s is plugged in to the host.', servo_type)
1255 return True
1256 logging.debug('%s device is not detected; %s', servo_type, result)
1257 return False
1258 except Exception as e:
1259 # can be triggered by timeout issue due running the script
1260 metrics.Counter(
1261 'chromeos/autotest/repair/servo_detection/timeout'
1262 ).increment(fields=self._get_host_metrics_data())
1263 logging.error('%s device is not detected; %s', servo_type, str(e))
1264 return None
1265
1266 def _is_servo_board_present_on_servo_v3(self):
1267 """Check if servo board is detected on servo_v3"""
1268 vid_pids = self.SERVO_VID_PID['servo_v3']
1269 if not vid_pids or len(vid_pids) == 0:
1270 # device cannot detected without VID/PID
1271 return False
1272 logging.debug('Started to detect servo board on servo_v3')
1273 not_detected = 'The servo board is not detected on servo_v3'
1274 try:
1275 cmd = 'lsusb | grep "%s"' % "\|".join(vid_pids)
1276 result = self.run(cmd, ignore_status=True, timeout=30)
1277 if result.exit_status == 0 and result.stdout.strip():
1278 logging.debug('The servo board is detected on servo_v3')
1279 return True
1280 logging.debug('%s; %s', not_detected, result)
1281 return False
1282 except Exception as e:
1283 # can be triggered by timeout issue due running the script
1284 metrics.Counter(
1285 'chromeos/autotest/repair/servo_detection/timeout'
1286 ).increment(fields=self._get_host_metrics_data())
1287 logging.error('%s; %s', not_detected, str(e))
1288 return None
1289
Otabek Kasimov120b6fa2020-07-03 00:15:27 -07001290 def _is_main_device_not_detected_on_servo_v4(self):
1291 """Check if servod cannot find main device on servo.
1292
1293 The check based on reading servod logs for servo_v4.
1294 """
1295 if not self._initial_instance_ts:
1296 # latest log not found
1297 return False
1298 logging.debug('latest log for servod created at %s',
1299 self._initial_instance_ts)
1300 try:
1301 log_created = calendar.timegm(time.strptime(
1302 self._initial_instance_ts,
1303 "%Y-%m-%d--%H-%M-%S.%f"))
1304 except ValueError as e:
1305 logging.debug('Cannot read time from log file name: %s',
1306 self._initial_instance_ts)
1307 return False
1308 min_time_created = calendar.timegm(time.gmtime())
1309 if min_time_created > log_created + 3600:
1310 # the log file is old we cannot use it
1311 logging.debug('log file was created more than hour ago, too old')
1312 return False
1313 logging.debug('latest log was created not longer then 1 hour ago')
1314
1315 # check if servod can detect main device by servo_v4
1316 message = 'ERROR - No servo micro or CCD detected for board'
1317 cmd = ('cat /var/log/servod_%s/log.%s.INFO |grep "%s"'
1318 % (self.servo_port, self._initial_instance_ts, message))
1319 result = self.run(cmd, ignore_status=True)
1320 if result.stdout.strip():
1321 logging.info('Servod cannot detect main device on the servo; '
1322 'Can be caused by bad hardware of servo or '
1323 'issue on the DUT side.')
1324 return True
1325 logging.debug('The main device is detected')
1326 return False
1327
def _require_cr50_servod_config(self):
    """Check whether we need start servod with CONFIG=cr50.xml

    @returns: True if any pool listed in the DUT host info starts with
              servo_constants.CR50_CONFIG_POOL_PREFIX; False otherwise,
              including when no DUT host info is available.
    """
    dut_host_info = self.get_dut_host_info()
    if not dut_host_info:
        return False
    prefix = servo_constants.CR50_CONFIG_POOL_PREFIX
    return any(pool.startswith(prefix) for pool in dut_host_info.pools)
1337
def get_verifier_state(self, tag):
    """Return the state of servo verifier.

    @param tag: tag of the verifier to look up in the repair strategy.

    @returns: bool or None
    """
    return self._repair_strategy.verifier_is_good(tag)
1344
def determine_servo_state(self):
    """Determine servo state based on the failed verifier.

    The checks run in a fixed order and the first one that matches
    decides the state, so the order of the `if` blocks below matters.

    @returns: servo state value
    The state detecting based on first fail verifier or collecting of
    them.
    """
    ssh = self.get_verifier_state('servo_ssh')
    # NOTE(review): 'disk_space' is fetched but not consulted by any
    # branch below; kept so the set of verifier lookups is unchanged.
    disk_space = self.get_verifier_state('disk_space')
    start_servod = self.get_verifier_state('servod_job')
    create_servo = self.get_verifier_state('servod_connection')
    init_servo = self.get_verifier_state('servod_control')
    servo_topology = self.get_verifier_state('servo_topology')
    dut_connected = self.get_verifier_state('dut_connected')
    pwr_button = self.get_verifier_state('pwr_button')
    lid_open = self.get_verifier_state('lid_open')
    ec_board = self.get_verifier_state('ec_board')
    cr50_console = self.get_verifier_state('cr50_console')
    ccd_testlab = self.get_verifier_state('ccd_testlab')

    if not ssh:
        return servo_constants.SERVO_STATE_NO_SSH

    if (start_servod == hosts.VERIFY_FAILED
                or create_servo == hosts.VERIFY_FAILED):
        # Sometimes servod can start without a servo being present.
        # The detection helpers return None when the probe itself
        # failed; only an explicit False means "not connected".
        if self.is_labstation():
            if not self.servo_serial:
                return servo_constants.SERVO_STATE_WRONG_CONFIG
            if self._is_servo_device_connected(
                    'servo_v4', self.servo_serial) is False:
                return servo_constants.SERVO_STATE_NOT_CONNECTED
        elif self._is_servo_board_present_on_servo_v3() is False:
            return servo_constants.SERVO_STATE_NOT_CONNECTED

    if servo_topology == hosts.VERIFY_FAILED:
        return servo_constants.SERVO_STATE_TOPOLOGY_ISSUE

    if dut_connected == hosts.VERIFY_FAILED:
        if pwr_button == hosts.VERIFY_SUCCESS:
            # Unexpected case; count it but report the same state.
            metrics.Counter(
                    'chromeos/autotest/repair/servo_unexpected/pwr_button'
            ).increment(fields=self._get_host_metrics_data())
        return servo_constants.SERVO_STATE_DUT_NOT_CONNECTED

    if start_servod == hosts.VERIFY_FAILED:
        return servo_constants.SERVO_STATE_SERVOD_ISSUE

    if create_servo == hosts.VERIFY_FAILED:
        if (self.is_labstation()
                    and self._is_main_device_not_detected_on_servo_v4()):
            servo_type = None
            if self.get_dut_host_info():
                servo_type = self.get_dut_host_info().get_label_value(
                        servo_constants.SERVO_TYPE_LABEL_PREFIX)
            if servo_type and 'servo_micro' in servo_type:
                serial = self.get_servo_micro_serial_number()
                logging.debug('servo_micro serial: %s', serial)
                # The servo_micro is visible on USB but servod cannot
                # reach the DUT through it, so blame the ribbon cable.
                if self._is_servo_device_connected('servo_micro',
                                                   serial):
                    return servo_constants.SERVO_STATE_BAD_RIBBON_CABLE
            # Device can be not detected because of DUT
            # TODO (otabek) update after b/159755652 and b/159754985
            metrics.Counter(
                    'chromeos/autotest/repair/servo_state/needs_replacement'
            ).increment(fields=self._get_host_metrics_data())
        elif not self.is_labstation():
            # Here need logic to check if flex cable is connected
            pass

    # One of the reasons why the servo cannot be initialized.
    if cr50_console == hosts.VERIFY_FAILED:
        return servo_constants.SERVO_STATE_CR50_CONSOLE_MISSING
    if ccd_testlab == hosts.VERIFY_FAILED:
        return servo_constants.SERVO_STATE_CCD_TESTLAB_ISSUE

    if (create_servo == hosts.VERIFY_FAILED
                or init_servo == hosts.VERIFY_FAILED):
        return servo_constants.SERVO_STATE_SERVOD_ISSUE

    if ec_board == hosts.VERIFY_FAILED:
        return servo_constants.SERVO_STATE_EC_BROKEN
    if pwr_button == hosts.VERIFY_FAILED:
        return servo_constants.SERVO_STATE_BAD_RIBBON_CABLE
    if lid_open == hosts.VERIFY_FAILED:
        return servo_constants.SERVO_STATE_LID_OPEN_FAILED

    metrics.Counter(
            'chromeos/autotest/repair/unknown_servo_state'
    ).increment(fields=self._get_host_metrics_data())
    logging.info('We do not have special state for this failure yet :)')
    return servo_constants.SERVO_STATE_BROKEN
1439
def is_servo_topology_supported(self):
    """Check if servo_topology is supported.

    @returns: True only when this host is a labstation and a servo
              serial is set; False otherwise.
    """
    if not self.is_labstation():
        logging.info('Servo-topology supported only for labstation.')
        return False
    if not self.servo_serial:
        logging.info('Servo-topology required a servo serial.')
        return False
    return True
1449
def get_topology(self):
    """Get servo topology.

    @returns: the value stored in `self._topology`.
    """
    return self._topology
1453
def is_dual_setup(self):
    """Check if servo will run in dual setup.

    Dual setup is used only for servo_v4 when ccd_cr50 and servo_micro
    are used at the same time.

    @returns: True if `self.servo_setup` equals
              servo_constants.SERVO_SETUP_VALUE_DUAL_V4.
    """
    return self.servo_setup == servo_constants.SERVO_SETUP_VALUE_DUAL_V4
1461
Otabek Kasimovcc9738e2020-02-14 16:17:15 -08001462
def make_servo_hostname(dut_hostname):
    """Given a DUT's hostname, return the hostname of its servo.

    The '-servo' suffix is appended to the first dot-separated label
    only; any domain part is kept unchanged.

    @param dut_hostname: hostname of a DUT.

    @return hostname of the DUT's servo.

    """
    # partition() leaves `dot` and `domain` empty when there is no '.',
    # so a bare hostname simply gets the suffix appended.
    label, dot, domain = dut_hostname.partition('.')
    return label + '-servo' + dot + domain
1474
1475
def servo_host_is_up(servo_hostname):
    """Given a servo host name, return if it's up or not.

    @param servo_hostname: hostname of the servo host.

    @return True if it's up, False otherwise
    """
    # Technically, this duplicates the SSH ping done early in the servo
    # proxy initialization code.  However, this ping ends in a couple
    # seconds when it fails, rather than the 60 seconds it takes to decide
    # that an SSH ping has timed out.  Specifically, that timeout happens
    # when our servo DNS name resolves, but there is no host at that IP.
    logging.info('Pinging servo host at %s', servo_hostname)
    ping_config = ping_runner.PingConfig(
            servo_hostname, count=3,
            ignore_result=True, ignore_status=True)
    # A single reply out of the three pings is enough to call it "up".
    return ping_runner.PingRunner().ping(ping_config).received > 0
1493
1494
Richard Barnettee519dcd2016-08-15 17:37:17 -07001495def _map_afe_board_to_servo_board(afe_board):
1496 """Map a board we get from the AFE to a servo appropriate value.
1497
1498 Many boards are identical to other boards for servo's purposes.
1499 This function makes that mapping.
1500
1501 @param afe_board string board name received from AFE.
1502 @return board we expect servo to have.
1503
1504 """
1505 KNOWN_SUFFIXES = ['-freon', '_freon', '_moblab', '-cheets']
1506 BOARD_MAP = {'gizmo': 'panther'}
1507 mapped_board = afe_board
1508 if afe_board in BOARD_MAP:
1509 mapped_board = BOARD_MAP[afe_board]
1510 else:
1511 for suffix in KNOWN_SUFFIXES:
1512 if afe_board.endswith(suffix):
1513 mapped_board = afe_board[0:-len(suffix)]
1514 break
1515 if mapped_board != afe_board:
1516 logging.info('Mapping AFE board=%s to %s', afe_board, mapped_board)
1517 return mapped_board
1518
1519
def get_servo_args_for_host(dut_host):
    """Return servo data associated with a given DUT.

    @param dut_host   Instance of `Host` on which to find the servo
                      attributes.
    @return `servo_args` dict with host and an optional port, or `None`
            when the DUT has no servo host attribute or its servo port
            attribute is not an integer.
    """
    info = dut_host.host_info_store.get()
    servo_args = {k: v for k, v in six.iteritems(info.attributes)
                  if k in servo_constants.SERVO_ATTR_KEYS}

    if servo_constants.SERVO_PORT_ATTR in servo_args:
        try:
            servo_args[servo_constants.SERVO_PORT_ATTR] = int(
                    servo_args[servo_constants.SERVO_PORT_ATTR])
        except ValueError:
            logging.error('servo port is not an int: %s',
                          servo_args[servo_constants.SERVO_PORT_ATTR])
            # Reset servo_args because we don't want to use an invalid
            # port: dropping the host attribute makes the final check
            # below return None.
            servo_args.pop(servo_constants.SERVO_HOST_ATTR, None)

    if info.board:
        servo_board = _map_afe_board_to_servo_board(info.board)
        servo_args[servo_constants.SERVO_BOARD_ATTR] = servo_board
    if info.model:
        servo_args[servo_constants.SERVO_MODEL_ATTR] = info.model
    return servo_args if servo_constants.SERVO_HOST_ATTR in servo_args else None
Richard Barnetteea3e4602016-06-10 12:36:41 -07001547
1548
def _tweak_args_for_ssp_moblab(servo_args):
    """Replace a loopback servo host with the configured container IP.

    When the servo host attribute is 'localhost' or '127.0.0.1' it is
    overwritten in place with the 'host_container_ip' value from the
    'SSP' config section (`None` if that value is not configured).

    @param servo_args: dict of servo arguments; modified in place. It
                       must contain the servo host attribute.
    """
    if (servo_args[servo_constants.SERVO_HOST_ATTR]
                in ['localhost', '127.0.0.1']):
        servo_args[servo_constants.SERVO_HOST_ATTR] = _CONFIG.get_config_value(
                'SSP', 'host_container_ip', type=str, default=None)
1554
1555
def create_servo_host(dut, servo_args, try_lab_servo=False,
                      try_servo_repair=False, dut_host_info=None):
    """Create a ServoHost object for a given DUT, if appropriate.

    This function attempts to create and verify or repair a `ServoHost`
    object for a servo connected to the given `dut`, subject to various
    constraints imposed by the parameters:
      * When the `servo_args` parameter is not `None`, a servo
        host must be created, and must be checked with `repair()`.
      * Otherwise, if a servo exists in the lab and `try_lab_servo` is
        true:
          * If `try_servo_repair` is true, then create a servo host and
            check it with `repair()`.
          * Otherwise, if the servo responds to `ping` then create a
            servo host and check it with `verify()`.

    In cases where `servo_args` was not `None`, repair failure
    exceptions are passed back to the caller; otherwise, exceptions
    are logged and then discarded.  Note that this only happens in cases
    where we're called from a test (not special task) control file that
    has an explicit dependency on servo.  In that case, we require that
    repair not write to `status.log`, so as to avoid polluting test
    results.

    TODO(jrbarnette):  The special handling for servo in test control
    files is a thorn in my flesh; I dearly hope to see it cut out before
    my retirement.

    Parameters for a servo host consist of a host name, port number, and
    DUT board, and are determined from one of these sources, in order of
    priority:
      * Servo attributes from the `dut` parameter take precedence over
        all other sources of information.
      * If a DNS entry for the servo based on the DUT hostname exists in
        the CrOS lab network, that hostname is used with the default
        port and the DUT's board.
      * If no other options are found, the parameters will be taken
        from the `servo_args` dict passed in from the caller.

    @param dut              An instance of `Host` from which to take
                            servo parameters (if available).
    @param servo_args       A dictionary with servo parameters to use if
                            they can't be found from `dut`.  If this
                            argument is supplied, unrepaired exceptions
                            from `verify()` will be passed back to the
                            caller.
    @param try_lab_servo    If not true, servo host creation will be
                            skipped unless otherwise required by the
                            caller.
    @param try_servo_repair If true, check a servo host with
                            `repair()` instead of `verify()`.
    @param dut_host_info:   A HostInfo object of the DUT that connected
                            to this servo.

    @returns: A tuple `(servo_host, servo_state)`.  `servo_host` is a
              ServoHost object, or None when no host was created; see
              comments above.  `servo_state` is a servo state value; it
              is None only when no servo was requested and no servo
              arguments were found.

    """
    servo_dependency = servo_args is not None
    if dut is not None and (try_lab_servo or servo_dependency):
        servo_args_override = get_servo_args_for_host(dut)
        if servo_args_override is not None:
            if utils.in_moblab_ssp():
                _tweak_args_for_ssp_moblab(servo_args_override)
            logging.debug(
                    'Overriding provided servo_args (%s) with arguments'
                    ' determined from the host (%s)',
                    servo_args,
                    servo_args_override,
            )
            servo_args = servo_args_override

    if servo_args is None:
        logging.debug('No servo_args provided, and failed to find overrides.')
        if try_lab_servo or servo_dependency:
            return None, servo_constants.SERVO_STATE_MISSING_CONFIG
        # For regular test case which not required the servo
        return None, None

    servo_hostname = servo_args.get(servo_constants.SERVO_HOST_ATTR)
    servo_port = servo_args.get(servo_constants.SERVO_PORT_ATTR)
    if not _is_servo_host_information_exist(servo_hostname, servo_port):
        logging.debug(
                'Servo connection info missed hostname: %s , port: %s',
                servo_hostname, servo_port)
        return None, servo_constants.SERVO_STATE_MISSING_CONFIG
    if not is_servo_host_information_valid(servo_hostname, servo_port):
        logging.debug(
                'Servo connection info is incorrect hostname: %s , port: %s',
                servo_hostname, servo_port)
        return None, servo_constants.SERVO_STATE_WRONG_CONFIG
    # The cheap ping check is used only on the plain verify path; when
    # the servo is required or repair was requested we always go on.
    if (not servo_dependency and not try_servo_repair and
                not servo_host_is_up(servo_hostname)):
        logging.debug('ServoHost is not up.')
        return None, servo_constants.SERVO_STATE_NO_SSH

    newhost = ServoHost(**servo_args)

    # Reset or reboot servo device only during AdminRepair tasks.
    if try_servo_repair:
        if newhost._is_locked:
            # Reset servo if the servo is locked, as we check if the servohost
            # is up, if the servohost is labstation and if the servohost is in
            # lab inside the locking logic.
            newhost.reset_servo()
        else:
            try:
                newhost.reboot_servo_v3_on_need()
            except Exception as e:
                logging.info('[Non-critical] Unexpected error while trying to'
                             ' reboot servo_v3, skipping the reboot; %s', e)

    if dut:
        newhost.set_dut_hostname(dut.hostname)
    if dut_host_info:
        newhost.set_dut_host_info(dut_host_info)

    if try_lab_servo or try_servo_repair:
        # Firmware update is best effort; a failure is logged and the
        # flow continues.
        try:
            logging.info("Check and update servo firmware.")
            servo_updater.update_servo_firmware(
                    newhost,
                    force_update=False)
        except Exception as e:
            logging.error("Servo device update error: %s", e)

    try:
        newhost.restart_servod(quick_startup=True)
    except error.AutoservSSHTimeout:
        logging.warning("Restart servod failed due ssh connection "
                        "to servohost timed out. This error is forgiven"
                        " here, we will retry in servo repair process.")
    except error.AutoservRunError as e:
        logging.warning("Restart servod failed due to:\n%s\n"
                        "This error is forgiven here, we will retry"
                        " in servo repair process.", str(e))

    # Note that the logic of repair() includes everything done
    # by verify().  It's sufficient to call one or the other;
    # we don't need both.
    if servo_dependency:
        # Exceptions from this repair propagate to the caller.
        newhost.repair(silent=True)
        return newhost, newhost.get_servo_state()

    if try_servo_repair:
        try:
            newhost.repair()
        except Exception:
            logging.exception('servo repair failed for %s', newhost.hostname)
    else:
        try:
            newhost.verify()
        except Exception:
            logging.exception('servo verify failed for %s', newhost.hostname)
    return newhost, newhost.get_servo_state()
Otabek Kasimov7267a7a2020-03-04 11:18:45 -08001711
1712
Otabek Kasimova7ba91a2020-03-09 08:31:01 -07001713def _is_servo_host_information_exist(hostname, port):
Otabek Kasimov7267a7a2020-03-04 11:18:45 -08001714 if hostname is None or len(hostname.strip()) == 0:
1715 return False
Otabek Kasimova7ba91a2020-03-09 08:31:01 -07001716 if port is None:
Otabek Kasimov7267a7a2020-03-04 11:18:45 -08001717 return False
Otabek Kasimova7ba91a2020-03-09 08:31:01 -07001718 if not type(port) is int:
1719 try:
1720 int(port)
1721 except ValueError:
1722 return False
1723
Otabek Kasimov7267a7a2020-03-04 11:18:45 -08001724 return True
1725
1726
def is_servo_host_information_valid(hostname, port):
    """Check if provided servo attributes are valid.

    @param hostname Hostname of the servohost.
    @param port     servo port number.

    @returns: A bool value to indicate if provided servo attribute valid.
    """
    if not _is_servo_host_information_exist(hostname, port):
        return False
    # Check that the port is inside the accepted range.
    port_int = int(port)
    if port_int < 1 or port_int > 65000:
        return False
    # We expect the host to contain only letters, digits, '-', '_' and
    # '.', and to be at least 5 characters long.
    if not re.match(r'[a-zA-Z0-9_.\-]*$', hostname) or len(hostname) < 5:
        return False
    return True