blob: a402115b59e35cfca69314792c40ebeb7ea09242 [file] [log] [blame]
Derek Beckettf73baca2020-08-19 15:08:47 -07001# Lint as: python2, python3
Fang Deng5d518f42013-08-02 14:04:32 -07002# Copyright (c) 2013 The Chromium OS Authors. All rights reserved.
3# Use of this source code is governed by a BSD-style license that can be
4# found in the LICENSE file.
5#
6# Expects to be run in an environment with sudo and no interactive password
7# prompt, such as within the Chromium OS development chroot.
8
9
10"""This file provides core logic for servo verify/repair process."""
11
12
Derek Beckettf73baca2020-08-19 15:08:47 -070013from __future__ import absolute_import
14from __future__ import division
15from __future__ import print_function
16
Fang Deng5d518f42013-08-02 14:04:32 -070017import logging
Raul E Rangel52ca2e82018-07-03 14:10:14 -060018import os
Ruben Rodriguez Buchillon93084d02020-01-21 15:17:36 -080019import re
20import tarfile
Andrew McRaef0679932020-08-13 09:15:23 +100021import threading
Garry Wang2b5eef92020-08-21 16:23:35 -070022import json
Garry Wangc1288cf2019-12-17 14:58:00 -080023import time
Derek Beckettf73baca2020-08-19 15:08:47 -070024import six
25import six.moves.xmlrpc_client
Otabek Kasimov120b6fa2020-07-03 00:15:27 -070026import calendar
Fang Deng5d518f42013-08-02 14:04:32 -070027
28from autotest_lib.client.bin import utils
Garry Wang79e9af62019-06-12 15:19:19 -070029from autotest_lib.client.common_lib import error
Richard Barnette9a26ad62016-06-10 12:03:08 -070030from autotest_lib.client.common_lib import hosts
Garry Wang7b0e1b72020-03-25 19:08:59 -070031from autotest_lib.client.common_lib import lsbrelease_utils
Fang Deng5d518f42013-08-02 14:04:32 -070032from autotest_lib.client.common_lib.cros import retry
Richard Barnette9a26ad62016-06-10 12:03:08 -070033from autotest_lib.server.cros.servo import servo
Richard Barnetted31580e2018-05-14 19:58:00 +000034from autotest_lib.server.hosts import servo_repair
Garry Wangebc015b2019-06-06 17:45:06 -070035from autotest_lib.server.hosts import base_servohost
Garry Wang11b5e872020-03-11 15:14:08 -070036from autotest_lib.server.hosts import servo_constants
Otabek Kasimov4ea636e2020-04-14 23:35:06 -070037from autotest_lib.server.cros.faft.utils import config
Garry Wang11b5e872020-03-11 15:14:08 -070038from autotest_lib.client.common_lib import global_config
Otabek Kasimov8475cce2020-07-14 12:11:31 -070039from autotest_lib.site_utils.admin_audit import servo_updater
Otabek Kasimov382c3bb2020-10-28 13:22:45 -070040from autotest_lib.server.cros.servo.topology import servo_topology
Garry Wangd7367482020-02-27 13:52:40 -080041
Otabek Kasimov15963492020-06-23 21:10:51 -070042try:
Mike Frysinger714c5b02020-09-04 23:22:54 -040043 from autotest_lib.utils.frozen_chromite.lib import metrics
Otabek Kasimov15963492020-06-23 21:10:51 -070044except ImportError:
45 metrics = utils.metrics_mock
46
Dan Shi3b2adf62015-09-02 17:46:54 -070047_CONFIG = global_config.global_config
Fang Deng5d518f42013-08-02 14:04:32 -070048
Otabek Kasimova7ba91a2020-03-09 08:31:01 -070049
class ServoHost(base_servohost.BaseServoHost):
    """Host class for a servo host (e.g. beaglebone, labstation) together
    with a servo instance on a specific port.

    @type _servo: servo.Servo | None
    """

    # Default servod port: the SERVOD_PORT environment variable when set,
    # otherwise 9999.
    DEFAULT_PORT = int(os.getenv('SERVOD_PORT', '9999'))

    # Timeout for initializing servo signals.
    INITIALIZE_SERVO_TIMEOUT_SECS = 60

    # Default timeout for run terminal command.
    DEFAULT_TERMINAL_TIMEOUT = 30

    # Name of the servod method used as the readiness test.
    SERVO_READY_METHOD = 'get_version'

    # Directory prefix on the servo host where the servod logs are stored.
    SERVOD_LOG_PREFIX = '/var/log/servod'

    # Exit code to use when symlinks for servod logs are not found.
    NO_SYMLINKS_CODE = 9

    # Directory in the job's results directory to dump the logs into.
    LOG_DIR = 'servod'

    # Prefix for joint loglevel files in the logs.
    JOINT_LOG_PREFIX = 'log'

    # Regex group to extract timestamp from logfile name.
    TS_GROUP = 'ts'

    # This regex is used to extract the timestamp from servod log file
    # names. Files always start with 'log.'. The dots are escaped so that
    # only a literal '.' is accepted as the separator.
    TS_RE = (r'log\.'
             # The timestamp is of format %Y-%m-%d--%H-%M-%S.MS
             r'(?P<%s>\d{4}(\-\d{2}){2}\-(-\d{2}){3}\.\d{3})'
             # The loglevel is optional depending on labstation version.
             r'(\.(INFO|DEBUG|WARNING))?' % TS_GROUP)
    TS_EXTRACTOR = re.compile(TS_RE)

    # Regex group to extract MCU name from logline in servod logs.
    MCU_GROUP = 'mcu'

    # Regex group to extract logline from MCU logline in servod logs.
    LINE_GROUP = 'line'

    # This regex is used to extract the mcu and the line content from an
    # MCU logline in servod logs. e.g. EC or servo_v4 console logs.
    # Here is an example log-line:
    #
    # 2020-01-23 13:15:12,223 - servo_v4 - EC3PO.Console - DEBUG -
    # console.py:219:LogConsoleOutput - /dev/pts/9 - cc polarity: cc1
    #
    # Here is conceptually how they are formatted:
    #
    #  <time> - <MCU> - EC3PO.Console - <LVL> - <file:line:func> - <pts> -
    #  <output>
    #
    # The log format starts with a timestamp
    MCU_RE = (r'[\d\-]+ [\d:,]+ '
              # The mcu that is logging this is next.
              r'- (?P<%s>\w+) - '
              # Next, we have more log outputs before the actual line.
              # Information about the file line, logging function etc.
              # Anchor on EC3PO Console, LogConsoleOutput and dev/pts.
              # NOTE: if the log format changes, this regex needs to be
              # adjusted.
              r'EC3PO\.Console[\s\-\w\d:.]+LogConsoleOutput - /dev/pts/\d+ - '
              # Lastly, we get the MCU's console line.
              r'(?P<%s>.+$)' % (MCU_GROUP, LINE_GROUP))
    MCU_EXTRACTOR = re.compile(MCU_RE)

    # Regex to detect timeout messages when USBC pigtail has timeout issue.
    # e.g.:  [475635.427072 PD TMOUT RX 1/1]
    USBC_PIGTAIL_TIMEOUT_RE = r'\[[\d \.]{1,20}(PD TMOUT RX 1\/1)\]'

    # Suffix to identify compressed logfiles.
    COMPRESSION_SUFFIX = '.tbz2'

    # A suffix to mark servod log directories that came from instance that
    # ran during this servo_host, but are not the last one running e.g. when
    # an instance (on purpose, or due to a bug) restarted in the middle of the
    # run.
    OLD_LOG_SUFFIX = 'old'

    # Mapping servo board with their vid-pid. A value is either a single
    # 'vid:pid' string or a list of such strings.
    # NOTE(review): every other entry with vendor id 18d1 suggests that
    # '1d81' for c2d2 may be a digit transposition -- confirm against the
    # hardware before changing it.
    SERVO_VID_PID = {
            'servo_v4': '18d1:501b',
            'ccd_cr50': '18d1:5014',
            'servo_micro': '18d1:501a',
            'servo_v3': ['18d1:5004', '0403:6014'],
            'c2d2': '1d81:5041',
    }
145
Otabek Kasimovcc9738e2020-02-14 16:17:15 -0800146 def _init_attributes(self):
147 self._servo_state = None
148 self.servo_port = None
149 self.servo_board = None
150 self.servo_model = None
151 self.servo_serial = None
Garry Wangcb06f3b2020-10-08 20:56:21 -0700152 self.servo_setup = None
Otabek Kasimov1b70e8d2020-12-30 13:51:00 -0800153 self.servo_recovery = None
Otabek Kasimovab4ae222021-03-06 01:38:47 -0800154 self.servo_fw_channel = None
Garry Wang6a680062020-11-03 13:40:29 -0800155 self.additional_servod_args = None
Otabek Kasimov39637412020-11-23 19:09:27 -0800156 self._dut_health_profile = None
Garry Wang000c6c02020-05-11 21:27:23 -0700157 # The flag that indicate if a servo is connected to a smart usbhub.
158 # TODO(xianuowang@) remove this flag once all usbhubs in the lab
159 # get replaced.
160 self.smart_usbhub = None
Otabek Kasimovcc9738e2020-02-14 16:17:15 -0800161 self._servo = None
Otabek Kasimov382c3bb2020-10-28 13:22:45 -0700162 self._topology = None
Andrew McRaef0679932020-08-13 09:15:23 +1000163 self._tunnel_proxy = None
164 self._tunnel_proxy_lock = threading.Lock()
Ruben Rodriguez Buchillon5bac3062020-03-25 21:32:58 -0700165 self._initial_instance_ts = None
Ruben Rodriguez Buchillon93084d02020-01-21 15:17:36 -0800166 # Flag to make sure that multiple calls to close do not result in the
167 # logic executing multiple times.
168 self._closed = False
Andrew McRaef0679932020-08-13 09:15:23 +1000169 # Per-thread local data
170 self._local = threading.local()
Fang Deng5d518f42013-08-02 14:04:32 -0700171
def _initialize(self,
                servo_host='localhost',
                servo_port=DEFAULT_PORT,
                servo_board=None,
                servo_model=None,
                servo_serial=None,
                servo_setup=None,
                servo_recovery=None,
                servo_fw_channel=None,
                additional_servod_args=None,
                is_in_lab=None,
                *args,
                **dargs):
    """Set up a ServoHost, i.e. a host that controls a servo.

    @param servo_host: Name of the host where the servod process
                       is running.
    @param servo_port: Port the servod process is listening on. Defaults
                       to the SERVOD_PORT environment variable if set,
                       otherwise 9999.
    @param servo_board: Board that the servo is connected to.
    @param servo_model: Model that the servo is connected to.
    @param servo_serial: Serial number of the servo device.
    @param servo_setup: Type of servo setup, e.g. REGULAR or DUAL_V4.
    @param servo_recovery: Stored as self.servo_recovery; it is not
                           interpreted by this method.
    @param servo_fw_channel: Stored as self.servo_fw_channel; it is not
                             interpreted by this method.
    @param additional_servod_args: Additional args that will append to
                                   servod start command.
    @param is_in_lab: True if the servo host is in Cros Lab. Default is set
                      to None, for which utils.host_is_in_lab_zone will be
                      called to check if the servo host is in Cros lab.

    """
    super(ServoHost, self)._initialize(hostname=servo_host,
                                       is_in_lab=is_in_lab, *args, **dargs)
    self._init_attributes()

    # Record the caller-supplied servo description.
    self.servo_port = int(servo_port)
    self.servo_board = servo_board
    self.servo_model = servo_model
    self.servo_serial = servo_serial
    self.servo_setup = servo_setup
    self.servo_recovery = servo_recovery
    self.servo_fw_channel = servo_fw_channel
    self.additional_servod_args = additional_servod_args

    port_text = str(self.servo_port)
    # The location of the log files on the servo host for this instance.
    self.remote_log_dir = '%s_%s' % (self.SERVOD_LOG_PREFIX,
                                     self.servo_port)
    # Path of the servo host lock file.
    self._lock_file = (self.TEMP_FILE_DIR + port_text +
                       self.LOCK_FILE_POSTFIX)
    # File path to declare a reboot request.
    self._reboot_file = (self.TEMP_FILE_DIR + port_text +
                         self.REBOOT_FILE_POSTFIX)

    # Lock the servo host if it's an in-lab labstation to prevent other
    # task to reboot it until current task completes. We also wait and
    # make sure the labstation is up here, in the case of the labstation is
    # in the middle of reboot.
    self._is_locked = False
    should_lock = (self.wait_up(self.REBOOT_TIMEOUT)
                   and self.is_in_lab()
                   and self.is_labstation())
    if should_lock:
        self._lock()
        try:
            self.wait_ready()
        except Exception as e:
            # Readiness problems are only logged, never fatal here.
            logging.info(
                    'Unexpected error while ensure labstation'
                    ' readiness; %s', str(e))

    self._repair_strategy = servo_repair.create_servo_repair_strategy()
Richard Barnettee519dcd2016-08-15 17:37:17 -0700244
Dana Goyetteafa62fd2020-03-16 13:45:27 -0700245 def __str__(self):
246 return "<%s '%s:%s'>" % (
247 type(self).__name__, self.hostname, self.servo_port)
248
def connect_servo(self):
    """Create the servo object, then prepare the DUT for servo use.

    Runs initilize_servo() followed by initialize_dut_for_servo().
    """
    # Order matters: the DUT setup requires an existing servo object.
    self.initilize_servo()
    self.initialize_dut_for_servo()
254
def initilize_servo(self):
    """Establish a connection to the servod server on this host.

    Builds a servo.Servo bound to this host and to self.servo_serial, and
    stores it in `self._servo`.
    """
    servo_object = servo.Servo(servo_host=self,
                               servo_serial=self.servo_serial)
    self._servo = servo_object
Richard Barnette9a26ad62016-06-10 12:03:08 -0700264
def initialize_dut_for_servo(self):
    """Run the servo's DUT initialization under a timeout.

    This method will do some setup for dut control, e.g. setup
    main servo_v4 device, and also testing the connection between servo
    and DUT.  As a side effect of testing the connection, all signals on
    the target servo are reset to default values, and the USB stick is
    set to the neutral (off) position.

    @raises: AutoservVerifyError if no servo object exists yet, or if
             the initialization exceeds INITIALIZE_SERVO_TIMEOUT_SECS.
    """
    if not self._servo:
        raise hosts.AutoservVerifyError('Servo object needs to be'
                                        ' initialized before initialize'
                                        ' DUT.')
    # retry.timeout returns a (timed_out, result) pair; only the flag
    # is of interest here.
    timed_out, _ = retry.timeout(
            self._servo.initialize_dut,
            timeout_sec=self.INITIALIZE_SERVO_TIMEOUT_SECS)
    if timed_out:
        raise hosts.AutoservVerifyError('Initialize dut for servo timed'
                                        ' out.')
Richard Barnette9a26ad62016-06-10 12:03:08 -0700282
def disconnect_servo(self):
    """Disconnect our servo if it exists.

    If we've previously successfully connected to our servo,
    disconnect any established ssh tunnel, drop the cached tunnel proxy,
    and set `self._servo` back to `None`. Nothing happens when no servo
    is connected.
    """
    if not self._servo:
        return
    # Hold the same lock that guards proxy creation so that a proxy is
    # never handed out for a tunnel that is being torn down.
    with self._tunnel_proxy_lock:
        # N.B. This call is safe even without a tunnel:
        # rpc_server_tracker.disconnect() silently ignores
        # unknown ports.
        self.rpc_server_tracker.disconnect(self.servo_port)
        # The cached proxy was bound to the tunnel that was just closed.
        # The proxy is only created while this field is None, so it has
        # to be cleared for the next connection to build a fresh one.
        self._tunnel_proxy = None
    self._servo = None
Fang Deng5d518f42013-08-02 14:04:32 -0700296
Andrew McRaef0679932020-08-13 09:15:23 +1000297 def _maybe_create_servod_ssh_tunnel_proxy(self):
298 """Create a xmlrpc proxy for use with a ssh tunnel.
299 A lock is used to safely create a singleton proxy.
300 """
301 with self._tunnel_proxy_lock:
302 if self._tunnel_proxy is None:
303 self._tunnel_proxy = self.rpc_server_tracker.xmlrpc_connect(
304 None,
305 self.servo_port,
306 ready_test_name=self.SERVO_READY_METHOD,
307 timeout_seconds=60,
308 request_timeout_seconds=3600,
309 server_desc=str(self))
310
def get_servod_server_proxy(self):
    """Return a proxy if it exists; otherwise, create a new one.

    When ssh tunnelling is enabled and this host is not localhost, a
    single tunnel based proxy is shared. Otherwise each thread gets its
    own direct http proxy.

    @returns: An xmlrpclib.ServerProxy that is connected to the servod
              server on the host.
    """
    use_tunnel = (servo_constants.ENABLE_SSH_TUNNEL_FOR_SERVO
                  and not self.is_localhost())
    if use_tunnel:
        # Cheap unlocked check first; the helper re-checks under a lock.
        if self._tunnel_proxy is None:
            self._maybe_create_servod_ssh_tunnel_proxy()
        return self._tunnel_proxy

    # xmlrpc/httplib is not thread-safe, so each thread must have its
    # own separate proxy connection.
    thread_data = self._local
    if not hasattr(thread_data, "_per_thread_proxy"):
        url = 'http://%s:%s' % (self.hostname, self.servo_port)
        thread_data._per_thread_proxy = (
                six.moves.xmlrpc_client.ServerProxy(url))
    return thread_data._per_thread_proxy
Wai-Hong Tam3a8a2552019-11-19 14:28:04 +0800332
def verify(self, silent=False):
    """Update the servo host and verify it's in a good state.

    On success the servo state becomes WORKING. On failure the state is
    re-determined (except on localhost) and the exception is re-raised
    only when it is classified as critical.

    @param silent   If true, suppress logging in `status.log`.
    """
    start_note = ('Beginning verify for servo host %s port %s serial %s'
                  % (self.hostname, self.servo_port, self.servo_serial))
    self.record('INFO', None, None, start_note)
    try:
        self._repair_strategy.verify(self, silent)
        self._servo_state = servo_constants.SERVO_STATE_WORKING
        self.record('INFO', None, None,
                    'ServoHost verify set servo_state as WORKING')
    except Exception as e:
        if not self.is_localhost():
            self._servo_state = self.determine_servo_state()
            state_note = ('ServoHost verify set servo_state as %s'
                          % self._servo_state)
            self.record('INFO', None, None, state_note)
        # Non-critical failures are swallowed on purpose.
        if self._is_critical_error(e):
            raise
Fang Deng5d518f42013-08-02 14:04:32 -0700354
Garry Wang2b5eef92020-08-21 16:23:35 -0700355 def _get_default_usbkey_mount_path(self):
356 return '/media/servo_usb/%s' % self.servo_port
Fang Deng5d518f42013-08-02 14:04:32 -0700357
def get_image_name_from_usbkey(self, usbkey_dev):
    """Mount usb drive and check ChromeOS image name on it if there is
    one. This method assumes the image_usbkey_direction is already set
    to servo side.

    @param usbkey_dev: usbkey dev path(e.g. /dev/sdb).

    @returns: image_name on the usbkey, e.g. nami-release/R82.10138.0.0,
              or empty string if no test image detected, or unexpected
              error occurred.
    """
    logging.info('Checking ChromeOS image name on usbkey.')
    mount_point = self._get_default_usbkey_mount_path()
    # Unmount if there is an existing stale mount.
    self._unmount_drive(mount_point)
    # ChromeOS root fs is in /dev/sdx3
    rootfs_partition = usbkey_dev + '3'
    try:
        mounted = self._mount_drive(rootfs_partition, mount_point)
        if not mounted:
            logging.debug('Unexpected error occurred on mount usb drive.')
            return ''

        lsb_release = self.run(
                'cat %s/etc/lsb-release' % mount_point,
                ignore_status=True).stdout.strip()

        # Only test images are of interest.
        if re.search(r'RELEASE_TRACK=.*test', lsb_release):
            return lsbrelease_utils.get_chromeos_release_builder_path(
                    lsb_release_content=lsb_release)

        logging.info('The image on usbkey is not a test image')
        return ''
    finally:
        # Always release the mount, whichever way we leave.
        logging.debug('Image check compeleted, unmounting the usb drive.')
        self._unmount_drive(mount_point)
Garry Wang7b0e1b72020-03-25 19:08:59 -0700393
Garry Wang2b5eef92020-08-21 16:23:35 -0700394 def _extract_firmware_image_from_usbkey(self, fw_dst):
395 """Extract firmware images from the usbkey on servo, this method
396 assumes there is already a ChromeOS test image staged on servo.
397
Garry Wang4b980202020-09-24 17:00:17 -0700398 @param fw_dst: the path that we'll copy firmware images to.
Garry Wang2b5eef92020-08-21 16:23:35 -0700399
400 @returns: a json format string of firmware manifest data.
401 """
402 usbkey_dev = self._probe_and_validate_usb_dev()
403 if not usbkey_dev:
404 raise hosts.AutoservRepairError('Unexpected error occurred when'
405 ' probe usbkey dev path, please check logs for detail.')
406
407 mount_dst = self._get_default_usbkey_mount_path()
408 # Unmount if there is an existing stale mount.
409 self._unmount_drive(mount_dst)
410 # ChromeOS root fs is in /dev/sdx3
411 mount_src = usbkey_dev + '3'
412 try:
413 if not self._mount_drive(mount_src, mount_dst):
414 raise hosts.AutoservRepairError('Failed to extract firmware'
415 ' image; Unable to mount %s.' % usbkey_dev,
416 'unable to mount usbkey')
417 updater_bin = os.path.join(mount_dst,
418 'usr/sbin/chromeos-firmwareupdate')
419 self.run('%s --unpack %s' % (updater_bin, fw_dst))
420 return self.run('%s --manifest' % updater_bin).stdout
421 finally:
422 self._unmount_drive(mount_dst)
423
def prepare_repair_firmware_image(self, fw_dst=None):
    """Prepare firmware image on the servohost for auto repair process
    to consume.

    @param fw_dst: the path that we want to store firmware image on
                   the servohost. Defaults to
                   /tmp/firmware_image/<servo_port>.

    @returns: A tuple that containes ec firmware image path and bios
              firmware image path on the servohost, or None if type of
              image is not available based on manifest and dut's model.
    @raises: AutoservRepairError if the model is unknown, the manifest
             has no entry for the model, or neither image is listed.
    """
    model = self.servo_model or self._dut_host_info.model
    if not model:
        raise hosts.AutoservRepairError(
                'Could not determine DUT\'s model.',
                'model infomation unknown')

    if not fw_dst:
        fw_dst = '/tmp/firmware_image/%s' % self.servo_port
    # Cleanup and re-create dst path to have a fresh start.
    for command in ('rm -rf %s', 'mkdir -p %s'):
        self.run(command % fw_dst)

    manifest = json.loads(self._extract_firmware_image_from_usbkey(fw_dst))
    # For models that have packed $MODEL_signed variant, we want use the
    # 'signed' variant once we get DVT devices, so try to read manifest
    # from $MODEL_signed first.
    build = manifest.get('%s_signed' % model) or manifest.get(model)
    if not build:
        raise hosts.AutoservRepairError('Could not find firmware manifest'
                ' for model:%s' % model, 'model manifest not found')

    def _image_path(component):
        # Path of the component's image, or None when it is not listed.
        try:
            return os.path.join(fw_dst, build[component]['image'])
        except KeyError:
            return None

    ec_image = _image_path('ec')
    bios_image = _image_path('host')
    if not ec_image and not bios_image:
        raise hosts.AutoservRepairError('Could not find any firmware image'
                ' for model:%s' % model, 'cannot find firmware image')
    return ec_image, bios_image
Garry Wang7b0e1b72020-03-25 19:08:59 -0700467
def flash_ap_firmware_via_servo(self, image):
    """Flash AP firmware using the provided image.

    This is a short term enhancement for infra repair use. It uses
    'futility update', which automatically determines the parameters
    needed for flashrom and preserves the GBB, VPD, and HWID during the
    AP firmware update.
    @TODO(xianuowang@) Remove this method once b/148403277 implemented.

    @param image: the firmware image path on servohost.
    """
    flash_cmd = ('futility update -i %s --servo_port=%s'
                 % (image, self.servo_port))
    # The command is given 900 seconds to complete.
    self.run(flash_cmd, timeout=900)
481
Garry Wang70e5d062020-04-03 18:01:05 -0700482 def _probe_and_validate_usb_dev(self):
483 """This method probe the usb dev path by talking to servo, and then
484 validate the dev path is valid block device to servohost.
485 Possible output:
486 1. Encounter error during probe usb dev, returns empty string.
487 2. probe usb dev completed without error but cannot find usb dev,
488 raise AutoservRepairError.
489 3. probe usb dev find a usb dev path, but failed validation in this
490 method, raise AutoservRepairError.
Garry Wang7b0e1b72020-03-25 19:08:59 -0700491
Garry Wang70e5d062020-04-03 18:01:05 -0700492 @returns: A string of usb dev path(e.g. '/dev/sdb'), or empty string
493 if unexpected error occurred during probe.
494 @raises: AutoservRepairError if servo couldn't probe the usb dev path
495 (servo.probe_host_usb_dev() returns empty string), or the dev path is
496 not valid block device to servohost.
Garry Wang7b0e1b72020-03-25 19:08:59 -0700497 """
498 logging.info('Validating image usbkey on servo.')
Garry Wang7b0e1b72020-03-25 19:08:59 -0700499 try:
Garry Wang70e5d062020-04-03 18:01:05 -0700500 usb_dev = self._servo.probe_host_usb_dev()
Garry Wang7b0e1b72020-03-25 19:08:59 -0700501 except Exception as e:
502 # We don't want any unexpected or transient servo communicating
503 # failure block usb repair, so capture all errors here.
504 logging.error(e, exc_info=True)
505 logging.error('Unexpected error occurred on get usbkey dev path,'
506 ' skipping usbkey validation.')
507 return ''
508
Garry Wang70e5d062020-04-03 18:01:05 -0700509 if usb_dev:
510 # probe_host_usb_dev() sometimes return stale record,
511 # so we need to make sure the path exists in fdisk.
Otabek Kasimov77bff672020-10-08 15:52:03 -0700512 validate_cmd = 'fdisk -l %s' % usb_dev
Garry Wang11441182020-06-16 18:34:14 -0700513 try:
Otabek Kasimov77bff672020-10-08 15:52:03 -0700514 resp = self.run(validate_cmd, ignore_status=True, timeout=30)
Garry Wang11441182020-06-16 18:34:14 -0700515 if resp.exit_status == 0:
516 return usb_dev
Garry Wang11441182020-06-16 18:34:14 -0700517 logging.error('%s is reported from "image_usbkey_dev" control'
518 ' but not detected by fdisk!', usb_dev)
519 except error.AutoservRunError as e:
520 if 'Timeout encountered' in str(e):
521 logging.warning('Timeout encountered during fdisk run,'
522 ' skipping usbkey validation.')
523 return ''
524 raise
Garry Wang70e5d062020-04-03 18:01:05 -0700525
526 raise hosts.AutoservRepairError(
527 'No usbkey detected on servo, the usbkey may be either missing'
528 ' or broken. Please replace usbkey on the servo and retry.',
529 'missing usbkey')
530
def is_ec_supported(self):
    """Check if ec is supported on the servo_board.

    @returns: the `chrome_ec` value of the firmware config for this
              board/model; False when no board is set or the config
              cannot be read.
    """
    if not self.servo_board:
        return False
    try:
        firmware_config = config.Config(self.servo_board,
                                        self.servo_model)
        return firmware_config.chrome_ec
    except Exception as e:
        # A config read failure is logged and treated as unsupported.
        logging.error('Unexpected error when read from firmware'
                      ' configs; %s', str(e))
    return False
541
def validate_image_usbkey(self):
    """Validate the recovery usbkey and report the image staged on it.

    First checks that a usbkey on servo is accessible to the servohost,
    then looks for a ChromeOS image already on the drive and returns its
    image_name, so an unnecessary download and flash can be avoided.

    Please note that, there is special error handling logic here:
    1. If unexpected error happens, we return empty string. So repair
       actions will not get blocked.
    2. If no working usbkey present on servo, but no errors, we'll raise
       AutoservRepairError here.

    @returns: image_name on the usbkey, e.g. nami-release/R82.10138.0.0,
              or empty string if no test image detected, or unexpected
              error occurred.
    @raises:  AutoservRepairError if the usbkey is not detected on servo.
    """
    device = self._probe_and_validate_usb_dev()
    if not device:
        return ''
    return self.get_image_name_from_usbkey(device)
Garry Wang7b0e1b72020-03-25 19:08:59 -0700564
def repair(self, silent=False):
    """Attempt to repair servo host.

    On success the servo state becomes WORKING and, for a labstation,
    any reboot request from this servo is withdrawn. On failure the
    state is re-determined (except on localhost); a critical failure
    additionally disconnects the servo, stops servod and is re-raised.

    @param silent   If true, suppress logging in `status.log`.
    """
    start_note = ('Beginning repair for servo host %s port %s serial %s'
                  % (self.hostname, self.servo_port, self.servo_serial))
    self.record('INFO', None, None, start_note)
    try:
        self._repair_strategy.repair(self, silent)
        self._servo_state = servo_constants.SERVO_STATE_WORKING
        self.record('INFO', None, None,
                    'ServoHost repair set servo_state as WORKING')
        # If target is a labstation then try to withdraw any existing
        # reboot request created by this servo because it passed repair.
        if self.is_labstation():
            self.withdraw_reboot_request()
    except Exception as e:
        if not self.is_localhost():
            self._servo_state = self.determine_servo_state()
            state_note = ('ServoHost repair set servo_state as %s'
                          % self._servo_state)
            self.record('INFO', None, None, state_note)
        # Non-critical failures are swallowed on purpose.
        if self._is_critical_error(e):
            self.disconnect_servo()
            self.stop_servod()
            raise
592
def _is_critical_error(self, error):
    """Classify a verify/repair failure as critical or not.

    @param error: the exception raised by verify/repair.

    @returns: False only for an AutoservVerifyDependencyError whose
              is_critical() is false; True for everything else.
    """
    non_critical = (isinstance(error, hosts.AutoservVerifyDependencyError)
                    and not error.is_critical())
    if not non_critical:
        logging.info(
                'Critical verify failure(s) detected during repair/verify '
                'servo. Disconnecting servo and running `stop servod`, all'
                ' repair actions and tests that depends on servo will not '
                'run.')
        return True
    logging.warning('Non-critical verify failure(s) detected during'
                    ' verify/repair servo, servo connection will'
                    ' still be up but may not be fully functional.'
                    ' Some repair actions and servo dependent'
                    ' tests may not run.')
    return False
Fang Deng5d518f42013-08-02 14:04:32 -0700608
def get_servo(self):
    """Return the servo object cached on this host.

    @return: whatever is stored in self._servo; a servo.Servo object.
    @rtype: autotest_lib.server.cros.servo.servo.Servo
    """
    cached_servo = self._servo
    return cached_servo
616
def request_reboot(self):
    """Request a servohost reboot by touching the reboot flag file.

    The touch command runs with ignore_status=True, so a non-zero exit
    status is not treated as an error here.
    """
    logging.debug('Request to reboot servohost %s has been created by '
                  'servo with port # %s', self.hostname, self.servo_port)
    touch_cmd = 'touch %s' % self._reboot_file
    self.run(touch_cmd, ignore_status=True)
623
def withdraw_reboot_request(self):
    """Withdraw a pending servohost reboot request, if there is one.

    Removes the reboot flag file with `rm -f`; the command runs with
    ignore_status=True.
    """
    logging.debug('Withdrawing request to reboot servohost %s that created'
                  ' by servo with port # %s if exists.',
                  self.hostname, self.servo_port)
    remove_cmd = 'rm -f %s' % self._reboot_file
    self.run(remove_cmd, ignore_status=True)
632
def start_servod(self, quick_startup=False):
    """Start the servod process on servohost.

    Builds the `start servod` command line from this host's servo
    attributes, runs it, sleeps to give servod time to come up, and then
    caches the log timestamp of the started instance.

    @param quick_startup: bool, wait SERVOD_QUICK_STARTUP_TIMEOUT instead
                          of SERVOD_STARTUP_TIMEOUT after starting.
    """
    # Skip if running on the localhost.(crbug.com/1038168)
    if self.is_localhost():
        logging.debug("Servohost is a localhost, skipping start servod.")
        return

    args = ['start servod']
    if not self.servo_board:
        logging.warning('Board for DUT is unknown; starting servod'
                        ' assuming a pre-configured board.')
    else:
        args.append('BOARD=%s' % self.servo_board)
        # MODEL is only passed together with a known board.
        if self.servo_model:
            args.append('MODEL=%s' % self.servo_model)

    args.append('PORT=%d' % self.servo_port)
    if self.servo_serial:
        args.append('SERIAL=%s' % self.servo_serial)

    # Start servod with dual_v4 based on servo_setup.
    if self.is_dual_setup():
        args.append('DUAL_V4=1')

    # Start servod with CONFIG=cr50.xml which required for some pools.
    if self._require_cr50_servod_config():
        args.append('CONFIG=cr50.xml')

    if self.servo_recovery == True:
        args.append('REC_MODE=1')

    # Adding customized args if any.
    if self.additional_servod_args:
        args.append(self.additional_servod_args)

    # Remove the symbolic links from the logs. This helps ensure that
    # a failed servod instantiation does not cause us to grab old logs
    # by mistake.
    self.remove_latest_log_symlinks()
    self.run(' '.join(args), timeout=60)

    # There's a lag between when `start servod` completes and when
    # the _ServodConnectionVerifier trigger can actually succeed.
    # The call to time.sleep() below gives time to make sure that
    # the trigger won't fail after we return.

    # Normally servod on servo_v3 and labstation take ~10 seconds to ready,
    # But in the rare case all servo on a labstation are in heavy use they
    # may take ~30 seconds. So the timeout value will double these value,
    # and we'll try quick start up when first time initialize servohost,
    # and use standard start up timeout in repair.
    timeout = (servo_constants.SERVOD_QUICK_STARTUP_TIMEOUT
               if quick_startup
               else servo_constants.SERVOD_STARTUP_TIMEOUT)
    logging.debug('Wait %s seconds for servod process fully up.', timeout)
    time.sleep(timeout)
    # Cache the initial instance timestamp to check against servod restarts
    self._initial_instance_ts = self.get_instance_logs_ts()
Garry Wangc1288cf2019-12-17 14:58:00 -0800693
def stop_servod(self):
    """Stop the servod process on servohost.

    Does nothing when the servohost is a localhost. Otherwise runs
    `stop servod` for this servo's port, ignoring a non-zero exit status,
    and then sleeps for SERVOD_TEARDOWN_TIMEOUT seconds.
    """
    # Skip if running on the localhost.(crbug.com/1038168)
    if self.is_localhost():
        logging.debug("Servohost is a localhost, skipping stop servod.")
        return

    logging.debug('Stopping servod on port %s', self.servo_port)
    stop_cmd = 'stop servod PORT=%d' % self.servo_port
    self.run(stop_cmd, timeout=60, ignore_status=True)
    teardown_wait = servo_constants.SERVOD_TEARDOWN_TIMEOUT
    logging.debug('Wait %s seconds for servod process fully teardown.',
                  teardown_wait)
    time.sleep(teardown_wait)
Garry Wangc1288cf2019-12-17 14:58:00 -0800708
def restart_servod(self, quick_startup=False):
    """Restart servod on servohost: stop it, then start it again.

    @param quick_startup: bool, handed through to start_servod().
    """
    self.stop_servod()
    self.start_servod(quick_startup)
714
def _process_servodtool_error(self, response):
    """Log the reason behind a non-zero servodtool response.

    The stdout of |response| is matched against the known servodtool
    error messages; an unrecognised output is logged as unexpected.

    @param response: result object of the failed command; only its
                     stdout is inspected.
    """
    output = response.stdout
    if re.search(servo_constants.ERROR_MESSAGE_USB_HUB_NOT_COMPATIBLE,
                 output):
        logging.error('The servo is not plugged on a usb hub that supports'
                      ' power-cycle!')
        # change the flag so we can update this label in later process.
        self.smart_usbhub = False
    elif re.search(servo_constants.ERROR_MESSAGE_DEVICE_NOT_FOUND %
                   self.servo_serial, output):
        logging.error('No servo with serial %s found!', self.servo_serial)
    else:
        logging.error('Unexpected error occurred from usbhub control, please'
                      ' file a bug and inform chrome-fleet-software@ team!')
733
def get_main_servo_usb_path(self):
    """Query servodtool for the usb-path of the main servo device.

    The usb-path is path to the folder where usb-device was enumerated.
    An empty string ('') is returned when the command raises or exits
    with a non-zero status.

    @returns: string, usb-path to the main servo device.
        e.g.: '/sys/bus/usb/devices/1-6.1.3.1'
    """
    # TODO remove try-except when fix crbug.com/1087964
    try:
        resp = self.run(
                'servodtool device -s %s usb-path' % self.servo_serial,
                ignore_status=True, timeout=30)
    except Exception as e:
        # Here we catch only timeout errors.
        # Other errors is filtered by ignore_status=True
        logging.debug('Attempt to get servo usb-path failed due to '
                      'timeout; %s', e)
        return ''

    if resp.exit_status == 0:
        usb_path = resp.stdout.strip()
        logging.info('Usb path of servo %s is %s',
                     self.servo_serial, usb_path)
        return usb_path

    self._process_servodtool_error(resp)
    return ''
Garry Wangffbd2162020-04-17 16:13:48 -0700759
Otabek Kasimov86062d02020-11-17 13:30:22 -0800760 def _get_servo_usb_devnum(self):
761 """Helper function to collect current usb devnum of servo."""
762 usb_path = self.get_main_servo_usb_path()
763 if not usb_path:
764 return ''
765 resp = self.run('cat %s/devnum' % usb_path, ignore_status=True)
Garry Wangffbd2162020-04-17 16:13:48 -0700766 if resp.exit_status != 0:
767 self._process_servodtool_error(resp)
768 return ''
769 return resp.stdout.strip()
770
def reboot_servo_v3_on_need(self):
    """Reboot a servo_v3 when one of the conditions below holds.

    1. If there is an update pending on reboot.
    2. Servo_v3 has been up for more than 96 hours.

    Hosts whose board is not 'beaglebone_servo' are left alone. A failed
    reboot is logged and recorded, not raised.
    """
    if self.get_board() != 'beaglebone_servo':
        logging.info('Servo reboot is only applicable for servo V3.')
        return

    pending_state = self.UPDATE_STATE.PENDING_REBOOT
    update_pending_reboot = self._check_update_status() == pending_state
    uptime_hours = float(self.check_uptime()) / 3600
    logging.info('Uptime of servo_v3: %s hour(s)', uptime_hours)
    long_up_time = uptime_hours > 96

    # Skip reboot if neither condition are met.
    if not update_pending_reboot and not long_up_time:
        return

    # A pending update takes precedence over the uptime limit.
    if update_pending_reboot:
        message = 'Starting reboot servo_v3 because an update is pending.'
        reboot_method = self._post_update_reboot
    else:
        message = 'Starting reboot servo_v3 because uptime > 96 hours.'
        reboot_method = self._servo_host_reboot
    self.record('INFO', None, None, message)
    logging.info(message)

    try:
        reboot_method()
    except Exception as e:
        logging.debug("Fail to reboot servo_v3; %s", e)
        message = ('Servo_v3 reboot failed, please check debug log '
                   'for details.')
    else:
        message = 'Servo_v3 reboot completed successfully.'
    logging.info(message)
    self.record('INFO', None, None, message)
Garry Wangffbd2162020-04-17 16:13:48 -0700807
808 def _reset_servo(self):
809 logging.info('Resetting servo through smart usbhub.')
Otabek Kasimov09192682020-06-01 18:17:44 -0700810 # TODO remove try-except when fix crbug.com/1087964
811 try:
812 resp = self.run('servodtool device -s %s power-cycle' %
813 self.servo_serial, ignore_status=True,
814 timeout=30)
815 if resp.exit_status != 0:
816 self._process_servodtool_error(resp)
817 return False
818 except Exception as e:
819 # Here we catch only timeout errors.
820 # Other errors is filtered by ignore_status=True
821 logging.debug('Attempt to reset servo failed due to timeout;'
822 ' %s', e)
Garry Wangffbd2162020-04-17 16:13:48 -0700823 return False
824
825 logging.debug('Wait %s seconds for servo to come back from reset.',
826 servo_constants.SERVO_RESET_TIMEOUT_SECONDS)
827 time.sleep(servo_constants.SERVO_RESET_TIMEOUT_SECONDS)
Garry Wang000c6c02020-05-11 21:27:23 -0700828 # change the flag so we can update this label in later process.
829 self.smart_usbhub = True
Garry Wangffbd2162020-04-17 16:13:48 -0700830 return True
831
def reset_servo(self):
    """Reset(power-cycle) the servo via smart usbhub.

    Only applies when this host is a labstation. The usb devnum of the
    servo is read before and after the reset, and the outcome is logged
    and recorded based on whether the two values differ.
    """
    if not self.is_labstation():
        logging.info('Servo reset is not applicable to servo_v3.')
        return

    devnum_before = self._get_servo_usb_devnum()
    logging.info('Servo usb devnum before reset: %s', devnum_before)
    if not self._reset_servo():
        message = ('Failed to reset servo with serial: %s. (Please ignore'
                   ' this error if the DUT is not connected to a smart'
                   ' usbhub).' % self.servo_serial)
        logging.warning(message)
        self.record('INFO', None, None, message)
        return

    devnum_after = self._get_servo_usb_devnum()
    logging.info('Servo usb devnum after reset: %s', devnum_after)
    if devnum_before and devnum_after:
        if devnum_before != devnum_after:
            message = ('Reset servo with serial %s completed successfully!'
                       % self.servo_serial)
        else:
            message = 'Servo reset completed but devnum is still not changed!'
    else:
        # At least one devnum could not be read, so nothing to compare.
        message = ('Servo reset completed but unable to verify'
                   ' devnum change!')
    logging.info(message)
    self.record('INFO', None, None, message)
862
Ruben Rodriguez Buchillon93084d02020-01-21 15:17:36 -0800863 def _extract_compressed_logs(self, logdir, relevant_files):
864 """Decompress servod logs in |logdir|.
865
866 @param logdir: directory containing compressed servod logs.
867 @param relevant_files: list of files in |logdir| to consider.
868
869 @returns: tuple, (tarfiles, files) where
870 tarfiles: list of the compressed filenames that have been
871 extracted and deleted
872 files: list of the uncompressed files that were generated
873 """
874 # For all tar-files, first extract them to the directory, and
875 # then let the common flow handle them.
876 tarfiles = [cf for cf in relevant_files if
877 cf.endswith(self.COMPRESSION_SUFFIX)]
878 files = []
879 for f in tarfiles:
880 norm_name = os.path.basename(f)[:-len(self.COMPRESSION_SUFFIX)]
881 with tarfile.open(f) as tf:
882 # Each tarfile has only one member, as
883 # that's the compressed log.
884 member = tf.members[0]
885 # Manipulate so that it only extracts the basename, and not
886 # the directories etc.
887 member.name = norm_name
888 files.append(os.path.join(logdir, member.name))
889 tf.extract(member, logdir)
890 # File has been extracted: remove the compressed file.
891 os.remove(f)
892 return tarfiles, files
893
894 def _extract_mcu_logs(self, log_subdir):
895 """Extract MCU (EC, Cr50, etc) console output from servod debug logs.
896
897 Using the MCU_EXTRACTOR regex (above) extract and split out MCU console
898 lines from the logs to generate invidiual console logs e.g. after
899 this method, you can find an ec.txt and servo_v4.txt in |log_dir| if
900 those MCUs had any console input/output.
901
902 @param log_subdir: directory with log.DEBUG.txt main servod debug logs.
903 """
904 # Extract the MCU for each one. The MCU logs are only in the .DEBUG
905 # files
906 mcu_lines_file = os.path.join(log_subdir, 'log.DEBUG.txt')
907 if not os.path.exists(mcu_lines_file):
908 logging.info('No DEBUG logs found to extract MCU logs from.')
909 return
910 mcu_files = {}
911 mcu_file_template = '%s.txt'
912 with open(mcu_lines_file, 'r') as f:
913 for line in f:
914 match = self.MCU_EXTRACTOR.match(line)
915 if match:
916 mcu = match.group(self.MCU_GROUP).lower()
917 line = match.group(self.LINE_GROUP)
918 if mcu not in mcu_files:
919 mcu_file = os.path.join(log_subdir,
920 mcu_file_template % mcu)
921 mcu_files[mcu] = open(mcu_file, 'a')
922 fd = mcu_files[mcu]
923 fd.write(line + '\n')
924 for f in mcu_files:
925 mcu_files[f].close()
926
def remove_latest_log_symlinks(self):
    """Remove the convenience 'latest*' servod log symlinks.

    Runs `rm` on every 'latest*' entry in the remote log dir; a non-zero
    exit status is ignored.
    """
    rm_cmd = 'rm %s/latest*' % self.remote_log_dir
    self.run(rm_cmd, stderr_tee=None, ignore_status=True)
932
def probe_servod_restart(self, instance_ts, outdir):
    """Grab servod logs from previous instances if part of this session.

    If since the last time this host called start_servod() servod crashed
    and restarted, this helper finds those logs as well, and stores them
    with the |OLD_LOG_SUFFIX| to investigate if necessary.

    It also issues a panicinfo command to servo devices after the restart
    to try and collect reboot information for debugging.

    @param instance_ts: the log timestamp that the current instance uses
    @param outdir: directory to create a subdirectory into to place the
                   servod logs into.
    """
    initial_ts = self._initial_instance_ts
    if initial_ts is None:
        logging.info('No log timestamp grabbed successfully on servod '
                     'startup. Cannot check device restarts. Ignoring.')
        return
    if instance_ts == initial_ts:
        logging.debug('Servod appears to have run without restarting')
        return

    # Servod seems to have restarted (at least once). |_initial_instance_ts|
    # is the first timestamp, and instance_ts is the current timestamp. Find
    # all timestamps in between them, and grab the logs for each.
    tss = self._find_instance_timestamps_between(initial_ts, instance_ts)
    logging.info('Servod has restarted %d times between the start and the '
                 'end of this servo_host.', len(tss))
    logging.info('This might be an issue. Will extract all logs from each '
                 'instance.')
    logging.info('Logs that are not the currently running (about to turn '
                 'down) instance are maked with a .%s in their folder.',
                 self.OLD_LOG_SUFFIX)
    for ts in tss:
        self.get_instance_logs(ts, outdir, old=True)

    # Lastly, servod has restarted due to a potential issue. Try to get
    # panic information from servo micro and servo v4 for the current logs.
    # This can only happen if the |_servo| attribute is initialized.
    if not self._servo:
        return
    for mcu in ('servo_micro', 'servo_v4'):
        ctrl = '%s_uart_cmd' % mcu
        if not self._servo.has_control(ctrl):
            continue
        logging.info('Trying to retrieve %r panicinfo into logs', mcu)
        try:
            self._servo.set_nocheck(ctrl, 'panicinfo')
        except error.TestFail as e:
            logging.error('Failed to generate panicinfo for %r '
                          'logs. %s', mcu, str(e))
982
983 def _find_instance_timestamps_between(self, start_ts, end_ts):
984 """Find all log timestamps between [start_ts, end_ts).
985
986 @param start_ts: str, earliest log timestamp of interest
987 @param end_ts: str, latest log timestamp of interest
988
989 @returns: list, all timestamps between start_ts and end_ts, end_ts
990 exclusive, on the servo_host. An empty list on errors
991 """
992 # Simply get all timestamp, and then sort and remove
993 cmd = 'ls %s' % self.remote_log_dir
994 res = self.run(cmd, stderr_tee=None, ignore_status=True)
995 if res.exit_status != 0:
996 # Here we failed to find anything.
997 logging.info('Failed to find remote servod logs. Ignoring.')
998 return []
999 logfiles = res.stdout.strip().split()
1000 timestamps = set()
1001 for logfile in logfiles:
1002 ts_match = self.TS_EXTRACTOR.match(logfile)
1003 if not ts_match:
1004 # Simply ignore files that fail the check. It might be the
1005 # 'latest' symlinks or random files.
1006 continue
1007 timestamps.add(ts_match.group(self.TS_GROUP))
1008 # At this point we have all unique timestamps.
1009 timestamps = sorted(timestamps)
1010 for ts in [start_ts, end_ts]:
1011 if ts not in timestamps:
1012 logging.error('Timestamp %r not in servod logs. Cannot query '
1013 'for timestamps in between %r and %r', ts,
1014 start_ts, end_ts)
1015 return []
1016 return timestamps[timestamps.index(start_ts):timestamps.index(end_ts)]
1017
def get_instance_logs_ts(self):
    """Retrieve the currently running servod instance's log timestamp

    Resolves the 'latest.DEBUG' (or, failing that, 'latest') entry in the
    remote log dir to its real filename and extracts the timestamp from
    that name with TS_EXTRACTOR.

    @returns: str, timestamp for current instance, or None on failure
    """
    # First, extract the timestamp. This cmd gives the real filename of
    # the latest aka current log file.
    cmd_args = {'dir': self.remote_log_dir,
                'code': self.NO_SYMLINKS_CODE}
    cmd = ('if [ -f %(dir)s/latest.DEBUG ];'
           'then realpath %(dir)s/latest.DEBUG;'
           'elif [ -f %(dir)s/latest ];'
           'then realpath %(dir)s/latest;'
           'else exit %(code)d;'
           'fi' % cmd_args)
    res = self.run(cmd, stderr_tee=None, ignore_status=True)
    status = res.exit_status
    if status != 0:
        if status == self.NO_SYMLINKS_CODE:
            logging.warning('servod log latest symlinks not found. '
                            'This is likely due to an error starting up '
                            'servod. Ignoring..')
        else:
            logging.warning('Failed to find servod logs on servo host.')
            logging.warning(res.stderr.strip())
        return None

    fname = os.path.basename(res.stdout.strip())
    # From the fname, ought to extract the timestamp using the TS_EXTRACTOR
    ts_match = self.TS_EXTRACTOR.match(fname)
    if ts_match:
        return ts_match.group(self.TS_GROUP)
    logging.warning('Failed to extract timestamp from servod log file '
                    '%r. Skipping. The servo host is using outdated '
                    'servod logging and needs to be updated.', fname)
    return None
1051
def get_instance_logs(self, instance_ts, outdir, old=False):
    """Collect all logs with |instance_ts| and dump into a dir in |outdir|

    This method first collects all logs on the servo_host side pertaining
    to this servod instance (port, instatiation). It glues them together
    into combined log.[level].txt files and extracts all available MCU
    console I/O from the logs into individual files e.g. servo_v4.txt

    All the output can be found in a directory inside |outdir| that
    this generates based on |LOG_DIR|, the servod port, and the instance
    timestamp on the servo_host side.

    @param instance_ts: log timestamp to grab logfiles for
    @param outdir: directory to create a subdirectory into to place the
                   servod logs into.
    @param old: bool, whether to append |OLD_LOG_SUFFIX| to output dir
    """
    # Create the local results log dir.
    dir_name = '%s_%s.%s' % (self.LOG_DIR, str(self.servo_port),
                             instance_ts)
    log_dir = os.path.join(outdir, dir_name)
    if old:
        log_dir = '%s.%s' % (log_dir, self.OLD_LOG_SUFFIX)
    logging.info('Saving servod logs to %r.', log_dir)
    os.mkdir(log_dir)

    # Now, get all files with that timestamp.
    find_cmd = 'find %s -maxdepth 1 -name "log.%s*"' % (self.remote_log_dir,
                                                        instance_ts)
    res = self.run(find_cmd, stderr_tee=None, ignore_status=True)
    remote_files = res.stdout.strip().split()
    try:
        self.get_file(remote_files, log_dir, try_rsync=False)
        if not os.listdir(log_dir):
            logging.info('No servod logs retrieved. Ignoring, and removing '
                         '%r again.', log_dir)
            os.rmdir(log_dir)
            return
    except error.AutoservRunError as e:
        result = e.result_obj
        if result.exit_status != 0:
            stderr = result.stderr.strip()
            logging.warning("Couldn't retrieve servod logs. Ignoring: %s",
                            stderr or '\n%s' % result)
        # Remove the log_dir as nothing was added to it.
        os.rmdir(log_dir)
        return

    local_files = [os.path.join(log_dir, name)
                   for name in os.listdir(log_dir)]
    # TODO(crrev.com/c/1793030): remove no-level case once CL is pushed
    for level_name in ('DEBUG', 'INFO', 'WARNING', ''):
        # Create the joint files for each loglevel. i.e log.DEBUG
        if level_name:
            joint_file = '%s.%s' % (self.JOINT_LOG_PREFIX, level_name)
        else:
            joint_file = self.JOINT_LOG_PREFIX
        # The .txt suffix helps with some online tools to avoid complaints
        # about an unknown filetype.
        joint_path = os.path.join(log_dir, joint_file + '.txt')

        files = [f for f in local_files if level_name in f]
        if not files:
            # TODO(crrev.com/c/1793030): remove no-level case once CL
            # is pushed
            continue

        # Extract compressed logs if any.
        compressed, extracted = self._extract_compressed_logs(log_dir,
                                                              files)
        files = list(set(files) - set(compressed))
        files.extend(extracted)

        # Need to sort. As they all share the same timestamp, and
        # loglevel, the index itself is sufficient. The highest index
        # is the oldest file, therefore we need a descending sort.
        def sortkey(f, level=level_name):
            """Custom sortkey to sort based on rotation number int."""
            if f.endswith(level):
                return 0
            return int(f.split('.')[-1])

        files.sort(reverse=True, key=sortkey)
        oldest, newer_files = files[0], files[1:]
        # Just rename the first file rather than building from scratch.
        os.rename(oldest, joint_path)
        with open(joint_path, 'a') as joint_f:
            for logfile in newer_files:
                # Transfer the file to the joint file line by line.
                with open(logfile, 'r') as log_f:
                    for line in log_f:
                        joint_f.write(line)
                # File has been written over. Delete safely.
                os.remove(logfile)
        # Need to remove all files form |local_files| so we don't
        # analyze them again.
        local_files = list(set(local_files) - set(files) - set(compressed))

    # Lastly, extract MCU logs from the joint logs.
    self._extract_mcu_logs(log_dir)
1143
Garry Wang79e9af62019-06-12 15:19:19 -07001144 def _lock(self):
1145 """lock servohost by touching a file.
1146 """
1147 logging.debug('Locking servohost %s by touching %s file',
1148 self.hostname, self._lock_file)
1149 self.run('touch %s' % self._lock_file, ignore_status=True)
Garry Wang7c00b0f2019-06-25 17:28:17 -07001150 self._is_locked = True
Garry Wang79e9af62019-06-12 15:19:19 -07001151
Garry Wang79e9af62019-06-12 15:19:19 -07001152 def _unlock(self):
1153 """Unlock servohost by removing the lock file.
1154 """
1155 logging.debug('Unlocking servohost by removing %s file',
1156 self._lock_file)
1157 self.run('rm %s' % self._lock_file, ignore_status=True)
Garry Wang7c00b0f2019-06-25 17:28:17 -07001158 self._is_locked = False
Garry Wang79e9af62019-06-12 15:19:19 -07001159
def close(self):
    """Close the associated servo and the host object.

    In order: probes for servod restarts and grabs the old logs, closes
    the servo, grabs the current servod logs, removes the servohost lock,
    stops servod, closes the parent host and marks this host as closed.
    The steps that talk to the servohost only run when it is reachable.
    """
    # NOTE: throughout this method there are multiple attempts to catch
    # all errors. This is WAI as log grabbing should not fail tests.
    # However, the goal is to catch and handle/process all errors, thus
    # we print the traceback and ask for a bug.
    if self._closed:
        logging.debug('ServoHost is already closed.')
        return

    # Only attempt ssh related actions if servohost is sshable. We call
    # check_cached_up_status() first because it's lightweighted and return
    # much faster in the case servohost is down, however, we still want
    # to call is_up() later since check_cached_up_status() is ping based
    # check and not guarantee the servohost is sshable.
    servo_host_ready = self.check_cached_up_status() and self.is_up()

    instance_ts = None
    if servo_host_ready:
        instance_ts = self.get_instance_logs_ts()
    else:
        logging.info('Servohost is down, will skip servod log collecting.')

    # TODO(crbug.com/1011516): once enabled, remove the check against
    # localhost and instead check against log-rotiation enablement.
    logs_available = (instance_ts is not None and
                      self.job and
                      not self.is_localhost())

    if logs_available:
        # Probe whether there was a servod restart, and grab those old
        # logs as well.
        try:
            self.probe_servod_restart(instance_ts, self.job.resultdir)
        except (error.AutoservRunError, error.TestFail) as e:
            logging.info('Failed to grab servo logs due to: %s. '
                         'This error is forgiven.', str(e))
        except Exception as e:
            logging.error('Unexpected error probing for old logs. %s. '
                          'Forgiven. Please file a bug and fix or catch '
                          'in log probing function', str(e),
                          exc_info=True)

    if self._servo:
        # In some cases when we run as lab-tools, the job object is None.
        outdir = self.job.resultdir if self.job else None
        self._servo.close(outdir)

    if logs_available:
        # Grab current (not old like above) logs after the servo instance
        # was closed out.
        try:
            self.get_instance_logs(instance_ts, self.job.resultdir)
        except error.AutoservRunError as e:
            logging.info('Failed to grab servo logs due to: %s. '
                         'This error is forgiven.', str(e))
        except Exception as e:
            logging.error('Unexpected error grabbing servod logs. %s. '
                          'Forgiven. Please file a bug and fix or catch '
                          'in log grabbing function', str(e), exc_info=True)

    if self._is_locked and servo_host_ready:
        # Remove the lock if the servohost has been locked.
        try:
            self._unlock()
        except error.AutoservSSHTimeout:
            logging.error('Unlock servohost failed due to ssh timeout.'
                          ' It may caused by servohost went down during'
                          ' the task.')

    # We want always stop servod after task to minimum the impact of bad
    # servod process interfere other servods.(see crbug.com/1028665)
    if servo_host_ready:
        try:
            self.stop_servod()
        except error.AutoservRunError as e:
            logging.info(
                    "Failed to stop servod due to:\n%s\n"
                    "This error is forgiven.", str(e))

    super(ServoHost, self).close()
    # Mark closed.
    self._closed = True
Congbin Guoa1f9cba2018-07-03 11:36:59 -07001239
def get_servo_state(self):
    """Return the servo state currently stored on this host.

    @returns: the value of self._servo_state.
    """
    current_state = self._servo_state
    return current_state
Otabek Kasimovcc9738e2020-02-14 16:17:15 -08001242
Otabek Kasimovc6f30412020-06-30 20:08:12 -07001243 def _get_host_metrics_data(self):
1244 return {'port': self.servo_port,
Otabek Kasimov0ea47362020-07-11 20:55:09 -07001245 'host': self.get_dut_hostname() or self.hostname,
Otabek Kasimovc6f30412020-06-30 20:08:12 -07001246 'board': self.servo_board or ''}
1247
Otabek Kasimovce34f532021-03-09 08:28:55 +00001248 def _is_servo_device_connected(self, servo_type, serial):
1249 """Check if device is connected to the labstation.
1250
1251 Works for all servo devices connected to the labstation.
1252 For servo_v3 please use 'self._is_servo_board_present_on_servo_v3'
1253
1254 @param servo_type: The type of servo device. Expecting value can be
1255 servo_v4 or servo_micro.
1256 @param serial: The serial number of the device to detect it.
1257 """
1258 vid_pid = self.SERVO_VID_PID.get(servo_type)
1259 if not vid_pid or not serial:
1260 # device cannot detected without VID/PID or serial number
1261 return False
1262 logging.debug('Started to detect %s', servo_type)
1263 try:
1264 cmd = 'lsusb -v -d %s |grep iSerial |grep %s' % (vid_pid, serial)
1265 result = self.run(cmd, ignore_status=True, timeout=30)
1266 if result.exit_status == 0 and result.stdout.strip():
1267 logging.debug('The %s is plugged in to the host.', servo_type)
1268 return True
1269 logging.debug('%s device is not detected; %s', servo_type, result)
1270 return False
1271 except Exception as e:
1272 # can be triggered by timeout issue due running the script
1273 metrics.Counter(
1274 'chromeos/autotest/repair/servo_detection/timeout'
1275 ).increment(fields=self._get_host_metrics_data())
1276 logging.error('%s device is not detected; %s', servo_type, str(e))
1277 return None
1278
1279 def _is_servo_board_present_on_servo_v3(self):
Otabek Kasimovc6f30412020-06-30 20:08:12 -07001280 """Check if servo board is detected on servo_v3"""
Otabek Kasimovce34f532021-03-09 08:28:55 +00001281 vid_pids = self.SERVO_VID_PID['servo_v3']
1282 if not vid_pids or len(vid_pids) == 0:
1283 # device cannot detected without VID/PID
1284 return False
Otabek Kasimovc6f30412020-06-30 20:08:12 -07001285 logging.debug('Started to detect servo board on servo_v3')
1286 not_detected = 'The servo board is not detected on servo_v3'
1287 try:
1288 cmd = 'lsusb | grep "%s"' % "\|".join(vid_pids)
1289 result = self.run(cmd, ignore_status=True, timeout=30)
1290 if result.exit_status == 0 and result.stdout.strip():
1291 logging.debug('The servo board is detected on servo_v3')
1292 return True
1293 logging.debug('%s; %s', not_detected, result)
1294 return False
1295 except Exception as e:
1296 # can be triggered by timeout issue due running the script
1297 metrics.Counter(
1298 'chromeos/autotest/repair/servo_detection/timeout'
1299 ).increment(fields=self._get_host_metrics_data())
1300 logging.error('%s; %s', not_detected, str(e))
1301 return None
1302
Otabek Kasimovce34f532021-03-09 08:28:55 +00001303 def _is_main_device_not_detected_on_servo_v4(self):
1304 """Check if servod cannot find main device on servo.
1305
1306 The check based on reading servod logs for servo_v4.
1307 """
1308 if not self._initial_instance_ts:
1309 # latest log not found
1310 return False
1311 logging.debug('latest log for servod created at %s',
1312 self._initial_instance_ts)
1313 try:
1314 log_created = calendar.timegm(time.strptime(
1315 self._initial_instance_ts,
1316 "%Y-%m-%d--%H-%M-%S.%f"))
1317 except ValueError as e:
1318 logging.debug('Cannot read time from log file name: %s',
1319 self._initial_instance_ts)
1320 return False
1321 min_time_created = calendar.timegm(time.gmtime())
1322 if min_time_created > log_created + 3600:
1323 # the log file is old we cannot use it
1324 logging.debug('log file was created more than hour ago, too old')
1325 return False
1326 logging.debug('latest log was created not longer then 1 hour ago')
1327
1328 # check if servod can detect main device by servo_v4
1329 message = 'ERROR - No servo micro or CCD detected for board'
1330 cmd = ('cat /var/log/servod_%s/log.%s.INFO |grep "%s"'
1331 % (self.servo_port, self._initial_instance_ts, message))
1332 result = self.run(cmd, ignore_status=True)
1333 if result.stdout.strip():
1334 logging.info('Servod cannot detect main device on the servo; '
1335 'Can be caused by bad hardware of servo or '
1336 'issue on the DUT side.')
1337 return True
1338 logging.debug('The main device is detected')
1339 return False
1340
def _require_cr50_servod_config(self):
    """Check whether servod needs to be started with CONFIG=cr50.xml.

    @returns: True if any pool of the DUT starts with
              `servo_constants.CR50_CONFIG_POOL_PREFIX`, False otherwise
              (including when no DUT host info is available).
    """
    info = self.get_dut_host_info()
    if not info:
        return False
    return any(
            pool_name.startswith(servo_constants.CR50_CONFIG_POOL_PREFIX)
            for pool_name in info.pools)
1350
def get_verifier_state(self, tag):
    """Return the state of the servo verifier identified by `tag`.

    @param tag: tag of the verifier to look up in the repair strategy.

    @returns: whatever `self._repair_strategy.verifier_is_good(tag)`
              reports (documented by the original author as bool or None).
    """
    strategy = self._repair_strategy
    return strategy.verifier_is_good(tag)
1357
def determine_servo_state(self):
    """Determine servo state based on the failed verifiers.

    The state is derived from the first failed verifier, or from a
    combination of them; the checks below run in priority order and the
    first match wins.

    @returns: servo state value (one of the
              `servo_constants.SERVO_STATE_*` constants).
    """
    ssh = self.get_verifier_state('servo_ssh')
    servo_fw = self.get_verifier_state('servo_fw')
    disk_space = self.get_verifier_state('servo_disk_space')
    start_servod = self.get_verifier_state('servod_started')
    create_servo = self.get_verifier_state('servod_connection')
    init_servo = self.get_verifier_state('servod_control')
    cr50_low_sbu = self.get_verifier_state('servo_cr50_low_sbu')
    cr50_off = self.get_verifier_state('servo_cr50_off')
    # Named `topology` so the local does not shadow the `servo_topology`
    # module used elsewhere in this file.
    topology = self.get_verifier_state('servo_topology')
    dut_connected = self.get_verifier_state('servo_dut_connected')
    hub_connected = self.get_verifier_state('servo_hub_connected')
    pwr_button = self.get_verifier_state('servo_pwr_button')
    lid_open = self.get_verifier_state('servo_lid_open')
    ec_board = self.get_verifier_state('servo_ec_board')
    cr50_console = self.get_verifier_state('servo_cr50_console')
    ccd_testlab = self.get_verifier_state('servo_ccd_testlab')

    if not ssh:
        return servo_constants.SERVO_STATE_NO_SSH
    if servo_fw == hosts.VERIFY_FAILED:
        return servo_constants.SERVO_STATE_NEED_REPLACEMENT

    if (start_servod == hosts.VERIFY_FAILED
                or create_servo == hosts.VERIFY_FAILED):
        # Sometimes servod can start without a servo being present.
        # The detection helpers return None when the check itself failed,
        # so only an explicit False means "not connected".
        if self.is_labstation():
            if not self.servo_serial:
                return servo_constants.SERVO_STATE_WRONG_CONFIG
            if self._is_servo_device_connected(
                    'servo_v4',
                    self.servo_serial) == False:
                return servo_constants.SERVO_STATE_NOT_CONNECTED
        elif self._is_servo_board_present_on_servo_v3() == False:
            return servo_constants.SERVO_STATE_NOT_CONNECTED

    if dut_connected == hosts.VERIFY_FAILED:
        return servo_constants.SERVO_STATE_DUT_NOT_CONNECTED
    if hub_connected == hosts.VERIFY_FAILED:
        logging.info('Servo HUB not connected')
        return servo_constants.SERVO_STATE_DUT_NOT_CONNECTED
    if cr50_low_sbu == hosts.VERIFY_FAILED:
        return servo_constants.SERVO_STATE_SBU_LOW_VOLTAGE
    if cr50_off == hosts.VERIFY_FAILED:
        return servo_constants.SERVO_STATE_CR50_NOT_ENUMERATED
    if topology == hosts.VERIFY_FAILED:
        return servo_constants.SERVO_STATE_TOPOLOGY_ISSUE

    # TODO(otabek@): detect special cases detected by pwr_button
    if dut_connected == hosts.VERIFY_SUCCESS:
        if pwr_button == hosts.VERIFY_FAILED:
            metrics.Counter(
                    'chromeos/autotest/repair/servo_unexpected/pwr_button2'
            ).increment(fields=self._get_host_metrics_data())

    if start_servod == hosts.VERIFY_FAILED:
        return servo_constants.SERVO_STATE_SERVOD_ISSUE

    if create_servo == hosts.VERIFY_FAILED:
        if (self.is_labstation()
                    and self._is_main_device_not_detected_on_servo_v4()):
            servo_type = None
            dut_info = self.get_dut_host_info()
            if dut_info:
                servo_type = dut_info.get_label_value(
                        servo_constants.SERVO_TYPE_LABEL_PREFIX)
            if servo_type and 'servo_micro' in servo_type:
                serial = self.get_servo_micro_serial_number()
                logging.debug('servo_micro serial: %s', serial)
                # servo_micro is visible over USB while servod cannot
                # find the main device. Uses the USB detection helper
                # defined on this class (the previous call referenced
                # `_is_servo_device_detected`, which is not defined in
                # the visible part of the class).
                if self._is_servo_device_connected('servo_micro',
                                                   serial):
                    return servo_constants.SERVO_STATE_BAD_RIBBON_CABLE
            # The device may be undetected because of the DUT.
            # TODO (otabek) update after b/159755652 and b/159754985
            metrics.Counter(
                    'chromeos/autotest/repair/servo_state/needs_replacement'
            ).increment(fields=self._get_host_metrics_data())
        elif not self.is_labstation():
            # Logic to check if the flex cable is connected is needed here.
            pass

    # One of the reasons why servo cannot be initialized.
    if cr50_console == hosts.VERIFY_FAILED:
        return servo_constants.SERVO_STATE_CR50_CONSOLE_MISSING
    if ccd_testlab == hosts.VERIFY_FAILED:
        return servo_constants.SERVO_STATE_CCD_TESTLAB_ISSUE

    if (create_servo == hosts.VERIFY_FAILED
                or init_servo == hosts.VERIFY_FAILED):
        return servo_constants.SERVO_STATE_SERVOD_ISSUE

    if ec_board == hosts.VERIFY_FAILED:
        return servo_constants.SERVO_STATE_EC_BROKEN
    if pwr_button == hosts.VERIFY_FAILED:
        return servo_constants.SERVO_STATE_BAD_RIBBON_CABLE
    if lid_open == hosts.VERIFY_FAILED:
        return servo_constants.SERVO_STATE_LID_OPEN_FAILED

    metrics.Counter(
            'chromeos/autotest/repair/unknown_servo_state'
    ).increment(fields=self._get_host_metrics_data())
    logging.info('We do not have special state for this failure yet :)')
    return servo_constants.SERVO_STATE_BROKEN
1466
def is_servo_topology_supported(self):
    """Check if servo_topology is supported.

    @returns: True only when the servo host is reachable, is a
              labstation and has a servo serial; otherwise False, with
              the reason logged.
    """
    if not self.is_up_fast():
        reason = 'Servo-Host is not reachable.'
    elif not self.is_labstation():
        reason = 'Servo-topology supported only for labstation.'
    elif not self.servo_serial:
        reason = 'Servo-topology required a servo serial.'
    else:
        return True
    logging.info(reason)
    return False
1479
def get_topology(self):
    """Get the servo topology, creating it on first use.

    @returns: the object stored in `self._topology`; when that is not
              set yet, a new `servo_topology.ServoTopology` built for
              this host is stored there first.
    """
    if self._topology:
        return self._topology
    self._topology = servo_topology.ServoTopology(self)
    return self._topology
1485
def is_dual_setup(self):
    """Check if servo will run in dual setup.

    Dual setup is used only for servo_v4 when ccd_cr50 and servo_micro
    are used at the same time.

    @returns: True if `self.servo_setup` equals
              `servo_constants.SERVO_SETUP_VALUE_DUAL_V4`.
    """
    configured_setup = self.servo_setup
    return configured_setup == servo_constants.SERVO_SETUP_VALUE_DUAL_V4
1493
def set_dut_health_profile(self, dut_health_profile):
    """Store the health profile of the DUT on this servo host.

    @param dut_health_profile: A DeviceHealthProfile object.
    """
    logging.debug('setting dut_health_profile field to (%s)',
                  dut_health_profile)
    setattr(self, '_dut_health_profile', dut_health_profile)
1501
def get_dut_health_profile(self):
    """Return the DUT health profile stored on this servo host.

    @return A DeviceHealthProfile object.
    """
    profile = self._dut_health_profile
    return profile
1507
Otabek Kasimovcc9738e2020-02-14 16:17:15 -08001508
def make_servo_hostname(dut_hostname):
    """Given a DUT's hostname, return the hostname of its servo.

    The servo hostname is the DUT hostname with '-servo' appended to its
    first dot-separated component.

    @param dut_hostname: hostname of a DUT.

    @return hostname of the DUT's servo.

    """
    short_name, dot, domain = dut_hostname.partition('.')
    return short_name + '-servo' + dot + domain
1520
1521
Richard Barnettee519dcd2016-08-15 17:37:17 -07001522def _map_afe_board_to_servo_board(afe_board):
1523 """Map a board we get from the AFE to a servo appropriate value.
1524
1525 Many boards are identical to other boards for servo's purposes.
1526 This function makes that mapping.
1527
1528 @param afe_board string board name received from AFE.
1529 @return board we expect servo to have.
1530
1531 """
1532 KNOWN_SUFFIXES = ['-freon', '_freon', '_moblab', '-cheets']
1533 BOARD_MAP = {'gizmo': 'panther'}
1534 mapped_board = afe_board
1535 if afe_board in BOARD_MAP:
1536 mapped_board = BOARD_MAP[afe_board]
1537 else:
1538 for suffix in KNOWN_SUFFIXES:
1539 if afe_board.endswith(suffix):
1540 mapped_board = afe_board[0:-len(suffix)]
1541 break
1542 if mapped_board != afe_board:
1543 logging.info('Mapping AFE board=%s to %s', afe_board, mapped_board)
1544 return mapped_board
1545
1546
def get_servo_args_for_host(dut_host):
    """Return servo data associated with a given DUT.

    @param dut_host   Instance of `Host` on which to find the servo
                      attributes.
    @return `servo_args` dict with host and an optional port, or None
            when the resulting dict has no servo host attribute.
    """
    info = dut_host.host_info_store.get()
    servo_args = dict(
            (key, value) for key, value in six.iteritems(info.attributes)
            if key in servo_constants.SERVO_ATTR_KEYS)

    host_key = servo_constants.SERVO_HOST_ATTR
    ssh_port_key = servo_constants.SERVO_HOST_SSH_PORT_ATTR
    servo_port_key = servo_constants.SERVO_PORT_ATTR

    if ssh_port_key in servo_args:
        raw_ssh_port = servo_args[ssh_port_key]
        try:
            servo_args[ssh_port_key] = int(raw_ssh_port)
        except ValueError:
            logging.error('servo host port is not an int: %s', raw_ssh_port)
            # Only the invalid ssh port is dropped; the rest is kept.
            servo_args.pop(ssh_port_key, None)

    if servo_port_key in servo_args:
        raw_servo_port = servo_args[servo_port_key]
        try:
            servo_args[servo_port_key] = int(raw_servo_port)
        except ValueError:
            logging.error('servo port is not an int: %s', raw_servo_port)
            # An invalid servo port invalidates the whole configuration:
            # removing the host attribute makes this function return None
            # below.
            servo_args.pop(host_key, None)

    if info.board:
        servo_args[servo_constants.SERVO_BOARD_ATTR] = (
                _map_afe_board_to_servo_board(info.board))
    if info.model:
        servo_args[servo_constants.SERVO_MODEL_ATTR] = info.model

    if host_key not in servo_args:
        return None
    return servo_args
Richard Barnetteea3e4602016-06-10 12:36:41 -07001584
1585
def _tweak_args_for_ssp_moblab(servo_args):
    """Replace a loopback servo host with the SSP host container IP.

    When the servo host in `servo_args` is 'localhost' or '127.0.0.1', it
    is overwritten in place with the 'host_container_ip' value of the
    'SSP' config section (None when that value is not configured).

    @param servo_args: dict of servo arguments; must contain the servo
                       host attribute.
    """
    host_key = servo_constants.SERVO_HOST_ATTR
    if servo_args[host_key] not in ['localhost', '127.0.0.1']:
        return
    servo_args[host_key] = _CONFIG.get_config_value(
            'SSP', 'host_container_ip', type=str, default=None)
1591
1592
def create_servo_host(dut,
                      servo_args,
                      try_lab_servo=False,
                      try_servo_repair=False,
                      try_servo_recovery=False,
                      dut_host_info=None,
                      dut_health_profile=None):
    """Create a ServoHost object for a given DUT, if appropriate.

    This function attempts to create and verify or repair a `ServoHost`
    object for a servo connected to the given `dut`, subject to various
    constraints imposed by the parameters:
      * When the `servo_args` parameter is not `None`, a servo
        host must be created, and must be checked with `repair()`.
      * Otherwise, if a servo exists in the lab and `try_lab_servo` is
        true:
          * If `try_servo_repair` is true, then create a servo host and
            check it with `repair()`.
          * Otherwise, if the servo responds to `ping` then create a
            servo host and check it with `verify()`.

    In cases where `servo_args` was not `None`, repair failure
    exceptions are passed back to the caller; otherwise, exceptions
    are logged and then discarded.  Note that this only happens in cases
    where we're called from a test (not special task) control file that
    has an explicit dependency on servo.  In that case, we require that
    repair not write to `status.log`, so as to avoid polluting test
    results.

    TODO(jrbarnette):  The special handling for servo in test control
    files is a thorn in my flesh; I dearly hope to see it cut out before
    my retirement.

    Parameters for a servo host consist of a host name, port number, and
    DUT board, and are determined from one of these sources, in order of
    priority:
      * Servo attributes from the `dut` parameter take precedence over
        all other sources of information.
      * If a DNS entry for the servo based on the DUT hostname exists in
        the CrOS lab network, that hostname is used with the default
        port and the DUT's board.
      * If no other options are found, the parameters will be taken
        from the `servo_args` dict passed in from the caller.

    @param dut                  An instance of `Host` from which to take
                                servo parameters (if available).
    @param servo_args           A dictionary with servo parameters to use
                                if they can't be found from `dut`.  If
                                this argument is supplied, unrepaired
                                exceptions from `verify()` will be passed
                                back to the caller.
    @param try_lab_servo        If not true, servo host creation will be
                                skipped unless otherwise required by the
                                caller.
    @param try_servo_repair     If true, check a servo host with
                                `repair()` instead of `verify()`.
    @param try_servo_recovery   If true, start servod in recovery mode.
    @param dut_host_info:       A HostInfo object of the DUT that is
                                connected to this servo.
    @param dut_health_profile:  DUT repair info with history.

    @returns: A tuple `(servo_host, servo_state)`:
                * `(None, None)` when no servo arguments are available
                  and the servo is not required;
                * `(None, <SERVO_STATE_* constant>)` when the servo
                  configuration is missing or wrong, or the servo host
                  does not respond;
                * `(ServoHost, state)` otherwise, where `state` is the
                  host's `get_servo_state()` after verify/repair.

    """
    # Whether the caller explicitly depends on servo is decided before
    # `servo_args` can be replaced by host-derived overrides.
    servo_dependency = servo_args is not None
    if dut is not None and (try_lab_servo or servo_dependency):
        servo_args_override = get_servo_args_for_host(dut)
        if servo_args_override is not None:
            if utils.in_moblab_ssp():
                _tweak_args_for_ssp_moblab(servo_args_override)
            logging.debug(
                    'Overriding provided servo_args (%s) with arguments'
                    ' determined from the host (%s)',
                    servo_args,
                    servo_args_override,
            )
            servo_args = servo_args_override

    if servo_args is None:
        logging.debug('No servo_args provided, and failed to find overrides.')
        if try_lab_servo or servo_dependency:
            return None, servo_constants.SERVO_STATE_MISSING_CONFIG
        else:
            # Regular test case which does not require the servo.
            return None, None

    servo_hostname = servo_args.get(servo_constants.SERVO_HOST_ATTR)
    servo_port = servo_args.get(servo_constants.SERVO_PORT_ATTR)
    if not _is_servo_host_information_exist(servo_hostname, servo_port):
        logging.debug(
                'Servo connection info missed hostname: %s , port: %s',
                servo_hostname, servo_port)
        return None, servo_constants.SERVO_STATE_MISSING_CONFIG
    if not is_servo_host_information_valid(servo_hostname, servo_port):
        logging.debug(
                'Servo connection info is incorrect hostname: %s , port: %s',
                servo_hostname, servo_port)
        return None, servo_constants.SERVO_STATE_WRONG_CONFIG

    if try_servo_recovery == True:
        servo_args[servo_constants.SERVO_RECOVERY_MODE] = True

    newhost = ServoHost(**servo_args)
    if newhost.use_icmp and not newhost.is_up_fast(count=3):
        # ServoHost has an internal check to wait if the servo-host is in
        # the reboot process. If the servo-host is still not available,
        # this check stops further attempts as we do not have any option
        # to recover the servo_host.
        return None, servo_constants.SERVO_STATE_NO_SSH

    # Reset or reboot servo device only during AdminRepair tasks.
    if try_servo_repair:
        if newhost._is_locked:
            # Reset servo if the servo is locked, as we check if the
            # servohost is up, if the servohost is labstation and if the
            # servohost is in lab inside the locking logic.
            newhost.reset_servo()
        else:
            try:
                newhost.reboot_servo_v3_on_need()
            except Exception as e:
                logging.info('[Non-critical] Unexpected error while trying to'
                             ' reboot servo_v3, skipping the reboot; %s', e)

    if dut:
        newhost.set_dut_hostname(dut.hostname)
    if dut_host_info:
        newhost.set_dut_host_info(dut_host_info)
    if dut_health_profile and (try_lab_servo or try_servo_repair):
        try:
            if newhost.is_localhost():
                logging.info('Servohost is a localhost, skip device'
                             ' health profile setup...')
            else:
                dut_health_profile.init_profile(newhost)
                newhost.set_dut_health_profile(dut_health_profile)
        except Exception as e:
            logging.info(
                    '[Non-critical] Unexpected error while trying to'
                    ' load device health profile; %s', e)

    # Note that the logic of repair() includes everything done
    # by verify().  It's sufficient to call one or the other;
    # we don't need both.
    if servo_dependency:
        # Exceptions are deliberately not caught here: a caller with an
        # explicit servo dependency gets repair failures passed back.
        newhost.repair(silent=True)
        return newhost, newhost.get_servo_state()

    if try_servo_repair:
        try:
            newhost.repair()
        except Exception:
            logging.exception('servo repair failed for %s', newhost.hostname)
    else:
        try:
            newhost.verify()
        except Exception:
            logging.exception('servo verify failed for %s', newhost.hostname)
    return newhost, newhost.get_servo_state()
Otabek Kasimov7267a7a2020-03-04 11:18:45 -08001751
1752
Otabek Kasimova7ba91a2020-03-09 08:31:01 -07001753def _is_servo_host_information_exist(hostname, port):
Otabek Kasimov7267a7a2020-03-04 11:18:45 -08001754 if hostname is None or len(hostname.strip()) == 0:
1755 return False
Otabek Kasimova7ba91a2020-03-09 08:31:01 -07001756 if port is None:
Otabek Kasimov7267a7a2020-03-04 11:18:45 -08001757 return False
Otabek Kasimova7ba91a2020-03-09 08:31:01 -07001758 if not type(port) is int:
1759 try:
1760 int(port)
1761 except ValueError:
1762 return False
1763
Otabek Kasimov7267a7a2020-03-04 11:18:45 -08001764 return True
1765
1766
def is_servo_host_information_valid(hostname, port):
    """Check if provided servo attributes are valid.

    @param hostname Hostname of the servohost.
    @param port     servo port number.

    @returns: A bool value to indicate if provided servo attribute valid:
              both values must be present, the port must be in the range
              1..65000 and the hostname must be at least 5 characters
              made only of letters, digits, '-', '_' and '.'.
    """
    if not _is_servo_host_information_exist(hostname, port):
        return False
    # Check that the port is within the accepted range.
    port_int = int(port)
    if port_int < 1 or port_int > 65000:
        return False
    # The host is expected to contain only letters, digits, '-', '_'
    # and '.'. A raw string is used so that the backslash in the pattern
    # is not treated as an (invalid) string escape sequence.
    if not re.match(r'[a-zA-Z0-9-_\.]*$', hostname) or len(hostname) < 5:
        return False
    return True