blob: 7a4808181151d39b8b56ec3e8831a29aab8502ff [file] [log] [blame]
Derek Beckettf73baca2020-08-19 15:08:47 -07001# Lint as: python2, python3
Fang Deng5d518f42013-08-02 14:04:32 -07002# Copyright (c) 2013 The Chromium OS Authors. All rights reserved.
3# Use of this source code is governed by a BSD-style license that can be
4# found in the LICENSE file.
5#
6# Expects to be run in an environment with sudo and no interactive password
7# prompt, such as within the Chromium OS development chroot.
8
9
10"""This file provides core logic for servo verify/repair process."""
11
12
Derek Beckettf73baca2020-08-19 15:08:47 -070013from __future__ import absolute_import
14from __future__ import division
15from __future__ import print_function
16
Fang Deng5d518f42013-08-02 14:04:32 -070017import logging
Raul E Rangel52ca2e82018-07-03 14:10:14 -060018import os
Ruben Rodriguez Buchillon93084d02020-01-21 15:17:36 -080019import re
20import tarfile
Andrew McRaef0679932020-08-13 09:15:23 +100021import threading
Garry Wang2b5eef92020-08-21 16:23:35 -070022import json
Garry Wangc1288cf2019-12-17 14:58:00 -080023import time
Derek Beckettf73baca2020-08-19 15:08:47 -070024import six
25import six.moves.xmlrpc_client
Otabek Kasimov120b6fa2020-07-03 00:15:27 -070026import calendar
Fang Deng5d518f42013-08-02 14:04:32 -070027
28from autotest_lib.client.bin import utils
Garry Wang79e9af62019-06-12 15:19:19 -070029from autotest_lib.client.common_lib import error
Richard Barnette9a26ad62016-06-10 12:03:08 -070030from autotest_lib.client.common_lib import hosts
Garry Wang7b0e1b72020-03-25 19:08:59 -070031from autotest_lib.client.common_lib import lsbrelease_utils
Fang Deng5d518f42013-08-02 14:04:32 -070032from autotest_lib.client.common_lib.cros import retry
Richard Barnette9a26ad62016-06-10 12:03:08 -070033from autotest_lib.server.cros.servo import servo
Richard Barnetted31580e2018-05-14 19:58:00 +000034from autotest_lib.server.hosts import servo_repair
Garry Wangebc015b2019-06-06 17:45:06 -070035from autotest_lib.server.hosts import base_servohost
Garry Wang11b5e872020-03-11 15:14:08 -070036from autotest_lib.server.hosts import servo_constants
Otabek Kasimov4ea636e2020-04-14 23:35:06 -070037from autotest_lib.server.cros.faft.utils import config
Garry Wang11b5e872020-03-11 15:14:08 -070038from autotest_lib.client.common_lib import global_config
Otabek Kasimov8475cce2020-07-14 12:11:31 -070039from autotest_lib.site_utils.admin_audit import servo_updater
Otabek Kasimov382c3bb2020-10-28 13:22:45 -070040from autotest_lib.server.cros.servo.topology import servo_topology
Garry Wangd7367482020-02-27 13:52:40 -080041
Otabek Kasimov15963492020-06-23 21:10:51 -070042try:
Mike Frysinger714c5b02020-09-04 23:22:54 -040043 from autotest_lib.utils.frozen_chromite.lib import metrics
Otabek Kasimov15963492020-06-23 21:10:51 -070044except ImportError:
45 metrics = utils.metrics_mock
46
Dan Shi3b2adf62015-09-02 17:46:54 -070047_CONFIG = global_config.global_config
Fang Deng5d518f42013-08-02 14:04:32 -070048
Otabek Kasimova7ba91a2020-03-09 08:31:01 -070049
Garry Wangebc015b2019-06-06 17:45:06 -070050class ServoHost(base_servohost.BaseServoHost):
51 """Host class for a servo host(e.g. beaglebone, labstation)
Dana Goyette0b6e6402019-10-04 11:09:24 -070052 that with a servo instance for a specific port.
53
54 @type _servo: servo.Servo | None
55 """
Fang Deng5d518f42013-08-02 14:04:32 -070056
# Port servod listens on. Taken from the SERVOD_PORT environment variable
# when set, otherwise 9999.
DEFAULT_PORT = int(os.getenv('SERVOD_PORT', '9999'))

# Timeout for initializing servo signals.
INITIALIZE_SERVO_TIMEOUT_SECS = 60

# Default timeout for run terminal command.
DEFAULT_TERMINAL_TIMEOUT = 30

# Ready test function
SERVO_READY_METHOD = 'get_version'

# Directory prefix on the servo host where the servod logs are stored.
SERVOD_LOG_PREFIX = '/var/log/servod'

# Exit code to use when symlinks for servod logs are not found.
NO_SYMLINKS_CODE = 9

# Directory in the job's results directory to dump the logs into.
LOG_DIR = 'servod'

# Prefix for joint loglevel files in the logs.
JOINT_LOG_PREFIX = 'log'

# Regex group to extract timestamp from logfile name.
TS_GROUP = 'ts'

# This regex is used to extract the timestamp from servod logs.
# Files always start with "log." -- the dots below are escaped so that they
# only match a literal '.', not an arbitrary character.
TS_RE = (r'log\.'
         # The timestamp is of format %Y-%m-%d--%H-%M-%S.MS
         r'(?P<%s>\d{4}(\-\d{2}){2}\-(-\d{2}){3}\.\d{3})'
         # The loglevel is optional depending on labstation version.
         r'(\.(INFO|DEBUG|WARNING))?' % TS_GROUP)
TS_EXTRACTOR = re.compile(TS_RE)

# Regex group to extract MCU name from logline in servod logs.
MCU_GROUP = 'mcu'

# Regex group to extract logline from MCU logline in servod logs.
LINE_GROUP = 'line'

# This regex is used to extract the mcu and the line content from an
# MCU logline in servod logs. e.g. EC or servo_v4 console logs.
# Here is an example log-line:
#
# 2020-01-23 13:15:12,223 - servo_v4 - EC3PO.Console - DEBUG -
# console.py:219:LogConsoleOutput - /dev/pts/9 - cc polarity: cc1
#
# Here is conceptually how they are formatted:
#
#  <time> - <MCU> - EC3PO.Console - <LVL> - <file:line:func> - <pts> -
#  <output>
#
# The log format starts with a timestamp
MCU_RE = (r'[\d\-]+ [\d:,]+ '
          # The mcu that is logging this is next.
          r'- (?P<%s>\w+) - '
          # Next, we have more log outputs before the actual line.
          # Information about the file line, logging function etc.
          # Anchor on EC3PO Console, LogConsoleOutput and dev/pts.
          # NOTE: if the log format changes, this regex needs to be
          # adjusted.
          r'EC3PO\.Console[\s\-\w\d:.]+LogConsoleOutput - /dev/pts/\d+ - '
          # Lastly, we get the MCU's console line.
          r'(?P<%s>.+$)' % (MCU_GROUP, LINE_GROUP))
MCU_EXTRACTOR = re.compile(MCU_RE)

# Regex to detect timeout messages when USBC pigtail has timeout issue.
# e.g.:  [475635.427072 PD TMOUT RX 1/1]
USBC_PIGTAIL_TIMEOUT_RE = r'\[[\d \.]{1,20}(PD TMOUT RX 1\/1)\]'

# Suffix to identify compressed logfiles.
COMPRESSION_SUFFIX = '.tbz2'

# A suffix to mark servod log directories that came from instance that
# ran during this servo_host, but are not the last one running e.g. when
# an instance (on purpose, or due to a bug) restarted in the middle of the
# run.
OLD_LOG_SUFFIX = 'old'

# Mapping servo board with their vid-pid.
# NOTE(review): values are a single 'vid:pid' string except for servo_v3,
# which is a list of them -- consumers must handle both shapes.
SERVO_VID_PID = {
        'servo_v4': '18d1:501b',
        'ccd_cr50': '18d1:5014',
        'servo_micro': '18d1:501a',
        'servo_v3': ['18d1:5004', '0403:6014'],
        'c2d2': '1d81:5041',
}
145
def _init_attributes(self):
    """Reset all per-instance servo host state to its default value."""
    # Everything below starts out unset. `smart_usbhub` is the flag that
    # indicates if a servo is connected to a smart usbhub.
    # TODO(xianuowang@) remove that flag once all usbhubs in the lab
    # get replaced.
    unset_by_default = (
            '_servo_state',
            'servo_port',
            'servo_board',
            'servo_model',
            'servo_serial',
            'servo_setup',
            'servo_recovery',
            'additional_servod_args',
            '_dut_health_profile',
            'smart_usbhub',
            '_servo',
            '_topology',
            '_tunnel_proxy',
    )
    for attr_name in unset_by_default:
        setattr(self, attr_name, None)

    # Lock guarding creation of the tunnel proxy.
    self._tunnel_proxy_lock = threading.Lock()
    self._initial_instance_ts = None
    # Flag to make sure that multiple calls to close do not result in the
    # logic executing multiple times.
    self._closed = False
    # Per-thread local data
    self._local = threading.local()
Fang Deng5d518f42013-08-02 14:04:32 -0700170
def _initialize(self,
                servo_host='localhost',
                servo_port=DEFAULT_PORT,
                servo_board=None,
                servo_model=None,
                servo_serial=None,
                servo_setup=None,
                servo_recovery=None,
                additional_servod_args=None,
                is_in_lab=None,
                *args,
                **dargs):
    """Set up a ServoHost, i.e. a host that controls a servo.

    @param servo_host: Name of the host where the servod process
                       is running.
    @param servo_port: Port the servod process is listening on. Defaults
                       to the SERVOD_PORT environment variable if set,
                       otherwise 9999.
    @param servo_board: Board that the servo is connected to.
    @param servo_model: Model that the servo is connected to.
    @param servo_serial: Serial number of the servo device.
    @param servo_setup: Type of servo setup, e.g. REGULAR or DUAL_V4.
    @param servo_recovery: Stored unchanged on the instance.
                           NOTE(review): its meaning is not visible in
                           this method -- confirm against callers.
    @param additional_servod_args: Additional args that will append to
                                   servod start command.
    @param is_in_lab: True if the servo host is in Cros Lab. Default is set
                      to None, for which utils.host_is_in_lab_zone will be
                      called to check if the servo host is in Cros lab.

    """
    super(ServoHost, self)._initialize(hostname=servo_host,
                                       is_in_lab=is_in_lab, *args, **dargs)
    self._init_attributes()

    # Record the caller-supplied description of the servo.
    self.servo_port = int(servo_port)
    self.servo_board = servo_board
    self.servo_model = servo_model
    self.servo_serial = servo_serial
    self.servo_setup = servo_setup
    self.servo_recovery = servo_recovery
    self.additional_servod_args = additional_servod_args

    port_tag = str(self.servo_port)
    # The location of the log files on the servo host for this instance.
    self.remote_log_dir = '%s_%s' % (self.SERVOD_LOG_PREFIX,
                                     self.servo_port)
    # Path of the servo host lock file.
    self._lock_file = (self.TEMP_FILE_DIR + port_tag +
                       self.LOCK_FILE_POSTFIX)
    # File path to declare a reboot request.
    self._reboot_file = (self.TEMP_FILE_DIR + port_tag +
                         self.REBOOT_FILE_POSTFIX)

    # Lock the servo host if it's an in-lab labstation to prevent other
    # task to reboot it until current task completes. We also wait and
    # make sure the labstation is up here, in the case of the labstation is
    # in the middle of reboot.
    self._is_locked = False
    should_lock = (self.wait_up(self.REBOOT_TIMEOUT) and self.is_in_lab()
                   and self.is_labstation())
    if should_lock:
        self._lock()
        try:
            self.wait_ready()
        except Exception as e:
            # Best effort only: a readiness failure is logged, not raised.
            logging.info(
                    'Unexpected error while ensure labstation'
                    ' readiness; %s', str(e))

    self._repair_strategy = servo_repair.create_servo_repair_strategy()
Richard Barnettee519dcd2016-08-15 17:37:17 -0700241
def __str__(self):
    """Return `<ClassName 'hostname:servo_port'>` for this host."""
    class_name = type(self).__name__
    return "<%s '%s:%s'>" % (class_name, self.hostname, self.servo_port)
245
def connect_servo(self):
    """Prepare the servo for later use.

    Creates the servo object first, then runs the DUT-side setup that
    depends on it.
    """
    # Order matters: initialize_dut_for_servo() requires self._servo.
    self.initilize_servo()
    self.initialize_dut_for_servo()
251
def initilize_servo(self):
    """Create the servo.Servo object for this host and cache it.

    The new object is built with this host as its `servo_host` and with
    this host's servo serial, and is stored in `self._servo`.
    NOTE(review): any network verification or ssh tunnel creation would
    happen inside servo.Servo -- not visible from here.
    """
    servo_obj = servo.Servo(servo_host=self,
                            servo_serial=self.servo_serial)
    self._servo = servo_obj
Richard Barnette9a26ad62016-06-10 12:03:08 -0700261
def initialize_dut_for_servo(self):
    """Run the servo's DUT initialization under a timeout.

    This method will do some setup for dut control, e.g. setup main
    servo_v4 device, and also testing the connection between servo and
    DUT. As a side effect of testing the connection, all signals on the
    target servo are reset to default values, and the USB stick is set to
    the neutral (off) position.

    @raises AutoservVerifyError: if the servo object has not been created
            yet, or if initialization does not finish within
            INITIALIZE_SERVO_TIMEOUT_SECS.
    """
    if not self._servo:
        raise hosts.AutoservVerifyError('Servo object needs to be'
                                        ' initialized before initialize'
                                        ' DUT.')
    # retry.timeout() hands back a (timed_out, result) pair; only the
    # first element is of interest here.
    timed_out, _unused = retry.timeout(
            self._servo.initialize_dut,
            timeout_sec=self.INITIALIZE_SERVO_TIMEOUT_SECS)
    if timed_out:
        raise hosts.AutoservVerifyError('Initialize dut for servo timed'
                                        ' out.')
Richard Barnette9a26ad62016-06-10 12:03:08 -0700279
def disconnect_servo(self):
    """Drop the cached servo object, if there is one.

    When a servo was previously connected, disconnect whatever the rpc
    server tracker holds for our servo port and reset `self._servo` to
    `None`. Does nothing when no servo is cached.
    """
    if not self._servo:
        return
    # N.B. This call is safe even without a tunnel:
    # rpc_server_tracker.disconnect() silently ignores
    # unknown ports.
    self.rpc_server_tracker.disconnect(self.servo_port)
    self._servo = None
Fang Deng5d518f42013-08-02 14:04:32 -0700293
def _maybe_create_servod_ssh_tunnel_proxy(self):
    """Create the shared xmlrpc proxy for servod unless it already exists.

    The check and the creation both happen while holding
    `self._tunnel_proxy_lock`, so at most one proxy is ever stored in
    `self._tunnel_proxy`.
    """
    with self._tunnel_proxy_lock:
        if self._tunnel_proxy is not None:
            # Somebody else already created it.
            return
        tracker = self.rpc_server_tracker
        self._tunnel_proxy = tracker.xmlrpc_connect(
                None,
                self.servo_port,
                ready_test_name=self.SERVO_READY_METHOD,
                timeout_seconds=60,
                request_timeout_seconds=3600,
                server_desc=str(self))
307
def get_servod_server_proxy(self):
    """Return a proxy to servod, creating one first when needed.

    Two kinds of proxy exist: a single ssh-tunnel based proxy shared by
    the whole instance, or a plain http proxy that is kept per thread.

    @returns: An xmlrpclib.ServerProxy that is connected to the servod
              server on the host.
    """
    use_tunnel = (servo_constants.ENABLE_SSH_TUNNEL_FOR_SERVO
                  and not self.is_localhost())
    if use_tunnel:
        # Check for existing ssh tunnel proxy.
        if self._tunnel_proxy is None:
            self._maybe_create_servod_ssh_tunnel_proxy()
        return self._tunnel_proxy

    # xmlrpc/httplib is not thread-safe, so each thread must have its
    # own separate proxy connection.
    thread_state = self._local
    if not hasattr(thread_state, "_per_thread_proxy"):
        remote = 'http://%s:%s' % (self.hostname, self.servo_port)
        thread_state._per_thread_proxy = (
                six.moves.xmlrpc_client.ServerProxy(remote))
    return thread_state._per_thread_proxy
Wai-Hong Tam3a8a2552019-11-19 14:28:04 +0800329
def verify(self, silent=False):
    """Run the repair strategy's verify step and record the servo state.

    On success the servo state becomes WORKING. On failure the state is
    re-determined (unless the host is localhost) and the exception is
    re-raised only when it is a critical error.

    @param silent If true, suppress logging in `status.log`.
    """
    message = ('Beginning verify for servo host %s port %s serial %s'
               % (self.hostname, self.servo_port, self.servo_serial))
    self.record('INFO', None, None, message)
    try:
        self._repair_strategy.verify(self, silent)
        self._servo_state = servo_constants.SERVO_STATE_WORKING
        self.record('INFO', None, None,
                    'ServoHost verify set servo_state as WORKING')
    except Exception as e:
        if not self.is_localhost():
            self._servo_state = self.determine_servo_state()
            state_message = ('ServoHost verify set servo_state as %s'
                             % self._servo_state)
            self.record('INFO', None, None, state_message)
        # Non-critical failures are deliberately swallowed here.
        if self._is_critical_error(e):
            raise
Fang Deng5d518f42013-08-02 14:04:32 -0700351
def _get_default_usbkey_mount_path(self):
    """Return the usbkey mount point for this servo port."""
    mount_path = '/media/servo_usb/%s' % self.servo_port
    return mount_path
Fang Deng5d518f42013-08-02 14:04:32 -0700354
def get_image_name_from_usbkey(self, usbkey_dev):
    """Mount the usb drive and read the ChromeOS image name from it.

    This method assumes the image_usbkey_direction is already set to
    servo side. The drive is always unmounted again before returning.

    @param usbkey_dev: usbkey dev path(e.g. /dev/sdb).

    @returns: image_name on the usbkey, e.g. nami-release/R82.10138.0.0,
              or empty string if no test image detected, or unexpected
              error occurred.
    """
    logging.info('Checking ChromeOS image name on usbkey.')
    mount_point = self._get_default_usbkey_mount_path()
    # Unmount if there is an existing stale mount.
    self._unmount_drive(mount_point)
    # ChromeOS root fs is in /dev/sdx3
    rootfs_partition = usbkey_dev + '3'
    try:
        mounted = self._mount_drive(rootfs_partition, mount_point)
        if not mounted:
            logging.debug('Unexpected error occurred on mount usb drive.')
            return ''

        lsb_release = self.run(
                'cat %s/etc/lsb-release' % mount_point,
                ignore_status=True).stdout.strip()

        # Only images whose release track mentions "test" are accepted.
        is_test_image = re.search(r'RELEASE_TRACK=.*test', lsb_release)
        if is_test_image:
            return lsbrelease_utils.get_chromeos_release_builder_path(
                    lsb_release_content=lsb_release)

        logging.info('The image on usbkey is not a test image')
        return ''
    finally:
        logging.debug('Image check compeleted, unmounting the usb drive.')
        self._unmount_drive(mount_point)
Garry Wang7b0e1b72020-03-25 19:08:59 -0700390
def _extract_firmware_image_from_usbkey(self, fw_dst):
    """Unpack firmware images from the usbkey on servo into fw_dst.

    This method assumes there is already a ChromeOS test image staged on
    servo. The usbkey is unmounted again before returning.

    @param fw_dst: the path that we'll copy firmware images to.

    @returns: stdout of `chromeos-firmwareupdate --manifest`, i.e. a json
              format string of firmware manifest data.
    @raises AutoservRepairError: if the usbkey dev path could not be
            probed, or the usbkey could not be mounted.
    """
    usbkey_dev = self._probe_and_validate_usb_dev()
    if not usbkey_dev:
        raise hosts.AutoservRepairError('Unexpected error occurred when'
                ' probe usbkey dev path, please check logs for detail.')

    mount_point = self._get_default_usbkey_mount_path()
    # Unmount if there is an existing stale mount.
    self._unmount_drive(mount_point)
    # ChromeOS root fs is in /dev/sdx3
    rootfs_partition = usbkey_dev + '3'
    try:
        mounted = self._mount_drive(rootfs_partition, mount_point)
        if not mounted:
            raise hosts.AutoservRepairError('Failed to extract firmware'
                    ' image; Unable to mount %s.' % usbkey_dev,
                    'unable to mount usbkey')
        # The updater binary is run straight from the mounted image.
        updater = os.path.join(mount_point,
                               'usr/sbin/chromeos-firmwareupdate')
        self.run('%s --unpack %s' % (updater, fw_dst))
        manifest_result = self.run('%s --manifest' % updater)
        return manifest_result.stdout
    finally:
        self._unmount_drive(mount_point)
420
def prepare_repair_firmware_image(self, fw_dst=None):
    """Prepare firmware image on the servohost for auto repair process
    to consume.

    The destination directory is wiped and re-created, the firmware is
    unpacked into it from the usbkey, and the manifest entry for the DUT's
    model is used to locate the EC and BIOS images.

    @param fw_dst: the path that we want to store firmware image on
                   the servohost. Defaults to
                   /tmp/firmware_image/<servo_port>.

    @returns: A tuple (ec_image, bios_image) of firmware image paths on
              the servohost; an element is None if that type of image is
              not available based on manifest and dut's model.
    @raises AutoservRepairError: if the model is unknown, the manifest has
            no entry for the model, or neither image is available.
    """
    model = self.servo_model or self._dut_host_info.model
    if not model:
        raise hosts.AutoservRepairError(
                'Could not determine DUT\'s model.',
                'model infomation unknown')

    if not fw_dst:
        fw_dst = '/tmp/firmware_image/%s' % self.servo_port
    # Cleanup and re-create dst path to have a fresh start.
    self.run('rm -rf %s' % fw_dst)
    self.run('mkdir -p %s' % fw_dst)

    manifest = json.loads(self._extract_firmware_image_from_usbkey(fw_dst))
    # For models that have packed $MODEL_signed variant, we want use the
    # 'signed' variant once we get DVT devices, so try to read manifest
    # from $MODEL_signed first.
    build = manifest.get('%s_signed' % model) or manifest.get(model)
    if not build:
        raise hosts.AutoservRepairError('Could not find firmware manifest'
                ' for model:%s' % model, 'model manifest not found')

    def _image_path(section):
        """Return the image path for a manifest section, or None."""
        # A missing, null or non-dict section, as well as a missing, null
        # or empty image name, all mean "this image is not available";
        # none of them should surface as a KeyError/TypeError.
        section_data = build.get(section) if isinstance(build, dict) else None
        if not isinstance(section_data, dict):
            return None
        image_name = section_data.get('image')
        if not image_name:
            return None
        return os.path.join(fw_dst, image_name)

    ec_image = _image_path('ec')
    bios_image = _image_path('host')
    if not ec_image and not bios_image:
        raise hosts.AutoservRepairError('Could not find any firmware image'
                ' for model:%s' % model, 'cannot find firmware image')
    return ec_image, bios_image
Garry Wang7b0e1b72020-03-25 19:08:59 -0700464
def flash_ap_firmware_via_servo(self, image):
    """Flash AP firmware from the provided image.

    This is a short term enhancement for infra repair use. It uses
    'futility update', which will automatically determine various
    parameters needed for flashrom, and will preserve the GBB, VPD, and
    HWID for AP firmware update.
    @TODO(xianuowang@) Remove this method once b/148403277 implemented.

    @param image: the firmware image path on servohost.
    """
    flash_cmd = ('futility update -i %s --servo_port=%s'
                 % (image, self.servo_port))
    # The command is given up to 900 seconds to complete.
    self.run(flash_cmd, timeout=900)
478
def _probe_and_validate_usb_dev(self):
    """Probe the usb dev path through servo and validate it with fdisk.

    Possible outcomes:
        1. An error occurs while probing the usb dev (or fdisk times
           out): returns empty string.
        2. Probing completes without error but finds no usb dev:
           raises AutoservRepairError.
        3. Probing finds a usb dev path, but fdisk on the servohost does
           not accept it: raises AutoservRepairError.

    @returns: A string of usb dev path(e.g. '/dev/sdb'), or empty string
              if unexpected error occurred during probe.
    @raises: AutoservRepairError if servo couldn't probe the usb dev path
             (servo.probe_host_usb_dev() returns empty string), or the dev
             path is not valid block device to servohost.
    """
    logging.info('Validating image usbkey on servo.')
    try:
        usb_dev = self._servo.probe_host_usb_dev()
    except Exception as e:
        # We don't want any unexpected or transient servo communicating
        # failure block usb repair, so capture all errors here.
        logging.error(e, exc_info=True)
        logging.error('Unexpected error occurred on get usbkey dev path,'
                      ' skipping usbkey validation.')
        return ''

    if usb_dev:
        # probe_host_usb_dev() sometimes return stale record,
        # so we need to make sure the path exists in fdisk.
        fdisk_cmd = 'fdisk -l %s' % usb_dev
        try:
            fdisk_result = self.run(fdisk_cmd, ignore_status=True,
                                    timeout=30)
            if fdisk_result.exit_status == 0:
                return usb_dev
            logging.error('%s is reported from "image_usbkey_dev" control'
                          ' but not detected by fdisk!', usb_dev)
        except error.AutoservRunError as e:
            # Only a timeout is tolerated; anything else propagates.
            if 'Timeout encountered' not in str(e):
                raise
            logging.warning('Timeout encountered during fdisk run,'
                            ' skipping usbkey validation.')
            return ''

    # Reached when nothing was probed or fdisk rejected the path.
    raise hosts.AutoservRepairError(
            'No usbkey detected on servo, the usbkey may be either missing'
            ' or broken. Please replace usbkey on the servo and retry.',
            'missing usbkey')
527
def is_ec_supported(self):
    """Check if ec is supported on the servo_board.

    @returns: the `chrome_ec` value of the firmware config for this
              board/model; False when the board is unknown or the config
              could not be read.
    """
    if not self.servo_board:
        return False
    try:
        fw_config = config.Config(self.servo_board, self.servo_model)
        return fw_config.chrome_ec
    except Exception as e:
        # Any failure to read the config counts as "not supported".
        logging.error('Unexpected error when read from firmware'
                      ' configs; %s', str(e))
    return False
538
def validate_image_usbkey(self):
    """Validate the recovery usbkey and report the image found on it.

    First validates that there is a recovery usbkey on servo that is
    accessible to the servohost, then checks if a ChromeOS image is
    already on the usb drive and returns its image_name, so that an
    unnecessary download and flash to the usbkey can be avoided.

    Please note the special error handling logic here:
    1. If unexpected error happens, we return empty string. So repair
       actions will not get blocked.
    2. If no working usbkey present on servo, but no errors, the
       AutoservRepairError raised by the probe propagates.

    @returns: image_name on the usbkey, e.g. nami-release/R82.10138.0.0,
              or empty string if no test image detected, or unexpected
              error occurred.
    @raises:  AutoservRepairError if the usbkey is not detected on servo.
    """
    usb_dev = self._probe_and_validate_usb_dev()
    if not usb_dev:
        return ''
    return self.get_image_name_from_usbkey(usb_dev)
Garry Wang7b0e1b72020-03-25 19:08:59 -0700561
def repair(self, silent=False):
    """Attempt to repair servo host and record the resulting servo state.

    On success the servo state becomes WORKING and, for a labstation, any
    reboot request created by this servo is withdrawn. On failure the
    state is re-determined (unless the host is localhost); for a critical
    error the servo is disconnected, servod is stopped and the exception
    is re-raised.

    @param silent If true, suppress logging in `status.log`.
    """
    message = ('Beginning repair for servo host %s port %s serial %s'
               % (self.hostname, self.servo_port, self.servo_serial))
    self.record('INFO', None, None, message)
    try:
        self._repair_strategy.repair(self, silent)
        self._servo_state = servo_constants.SERVO_STATE_WORKING
        self.record('INFO', None, None,
                    'ServoHost repair set servo_state as WORKING')
        # If target is a labstation then try to withdraw any existing
        # reboot request created by this servo because it passed repair.
        if self.is_labstation():
            self.withdraw_reboot_request()
    except Exception as e:
        if not self.is_localhost():
            self._servo_state = self.determine_servo_state()
            state_message = ('ServoHost repair set servo_state as %s'
                             % self._servo_state)
            self.record('INFO', None, None, state_message)
        # Non-critical failures are deliberately swallowed here.
        if self._is_critical_error(e):
            self.disconnect_servo()
            self.stop_servod()
            raise
589
def _is_critical_error(self, error):
    """Tell whether a verify/repair failure is critical, and log about it.

    @param error: the exception raised by verify/repair.

    @returns: False only for an AutoservVerifyDependencyError whose
              is_critical() is false; True for every other exception.
    """
    non_critical = (isinstance(error, hosts.AutoservVerifyDependencyError)
                    and not error.is_critical())
    if not non_critical:
        logging.info(
                'Critical verify failure(s) detected during repair/verify '
                'servo. Disconnecting servo and running `stop servod`, all'
                ' repair actions and tests that depends on servo will not '
                'run.')
        return True

    logging.warning('Non-critical verify failure(s) detected during'
                    ' verify/repair servo, servo connection will'
                    ' still be up but may not be fully functional.'
                    ' Some repair actions and servo dependent'
                    ' tests may not run.')
    return False
Fang Deng5d518f42013-08-02 14:04:32 -0700605
def get_servo(self):
    """Return the servo object cached on this host.

    @return: the cached servo.Servo object; None when no servo is
             currently cached.
    @rtype: autotest_lib.server.cros.servo.servo.Servo
    """
    cached_servo = self._servo
    return cached_servo
613
def request_reboot(self):
    """Request a servohost reboot by touching the reboot flag file.

    The command is run with ignore_status=True, so a non-zero exit of
    `touch` does not raise.
    """
    logging.debug('Request to reboot servohost %s has been created by '
                  'servo with port # %s', self.hostname, self.servo_port)
    touch_cmd = 'touch %s' % self._reboot_file
    self.run(touch_cmd, ignore_status=True)
620
def withdraw_reboot_request(self):
    """Withdraw a pending servohost reboot request, if there is one.

    Removes the reboot flag file with `rm -f`; the command is run with
    ignore_status=True, so a non-zero exit does not raise.
    """
    logging.debug('Withdrawing request to reboot servohost %s that created'
                  ' by servo with port # %s if exists.',
                  self.hostname, self.servo_port)
    remove_cmd = 'rm -f %s' % self._reboot_file
    self.run(remove_cmd, ignore_status=True)
629
def start_servod(self, quick_startup=False):
    """Start the servod process on servohost.

    Assembles the `start servod` command from the servo attributes of this
    host, runs it, waits for servod to come up and then caches the log
    timestamp of the freshly started instance.

    @param quick_startup: bool, wait SERVOD_QUICK_STARTUP_TIMEOUT instead
                          of SERVOD_STARTUP_TIMEOUT after the launch.
    """
    # Skip if running on the localhost.(crbug.com/1038168)
    if self.is_localhost():
        logging.debug("Servohost is a localhost, skipping start servod.")
        return

    args = ['start servod']
    if not self.servo_board:
        logging.warning('Board for DUT is unknown; starting servod'
                        ' assuming a pre-configured board.')
    else:
        args.append('BOARD=%s' % self.servo_board)
        # The model is only passed along together with a board.
        if self.servo_model:
            args.append('MODEL=%s' % self.servo_model)

    args.append('PORT=%d' % self.servo_port)
    if self.servo_serial:
        args.append('SERIAL=%s' % self.servo_serial)

    # Start servod with dual_v4 based on servo_setup.
    if self.is_dual_setup():
        args.append('DUAL_V4=1')

    # Start servod with CONFIG=cr50.xml which required for some pools.
    if self._require_cr50_servod_config():
        args.append('CONFIG=cr50.xml')

    if self.servo_recovery == True:
        args.append('REC_MODE=1')

    # Adding customized args if any.
    if self.additional_servod_args:
        args.append(self.additional_servod_args)

    # Remove the symbolic links from the logs. This helps ensure that
    # a failed servod instantiation does not cause us to grab old logs
    # by mistake.
    self.remove_latest_log_symlinks()
    self.run(' '.join(args), timeout=60)

    # There's a lag between when `start servod` completes and when
    # the _ServodConnectionVerifier trigger can actually succeed.
    # The call to time.sleep() below gives time to make sure that
    # the trigger won't fail after we return.

    # Normally servod on servo_v3 and labstation take ~10 seconds to ready,
    # But in the rare case all servo on a labstation are in heavy use they
    # may take ~30 seconds. So the timeout value will double these value,
    # and we'll try quick start up when first time initialize servohost,
    # and use standard start up timeout in repair.
    startup_wait = (servo_constants.SERVOD_QUICK_STARTUP_TIMEOUT
                    if quick_startup
                    else servo_constants.SERVOD_STARTUP_TIMEOUT)
    logging.debug('Wait %s seconds for servod process fully up.',
                  startup_wait)
    time.sleep(startup_wait)
    # Cache the initial instance timestamp to check against servod restarts
    self._initial_instance_ts = self.get_instance_logs_ts()
Garry Wangc1288cf2019-12-17 14:58:00 -0800690
def stop_servod(self):
    """Stop the servod process on servohost.

    Runs `stop servod` for this host's servo port (failures of the command
    are ignored) and then sleeps SERVOD_TEARDOWN_TIMEOUT seconds. Does
    nothing when the servohost is a localhost.
    """
    # Skip if running on the localhost.(crbug.com/1038168)
    if self.is_localhost():
        logging.debug("Servohost is a localhost, skipping stop servod.")
        return

    logging.debug('Stopping servod on port %s', self.servo_port)
    stop_cmd = 'stop servod PORT=%d' % self.servo_port
    self.run(stop_cmd, timeout=60, ignore_status=True)
    teardown_wait = servo_constants.SERVOD_TEARDOWN_TIMEOUT
    logging.debug('Wait %s seconds for servod process fully teardown.',
                  teardown_wait)
    time.sleep(teardown_wait)
Garry Wangc1288cf2019-12-17 14:58:00 -0800705
def restart_servod(self, quick_startup=False):
    """Restart servod on servohost: stop it first, then start it again.

    @param quick_startup: bool, forwarded unchanged to start_servod().
    """
    self.stop_servod()
    self.start_servod(quick_startup)
711
def _process_servodtool_error(self, response):
    """Log the reason behind a non-zero servodtool response.

    @param response: result object of the failed command; only its
                     |stdout| is inspected.
    """
    output = response.stdout
    if re.search(servo_constants.ERROR_MESSAGE_USB_HUB_NOT_COMPATIBLE,
                 output):
        logging.error('The servo is not plugged on a usb hub that supports'
                      ' power-cycle!')
        # change the flag so we can update this label in later process.
        self.smart_usbhub = False
    elif re.search(servo_constants.ERROR_MESSAGE_DEVICE_NOT_FOUND %
                   self.servo_serial, output):
        logging.error('No servo with serial %s found!', self.servo_serial)
    else:
        logging.error('Unexpected error occurred from usbhub control, please'
                      ' file a bug and inform chrome-fleet-software@ team!')
730
def get_main_servo_usb_path(self):
    """Collect the current usb-path of the main servo device.

    The usb-path is path to the folder where usb-device was enumerated.
    An empty string ('') is returned when the path cannot be obtained.

    @returns: string, usb-path to the main servo device.
        e.g.: '/sys/bus/usb/devices/1-6.1.3.1'
    """
    # TODO remove try-except when fix crbug.com/1087964
    try:
        query = 'servodtool device -s %s usb-path' % self.servo_serial
        resp = self.run(query, ignore_status=True, timeout=30)
    except Exception as e:
        # Here we catch only timeout errors.
        # Other errors is filtered by ignore_status=True
        logging.debug('Attempt to get servo usb-path failed due to '
                      'timeout; %s', e)
        return ''
    if resp.exit_status == 0:
        usb_path = resp.stdout.strip()
        logging.info('Usb path of servo %s is %s', self.servo_serial,
                     usb_path)
        return usb_path
    self._process_servodtool_error(resp)
    return ''
Garry Wangffbd2162020-04-17 16:13:48 -0700756
def _get_servo_usb_devnum(self):
    """Collect the current usb devnum of the servo.

    @returns: string, stripped content of the |devnum| file under the
              servo usb-path, or '' when the usb-path is unknown or the
              file cannot be read.
    """
    usb_path = self.get_main_servo_usb_path()
    if usb_path:
        resp = self.run('cat %s/devnum' % usb_path, ignore_status=True)
        if resp.exit_status == 0:
            return resp.stdout.strip()
        self._process_servodtool_error(resp)
    return ''
767
def reboot_servo_v3_on_need(self):
    """Reboot servo_v3 when one of the conditions below holds.

    1. If there is an update pending on reboot.
    2. Servo_v3 has been up for more than 96 hours.

    Nothing is done for boards other than 'beaglebone_servo'. A failing
    reboot is logged and recorded, not raised.
    """
    if self.get_board() != 'beaglebone_servo':
        logging.info('Servo reboot is only applicable for servo V3.')
        return

    update_pending_reboot = (self._check_update_status() ==
                             self.UPDATE_STATE.PENDING_REBOOT)
    uptime_hours = float(self.check_uptime())/3600
    logging.info('Uptime of servo_v3: %s hour(s)', uptime_hours)
    long_up_time = uptime_hours > 96

    # A pending update takes precedence over the uptime condition.
    if update_pending_reboot:
        message = 'Starting reboot servo_v3 because an update is pending.'
        reboot_method = self._post_update_reboot
    elif long_up_time:
        message = 'Starting reboot servo_v3 because uptime > 96 hours.'
        reboot_method = self._servo_host_reboot
    else:
        # Skip reboot if neither condition are met.
        return

    self.record('INFO', None, None, message)
    logging.info(message)
    try:
        reboot_method()
    except Exception as e:
        logging.debug("Fail to reboot servo_v3; %s", e)
        message = ('Servo_v3 reboot failed, please check debug log '
                   'for details.')
    else:
        message = 'Servo_v3 reboot completed successfully.'
    logging.info(message)
    self.record('INFO', None, None, message)
Garry Wangffbd2162020-04-17 16:13:48 -0700804
def _reset_servo(self):
    """Power-cycle the servo through the smart usbhub.

    @returns: True if the power-cycle command exited with status 0 (after
              waiting SERVO_RESET_TIMEOUT_SECONDS for the servo to come
              back), False if it failed or raised.
    """
    logging.info('Resetting servo through smart usbhub.')
    # TODO remove try-except when fix crbug.com/1087964
    try:
        power_cycle_cmd = ('servodtool device -s %s power-cycle' %
                           self.servo_serial)
        resp = self.run(power_cycle_cmd, ignore_status=True, timeout=30)
        if resp.exit_status != 0:
            self._process_servodtool_error(resp)
            return False
    except Exception as e:
        # Here we catch only timeout errors.
        # Other errors is filtered by ignore_status=True
        logging.debug('Attempt to reset servo failed due to timeout;'
                      ' %s', e)
        return False

    reset_wait = servo_constants.SERVO_RESET_TIMEOUT_SECONDS
    logging.debug('Wait %s seconds for servo to come back from reset.',
                  reset_wait)
    time.sleep(reset_wait)
    # change the flag so we can update this label in later process.
    self.smart_usbhub = True
    return True
828
def reset_servo(self):
    """Reset(power-cycle) the servo via smart usbhub.

    Only attempted when this host is a labstation. The usb devnum of the
    servo is read before and after the reset and the outcome is logged
    and recorded; nothing is returned or raised based on that outcome.
    """
    if not self.is_labstation():
        logging.info('Servo reset is not applicable to servo_v3.')
        return

    pre_reset_devnum = self._get_servo_usb_devnum()
    logging.info('Servo usb devnum before reset: %s', pre_reset_devnum)
    if not self._reset_servo():
        message = ('Failed to reset servo with serial: %s. (Please ignore'
                   ' this error if the DUT is not connected to a smart'
                   ' usbhub).' % self.servo_serial)
        logging.warning(message)
        self.record('INFO', None, None, message)
        return

    post_reset_devnum = self._get_servo_usb_devnum()
    logging.info('Servo usb devnum after reset: %s', post_reset_devnum)
    if pre_reset_devnum and post_reset_devnum:
        if pre_reset_devnum != post_reset_devnum:
            message = ('Reset servo with serial %s completed successfully!'
                       % self.servo_serial)
        else:
            message = ('Servo reset completed but devnum is still not '
                       'changed!')
    else:
        # At least one of the two devnum reads came back empty.
        message = ('Servo reset completed but unable to verify'
                   ' devnum change!')
    logging.info(message)
    self.record('INFO', None, None, message)
859
def _extract_compressed_logs(self, logdir, relevant_files):
    """Decompress servod logs in |logdir|.

    Every file in |relevant_files| that ends with |COMPRESSION_SUFFIX| is
    opened as a tar archive, its first member is extracted into |logdir|
    under the archive's basename without the suffix, and the archive is
    deleted. An archive without any member is deleted without producing
    an extracted file.

    @param logdir: directory containing compressed servod logs.
    @param relevant_files: list of files in |logdir| to consider.

    @returns: tuple, (tarfiles, files) where
              tarfiles: list of the compressed filenames that have been
                        extracted and deleted
              files:  list of the uncompressed files that were generated
    """
    suffix = self.COMPRESSION_SUFFIX
    # For all tar-files, first extract them to the directory, and
    # then let the common flow handle them.
    tarfiles = [cf for cf in relevant_files if cf.endswith(suffix)]
    files = []
    for archive in tarfiles:
        norm_name = os.path.basename(archive)[:-len(suffix)]
        with tarfile.open(archive) as tf:
            # Each tarfile has only one member, as that's the compressed
            # log. Go through the public getmembers() API and tolerate an
            # archive with no member instead of failing with IndexError.
            members = tf.getmembers()
            if members:
                member = members[0]
                # Manipulate so that it only extracts the basename, and
                # not the directories etc.
                member.name = norm_name
                files.append(os.path.join(logdir, member.name))
                tf.extract(member, logdir)
            else:
                logging.warning('Compressed servod log %r has no members. '
                                'Skipping.', archive)
        # File has been processed: remove the compressed file.
        os.remove(archive)
    return tarfiles, files
890
def _extract_mcu_logs(self, log_subdir):
    """Extract MCU (EC, Cr50, etc) console output from servod debug logs.

    Using the MCU_EXTRACTOR regex extract and split out MCU console
    lines from the logs to generate individual console logs e.g. after
    this method, you can find an ec.txt and servo_v4.txt in |log_subdir|
    if those MCUs had any console input/output.

    Lines are appended to '<mcu>.txt' (mcu name lower-cased). Nothing is
    done when |log_subdir| has no log.DEBUG.txt.

    @param log_subdir: directory with log.DEBUG.txt main servod debug logs.
    """
    # Extract the MCU for each one. The MCU logs are only in the .DEBUG
    # files
    mcu_lines_file = os.path.join(log_subdir, 'log.DEBUG.txt')
    if not os.path.exists(mcu_lines_file):
        logging.info('No DEBUG logs found to extract MCU logs from.')
        return
    mcu_files = {}
    mcu_file_template = '%s.txt'
    try:
        with open(mcu_lines_file, 'r') as f:
            for line in f:
                match = self.MCU_EXTRACTOR.match(line)
                if not match:
                    continue
                mcu = match.group(self.MCU_GROUP).lower()
                if mcu not in mcu_files:
                    mcu_file = os.path.join(log_subdir,
                                            mcu_file_template % mcu)
                    mcu_files[mcu] = open(mcu_file, 'a')
                mcu_files[mcu].write(match.group(self.LINE_GROUP) + '\n')
    finally:
        # Close every per-MCU file even if reading or writing failed
        # part-way, so no file handle is leaked.
        for fd in mcu_files.values():
            fd.close()
923
def remove_latest_log_symlinks(self):
    """Remove the convenience 'latest' symlinks of the servod logs.

    Runs `rm` on everything matching 'latest*' in |remote_log_dir|; the
    exit status of the command is ignored.
    """
    rm_cmd = 'rm %s/latest*' % self.remote_log_dir
    self.run(rm_cmd, stderr_tee=None, ignore_status=True)
929
def probe_servod_restart(self, instance_ts, outdir):
    """Grab servod logs from previous instances if part of this session.

    If since the last time this host called start_servod() servod crashed
    and restarted, this helper finds those logs as well, and stores them
    with the |OLD_LOG_SUFFIX| to investigate if necessary.

    It also issues a panicinfo command to servo devices after the restart
    to try and collect reboot information for debugging.

    @param instance_ts: the log timestamp that the current instance uses
    @param outdir: directory to create a subdirectory into to place the
                   servod logs into.
    """
    first_ts = self._initial_instance_ts
    if first_ts is None:
        logging.info('No log timestamp grabbed successfully on servod '
                     'startup. Cannot check device restarts. Ignoring.')
        return
    if instance_ts == first_ts:
        logging.debug('Servod appears to have run without restarting')
        return
    # Servod seems to have restarted (at least once). |_initial_instance_ts|
    # is the first timestamp, and instance_ts is the current timestamp. Find
    # all timestamps in between them, and grab the logs for each.
    tss = self._find_instance_timestamps_between(first_ts, instance_ts)
    logging.info('Servod has restarted %d times between the start and the '
                 'end of this servo_host.', len(tss))
    logging.info('This might be an issue. Will extract all logs from each '
                 'instance.')
    logging.info('Logs that are not the currently running (about to turn '
                 'down) instance are maked with a .%s in their folder.',
                 self.OLD_LOG_SUFFIX)
    for old_ts in tss:
        self.get_instance_logs(old_ts, outdir, old=True)
    # Lastly, servod has restarted due to a potential issue. Try to get
    # panic information from servo micro and servo v4 for the current logs.
    # This can only happen if the |_servo| attribute is initialized.
    if not self._servo:
        return
    for mcu in ['servo_micro', 'servo_v4']:
        ctrl = '%s_uart_cmd' % mcu
        if not self._servo.has_control(ctrl):
            continue
        logging.info('Trying to retrieve %r panicinfo into logs', mcu)
        try:
            self._servo.set_nocheck(ctrl, 'panicinfo')
        except error.TestFail as e:
            logging.error('Failed to generate panicinfo for %r '
                          'logs. %s', mcu, str(e))
979
def _find_instance_timestamps_between(self, start_ts, end_ts):
    """Find all log timestamps between [start_ts, end_ts).

    @param start_ts: str, earliest log timestamp of interest
    @param end_ts: str, latest log timestamp of interest

    @returns: list, all timestamps between start_ts and end_ts, end_ts
              exclusive, on the servo_host. An empty list on errors
    """
    # Simply get all timestamp, and then sort and remove
    listing = self.run('ls %s' % self.remote_log_dir, stderr_tee=None,
                       ignore_status=True)
    if listing.exit_status != 0:
        # Here we failed to find anything.
        logging.info('Failed to find remote servod logs. Ignoring.')
        return []
    # Files that fail the regex are simply ignored. It might be the
    # 'latest' symlinks or random files.
    matches = [self.TS_EXTRACTOR.match(name)
               for name in listing.stdout.strip().split()]
    # The set drops duplicates, sorted() puts the unique timestamps in order.
    timestamps = sorted({m.group(self.TS_GROUP) for m in matches if m})
    for ts in (start_ts, end_ts):
        if ts not in timestamps:
            logging.error('Timestamp %r not in servod logs. Cannot query '
                          'for timestamps in between %r and %r', ts,
                          start_ts, end_ts)
            return []
    first = timestamps.index(start_ts)
    last = timestamps.index(end_ts)
    return timestamps[first:last]
1014
def get_instance_logs_ts(self):
    """Retrieve the currently running servod instance's log timestamp

    @returns: str, timestamp for current instance, or None on failure
    """
    # First, extract the timestamp. This cmd gives the real filename of
    # the latest aka current log file.
    cmd_template = ('if [ -f %(dir)s/latest.DEBUG ];'
                    'then realpath %(dir)s/latest.DEBUG;'
                    'elif [ -f %(dir)s/latest ];'
                    'then realpath %(dir)s/latest;'
                    'else exit %(code)d;'
                    'fi')
    cmd = cmd_template % {'dir': self.remote_log_dir,
                          'code': self.NO_SYMLINKS_CODE}
    res = self.run(cmd, stderr_tee=None, ignore_status=True)
    if res.exit_status == self.NO_SYMLINKS_CODE and res.exit_status != 0:
        logging.warning('servod log latest symlinks not found. '
                        'This is likely due to an error starting up '
                        'servod. Ignoring..')
        return None
    if res.exit_status != 0:
        logging.warning('Failed to find servod logs on servo host.')
        logging.warning(res.stderr.strip())
        return None
    fname = os.path.basename(res.stdout.strip())
    # From the fname, ought to extract the timestamp using the TS_EXTRACTOR
    ts_match = self.TS_EXTRACTOR.match(fname)
    if ts_match:
        return ts_match.group(self.TS_GROUP)
    logging.warning('Failed to extract timestamp from servod log file '
                    '%r. Skipping. The servo host is using outdated '
                    'servod logging and needs to be updated.', fname)
    return None
1048
def get_instance_logs(self, instance_ts, outdir, old=False):
    """Collect all logs with |instance_ts| and dump into a dir in |outdir|

    This method first collects all logs on the servo_host side pertaining
    to this servod instance (port, instatiation). It glues them together
    into combined log.[level].txt files and extracts all available MCU
    console I/O from the logs into individual files e.g. servo_v4.txt

    All the output can be found in a directory inside |outdir| that
    this generates based on |LOG_DIR|, the servod port, and the instance
    timestamp on the servo_host side.

    @param instance_ts: log timestamp to grab logfiles for
    @param outdir: directory to create a subdirectory into to place the
                   servod logs into.
    @param old: bool, whether to append |OLD_LOG_SUFFIX| to output dir
    """
    # Create the local results log dir.
    dir_name = '%s_%s.%s' % (self.LOG_DIR, str(self.servo_port),
                             instance_ts)
    log_dir = os.path.join(outdir, dir_name)
    if old:
        log_dir = '%s.%s' % (log_dir, self.OLD_LOG_SUFFIX)
    logging.info('Saving servod logs to %r.', log_dir)
    os.mkdir(log_dir)
    # Now, get all files with that timestamp.
    find_cmd = 'find %s -maxdepth 1 -name "log.%s*"' % (self.remote_log_dir,
                                                        instance_ts)
    res = self.run(find_cmd, stderr_tee=None, ignore_status=True)
    remote_files = res.stdout.strip().split()
    try:
        self.get_file(remote_files, log_dir, try_rsync=False)
        if not os.listdir(log_dir):
            logging.info('No servod logs retrieved. Ignoring, and removing '
                         '%r again.', log_dir)
            os.rmdir(log_dir)
            return
    except error.AutoservRunError as e:
        result = e.result_obj
        if result.exit_status != 0:
            stderr = result.stderr.strip()
            logging.warning("Couldn't retrieve servod logs. Ignoring: %s",
                            stderr or '\n%s' % result)
        # Remove the log_dir as nothing was added to it.
        os.rmdir(log_dir)
        return
    local_files = [os.path.join(log_dir, name)
                   for name in os.listdir(log_dir)]
    # TODO(crrev.com/c/1793030): remove no-level case once CL is pushed
    for level_name in ('DEBUG', 'INFO', 'WARNING', ''):
        # Create the joint files for each loglevel. i.e log.DEBUG
        # The .txt suffix helps with some online tools to avoid complaints
        # about an unknown filetype.
        if level_name:
            joint_file = '%s.%s.txt' % (self.JOINT_LOG_PREFIX, level_name)
        else:
            joint_file = self.JOINT_LOG_PREFIX + '.txt'
        joint_path = os.path.join(log_dir, joint_file)
        files = [path for path in local_files if level_name in path]
        if not files:
            # TODO(crrev.com/c/1793030): remove no-level case once CL
            # is pushed
            continue
        # Extract compressed logs if any.
        compressed, extracted = self._extract_compressed_logs(log_dir,
                                                              files)
        files = list(set(files) - set(compressed))
        files.extend(extracted)

        # Need to sort. As they all share the same timestamp, and
        # loglevel, the index itself is sufficient. The highest index
        # is the oldest file, therefore we need a descending sort.
        def sortkey(f, level=level_name):
            """Custom sortkey to sort based on rotation number int."""
            if f.endswith(level):
                return 0
            return int(f.split('.')[-1])

        files.sort(reverse=True, key=sortkey)
        oldest, newer_files = files[0], files[1:]
        # Just rename the first file rather than building from scratch.
        os.rename(oldest, joint_path)
        with open(joint_path, 'a') as joint_f:
            for logfile in newer_files:
                # Transfer the file to the joint file line by line.
                with open(logfile, 'r') as log_f:
                    joint_f.writelines(log_f)
                # File has been written over. Delete safely.
                os.remove(logfile)
        # Need to remove all files form |local_files| so we don't
        # analyze them again.
        local_files = list(set(local_files) - set(files) - set(compressed))
    # Lastly, extract MCU logs from the joint logs.
    self._extract_mcu_logs(log_dir)
1140
def _lock(self):
    """Lock the servohost by touching the lock file.

    The exit status of `touch` is ignored; |_is_locked| is set to True
    once the command has been issued.
    """
    logging.debug('Locking servohost %s by touching %s file',
                  self.hostname, self._lock_file)
    touch_cmd = 'touch %s' % self._lock_file
    self.run(touch_cmd, ignore_status=True)
    self._is_locked = True
Garry Wang79e9af62019-06-12 15:19:19 -07001148
def _unlock(self):
    """Unlock the servohost by removing the lock file.

    The exit status of `rm` is ignored; |_is_locked| is set to False once
    the command has been issued.
    """
    logging.debug('Unlocking servohost by removing %s file',
                  self._lock_file)
    remove_cmd = 'rm %s' % self._lock_file
    self.run(remove_cmd, ignore_status=True)
    self._is_locked = False
Garry Wang79e9af62019-06-12 15:19:19 -07001156
def close(self):
    """Close the associated servo and the host object.

    When the servohost is reachable this also collects the servod logs
    (including those of earlier instances if servod restarted), removes
    the servohost lock if it was taken and stops servod. Calling it again
    after a successful close is a no-op.
    """
    # NOTE: throughout this method there are multiple attempts to catch
    # all errors. This is WAI as log grabbing should not fail tests.
    # However, the goal is to catch and handle/process all errors, thus
    # we print the traceback and ask for a bug.
    if self._closed:
        logging.debug('ServoHost is already closed.')
        return

    # Only attempt ssh related actions if servohost is sshable. We call
    # check_cached_up_status() first because it's lightweighted and return
    # much faster in the case servohost is down, however, we still want
    # to call is_up() later since check_cached_up_status() is ping based check
    # and not guarantee the servohost is sshable.
    servo_host_ready = self.check_cached_up_status() and self.is_up()

    instance_ts = None
    if servo_host_ready:
        instance_ts = self.get_instance_logs_ts()
    else:
        logging.info('Servohost is down, will skip servod log collecting.')
    # TODO(crbug.com/1011516): once enabled, remove the check against
    # localhost and instead check against log-rotiation enablement.
    logs_available = (instance_ts is not None and
                      self.job and
                      not self.is_localhost())
    if logs_available:
        # Probe whether there was a servod restart, and grab those old
        # logs as well.
        try:
            self.probe_servod_restart(instance_ts, self.job.resultdir)
        except (error.AutoservRunError, error.TestFail) as e:
            logging.info('Failed to grab servo logs due to: %s. '
                         'This error is forgiven.', str(e))
        except Exception as e:
            logging.error('Unexpected error probing for old logs. %s. '
                          'Forgiven. Please file a bug and fix or catch '
                          'in log probing function', str(e),
                          exc_info=True)
    if self._servo:
        # In some cases when we run as lab-tools, the job object is None.
        outdir = self.job.resultdir if self.job else None
        self._servo.close(outdir)

    if logs_available:
        # Grab current (not old like above) logs after the servo instance
        # was closed out.
        try:
            self.get_instance_logs(instance_ts, self.job.resultdir)
        except error.AutoservRunError as e:
            logging.info('Failed to grab servo logs due to: %s. '
                         'This error is forgiven.', str(e))
        except Exception as e:
            logging.error('Unexpected error grabbing servod logs. %s. '
                          'Forgiven. Please file a bug and fix or catch '
                          'in log grabbing function', str(e), exc_info=True)

    if self._is_locked and servo_host_ready:
        # Remove the lock if the servohost has been locked.
        try:
            self._unlock()
        except error.AutoservSSHTimeout:
            logging.error('Unlock servohost failed due to ssh timeout.'
                          ' It may caused by servohost went down during'
                          ' the task.')
    # We want always stop servod after task to minimum the impact of bad
    # servod process interfere other servods.(see crbug.com/1028665)
    if servo_host_ready:
        try:
            self.stop_servod()
        except error.AutoservRunError as e:
            logging.info(
                    "Failed to stop servod due to:\n%s\n"
                    "This error is forgiven.", str(e))

    super(ServoHost, self).close()
    # Mark closed.
    self._closed = True
Congbin Guoa1f9cba2018-07-03 11:36:59 -07001236
def get_servo_state(self):
    """Return the servo state currently stored in |_servo_state|."""
    current_state = self._servo_state
    return current_state
Otabek Kasimovcc9738e2020-02-14 16:17:15 -08001239
def _get_host_metrics_data(self):
    """Build the field dict attached to metrics reported for this host.

    @returns: dict with 'port' (the servo port), 'host' (the DUT hostname
              if there is one, else this host's hostname) and 'board'
              (the servo board, or '' when it is not set).
    """
    data = {'port': self.servo_port}
    data['host'] = self.get_dut_hostname() or self.hostname
    data['board'] = self.servo_board or ''
    return data
1244
def _is_servo_device_connected(self, servo_type, serial):
    """Check if device is connected to the labstation.

    Works for all servo devices connected to the labstation.
    For servo_v3 please use 'self._is_servo_board_present_on_servo_v3'

    @param servo_type: The type of servo device. Expecting value can be
                       servo_v4 or servo_micro.
    @param serial: The serial number of the device to detect it.

    @returns: True if lsusb lists a device with the VID/PID of
              |servo_type| and the given serial, False if it does not or
              if the VID/PID or serial is missing, None if the check
              itself raised.
    """
    vid_pid = self.SERVO_VID_PID.get(servo_type)
    if not (vid_pid and serial):
        # device cannot detected without VID/PID or serial number
        return False
    logging.debug('Started to detect %s', servo_type)
    try:
        lsusb_cmd = 'lsusb -v -d %s |grep iSerial |grep %s' % (vid_pid,
                                                               serial)
        result = self.run(lsusb_cmd, ignore_status=True, timeout=30)
        found = result.exit_status == 0 and result.stdout.strip()
        if not found:
            logging.debug('%s device is not detected; %s', servo_type,
                          result)
            return False
        logging.debug('The %s is plugged in to the host.', servo_type)
        return True
    except Exception as e:
        # can be triggered by timeout issue due running the script
        metrics.Counter(
            'chromeos/autotest/repair/servo_detection/timeout'
            ).increment(fields=self._get_host_metrics_data())
        logging.error('%s device is not detected; %s', servo_type, str(e))
    return None
1275
1276 def _is_servo_board_present_on_servo_v3(self):
1277 """Check if servo board is detected on servo_v3"""
1278 vid_pids = self.SERVO_VID_PID['servo_v3']
1279 if not vid_pids or len(vid_pids) == 0:
1280 # device cannot detected without VID/PID
1281 return False
1282 logging.debug('Started to detect servo board on servo_v3')
1283 not_detected = 'The servo board is not detected on servo_v3'
1284 try:
1285 cmd = 'lsusb | grep "%s"' % "\|".join(vid_pids)
1286 result = self.run(cmd, ignore_status=True, timeout=30)
1287 if result.exit_status == 0 and result.stdout.strip():
1288 logging.debug('The servo board is detected on servo_v3')
1289 return True
1290 logging.debug('%s; %s', not_detected, result)
1291 return False
1292 except Exception as e:
1293 # can be triggered by timeout issue due running the script
1294 metrics.Counter(
1295 'chromeos/autotest/repair/servo_detection/timeout'
1296 ).increment(fields=self._get_host_metrics_data())
1297 logging.error('%s; %s', not_detected, str(e))
1298 return None
1299
Otabek Kasimov120b6fa2020-07-03 00:15:27 -07001300 def _is_main_device_not_detected_on_servo_v4(self):
1301 """Check if servod cannot find main device on servo.
1302
1303 The check based on reading servod logs for servo_v4.
1304 """
1305 if not self._initial_instance_ts:
1306 # latest log not found
1307 return False
1308 logging.debug('latest log for servod created at %s',
1309 self._initial_instance_ts)
1310 try:
1311 log_created = calendar.timegm(time.strptime(
1312 self._initial_instance_ts,
1313 "%Y-%m-%d--%H-%M-%S.%f"))
1314 except ValueError as e:
1315 logging.debug('Cannot read time from log file name: %s',
1316 self._initial_instance_ts)
1317 return False
1318 min_time_created = calendar.timegm(time.gmtime())
1319 if min_time_created > log_created + 3600:
1320 # the log file is old we cannot use it
1321 logging.debug('log file was created more than hour ago, too old')
1322 return False
1323 logging.debug('latest log was created not longer then 1 hour ago')
1324
1325 # check if servod can detect main device by servo_v4
1326 message = 'ERROR - No servo micro or CCD detected for board'
1327 cmd = ('cat /var/log/servod_%s/log.%s.INFO |grep "%s"'
1328 % (self.servo_port, self._initial_instance_ts, message))
1329 result = self.run(cmd, ignore_status=True)
1330 if result.stdout.strip():
1331 logging.info('Servod cannot detect main device on the servo; '
1332 'Can be caused by bad hardware of servo or '
1333 'issue on the DUT side.')
1334 return True
1335 logging.debug('The main device is detected')
1336 return False
1337
Garry Wangb5cee3e2020-09-16 14:58:13 -07001338 def _require_cr50_servod_config(self):
1339 """Check whether we need start servod with CONFIG=cr50.xml"""
1340 dut_host_info = self.get_dut_host_info()
1341 if not dut_host_info:
1342 return False
1343 for pool in dut_host_info.pools:
1344 if pool.startswith(servo_constants.CR50_CONFIG_POOL_PREFIX):
1345 return True
1346 return False
1347
def get_verifier_state(self, tag):
    """Return the state of servo verifier.

    @param tag: tag of the verifier to look up in the repair strategy.

    @returns: the result of `verifier_is_good(tag)` on this host's
              repair strategy.
    """
    strategy = self._repair_strategy
    return strategy.verifier_is_good(tag)
1354
def determine_servo_state(self):
    """Determine servo state based on the failed verifier.

    The verifier results are checked in a fixed priority order; the
    first failed verifier (or combination of them) that matches decides
    the state.

    @returns: servo state value (a servo_constants.SERVO_STATE_* value).
    """
    failed = hosts.VERIFY_FAILED

    ssh = self.get_verifier_state('servo_ssh')
    start_servod = self.get_verifier_state('servod_started')
    create_servo = self.get_verifier_state('servod_connection')
    init_servo = self.get_verifier_state('servod_control')
    cr50_low_sbu = self.get_verifier_state('servo_cr50_low_sbu')
    cr50_off = self.get_verifier_state('servo_cr50_off')
    # Named `topology` so the local does not shadow the `servo_topology`
    # module used elsewhere in this file.
    topology = self.get_verifier_state('servo_topology')
    dut_connected = self.get_verifier_state('servo_dut_connected')
    hub_connected = self.get_verifier_state('servo_hub_connected')
    pwr_button = self.get_verifier_state('servo_pwr_button')
    lid_open = self.get_verifier_state('servo_lid_open')
    ec_board = self.get_verifier_state('servo_ec_board')
    cr50_console = self.get_verifier_state('servo_cr50_console')
    ccd_testlab = self.get_verifier_state('servo_ccd_testlab')

    if not ssh:
        return servo_constants.SERVO_STATE_NO_SSH

    if start_servod == failed or create_servo == failed:
        # Sometimes servod can start without a servo being present.
        # The detection helpers return None when the check itself
        # failed, so only an explicit False means "not connected".
        if self.is_labstation():
            if not self.servo_serial:
                return servo_constants.SERVO_STATE_WRONG_CONFIG
            if self._is_servo_device_connected(
                    'servo_v4', self.servo_serial) is False:
                return servo_constants.SERVO_STATE_NOT_CONNECTED
        elif self._is_servo_board_present_on_servo_v3() is False:
            return servo_constants.SERVO_STATE_NOT_CONNECTED

    if dut_connected == failed:
        return servo_constants.SERVO_STATE_DUT_NOT_CONNECTED
    if hub_connected == failed:
        logging.info('Servo HUB not connected')
        return servo_constants.SERVO_STATE_DUT_NOT_CONNECTED
    if cr50_low_sbu == failed:
        return servo_constants.SERVO_STATE_SBU_LOW_VOLTAGE
    if cr50_off == failed:
        return servo_constants.SERVO_STATE_CR50_NOT_ENUMERATED
    if topology == failed:
        return servo_constants.SERVO_STATE_TOPOLOGY_ISSUE

    # TODO(otabek@): detect special cases detected by pwr_button
    if dut_connected == hosts.VERIFY_SUCCESS and pwr_button == failed:
        metrics.Counter(
                'chromeos/autotest/repair/servo_unexpected/pwr_button2'
        ).increment(fields=self._get_host_metrics_data())

    if start_servod == failed:
        return servo_constants.SERVO_STATE_SERVOD_ISSUE

    if create_servo == failed:
        if (self.is_labstation()
                    and self._is_main_device_not_detected_on_servo_v4()):
            servo_type = None
            dut_info = self.get_dut_host_info()
            if dut_info:
                servo_type = dut_info.get_label_value(
                        servo_constants.SERVO_TYPE_LABEL_PREFIX)
            if servo_type and 'servo_micro' in servo_type:
                serial = self.get_servo_micro_serial_number()
                logging.debug('servo_micro serial: %s', serial)
                # The servo_micro is visible over USB while servod
                # cannot use it: blame the ribbon cable.
                # NOTE(review): this used to call
                # `_is_servo_device_detected`, which is not defined in
                # the visible part of the class; the lsusb-based
                # `_is_servo_device_connected` is the matching check.
                if self._is_servo_device_connected('servo_micro',
                                                   serial):
                    return servo_constants.SERVO_STATE_BAD_RIBBON_CABLE
            # Device can be not detected because of DUT
            # TODO (otabek) update after b/159755652 and b/159754985
            metrics.Counter(
                    'chromeos/autotest/repair/servo_state/needs_replacement'
            ).increment(fields=self._get_host_metrics_data())
        elif not self.is_labstation():
            # Here need logic to check if flex cable is connected
            pass

    # One of the reasons why servo cannot be initialized.
    if cr50_console == failed:
        return servo_constants.SERVO_STATE_CR50_CONSOLE_MISSING
    if ccd_testlab == failed:
        return servo_constants.SERVO_STATE_CCD_TESTLAB_ISSUE

    if create_servo == failed or init_servo == failed:
        return servo_constants.SERVO_STATE_SERVOD_ISSUE

    if ec_board == failed:
        return servo_constants.SERVO_STATE_EC_BROKEN
    if pwr_button == failed:
        return servo_constants.SERVO_STATE_BAD_RIBBON_CABLE
    if lid_open == failed:
        return servo_constants.SERVO_STATE_LID_OPEN_FAILED

    # No known failure pattern matched: count it and report the generic
    # broken state.
    metrics.Counter(
            'chromeos/autotest/repair/unknown_servo_state'
    ).increment(fields=self._get_host_metrics_data())
    logging.info('We do not have special state for this failure yet :)')
    return servo_constants.SERVO_STATE_BROKEN
1460
def is_servo_topology_supported(self):
    """Check if servo_topology is supported.

    @returns: True only when the servo host is reachable, is a
              labstation and has a servo serial; otherwise the reason is
              logged and False is returned.
    """
    unsupported_reason = None
    if not self.is_up_fast():
        unsupported_reason = 'Servo-Host is not reachable.'
    elif not self.is_labstation():
        unsupported_reason = 'Servo-topology supported only for labstation.'
    elif not self.servo_serial:
        unsupported_reason = 'Servo-topology required a servo serial.'

    if unsupported_reason is not None:
        logging.info(unsupported_reason)
        return False
    return True
1473
def get_topology(self):
    """Get servo topology, creating it the first time it is needed.

    @returns: the ServoTopology object stored in `self._topology`.
    """
    if self._topology:
        return self._topology
    self._topology = servo_topology.ServoTopology(self)
    return self._topology
1479
def is_dual_setup(self):
    """Check if servo will run in dual setup.

    Dual setup is used only for servo_v4, when ccd_cr50 and servo_micro
    are used at the same time.

    @returns: True if `self.servo_setup` equals
              servo_constants.SERVO_SETUP_VALUE_DUAL_V4.
    """
    configured_setup = self.servo_setup
    return configured_setup == servo_constants.SERVO_SETUP_VALUE_DUAL_V4
1487
def set_dut_health_profile(self, dut_health_profile):
    """Store the health profile of the DUT on this servo host.

    @param dut_health_profile: A DeviceHealthProfile object.
    """
    logging.debug(
            'setting dut_health_profile field to (%s)', dut_health_profile)
    self._dut_health_profile = dut_health_profile
1495
def get_dut_health_profile(self):
    """Return the DUT health profile stored on this servo host.

    @return A DeviceHealthProfile object.
    """
    stored_profile = self._dut_health_profile
    return stored_profile
1501
Otabek Kasimovcc9738e2020-02-14 16:17:15 -08001502
def make_servo_hostname(dut_hostname):
    """Given a DUT's hostname, return the hostname of its servo.

    The servo hostname is the DUT hostname with '-servo' appended to its
    first dot-separated component; any domain part is kept unchanged.

    @param dut_hostname: hostname of a DUT.

    @return hostname of the DUT's servo.

    """
    short_name, separator, domain = dut_hostname.partition('.')
    return short_name + '-servo' + separator + domain
1514
1515
Richard Barnettee519dcd2016-08-15 17:37:17 -07001516def _map_afe_board_to_servo_board(afe_board):
1517 """Map a board we get from the AFE to a servo appropriate value.
1518
1519 Many boards are identical to other boards for servo's purposes.
1520 This function makes that mapping.
1521
1522 @param afe_board string board name received from AFE.
1523 @return board we expect servo to have.
1524
1525 """
1526 KNOWN_SUFFIXES = ['-freon', '_freon', '_moblab', '-cheets']
1527 BOARD_MAP = {'gizmo': 'panther'}
1528 mapped_board = afe_board
1529 if afe_board in BOARD_MAP:
1530 mapped_board = BOARD_MAP[afe_board]
1531 else:
1532 for suffix in KNOWN_SUFFIXES:
1533 if afe_board.endswith(suffix):
1534 mapped_board = afe_board[0:-len(suffix)]
1535 break
1536 if mapped_board != afe_board:
1537 logging.info('Mapping AFE board=%s to %s', afe_board, mapped_board)
1538 return mapped_board
1539
1540
def get_servo_args_for_host(dut_host):
    """Return servo data associated with a given DUT.

    The servo attributes are read from the DUT's host info store. The
    servo host ssh port and the servo port are converted to int; the
    board (mapped to its servo name) and the model are added when known.

    @param dut_host   Instance of `Host` on which to find the servo
                      attributes.
    @return `servo_args` dict with host and an optional port, or None
            when the result has no servo host attribute.
    """
    info = dut_host.host_info_store.get()
    servo_args = {}
    for attr_name, attr_value in six.iteritems(info.attributes):
        if attr_name in servo_constants.SERVO_ATTR_KEYS:
            servo_args[attr_name] = attr_value

    ssh_port_key = servo_constants.SERVO_HOST_SSH_PORT_ATTR
    if ssh_port_key in servo_args:
        try:
            servo_args[ssh_port_key] = int(servo_args[ssh_port_key])
        except ValueError:
            logging.error('servo host port is not an int: %s',
                          servo_args[ssh_port_key])
            # Reset servo_args because we don't want to use an invalid port.
            servo_args.pop(ssh_port_key, None)

    servo_port_key = servo_constants.SERVO_PORT_ATTR
    if servo_port_key in servo_args:
        try:
            servo_args[servo_port_key] = int(servo_args[servo_port_key])
        except ValueError:
            logging.error('servo port is not an int: %s',
                          servo_args[servo_port_key])
            # Reset servo_args because we don't want to use an invalid port.
            # Dropping the host attribute makes the final check below
            # return None.
            servo_args.pop(servo_constants.SERVO_HOST_ATTR, None)

    if info.board:
        mapped_board = _map_afe_board_to_servo_board(info.board)
        servo_args[servo_constants.SERVO_BOARD_ATTR] = mapped_board
    if info.model:
        servo_args[servo_constants.SERVO_MODEL_ATTR] = info.model

    if servo_constants.SERVO_HOST_ATTR in servo_args:
        return servo_args
    return None
Richard Barnetteea3e4602016-06-10 12:36:41 -07001578
1579
def _tweak_args_for_ssp_moblab(servo_args):
    """Point a loopback servo host at the SSP host container address.

    When the servo host in `servo_args` is 'localhost' or '127.0.0.1' it
    is replaced, in place, by the 'host_container_ip' value of the 'SSP'
    config section (None when that value is not set).

    @param servo_args: dict of servo arguments; modified in place.
    """
    host_key = servo_constants.SERVO_HOST_ATTR
    if servo_args[host_key] not in ['localhost', '127.0.0.1']:
        return
    servo_args[host_key] = _CONFIG.get_config_value(
            'SSP', 'host_container_ip', type=str, default=None)
1585
1586
def create_servo_host(dut,
                      servo_args,
                      try_lab_servo=False,
                      try_servo_repair=False,
                      try_servo_recovery=False,
                      dut_host_info=None,
                      dut_health_profile=None):
    """Create a ServoHost object for a given DUT, if appropriate.

    This function attempts to create and verify or repair a `ServoHost`
    object for a servo connected to the given `dut`, subject to various
    constraints imposed by the parameters:
      * When the `servo_args` parameter is not `None`, a servo
        host must be created, and must be checked with `repair()`.
      * Otherwise, if a servo exists in the lab and `try_lab_servo` is
        true:
          * If `try_servo_repair` is true, then create a servo host and
            check it with `repair()`.
          * Otherwise, if the servo responds to `ping` then create a
            servo host and check it with `verify()`.

    In cases where `servo_args` was not `None`, repair failure
    exceptions are passed back to the caller; otherwise, exceptions
    are logged and then discarded.  Note that this only happens in cases
    where we're called from a test (not special task) control file that
    has an explicit dependency on servo.  In that case, we require that
    repair not write to `status.log`, so as to avoid polluting test
    results.

    TODO(jrbarnette):  The special handling for servo in test control
    files is a thorn in my flesh; I dearly hope to see it cut out before
    my retirement.

    Parameters for a servo host consist of a host name, port number, and
    DUT board, and are determined from one of these sources, in order of
    priority:
      * Servo attributes from the `dut` parameter take precedence over
        all other sources of information.
      * If a DNS entry for the servo based on the DUT hostname exists in
        the CrOS lab network, that hostname is used with the default
        port and the DUT's board.
      * If no other options are found, the parameters will be taken
        from the `servo_args` dict passed in from the caller.

    @param dut                  An instance of `Host` from which to take
                                servo parameters (if available).
    @param servo_args           A dictionary with servo parameters to use if
                                they can't be found from `dut`.  If this
                                argument is supplied, unrepaired exceptions
                                from `verify()` will be passed back to the
                                caller.  The dictionary is not modified.
    @param try_lab_servo        If not true, servo host creation will be
                                skipped unless otherwise required by the
                                caller.
    @param try_servo_repair     If true, check a servo host with
                                `repair()` instead of `verify()`.
    @param try_servo_recovery   If true, start servod in recovery mode.
    @param dut_host_info:       A HostInfo object of the DUT that connected
                                to this servo.
    @param dut_health_profile:  DUT repair info with history.

    @returns: A tuple `(servo_host, servo_state)`.  `servo_host` is a
              ServoHost object, or None when no servo host could or
              should be created; `servo_state` is the matching servo
              state value, or None when no servo was requested at all.

    """
    servo_dependency = servo_args is not None
    if dut is not None and (try_lab_servo or servo_dependency):
        servo_args_override = get_servo_args_for_host(dut)
        if servo_args_override is not None:
            if utils.in_moblab_ssp():
                _tweak_args_for_ssp_moblab(servo_args_override)
            logging.debug(
                    'Overriding provided servo_args (%s) with arguments'
                    ' determined from the host (%s)',
                    servo_args,
                    servo_args_override,
            )
            servo_args = servo_args_override

    if servo_args is None:
        logging.debug('No servo_args provided, and failed to find overrides.')
        if try_lab_servo or servo_dependency:
            return None, servo_constants.SERVO_STATE_MISSING_CONFIG
        # A regular test case which does not require the servo.
        return None, None

    servo_hostname = servo_args.get(servo_constants.SERVO_HOST_ATTR)
    servo_port = servo_args.get(servo_constants.SERVO_PORT_ATTR)
    if not _is_servo_host_information_exist(servo_hostname, servo_port):
        logging.debug(
                'Servo connection info missed hostname: %s , port: %s',
                servo_hostname, servo_port)
        return None, servo_constants.SERVO_STATE_MISSING_CONFIG
    if not is_servo_host_information_valid(servo_hostname, servo_port):
        logging.debug(
                'Servo connection info is incorrect hostname: %s , port: %s',
                servo_hostname, servo_port)
        return None, servo_constants.SERVO_STATE_WRONG_CONFIG

    if try_servo_recovery:
        # Work on a copy: `servo_args` may be the caller's own dict, and
        # the recovery flag must not leak into the caller's later use
        # of it.
        servo_args = dict(servo_args)
        servo_args[servo_constants.SERVO_RECOVERY_MODE] = True

    newhost = ServoHost(**servo_args)
    if newhost.use_icmp and not newhost.is_up_fast(count=3):
        # ServoHost has internal check to wait if servo-host is in reboot
        # process. If servo-host still is not available this check will stop
        # further attempts as we do not have any option to recover servo_host.
        return None, servo_constants.SERVO_STATE_NO_SSH

    # Reset or reboot servo device only during AdminRepair tasks.
    if try_servo_repair:
        if newhost._is_locked:
            # Reset servo if the servo is locked, as we check if the servohost
            # is up, if the servohost is labstation and if the servohost is in
            # lab inside the locking logic.
            newhost.reset_servo()
        else:
            try:
                newhost.reboot_servo_v3_on_need()
            except Exception as e:
                logging.info('[Non-critical] Unexpected error while trying to'
                             ' reboot servo_v3, skipping the reboot; %s', e)

    if dut:
        newhost.set_dut_hostname(dut.hostname)
    if dut_host_info:
        newhost.set_dut_host_info(dut_host_info)
    if dut_health_profile and (try_lab_servo or try_servo_repair):
        try:
            if newhost.is_localhost():
                logging.info('Servohost is a localhost, skip device'
                             ' health profile setup...')
            else:
                dut_health_profile.init_profile(newhost)
                newhost.set_dut_health_profile(dut_health_profile)
        except Exception as e:
            logging.info(
                    '[Non-critical] Unexpected error while trying to'
                    ' load device health profile; %s', e)

    if try_lab_servo or try_servo_repair:
        # A failed firmware update is logged but does not stop the
        # servo host from being created.
        try:
            logging.info("Check and update servo firmware.")
            servo_updater.update_servo_firmware(newhost,
                                                try_attempt_count=3,
                                                force_update=False,
                                                try_force_update=False)
        except Exception as e:
            logging.error("Servo device update error: %s", e)

    try:
        newhost.restart_servod(quick_startup=True)
    except error.AutoservSSHTimeout:
        logging.warning("Restart servod failed due ssh connection "
                        "to servohost timed out. This error is forgiven"
                        " here, we will retry in servo repair process.")
    except error.AutoservRunError as e:
        logging.warning("Restart servod failed due to:\n%s\n"
                        "This error is forgiven here, we will retry"
                        " in servo repair process.", str(e))

    # Note that the logic of repair() includes everything done
    # by verify().  It's sufficient to call one or the other;
    # we don't need both.
    if servo_dependency:
        newhost.repair(silent=True)
        return newhost, newhost.get_servo_state()

    if try_servo_repair:
        try:
            newhost.repair()
        except Exception:
            logging.exception('servo repair failed for %s', newhost.hostname)
    else:
        try:
            newhost.verify()
        except Exception:
            logging.exception('servo verify failed for %s', newhost.hostname)
    return newhost, newhost.get_servo_state()
Otabek Kasimov7267a7a2020-03-04 11:18:45 -08001766
1767
Otabek Kasimova7ba91a2020-03-09 08:31:01 -07001768def _is_servo_host_information_exist(hostname, port):
Otabek Kasimov7267a7a2020-03-04 11:18:45 -08001769 if hostname is None or len(hostname.strip()) == 0:
1770 return False
Otabek Kasimova7ba91a2020-03-09 08:31:01 -07001771 if port is None:
Otabek Kasimov7267a7a2020-03-04 11:18:45 -08001772 return False
Otabek Kasimova7ba91a2020-03-09 08:31:01 -07001773 if not type(port) is int:
1774 try:
1775 int(port)
1776 except ValueError:
1777 return False
1778
Otabek Kasimov7267a7a2020-03-04 11:18:45 -08001779 return True
1780
1781
def is_servo_host_information_valid(hostname, port):
    """Check if provided servo attributes are valid.

    @param hostname Hostname of the servohost.
    @param port     servo port number.

    @returns: A bool value to indicate if provided servo attribute valid.
              The port must be in the range 1..65000 and the hostname
              must be at least 5 characters long and made only of
              letters, digits, '-', '_' and '.'.
    """
    if not _is_servo_host_information_exist(hostname, port):
        return False
    # Check that the port is in the accepted range.
    port_int = int(port)
    if port_int < 1 or port_int > 65000:
        return False
    # The hostname may contain only letters, digits, '-', '_' and '.'.
    # Raw string so that the backslash is passed to the regex engine
    # instead of being an invalid Python escape sequence.
    if not re.match(r'[a-zA-Z0-9-_\.]*$', hostname) or len(hostname) < 5:
        return False
    return True