blob: 0e35dda2a7be659f5a1be9c0f5442433287100e2 [file] [log] [blame]
Derek Beckettf73baca2020-08-19 15:08:47 -07001# Lint as: python2, python3
Fang Deng5d518f42013-08-02 14:04:32 -07002# Copyright (c) 2013 The Chromium OS Authors. All rights reserved.
3# Use of this source code is governed by a BSD-style license that can be
4# found in the LICENSE file.
5#
6# Expects to be run in an environment with sudo and no interactive password
7# prompt, such as within the Chromium OS development chroot.
8
9
10"""This file provides core logic for servo verify/repair process."""
11
12
Derek Beckettf73baca2020-08-19 15:08:47 -070013from __future__ import absolute_import
14from __future__ import division
15from __future__ import print_function
16
Fang Deng5d518f42013-08-02 14:04:32 -070017import logging
Raul E Rangel52ca2e82018-07-03 14:10:14 -060018import os
Ruben Rodriguez Buchillon93084d02020-01-21 15:17:36 -080019import re
20import tarfile
Andrew McRaef0679932020-08-13 09:15:23 +100021import threading
Garry Wang2b5eef92020-08-21 16:23:35 -070022import json
Garry Wangc1288cf2019-12-17 14:58:00 -080023import time
Derek Beckettf73baca2020-08-19 15:08:47 -070024import six
25import six.moves.xmlrpc_client
Otabek Kasimov120b6fa2020-07-03 00:15:27 -070026import calendar
Fang Deng5d518f42013-08-02 14:04:32 -070027
28from autotest_lib.client.bin import utils
Garry Wang79e9af62019-06-12 15:19:19 -070029from autotest_lib.client.common_lib import error
Richard Barnette9a26ad62016-06-10 12:03:08 -070030from autotest_lib.client.common_lib import hosts
Garry Wang7b0e1b72020-03-25 19:08:59 -070031from autotest_lib.client.common_lib import lsbrelease_utils
Fang Deng5d518f42013-08-02 14:04:32 -070032from autotest_lib.client.common_lib.cros import retry
Christopher Wileycef1f902014-06-19 11:11:23 -070033from autotest_lib.client.common_lib.cros.network import ping_runner
Richard Barnette9a26ad62016-06-10 12:03:08 -070034from autotest_lib.server.cros.servo import servo
Richard Barnetted31580e2018-05-14 19:58:00 +000035from autotest_lib.server.hosts import servo_repair
Garry Wangebc015b2019-06-06 17:45:06 -070036from autotest_lib.server.hosts import base_servohost
Garry Wang11b5e872020-03-11 15:14:08 -070037from autotest_lib.server.hosts import servo_constants
Otabek Kasimov4ea636e2020-04-14 23:35:06 -070038from autotest_lib.server.cros.faft.utils import config
Garry Wang11b5e872020-03-11 15:14:08 -070039from autotest_lib.client.common_lib import global_config
Otabek Kasimov8475cce2020-07-14 12:11:31 -070040from autotest_lib.site_utils.admin_audit import servo_updater
Otabek Kasimov382c3bb2020-10-28 13:22:45 -070041from autotest_lib.server.cros.servo.topology import servo_topology
Garry Wangd7367482020-02-27 13:52:40 -080042
Otabek Kasimov15963492020-06-23 21:10:51 -070043try:
44 from chromite.lib import metrics
45except ImportError:
46 metrics = utils.metrics_mock
47
Dan Shi3b2adf62015-09-02 17:46:54 -070048_CONFIG = global_config.global_config
Fang Deng5d518f42013-08-02 14:04:32 -070049
Otabek Kasimova7ba91a2020-03-09 08:31:01 -070050
Garry Wangebc015b2019-06-06 17:45:06 -070051class ServoHost(base_servohost.BaseServoHost):
52 """Host class for a servo host(e.g. beaglebone, labstation)
Dana Goyette0b6e6402019-10-04 11:09:24 -070053 that with a servo instance for a specific port.
54
55 @type _servo: servo.Servo | None
56 """
Fang Deng5d518f42013-08-02 14:04:32 -070057
# Port the servod process listens on. The SERVOD_PORT environment variable
# takes precedence; '9999' is the fallback.
DEFAULT_PORT = int(os.getenv('SERVOD_PORT', '9999'))

# Timeout for initializing servo signals.
INITIALIZE_SERVO_TIMEOUT_SECS = 60

# Default timeout for run terminal command.
DEFAULT_TERMINAL_TIMEOUT = 30

# Ready test function
SERVO_READY_METHOD = 'get_version'

# Directory prefix on the servo host where the servod logs are stored.
SERVOD_LOG_PREFIX = '/var/log/servod'

# Exit code to use when symlinks for servod logs are not found.
NO_SYMLINKS_CODE = 9

# Directory in the job's results directory to dump the logs into.
LOG_DIR = 'servod'

# Prefix for joint loglevel files in the logs.
JOINT_LOG_PREFIX = 'log'

# Regex group to extract timestamp from logfile name.
TS_GROUP = 'ts'

# This regex is used to extract the timestamp from servod logs.
# Files always start with 'log.'. The dots are escaped so that they only
# match a literal '.' instead of any character.
TS_RE = (r'log\.'
         # The timestamp is of format %Y-%m-%d--%H-%M-%S.MS
         r'(?P<%s>\d{4}(\-\d{2}){2}\-(-\d{2}){3}\.\d{3})'
         # The loglevel is optional depending on labstation version.
         r'(\.(INFO|DEBUG|WARNING))?' % TS_GROUP)
TS_EXTRACTOR = re.compile(TS_RE)

# Regex group to extract MCU name from logline in servod logs.
MCU_GROUP = 'mcu'

# Regex group to extract logline from MCU logline in servod logs.
LINE_GROUP = 'line'

# This regex is used to extract the mcu and the line content from an
# MCU logline in servod logs. e.g. EC or servo_v4 console logs.
# Here is an example log-line:
#
# 2020-01-23 13:15:12,223 - servo_v4 - EC3PO.Console - DEBUG -
# console.py:219:LogConsoleOutput - /dev/pts/9 - cc polarity: cc1
#
# Here is conceptually how they are formatted:
#
#  <time> - <MCU> - EC3PO.Console - <LVL> - <file:line:func> - <pts> -
#  <output>
#
# The log format starts with a timestamp
MCU_RE = (r'[\d\-]+ [\d:,]+ '
          # The mcu that is logging this is next.
          r'- (?P<%s>\w+) - '
          # Next, we have more log outputs before the actual line.
          # Information about the file line, logging function etc.
          # Anchor on EC3PO Console, LogConsoleOutput and dev/pts.
          # NOTE: if the log format changes, this regex needs to be
          # adjusted.
          r'EC3PO\.Console[\s\-\w\d:.]+LogConsoleOutput - /dev/pts/\d+ - '
          # Lastly, we get the MCU's console line.
          r'(?P<%s>.+$)' % (MCU_GROUP, LINE_GROUP))
MCU_EXTRACTOR = re.compile(MCU_RE)

# Regex to detect timeout messages when USBC pigtail has timeout issue.
# e.g.:  [475635.427072 PD TMOUT RX 1/1]
USBC_PIGTAIL_TIMEOUT_RE = r'\[[\d \.]{1,20}(PD TMOUT RX 1\/1)\]'

# Suffix to identify compressed logfiles.
COMPRESSION_SUFFIX = '.tbz2'

# A suffix to mark servod log directories that came from instance that
# ran during this servo_host, but are not the last one running e.g. when
# an instance (on purpose, or due to a bug) restarted in the middle of the
# run.
OLD_LOG_SUFFIX = 'old'

# Mapping servo board with their vid-pid.
# NOTE: values are a single 'vid:pid' string, except 'servo_v3' which maps
# to a list of two such strings; consumers must handle both shapes.
SERVO_VID_PID = {
    'servo_v4': '18d1:501b',
    'ccd_cr50': '18d1:5014',
    'servo_micro': '18d1:501a',
    'servo_v3': ['18d1:5004', '0403:6014'],
}
145
def _init_attributes(self):
    """Set every servo-related instance attribute to its initial value.

    All servo descriptors and cached objects start as None; a fresh lock
    and a fresh thread-local container are created on each call.
    """
    self._servo_state = None
    self.servo_port = None
    self.servo_board = None
    self.servo_model = None
    self.servo_serial = None
    self.servo_setup = None
    self.additional_servod_args = None
    self._dut_health_profile = None
    # The flag that indicate if a servo is connected to a smart usbhub.
    # TODO(xianuowang@) remove this flag once all usbhubs in the lab
    # get replaced.
    self.smart_usbhub = None
    self._servo = None
    self._topology = None
    # Proxy used when servod is reached over an ssh tunnel; the lock
    # guards its one-time creation.
    self._tunnel_proxy = None
    self._tunnel_proxy_lock = threading.Lock()
    self._initial_instance_ts = None
    # Flag to make sure that multiple calls to close do not result in the
    # logic executing multiple times.
    self._closed = False
    # Per-thread local data
    self._local = threading.local()
Fang Deng5d518f42013-08-02 14:04:32 -0700169
def _initialize(self,
                servo_host='localhost',
                servo_port=DEFAULT_PORT,
                servo_board=None,
                servo_model=None,
                servo_serial=None,
                servo_setup=None,
                additional_servod_args=None,
                is_in_lab=None,
                *args,
                **dargs):
    """Initialize a ServoHost instance.

    A ServoHost instance represents a host that controls a servo.

    @param servo_host: Name of the host where the servod process
                       is running.
    @param servo_port: Port the servod process is listening on. Defaults
                       to the SERVOD_PORT environment variable if set,
                       otherwise 9999.
    @param servo_board: Board that the servo is connected to.
    @param servo_model: Model that the servo is connected to.
    @param servo_serial: Serial number of the servo device.
    @param servo_setup: Type of servo setup, e.g. REGULAR or DUAL_V4.
    @param additional_servod_args: Additional args that will append to
                                   servod start command.
    @param is_in_lab: True if the servo host is in Cros Lab. Default is set
                      to None, for which utils.host_is_in_lab_zone will be
                      called to check if the servo host is in Cros lab.

    """
    super(ServoHost, self)._initialize(hostname=servo_host,
                                       is_in_lab=is_in_lab, *args, **dargs)
    self._init_attributes()
    self.servo_port = int(servo_port)
    self.servo_board = servo_board
    self.servo_model = servo_model
    self.servo_serial = servo_serial
    self.servo_setup = servo_setup
    self.additional_servod_args = additional_servod_args

    if self.is_servo_topology_supported():
        self._topology = servo_topology.ServoTopology(self)

    # The location of the log files on the servo host for this instance.
    self.remote_log_dir = '%s_%s' % (self.SERVOD_LOG_PREFIX,
                                     self.servo_port)
    # Path of the servo host lock file.
    self._lock_file = (self.TEMP_FILE_DIR + str(self.servo_port) +
                       self.LOCK_FILE_POSTFIX)
    # File path to declare a reboot request.
    self._reboot_file = (self.TEMP_FILE_DIR + str(self.servo_port) +
                         self.REBOOT_FILE_POSTFIX)

    # Lock the servo host if it's an in-lab labstation to prevent other
    # task to reboot it until current task completes. We also wait and
    # make sure the labstation is up here, in the case of the labstation is
    # in the middle of reboot.
    self._is_locked = False
    if (self.wait_up(self.REBOOT_TIMEOUT) and self.is_in_lab()
                and self.is_labstation()):
        self._lock()
        try:
            self.wait_ready()
        except Exception as e:
            # Best effort: a readiness failure is logged and does not
            # abort initialization.
            logging.info(
                    'Unexpected error while ensure labstation'
                    ' readiness; %s', str(e))

    self._repair_strategy = (
            servo_repair.create_servo_repair_strategy())
Richard Barnettee519dcd2016-08-15 17:37:17 -0700241
def __str__(self):
    """Return "<ClassName 'hostname:servo_port'>" for this host."""
    return "<%s '%s:%s'>" % (
            type(self).__name__, self.hostname, self.servo_port)
245
def connect_servo(self):
    """Initialize and setup servo for later use.

    Calls initilize_servo() first and initialize_dut_for_servo() second.
    """
    self.initilize_servo()
    self.initialize_dut_for_servo()
251
def initilize_servo(self):
    """Establish a connection to the servod server on this host.

    Initializes `self._servo` and then verifies that all network
    connections are working. This will create an ssh tunnel if
    it's required.

    NOTE: the method name is misspelled ("initilize"); it is kept as-is
    because callers reference it by this name.
    """
    self._servo = servo.Servo(servo_host=self,
                              servo_serial=self.servo_serial)
Richard Barnette9a26ad62016-06-10 12:03:08 -0700261
def initialize_dut_for_servo(self):
    """This method will do some setup for dut control, e.g. setup
    main servo_v4 device, and also testing the connection between servo
    and DUT. As a side effect of testing the connection, all signals on
    the target servo are reset to default values, and the USB stick is
    set to the neutral (off) position.

    @raises AutoservVerifyError: if `self._servo` has not been set yet,
            or if the initialize_dut call is reported as timed out.
    """
    if not self._servo:
        raise hosts.AutoservVerifyError('Servo object needs to be'
                                        ' initialized before initialize'
                                        ' DUT.')
    # retry.timeout returns a pair; only the first item (whether the call
    # timed out) is used here.
    timeout, _ = retry.timeout(
        self._servo.initialize_dut,
        timeout_sec=self.INITIALIZE_SERVO_TIMEOUT_SECS)
    if timeout:
        raise hosts.AutoservVerifyError('Initialize dut for servo timed'
                                        ' out.')
Richard Barnette9a26ad62016-06-10 12:03:08 -0700279
def disconnect_servo(self):
    """Disconnect our servo if it exists.

    If we've previously successfully connected to our servo,
    disconnect any established ssh tunnel, and set `self._servo`
    back to `None`.
    """
    if self._servo:
        # N.B. This call is safe even without a tunnel:
        # rpc_server_tracker.disconnect() silently ignores
        # unknown ports.
        self.rpc_server_tracker.disconnect(self.servo_port)
        self._servo = None
Fang Deng5d518f42013-08-02 14:04:32 -0700293
def _maybe_create_servod_ssh_tunnel_proxy(self):
    """Create a xmlrpc proxy for use with a ssh tunnel.
    A lock is used to safely create a singleton proxy.

    Does nothing when `self._tunnel_proxy` is already set.
    """
    with self._tunnel_proxy_lock:
        # Checked while holding the lock so that only one caller creates
        # the proxy.
        if self._tunnel_proxy is None:
            self._tunnel_proxy = self.rpc_server_tracker.xmlrpc_connect(
                   None,
                   self.servo_port,
                   ready_test_name=self.SERVO_READY_METHOD,
                   timeout_seconds=60,
                   request_timeout_seconds=3600,
                   server_desc=str(self))
307
def get_servod_server_proxy(self):
    """Return a proxy if it exists; otherwise, create a new one.
    A proxy can either be a ssh tunnel based proxy, or a httplib
    based proxy.

    @returns: An xmlrpclib.ServerProxy that is connected to the servod
              server on the host.
    """
    if (servo_constants.ENABLE_SSH_TUNNEL_FOR_SERVO
                and not self.is_localhost()):
        # Check for existing ssh tunnel proxy.
        if self._tunnel_proxy is None:
            self._maybe_create_servod_ssh_tunnel_proxy()
        return self._tunnel_proxy
    else:
        # xmlrpc/httplib is not thread-safe, so each thread must have its
        # own separate proxy connection.
        if not hasattr(self._local, "_per_thread_proxy"):
            remote = 'http://%s:%s' % (self.hostname, self.servo_port)
            self._local._per_thread_proxy = (
                    six.moves.xmlrpc_client.ServerProxy(remote))
        return self._local._per_thread_proxy
Wai-Hong Tam3a8a2552019-11-19 14:28:04 +0800329
def verify(self, silent=False):
    """Update the servo host and verify it's in a good state.

    On success the servo state is set to SERVO_STATE_WORKING and, when a
    topology object exists, the topology is generated. On any failure
    the servo state is re-determined (non-localhost only) and the
    exception is re-raised only if `_is_critical_error` says so.

    @param silent   If true, suppress logging in `status.log`.
    """
    message = 'Beginning verify for servo host %s port %s serial %s'
    message %= (self.hostname, self.servo_port, self.servo_serial)
    self.record('INFO', None, None, message)
    try:
        self._repair_strategy.verify(self, silent)
        self._servo_state = servo_constants.SERVO_STATE_WORKING
        self.record('INFO', None, None,
                    'ServoHost verify set servo_state as WORKING')
        if self._topology:
            self._topology.generate()
    except Exception as e:
        if not self.is_localhost():
            self._servo_state = self.determine_servo_state()
            self.record('INFO', None, None,
                        'ServoHost verify set servo_state as %s'
                        % self._servo_state)
        # Non-critical failures are swallowed on purpose.
        if self._is_critical_error(e):
            raise
Fang Deng5d518f42013-08-02 14:04:32 -0700353
def _get_default_usbkey_mount_path(self):
    """Return the usbkey mount point, which is unique per servo port."""
    return '/media/servo_usb/%s' % self.servo_port
Fang Deng5d518f42013-08-02 14:04:32 -0700356
def get_image_name_from_usbkey(self, usbkey_dev):
    """Mount usb drive and check ChromeOS image name on it if there is
    one. This method assumes the image_usbkey_direction is already set
    to servo side.

    The drive is always unmounted again before returning.

    @param usbkey_dev: usbkey dev path(e.g. /dev/sdb).

    @returns: image_name on the usbkey, e.g. nami-release/R82.10138.0.0,
              or empty string if no test image detected, or unexpected
              error occurred.
    """
    logging.info('Checking ChromeOS image name on usbkey.')
    mount_dst = self._get_default_usbkey_mount_path()
    # Unmount if there is an existing stale mount.
    self._unmount_drive(mount_dst)
    # ChromeOS root fs is in /dev/sdx3
    mount_src = usbkey_dev + '3'
    try:
        if not self._mount_drive(mount_src, mount_dst):
            logging.debug('Unexpected error occurred on mount usb drive.')
            return ''

        release_content = self.run(
            'cat %s/etc/lsb-release' % mount_dst,
            ignore_status=True).stdout.strip()

        # Only test images are accepted.
        if not re.search(r'RELEASE_TRACK=.*test', release_content):
            logging.info('The image on usbkey is not a test image')
            return ''

        return lsbrelease_utils.get_chromeos_release_builder_path(
            lsb_release_content=release_content)
    finally:
        logging.debug('Image check compeleted, unmounting the usb drive.')
        self._unmount_drive(mount_dst)
Garry Wang7b0e1b72020-03-25 19:08:59 -0700392
def _extract_firmware_image_from_usbkey(self, fw_dst):
    """Extract firmware images from the usbkey on servo, this method
    assumes there is already a ChromeOS test image staged on servo.

    The usbkey is unmounted again before returning or raising.

    @param fw_dst: the path that we'll copy firmware images to.

    @returns: a json format string of firmware manifest data.
    @raises: AutoservRepairError if the usbkey dev path cannot be
             probed or the usbkey cannot be mounted.
    """
    usbkey_dev = self._probe_and_validate_usb_dev()
    if not usbkey_dev:
        raise hosts.AutoservRepairError('Unexpected error occurred when'
                  ' probe usbkey dev path, please check logs for detail.')

    mount_dst = self._get_default_usbkey_mount_path()
    # Unmount if there is an existing stale mount.
    self._unmount_drive(mount_dst)
    # ChromeOS root fs is in /dev/sdx3
    mount_src = usbkey_dev + '3'
    try:
        if not self._mount_drive(mount_src, mount_dst):
            raise hosts.AutoservRepairError('Failed to extract firmware'
                      ' image; Unable to mount %s.' % usbkey_dev,
                      'unable to mount usbkey')
        updater_bin = os.path.join(mount_dst,
                                   'usr/sbin/chromeos-firmwareupdate')
        # Unpack the images first, then return the updater's manifest.
        self.run('%s --unpack %s' % (updater_bin, fw_dst))
        return self.run('%s --manifest' % updater_bin).stdout
    finally:
        self._unmount_drive(mount_dst)
422
def prepare_repair_firmware_image(self, fw_dst=None):
    """Prepare firmware image on the servohost for auto repair process
    to consume.

    @param fw_dst: the path that we want to store firmware image on
                   the servohost. Defaults to
                   /tmp/firmware_image/<servo_port>. The path is removed
                   and re-created before extraction.

    @returns: A tuple that contains ec firmware image path and bios
              firmware image path on the servohost; an entry is None
              if that type of image is not listed in the manifest for
              the dut's model.
    @raises: AutoservRepairError if the model is unknown, the manifest
             has no entry for the model, or neither image is listed.
    """
    model = self.servo_model or self._dut_host_info.model
    if not model:
        raise hosts.AutoservRepairError(
                  'Could not determine DUT\'s model.',
                  'model infomation unknown')

    if not fw_dst:
        fw_dst = '/tmp/firmware_image/%s' % self.servo_port
    # Cleanup and re-create dst path to have a fresh start.
    self.run('rm -rf %s' % fw_dst)
    self.run('mkdir -p %s' % fw_dst)

    manifest = json.loads(self._extract_firmware_image_from_usbkey(fw_dst))
    # For models that have packed $MODEL_signed variant, we want use the
    # 'signed' variant once we get DVT devices, so try to read manifest
    # from $MODEL_signed first.
    build = manifest.get('%s_signed' % model) or manifest.get(model)
    if not build:
        raise hosts.AutoservRepairError('Could not find firmware manifest'
                  ' for model:%s' % model, 'model manifest not found')
    # A missing 'ec' or 'host' entry is not an error on its own.
    try:
        ec_image = os.path.join(fw_dst, build['ec']['image'])
    except KeyError:
        ec_image = None
    try:
        bios_image = os.path.join(fw_dst, build['host']['image'])
    except KeyError:
        bios_image = None
    if not ec_image and not bios_image:
        raise hosts.AutoservRepairError('Could not find any firmware image'
                  ' for model:%s' % model, 'cannot find firmware image')
    return ec_image, bios_image
Garry Wang7b0e1b72020-03-25 19:08:59 -0700466
def flash_ap_firmware_via_servo(self, image):
    """Flash AP firmware using a provided image.

    This is a short term enhancement for infra repair use. It uses
    'futility update', which will automatically determine various
    parameters needed for flashrom, and will preserve the GBB, VPD, and
    HWID for AP firmware update.
    @TODO(xianuowang@) Remove this method once b/148403277 implemented.

    @param image: the firmware image path on servohost.
    """
    cmd = 'futility update -i %s --servo_port=%s'
    self.run(cmd % (image, self.servo_port), timeout=900)
480
def _probe_and_validate_usb_dev(self):
    """This method probe the usb dev path by talking to servo, and then
    validate the dev path is valid block device to servohost.
    Possible output:
    1. Encounter error during probe usb dev, returns empty string.
    2. probe usb dev completed without error but cannot find usb dev,
       raise AutoservRepairError.
    3. probe usb dev find a usb dev path, but failed validation in this
       method, raise AutoservRepairError.

    @returns: A string of usb dev path(e.g. '/dev/sdb'), or empty string
    if unexpected error occurred during probe.
    @raises: AutoservRepairError if servo couldn't probe the usb dev path
    (servo.probe_host_usb_dev() returns empty string), or the dev path is
    not valid block device to servohost.
    """
    logging.info('Validating image usbkey on servo.')
    try:
        usb_dev = self._servo.probe_host_usb_dev()
    except Exception as e:
        # We don't want any unexpected or transient servo communicating
        # failure block usb repair, so capture all errors here.
        logging.error(e, exc_info=True)
        logging.error('Unexpected error occurred on get usbkey dev path,'
                      ' skipping usbkey validation.')
        return ''

    if usb_dev:
        # probe_host_usb_dev() sometimes return stale record,
        # so we need to make sure the path exists in fdisk.
        validate_cmd = 'fdisk -l %s' % usb_dev
        try:
            resp = self.run(validate_cmd, ignore_status=True, timeout=30)
            if resp.exit_status == 0:
                return usb_dev
            logging.error('%s is reported from "image_usbkey_dev" control'
                          ' but not detected by fdisk!', usb_dev)
        except error.AutoservRunError as e:
            # A timed-out fdisk is treated as "could not validate"; any
            # other run error propagates.
            if 'Timeout encountered' in str(e):
                logging.warning('Timeout encountered during fdisk run,'
                                ' skipping usbkey validation.')
                return ''
            raise

    raise hosts.AutoservRepairError(
          'No usbkey detected on servo, the usbkey may be either missing'
          ' or broken. Please replace usbkey on the servo and retry.',
          'missing usbkey')
529
def is_ec_supported(self):
    """Check if ec is supported on the servo_board.

    @returns: the `chrome_ec` value from the firmware config for this
              board/model; False when no servo_board is set or when
              reading the config raises.
    """
    if self.servo_board:
        try:
            frm_config = config.Config(self.servo_board, self.servo_model)
            return frm_config.chrome_ec
        except Exception as e:
            # Config lookup failures are logged and reported as "not
            # supported" rather than propagated.
            logging.error('Unexpected error when read from firmware'
                ' configs; %s', str(e))
    return False
540
def validate_image_usbkey(self):
    """This method first validate if there is a recover usbkey on servo
    that accessible to servohost, and second check if a ChromeOS image is
    already on the usb drive and return the image_name so we can avoid
    unnecessary download and flash to the recover usbkey on servo.

    Please note that, there is special error handling logic here:
    1. If unexpected error happens, we return empty string. So repair
       actions will not get blocked.
    2. If no working usbkey present on servo, but no errors, we'll raise
       AutoservRepairError here.

    @returns: image_name on the usbkey, e.g. nami-release/R82.10138.0.0,
              or empty string if no test image detected, or unexpected
              error occurred.
    @raises:  AutoservRepairError if the usbkey is not detected on servo.
    """
    usb_dev = self._probe_and_validate_usb_dev()
    if usb_dev:
        return self.get_image_name_from_usbkey(usb_dev)
    else:
        return ''
Garry Wang7b0e1b72020-03-25 19:08:59 -0700563
def repair(self, silent=False):
    """Attempt to repair servo host.

    On success the servo state is set to SERVO_STATE_WORKING, any reboot
    request from this servo is withdrawn (labstation only) and, when a
    topology object exists, the topology is generated. On failure the
    servo state is re-determined (non-localhost only); for a critical
    error the servo is disconnected, servod is stopped and the exception
    is re-raised.

    @param silent   If true, suppress logging in `status.log`.
    """
    message = 'Beginning repair for servo host %s port %s serial %s'
    message %= (self.hostname, self.servo_port, self.servo_serial)
    self.record('INFO', None, None, message)
    try:
        self._repair_strategy.repair(self, silent)
        self._servo_state = servo_constants.SERVO_STATE_WORKING
        self.record('INFO', None, None,
                    'ServoHost repair set servo_state as WORKING')
        # If target is a labstation then try to withdraw any existing
        # reboot request created by this servo because it passed repair.
        if self.is_labstation():
            self.withdraw_reboot_request()
        if self._topology:
            self._topology.generate()
    except Exception as e:
        if not self.is_localhost():
            self._servo_state = self.determine_servo_state()
            self.record('INFO', None, None,
                        'ServoHost repair set servo_state as %s'
                        % self._servo_state)
        if self._is_critical_error(e):
            self.disconnect_servo()
            self.stop_servod()
            raise
593
def _is_critical_error(self, error):
    """Decide whether a verify/repair failure should be propagated.

    NOTE: the parameter name shadows the imported `error` module inside
    this function; it is kept for caller compatibility.

    @param error: the exception raised by verify/repair.

    @returns: False when `error` is an AutoservVerifyDependencyError
              whose is_critical() is false; True otherwise.
    """
    if (isinstance(error, hosts.AutoservVerifyDependencyError)
                and not error.is_critical()):
        logging.warning('Non-critical verify failure(s) detected during'
                        ' verify/repair servo, servo connection will'
                        ' still be up but may not be fully functional.'
                        ' Some repair actions and servo dependent'
                        ' tests may not run.')
        return False
    logging.info(
            'Critical verify failure(s) detected during repair/verify '
            'servo. Disconnecting servo and running `stop servod`, all'
            ' repair actions and tests that depends on servo will not '
            'run.')
    return True
Fang Deng5d518f42013-08-02 14:04:32 -0700609
def get_servo(self):
    """Get the cached servo.Servo object.

    @return: a servo.Servo object, or None while `self._servo` is unset.
    @rtype: autotest_lib.server.cros.servo.servo.Servo
    """
    return self._servo
617
def request_reboot(self):
    """Request a servohost reboot by touching the reboot flag file.

    This only creates the flag file on the servohost (failures of the
    touch command are ignored); it does not reboot anything itself.
    """
    logging.debug('Request to reboot servohost %s has been created by '
                  'servo with port # %s', self.hostname, self.servo_port)
    touch_cmd = 'touch %s' % self._reboot_file
    self.run(touch_cmd, ignore_status=True)
624
def withdraw_reboot_request(self):
    """Withdraw a pending servohost reboot request, if there is one.

    The request is withdrawn by force-removing the reboot flag file;
    failures of the remove command are ignored.
    """
    logging.debug('Withdrawing request to reboot servohost %s that created'
                  ' by servo with port # %s if exists.',
                  self.hostname, self.servo_port)
    remove_cmd = 'rm -f %s' % self._reboot_file
    self.run(remove_cmd, ignore_status=True)
633
def start_servod(self, quick_startup=False):
    """Start the servod process on servohost.

    Builds the `start servod` command from the servo attributes of this
    host, runs it, waits for servod to come up and caches the timestamp of
    the new instance's logs.

    @param quick_startup: if True, wait SERVOD_QUICK_STARTUP_TIMEOUT after
                          starting servod; otherwise wait
                          SERVOD_STARTUP_TIMEOUT.
    """
    # Skip if running on the localhost.(crbug.com/1038168)
    if self.is_localhost():
        logging.debug("Servohost is a localhost, skipping start servod.")
        return

    # Collect the command pieces and join them with single spaces.
    pieces = ['start servod']
    if not self.servo_board:
        logging.warning('Board for DUT is unknown; starting servod'
                        ' assuming a pre-configured board.')
    else:
        pieces.append('BOARD=%s' % self.servo_board)
        # MODEL is only passed along together with a known BOARD.
        if self.servo_model:
            pieces.append('MODEL=%s' % self.servo_model)

    pieces.append('PORT=%d' % self.servo_port)
    if self.servo_serial:
        pieces.append('SERIAL=%s' % self.servo_serial)

    # Start servod with dual_v4 based on servo_setup.
    if self.is_dual_setup():
        pieces.append('DUAL_V4=1')

    # Start servod with CONFIG=cr50.xml which required for some pools.
    if self._require_cr50_servod_config():
        pieces.append('CONFIG=cr50.xml')

    # Adding customized args if any.
    if self.additional_servod_args:
        pieces.append(self.additional_servod_args)

    # Remove the symbolic links from the logs. This helps ensure that
    # a failed servod instantiation does not cause us to grab old logs
    # by mistake.
    self.remove_latest_log_symlinks()
    self.run(' '.join(pieces), timeout=60)

    # There's a lag between when `start servod` completes and when
    # the _ServodConnectionVerifier trigger can actually succeed.
    # The call to time.sleep() below gives time to make sure that
    # the trigger won't fail after we return.

    # Normally servod on servo_v3 and labstation take ~10 seconds to ready,
    # But in the rare case all servo on a labstation are in heavy use they
    # may take ~30 seconds. So the timeout value will double these value,
    # and we'll try quick start up when first time initialize servohost,
    # and use standard start up timeout in repair.
    timeout = (servo_constants.SERVOD_QUICK_STARTUP_TIMEOUT
               if quick_startup
               else servo_constants.SERVOD_STARTUP_TIMEOUT)
    logging.debug('Wait %s seconds for servod process fully up.', timeout)
    time.sleep(timeout)
    # Cache the initial instance timestamp to check against servod restarts
    self._initial_instance_ts = self.get_instance_logs_ts()
Garry Wangc1288cf2019-12-17 14:58:00 -0800691
def stop_servod(self):
    """Stop the servod process on servohost.

    Runs `stop servod` for this host's servo port (a failing command is
    ignored) and then sleeps SERVOD_TEARDOWN_TIMEOUT seconds. Does nothing
    when the servohost is the localhost.
    """
    # Skip if running on the localhost.(crbug.com/1038168)
    if self.is_localhost():
        logging.debug("Servohost is a localhost, skipping stop servod.")
        return

    logging.debug('Stopping servod on port %s', self.servo_port)
    stop_cmd = 'stop servod PORT=%d' % self.servo_port
    self.run(stop_cmd, timeout=60, ignore_status=True)
    teardown_wait = servo_constants.SERVOD_TEARDOWN_TIMEOUT
    logging.debug('Wait %s seconds for servod process fully teardown.',
                  teardown_wait)
    time.sleep(teardown_wait)
Garry Wangc1288cf2019-12-17 14:58:00 -0800706
def restart_servod(self, quick_startup=False):
    """Restart servod on the servohost: stop it, then start it again.

    @param quick_startup: passed through unchanged to start_servod().
    """
    self.stop_servod()
    self.start_servod(quick_startup)
712
def _process_servodtool_error(self, response):
    """Log the reason behind a non-zero servodtool response.

    @param response: result object of the failed command; only its
                     |stdout| is inspected.
    """
    output = response.stdout
    if re.search(servo_constants.ERROR_MESSAGE_USB_HUB_NOT_COMPATIBLE,
                 output):
        logging.error('The servo is not plugged on a usb hub that supports'
                      ' power-cycle!')
        # change the flag so we can update this label in later process.
        self.smart_usbhub = False
        return

    not_found_pattern = (servo_constants.ERROR_MESSAGE_DEVICE_NOT_FOUND %
                         self.servo_serial)
    if re.search(not_found_pattern, output):
        logging.error('No servo with serial %s found!', self.servo_serial)
        return

    logging.error('Unexpected error occurred from usbhub control, please'
                  ' file a bug and inform chrome-fleet-software@ team!')
731
def get_main_servo_usb_path(self):
    """Ask servodtool for the current usb-path of the main servo.

    The usb-path is path to the folder where usb-device was enumerated.

    @returns: string, usb-path to the main servo device,
              e.g.: '/sys/bus/usb/devices/1-6.1.3.1'.
              An empty string ('') if the command raised or exited
              with a non-zero status.
    """
    # TODO remove try-except when fix crbug.com/1087964
    try:
        resp = self.run(
                'servodtool device -s %s usb-path' % self.servo_serial,
                ignore_status=True, timeout=30)
    except Exception as e:
        # Here we catch only timeout errors.
        # Other errors is filtered by ignore_status=True
        logging.debug('Attempt to get servo usb-path failed due to '
                      'timeout; %s', e)
        return ''
    if resp.exit_status == 0:
        usb_path = resp.stdout.strip()
        logging.info('Usb path of servo %s is %s', self.servo_serial,
                     usb_path)
        return usb_path
    self._process_servodtool_error(resp)
    return ''
Garry Wangffbd2162020-04-17 16:13:48 -0700757
Otabek Kasimov86062d02020-11-17 13:30:22 -0800758 def _get_servo_usb_devnum(self):
759 """Helper function to collect current usb devnum of servo."""
760 usb_path = self.get_main_servo_usb_path()
761 if not usb_path:
762 return ''
763 resp = self.run('cat %s/devnum' % usb_path, ignore_status=True)
Garry Wangffbd2162020-04-17 16:13:48 -0700764 if resp.exit_status != 0:
765 self._process_servodtool_error(resp)
766 return ''
767 return resp.stdout.strip()
768
def reboot_servo_v3_on_need(self):
    """Reboot a servo_v3 host when one of the conditions below holds.

    1. There is an update pending on reboot.
    2. Servo_v3 has been up for more than 96 hours.

    Hosts whose board is not 'beaglebone_servo' are left alone. A failing
    reboot is logged and recorded, never raised.
    """
    if self.get_board() != 'beaglebone_servo':
        logging.info('Servo reboot is only applicable for servo V3.')
        return

    update_pending_reboot = (self._check_update_status() ==
                             self.UPDATE_STATE.PENDING_REBOOT)
    uptime_hours = float(self.check_uptime()) / 3600
    logging.info('Uptime of servo_v3: %s hour(s)', uptime_hours)
    long_up_time = uptime_hours > 96

    # Skip reboot if neither condition are met.
    if not update_pending_reboot and not long_up_time:
        return

    # A pending update takes precedence over the uptime condition.
    if update_pending_reboot:
        reboot_method = self._post_update_reboot
        message = 'Starting reboot servo_v3 because an update is pending.'
    else:
        reboot_method = self._servo_host_reboot
        message = 'Starting reboot servo_v3 because uptime > 96 hours.'
    self.record('INFO', None, None, message)
    logging.info(message)

    try:
        reboot_method()
    except Exception as e:
        logging.debug("Fail to reboot servo_v3; %s", e)
        message = ('Servo_v3 reboot failed, please check debug log '
                   'for details.')
    else:
        message = 'Servo_v3 reboot completed successfully.'
    logging.info(message)
    self.record('INFO', None, None, message)
Garry Wangffbd2162020-04-17 16:13:48 -0700805
806 def _reset_servo(self):
807 logging.info('Resetting servo through smart usbhub.')
Otabek Kasimov09192682020-06-01 18:17:44 -0700808 # TODO remove try-except when fix crbug.com/1087964
809 try:
810 resp = self.run('servodtool device -s %s power-cycle' %
811 self.servo_serial, ignore_status=True,
812 timeout=30)
813 if resp.exit_status != 0:
814 self._process_servodtool_error(resp)
815 return False
816 except Exception as e:
817 # Here we catch only timeout errors.
818 # Other errors is filtered by ignore_status=True
819 logging.debug('Attempt to reset servo failed due to timeout;'
820 ' %s', e)
Garry Wangffbd2162020-04-17 16:13:48 -0700821 return False
822
823 logging.debug('Wait %s seconds for servo to come back from reset.',
824 servo_constants.SERVO_RESET_TIMEOUT_SECONDS)
825 time.sleep(servo_constants.SERVO_RESET_TIMEOUT_SECONDS)
Garry Wang000c6c02020-05-11 21:27:23 -0700826 # change the flag so we can update this label in later process.
827 self.smart_usbhub = True
Garry Wangffbd2162020-04-17 16:13:48 -0700828 return True
829
def reset_servo(self):
    """Reset(power-cycle) the servo via smart usbhub.

    Only applies to labstations. The usb devnum of the servo is read
    before and after the reset and the comparison outcome is logged and
    recorded; nothing is returned or raised for a failed reset.
    """
    if not self.is_labstation():
        logging.info('Servo reset is not applicable to servo_v3.')
        return

    pre_reset_devnum = self._get_servo_usb_devnum()
    logging.info('Servo usb devnum before reset: %s', pre_reset_devnum)
    if not self._reset_servo():
        message = ('Failed to reset servo with serial: %s. (Please ignore'
                   ' this error if the DUT is not connected to a smart'
                   ' usbhub).' % self.servo_serial)
        logging.warning(message)
        self.record('INFO', None, None, message)
        return

    post_reset_devnum = self._get_servo_usb_devnum()
    logging.info('Servo usb devnum after reset: %s', post_reset_devnum)
    if not pre_reset_devnum or not post_reset_devnum:
        # At least one devnum is unknown, so there is nothing to compare.
        message = ('Servo reset completed but unable to verify'
                   ' devnum change!')
    elif pre_reset_devnum == post_reset_devnum:
        message = 'Servo reset completed but devnum is still not changed!'
    else:
        message = ('Reset servo with serial %s completed successfully!'
                   % self.servo_serial)
    logging.info(message)
    self.record('INFO', None, None, message)
860
Ruben Rodriguez Buchillon93084d02020-01-21 15:17:36 -0800861 def _extract_compressed_logs(self, logdir, relevant_files):
862 """Decompress servod logs in |logdir|.
863
864 @param logdir: directory containing compressed servod logs.
865 @param relevant_files: list of files in |logdir| to consider.
866
867 @returns: tuple, (tarfiles, files) where
868 tarfiles: list of the compressed filenames that have been
869 extracted and deleted
870 files: list of the uncompressed files that were generated
871 """
872 # For all tar-files, first extract them to the directory, and
873 # then let the common flow handle them.
874 tarfiles = [cf for cf in relevant_files if
875 cf.endswith(self.COMPRESSION_SUFFIX)]
876 files = []
877 for f in tarfiles:
878 norm_name = os.path.basename(f)[:-len(self.COMPRESSION_SUFFIX)]
879 with tarfile.open(f) as tf:
880 # Each tarfile has only one member, as
881 # that's the compressed log.
882 member = tf.members[0]
883 # Manipulate so that it only extracts the basename, and not
884 # the directories etc.
885 member.name = norm_name
886 files.append(os.path.join(logdir, member.name))
887 tf.extract(member, logdir)
888 # File has been extracted: remove the compressed file.
889 os.remove(f)
890 return tarfiles, files
891
892 def _extract_mcu_logs(self, log_subdir):
893 """Extract MCU (EC, Cr50, etc) console output from servod debug logs.
894
895 Using the MCU_EXTRACTOR regex (above) extract and split out MCU console
896 lines from the logs to generate invidiual console logs e.g. after
897 this method, you can find an ec.txt and servo_v4.txt in |log_dir| if
898 those MCUs had any console input/output.
899
900 @param log_subdir: directory with log.DEBUG.txt main servod debug logs.
901 """
902 # Extract the MCU for each one. The MCU logs are only in the .DEBUG
903 # files
904 mcu_lines_file = os.path.join(log_subdir, 'log.DEBUG.txt')
905 if not os.path.exists(mcu_lines_file):
906 logging.info('No DEBUG logs found to extract MCU logs from.')
907 return
908 mcu_files = {}
909 mcu_file_template = '%s.txt'
910 with open(mcu_lines_file, 'r') as f:
911 for line in f:
912 match = self.MCU_EXTRACTOR.match(line)
913 if match:
914 mcu = match.group(self.MCU_GROUP).lower()
915 line = match.group(self.LINE_GROUP)
916 if mcu not in mcu_files:
917 mcu_file = os.path.join(log_subdir,
918 mcu_file_template % mcu)
919 mcu_files[mcu] = open(mcu_file, 'a')
920 fd = mcu_files[mcu]
921 fd.write(line + '\n')
922 for f in mcu_files:
923 mcu_files[f].close()
924
def remove_latest_log_symlinks(self):
    """Remove the convenience 'latest' symlinks of the servod logs.

    Runs `rm` on everything matching 'latest*' in the remote log
    directory; a failing command is ignored.
    """
    self.run('rm %s/latest*' % self.remote_log_dir,
             stderr_tee=None, ignore_status=True)
930
def probe_servod_restart(self, instance_ts, outdir):
    """Grab servod logs from previous instances if part of this session.

    If since the last time this host called start_servod() servod crashed
    and restarted, this helper finds those logs as well, and stores them
    with the |OLD_LOG_SUFFIX| to investigate if necessary.

    It also issues a panicinfo command to servo devices after the restart
    to try and collect reboot information for debugging.

    @param instance_ts: the log timestamp that the current instance uses
    @param outdir: directory to create a subdirectory into to place the
                   servod logs into.
    """
    initial_ts = self._initial_instance_ts
    if initial_ts is None:
        logging.info('No log timestamp grabbed successfully on servod '
                     'startup. Cannot check device restarts. Ignoring.')
        return
    if instance_ts == initial_ts:
        logging.debug('Servod appears to have run without restarting')
        return
    # Servod seems to have restarted (at least once). |_initial_instance_ts|
    # is the first timestamp, and instance_ts is the current timestamp. Find
    # all timestamps in between them, and grab the logs for each.
    tss = self._find_instance_timestamps_between(initial_ts, instance_ts)
    logging.info('Servod has restarted %d times between the start and the '
                 'end of this servo_host.', len(tss))
    logging.info('This might be an issue. Will extract all logs from each '
                 'instance.')
    logging.info('Logs that are not the currently running (about to turn '
                 'down) instance are maked with a .%s in their folder.',
                 self.OLD_LOG_SUFFIX)
    for ts in tss:
        self.get_instance_logs(ts, outdir, old=True)
    # Lastly, servod has restarted due to a potential issue. Try to get
    # panic information from servo micro and servo v4 for the current logs.
    # This can only happen if the |_servo| attribute is initialized.
    if not self._servo:
        return
    for mcu in ['servo_micro', 'servo_v4']:
        ctrl = '%s_uart_cmd' % mcu
        if not self._servo.has_control(ctrl):
            continue
        logging.info('Trying to retrieve %r panicinfo into logs', mcu)
        try:
            self._servo.set_nocheck(ctrl, 'panicinfo')
        except error.TestFail as e:
            logging.error('Failed to generate panicinfo for %r '
                          'logs. %s', mcu, str(e))
980
981 def _find_instance_timestamps_between(self, start_ts, end_ts):
982 """Find all log timestamps between [start_ts, end_ts).
983
984 @param start_ts: str, earliest log timestamp of interest
985 @param end_ts: str, latest log timestamp of interest
986
987 @returns: list, all timestamps between start_ts and end_ts, end_ts
988 exclusive, on the servo_host. An empty list on errors
989 """
990 # Simply get all timestamp, and then sort and remove
991 cmd = 'ls %s' % self.remote_log_dir
992 res = self.run(cmd, stderr_tee=None, ignore_status=True)
993 if res.exit_status != 0:
994 # Here we failed to find anything.
995 logging.info('Failed to find remote servod logs. Ignoring.')
996 return []
997 logfiles = res.stdout.strip().split()
998 timestamps = set()
999 for logfile in logfiles:
1000 ts_match = self.TS_EXTRACTOR.match(logfile)
1001 if not ts_match:
1002 # Simply ignore files that fail the check. It might be the
1003 # 'latest' symlinks or random files.
1004 continue
1005 timestamps.add(ts_match.group(self.TS_GROUP))
1006 # At this point we have all unique timestamps.
1007 timestamps = sorted(timestamps)
1008 for ts in [start_ts, end_ts]:
1009 if ts not in timestamps:
1010 logging.error('Timestamp %r not in servod logs. Cannot query '
1011 'for timestamps in between %r and %r', ts,
1012 start_ts, end_ts)
1013 return []
1014 return timestamps[timestamps.index(start_ts):timestamps.index(end_ts)]
1015
def get_instance_logs_ts(self):
    """Retrieve the currently running servod instance's log timestamp

    The timestamp is extracted with the TS_EXTRACTOR regex from the name
    of the file that the 'latest.DEBUG' (or, failing that, 'latest')
    entry in the remote log directory resolves to.

    @returns: str, timestamp for current instance, or None on failure
    """
    # First, extract the timestamp. This cmd gives the real filename of
    # the latest aka current log file.
    cmd_args = {'dir': self.remote_log_dir,
                'code': self.NO_SYMLINKS_CODE}
    cmd = ('if [ -f %(dir)s/latest.DEBUG ];'
           'then realpath %(dir)s/latest.DEBUG;'
           'elif [ -f %(dir)s/latest ];'
           'then realpath %(dir)s/latest;'
           'else exit %(code)d;'
           'fi' % cmd_args)
    res = self.run(cmd, stderr_tee=None, ignore_status=True)
    if res.exit_status != 0:
        if res.exit_status != self.NO_SYMLINKS_CODE:
            logging.warning('Failed to find servod logs on servo host.')
            logging.warning(res.stderr.strip())
        else:
            logging.warning('servod log latest symlinks not found. '
                            'This is likely due to an error starting up '
                            'servod. Ignoring..')
        return None
    fname = os.path.basename(res.stdout.strip())
    # From the fname, ought to extract the timestamp using the TS_EXTRACTOR
    ts_match = self.TS_EXTRACTOR.match(fname)
    if ts_match:
        return ts_match.group(self.TS_GROUP)
    logging.warning('Failed to extract timestamp from servod log file '
                    '%r. Skipping. The servo host is using outdated '
                    'servod logging and needs to be updated.', fname)
    return None
1049
def get_instance_logs(self, instance_ts, outdir, old=False):
    """Collect all logs with |instance_ts| and dump into a dir in |outdir|

    This method first collects all logs on the servo_host side pertaining
    to this servod instance (port, instantiation). It glues them together
    into combined log.[level].txt files and extracts all available MCU
    console I/O from the logs into individual files e.g. servo_v4.txt

    All the output can be found in a directory inside |outdir| that
    this generates based on |LOG_DIR|, the servod port, and the instance
    timestamp on the servo_host side.

    @param instance_ts: log timestamp to grab logfiles for
    @param outdir: directory to create a subdirectory into to place the
                   servod logs into.
    @param old: bool, whether to append |OLD_LOG_SUFFIX| to output dir
    """
    # Create the local results log dir.
    dir_name = '%s_%s.%s' % (self.LOG_DIR, str(self.servo_port),
                             instance_ts)
    log_dir = os.path.join(outdir, dir_name)
    if old:
        log_dir = '%s.%s' % (log_dir, self.OLD_LOG_SUFFIX)
    logging.info('Saving servod logs to %r.', log_dir)
    os.mkdir(log_dir)
    # Now, get all files with that timestamp.
    find_cmd = 'find %s -maxdepth 1 -name "log.%s*"' % (self.remote_log_dir,
                                                        instance_ts)
    found = self.run(find_cmd, stderr_tee=None, ignore_status=True)
    remote_files = found.stdout.strip().split()
    try:
        self.get_file(remote_files, log_dir, try_rsync=False)
        if not os.listdir(log_dir):
            logging.info('No servod logs retrieved. Ignoring, and removing '
                         '%r again.', log_dir)
            os.rmdir(log_dir)
            return
    except error.AutoservRunError as e:
        result = e.result_obj
        if result.exit_status != 0:
            stderr = result.stderr.strip()
            logging.warning("Couldn't retrieve servod logs. Ignoring: %s",
                            stderr or '\n%s' % result)
        # Remove the log_dir as nothing was added to it.
        os.rmdir(log_dir)
        return
    # Files that have not been merged into a joint file yet.
    pending = [os.path.join(log_dir, name) for name in os.listdir(log_dir)]
    # TODO(crrev.com/c/1793030): remove no-level case once CL is pushed
    for level_name in ('DEBUG', 'INFO', 'WARNING', ''):
        level_files = [path for path in pending if level_name in path]
        if not level_files:
            # TODO(crrev.com/c/1793030): remove no-level case once CL
            # is pushed
            continue
        # Create the joint files for each loglevel. i.e log.DEBUG
        # The '.txt' helps with some online tools to avoid complaints
        # about an unknown filetype.
        if level_name:
            joint_file = '%s.%s.txt' % (self.JOINT_LOG_PREFIX, level_name)
        else:
            joint_file = '%s.txt' % self.JOINT_LOG_PREFIX
        joint_path = os.path.join(log_dir, joint_file)
        # Extract compressed logs if any.
        compressed, extracted = self._extract_compressed_logs(log_dir,
                                                              level_files)
        level_files = list(set(level_files) - set(compressed))
        level_files.extend(extracted)

        # Need to sort. As they all share the same timestamp, and
        # loglevel, the index itself is sufficient. The highest index
        # is the oldest file, therefore we need a descending sort.
        def rotation_index(path, level=level_name):
            """Custom sortkey to sort based on rotation number int."""
            if path.endswith(level):
                return 0
            return int(path.split('.')[-1])

        level_files.sort(reverse=True, key=rotation_index)
        # Just rename the first file rather than building from scratch.
        os.rename(level_files[0], joint_path)
        with open(joint_path, 'a') as joint_f:
            for logfile in level_files[1:]:
                # Transfer the file to the joint file line by line.
                with open(logfile, 'r') as log_f:
                    joint_f.writelines(log_f)
                # File has been written over. Delete safely.
                os.remove(logfile)
        # Need to remove all files form |pending| so we don't
        # analyze them again.
        pending = list(set(pending) - set(level_files) - set(compressed))
    # Lastly, extract MCU logs from the joint logs.
    self._extract_mcu_logs(log_dir)
1141
Garry Wang79e9af62019-06-12 15:19:19 -07001142 def _lock(self):
1143 """lock servohost by touching a file.
1144 """
1145 logging.debug('Locking servohost %s by touching %s file',
1146 self.hostname, self._lock_file)
1147 self.run('touch %s' % self._lock_file, ignore_status=True)
Garry Wang7c00b0f2019-06-25 17:28:17 -07001148 self._is_locked = True
Garry Wang79e9af62019-06-12 15:19:19 -07001149
Garry Wang79e9af62019-06-12 15:19:19 -07001150 def _unlock(self):
1151 """Unlock servohost by removing the lock file.
1152 """
1153 logging.debug('Unlocking servohost by removing %s file',
1154 self._lock_file)
1155 self.run('rm %s' % self._lock_file, ignore_status=True)
Garry Wang7c00b0f2019-06-25 17:28:17 -07001156 self._is_locked = False
Garry Wang79e9af62019-06-12 15:19:19 -07001157
def close(self):
    """Close the associated servo and the host object.

    In order: collect the servod logs of restarted instances, close the
    servo object, collect the servod logs of the current instance, unlock
    the servohost, stop servod and finally close the host itself. The ssh
    based steps are skipped when the servohost is not reachable. Calling
    this on an already closed host does nothing.
    """
    # NOTE: throughout this method there are multiple attempts to catch
    # all errors. This is WAI as log grabbing should not fail tests.
    # However, the goal is to catch and handle/process all errors, thus
    # we print the traceback and ask for a bug.
    if self._closed:
        logging.debug('ServoHost is already closed.')
        return

    # Only attempt ssh related actions if servohost is sshable. We call
    # check_cached_up_status() first because it's lightweighted and return
    # much faster in the case servohost is down, however, we still want
    # to call is_up() later since check_cached_up_status() is ping based
    # check and not guarantee the servohost is sshable.
    servo_host_ready = self.check_cached_up_status() and self.is_up()

    instance_ts = None
    if servo_host_ready:
        instance_ts = self.get_instance_logs_ts()
    else:
        logging.info('Servohost is down, will skip servod log collecting.')
    # TODO(crbug.com/1011516): once enabled, remove the check against
    # localhost and instead check against log-rotiation enablement.
    logs_available = (instance_ts is not None and
                      self.job and
                      not self.is_localhost())
    if logs_available:
        # Probe whether there was a servod restart, and grab those old
        # logs as well.
        try:
            self.probe_servod_restart(instance_ts, self.job.resultdir)
        except (error.AutoservRunError, error.TestFail) as e:
            logging.info('Failed to grab servo logs due to: %s. '
                         'This error is forgiven.', str(e))
        except Exception as e:
            logging.error('Unexpected error probing for old logs. %s. '
                          'Forgiven. Please file a bug and fix or catch '
                          'in log probing function', str(e),
                          exc_info=True)

    if self._servo:
        # In some cases when we run as lab-tools, the job object is None.
        outdir = self.job.resultdir if self.job else None
        self._servo.close(outdir)

    if logs_available:
        # Grab current (not old like above) logs after the servo instance
        # was closed out.
        try:
            self.get_instance_logs(instance_ts, self.job.resultdir)
        except error.AutoservRunError as e:
            logging.info('Failed to grab servo logs due to: %s. '
                         'This error is forgiven.', str(e))
        except Exception as e:
            logging.error('Unexpected error grabbing servod logs. %s. '
                          'Forgiven. Please file a bug and fix or catch '
                          'in log grabbing function', str(e), exc_info=True)

    if self._is_locked and servo_host_ready:
        # Remove the lock if the servohost has been locked.
        try:
            self._unlock()
        except error.AutoservSSHTimeout:
            logging.error('Unlock servohost failed due to ssh timeout.'
                          ' It may caused by servohost went down during'
                          ' the task.')

    # We want always stop servod after task to minimum the impact of bad
    # servod process interfere other servods.(see crbug.com/1028665)
    if servo_host_ready:
        try:
            self.stop_servod()
        except error.AutoservRunError as e:
            logging.info(
                    "Failed to stop servod due to:\n%s\n"
                    "This error is forgiven.", str(e))

    super(ServoHost, self).close()
    # Mark closed.
    self._closed = True
Congbin Guoa1f9cba2018-07-03 11:36:59 -07001237
def get_servo_state(self):
    """Return the servo state currently stored on this host."""
    current_state = self._servo_state
    return current_state
Otabek Kasimovcc9738e2020-02-14 16:17:15 -08001240
Otabek Kasimovc6f30412020-06-30 20:08:12 -07001241 def _get_host_metrics_data(self):
1242 return {'port': self.servo_port,
Otabek Kasimov0ea47362020-07-11 20:55:09 -07001243 'host': self.get_dut_hostname() or self.hostname,
Otabek Kasimovc6f30412020-06-30 20:08:12 -07001244 'board': self.servo_board or ''}
1245
def _is_servo_device_connected(self, servo_type, serial):
    """Tell whether a servo device is plugged in to the labstation.

    The device is looked up with `lsusb`, filtered by the VID/PID that
    `self.SERVO_VID_PID` registers for `servo_type` and by the serial
    number. Works for all servo devices connected to the labstation.
    For servo_v3 please use 'self._is_servo_board_present_on_servo_v3'

    @param servo_type: The type of servo device. Expecting value can be
                       servo_v4 or servo_micro.
    @param serial: The serial number of the device to detect it.

    @returns: True if the device is listed; False if it is not listed
              or if the VID/PID or serial is missing; None if running
              the detection command raised an exception.
    """
    usb_id = self.SERVO_VID_PID.get(servo_type)
    if not (usb_id and serial):
        # Nothing to search for without both VID/PID and serial number.
        return False
    logging.debug('Started to detect %s', servo_type)
    try:
        lsusb_cmd = 'lsusb -v -d %s |grep iSerial |grep %s' % (usb_id,
                                                               serial)
        outcome = self.run(lsusb_cmd, ignore_status=True, timeout=30)
        found = outcome.exit_status == 0 and outcome.stdout.strip()
        if not found:
            logging.debug('%s device is not detected; %s', servo_type,
                          outcome)
            return False
        logging.debug('The %s is plugged in to the host.', servo_type)
        return True
    except Exception as err:
        # Typically a timeout while running the command; report it and
        # give the caller "unknown" (None) rather than "absent" (False).
        timeout_counter = metrics.Counter(
                'chromeos/autotest/repair/servo_detection/timeout')
        timeout_counter.increment(fields=self._get_host_metrics_data())
        logging.error('%s device is not detected; %s', servo_type, str(err))
        return None
1276
def _is_servo_board_present_on_servo_v3(self):
    """Check if servo board is detected on servo_v3.

    Runs `lsusb` on the host and greps its output for any of the
    VID/PID values listed under 'servo_v3' in `self.SERVO_VID_PID`.

    @returns: True if a matching device is listed; False if none is
              listed or no VID/PID is configured; None if running the
              detection command raised an exception.
    """
    vid_pids = self.SERVO_VID_PID['servo_v3']
    if not vid_pids:
        # device cannot be detected without VID/PID
        return False
    logging.debug('Started to detect servo board on servo_v3')
    not_detected = 'The servo board is not detected on servo_v3'
    try:
        # Raw string: `\|` is grep's alternation operator, not a Python
        # escape sequence.
        pattern = r'\|'.join(vid_pids)
        cmd = 'lsusb | grep "%s"' % pattern
        result = self.run(cmd, ignore_status=True, timeout=30)
        if result.exit_status == 0 and result.stdout.strip():
            logging.debug('The servo board is detected on servo_v3')
            return True
        logging.debug('%s; %s', not_detected, result)
        return False
    except Exception as e:
        # can be triggered by a timeout while running the command
        metrics.Counter(
                'chromeos/autotest/repair/servo_detection/timeout'
        ).increment(fields=self._get_host_metrics_data())
        logging.error('%s; %s', not_detected, str(e))
        return None
1300
def _is_main_device_not_detected_on_servo_v4(self):
    """Check if servod cannot find main device on servo.

    The check is based on reading the servod log for servo_v4. The log
    is identified by `self._initial_instance_ts` and is only trusted
    when that timestamp is at most one hour old.

    @returns: True if the recent servod log contains the
              'No servo micro or CCD detected' error; False when there
              is no timestamp, it cannot be parsed, the log is older
              than one hour, or the error is not in the log.
    """
    if not self._initial_instance_ts:
        # latest log not found
        return False
    logging.debug('latest log for servod created at %s',
                  self._initial_instance_ts)
    try:
        # The timestamp is interpreted as UTC (calendar.timegm) so it
        # can be compared with the current UTC time below.
        log_created = calendar.timegm(time.strptime(
                self._initial_instance_ts,
                "%Y-%m-%d--%H-%M-%S.%f"))
    except ValueError:
        logging.debug('Cannot read time from log file name: %s',
                      self._initial_instance_ts)
        return False
    max_log_age_secs = 3600
    now = calendar.timegm(time.gmtime())
    if now > log_created + max_log_age_secs:
        # the log file is old we cannot use it
        logging.debug('log file was created more than hour ago, too old')
        return False
    logging.debug('latest log was created not longer then 1 hour ago')

    # check if servod can detect main device by servo_v4
    message = 'ERROR - No servo micro or CCD detected for board'
    cmd = ('cat /var/log/servod_%s/log.%s.INFO |grep "%s"'
           % (self.servo_port, self._initial_instance_ts, message))
    result = self.run(cmd, ignore_status=True)
    if result.stdout.strip():
        logging.info('Servod cannot detect main device on the servo; '
                     'Can be caused by bad hardware of servo or '
                     'issue on the DUT side.')
        return True
    logging.debug('The main device is detected')
    return False
1338
def _require_cr50_servod_config(self):
    """Check whether we need start servod with CONFIG=cr50.xml

    @returns: True when the DUT host info is available and at least one
              of its pools starts with
              `servo_constants.CR50_CONFIG_POOL_PREFIX`; False otherwise.
    """
    info = self.get_dut_host_info()
    if info:
        return any(
                pool_name.startswith(servo_constants.CR50_CONFIG_POOL_PREFIX)
                for pool_name in info.pools)
    return False
1348
def get_verifier_state(self, tag):
    """Return the state of the servo verifier identified by `tag`.

    @param tag: tag of the verifier, passed through to the repair
                strategy's `verifier_is_good()`.

    @returns: bool or None
    """
    strategy = self._repair_strategy
    return strategy.verifier_is_good(tag)
1355
def determine_servo_state(self):
    """Determine servo state based on the failed verifier.

    The state is detected from the first failed verifier, or from a
    combination of verifier results, evaluated in the priority order
    of the checks below.

    @returns: servo state value (one of the
              `servo_constants.SERVO_STATE_*` constants).
    """
    ssh = self.get_verifier_state('servo_ssh')
    # Queried alongside the other verifiers; no state below depends on
    # the disk space result yet.
    disk_space = self.get_verifier_state('disk_space')
    start_servod = self.get_verifier_state('servod_job')
    create_servo = self.get_verifier_state('servod_connection')
    init_servo = self.get_verifier_state('servod_control')
    servo_topology = self.get_verifier_state('servo_topology')
    dut_connected = self.get_verifier_state('dut_connected')
    hub_connected = self.get_verifier_state('hub_connected')
    pwr_button = self.get_verifier_state('pwr_button')
    lid_open = self.get_verifier_state('lid_open')
    ec_board = self.get_verifier_state('ec_board')
    cr50_console = self.get_verifier_state('cr50_console')
    ccd_testlab = self.get_verifier_state('ccd_testlab')

    if not ssh:
        return servo_constants.SERVO_STATE_NO_SSH

    if (start_servod == hosts.VERIFY_FAILED
                or create_servo == hosts.VERIFY_FAILED):
        # sometimes servod can start without a servo being present
        if self.is_labstation():
            if not self.servo_serial:
                return servo_constants.SERVO_STATE_WRONG_CONFIG
            # `is False` on purpose: the helper returns None when the
            # detection itself failed, which must not count as
            # "not connected".
            if self._is_servo_device_connected(
                    'servo_v4',
                    self.servo_serial) is False:
                return servo_constants.SERVO_STATE_NOT_CONNECTED
        elif self._is_servo_board_present_on_servo_v3() is False:
            return servo_constants.SERVO_STATE_NOT_CONNECTED

    if servo_topology == hosts.VERIFY_FAILED:
        return servo_constants.SERVO_STATE_TOPOLOGY_ISSUE

    if (dut_connected == hosts.VERIFY_FAILED
                or hub_connected == hosts.VERIFY_FAILED):
        if pwr_button == hosts.VERIFY_SUCCESS:
            # unexpected case
            metrics.Counter(
                    'chromeos/autotest/repair/servo_unexpected/pwr_button'
            ).increment(fields=self._get_host_metrics_data())
        return servo_constants.SERVO_STATE_DUT_NOT_CONNECTED

    if start_servod == hosts.VERIFY_FAILED:
        return servo_constants.SERVO_STATE_SERVOD_ISSUE

    if create_servo == hosts.VERIFY_FAILED:
        if (self.is_labstation()
                    and self._is_main_device_not_detected_on_servo_v4()):
            servo_type = None
            dut_info = self.get_dut_host_info()
            if dut_info:
                servo_type = dut_info.get_label_value(
                        servo_constants.SERVO_TYPE_LABEL_PREFIX)
            if servo_type and 'servo_micro' in servo_type:
                serial = self.get_servo_micro_serial_number()
                logging.debug('servo_micro serial: %s', serial)
                # The servo_micro is visible on USB but servod cannot
                # use it as the main device.
                if self._is_servo_device_connected('servo_micro',
                                                   serial):
                    return servo_constants.SERVO_STATE_BAD_RIBBON_CABLE
            # Device can be not detected because of DUT
            # TODO (otabek) update after b/159755652 and b/159754985
            metrics.Counter(
                    'chromeos/autotest/repair/servo_state/needs_replacement'
            ).increment(fields=self._get_host_metrics_data())
        elif not self.is_labstation():
            # Here need logic to check if flex cable is connected
            pass

    # one of the reasons why servo cannot be initialized
    if cr50_console == hosts.VERIFY_FAILED:
        return servo_constants.SERVO_STATE_CR50_CONSOLE_MISSING
    if ccd_testlab == hosts.VERIFY_FAILED:
        return servo_constants.SERVO_STATE_CCD_TESTLAB_ISSUE

    if (create_servo == hosts.VERIFY_FAILED
                or init_servo == hosts.VERIFY_FAILED):
        return servo_constants.SERVO_STATE_SERVOD_ISSUE

    if ec_board == hosts.VERIFY_FAILED:
        return servo_constants.SERVO_STATE_EC_BROKEN
    if pwr_button == hosts.VERIFY_FAILED:
        return servo_constants.SERVO_STATE_BAD_RIBBON_CABLE
    if lid_open == hosts.VERIFY_FAILED:
        return servo_constants.SERVO_STATE_LID_OPEN_FAILED

    # No dedicated state matched; count it so new states can be added.
    metrics.Counter(
            'chromeos/autotest/repair/unknown_servo_state'
    ).increment(fields=self._get_host_metrics_data())
    logging.info('We do not have special state for this failure yet :)')
    return servo_constants.SERVO_STATE_BROKEN
1452
def is_servo_topology_supported(self):
    """Check if servo_topology is supported.

    @returns: True only when this host is a labstation and a servo
              serial is set; otherwise False, with the reason logged.
    """
    unsupported_reason = None
    if not self.is_labstation():
        unsupported_reason = 'Servo-topology supported only for labstation.'
    elif not self.servo_serial:
        unsupported_reason = 'Servo-topology required a servo serial.'

    if unsupported_reason is None:
        return True
    logging.info(unsupported_reason)
    return False
1462
def get_topology(self):
    """Get servo topology.

    @returns: the object stored in `self._topology`.
    """
    topology = self._topology
    return topology
1466
def is_dual_setup(self):
    """Check if servo will run in dual setup.

    Dual setup is used only for servo_v4 when ccd_cr50 and servo_micro
    are used at the same time.

    @returns: True if `self.servo_setup` equals
              `servo_constants.SERVO_SETUP_VALUE_DUAL_V4`.
    """
    configured_setup = self.servo_setup
    return configured_setup == servo_constants.SERVO_SETUP_VALUE_DUAL_V4
1474
def set_dut_health_profile(self, dut_health_profile):
    """Store the health profile of the DUT on this servo host.

    @param dut_health_profile: A DeviceHealthProfile object.
    """
    profile = dut_health_profile
    logging.debug('setting dut_health_profile field to (%s)', profile)
    self._dut_health_profile = profile
1482
def get_dut_health_profile(self):
    """Return the DUT health profile stored on this servo host.

    @return A DeviceHealthProfile object.
    """
    profile = self._dut_health_profile
    return profile
1488
Otabek Kasimovcc9738e2020-02-14 16:17:15 -08001489
def make_servo_hostname(dut_hostname):
    """Given a DUT's hostname, return the hostname of its servo.

    The servo hostname is the DUT hostname with '-servo' appended to
    its first dot-separated component.

    @param dut_hostname: hostname of a DUT.

    @return hostname of the DUT's servo.

    """
    short_name, dot, domain = dut_hostname.partition('.')
    return short_name + '-servo' + dot + domain
1501
1502
def servo_host_is_up(servo_hostname):
    """Given a servo host name, return if it's up or not.

    Sends 3 pings to the host and reports whether any reply came back.

    @param servo_hostname: hostname of the servo host.

    @return True if it's up, False otherwise
    """
    # Technically, this duplicates the SSH ping done early in the servo
    # proxy initialization code.  However, this ping ends in a couple
    # seconds when it fails, rather than the 60 seconds it takes to
    # decide that an SSH ping has timed out.  Specifically, that timeout
    # happens when our servo DNS name resolves, but there is no host at
    # that IP.
    logging.info('Pinging servo host at %s', servo_hostname)
    config = ping_runner.PingConfig(servo_hostname,
                                    count=3,
                                    ignore_result=True,
                                    ignore_status=True)
    runner = ping_runner.PingRunner()
    ping_result = runner.ping(config)
    return ping_result.received > 0
1520
1521
def _map_afe_board_to_servo_board(afe_board):
    """Map a board we get from the AFE to a servo appropriate value.

    Many boards are identical to other boards for servo's purposes.
    This function makes that mapping: a board with an explicit alias is
    replaced by it, otherwise the first matching known suffix is cut off.

    @param afe_board string board name received from AFE.
    @return board we expect servo to have.

    """
    aliases = {'gizmo': 'panther'}
    droppable_suffixes = ('-freon', '_freon', '_moblab', '-cheets')
    if afe_board in aliases:
        servo_board = aliases[afe_board]
    else:
        # First suffix that matches wins; '' leaves the name untouched.
        matched = next((tail for tail in droppable_suffixes
                        if afe_board.endswith(tail)), '')
        servo_board = afe_board[:len(afe_board) - len(matched)]
    if servo_board != afe_board:
        logging.info('Mapping AFE board=%s to %s', afe_board, servo_board)
    return servo_board
1545
1546
def get_servo_args_for_host(dut_host):
    """Return servo data associated with a given DUT.

    The servo attributes are read from the host info store of the DUT;
    the servo board and model are derived from the DUT's board/model.

    @param dut_host   Instance of `Host` on which to find the servo
                      attributes.
    @return `servo_args` dict with host and an optional port, or None
            when no servo host attribute is available (including the
            case where the stored port is not an integer).
    """
    info = dut_host.host_info_store.get()
    servo_args = {}
    for key, value in six.iteritems(info.attributes):
        if key in servo_constants.SERVO_ATTR_KEYS:
            servo_args[key] = value

    port_key = servo_constants.SERVO_PORT_ATTR
    if port_key in servo_args:
        try:
            servo_args[port_key] = int(servo_args[port_key])
        except ValueError:
            logging.error('servo port is not an int: %s',
                          servo_args[port_key])
            # Reset servo_args because we don't want to use an invalid
            # port: without the host entry the function returns None.
            servo_args.pop(servo_constants.SERVO_HOST_ATTR, None)

    if info.board:
        mapped_board = _map_afe_board_to_servo_board(info.board)
        servo_args[servo_constants.SERVO_BOARD_ATTR] = mapped_board
    if info.model:
        servo_args[servo_constants.SERVO_MODEL_ATTR] = info.model

    if servo_constants.SERVO_HOST_ATTR in servo_args:
        return servo_args
    return None
Richard Barnetteea3e4602016-06-10 12:36:41 -07001574
1575
def _tweak_args_for_ssp_moblab(servo_args):
    """Replace a loopback servo host with the configured container IP.

    When the servo host in `servo_args` is 'localhost' or '127.0.0.1',
    it is overwritten in place with the 'host_container_ip' value of the
    'SSP' config section; other hosts are left unchanged.

    @param servo_args: dict of servo arguments; must contain the servo
                       host attribute.
    """
    host_key = servo_constants.SERVO_HOST_ATTR
    if servo_args[host_key] not in ('localhost', '127.0.0.1'):
        return
    servo_args[servo_constants.SERVO_HOST_ATTR] = _CONFIG.get_config_value(
            'SSP', 'host_container_ip', type=str, default=None)
1581
1582
def create_servo_host(dut,
                      servo_args,
                      try_lab_servo=False,
                      try_servo_repair=False,
                      dut_host_info=None,
                      dut_health_profile=None):
    """Create a ServoHost object for a given DUT, if appropriate.

    This function attempts to create and verify or repair a `ServoHost`
    object for a servo connected to the given `dut`, subject to various
    constraints imposed by the parameters:
      * When the `servo_args` parameter is not `None`, a servo
        host must be created, and must be checked with `repair()`.
      * Otherwise, if a servo exists in the lab and `try_lab_servo` is
        true:
          * If `try_servo_repair` is true, then create a servo host and
            check it with `repair()`.
          * Otherwise, if the servo responds to `ping` then create a
            servo host and check it with `verify()`.

    In cases where `servo_args` was not `None`, repair failure
    exceptions are passed back to the caller; otherwise, exceptions
    are logged and then discarded.  Note that this only happens in cases
    where we're called from a test (not special task) control file that
    has an explicit dependency on servo.  In that case, we require that
    repair not write to `status.log`, so as to avoid polluting test
    results.

    TODO(jrbarnette):  The special handling for servo in test control
    files is a thorn in my flesh; I dearly hope to see it cut out before
    my retirement.

    Parameters for a servo host consist of a host name, port number, and
    DUT board, and are determined from one of these sources, in order of
    priority:
      * Servo attributes from the `dut` parameter take precedence over
        all other sources of information.
      * If a DNS entry for the servo based on the DUT hostname exists in
        the CrOS lab network, that hostname is used with the default
        port and the DUT's board.
      * If no other options are found, the parameters will be taken
        from the `servo_args` dict passed in from the caller.

    @param dut                An instance of `Host` from which to take
                              servo parameters (if available).
    @param servo_args         A dictionary with servo parameters to use
                              if they can't be found from `dut`.  If
                              this argument is supplied, unrepaired
                              exceptions from `verify()` will be passed
                              back to the caller.
    @param try_lab_servo      If not true, servo host creation will be
                              skipped unless otherwise required by the
                              caller.
    @param try_servo_repair   If true, check a servo host with
                              `repair()` instead of `verify()`.
    @param dut_host_info:     A HostInfo object of the DUT that
                              connected to this servo.
    @param dut_health_profile: DUT repair info with history.

    @returns: A `(servo_host, servo_state)` tuple.  `servo_host` is a
              ServoHost object or None; `servo_state` is the state
              reported for the servo, or None when no servo was needed.

    """
    servo_required = servo_args is not None
    if dut is not None and (try_lab_servo or servo_required):
        host_derived_args = get_servo_args_for_host(dut)
        if host_derived_args is not None:
            if utils.in_moblab_ssp():
                _tweak_args_for_ssp_moblab(host_derived_args)
            logging.debug(
                    'Overriding provided servo_args (%s) with arguments'
                    ' determined from the host (%s)',
                    servo_args,
                    host_derived_args,
            )
            servo_args = host_derived_args

    if servo_args is None:
        logging.debug('No servo_args provided, and failed to find overrides.')
        if try_lab_servo or servo_required:
            return None, servo_constants.SERVO_STATE_MISSING_CONFIG
        # Regular test case that does not require the servo.
        return None, None

    # Validate the connection info before touching the servo host.
    servo_hostname = servo_args.get(servo_constants.SERVO_HOST_ATTR)
    servo_port = servo_args.get(servo_constants.SERVO_PORT_ATTR)
    if not _is_servo_host_information_exist(servo_hostname, servo_port):
        logging.debug(
                'Servo connection info missed hostname: %s , port: %s',
                servo_hostname, servo_port)
        return None, servo_constants.SERVO_STATE_MISSING_CONFIG
    if not is_servo_host_information_valid(servo_hostname, servo_port):
        logging.debug(
                'Servo connection info is incorrect hostname: %s , port: %s',
                servo_hostname, servo_port)
        return None, servo_constants.SERVO_STATE_WRONG_CONFIG
    if (not servo_required and not try_servo_repair
                and not servo_host_is_up(servo_hostname)):
        logging.debug('ServoHost is not up.')
        return None, servo_constants.SERVO_STATE_NO_SSH

    servo_host = ServoHost(**servo_args)
    if not servo_host.is_up_fast():
        # We do not have any option to recover servo_host.
        # If servo_host is not pingable then we can stop here.
        return None, servo_constants.SERVO_STATE_NO_SSH

    # Reset or reboot servo device only during AdminRepair tasks.
    if try_servo_repair:
        if servo_host._is_locked:
            # Reset servo if the servo is locked, as we check if the
            # servohost is up, if the servohost is labstation and if the
            # servohost is in lab inside the locking logic.
            servo_host.reset_servo()
        else:
            try:
                servo_host.reboot_servo_v3_on_need()
            except Exception as err:
                logging.info('[Non-critical] Unexpected error while trying to'
                             ' reboot servo_v3, skipping the reboot; %s', err)

    if dut:
        servo_host.set_dut_hostname(dut.hostname)
    if dut_host_info:
        servo_host.set_dut_host_info(dut_host_info)
    if dut_health_profile and (try_lab_servo or try_servo_repair):
        try:
            if servo_host.is_localhost():
                logging.info('Servohost is a localhost, skip device'
                             ' health profile setup...')
            else:
                dut_health_profile.init_profile(servo_host)
                servo_host.set_dut_health_profile(dut_health_profile)
        except Exception as err:
            logging.info(
                    '[Non-critical] Unexpected error while trying to'
                    ' load device health profile; %s', err)

    if try_lab_servo or try_servo_repair:
        try:
            logging.info("Check and update servo firmware.")
            servo_updater.update_servo_firmware(
                    servo_host,
                    force_update=False)
        except Exception as err:
            logging.error("Servo device update error: %s", err)

    try:
        servo_host.restart_servod(quick_startup=True)
    except error.AutoservSSHTimeout:
        logging.warning("Restart servod failed due ssh connection "
                        "to servohost timed out. This error is forgiven"
                        " here, we will retry in servo repair process.")
    except error.AutoservRunError as err:
        logging.warning("Restart servod failed due to:\n%s\n"
                        "This error is forgiven here, we will retry"
                        " in servo repair process.", str(err))

    # Note that the logic of repair() includes everything done
    # by verify().  It's sufficient to call one or the other;
    # we don't need both.
    if servo_required:
        # Failures propagate to the caller in this case.
        servo_host.repair(silent=True)
        return servo_host, servo_host.get_servo_state()

    if try_servo_repair:
        try:
            servo_host.repair()
        except Exception:
            logging.exception('servo repair failed for %s',
                              servo_host.hostname)
    else:
        try:
            servo_host.verify()
        except Exception:
            logging.exception('servo verify failed for %s',
                              servo_host.hostname)
    return servo_host, servo_host.get_servo_state()
Otabek Kasimov7267a7a2020-03-04 11:18:45 -08001759
1760
def _is_servo_host_information_exist(hostname, port):
    """Check if a servo hostname and port were provided at all.

    @param hostname Hostname of the servohost.
    @param port     servo port number (int, or a value `int()` accepts).

    @returns: True if the hostname is not blank and the port can be
              converted to an integer; False otherwise.
    """
    if hostname is None or not hostname.strip():
        return False
    if port is None:
        return False
    if not isinstance(port, int):
        try:
            int(port)
        except (TypeError, ValueError):
            # ValueError: non-numeric string; TypeError: a type that
            # int() cannot convert at all (e.g. a list).
            return False

    return True


def is_servo_host_information_valid(hostname, port):
    """Check if provided servo attributes are valid.

    @param hostname Hostname of the servohost.
    @param port     servo port number.

    @returns: A bool value to indicate if provided servo attribute valid.
    """
    if not _is_servo_host_information_exist(hostname, port):
        return False
    # checking the range of the port
    port_int = int(port)
    if port_int < 1 or port_int > 65000:
        return False
    # We expect the host to contain only letters, digits, '-', '_' and
    # '.', and to be at least 5 characters long. `\Z` anchors at the
    # very end of the string; `$` would also accept a trailing newline.
    if not re.match(r'[a-zA-Z0-9_.-]*\Z', hostname) or len(hostname) < 5:
        return False
    return True