blob: 01d951883f3b0116011584310662ce7df55392ef [file] [log] [blame]
Derek Beckettf73baca2020-08-19 15:08:47 -07001# Lint as: python2, python3
Fang Deng5d518f42013-08-02 14:04:32 -07002# Copyright (c) 2013 The Chromium OS Authors. All rights reserved.
3# Use of this source code is governed by a BSD-style license that can be
4# found in the LICENSE file.
5#
6# Expects to be run in an environment with sudo and no interactive password
7# prompt, such as within the Chromium OS development chroot.
8
9
10"""This file provides core logic for servo verify/repair process."""
11
12
Derek Beckettf73baca2020-08-19 15:08:47 -070013from __future__ import absolute_import
14from __future__ import division
15from __future__ import print_function
16
Fang Deng5d518f42013-08-02 14:04:32 -070017import logging
Raul E Rangel52ca2e82018-07-03 14:10:14 -060018import os
Ruben Rodriguez Buchillon93084d02020-01-21 15:17:36 -080019import re
20import tarfile
Andrew McRaef0679932020-08-13 09:15:23 +100021import threading
Garry Wang2b5eef92020-08-21 16:23:35 -070022import json
Garry Wangc1288cf2019-12-17 14:58:00 -080023import time
Derek Beckettf73baca2020-08-19 15:08:47 -070024import six
25import six.moves.xmlrpc_client
Otabek Kasimov120b6fa2020-07-03 00:15:27 -070026import calendar
Fang Deng5d518f42013-08-02 14:04:32 -070027
28from autotest_lib.client.bin import utils
Garry Wang79e9af62019-06-12 15:19:19 -070029from autotest_lib.client.common_lib import error
Richard Barnette9a26ad62016-06-10 12:03:08 -070030from autotest_lib.client.common_lib import hosts
Garry Wang7b0e1b72020-03-25 19:08:59 -070031from autotest_lib.client.common_lib import lsbrelease_utils
Fang Deng5d518f42013-08-02 14:04:32 -070032from autotest_lib.client.common_lib.cros import retry
Christopher Wileycef1f902014-06-19 11:11:23 -070033from autotest_lib.client.common_lib.cros.network import ping_runner
Richard Barnette9a26ad62016-06-10 12:03:08 -070034from autotest_lib.server.cros.servo import servo
Richard Barnetted31580e2018-05-14 19:58:00 +000035from autotest_lib.server.hosts import servo_repair
Garry Wangebc015b2019-06-06 17:45:06 -070036from autotest_lib.server.hosts import base_servohost
Garry Wang11b5e872020-03-11 15:14:08 -070037from autotest_lib.server.hosts import servo_constants
Otabek Kasimov4ea636e2020-04-14 23:35:06 -070038from autotest_lib.server.cros.faft.utils import config
Garry Wang11b5e872020-03-11 15:14:08 -070039from autotest_lib.client.common_lib import global_config
Otabek Kasimov8475cce2020-07-14 12:11:31 -070040from autotest_lib.site_utils.admin_audit import servo_updater
Otabek Kasimov382c3bb2020-10-28 13:22:45 -070041from autotest_lib.server.cros.servo.topology import servo_topology
Garry Wangd7367482020-02-27 13:52:40 -080042
Otabek Kasimov15963492020-06-23 21:10:51 -070043try:
44 from chromite.lib import metrics
45except ImportError:
46 metrics = utils.metrics_mock
47
Dan Shi3b2adf62015-09-02 17:46:54 -070048_CONFIG = global_config.global_config
Fang Deng5d518f42013-08-02 14:04:32 -070049
Otabek Kasimova7ba91a2020-03-09 08:31:01 -070050
Garry Wangebc015b2019-06-06 17:45:06 -070051class ServoHost(base_servohost.BaseServoHost):
52 """Host class for a servo host(e.g. beaglebone, labstation)
Dana Goyette0b6e6402019-10-04 11:09:24 -070053 that with a servo instance for a specific port.
54
55 @type _servo: servo.Servo | None
56 """
Fang Deng5d518f42013-08-02 14:04:32 -070057
# Default servod port: the SERVOD_PORT environment variable when it is set,
# otherwise 9999.
DEFAULT_PORT = int(os.getenv('SERVOD_PORT', '9999'))

# Timeout for initializing servo signals.
INITIALIZE_SERVO_TIMEOUT_SECS = 60

# Default timeout for run terminal command.
DEFAULT_TERMINAL_TIMEOUT = 30

# Name of the servod method used as the readiness test when connecting.
SERVO_READY_METHOD = 'get_version'

# Directory prefix on the servo host where the servod logs are stored.
SERVOD_LOG_PREFIX = '/var/log/servod'

# Exit code to use when symlinks for servod logs are not found.
NO_SYMLINKS_CODE = 9

# Directory in the job's results directory to dump the logs into.
LOG_DIR = 'servod'

# Prefix for joint loglevel files in the logs.
JOINT_LOG_PREFIX = 'log'

# Regex group to extract timestamp from logfile name.
TS_GROUP = 'ts'

# This regex is used to extract the timestamp from servod logs.
# files always start with log.
# NOTE(review): the '.' separators in this pattern are not escaped, so each
# of them matches any single character, not only a literal dot - confirm
# that this is intended.
TS_RE = (r'log.'
         # The timestamp is of format %Y-%m-%d--%H-%M-%S.MS
         r'(?P<%s>\d{4}(\-\d{2}){2}\-(-\d{2}){3}.\d{3})'
         # The loglevel is optional depending on labstation version.
         r'(.(INFO|DEBUG|WARNING))?' % TS_GROUP)
TS_EXTRACTOR = re.compile(TS_RE)

# Regex group to extract MCU name from logline in servod logs.
MCU_GROUP = 'mcu'

# Regex group to extract logline from MCU logline in servod logs.
LINE_GROUP = 'line'

# This regex is used to extract the mcu and the line content from an
# MCU logline in servod logs. e.g. EC or servo_v4 console logs.
# Here is an example log-line:
#
# 2020-01-23 13:15:12,223 - servo_v4 - EC3PO.Console - DEBUG -
# console.py:219:LogConsoleOutput - /dev/pts/9 - cc polarity: cc1
#
# Here is conceptually how they are formatted:
#
#  <time> - <MCU> - EC3PO.Console - <LVL> - <file:line:func> - <pts> -
#  <output>
#
# The log format starts with a timestamp
MCU_RE = (r'[\d\-]+ [\d:,]+ '
          # The mcu that is logging this is next.
          r'- (?P<%s>\w+) - '
          # Next, we have more log outputs before the actual line.
          # Information about the file line, logging function etc.
          # Anchor on EC3PO Console, LogConsoleOutput and dev/pts.
          # NOTE: if the log format changes, this regex needs to be
          # adjusted.
          r'EC3PO\.Console[\s\-\w\d:.]+LogConsoleOutput - /dev/pts/\d+ - '
          # Lastly, we get the MCU's console line.
          r'(?P<%s>.+$)' % (MCU_GROUP, LINE_GROUP))
MCU_EXTRACTOR = re.compile(MCU_RE)

# Regex to detect timeout messages when USBC pigtail has timeout issue.
# e.g.:  [475635.427072 PD TMOUT RX 1/1]
USBC_PIGTAIL_TIMEOUT_RE = r'\[[\d \.]{1,20}(PD TMOUT RX 1\/1)\]'

# Suffix to identify compressed logfiles.
COMPRESSION_SUFFIX = '.tbz2'

# A suffix to mark servod log directories that came from instance that
# ran during this servo_host, but are not the last one running e.g. when
# an instance (on purpose, or due to a bug) restarted in the middle of the
# run.
OLD_LOG_SUFFIX = 'old'

# Mapping servo board with their vid-pid.
# Values are a single 'vid:pid' string, except servo_v3 which maps to a
# list of such strings; consumers have to handle both shapes.
SERVO_VID_PID = {
    'servo_v4':'18d1:501b',
    'ccd_cr50':'18d1:5014',
    'servo_micro':'18d1:501a',
    'servo_v3':['18d1:5004', '0403:6014'],
}
145
Otabek Kasimovcc9738e2020-02-14 16:17:15 -0800146 def _init_attributes(self):
147 self._servo_state = None
148 self.servo_port = None
149 self.servo_board = None
150 self.servo_model = None
151 self.servo_serial = None
Garry Wangcb06f3b2020-10-08 20:56:21 -0700152 self.servo_setup = None
Garry Wang000c6c02020-05-11 21:27:23 -0700153 # The flag that indicate if a servo is connected to a smart usbhub.
154 # TODO(xianuowang@) remove this flag once all usbhubs in the lab
155 # get replaced.
156 self.smart_usbhub = None
Otabek Kasimovcc9738e2020-02-14 16:17:15 -0800157 self._servo = None
Otabek Kasimov382c3bb2020-10-28 13:22:45 -0700158 self._topology = None
Andrew McRaef0679932020-08-13 09:15:23 +1000159 self._tunnel_proxy = None
160 self._tunnel_proxy_lock = threading.Lock()
Ruben Rodriguez Buchillon5bac3062020-03-25 21:32:58 -0700161 self._initial_instance_ts = None
Ruben Rodriguez Buchillon93084d02020-01-21 15:17:36 -0800162 # Flag to make sure that multiple calls to close do not result in the
163 # logic executing multiple times.
164 self._closed = False
Andrew McRaef0679932020-08-13 09:15:23 +1000165 # Per-thread local data
166 self._local = threading.local()
Fang Deng5d518f42013-08-02 14:04:32 -0700167
def _initialize(self,
                servo_host='localhost',
                servo_port=DEFAULT_PORT,
                servo_board=None,
                servo_model=None,
                servo_serial=None,
                servo_setup=None,
                is_in_lab=None,
                *args,
                **dargs):
    """Initialize a ServoHost instance.

    A ServoHost instance represents a host that controls a servo.

    Besides storing the servo parameters, this derives the remote log
    directory and the lock/reboot flag file paths from the servo port,
    locks an in-lab labstation and creates the repair strategy.

    @param servo_host: Name of the host where the servod process
                       is running.
    @param servo_port: Port the servod process is listening on. Defaults
                       to the SERVOD_PORT environment variable if set,
                       otherwise 9999.
    @param servo_board: Board that the servo is connected to.
    @param servo_model: Model that the servo is connected to.
    @param servo_serial: Serial number of the servo device.
    @param servo_setup: Type of servo setup, e.g. REGULAR or DUAL_V4.
    @param is_in_lab: True if the servo host is in Cros Lab. Default is set
                      to None, for which utils.host_is_in_lab_zone will be
                      called to check if the servo host is in Cros lab.
    @param args: Extra positional arguments, forwarded to the parent
                 class' `_initialize`.
    @param dargs: Extra keyword arguments, forwarded to the parent
                  class' `_initialize`.

    """
    super(ServoHost, self)._initialize(hostname=servo_host,
                                       is_in_lab=is_in_lab, *args, **dargs)
    # Reset all attributes to their defaults first; the assignments below
    # then overwrite the ones that were passed in.
    self._init_attributes()
    self.servo_port = int(servo_port)
    self.servo_board = servo_board
    self.servo_model = servo_model
    self.servo_serial = servo_serial
    self.servo_setup = servo_setup

    # Only build a topology object when this host supports it; otherwise
    # `_topology` keeps the None set by `_init_attributes`.
    if self.is_servo_topology_supported():
        self._topology = servo_topology.ServoTopology(self)

    # The location of the log files on the servo host for this instance.
    self.remote_log_dir = '%s_%s' % (self.SERVOD_LOG_PREFIX,
                                     self.servo_port)
    # Path of the servo host lock file.
    self._lock_file = (self.TEMP_FILE_DIR + str(self.servo_port) +
                       self.LOCK_FILE_POSTFIX)
    # File path to declare a reboot request.
    self._reboot_file = (self.TEMP_FILE_DIR + str(self.servo_port) +
                         self.REBOOT_FILE_POSTFIX)

    # Lock the servo host if it's an in-lab labstation to prevent other
    # task to reboot it until current task completes. We also wait and
    # make sure the labstation is up here, in the case of the labstation is
    # in the middle of reboot.
    self._is_locked = False
    if (self.wait_up(self.REBOOT_TIMEOUT) and self.is_in_lab()
                and self.is_labstation()):
        self._lock()
        # Readiness is best effort: a failure is only logged and does not
        # abort initialization.
        try:
            self.wait_ready()
        except Exception as e:
            logging.info(
                    'Unexpected error while ensure labstation'
                    ' readiness; %s', str(e))

    self._repair_strategy = (
            servo_repair.create_servo_repair_strategy())
Richard Barnettee519dcd2016-08-15 17:37:17 -0700235
Dana Goyetteafa62fd2020-03-16 13:45:27 -0700236 def __str__(self):
237 return "<%s '%s:%s'>" % (
238 type(self).__name__, self.hostname, self.servo_port)
239
def connect_servo(self):
    """Create the servo object and then prepare the DUT for servo use."""
    # Order matters: the servo object must exist before the DUT setup.
    for setup_step in (self.initilize_servo, self.initialize_dut_for_servo):
        setup_step()
245
def initilize_servo(self):
    """Create the servo.Servo object for the servod server on this host.

    Stores the new object in `self._servo`. Constructing it verifies that
    all network connections are working, and creates an ssh tunnel if
    one is required.
    """
    servo_kwargs = {
        'servo_host': self,
        'servo_serial': self.servo_serial,
    }
    self._servo = servo.Servo(**servo_kwargs)
Richard Barnette9a26ad62016-06-10 12:03:08 -0700255
def initialize_dut_for_servo(self):
    """Set up DUT control through the already created servo object.

    This does some setup for dut control, e.g. setup of the main servo_v4
    device, and also tests the connection between servo and DUT. As a
    side effect of testing the connection, all signals on the target
    servo are reset to default values, and the USB stick is set to the
    neutral (off) position.

    @raises AutoservVerifyError if no servo object exists yet, or if the
            setup does not finish within INITIALIZE_SERVO_TIMEOUT_SECS.
    """
    servo_obj = self._servo
    if not servo_obj:
        raise hosts.AutoservVerifyError(
                'Servo object needs to be initialized before initialize DUT.')
    timed_out, _ = retry.timeout(
            servo_obj.initialize_dut,
            timeout_sec=self.INITIALIZE_SERVO_TIMEOUT_SECS)
    if timed_out:
        raise hosts.AutoservVerifyError(
                'Initialize dut for servo timed out.')
Richard Barnette9a26ad62016-06-10 12:03:08 -0700273
def disconnect_servo(self):
    """Disconnect our servo if it exists.

    If we've previously successfully connected to our servo,
    disconnect any established ssh tunnel, drop the proxy that was
    cached for that tunnel, and set `self._servo` back to `None`.
    Does nothing when no servo is connected.
    """
    if not self._servo:
        return
    # N.B. This call is safe even without a tunnel:
    # rpc_server_tracker.disconnect() silently ignores
    # unknown ports.
    self.rpc_server_tracker.disconnect(self.servo_port)
    # The cached proxy was created for the tunnel that has just been
    # disconnected. Forget it, so that the next call to
    # get_servod_server_proxy() creates a fresh tunnel and proxy instead
    # of handing out the stale one. Use the same lock as the creator.
    with self._tunnel_proxy_lock:
        self._tunnel_proxy = None
    self._servo = None
Fang Deng5d518f42013-08-02 14:04:32 -0700287
Andrew McRaef0679932020-08-13 09:15:23 +1000288 def _maybe_create_servod_ssh_tunnel_proxy(self):
289 """Create a xmlrpc proxy for use with a ssh tunnel.
290 A lock is used to safely create a singleton proxy.
291 """
292 with self._tunnel_proxy_lock:
293 if self._tunnel_proxy is None:
294 self._tunnel_proxy = self.rpc_server_tracker.xmlrpc_connect(
295 None,
296 self.servo_port,
297 ready_test_name=self.SERVO_READY_METHOD,
298 timeout_seconds=60,
299 request_timeout_seconds=3600,
300 server_desc=str(self))
301
def get_servod_server_proxy(self):
    """Return the servod proxy, creating it on first use.

    With ssh tunnelling enabled and a non-local servo host, a single
    tunnel based proxy is shared. Otherwise each thread gets its own
    direct http proxy.

    @returns: An xmlrpclib.ServerProxy that is connected to the servod
              server on the host.
    """
    use_ssh_tunnel = (servo_constants.ENABLE_SSH_TUNNEL_FOR_SERVO
                      and not self.is_localhost())
    if use_ssh_tunnel:
        # Check for existing ssh tunnel proxy.
        if self._tunnel_proxy is None:
            self._maybe_create_servod_ssh_tunnel_proxy()
        return self._tunnel_proxy

    # xmlrpc/httplib is not thread-safe, so each thread must have its
    # own separate proxy connection.
    thread_state = self._local
    if not hasattr(thread_state, "_per_thread_proxy"):
        servod_url = 'http://%s:%s' % (self.hostname, self.servo_port)
        thread_state._per_thread_proxy = (
                six.moves.xmlrpc_client.ServerProxy(servod_url))
    return thread_state._per_thread_proxy
Wai-Hong Tam3a8a2552019-11-19 14:28:04 +0800323
def verify(self, silent=False):
    """Update the servo host and verify it's in a good state.

    On success the servo state becomes WORKING and the topology, if any,
    is generated. On failure the servo state is re-determined (unless the
    servo host is localhost) and the exception is re-raised only when it
    is a critical one.

    @param silent   If true, suppress logging in `status.log`.
    """
    self.record('INFO', None, None,
                'Beginning verify for servo host %s port %s serial %s'
                % (self.hostname, self.servo_port, self.servo_serial))
    try:
        self._repair_strategy.verify(self, silent)
        self._servo_state = servo_constants.SERVO_STATE_WORKING
        self.record('INFO', None, None,
                    'ServoHost verify set servo_state as WORKING')
        topology = self._topology
        if topology:
            topology.generate()
    except Exception as verify_error:
        is_remote = not self.is_localhost()
        if is_remote:
            self._servo_state = self.determine_servo_state()
            state_message = ('ServoHost verify set servo_state as %s'
                             % self._servo_state)
            self.record('INFO', None, None, state_message)
        if self._is_critical_error(verify_error):
            raise
Fang Deng5d518f42013-08-02 14:04:32 -0700347
Garry Wang2b5eef92020-08-21 16:23:35 -0700348 def _get_default_usbkey_mount_path(self):
349 return '/media/servo_usb/%s' % self.servo_port
Fang Deng5d518f42013-08-02 14:04:32 -0700350
def get_image_name_from_usbkey(self, usbkey_dev):
    """Mount the usb drive and read the ChromeOS image name from it.

    This method assumes the image_usbkey_direction is already set
    to servo side. The drive is always unmounted again before returning.

    @param usbkey_dev: usbkey dev path(e.g. /dev/sdb).

    @returns: image_name on the usbkey, e.g. nami-release/R82.10138.0.0,
              or empty string if no test image detected, or unexpected
              error occurred.
    """
    logging.info('Checking ChromeOS image name on usbkey.')
    mount_point = self._get_default_usbkey_mount_path()
    # Unmount if there is an existing stale mount.
    self._unmount_drive(mount_point)
    # ChromeOS root fs is in /dev/sdx3
    rootfs_partition = usbkey_dev + '3'
    try:
        mounted = self._mount_drive(rootfs_partition, mount_point)
        if not mounted:
            logging.debug('Unexpected error occurred on mount usb drive.')
            return ''

        lsb_release_cmd = 'cat %s/etc/lsb-release' % mount_point
        lsb_release = self.run(lsb_release_cmd,
                               ignore_status=True).stdout.strip()

        # Only test images are of interest here.
        if re.search(r'RELEASE_TRACK=.*test', lsb_release):
            return lsbrelease_utils.get_chromeos_release_builder_path(
                    lsb_release_content=lsb_release)

        logging.info('The image on usbkey is not a test image')
        return ''
    finally:
        logging.debug('Image check compeleted, unmounting the usb drive.')
        self._unmount_drive(mount_point)
Garry Wang7b0e1b72020-03-25 19:08:59 -0700386
Garry Wang2b5eef92020-08-21 16:23:35 -0700387 def _extract_firmware_image_from_usbkey(self, fw_dst):
388 """Extract firmware images from the usbkey on servo, this method
389 assumes there is already a ChromeOS test image staged on servo.
390
Garry Wang4b980202020-09-24 17:00:17 -0700391 @param fw_dst: the path that we'll copy firmware images to.
Garry Wang2b5eef92020-08-21 16:23:35 -0700392
393 @returns: a json format string of firmware manifest data.
394 """
395 usbkey_dev = self._probe_and_validate_usb_dev()
396 if not usbkey_dev:
397 raise hosts.AutoservRepairError('Unexpected error occurred when'
398 ' probe usbkey dev path, please check logs for detail.')
399
400 mount_dst = self._get_default_usbkey_mount_path()
401 # Unmount if there is an existing stale mount.
402 self._unmount_drive(mount_dst)
403 # ChromeOS root fs is in /dev/sdx3
404 mount_src = usbkey_dev + '3'
405 try:
406 if not self._mount_drive(mount_src, mount_dst):
407 raise hosts.AutoservRepairError('Failed to extract firmware'
408 ' image; Unable to mount %s.' % usbkey_dev,
409 'unable to mount usbkey')
410 updater_bin = os.path.join(mount_dst,
411 'usr/sbin/chromeos-firmwareupdate')
412 self.run('%s --unpack %s' % (updater_bin, fw_dst))
413 return self.run('%s --manifest' % updater_bin).stdout
414 finally:
415 self._unmount_drive(mount_dst)
416
def prepare_repair_firmware_image(self, fw_dst=None):
    """Stage firmware images on the servohost for the auto repair process.

    The destination directory is wiped and re-created, the firmware is
    extracted from the usbkey into it, and the image paths are looked up
    in the firmware manifest by the DUT's model.

    @param fw_dst: the path that we want to store firmware image on
                   the servohost. Defaults to a directory under
                   /tmp/firmware_image named after the servo port.

    @returns: A tuple that contains ec firmware image path and bios
              firmware image path on the servohost, or None if type of
              image is not available based on manifest and dut's model.
    @raises: AutoservRepairError if the model is unknown, the manifest
             has no entry for the model, or neither image is available.
    """
    model = self.servo_model or self._dut_host_info.model
    if not model:
        raise hosts.AutoservRepairError(
                'Could not determine DUT\'s model.',
                'model infomation unknown')

    if not fw_dst:
        fw_dst = '/tmp/firmware_image/%s' % self.servo_port
    # Cleanup and re-create dst path to have a fresh start.
    for command_template in ('rm -rf %s', 'mkdir -p %s'):
        self.run(command_template % fw_dst)

    manifest_json = self._extract_firmware_image_from_usbkey(fw_dst)
    manifest = json.loads(manifest_json)
    # For models that have packed $MODEL_signed variant, we want use the
    # 'signed' variant once we get DVT devices, so try to read manifest
    # from $MODEL_signed first.
    build = manifest.get('%s_signed' % model) or manifest.get(model)
    if not build:
        raise hosts.AutoservRepairError(
                'Could not find firmware manifest for model:%s' % model,
                'model manifest not found')

    # 'ec' holds the ec image, 'host' holds the bios image; either one may
    # be missing from the manifest.
    image_paths = []
    for section in ('ec', 'host'):
        try:
            image_paths.append(os.path.join(fw_dst,
                                            build[section]['image']))
        except KeyError:
            image_paths.append(None)
    ec_image, bios_image = image_paths

    if not (ec_image or bios_image):
        raise hosts.AutoservRepairError(
                'Could not find any firmware image for model:%s' % model,
                'cannot find firmware image')
    return ec_image, bios_image
Garry Wang7b0e1b72020-03-25 19:08:59 -0700460
def flash_ap_firmware_via_servo(self, image):
    """Flash AP firmware from the provided image.

    This is a short term enhancement for infra repair use. It uses
    'futility update', which automatically determines the various
    parameters needed for flashrom and preserves the GBB, VPD, and HWID
    during the AP firmware update.
    @TODO(xianuowang@) Remove this method once b/148403277 implemented.

    @param image: the firmware image path on servohost.
    """
    flash_cmd = ('futility update -i %s --servo_port=%s'
                 % (image, self.servo_port))
    # Flashing is slow, so allow up to 900 seconds.
    self.run(flash_cmd, timeout=900)
474
Garry Wang70e5d062020-04-03 18:01:05 -0700475 def _probe_and_validate_usb_dev(self):
476 """This method probe the usb dev path by talking to servo, and then
477 validate the dev path is valid block device to servohost.
478 Possible output:
479 1. Encounter error during probe usb dev, returns empty string.
480 2. probe usb dev completed without error but cannot find usb dev,
481 raise AutoservRepairError.
482 3. probe usb dev find a usb dev path, but failed validation in this
483 method, raise AutoservRepairError.
Garry Wang7b0e1b72020-03-25 19:08:59 -0700484
Garry Wang70e5d062020-04-03 18:01:05 -0700485 @returns: A string of usb dev path(e.g. '/dev/sdb'), or empty string
486 if unexpected error occurred during probe.
487 @raises: AutoservRepairError if servo couldn't probe the usb dev path
488 (servo.probe_host_usb_dev() returns empty string), or the dev path is
489 not valid block device to servohost.
Garry Wang7b0e1b72020-03-25 19:08:59 -0700490 """
491 logging.info('Validating image usbkey on servo.')
Garry Wang7b0e1b72020-03-25 19:08:59 -0700492 try:
Garry Wang70e5d062020-04-03 18:01:05 -0700493 usb_dev = self._servo.probe_host_usb_dev()
Garry Wang7b0e1b72020-03-25 19:08:59 -0700494 except Exception as e:
495 # We don't want any unexpected or transient servo communicating
496 # failure block usb repair, so capture all errors here.
497 logging.error(e, exc_info=True)
498 logging.error('Unexpected error occurred on get usbkey dev path,'
499 ' skipping usbkey validation.')
500 return ''
501
Garry Wang70e5d062020-04-03 18:01:05 -0700502 if usb_dev:
503 # probe_host_usb_dev() sometimes return stale record,
504 # so we need to make sure the path exists in fdisk.
Otabek Kasimov77bff672020-10-08 15:52:03 -0700505 validate_cmd = 'fdisk -l %s' % usb_dev
Garry Wang11441182020-06-16 18:34:14 -0700506 try:
Otabek Kasimov77bff672020-10-08 15:52:03 -0700507 resp = self.run(validate_cmd, ignore_status=True, timeout=30)
Garry Wang11441182020-06-16 18:34:14 -0700508 if resp.exit_status == 0:
509 return usb_dev
Garry Wang11441182020-06-16 18:34:14 -0700510 logging.error('%s is reported from "image_usbkey_dev" control'
511 ' but not detected by fdisk!', usb_dev)
512 except error.AutoservRunError as e:
513 if 'Timeout encountered' in str(e):
514 logging.warning('Timeout encountered during fdisk run,'
515 ' skipping usbkey validation.')
516 return ''
517 raise
Garry Wang70e5d062020-04-03 18:01:05 -0700518
519 raise hosts.AutoservRepairError(
520 'No usbkey detected on servo, the usbkey may be either missing'
521 ' or broken. Please replace usbkey on the servo and retry.',
522 'missing usbkey')
523
def is_ec_supported(self):
    """Check if ec is supported on the servo_board.

    @returns: the `chrome_ec` value of the firmware config for the
              board/model; False when the board is unknown or the config
              could not be read.
    """
    if not self.servo_board:
        return False
    try:
        return config.Config(self.servo_board, self.servo_model).chrome_ec
    except Exception as e:
        # Reading the config is best effort; treat failures as unsupported.
        logging.error('Unexpected error when read from firmware'
                      ' configs; %s', str(e))
    return False
534
def validate_image_usbkey(self):
    """Validate the recovery usbkey and report the image staged on it.

    First validates that there is a recovery usbkey on servo that is
    accessible to servohost, then checks if a ChromeOS image is already
    on the usb drive and returns its image_name, so we can avoid an
    unnecessary download and flash to the recovery usbkey on servo.

    Please note the special error handling logic here:
        1. If an unexpected error happens, the empty string is returned,
           so repair actions will not get blocked.
        2. If no working usbkey is present on servo, but no errors
           happened, AutoservRepairError is raised.

    @returns: image_name on the usbkey, e.g. nami-release/R82.10138.0.0,
              or empty string if no test image detected, or unexpected
              error occurred.
    @raises:  AutoservRepairError if the usbkey is not detected on servo.
    """
    dev_path = self._probe_and_validate_usb_dev()
    return self.get_image_name_from_usbkey(dev_path) if dev_path else ''
Garry Wang7b0e1b72020-03-25 19:08:59 -0700557
def repair(self, silent=False):
    """Attempt to repair servo host.

    On success the servo state becomes WORKING, a pending reboot request
    of a labstation is withdrawn and the topology, if any, is generated.
    On failure the servo state is re-determined (unless the servo host is
    localhost); for a critical failure the servo is disconnected, servod
    is stopped and the exception is re-raised.

    @param silent   If true, suppress logging in `status.log`.
    """
    self.record('INFO', None, None,
                'Beginning repair for servo host %s port %s serial %s'
                % (self.hostname, self.servo_port, self.servo_serial))
    try:
        self._repair_strategy.repair(self, silent)
        self._servo_state = servo_constants.SERVO_STATE_WORKING
        self.record('INFO', None, None,
                    'ServoHost repair set servo_state as WORKING')
        # If target is a labstation then try to withdraw any existing
        # reboot request created by this servo because it passed repair.
        if self.is_labstation():
            self.withdraw_reboot_request()
        topology = self._topology
        if topology:
            topology.generate()
    except Exception as repair_error:
        is_remote = not self.is_localhost()
        if is_remote:
            self._servo_state = self.determine_servo_state()
            state_message = ('ServoHost repair set servo_state as %s'
                             % self._servo_state)
            self.record('INFO', None, None, state_message)
        if self._is_critical_error(repair_error):
            self.disconnect_servo()
            self.stop_servod()
            raise
587
def _is_critical_error(self, error):
    """Tell whether a verify/repair failure is a critical one.

    Only an AutoservVerifyDependencyError that reports itself as not
    critical counts as non-critical; everything else is critical.

    @param error: the exception raised by verify/repair.

    @returns: False for a non-critical failure, True otherwise.
    """
    is_non_critical = (
            isinstance(error, hosts.AutoservVerifyDependencyError)
            and not error.is_critical())
    if not is_non_critical:
        logging.info(
                'Critical verify failure(s) detected during repair/verify '
                'servo. Disconnecting servo and running `stop servod`, all'
                ' repair actions and tests that depends on servo will not '
                'run.')
        return True
    logging.warning('Non-critical verify failure(s) detected during'
                    ' verify/repair servo, servo connection will'
                    ' still be up but may not be fully functional.'
                    ' Some repair actions and servo dependent'
                    ' tests may not run.')
    return False
Fang Deng5d518f42013-08-02 14:04:32 -0700603
def get_servo(self):
    """Return the servo object cached on this host.

    @return: the cached servo.Servo object, as stored in `self._servo`.
    @rtype: autotest_lib.server.cros.servo.servo.Servo
    """
    cached_servo = self._servo
    return cached_servo
611
def request_reboot(self):
    """Ask for a servohost reboot, once it is safe, by touching a file.

    A failure of the touch command is ignored.
    """
    logging.debug('Request to reboot servohost %s has been created by '
                  'servo with port # %s', self.hostname, self.servo_port)
    touch_cmd = 'touch %s' % self._reboot_file
    self.run(touch_cmd, ignore_status=True)
618
def withdraw_reboot_request(self):
    """Cancel a pending servohost reboot request, if there is one.

    The request is withdrawn by force-removing the reboot flag file; the
    command is run with ignore_status=True.
    """
    logging.debug('Withdrawing request to reboot servohost %s that created'
                  ' by servo with port # %s if exists.',
                  self.hostname, self.servo_port)
    remove_cmd = 'rm -f %s' % self._reboot_file
    self.run(remove_cmd, ignore_status=True)
627
def start_servod(self, quick_startup=False):
    """Start the servod process on servohost.

    Does nothing when the servohost is the localhost. Otherwise the
    `start servod` command line is assembled from this host's board, model,
    port, serial, dual-v4 and cr50-config settings, the 'latest' log
    symlinks are removed, the command is run, and the call sleeps so that
    servod has time to come up before the instance log timestamp is cached.

    @param quick_startup: bool, sleep SERVOD_QUICK_STARTUP_TIMEOUT rather
                          than SERVOD_STARTUP_TIMEOUT after launching.
    """
    # Skip if running on the localhost.(crbug.com/1038168)
    if self.is_localhost():
        logging.debug("Servohost is a localhost, skipping start servod.")
        return

    # Collect the pieces of the command; they are joined with single spaces.
    args = ['start servod']
    if not self.servo_board:
        logging.warning('Board for DUT is unknown; starting servod'
                        ' assuming a pre-configured board.')
    else:
        args.append('BOARD=%s' % self.servo_board)
        # MODEL is only passed along together with a known BOARD.
        if self.servo_model:
            args.append('MODEL=%s' % self.servo_model)

    args.append('PORT=%d' % self.servo_port)
    if self.servo_serial:
        args.append('SERIAL=%s' % self.servo_serial)

    # Start servod with dual_v4 based on servo_setup.
    if self.is_dual_setup():
        args.append('DUAL_V4=1')

    # Start servod with CONFIG=cr50.xml which required for some pools.
    if self._require_cr50_servod_config():
        args.append('CONFIG=cr50.xml')

    # Drop the 'latest' symlinks first so that a failed servod start cannot
    # make us pick up logs of an older instance by mistake.
    self.remove_latest_log_symlinks()
    self.run(' '.join(args), timeout=60)

    # `start servod` returns before the _ServodConnectionVerifier trigger
    # can succeed, so sleep to make sure the trigger won't fail after we
    # return.
    #
    # Normally servod on servo_v3 and labstation take ~10 seconds to ready,
    # but in the rare case all servo on a labstation are in heavy use they
    # may take ~30 seconds. The timeout values double these numbers; the
    # quick value is meant for first-time servohost initialization and the
    # standard one for repair.
    timeout = (servo_constants.SERVOD_QUICK_STARTUP_TIMEOUT
               if quick_startup
               else servo_constants.SERVOD_STARTUP_TIMEOUT)
    logging.debug('Wait %s seconds for servod process fully up.', timeout)
    time.sleep(timeout)
    # Cache the initial instance timestamp to check against servod restarts
    self._initial_instance_ts = self.get_instance_logs_ts()
Garry Wangc1288cf2019-12-17 14:58:00 -0800681
def stop_servod(self):
    """Stop the servod process on servohost.

    Does nothing when the servohost is the localhost. Otherwise runs
    `stop servod` for this host's port (non-zero exit status is ignored)
    and then sleeps SERVOD_TEARDOWN_TIMEOUT seconds.
    """
    # Skip if running on the localhost.(crbug.com/1038168)
    if self.is_localhost():
        logging.debug("Servohost is a localhost, skipping stop servod.")
        return

    logging.debug('Stopping servod on port %s', self.servo_port)
    stop_cmd = 'stop servod PORT=%d' % self.servo_port
    self.run(stop_cmd, timeout=60, ignore_status=True)
    logging.debug('Wait %s seconds for servod process fully teardown.',
                  servo_constants.SERVOD_TEARDOWN_TIMEOUT)
    time.sleep(servo_constants.SERVOD_TEARDOWN_TIMEOUT)
Garry Wangc1288cf2019-12-17 14:58:00 -0800696
def restart_servod(self, quick_startup=False):
    """Restart servod on the servohost: stop it, then start it again.

    @param quick_startup: bool, forwarded unchanged to start_servod().
    """
    self.stop_servod()
    self.start_servod(quick_startup)
702
def _process_servodtool_error(self, response):
    """Log the reason behind a non-zero servodtool response.

    The stdout of |response| is matched against the known servodtool error
    messages. When the usb hub is reported as not compatible the
    |smart_usbhub| flag is additionally cleared.

    @param response: result object of the failed command; only its stdout
                     is inspected.
    """
    output = response.stdout
    if re.search(servo_constants.ERROR_MESSAGE_USB_HUB_NOT_COMPATIBLE,
                 output):
        logging.error('The servo is not plugged on a usb hub that supports'
                      ' power-cycle!')
        # change the flag so we can update this label in later process.
        self.smart_usbhub = False
    elif re.search(servo_constants.ERROR_MESSAGE_DEVICE_NOT_FOUND %
                   self.servo_serial, output):
        logging.error('No servo with serial %s found!', self.servo_serial)
    else:
        logging.error('Unexpected error occurred from usbhub control, please'
                      ' file a bug and inform chrome-fleet-software@ team!')
721
Garry Wangffbd2162020-04-17 16:13:48 -0700722 def _get_servo_usb_devnum(self):
723 """Helper function to collect current usb devnum of servo.
724 """
Otabek Kasimov09192682020-06-01 18:17:44 -0700725 # TODO remove try-except when fix crbug.com/1087964
726 try:
727 cmd = 'servodtool device -s %s usb-path' % self.servo_serial
728 resp = self.run(cmd, ignore_status=True, timeout=30)
729 except Exception as e:
730 # Here we catch only timeout errors.
731 # Other errors is filtered by ignore_status=True
732 logging.debug('Attempt to get servo usb-path failed due to '
733 'timeout; %s', e)
734 return ''
735
Garry Wangffbd2162020-04-17 16:13:48 -0700736 if resp.exit_status != 0:
737 self._process_servodtool_error(resp)
738 return ''
739 usb_path = resp.stdout.strip()
740 logging.info('Usb path of servo %s is %s', self.servo_serial, usb_path)
741
742 resp = self.run('cat %s/devnum' % usb_path,
743 ignore_status=True)
744 if resp.exit_status != 0:
745 self._process_servodtool_error(resp)
746 return ''
747 return resp.stdout.strip()
748
def reboot_servo_v3_on_need(self):
    """Reboot a servo_v3 when one of the reboot conditions holds.

    Conditions:
    1. There is an update pending on reboot.
    2. Servo_v3 has been up for more than 96 hours.

    Hosts whose board is not 'beaglebone_servo' are left alone. A failing
    reboot is logged and recorded, not raised.
    """
    if self.get_board() != 'beaglebone_servo':
        logging.info('Servo reboot is only applicable for servo V3.')
        return

    pending_state = self.UPDATE_STATE.PENDING_REBOOT
    update_pending_reboot = self._check_update_status() == pending_state
    uptime_hours = float(self.check_uptime())/3600
    logging.info('Uptime of servo_v3: %s hour(s)', uptime_hours)
    long_up_time = uptime_hours > 96

    # Skip reboot if neither condition are met.
    if not update_pending_reboot and not long_up_time:
        return

    # A pending update takes precedence over the uptime based reboot.
    if update_pending_reboot:
        reboot_method = self._post_update_reboot
        message = 'Starting reboot servo_v3 because an update is pending.'
    else:
        # Only reachable with long_up_time set, see the guard above.
        reboot_method = self._servo_host_reboot
        message = 'Starting reboot servo_v3 because uptime > 96 hours.'
    self.record('INFO', None, None, message)
    logging.info(message)

    try:
        reboot_method()
    except Exception as e:
        logging.debug("Fail to reboot servo_v3; %s", e)
        message = ('Servo_v3 reboot failed, please check debug log '
                   'for details.')
    else:
        message = 'Servo_v3 reboot completed successfully.'
    logging.info(message)
    self.record('INFO', None, None, message)
Garry Wangffbd2162020-04-17 16:13:48 -0700785
786 def _reset_servo(self):
787 logging.info('Resetting servo through smart usbhub.')
Otabek Kasimov09192682020-06-01 18:17:44 -0700788 # TODO remove try-except when fix crbug.com/1087964
789 try:
790 resp = self.run('servodtool device -s %s power-cycle' %
791 self.servo_serial, ignore_status=True,
792 timeout=30)
793 if resp.exit_status != 0:
794 self._process_servodtool_error(resp)
795 return False
796 except Exception as e:
797 # Here we catch only timeout errors.
798 # Other errors is filtered by ignore_status=True
799 logging.debug('Attempt to reset servo failed due to timeout;'
800 ' %s', e)
Garry Wangffbd2162020-04-17 16:13:48 -0700801 return False
802
803 logging.debug('Wait %s seconds for servo to come back from reset.',
804 servo_constants.SERVO_RESET_TIMEOUT_SECONDS)
805 time.sleep(servo_constants.SERVO_RESET_TIMEOUT_SECONDS)
Garry Wang000c6c02020-05-11 21:27:23 -0700806 # change the flag so we can update this label in later process.
807 self.smart_usbhub = True
Garry Wangffbd2162020-04-17 16:13:48 -0700808 return True
809
def reset_servo(self):
    """Reset(power-cycle) the servo via smart usbhub.

    Only done on labstations. The usb devnum of the servo is collected
    before and after the reset, and the outcome message that is logged and
    recorded depends on whether both values are known and differ.
    """
    if not self.is_labstation():
        logging.info('Servo reset is not applicable to servo_v3.')
        return

    pre_reset_devnum = self._get_servo_usb_devnum()
    logging.info('Servo usb devnum before reset: %s', pre_reset_devnum)
    if not self._reset_servo():
        message = ('Failed to reset servo with serial: %s. (Please ignore'
                   ' this error if the DUT is not connected to a smart'
                   ' usbhub).' % self.servo_serial)
        logging.warning(message)
        self.record('INFO', None, None, message)
        return

    post_reset_devnum = self._get_servo_usb_devnum()
    logging.info('Servo usb devnum after reset: %s', post_reset_devnum)
    both_known = pre_reset_devnum and post_reset_devnum
    if not both_known:
        message = ('Servo reset completed but unable to verify'
                   ' devnum change!')
    elif pre_reset_devnum == post_reset_devnum:
        message = 'Servo reset completed but devnum is still not changed!'
    else:
        message = ('Reset servo with serial %s completed successfully!'
                   % self.servo_serial)
    logging.info(message)
    self.record('INFO', None, None, message)
840
Ruben Rodriguez Buchillon93084d02020-01-21 15:17:36 -0800841 def _extract_compressed_logs(self, logdir, relevant_files):
842 """Decompress servod logs in |logdir|.
843
844 @param logdir: directory containing compressed servod logs.
845 @param relevant_files: list of files in |logdir| to consider.
846
847 @returns: tuple, (tarfiles, files) where
848 tarfiles: list of the compressed filenames that have been
849 extracted and deleted
850 files: list of the uncompressed files that were generated
851 """
852 # For all tar-files, first extract them to the directory, and
853 # then let the common flow handle them.
854 tarfiles = [cf for cf in relevant_files if
855 cf.endswith(self.COMPRESSION_SUFFIX)]
856 files = []
857 for f in tarfiles:
858 norm_name = os.path.basename(f)[:-len(self.COMPRESSION_SUFFIX)]
859 with tarfile.open(f) as tf:
860 # Each tarfile has only one member, as
861 # that's the compressed log.
862 member = tf.members[0]
863 # Manipulate so that it only extracts the basename, and not
864 # the directories etc.
865 member.name = norm_name
866 files.append(os.path.join(logdir, member.name))
867 tf.extract(member, logdir)
868 # File has been extracted: remove the compressed file.
869 os.remove(f)
870 return tarfiles, files
871
872 def _extract_mcu_logs(self, log_subdir):
873 """Extract MCU (EC, Cr50, etc) console output from servod debug logs.
874
875 Using the MCU_EXTRACTOR regex (above) extract and split out MCU console
876 lines from the logs to generate invidiual console logs e.g. after
877 this method, you can find an ec.txt and servo_v4.txt in |log_dir| if
878 those MCUs had any console input/output.
879
880 @param log_subdir: directory with log.DEBUG.txt main servod debug logs.
881 """
882 # Extract the MCU for each one. The MCU logs are only in the .DEBUG
883 # files
884 mcu_lines_file = os.path.join(log_subdir, 'log.DEBUG.txt')
885 if not os.path.exists(mcu_lines_file):
886 logging.info('No DEBUG logs found to extract MCU logs from.')
887 return
888 mcu_files = {}
889 mcu_file_template = '%s.txt'
890 with open(mcu_lines_file, 'r') as f:
891 for line in f:
892 match = self.MCU_EXTRACTOR.match(line)
893 if match:
894 mcu = match.group(self.MCU_GROUP).lower()
895 line = match.group(self.LINE_GROUP)
896 if mcu not in mcu_files:
897 mcu_file = os.path.join(log_subdir,
898 mcu_file_template % mcu)
899 mcu_files[mcu] = open(mcu_file, 'a')
900 fd = mcu_files[mcu]
901 fd.write(line + '\n')
902 for f in mcu_files:
903 mcu_files[f].close()
904
def remove_latest_log_symlinks(self):
    """Remove the convenience 'latest' symlinks of the servod logs.

    Runs `rm` on everything matching `latest*` in the remote log dir; a
    non-zero exit status is ignored.
    """
    cmd = 'rm %s/latest*' % self.remote_log_dir
    self.run(cmd, stderr_tee=None, ignore_status=True)
910
def probe_servod_restart(self, instance_ts, outdir):
    """Grab servod logs from previous instances if part of this session.

    When |instance_ts| differs from the timestamp cached by start_servod(),
    servod is taken to have restarted in between. The logs of every
    instance from the cached timestamp up to (excluding) |instance_ts| are
    then collected and stored with the |OLD_LOG_SUFFIX|.

    Afterwards, if a servo object is attached, a panicinfo command is sent
    to the servo_micro and servo_v4 uart controls that exist, to try and
    get reboot information into the logs.

    @param instance_ts: the log timestamp that the current instance uses
    @param outdir: directory to create a subdirectory into to place the
                   servod logs into.
    """
    first_ts = self._initial_instance_ts
    if first_ts is None:
        logging.info('No log timestamp grabbed successfully on servod '
                     'startup. Cannot check device restarts. Ignoring.')
        return
    if instance_ts == first_ts:
        logging.debug('Servod appears to have run without restarting')
        return
    # Servod seems to have restarted (at least once). Find every timestamp
    # from the first one up to the current one and grab the logs for each.
    tss = self._find_instance_timestamps_between(first_ts, instance_ts)
    logging.info('Servod has restarted %d times between the start and the '
                 'end of this servo_host.', len(tss))
    logging.info('This might be an issue. Will extract all logs from each '
                 'instance.')
    logging.info('Logs that are not the currently running (about to turn '
                 'down) instance are maked with a .%s in their folder.',
                 self.OLD_LOG_SUFFIX)
    for old_ts in tss:
        self.get_instance_logs(old_ts, outdir, old=True)
    # Lastly, servod has restarted due to a potential issue. Try to get
    # panic information from servo micro and servo v4 for the current logs.
    # This can only happen if the |_servo| attribute is initialized.
    if not self._servo:
        return
    for mcu in ['servo_micro', 'servo_v4']:
        ctrl = '%s_uart_cmd' % mcu
        if not self._servo.has_control(ctrl):
            continue
        logging.info('Trying to retrieve %r panicinfo into logs', mcu)
        try:
            self._servo.set_nocheck(ctrl, 'panicinfo')
        except error.TestFail as e:
            logging.error('Failed to generate panicinfo for %r '
                          'logs. %s', mcu, str(e))
960
961 def _find_instance_timestamps_between(self, start_ts, end_ts):
962 """Find all log timestamps between [start_ts, end_ts).
963
964 @param start_ts: str, earliest log timestamp of interest
965 @param end_ts: str, latest log timestamp of interest
966
967 @returns: list, all timestamps between start_ts and end_ts, end_ts
968 exclusive, on the servo_host. An empty list on errors
969 """
970 # Simply get all timestamp, and then sort and remove
971 cmd = 'ls %s' % self.remote_log_dir
972 res = self.run(cmd, stderr_tee=None, ignore_status=True)
973 if res.exit_status != 0:
974 # Here we failed to find anything.
975 logging.info('Failed to find remote servod logs. Ignoring.')
976 return []
977 logfiles = res.stdout.strip().split()
978 timestamps = set()
979 for logfile in logfiles:
980 ts_match = self.TS_EXTRACTOR.match(logfile)
981 if not ts_match:
982 # Simply ignore files that fail the check. It might be the
983 # 'latest' symlinks or random files.
984 continue
985 timestamps.add(ts_match.group(self.TS_GROUP))
986 # At this point we have all unique timestamps.
987 timestamps = sorted(timestamps)
988 for ts in [start_ts, end_ts]:
989 if ts not in timestamps:
990 logging.error('Timestamp %r not in servod logs. Cannot query '
991 'for timestamps in between %r and %r', ts,
992 start_ts, end_ts)
993 return []
994 return timestamps[timestamps.index(start_ts):timestamps.index(end_ts)]
995
def get_instance_logs_ts(self):
    """Retrieve the currently running servod instance's log timestamp

    The real file behind the latest.DEBUG symlink (or, failing that, the
    plain latest symlink) in the remote log dir is resolved and the
    timestamp is extracted from its basename with TS_EXTRACTOR.

    @returns: str, timestamp for current instance, or None on failure
    """
    # This cmd gives the real filename of the latest aka current log file,
    # or exits with NO_SYMLINKS_CODE when neither symlink is there.
    cmd = ('if [ -f %(dir)s/latest.DEBUG ];'
           'then realpath %(dir)s/latest.DEBUG;'
           'elif [ -f %(dir)s/latest ];'
           'then realpath %(dir)s/latest;'
           'else exit %(code)d;'
           'fi' % {'dir': self.remote_log_dir,
                   'code': self.NO_SYMLINKS_CODE})
    res = self.run(cmd, stderr_tee=None, ignore_status=True)
    status = res.exit_status
    if status == 0:
        fname = os.path.basename(res.stdout.strip())
        ts_match = self.TS_EXTRACTOR.match(fname)
        if ts_match:
            return ts_match.group(self.TS_GROUP)
        logging.warning('Failed to extract timestamp from servod log file '
                        '%r. Skipping. The servo host is using outdated '
                        'servod logging and needs to be updated.', fname)
        return None

    if status == self.NO_SYMLINKS_CODE:
        logging.warning('servod log latest symlinks not found. '
                        'This is likely due to an error starting up '
                        'servod. Ignoring..')
    else:
        logging.warning('Failed to find servod logs on servo host.')
        logging.warning(res.stderr.strip())
    return None
1029
def get_instance_logs(self, instance_ts, outdir, old=False):
    """Collect all logs with |instance_ts| and dump into a dir in |outdir|

    This method first collects all logs on the servo_host side pertaining
    to this servod instance (port, instantiation). It glues them together
    into combined log.[level].txt files and extracts all available MCU
    console I/O from the logs into individual files e.g. servo_v4.txt

    All the output can be found in a directory inside |outdir| that
    this generates based on |LOG_DIR|, the servod port, and the instance
    timestamp on the servo_host side. The directory is removed again when
    no log could be retrieved.

    @param instance_ts: log timestamp to grab logfiles for
    @param outdir: directory to create a subdirectory into to place the
                   servod logs into.
    @param old: bool, whether to append |OLD_LOG_SUFFIX| to output dir
    """
    # Create the local results log dir.
    log_dir = os.path.join(outdir, '%s_%s.%s' % (self.LOG_DIR,
                                                 str(self.servo_port),
                                                 instance_ts))
    if old:
        log_dir = '%s.%s' % (log_dir, self.OLD_LOG_SUFFIX)
    logging.info('Saving servod logs to %r.', log_dir)
    os.mkdir(log_dir)
    # Now, get all files with that timestamp.
    cmd = 'find %s -maxdepth 1 -name "log.%s*"' % (self.remote_log_dir,
                                                   instance_ts)
    res = self.run(cmd, stderr_tee=None, ignore_status=True)
    files = res.stdout.strip().split()
    try:
        self.get_file(files, log_dir, try_rsync=False)
        if not os.listdir(log_dir):
            logging.info('No servod logs retrieved. Ignoring, and removing '
                         '%r again.', log_dir)
            os.rmdir(log_dir)
            return
    except error.AutoservRunError as e:
        result = e.result_obj
        if result.exit_status != 0:
            stderr = result.stderr.strip()
            logging.warning("Couldn't retrieve servod logs. Ignoring: %s",
                            stderr or '\n%s' % result)
        # Remove the log_dir as nothing was added to it.
        os.rmdir(log_dir)
        return
    local_files = [os.path.join(log_dir, f) for f in os.listdir(log_dir)]
    # TODO(crrev.com/c/1793030): remove no-level case once CL is pushed
    for level_name in ('DEBUG', 'INFO', 'WARNING', ''):
        # Create the joint files for each loglevel. i.e log.DEBUG
        joint_file = self.JOINT_LOG_PREFIX
        if level_name:
            joint_file = '%s.%s' % (self.JOINT_LOG_PREFIX, level_name)
        # This helps with some online tools to avoid complaints about an
        # unknown filetype.
        joint_file = joint_file + '.txt'
        joint_path = os.path.join(log_dir, joint_file)
        files = [f for f in local_files if level_name in f]
        if not files:
            # TODO(crrev.com/c/1793030): remove no-level case once CL
            # is pushed
            continue
        # Extract compressed logs if any.
        compressed, extracted = self._extract_compressed_logs(log_dir,
                                                              files)
        files = list(set(files) - set(compressed))
        files.extend(extracted)

        # Need to sort. As they all share the same timestamp, and
        # loglevel, the index itself is sufficient. The highest index
        # is the oldest file, therefore we need a descending sort.
        def sortkey(f, level=level_name):
            """Custom sortkey to sort based on rotation number int."""
            # |level| is bound at definition time, so the key does not
            # depend on the value of the loop variable when it is called.
            if f.endswith(level):
                return 0
            return int(f.split('.')[-1])

        files.sort(reverse=True, key=sortkey)
        # Just rename the first file rather than building from scratch.
        os.rename(files[0], joint_path)
        with open(joint_path, 'a') as joint_f:
            for logfile in files[1:]:
                # Transfer the file to the joint file line by line.
                with open(logfile, 'r') as log_f:
                    for line in log_f:
                        joint_f.write(line)
                # File has been written over. Delete safely.
                os.remove(logfile)
        # Need to remove all files form |local_files| so we don't
        # analyze them again.
        local_files = list(set(local_files) - set(files) - set(compressed))
    # Lastly, extract MCU logs from the joint logs.
    self._extract_mcu_logs(log_dir)
1121
Garry Wang79e9af62019-06-12 15:19:19 -07001122 def _lock(self):
1123 """lock servohost by touching a file.
1124 """
1125 logging.debug('Locking servohost %s by touching %s file',
1126 self.hostname, self._lock_file)
1127 self.run('touch %s' % self._lock_file, ignore_status=True)
Garry Wang7c00b0f2019-06-25 17:28:17 -07001128 self._is_locked = True
Garry Wang79e9af62019-06-12 15:19:19 -07001129
Garry Wang79e9af62019-06-12 15:19:19 -07001130 def _unlock(self):
1131 """Unlock servohost by removing the lock file.
1132 """
1133 logging.debug('Unlocking servohost by removing %s file',
1134 self._lock_file)
1135 self.run('rm %s' % self._lock_file, ignore_status=True)
Garry Wang7c00b0f2019-06-25 17:28:17 -07001136 self._is_locked = False
Garry Wang79e9af62019-06-12 15:19:19 -07001137
def close(self):
    """Close the associated servo and the host object.

    In order: grab the logs of servod instances that restarted during this
    session, close the servo object, grab the logs of the current servod
    instance, unlock the servohost if it was locked, stop servod, and close
    the host itself. Calling it again once closed is a no-op.
    """
    # NOTE: throughout this method there are multiple attempts to catch
    # all errors. This is WAI as log grabbing should not fail tests.
    # However, the goal is to catch and handle/process all errors, thus
    # we print the traceback and ask for a bug.
    if self._closed:
        logging.debug('ServoHost is already closed.')
        return

    # Only attempt ssh related actions if servohost is sshable. We call
    # check_cached_up_status() first because it's lightweighted and return
    # much faster in the case servohost is down, however, we still want
    # to call is_up() later since check_cached_up_status() is ping based
    # check and not guarantee the servohost is sshable.
    servo_host_ready = self.check_cached_up_status() and self.is_up()

    instance_ts = None
    if servo_host_ready:
        instance_ts = self.get_instance_logs_ts()
    else:
        logging.info('Servohost is down, will skip servod log collecting.')
    # TODO(crbug.com/1011516): once enabled, remove the check against
    # localhost and instead check against log-rotiation enablement.
    logs_available = (instance_ts is not None and
                      self.job and
                      not self.is_localhost())

    if logs_available:
        # Probe whether there was a servod restart, and grab those old
        # logs as well.
        try:
            self.probe_servod_restart(instance_ts, self.job.resultdir)
        except (error.AutoservRunError, error.TestFail) as e:
            logging.info('Failed to grab servo logs due to: %s. '
                         'This error is forgiven.', str(e))
        except Exception as e:
            logging.error('Unexpected error probing for old logs. %s. '
                          'Forgiven. Please file a bug and fix or catch '
                          'in log probing function', str(e),
                          exc_info=True)

    if self._servo:
        # In some cases when we run as lab-tools, the job object is None.
        outdir = self.job.resultdir if self.job else None
        self._servo.close(outdir)

    if logs_available:
        # Grab current (not old like above) logs after the servo instance
        # was closed out.
        try:
            self.get_instance_logs(instance_ts, self.job.resultdir)
        except error.AutoservRunError as e:
            logging.info('Failed to grab servo logs due to: %s. '
                         'This error is forgiven.', str(e))
        except Exception as e:
            logging.error('Unexpected error grabbing servod logs. %s. '
                          'Forgiven. Please file a bug and fix or catch '
                          'in log grabbing function', str(e), exc_info=True)

    if self._is_locked and servo_host_ready:
        # Remove the lock if the servohost has been locked.
        try:
            self._unlock()
        except error.AutoservSSHTimeout:
            logging.error('Unlock servohost failed due to ssh timeout.'
                          ' It may caused by servohost went down during'
                          ' the task.')

    # We want always stop servod after task to minimum the impact of bad
    # servod process interfere other servods.(see crbug.com/1028665)
    if servo_host_ready:
        try:
            self.stop_servod()
        except error.AutoservRunError as e:
            logging.info(
                    "Failed to stop servod due to:\n%s\n"
                    "This error is forgiven.", str(e))

    super(ServoHost, self).close()
    # Mark closed.
    self._closed = True
Congbin Guoa1f9cba2018-07-03 11:36:59 -07001217
def get_servo_state(self):
    """Return the servo state currently stored on this host.

    @returns: the value of |_servo_state|.
    """
    current_state = self._servo_state
    return current_state
Otabek Kasimovcc9738e2020-02-14 16:17:15 -08001220
Otabek Kasimovc6f30412020-06-30 20:08:12 -07001221 def _get_host_metrics_data(self):
1222 return {'port': self.servo_port,
Otabek Kasimov0ea47362020-07-11 20:55:09 -07001223 'host': self.get_dut_hostname() or self.hostname,
Otabek Kasimovc6f30412020-06-30 20:08:12 -07001224 'board': self.servo_board or ''}
1225
1226 def _is_servo_device_connected(self, servo_type, serial):
1227 """Check if device is connected to the labstation.
1228
1229 Works for all servo devices connected to the labstation.
1230 For servo_v3 please use 'self._is_servo_board_present_on_servo_v3'
1231
1232 @param servo_type: The type of servo device. Expecting value can be
1233 servo_v4 or servo_micro.
1234 @param serial: The serial number of the device to detect it.
1235 """
1236 vid_pid = self.SERVO_VID_PID.get(servo_type)
1237 if not vid_pid or not serial:
1238 # device cannot detected without VID/PID or serial number
1239 return False
1240 logging.debug('Started to detect %s', servo_type)
1241 try:
1242 cmd = 'lsusb -v -d %s |grep iSerial |grep %s' % (vid_pid, serial)
1243 result = self.run(cmd, ignore_status=True, timeout=30)
1244 if result.exit_status == 0 and result.stdout.strip():
1245 logging.debug('The %s is plugged in to the host.', servo_type)
1246 return True
1247 logging.debug('%s device is not detected; %s', servo_type, result)
1248 return False
1249 except Exception as e:
1250 # can be triggered by timeout issue due running the script
1251 metrics.Counter(
1252 'chromeos/autotest/repair/servo_detection/timeout'
1253 ).increment(fields=self._get_host_metrics_data())
1254 logging.error('%s device is not detected; %s', servo_type, str(e))
1255 return None
1256
def _is_servo_board_present_on_servo_v3(self):
    """Check if servo board is detected on servo_v3.

    Greps the plain `lsusb` output on the servohost for any of the
    VID/PID values registered under 'servo_v3' in SERVO_VID_PID.

    @returns: True if lsusb lists one of the VID/PIDs, False if it does
              not (or no VID/PID is registered), None if running the
              check raised an exception.
    """
    vid_pids = self.SERVO_VID_PID['servo_v3']
    if not vid_pids:
        # device cannot be detected without VID/PID
        return False
    logging.debug('Started to detect servo board on servo_v3')
    not_detected = 'The servo board is not detected on servo_v3'
    try:
        # r'\|' is grep's alternation operator. It has to be a raw string:
        # '\|' in a normal literal is an invalid escape sequence.
        cmd = 'lsusb | grep "%s"' % r'\|'.join(vid_pids)
        result = self.run(cmd, ignore_status=True, timeout=30)
        if result.exit_status == 0 and result.stdout.strip():
            logging.debug('The servo board is detected on servo_v3')
            return True
        logging.debug('%s; %s', not_detected, result)
        return False
    except Exception as e:
        # Can be triggered by a timeout while running the command; the
        # outcome is unknown, so report None rather than False.
        metrics.Counter(
                'chromeos/autotest/repair/servo_detection/timeout'
        ).increment(fields=self._get_host_metrics_data())
        logging.error('%s; %s', not_detected, str(e))
    return None
1280
def _is_main_device_not_detected_on_servo_v4(self):
    """Check if servod cannot find main device on servo.

    The check greps the servod INFO log named after
    self._initial_instance_ts for the "no servo micro or CCD" error.
    Only a log whose timestamp is at most one hour old is trusted.

    @returns: True if the error line is present in a recent log; False
              if there is no log timestamp, it cannot be parsed, the
              log is older than one hour, or the line is absent.
    """
    log_ts = self._initial_instance_ts
    if not log_ts:
        # latest log not found
        return False
    logging.debug('latest log for servod created at %s', log_ts)
    try:
        created_at = calendar.timegm(
                time.strptime(log_ts, "%Y-%m-%d--%H-%M-%S.%f"))
    except ValueError:
        logging.debug('Cannot read time from log file name: %s', log_ts)
        return False
    log_age = calendar.timegm(time.gmtime()) - created_at
    if log_age > 3600:
        # the log file is old, so it cannot be used
        logging.debug('log file was created more than hour ago, too old')
        return False
    logging.debug('latest log was created not longer then 1 hour ago')

    # check if servod can detect main device by servo_v4
    message = 'ERROR - No servo micro or CCD detected for board'
    grep_cmd = ('cat /var/log/servod_%s/log.%s.INFO |grep "%s"'
                % (self.servo_port, log_ts, message))
    grep_result = self.run(grep_cmd, ignore_status=True)
    if not grep_result.stdout.strip():
        logging.debug('The main device is detected')
        return False
    logging.info('Servod cannot detect main device on the servo; '
                 'Can be caused by bad hardware of servo or '
                 'issue on the DUT side.')
    return True
1318
def _require_cr50_servod_config(self):
    """Check whether we need start servod with CONFIG=cr50.xml.

    @returns: True if any pool of the DUT starts with
              servo_constants.CR50_CONFIG_POOL_PREFIX; False otherwise,
              including when no DUT host info is available.
    """
    info = self.get_dut_host_info()
    if not info:
        return False
    return any(pool.startswith(servo_constants.CR50_CONFIG_POOL_PREFIX)
               for pool in info.pools)
1328
def get_verifier_state(self, tag):
    """Return the state of servo verifier.

    @param tag: tag of the verifier to look up; handed unchanged to the
                repair strategy's verifier_is_good().

    @returns: whatever the repair strategy reports for that tag (callers
              in this file compare it with hosts.VERIFY_FAILED and
              hosts.VERIFY_SUCCESS).
    """
    strategy = self._repair_strategy
    return strategy.verifier_is_good(tag)
1335
def determine_servo_state(self):
    """Determine servo state based on the failed verifier.

    Reads the recorded outcome of the servo verifiers and maps the first
    matching failure (or combination of failures) to one of the
    servo_constants.SERVO_STATE_* values. The checks run roughly in the
    order the servo stack is brought up: ssh, servod start/connection,
    topology, DUT connection, then the individual controls.

    @returns: servo state value. SERVO_STATE_BROKEN is returned when no
              more specific state matches.
    """
    ssh = self.get_verifier_state('servo_ssh')
    start_servod = self.get_verifier_state('servod_job')
    create_servo = self.get_verifier_state('servod_connection')
    init_servo = self.get_verifier_state('servod_control')
    servo_topology = self.get_verifier_state('servo_topology')
    dut_connected = self.get_verifier_state('dut_connected')
    pwr_button = self.get_verifier_state('pwr_button')
    lid_open = self.get_verifier_state('lid_open')
    ec_board = self.get_verifier_state('ec_board')
    ccd_testlab = self.get_verifier_state('ccd_testlab')

    if not ssh:
        return servo_constants.SERVO_STATE_NO_SSH

    if (start_servod == hosts.VERIFY_FAILED
            or create_servo == hosts.VERIFY_FAILED):
        # Sometimes servod can start without a servo being present, so
        # look for the hardware before blaming servod itself.
        # The detection helpers return None when the check could not be
        # completed; only an explicit False means "not connected".
        if self.is_labstation():
            if not self.servo_serial:
                return servo_constants.SERVO_STATE_WRONG_CONFIG
            if self._is_servo_device_connected(
                    'servo_v4', self.servo_serial) is False:
                return servo_constants.SERVO_STATE_NOT_CONNECTED
        elif self._is_servo_board_present_on_servo_v3() is False:
            return servo_constants.SERVO_STATE_NOT_CONNECTED

    if servo_topology == hosts.VERIFY_FAILED:
        return servo_constants.SERVO_STATE_TOPOLOGY_ISSUE

    if dut_connected == hosts.VERIFY_FAILED:
        if pwr_button == hosts.VERIFY_SUCCESS:
            # unexpected case: the power button works although the DUT
            # is reported as not connected; record it for follow-up.
            metrics.Counter(
                    'chromeos/autotest/repair/servo_unexpected/pwr_button'
            ).increment(fields=self._get_host_metrics_data())
        return servo_constants.SERVO_STATE_DUT_NOT_CONNECTED

    if start_servod == hosts.VERIFY_FAILED:
        return servo_constants.SERVO_STATE_SERVOD_ISSUE

    if create_servo == hosts.VERIFY_FAILED:
        if (self.is_labstation()
                and self._is_main_device_not_detected_on_servo_v4()):
            servo_type = None
            if self.get_dut_host_info():
                servo_type = self.get_dut_host_info().get_label_value(
                        servo_constants.SERVO_TYPE_LABEL_PREFIX)
            if servo_type and 'servo_micro' in servo_type:
                serial = self.get_servo_micro_serial_number()
                logging.debug('servo_micro serial: %s', serial)
                # The servo_micro is visible on USB but servod cannot
                # use it as the main device.
                if self._is_servo_device_connected('servo_micro',
                                                   serial):
                    return servo_constants.SERVO_STATE_BAD_RIBBON_CABLE
            # Device can be not detected because of DUT
            # TODO (otabek) update after b/159755652 and b/159754985
            metrics.Counter(
                    'chromeos/autotest/repair/servo_state/needs_replacement'
            ).increment(fields=self._get_host_metrics_data())
        elif not self.is_labstation():
            # Here need logic to check if flex cable is connected
            pass

    # one of the reasons why servo cannot be initialized
    if ccd_testlab == hosts.VERIFY_FAILED:
        return servo_constants.SERVO_STATE_CCD_TESTLAB_ISSUE

    if (create_servo == hosts.VERIFY_FAILED
            or init_servo == hosts.VERIFY_FAILED):
        return servo_constants.SERVO_STATE_SERVOD_ISSUE

    if ec_board == hosts.VERIFY_FAILED:
        return servo_constants.SERVO_STATE_EC_BROKEN
    if pwr_button == hosts.VERIFY_FAILED:
        return servo_constants.SERVO_STATE_BAD_RIBBON_CABLE
    if lid_open == hosts.VERIFY_FAILED:
        return servo_constants.SERVO_STATE_LID_OPEN_FAILED

    metrics.Counter(
            'chromeos/autotest/repair/unknown_servo_state'
    ).increment(fields=self._get_host_metrics_data())
    logging.info('We do not have special state for this failure yet :)')
    return servo_constants.SERVO_STATE_BROKEN
1427
def is_servo_topology_supported(self):
    """Check if servo_topology is supported.

    @returns: True only when this host is a labstation and a servo
              serial is set; False (with an info log) otherwise.
    """
    if self.is_labstation():
        if self.servo_serial:
            return True
        logging.info('Servo-topology required a servo serial.')
        return False
    logging.info('Servo-topology supported only for labstation.')
    return False
1437
def get_topology(self):
    """Get servo topology.

    @returns: the object stored in self._topology.
    """
    topology = self._topology
    return topology
1441
def is_dual_setup(self):
    """Check if servo will run in dual setup.

    Dual setup is used only for servo_v4, when ccd_cr50 and servo_micro
    are used at the same time.

    @returns: True if self.servo_setup equals
              servo_constants.SERVO_SETUP_VALUE_DUAL_V4.
    """
    current_setup = self.servo_setup
    return current_setup == servo_constants.SERVO_SETUP_VALUE_DUAL_V4
1449
Otabek Kasimovcc9738e2020-02-14 16:17:15 -08001450
def make_servo_hostname(dut_hostname):
    """Given a DUT's hostname, return the hostname of its servo.

    The servo name is the DUT name with '-servo' appended to its first
    dot-separated label; any domain part is kept as is.

    @param dut_hostname: hostname of a DUT.

    @return hostname of the DUT's servo.

    """
    short_name, dot, domain = dut_hostname.partition('.')
    return short_name + '-servo' + dot + domain
1462
1463
def servo_host_is_up(servo_hostname):
    """Given a servo host name, return if it's up or not.

    @param servo_hostname: hostname of the servo host.

    @return True if at least one of three pings was answered, False
            otherwise.
    """
    # Technically, this duplicates the SSH ping done early in the servo
    # proxy initialization code.  However, this ping ends in a couple
    # seconds when it fails, rather than the 60 seconds it takes to decide
    # that an SSH ping has timed out.  Specifically, that timeout happens
    # when our servo DNS name resolves, but there is no host at that IP.
    logging.info('Pinging servo host at %s', servo_hostname)
    config = ping_runner.PingConfig(servo_hostname,
                                    count=3,
                                    ignore_result=True,
                                    ignore_status=True)
    runner = ping_runner.PingRunner()
    ping_result = runner.ping(config)
    return ping_result.received > 0
1481
1482
def _map_afe_board_to_servo_board(afe_board):
    """Map a board we get from the AFE to a servo appropriate value.

    Many boards are identical to other boards for servo's purposes.
    A board listed in the alias table is replaced outright; otherwise
    the first known suffix the name ends with is stripped.

    @param afe_board string board name received from AFE.
    @return board we expect servo to have.

    """
    aliases = {'gizmo': 'panther'}
    known_suffixes = ('-freon', '_freon', '_moblab', '-cheets')
    if afe_board in aliases:
        servo_board = aliases[afe_board]
    else:
        # An empty match means "no known suffix": nothing is cut off.
        matched = next(
                (s for s in known_suffixes if afe_board.endswith(s)), '')
        servo_board = afe_board[:len(afe_board) - len(matched)]
    if servo_board != afe_board:
        logging.info('Mapping AFE board=%s to %s', afe_board, servo_board)
    return servo_board
1506
1507
def get_servo_args_for_host(dut_host):
    """Return servo data associated with a given DUT.

    The servo attributes are copied out of the DUT's host info; the port
    is converted to int, and the servo board/model are derived from the
    DUT's board/model when those are set.

    @param dut_host   Instance of `Host` on which to find the servo
                      attributes.
    @return `servo_args` dict with host and an optional port, or None
            when no servo host attribute is available (including the
            case of an unparsable port).
    """
    info = dut_host.host_info_store.get()
    servo_args = {}
    for key, value in six.iteritems(info.attributes):
        if key in servo_constants.SERVO_ATTR_KEYS:
            servo_args[key] = value

    port_key = servo_constants.SERVO_PORT_ATTR
    if port_key in servo_args:
        raw_port = servo_args[port_key]
        try:
            servo_args[port_key] = int(raw_port)
        except ValueError:
            logging.error('servo port is not an int: %s', raw_port)
            # Drop the host so that None is returned below: we don't
            # want to use a servo with an invalid port.
            servo_args.pop(servo_constants.SERVO_HOST_ATTR, None)

    if info.board:
        servo_args[servo_constants.SERVO_BOARD_ATTR] = (
                _map_afe_board_to_servo_board(info.board))
    if info.model:
        servo_args[servo_constants.SERVO_MODEL_ATTR] = info.model

    if servo_constants.SERVO_HOST_ATTR in servo_args:
        return servo_args
    return None
Richard Barnetteea3e4602016-06-10 12:36:41 -07001535
1536
def _tweak_args_for_ssp_moblab(servo_args):
    """Replace a loopback servo host with the configured SSP host IP.

    When the servo host in `servo_args` is 'localhost' or '127.0.0.1' it
    is overwritten in place with the 'host_container_ip' value of the
    'SSP' config section (None if that value is not configured).

    @param servo_args  dict of servo arguments; must contain the servo
                       host attribute. Modified in place.
    """
    host_key = servo_constants.SERVO_HOST_ATTR
    if servo_args[host_key] not in ('localhost', '127.0.0.1'):
        return
    servo_args[host_key] = _CONFIG.get_config_value(
            'SSP', 'host_container_ip', type=str, default=None)
1542
1543
def create_servo_host(dut, servo_args, try_lab_servo=False,
                      try_servo_repair=False, dut_host_info=None):
    """Create a ServoHost object for a given DUT, if appropriate.

    This function attempts to create and verify or repair a `ServoHost`
    object for a servo connected to the given `dut`, subject to various
    constraints imposed by the parameters:
      * When the `servo_args` parameter is not `None`, a servo
        host must be created, and must be checked with `repair()`.
      * Otherwise, if `try_lab_servo` is true and servo attributes are
        found on the `dut`:
          * If `try_servo_repair` is true, then create a servo host and
            check it with `repair()`.
          * Otherwise, if the servo responds to `ping` then create a
            servo host and check it with `verify()`.

    In cases where `servo_args` was not `None`, repair failure
    exceptions are passed back to the caller; otherwise, exceptions
    are logged and then discarded.  Note that this only happens in cases
    where we're called from a test (not special task) control file that
    has an explicit dependency on servo.  In that case, we require that
    repair not write to `status.log`, so as to avoid polluting test
    results.

    TODO(jrbarnette):  The special handling for servo in test control
    files is a thorn in my flesh; I dearly hope to see it cut out before
    my retirement.

    Servo parameters found in the host info of `dut` take precedence
    over the `servo_args` dict passed in from the caller; the caller's
    dict is used only when the DUT provides none.

    @param dut                An instance of `Host` from which to take
                              servo parameters (if available).
    @param servo_args         A dictionary with servo parameters to use if
                              they can't be found from `dut`.  If this
                              argument is supplied, unrepaired exceptions
                              from `repair()` will be passed back to the
                              caller.
    @param try_lab_servo      If not true, servo host creation will be
                              skipped unless otherwise required by the
                              caller.
    @param try_servo_repair   If true, check a servo host with
                              `repair()` instead of `verify()`.
    @param dut_host_info:     A HostInfo object of the DUT that connected
                              to this servo.

    @returns: A tuple `(servo_host, servo_state)`.  `servo_host` is a
              ServoHost object, or None when no host was created; in
              that case `servo_state` is the servo_constants state that
              explains why (missing config, wrong config, no ssh), or
              None when no servo was required at all.  When a host is
              created, `servo_state` is its `get_servo_state()`.

    """
    servo_dependency = servo_args is not None
    servo_wanted = try_lab_servo or servo_dependency
    if dut is not None and servo_wanted:
        host_servo_args = get_servo_args_for_host(dut)
        if host_servo_args is not None:
            if utils.in_moblab_ssp():
                _tweak_args_for_ssp_moblab(host_servo_args)
            logging.debug(
                    'Overriding provided servo_args (%s) with arguments'
                    ' determined from the host (%s)',
                    servo_args,
                    host_servo_args,
            )
            servo_args = host_servo_args

    if servo_args is None:
        logging.debug('No servo_args provided, and failed to find overrides.')
        if servo_wanted:
            return None, servo_constants.SERVO_STATE_MISSING_CONFIG
        # For regular test case which not required the servo
        return None, None

    servo_hostname = servo_args.get(servo_constants.SERVO_HOST_ATTR)
    servo_port = servo_args.get(servo_constants.SERVO_PORT_ATTR)
    if not _is_servo_host_information_exist(servo_hostname, servo_port):
        logging.debug(
                'Servo connection info missed hostname: %s , port: %s',
                servo_hostname, servo_port)
        return None, servo_constants.SERVO_STATE_MISSING_CONFIG
    if not is_servo_host_information_valid(servo_hostname, servo_port):
        logging.debug(
                'Servo connection info is incorrect hostname: %s , port: %s',
                servo_hostname, servo_port)
        return None, servo_constants.SERVO_STATE_WRONG_CONFIG
    # The ping is only a shortcut for the plain "try the lab servo" case;
    # a required servo or a repair run always goes on to create the host.
    if not (servo_dependency or try_servo_repair
            or servo_host_is_up(servo_hostname)):
        logging.debug('ServoHost is not up.')
        return None, servo_constants.SERVO_STATE_NO_SSH

    newhost = ServoHost(**servo_args)

    # Reset or reboot servo device only during AdminRepair tasks.
    if try_servo_repair and newhost._is_locked:
        # Reset servo if the servo is locked, as we check if the servohost
        # is up, if the servohost is labstation and if the servohost is in
        # lab inside the locking logic.
        newhost.reset_servo()
    elif try_servo_repair:
        try:
            newhost.reboot_servo_v3_on_need()
        except Exception as e:
            logging.info('[Non-critical] Unexpected error while trying to'
                         ' reboot servo_v3, skipping the reboot; %s', e)

    if dut:
        newhost.set_dut_hostname(dut.hostname)
    if dut_host_info:
        newhost.set_dut_host_info(dut_host_info)

    if try_lab_servo or try_servo_repair:
        # Best effort: a failed firmware update must not block the rest.
        try:
            logging.info("Check and update servo firmware.")
            servo_updater.update_servo_firmware(
                    newhost,
                    force_update=False)
        except Exception as e:
            logging.error("Servo device update error: %s", e)

    try:
        newhost.restart_servod(quick_startup=True)
    except error.AutoservSSHTimeout:
        logging.warning("Restart servod failed due ssh connection "
                        "to servohost timed out. This error is forgiven"
                        " here, we will retry in servo repair process.")
    except error.AutoservRunError as e:
        logging.warning("Restart servod failed due to:\n%s\n"
                        "This error is forgiven here, we will retry"
                        " in servo repair process.", str(e))

    # Note that the logic of repair() includes everything done
    # by verify().  It's sufficient to call one or the other;
    # we don't need both.
    if servo_dependency:
        # Deliberately not guarded: failures go back to the caller.
        newhost.repair(silent=True)
        return newhost, newhost.get_servo_state()

    if not try_servo_repair:
        try:
            newhost.verify()
        except Exception:
            logging.exception('servo verify failed for %s', newhost.hostname)
    else:
        try:
            newhost.repair()
        except Exception:
            logging.exception('servo repair failed for %s', newhost.hostname)
    return newhost, newhost.get_servo_state()
Otabek Kasimov7267a7a2020-03-04 11:18:45 -08001699
1700
def _is_servo_host_information_exist(hostname, port):
    """Check that a servo hostname and port were both provided.

    This only checks presence, not validity: the hostname must be a
    non-blank string and the port must be convertible with int().

    @param hostname  Hostname of the servohost.
    @param port      servo port, as an int or something int() accepts.

    @returns: True if both values are present, False otherwise.
    """
    if hostname is None or not hostname.strip():
        return False
    if port is None:
        return False
    try:
        int(port)
    except (TypeError, ValueError):
        # ValueError: a string that is not a number.
        # TypeError: a value of a type int() cannot convert at all.
        return False
    return True
1713
1714
def is_servo_host_information_valid(hostname, port):
    """Check if provided servo attributes are valid.

    Both values must be present, the port must be within 1..65000 and
    the hostname must be at least 5 characters made only of letters,
    digits, '-', '_' and '.'.

    @param hostname Hostname of the servohost.
    @param port     servo port number.

    @returns: A bool value to indicate if provided servo attribute valid.
    """
    if not _is_servo_host_information_exist(hostname, port):
        return False
    # checking the range of the port
    port_int = int(port)
    if port_int < 1 or port_int > 65000:
        return False
    # we expect the host to contain only letters, digits, '-', '_' or '.'
    # The pattern is a raw string so that '\.' reaches the regex engine
    # without being an invalid escape sequence in the literal.
    if not re.match(r'[a-zA-Z0-9-_\.]*$', hostname) or len(hostname) < 5:
        return False
    return True