Caroline Tice | f6ef439 | 2017-04-06 17:16:05 -0700 | [diff] [blame] | 1 | #!/usr/bin/env python2 |
Zhizhou Yang | cdd9e34 | 2019-09-19 20:56:32 -0700 | [diff] [blame] | 2 | # -*- coding: utf-8 -*- |
Zhizhou Yang | 4713fd1 | 2019-09-24 10:32:00 -0700 | [diff] [blame] | 3 | # |
Zhizhou Yang | cdd9e34 | 2019-09-19 20:56:32 -0700 | [diff] [blame] | 4 | # Copyright 2019 The Chromium OS Authors. All rights reserved. |
| 5 | # Use of this source code is governed by a BSD-style license that can be |
| 6 | # found in the LICENSE file. |
| 7 | |
Caroline Tice | a448645 | 2015-12-08 13:43:23 -0800 | [diff] [blame] | 8 | """This module controls locking and unlocking of test machines.""" |
| 9 | |
| 10 | from __future__ import print_function |
| 11 | |
cmtice | e5bc63b | 2015-05-27 16:59:37 -0700 | [diff] [blame] | 12 | import argparse |
Zhizhou Yang | 5322d4a | 2019-09-30 13:10:29 -0700 | [diff] [blame] | 13 | import enum |
cmtice | e5bc63b | 2015-05-27 16:59:37 -0700 | [diff] [blame] | 14 | import getpass |
| 15 | import os |
| 16 | import sys |
cmtice | e5bc63b | 2015-05-27 16:59:37 -0700 | [diff] [blame] | 17 | |
Zhizhou Yang | cdd9e34 | 2019-09-19 20:56:32 -0700 | [diff] [blame] | 18 | import file_lock_machine |
| 19 | |
| 20 | from cros_utils import command_executer |
Caroline Tice | a8af9a7 | 2016-07-20 12:52:59 -0700 | [diff] [blame] | 21 | from cros_utils import logger |
| 22 | from cros_utils import machines |
cmtice | e5bc63b | 2015-05-27 16:59:37 -0700 | [diff] [blame] | 23 | |
Luis Lozano | f2a3ef4 | 2015-12-15 13:49:30 -0800 | [diff] [blame] | 24 | |
class AFELockException(Exception):
  """Root of the exception hierarchy defined by this module."""
| 27 | |
| 28 | |
class MachineNotPingable(AFELockException):
  """Signals that a machine did not answer a ping."""
| 31 | |
| 32 | |
class LockingError(AFELockException):
  """Signals that the server could not lock/unlock a machine as requested."""
| 35 | |
| 36 | |
class DontOwnLock(AFELockException):
  """Signals an attempt to unlock a machine that someone else has locked.

  This should not be raised if the user specified '--force'.
  """
| 40 | |
| 41 | |
class NoAFEServer(AFELockException):
  """Signals that the autotest server cannot be found or accessed."""
| 44 | |
| 45 | |
class AFEAccessError(AFELockException):
  """Signals that the lab server returned no information for a lab machine."""
| 48 | |
| 49 | |
class MachineType(enum.Enum):
  """Enumeration of the places a managed machine can live."""
  # Lab machine managed through the Autotest Front End server.
  AFE = 'afe'
  # Machine guarded by a lock file on the local file system.
  LOCAL = 'local'
  # Lab machine leased/released through the skylab tool.
  SKYLAB = 'skylab'
| 55 | |
| 56 | |
class AFELockManager(object):
  """Class for locking/unlocking machines via Autotest Front End servers.

  This class contains methods for checking the locked status of machines,
  and for changing the locked status.  It handles HW lab machines (both AFE
  and Skylab), and local machines, using appropriate locking mechanisms for
  each.

  !!!IMPORTANT NOTE!!!  The AFE server can only be called from the main
  thread/process of a program.  If you launch threads and try to call it
  from a thread, you will get an error.  This has to do with restrictions
  in the Python virtual machine (and signal handling) and cannot be changed.
  """

  SKYLAB_PATH = '/usr/local/bin/skylab'
  LEASE_MINS = 600
  SKYLAB_CREDENTIAL = '/usr/local/google/home/mobiletc-prebuild' \
                      '/sheriff_utils/skylab_credential' \
                      '/chromeos-swarming-credential.json'
  SWARMING = 'chromite/third_party/swarming.client/swarming.py'
  SUCCESS = 0

  # Domain suffix that may be appended to lab machine names.
  _CROS_SUFFIX = '.cros'

  def __init__(self,
               remotes,
               force_option,
               chromeos_root,
               locks_dir='',
               log=None):
    """Initializes an AFELockManager object.

    Args:
      remotes: A list of machine names or ip addresses to be managed.  Names
        and ip addresses should be represented as strings.  If the list is
        empty, the lock manager will get all known machines.
      force_option: A Boolean indicating whether or not to force an unlock of
        a machine that was locked by someone else.
      chromeos_root: The ChromeOS chroot to use for the autotest scripts.
      locks_dir: A directory used for file locking local devices.
      log: If not None, this is the logger object to be used for writing out
        informational output messages.  It is expected to be an instance of
        Logger class from cros_utils/logger.py.
    """
    self.chromeos_root = chromeos_root
    self.user = getpass.getuser()
    self.logger = log or logger.GetLogger()
    self.ce = command_executer.GetCommandExecuter(self.logger)
    autotest_path = os.path.join(chromeos_root,
                                 'src/third_party/autotest/files')

    sys.path.append(chromeos_root)
    sys.path.append(autotest_path)
    sys.path.append(os.path.join(autotest_path, 'server', 'cros'))

    self.locks_dir = locks_dir

    # We have to wait to do these imports until the paths above have
    # been fixed.
    # pylint: disable=import-error
    from client import setup_modules
    setup_modules.setup(
        base_path=autotest_path, root_module_name='autotest_lib')

    from dynamic_suite import frontend_wrappers

    self.afe = frontend_wrappers.RetryingAFE(
        timeout_min=30, delay_sec=10, debug=False, server='cautotest')

    # De-duplicate the requested machines (ordering is not preserved).
    self.machines = list(set(remotes))
    self.toolchain_lab_machines = self.GetAllToolchainLabMachines()

    # No explicit request means "operate on every toolchain lab machine".
    if not self.machines:
      self.machines = self.toolchain_lab_machines
    self.force = force_option

    self.local_machines = []
    self.skylab_machines = []

  @classmethod
  def _StripCrosSuffix(cls, machine):
    """Returns machine without a trailing '.cros', if it has one.

    str.rstrip() must not be used for this: it removes any trailing run of
    the characters '.', 'c', 'r', 'o' and 's' rather than the literal suffix,
    which mangles names that merely end in those letters.

    Args:
      machine: String containing the name or ip address of a machine.

    Returns:
      The machine name with exactly one '.cros' suffix removed, or the name
      unchanged when it does not end in '.cros'.
    """
    if machine.endswith(cls._CROS_SUFFIX):
      return machine[:-len(cls._CROS_SUFFIX)]
    return machine

  def _SkylabCredentialArg(self, flag):
    """Builds the service-account argument for a skylab/swarming command.

    Args:
      flag: The command line flag that introduces the credential file.

    Returns:
      '<flag> <credential path>' when the credential file exists, otherwise
      an empty string.
    """
    if os.path.exists(self.SKYLAB_CREDENTIAL):
      return '%s %s' % (flag, self.SKYLAB_CREDENTIAL)
    return ''

  def CheckMachine(self, machine, error_msg):
    """Verifies that machine is responding to ping.

    The plain name is tried first, then the name with '.cros' appended.

    Args:
      machine: String containing the name or ip address of machine to check.
      error_msg: Message to print if ping fails.

    Raises:
      MachineNotPingable: If machine is not responding to 'ping'
    """
    if not machines.MachineIsPingable(machine, logging_level='none'):
      cros_machine = machine + '.cros'
      if not machines.MachineIsPingable(cros_machine, logging_level='none'):
        raise MachineNotPingable(error_msg)

  def GetAllToolchainLabMachines(self):
    """Gets a list of all the toolchain machines in the ChromeOS HW lab.

    The machines are read from the 'crosperf/default_remotes' file that lives
    next to this module.  Every non-blank line must have the form
    '<label>: <machine> <machine> ...'.

    Returns:
      A list of names of the toolchain machines in the ChromeOS HW lab.
    """
    machines_file = os.path.join(
        os.path.dirname(__file__), 'crosperf', 'default_remotes')
    machine_list = []
    with open(machines_file, 'r') as input_file:
      for line in input_file:
        # A blank line (e.g. a trailing newline at the end of the file) holds
        # no machines; skip it instead of failing to unpack the split below.
        if not line.strip():
          continue
        _, remotes = line.split(':')
        machine_list.extend(remotes.split())
    return machine_list

  def GetMachineType(self, m):
    """Get where the machine is located.

    Args:
      m: String containing the name or ip address of machine.

    Returns:
      Value of the type in MachineType Enum.  Machines that were not
      registered as local or skylab machines are reported as AFE machines.
    """
    if m in self.local_machines:
      return MachineType.LOCAL
    if m in self.skylab_machines:
      return MachineType.SKYLAB
    return MachineType.AFE

  def PrintStatusHeader(self):
    """Prints the status header lines for machines."""
    print('\nMachine (Board)\t\t\t\t\tStatus')
    print('---------------\t\t\t\t\t------')

  def PrintStatus(self, m, state, machine_type):
    """Prints status for a single machine.

    Args:
      m: String containing the name or ip address of machine.
      state: A dictionary of the current state of the machine.
      machine_type: MachineType to determine where the machine is located.
    """
    is_local = machine_type == MachineType.LOCAL
    if state['locked']:
      if (machine_type == MachineType.AFE and
          m not in self.toolchain_lab_machines):
        m += '.cros'
      # Local machines get extra tabs to keep the status column aligned.
      padding = '\t\t\t' if is_local else ''
      print('%s (%s)\t%slocked by %s since %s' %
            (m, state['board'], padding, state['locked_by'],
             state['lock_time']))
    else:
      padding = '\t\t' if is_local else ''
      print('%s (%s)\t\t%sunlocked' % (m, state['board'], padding))

  def AddMachineToLocal(self, machine):
    """Adds a machine to local machine list.

    Args:
      machine: The machine to be added.
    """
    if machine not in self.local_machines:
      self.local_machines.append(machine)

  def AddMachineToSkylab(self, machine):
    """Adds a machine to skylab machine list.

    Args:
      machine: The machine to be added.
    """
    if machine not in self.skylab_machines:
      self.skylab_machines.append(machine)

  def ListMachineStates(self, machine_states):
    """Gets and prints the current status for a list of machines.

    Prints out the current status for all of the machines in the current
    AFELockManager's list of machines (set when the object is initialized).

    Args:
      machine_states: A dictionary of the current state of every machine in
        the current AFELockManager's list of machines.  Normally obtained by
        calling AFELockManager::GetMachineStates.
    """
    self.PrintStatusHeader()
    for m in machine_states:
      machine_type = self.GetMachineType(m)
      state = machine_states[m]
      self.PrintStatus(m, state, machine_type)

  def UpdateLockInAFE(self, should_lock_machine, machine):
    """Calls an AFE server to lock/unlock a machine.

    Args:
      should_lock_machine: Boolean indicating whether to lock the machine (True)
        or unlock the machine (False).
      machine: The machine to update.

    Returns:
      True if requested action succeeded, else False.
    """
    kwargs = {'locked': should_lock_machine}
    if should_lock_machine:
      kwargs['lock_reason'] = 'toolchain user request (%s)' % self.user

    # The AFE is queried by bare host name (everything before the first '.'),
    # the same way GetMachineStates looks hosts up.  Always derive it: leaving
    # it unset for machines outside the toolchain lab list used to fail with
    # an error that the handler below silently turned into False.
    hostname = machine.split('.')[0]

    try:
      self.afe.run(
          'modify_hosts',
          host_filter_data={'hostname__in': [hostname]},
          update_data=kwargs)
    except Exception:
      # Best effort: any server failure is reported to the caller as False.
      return False
    return True

  def UpdateLockInSkylab(self, should_lock_machine, machine):
    """Ask skylab to lease/release a machine.

    Args:
      should_lock_machine: Boolean indicating whether to lock the machine (True)
        or unlock the machine (False).
      machine: The machine to update.

    Returns:
      True if requested action succeeded, else False.
    """
    try:
      if should_lock_machine:
        ret = self.LeaseSkylabMachine(machine)
      else:
        ret = self.ReleaseSkylabMachine(machine)
    except Exception:
      # Best effort: any failure is reported to the caller as False.
      return False
    return ret

  def UpdateFileLock(self, should_lock_machine, machine):
    """Use file lock for local machines.

    Args:
      should_lock_machine: Boolean indicating whether to lock the machine (True)
        or unlock the machine (False).
      machine: The machine to update.

    Returns:
      True if requested action succeeded, else False.
    """
    try:
      if should_lock_machine:
        ret = file_lock_machine.Machine(machine, self.locks_dir).Lock(
            True, sys.argv[0])
      else:
        ret = file_lock_machine.Machine(machine, self.locks_dir).Unlock(True)
    except Exception:
      # Best effort: any failure is reported to the caller as False.
      return False
    return ret

  def UpdateMachines(self, lock_machines):
    """Sets the locked state of the machines to the requested value.

    The machines updated are the ones in self.machines (specified when the
    class object was initialized).  Afterwards self.machines holds only the
    machines that were updated successfully.

    Args:
      lock_machines: Boolean indicating whether to lock the machines (True) or
        unlock the machines (False).

    Returns:
      A list of the machines whose state was successfully updated.
    """
    updated_machines = []
    action = 'Locking' if lock_machines else 'Unlocking'
    for m in self.machines:
      # TODO(zhizhouy): Handling exceptions with more details when locking
      # doesn't succeed.
      machine_type = self.GetMachineType(m)
      if machine_type == MachineType.SKYLAB:
        ret = self.UpdateLockInSkylab(lock_machines, m)
      elif machine_type == MachineType.LOCAL:
        ret = self.UpdateFileLock(lock_machines, m)
      else:
        ret = self.UpdateLockInAFE(lock_machines, m)

      if ret:
        self.logger.LogOutput(
            '%s %s machine succeeded: %s.' % (action, machine_type.value, m))
        updated_machines.append(m)
      else:
        self.logger.LogOutput(
            '%s %s machine failed: %s.' % (action, machine_type.value, m))

    self.machines = updated_machines
    return updated_machines

  def _InternalRemoveMachine(self, machine):
    """Remove machine from internal list of machines.

    Args:
      machine: Name of machine to be removed from internal list.
    """
    # Check to see if machine is lab machine and if so, make sure it has
    # ".cros" on the end.
    cros_machine = machine
    if machine.find('rack') > 0 and machine.find('row') > 0:
      if '.cros' not in machine:
        cros_machine = cros_machine + '.cros'

    # Drop the machine under either spelling.
    self.machines = [
        m for m in self.machines if m != cros_machine and m != machine
    ]

  def CheckMachineLocks(self, machine_states, cmd):
    """Check that every machine in requested list is in the proper state.

    If the cmd is 'unlock' verify that every machine is locked by requestor.
    If the cmd is 'lock' verify that every machine is currently unlocked.
    Machines that are already in the requested state are removed from
    self.machines with a warning.

    Args:
      machine_states: A dictionary of the current state of every machine in
        the current AFELockManager's list of machines.  Normally obtained by
        calling AFELockManager::GetMachineStates.
      cmd: The user-requested action for the machines: 'lock' or 'unlock'.

    Raises:
      DontOwnLock: The lock on a requested machine is owned by someone else.
    """
    # items() rather than iteritems() so this works on Python 2 and 3 alike.
    for k, state in machine_states.items():
      if cmd == 'unlock':
        if not state['locked']:
          self.logger.LogWarning('Attempt to unlock already unlocked machine '
                                 '(%s).' % k)
          self._InternalRemoveMachine(k)

        # TODO(zhizhouy): Skylab doesn't support host info such as locked_by.
        # Need to update this when skylab supports it.
        if (state['locked'] and state['locked_by'] and
            state['locked_by'] != self.user):
          raise DontOwnLock('Attempt to unlock machine (%s) locked by someone '
                            'else (%s).' % (k, state['locked_by']))
      elif cmd == 'lock':
        if state['locked']:
          self.logger.LogWarning(
              'Attempt to lock already locked machine (%s)' % k)
          self._InternalRemoveMachine(k)

  def GetMachineStates(self, cmd=''):
    """Gets the current state of all the requested machines.

    Gets the current state of all the requested machines.  Stores the data in a
    dictionary keyed by machine name.

    Args:
      cmd: The command for which we are getting the machine states.  It only
        influences local and skylab machines, whose real state cannot be
        queried: they are reported as unlocked when cmd is 'lock' and as
        locked otherwise.

    Returns:
      A dictionary of machine states for all the machines in the AFELockManager
      object.

    Raises:
      NoAFEServer: Cannot find the HW Lab AFE server.
      AFEAccessError: An error occurred when querying the server about a
        machine.
    """
    if not self.afe:
      raise NoAFEServer('Error: Cannot connect to main AFE server.')

    machine_list = {}
    for m in self.machines:
      # For local or skylab machines, we simply set {'locked': status} for them
      # TODO(zhizhouy): This is a quick fix since skylab cannot return host info
      # as afe does. We need to get more info such as locked_by when skylab
      # supports that.
      if m in self.local_machines or m in self.skylab_machines:
        machine_list[m] = {
            'locked': 0 if cmd == 'lock' else 1,
            'board': '??',
            'locked_by': '',
            'lock_time': ''
        }
        continue

      # For autotest machines, we use afe APIs to get locking info.
      mod_host = m.split('.')[0]
      host_info = self.afe.get_hosts(hostname=mod_host)
      if not host_info:
        raise AFEAccessError('Unable to get information about %s from main'
                             ' autotest server.' % m)
      host_info = host_info[0]
      values = {
          'board': host_info.platform if host_info.platform else '??',
          'locked': host_info.locked,
          'locked_by': host_info.locked_by if host_info.locked else '',
          'lock_time': host_info.lock_time if host_info.locked else '',
      }
      # Keyed by the host name the server reports, not the requested name.
      machine_list[host_info.hostname] = values

    return machine_list

  def CheckMachineInSkylab(self, machine):
    """Run command to check if machine is in Skylab or not.

    Args:
      machine: String containing the name of the machine to look up.

    Returns:
      True if machine in skylab, else False
    """
    credential = self._SkylabCredentialArg('--auth-service-account-json')
    swarming = os.path.join(self.chromeos_root, self.SWARMING)
    cmd = (('%s query --swarming https://chromeos-swarming.appspot.com '
            "%s 'bots/list?is_dead=FALSE&dimensions=dut_name:%s'") %
           (swarming, credential, self._StripCrosSuffix(machine)))
    ret_tup = self.ce.RunCommandWOutput(cmd)
    # The command will return a json output as stdout. If machine not in skylab
    # stdout will look like this:
    #  {
    #    "death_timeout": "600",
    #    "now": "TIMESTAMP"
    #  }
    # Otherwise there will be a tuple starting with 'items', we simply detect
    # this keyword for result.
    return 'items' in ret_tup[1]

  def LeaseSkylabMachine(self, machine):
    """Run command to lease dut from skylab.

    Args:
      machine: String containing the name of the machine to lease.

    Returns:
      True if succeeded, False if failed.
    """
    credential = self._SkylabCredentialArg('-service-account-json')
    cmd = ('%s lease-dut -minutes %s %s %s' %
           (self.SKYLAB_PATH, self.LEASE_MINS, credential,
            self._StripCrosSuffix(machine)))
    # Wait 120 seconds for server to start the lease task, if not started,
    # we will treat it as unavailable.
    check_interval_time = 120
    retval = self.ce.RunCommand(cmd, command_timeout=check_interval_time)
    return retval == self.SUCCESS

  def ReleaseSkylabMachine(self, machine):
    """Run command to release dut from skylab.

    Args:
      machine: String containing the name of the machine to release.

    Returns:
      True if succeeded, False if failed.
    """
    credential = self._SkylabCredentialArg('-service-account-json')
    cmd = ('%s release-dut %s %s' %
           (self.SKYLAB_PATH, credential, self._StripCrosSuffix(machine)))
    retval = self.ce.RunCommand(cmd)
    return retval == self.SUCCESS
| 525 | |
cmtice | e5bc63b | 2015-05-27 16:59:37 -0700 | [diff] [blame] | 526 | |
def Main(argv):
  """Parse the options, initialize lock manager and dispatch proper method.

  Args:
    argv: The options with which this script was invoked.

  Returns:
    0 unless an exception is raised.  Invalid or missing options are reported
    through the argument parser, which exits the program.
  """
  parser = argparse.ArgumentParser()

  parser.add_argument(
      '--list',
      dest='cmd',
      action='store_const',
      const='status',
      help='List current status of all known machines.')
  parser.add_argument(
      '--lock',
      dest='cmd',
      action='store_const',
      const='lock',
      help='Lock given machine(s).')
  parser.add_argument(
      '--unlock',
      dest='cmd',
      action='store_const',
      const='unlock',
      help='Unlock given machine(s).')
  parser.add_argument(
      '--status',
      dest='cmd',
      action='store_const',
      const='status',
      help='List current status of given machine(s).')
  parser.add_argument(
      '--remote', dest='remote', help='machines on which to operate')
  parser.add_argument(
      '--chromeos_root',
      dest='chromeos_root',
      required=True,
      help='ChromeOS root to use for autotest scripts.')
  parser.add_argument(
      '--force',
      dest='force',
      action='store_true',
      default=False,
      help='Force lock/unlock of machines, even if not'
      ' current lock owner.')

  options = parser.parse_args(argv)
  cmd = options.cmd

  # Validate the operation first so that a missing operation is not reported
  # as a missing machine list.
  if not cmd:
    parser.error('No operation selected (--list, --status, --lock, --unlock).')

  # Only 'status' may run without machines: it then covers all known ones.
  if not options.remote and cmd != 'status':
    parser.error('No machines specified for operation.')

  if not os.path.isdir(options.chromeos_root):
    parser.error('Cannot find chromeos_root: %s.' % options.chromeos_root)

  machine_list = options.remote.split() if options.remote else []

  lock_manager = AFELockManager(machine_list, options.force,
                                options.chromeos_root)

  machine_states = lock_manager.GetMachineStates(cmd=cmd)

  if cmd == 'status':
    lock_manager.ListMachineStates(machine_states)

  elif cmd in ('lock', 'unlock'):
    # Without --force, machines already in the requested state are dropped and
    # unlocking a machine owned by someone else raises.
    if not lock_manager.force:
      lock_manager.CheckMachineLocks(machine_states, cmd)
    lock_manager.UpdateMachines(cmd == 'lock')

  return 0
cmtice | e5bc63b | 2015-05-27 16:59:37 -0700 | [diff] [blame] | 619 | |
| 620 | |
# Script entry point: hand the command line (minus the program name) to Main
# and use its return value as the process exit status.
if __name__ == '__main__':
  exit_status = Main(sys.argv[1:])
  sys.exit(exit_status)