Hung-Te Lin | f2f78f7 | 2012-02-08 19:27:11 +0800 | [diff] [blame] | 1 | #!/usr/bin/python -u |
Hung-Te Lin | f2f78f7 | 2012-02-08 19:27:11 +0800 | [diff] [blame] | 2 | # -*- coding: utf-8 -*- |
| 3 | # |
Jon Salz | 37eccbd | 2012-05-25 16:06:52 +0800 | [diff] [blame] | 4 | # Copyright (c) 2012 The Chromium OS Authors. All rights reserved. |
Hung-Te Lin | f2f78f7 | 2012-02-08 19:27:11 +0800 | [diff] [blame] | 5 | # Use of this source code is governed by a BSD-style license that can be |
| 6 | # found in the LICENSE file. |
| 7 | |
| 8 | ''' |
| 9 | The main factory flow that runs the factory test and finalizes a device. |
| 10 | ''' |
| 11 | |
Jon Salz | e12c2b3 | 2013-06-25 16:24:34 +0800 | [diff] [blame] | 12 | import glob |
Jon Salz | 0405ab5 | 2012-03-16 15:26:52 +0800 | [diff] [blame] | 13 | import logging |
| 14 | import os |
Jon Salz | 73e0fd0 | 2012-04-04 11:46:38 +0800 | [diff] [blame] | 15 | import Queue |
Jon Salz | e12c2b3 | 2013-06-25 16:24:34 +0800 | [diff] [blame] | 16 | import shutil |
Jon Salz | 77c151e | 2012-08-28 07:20:37 +0800 | [diff] [blame] | 17 | import signal |
Jon Salz | 0405ab5 | 2012-03-16 15:26:52 +0800 | [diff] [blame] | 18 | import sys |
Jon Salz | eff9418 | 2013-06-19 15:06:28 +0800 | [diff] [blame] | 19 | import syslog |
Jon Salz | 0405ab5 | 2012-03-16 15:26:52 +0800 | [diff] [blame] | 20 | import threading |
| 21 | import time |
| 22 | import traceback |
Jon Salz | 258a40c | 2012-04-19 12:34:01 +0800 | [diff] [blame] | 23 | import uuid |
Jon Salz | b10cf51 | 2012-08-09 17:29:21 +0800 | [diff] [blame] | 24 | from xmlrpclib import Binary |
Hung-Te Lin | f2f78f7 | 2012-02-08 19:27:11 +0800 | [diff] [blame] | 25 | from collections import deque |
| 26 | from optparse import OptionParser |
Hung-Te Lin | f2f78f7 | 2012-02-08 19:27:11 +0800 | [diff] [blame] | 27 | |
Jon Salz | 0697cbf | 2012-07-04 15:14:04 +0800 | [diff] [blame] | 28 | import factory_common # pylint: disable=W0611 |
jcliang | cd68818 | 2012-08-20 21:01:26 +0800 | [diff] [blame] | 29 | from cros.factory import event_log |
| 30 | from cros.factory import system |
Cheng-Yi Chiang | d040652 | 2013-04-01 15:40:18 +0800 | [diff] [blame] | 31 | from cros.factory.event_log import EventLog, FloatDigit |
Tom Wai-Hong Tam | d33723e | 2013-04-10 21:14:37 +0800 | [diff] [blame] | 32 | from cros.factory.event_log_watcher import EventLogWatcher |
jcliang | cd68818 | 2012-08-20 21:01:26 +0800 | [diff] [blame] | 33 | from cros.factory.goofy import test_environment |
| 34 | from cros.factory.goofy import time_sanitizer |
Jon Salz | 8359178 | 2012-06-26 11:09:58 +0800 | [diff] [blame] | 35 | from cros.factory.goofy import updater |
jcliang | cd68818 | 2012-08-20 21:01:26 +0800 | [diff] [blame] | 36 | from cros.factory.goofy.goofy_rpc import GoofyRPC |
| 37 | from cros.factory.goofy.invocation import TestInvocation |
| 38 | from cros.factory.goofy.prespawner import Prespawner |
Cheng-Yi Chiang | 344b10f | 2013-05-03 16:44:03 +0800 | [diff] [blame] | 39 | from cros.factory.goofy.system_log_manager import SystemLogManager |
jcliang | cd68818 | 2012-08-20 21:01:26 +0800 | [diff] [blame] | 40 | from cros.factory.goofy.web_socket_manager import WebSocketManager |
Cheng-Yi Chiang | d818695 | 2013-04-04 23:41:14 +0800 | [diff] [blame] | 41 | from cros.factory.system.board import Board, BoardException |
jcliang | cd68818 | 2012-08-20 21:01:26 +0800 | [diff] [blame] | 42 | from cros.factory.system.charge_manager import ChargeManager |
Cheng-Yi Chiang | cdfa418 | 2013-05-05 03:20:19 +0800 | [diff] [blame] | 43 | from cros.factory.system.core_dump_manager import CoreDumpManager |
Jon Salz | ce6a7f8 | 2013-06-10 18:22:54 +0800 | [diff] [blame] | 44 | from cros.factory.system.cpufreq_manager import CpufreqManager |
Jon Salz | b92c511 | 2012-09-21 15:40:11 +0800 | [diff] [blame] | 45 | from cros.factory.system import disk_space |
jcliang | cd68818 | 2012-08-20 21:01:26 +0800 | [diff] [blame] | 46 | from cros.factory.test import factory |
| 47 | from cros.factory.test import state |
Jon Salz | 51528e1 | 2012-07-02 18:54:45 +0800 | [diff] [blame] | 48 | from cros.factory.test import shopfloor |
Jon Salz | 8359178 | 2012-06-26 11:09:58 +0800 | [diff] [blame] | 49 | from cros.factory.test import utils |
Jon Salz | 128b093 | 2013-07-03 16:55:26 +0800 | [diff] [blame^] | 50 | from cros.factory.test.test_lists import test_lists |
Jon Salz | 8359178 | 2012-06-26 11:09:58 +0800 | [diff] [blame] | 51 | from cros.factory.test.event import Event |
| 52 | from cros.factory.test.event import EventClient |
| 53 | from cros.factory.test.event import EventServer |
jcliang | cd68818 | 2012-08-20 21:01:26 +0800 | [diff] [blame] | 54 | from cros.factory.test.factory import TestState |
Dean Liao | 592e4d5 | 2013-01-10 20:06:39 +0800 | [diff] [blame] | 55 | from cros.factory.tools.key_filter import KeyFilter |
Jon Salz | 2af235d | 2013-06-24 14:47:21 +0800 | [diff] [blame] | 56 | from cros.factory.utils import file_utils |
Jon Salz | 78c3239 | 2012-07-25 14:18:29 +0800 | [diff] [blame] | 57 | from cros.factory.utils.process_utils import Spawn |
Hung-Te Lin | f2f78f7 | 2012-02-08 19:27:11 +0800 | [diff] [blame] | 58 | |
| 59 | |
# Path of the file holding the HWID config tag; get_hwid_cfg() reads it
# when the CROS_HWID environment variable is not set.
HWID_CFG_PATH = '/usr/local/share/chromeos-hwid/cfg'
# The "caches" directory directly under the factory state root.
CACHES_DIR = os.path.join(factory.get_state_root(), "caches")

# File that suppresses reboot if present (e.g., for development).
NO_REBOOT_FILE = '/var/log/factory.noreboot'

# Value for tests_after_shutdown that forces auto-run (e.g., after
# a factory update, when the available set of tests might change).
FORCE_AUTO_RUN = 'force_auto_run'

# NOTE(review): presumably the timeout, in seconds, used when waiting on the
# run queue; the code that uses it is outside this view -- confirm.
RUN_QUEUE_TIMEOUT_SECS = 10

# Sync disks only when the battery level is higher than this value.
# Otherwise, a power loss during the disk sync operation could lead to an
# even worse outcome.
MIN_BATTERY_LEVEL_FOR_DISK_SYNC = 1.0

# 64 KiB.  NOTE(review): presumably an upper bound on the size of a crash
# file; the code that uses it is outside this view -- confirm.
MAX_CRASH_FILE_SIZE = 64*1024
| 77 | |
# Warning text about running Goofy inside the chroot.  The message is framed
# by a row of 70 asterisks above and below and explains how to set up a VNC
# X server so that Goofy can be run from the chroot.
GOOFY_IN_CHROOT_WARNING = '\n' + ('*' * 70) + '''
You are running Goofy inside the chroot. Autotests are not supported.

To use Goofy in the chroot, first install an Xvnc server:

sudo apt-get install tightvncserver

...and then start a VNC X server outside the chroot:

vncserver :10 &
vncviewer :10

...and run Goofy as follows:

env --unset=XAUTHORITY DISPLAY=localhost:10 python goofy.py
''' + ('*' * 70)
# NOTE(review): presumably set to True to silence the warning above; the code
# that reads this flag is outside this view -- confirm.
suppress_chroot_warning = False
Hung-Te Lin | f2f78f7 | 2012-02-08 19:27:11 +0800 | [diff] [blame] | 95 | |
def get_hwid_cfg():
  '''Looks up the HWID config tag.

  The CROS_HWID environment variable takes precedence.  When it is not set,
  the contents of the file at HWID_CFG_PATH are used, with leading and
  trailing whitespace stripped.

  Returns:
    The HWID config tag, or an empty string if none can be found.
  '''
  hwid_from_env = os.environ.get('CROS_HWID')
  if hwid_from_env is not None:
    return hwid_from_env

  if not os.path.exists(HWID_CFG_PATH):
    return ''

  with open(HWID_CFG_PATH, 'rt') as cfg_file:
    return cfg_file.read().strip()
Hung-Te Lin | f2f78f7 | 2012-02-08 19:27:11 +0800 | [diff] [blame] | 106 | |
| 107 | |
# Module-level flag, initially False.  NOTE(review): presumably flipped once
# logging has been configured; the code that updates it is outside this
# view -- confirm.
_inited_logging = False
Hung-Te Lin | f2f78f7 | 2012-02-08 19:27:11 +0800 | [diff] [blame] | 109 | |
| 110 | class Goofy(object): |
Jon Salz | 0697cbf | 2012-07-04 15:14:04 +0800 | [diff] [blame] | 111 | ''' |
| 112 | The main factory flow. |
| 113 | |
| 114 | Note that all methods in this class must be invoked from the main |
| 115 | (event) thread. Other threads, such as callbacks and TestInvocation |
| 116 | methods, should instead post events on the run queue. |
| 117 | |
| 118 | TODO: Unit tests. (chrome-os-partner:7409) |
| 119 | |
| 120 | Properties: |
| 121 | uuid: A unique UUID for this invocation of Goofy. |
| 122 | state_instance: An instance of FactoryState. |
| 123 | state_server: The FactoryState XML/RPC server. |
| 124 | state_server_thread: A thread running state_server. |
| 125 | event_server: The EventServer socket server. |
| 126 | event_server_thread: A thread running event_server. |
| 127 | event_client: A client to the event server. |
| 128 | connection_manager: The connection_manager object. |
Cheng-Yi Chiang | 835f268 | 2013-05-06 22:15:48 +0800 | [diff] [blame] | 129 | system_log_manager: The SystemLogManager object. |
| 130 | core_dump_manager: The CoreDumpManager object. |
Jon Salz | 0697cbf | 2012-07-04 15:14:04 +0800 | [diff] [blame] | 131 | ui_process: The factory ui process object. |
| 132 | run_queue: A queue of callbacks to invoke from the main thread. |
| 133 | invocations: A map from FactoryTest objects to the corresponding |
| 134 | TestInvocations objects representing active tests. |
| 135 | tests_to_run: A deque of tests that should be run when the current |
| 136 | test(s) complete. |
| 137 | options: Command-line options. |
| 138 | args: Command-line args. |
| 139 | test_list: The test list. |
Jon Salz | 128b093 | 2013-07-03 16:55:26 +0800 | [diff] [blame^] | 140 | test_lists: All new-style test lists. |
Jon Salz | 0697cbf | 2012-07-04 15:14:04 +0800 | [diff] [blame] | 141 | event_handlers: Map of Event.Type to the method used to handle that |
| 142 | event. If the method has an 'event' argument, the event is passed |
| 143 | to the handler. |
| 144 | exceptions: Exceptions encountered in invocation threads. |
Jon Salz | 3c493bb | 2013-02-07 17:24:58 +0800 | [diff] [blame] | 145 | last_log_disk_space_message: The last message we logged about disk space |
| 146 | (to avoid duplication). |
Cheng-Yi Chiang | cdfa418 | 2013-05-05 03:20:19 +0800 | [diff] [blame] | 147 | last_kick_sync_time: The last time to kick system_log_manager to sync |
| 148 | because of core dump files (to avoid kicking too soon then abort the |
| 149 | sync.) |
Jon Salz | 416f9cc | 2013-05-10 18:32:50 +0800 | [diff] [blame] | 150 | hooks: A Hooks object containing hooks for various Goofy actions. |
Jon Salz | 0697cbf | 2012-07-04 15:14:04 +0800 | [diff] [blame] | 151 | ''' |
def __init__(self):
  '''Sets every attribute to an inert default and builds the event table.

  Only in-memory state is created here: a fresh UUID, the run queue, empty
  containers and the event_handlers map.  All servers, managers and
  subprocess handles start out as None.
  '''
  self.uuid = str(uuid.uuid4())

  # Servers, clients, managers and subprocess handles.
  self.state_instance = None
  self.state_server = None
  self.state_server_thread = None
  self.goofy_rpc = None
  self.event_server = None
  self.event_server_thread = None
  self.event_client = None
  self.connection_manager = None
  self.charge_manager = None
  self.time_sanitizer = None
  self.time_synced = False
  self.log_watcher = None
  self.system_log_manager = None
  self.core_dump_manager = None
  self.event_log = None
  self.prespawner = None
  self.ui_process = None
  self.dummy_shopfloor = None

  # Test scheduling state.
  self.run_queue = Queue.Queue()
  self.invocations = {}
  self.tests_to_run = deque()
  self.visible_test = None
  self.chrome = None
  self.hooks = None
  self.cpu_usage_watcher = None

  self.options = None
  self.args = None
  self.test_list = None
  self.test_lists = None
  # Callables appended here are handlers queued for UI startup (see
  # handle_shutdown_complete).
  self.on_ui_startup = []
  self.env = None

  # Bookkeeping for periodic work; None until first set.
  self.last_idle = None
  self.last_shutdown_time = None
  self.last_update_check = None
  self.last_sync_time = None
  self.last_log_disk_space_time = None
  self.last_log_disk_space_message = None
  self.last_check_battery_time = None
  self.last_check_battery_message = None
  self.last_kick_sync_time = None
  self.exclusive_items = set()
  self.key_filter = None
  self.cpufreq_manager = None

  def test_or_root(event, parent_or_group=True):
    '''Returns the test affected by a particular event.

    Args:
      event: The event containing an optional 'path' attribute.
      parent_or_group: If True, returns the top-level parent for a test (the
        root node of the tests that need to be run together if the given
        test path is to be run).

    Returns:
      The test looked up from the event's path, or the whole test list if
      the event has no (or an empty) path.
    '''
    path = getattr(event, 'path', None)
    if not path:
      return self.test_list

    test = self.test_list.lookup_path(path)
    if parent_or_group:
      test = test.get_top_level_parent_or_group()
    return test

  self.event_handlers = {
    Event.Type.SWITCH_TEST: self.handle_switch_test,
    Event.Type.SHOW_NEXT_ACTIVE_TEST:
      lambda event: self.show_next_active_test(),
    Event.Type.RESTART_TESTS:
      lambda event: self.restart_tests(root=test_or_root(event)),
    Event.Type.AUTO_RUN:
      lambda event: self.auto_run(root=test_or_root(event)),
    Event.Type.RE_RUN_FAILED:
      lambda event: self.re_run_failed(root=test_or_root(event)),
    Event.Type.RUN_TESTS_WITH_STATUS:
      lambda event: self.run_tests_with_status(
        event.status,
        root=test_or_root(event)),
    Event.Type.REVIEW:
      lambda event: self.show_review_information(),
    Event.Type.UPDATE_SYSTEM_INFO:
      lambda event: self.update_system_info(),
    # STOP acts on the exact test named by the event, not on its top-level
    # parent or group.
    Event.Type.STOP:
      lambda event: self.stop(root=test_or_root(event, False),
                              fail=getattr(event, 'fail', False),
                              reason=getattr(event, 'reason', None)),
    Event.Type.SET_VISIBLE_TEST:
      lambda event: self.set_visible_test(
        self.test_list.lookup_path(event.path)),
    Event.Type.CLEAR_STATE:
      lambda event: self.clear_state(self.test_list.lookup_path(event.path)),
  }

  self.exceptions = []
  self.web_socket_manager = None
| 253 | |
def destroy(self):
  '''Stops the subprocesses, servers, threads and helpers held by Goofy.

  Each handle is torn down only if it is set, and is cleared afterwards so
  that calling destroy() again does not stop the same object twice.
  check_exceptions() is invoked at the end.
  '''
  if self.chrome:
    self.chrome.kill()
    self.chrome = None
  if self.dummy_shopfloor:
    self.dummy_shopfloor.kill()
    self.dummy_shopfloor = None
  if self.ui_process:
    utils.kill_process_tree(self.ui_process, 'ui')
    self.ui_process = None
  if self.web_socket_manager:
    logging.info('Stopping web sockets')
    self.web_socket_manager.close()
    self.web_socket_manager = None
  if self.state_server_thread:
    logging.info('Stopping state server')
    # Ask serve_forever() to return, wait for the thread, then release the
    # listening socket.
    self.state_server.shutdown()
    self.state_server_thread.join()
    self.state_server.server_close()
    self.state_server_thread = None
  if self.state_instance:
    # NOTE(review): state_instance is closed but intentionally not cleared
    # here, matching the previous behaviour; confirm whether any caller
    # still reads it after destroy().
    self.state_instance.close()
  if self.event_server_thread:
    logging.info('Stopping event server')
    self.event_server.shutdown()  # pylint: disable=E1101
    self.event_server_thread.join()
    self.event_server.server_close()
    self.event_server_thread = None
  if self.log_watcher:
    if self.log_watcher.IsThreadStarted():
      self.log_watcher.StopWatchThread()
    self.log_watcher = None
  if self.system_log_manager:
    if self.system_log_manager.IsThreadRunning():
      self.system_log_manager.StopSyncThread()
    self.system_log_manager = None
  if self.prespawner:
    logging.info('Stopping prespawner')
    self.prespawner.stop()
    self.prespawner = None
  if self.event_client:
    logging.info('Closing event client')
    self.event_client.close()
    self.event_client = None
  if self.cpufreq_manager:
    self.cpufreq_manager.Stop()
    self.cpufreq_manager = None
  if self.event_log:
    self.event_log.Close()
    self.event_log = None
  if self.key_filter:
    self.key_filter.Stop()
    self.key_filter = None
  if self.cpu_usage_watcher:
    self.cpu_usage_watcher.terminate()
    self.cpu_usage_watcher = None

  self.check_exceptions()
  logging.info('Done destroying Goofy')
| 310 | |
def start_state_server(self):
  '''Creates the state server, registers Goofy RPCs and starts serving.

  The server is bound to 0.0.0.0 and runs serve_forever() on a thread
  named 'StateServer'.
  '''
  # Before starting state server, remount stateful partitions with
  # no commit flag.  The default commit time (commit=600) makes corruption
  # too likely.
  file_utils.ResetCommitTime()

  instance, server = state.create_server(bind_address='0.0.0.0')
  self.state_instance = instance
  self.state_server = server

  self.goofy_rpc = GoofyRPC(self)
  self.goofy_rpc.RegisterMethods(instance)

  logging.info('Starting state server')
  server_thread = threading.Thread(target=server.serve_forever,
                                   name='StateServer')
  self.state_server_thread = server_thread
  server_thread.start()
| 326 | |
def start_event_server(self):
  '''Starts the event server and the objects that talk to it.

  Runs the EventServer on a thread named 'EventServer', creates an
  EventClient whose callback is handle_event and whose event loop is the
  run queue, and registers a WebSocketManager handler for "/event" on the
  state server.
  '''
  server = EventServer()
  self.event_server = server
  logging.info('Starting factory event server')
  server_thread = threading.Thread(
    target=server.serve_forever,
    name='EventServer')  # pylint: disable=E1101
  self.event_server_thread = server_thread
  server_thread.start()

  self.event_client = EventClient(
    callback=self.handle_event, event_loop=self.run_queue)

  manager = WebSocketManager(self.uuid)
  self.web_socket_manager = manager
  self.state_server.add_handler("/event", manager.handle_web_socket)
| 341 | |
def start_ui(self):
  '''Spawns the UI process and blocks until it reports that it is ready.

  The UI script is test/ui.py under the factory package path; it is given
  the test list option and, in verbose mode, '-v'.
  '''
  ui_script = os.path.join(factory.FACTORY_PACKAGE_PATH, 'test', 'ui.py')
  ui_proc_args = [ui_script, self.options.test_list]
  if self.options.verbose:
    ui_proc_args.append('-v')

  logging.info('Starting ui %s', ui_proc_args)
  self.ui_process = Spawn(ui_proc_args)

  logging.info('Waiting for UI to come up...')

  def is_ui_ready(event):
    return event.type == Event.Type.UI_READY

  self.event_client.wait(is_ui_ready)
  logging.info('UI has started')
| 354 | |
def set_visible_test(self, test):
  '''Makes the given test the visible one.

  Nothing happens if the test is already the visible one, or if it has no
  UI.  Otherwise the new test (if any) is marked visible, the previously
  visible test (if any) is marked not visible, and visible_test is updated.

  Args:
    test: The test to show, or a false value to show no test.
  '''
  previous = self.visible_test
  if previous == test:
    return

  if test:
    if not test.has_ui:
      return
    test.update_state(visible=True)

  if previous:
    previous.update_state(visible=False)
  self.visible_test = test
| 366 | |
def _log_startup_messages(self):
  '''Logs the tail of var/log/messages and mosys and EC console logs.

  Also logs the EC panic info.  Does nothing inside the chroot.  Each of the
  four sources is gathered on a best-effort basis: a failure in one is
  logged with its traceback and does not prevent the others from being
  attempted.
  '''
  # TODO(jsalz): This is mostly a copy-and-paste of code in init_states,
  # for factory-3004.B only.  Consolidate and merge back to ToT.
  if utils.in_chroot():
    return

  # Catch Exception rather than using a bare "except:", so that
  # KeyboardInterrupt and SystemExit are not swallowed and misreported as
  # log-collection failures.
  try:
    var_log_messages = (
      utils.var_log_messages_before_reboot())
    logging.info(
      'Tail of /var/log/messages before last reboot:\n'
      '%s', ('\n'.join(
        ' ' + x for x in var_log_messages)))
  except Exception:  # pylint: disable=W0703
    logging.exception('Unable to grok /var/log/messages')

  try:
    mosys_log = utils.Spawn(
      ['mosys', 'eventlog', 'list'],
      read_stdout=True, log_stderr_on_error=True).stdout_data
    logging.info('System eventlog from mosys:\n%s\n', mosys_log)
  except Exception:  # pylint: disable=W0703
    logging.exception('Unable to read mosys eventlog')

  try:
    board = system.GetBoard()
    ec_console_log = board.GetECConsoleLog()
    logging.info('EC console log after reboot:\n%s\n', ec_console_log)
  except Exception:  # pylint: disable=W0703
    logging.exception('Error retrieving EC console log')

  # The board is fetched again on purpose: a failure above must not stop
  # the panic info from being attempted.
  try:
    board = system.GetBoard()
    ec_panic_info = board.GetECPanicInfo()
    logging.info('EC panic info after reboot:\n%s\n', ec_panic_info)
  except Exception:  # pylint: disable=W0703
    logging.exception('Error retrieving EC panic info')
| 405 | |
def handle_shutdown_complete(self, test, test_state):
  '''
  Handles the case where a shutdown was detected during a shutdown step.

  Increments the step's shutdown count and then either records a final
  result for the step or queues a handler on on_ui_startup that (unless the
  operator cancels) shuts the device down again.

  @param test: The ShutdownStep.
  @param test_state: The test state.  The value passed in is not used: it is
    replaced by the state returned from incrementing the shutdown count.
  '''
  test_state = test.update_state(increment_shutdown_count=1)
  logging.info('Detected shutdown (%d of %d)',
               test_state.shutdown_count, test.iterations)

  def log_and_update_state(status, error_msg, **kw):
    # Records the outcome in the event log and the regular log, then
    # stores it in the test's state.
    self.event_log.Log('rebooted',
                       status=status, error_msg=error_msg, **kw)
    logging.info('Rebooted: status=%s, %s', status,
                 (('error_msg=%s' % error_msg) if error_msg else None))
    test.update_state(status=status, error_msg=error_msg)

  if not self.last_shutdown_time:
    log_and_update_state(status=TestState.FAILED,
                         error_msg='Unable to read shutdown_time')
    return

  now = time.time()
  logging.info('%.03f s passed since reboot',
               now - self.last_shutdown_time)

  if self.last_shutdown_time > now:
    # Go through log_and_update_state like every other outcome, so that
    # this failure also produces a 'rebooted' event and a log line.
    log_and_update_state(status=TestState.FAILED,
                         error_msg='Time moved backward during reboot')
  elif (isinstance(test, factory.RebootStep) and
        self.test_list.options.max_reboot_time_secs and
        (now - self.last_shutdown_time >
         self.test_list.options.max_reboot_time_secs)):
    # A reboot took too long; fail.  (We don't check this for
    # HaltSteps, because the machine could be halted for a
    # very long time, and even unplugged with battery backup,
    # thus hosing the clock.)
    log_and_update_state(
      status=TestState.FAILED,
      error_msg=('More than %d s elapsed during reboot '
                 '(%.03f s, from %s to %s)' % (
                   self.test_list.options.max_reboot_time_secs,
                   now - self.last_shutdown_time,
                   utils.TimeString(self.last_shutdown_time),
                   utils.TimeString(now))),
      duration=(now-self.last_shutdown_time))
    self._log_startup_messages()
  elif test_state.shutdown_count == test.iterations:
    # Good!
    log_and_update_state(status=TestState.PASSED,
                         duration=(now - self.last_shutdown_time),
                         error_msg='')
  elif test_state.shutdown_count > test.iterations:
    # Shut down too many times
    log_and_update_state(status=TestState.FAILED,
                         error_msg='Too many shutdowns')
    self._log_startup_messages()
  elif utils.are_shift_keys_depressed():
    logging.info('Shift keys are depressed; cancelling restarts')
    # Abort shutdown
    log_and_update_state(
      status=TestState.FAILED,
      error_msg='Shutdown aborted with double shift keys')
    self.cancel_pending_tests()
  else:
    # More iterations remain: defer the next shutdown to a handler queued
    # on on_ui_startup, which first offers the operator a chance to cancel.
    def handler():
      if self._prompt_cancel_shutdown(
          test, test_state.shutdown_count + 1):
        factory.console.info('Shutdown aborted by operator')
        log_and_update_state(
          status=TestState.FAILED,
          error_msg='Shutdown aborted by operator')
        self.cancel_pending_tests()
        return

      # Time to shutdown again
      log_and_update_state(
        status=TestState.ACTIVE,
        error_msg='',
        iteration=test_state.shutdown_count)

      self.event_log.Log('shutdown', operation='reboot')
      # Saved as shared data under 'shutdown_time' before shutting down.
      self.state_instance.set_shared_data('shutdown_time',
                                          time.time())
      self.env.shutdown('reboot')

    self.on_ui_startup.append(handler)
Hung-Te Lin | f2f78f7 | 2012-02-08 19:27:11 +0800 | [diff] [blame] | 494 | |
def _prompt_cancel_shutdown(self, test, iteration):
  '''Announces a pending shutdown and waits to see if it gets cancelled.

  Posts a PENDING_SHUTDOWN event describing the shutdown and then waits up
  to test.delay_secs for a CANCEL_SHUTDOWN event.  If one arrives, a bare
  PENDING_SHUTDOWN event (with no data) is posted afterwards.

  Args:
    test: The shutdown step; its delay_secs, operation and iterations
      attributes are read.
    iteration: The iteration number reported in the event.

  Returns:
    True if the shutdown was cancelled.  Always False when the UI option is
    not 'chrome'.
  '''
  if self.options.ui != 'chrome':
    return False

  delay_secs = test.delay_secs
  pending_shutdown_data = dict(
    delay_secs=delay_secs,
    time=time.time() + delay_secs,
    operation=test.operation,
    iteration=iteration,
    iterations=test.iterations)

  def is_cancel(event):
    return event.type == Event.Type.CANCEL_SHUTDOWN

  # Create a new (threaded) event client since we
  # don't want to use the event loop for this.
  with EventClient() as event_client:
    event_client.post_event(Event(Event.Type.PENDING_SHUTDOWN,
                                  **pending_shutdown_data))
    cancel_event = event_client.wait(is_cancel, timeout=delay_secs)
    if cancel_event is None:
      return False
    event_client.post_event(Event(Event.Type.PENDING_SHUTDOWN))
    return True
Jon Salz | 258a40c | 2012-04-19 12:34:01 +0800 | [diff] [blame] | 518 | |
def init_states(self):
    '''
    Brings all test states up to date on startup.

    Every test is registered with the state server.  Leaf tests that are
    still marked ACTIVE are then resolved: a shutdown step is handed to
    handle_shutdown_complete(); any other test is logged and marked FAILED
    because the shutdown was unexpected.  Finally the skip flags are
    refreshed through update_skipped_tests().
    '''
    # Make sure the state server knows about all the tests, defaulting to
    # an untested state.
    for test in self.test_list.get_all_tests():
        test.update_state(update_parent=False, visible=False)

    # Diagnostics are fetched lazily, the first time an interrupted test
    # is found; None means "not fetched yet".
    var_log_messages = None
    mosys_log = None
    ec_console_log = None
    ec_panic_info = None

    for test in self.test_list.walk():
        # Parents are not handled here; they are updated when their
        # children are updated.
        if not test.is_leaf():
            continue

        test_state = test.get_state()
        if test_state.status != TestState.ACTIVE:
            continue

        if isinstance(test, factory.ShutdownStep):
            # Shutdown while a shutdown step was active - that's good.
            self.handle_shutdown_complete(test, test_state)
            continue

        # Unexpected shutdown.  Grab /var/log/messages for context.
        if var_log_messages is None:
            try:
                var_log_messages = utils.var_log_messages_before_reboot()
                # Also written to our own log, to make it easier to
                # correlate with /var/log/messages.
                indented = '\n'.join(' ' + x for x in var_log_messages)
                logging.info(
                    'Unexpected shutdown. '
                    'Tail of /var/log/messages before last reboot:\n'
                    '%s', indented)
            except:  # pylint: disable=W0702
                logging.exception('Unable to grok /var/log/messages')
                var_log_messages = []

        if mosys_log is None and not utils.in_chroot():
            try:
                mosys = utils.Spawn(
                    ['mosys', 'eventlog', 'list'],
                    read_stdout=True, log_stderr_on_error=True)
                mosys_log = mosys.stdout_data
                # Write it to the log also.
                logging.info('System eventlog from mosys:\n%s\n', mosys_log)
            except:  # pylint: disable=W0702
                logging.exception('Unable to read mosys eventlog')

        if ec_console_log is None:
            try:
                ec_console_log = system.GetBoard().GetECConsoleLog()
                logging.info('EC console log after reboot:\n%s\n',
                             ec_console_log)
            except:  # pylint: disable=W0702
                logging.exception('Error retrieving EC console log')

        if ec_panic_info is None:
            try:
                ec_panic_info = system.GetBoard().GetECPanicInfo()
                logging.info('EC panic info after reboot:\n%s\n',
                             ec_panic_info)
            except:  # pylint: disable=W0702
                logging.exception('Error retrieving EC panic info')

        error_msg = 'Unexpected shutdown while test was running'
        self.event_log.Log(
            'end_test',
            path=test.path,
            status=TestState.FAILED,
            invocation=test.get_state().invocation,
            error_msg=error_msg,
            var_log_messages='\n'.join(var_log_messages),
            mosys_log=mosys_log)
        test.update_state(status=TestState.FAILED, error_msg=error_msg)

        # For "never_fails" tests (such as "Start"), pending tests are not
        # cancelled, since reboot is expected.
        if not test.never_fails:
            factory.console.info('Unexpected shutdown while test %s '
                                 'running; cancelling any pending tests',
                                 test.path)
            self.state_instance.set_shared_data('tests_after_shutdown', [])

    self.update_skipped_tests()
| 610 | |
def update_skipped_tests(self):
    '''
    Recomputes the skip flag of every leaf test that has a run_if table.

    The flag is derived from the shopfloor aux data column named by the
    test's run_if_col, combined with run_if_not.  A test that was earlier
    recorded as skipped (PASSED with the SKIPPED_MSG error message) but
    should now run is reset to UNTESTED.
    '''
    for t in self.test_list.walk():
        if not (t.is_leaf() and t.run_if_table_name):
            continue

        skip = False
        try:
            aux = shopfloor.get_selected_aux_data(t.run_if_table_name)
            value = aux.get(t.run_if_col)
            if value is not None:
                skip = (not value) ^ t.run_if_not
        except ValueError:
            # Not available; assume it shouldn't be skipped
            pass

        test_state = t.get_state()
        # True when it was marked as skipped before, but now needs to run.
        needs_run = (not skip and
                     test_state.status == TestState.PASSED and
                     test_state.error_msg == TestState.SKIPPED_MSG)

        changes = {'skip': skip}
        if needs_run:
            changes.update(status=TestState.UNTESTED, error_msg='')
        t.update_state(**changes)
| 636 | |
def show_next_active_test(self):
    '''
    Makes the active leaf test after the currently visible one visible.

    Wraps around at the end of the list of active tests; if the visible
    test is not among them, the first active test is chosen.  Does nothing
    when no leaf test is active.
    '''
    self.reap_completed_tests()

    active_tests = []
    for t in self.test_list.walk():
        if t.is_leaf() and t.get_state().status == TestState.ACTIVE:
            active_tests.append(t)
    if not active_tests:
        return

    if self.visible_test in active_tests:
        following = active_tests.index(self.visible_test) + 1
        next_test = active_tests[following % len(active_tests)]
    else:
        # visible_test not present in active_tests
        next_test = active_tests[0]

    self.set_visible_test(next_test)
Jon Salz | 4f6c717 | 2012-06-11 20:45:36 +0800 | [diff] [blame] | 655 | |
def handle_event(self, event):
    '''
    Dispatches an event to the handler registered for its type.

    Args:
      event: The event; event.type is looked up in self.event_handlers.
    '''
    handler = self.event_handlers.get(event.type)
    if not handler:
        # Handlers are not registered for all event types - such events
        # are just ignored.
        logging.debug('Unbound event type %s', event.type)
        return
    handler(event)
Jon Salz | 4f6c717 | 2012-06-11 20:45:36 +0800 | [diff] [blame] | 667 | |
def check_critical_factory_note(self):
    '''
    Tells whether the last factory note is critical.

    Returns:
      True if the 'factory_note' shared data holds at least one note and
      the level of the last one is 'CRITICAL'; False otherwise (including
      when there are no notes at all).
    '''
    # The second argument is presumably the "optional" flag, as in the
    # other get_shared_data() calls in this file -- TODO confirm.
    notes = self.state_instance.get_shared_data('factory_note', True)
    # bool() keeps the documented contract: without it a missing or empty
    # note list would be returned as-is (None or []) rather than False.
    return bool(notes) and notes[-1]['level'] == 'CRITICAL'
| 674 | |
def run_next_test(self):
    '''
    Starts the next eligible test (or tests) in self.tests_to_run.

    Tests are taken from the front of the queue until the queue is empty
    or the front test has to wait.  A critical factory note empties the
    queue instead.  Shutdown steps are carried out here directly; all
    other tests are started through _run_test().
    '''
    self.reap_completed_tests()

    if self.tests_to_run and self.check_critical_factory_note():
        self.tests_to_run.clear()
        return

    while self.tests_to_run:
        logging.debug('Tests to run: %s',
                      [x.path for x in self.tests_to_run])

        test = self.tests_to_run[0]

        if test in self.invocations:
            logging.info('Next test %s is already running', test.path)
            self.tests_to_run.popleft()
            return

        # Hold off while anything under a required test is still active.
        for requirement in test.require_run:
            for dep in requirement.test.walk():
                if dep.get_state().status == TestState.ACTIVE:
                    logging.info('Waiting for active test %s to complete '
                                 'before running %s', dep.path, test.path)
                    return

        # Tests only run side by side when the new test and all running
        # ones are backgroundable.
        if self.invocations:
            all_backgroundable = test.backgroundable and all(
                [x.backgroundable for x in self.invocations])
            if not all_backgroundable:
                logging.debug('Waiting for non-backgroundable tests to '
                              'complete before running %s', test.path)
                return

        if test.get_state().skip:
            factory.console.info('Skipping test %s', test.path)
            test.update_state(status=TestState.PASSED,
                              error_msg=TestState.SKIPPED_MSG)
            self.tests_to_run.popleft()
            continue

        self.tests_to_run.popleft()

        # Collect, per require_run element, the first test that blocks us.
        untested = set()
        for requirement in test.require_run:
            for dep in requirement.test.walk():
                if dep == test:
                    # We've hit this test itself; stop checking
                    break
                if ((dep.get_state().status == TestState.UNTESTED) or
                        (requirement.passed and
                         dep.get_state().status != TestState.PASSED)):
                    # Found a blocking test; move on to the next element
                    # in require_run.
                    untested.add(dep)
                    break

        if untested:
            untested_paths = ', '.join(sorted([x.path for x in untested]))
            if self.state_instance.get_shared_data('engineering_mode',
                                                   optional=True):
                # In engineering mode, we'll let it go.
                factory.console.warn('In engineering mode; running '
                                     '%s even though required tests '
                                     '[%s] have not completed',
                                     test.path, untested_paths)
            else:
                # Not in engineering mode; mark it failed.
                error_msg = ('Required tests [%s] have not been run yet'
                             % untested_paths)
                factory.console.error('Not running %s: %s',
                                      test.path, error_msg)
                test.update_state(status=TestState.FAILED,
                                  error_msg=error_msg)
                continue

        if isinstance(test, factory.ShutdownStep):
            if os.path.exists(NO_REBOOT_FILE):
                test.update_state(
                    status=TestState.FAILED, increment_count=1,
                    error_msg=('Skipped shutdown since %s is present' %
                               NO_REBOOT_FILE))
                continue

            test.update_state(status=TestState.ACTIVE, increment_count=1,
                              error_msg='', shutdown_count=0)
            if self._prompt_cancel_shutdown(test, 1):
                self.event_log.Log('reboot_cancelled')
                test.update_state(
                    status=TestState.FAILED, increment_count=1,
                    error_msg='Shutdown aborted by operator',
                    shutdown_count=0)
                continue

            # Save pending test list in the state server
            pending_paths = [t.path for t in self.tests_to_run]
            self.state_instance.set_shared_data('tests_after_shutdown',
                                                pending_paths)
            # Save shutdown time
            self.state_instance.set_shared_data('shutdown_time',
                                                time.time())

            with self.env.lock:
                self.event_log.Log('shutdown', operation=test.operation)
                shutdown_result = self.env.shutdown(test.operation)

            if shutdown_result:
                # That's all, folks!
                self.run_queue.put(None)
                return

            # Shutdown did not happen (e.g., in the chroot); just pass.
            test.update_state(status=TestState.PASSED)
            self.state_instance.set_shared_data('tests_after_shutdown',
                                                None)
            # Send event with no fields to indicate that there is no
            # longer a pending shutdown.
            self.event_client.post_event(
                Event(Event.Type.PENDING_SHUTDOWN))
            continue

        self._run_test(test, test.iterations, test.retries)
Jon Salz | 1acc874 | 2012-07-17 17:45:55 +0800 | [diff] [blame] | 794 | |
def _run_test(self, test, iterations_left=None, retries_left=None):
    '''
    Creates and starts an invocation of a single test.

    Args:
      test: The test to run.
      iterations_left: Passed on to test.update_state() unchanged.
      retries_left: Passed on to test.update_state() unchanged.
    '''
    invoc = TestInvocation(self, test, on_completion=self.run_next_test)

    state_changes = dict(
        status=TestState.ACTIVE,
        increment_count=1,
        error_msg='',
        invocation=invoc.uuid,
        iterations_left=iterations_left,
        retries_left=retries_left,
        visible=(self.visible_test == test))
    new_state = test.update_state(**state_changes)
    invoc.count = new_state.count

    self.invocations[test] = invoc
    # With nothing visible yet, a test that has a UI takes the display.
    if self.visible_test is None and test.has_ui:
        self.set_visible_test(test)
    self.check_exclusive()
    invoc.start()
Jon Salz | 5f2a067 | 2012-05-22 17:14:06 +0800 | [diff] [blame] | 809 | |
def check_exclusive(self):
    '''
    Applies the exclusive-resource requests of the running tests.

    Compares the exclusive items claimed by the tests in self.invocations
    with self.exclusive_items from the previous call, disables or
    re-enables networking on a change, enables or disables the cpufreq
    manager, adjusts the charge state unless the charger is claimed, and
    stores the new set in self.exclusive_items.
    '''
    # alias since this is really long
    EXCL_OPT = factory.FactoryTest.EXCLUSIVE_OPTIONS

    current_exclusive_items = set()
    for item in EXCL_OPT:
        claims = [test.is_exclusive(item) for test in self.invocations]
        if any(claims):
            current_exclusive_items.add(item)

    # Items claimed now that were not claimed before.
    newly_claimed = current_exclusive_items - self.exclusive_items
    if EXCL_OPT.NETWORKING in newly_claimed:
        logging.info('Disabling network')
        self.connection_manager.DisableNetworking()
    if EXCL_OPT.CHARGER in newly_claimed:
        logging.info('Stop controlling charger')

    # Items claimed before that are no longer claimed.
    newly_released = self.exclusive_items - current_exclusive_items
    if EXCL_OPT.NETWORKING in newly_released:
        logging.info('Re-enabling network')
        self.connection_manager.EnableNetworking()
    if EXCL_OPT.CHARGER in newly_released:
        logging.info('Start controlling charger')

    if self.cpufreq_manager:
        enabled = EXCL_OPT.CPUFREQ not in current_exclusive_items
        try:
            self.cpufreq_manager.SetEnabled(enabled)
        except:  # pylint: disable=W0702
            logging.exception('Unable to %s cpufreq services',
                              'enable' if enabled else 'disable')

    # Only adjust charge state if not excluded
    charger_free = EXCL_OPT.CHARGER not in current_exclusive_items
    if charger_free and not utils.in_chroot():
        if self.charge_manager:
            self.charge_manager.AdjustChargeState()
        else:
            try:
                board = system.GetBoard()
                board.SetChargeState(Board.ChargeState.CHARGE)
            except BoardException:
                logging.exception(
                    'Unable to set charge state on this board')

    self.exclusive_items = current_exclusive_items
Jon Salz | 5da61e6 | 2012-05-31 13:06:22 +0800 | [diff] [blame] | 852 | |
def check_for_updates(self):
    '''
    Schedules an asynchronous check for updates if one is due.

    Nothing happens when update_period_secs is unset in the test list
    options, or when less than that many seconds have passed since
    self.last_update_check.
    '''
    options = self.test_list.options
    if not options.update_period_secs:
        # Not enabled.
        return

    now = time.time()
    last_check = self.last_update_check
    if last_check and now - last_check < options.update_period_secs:
        # Not yet time for another check.
        return

    self.last_update_check = now

    def handle_check_for_update(reached_shopfloor, md5sum, needs_update):
        if not reached_shopfloor:
            return
        new_update_md5sum = md5sum if needs_update else None
        if system.SystemInfo.update_md5sum == new_update_md5sum:
            return
        logging.info('Received new update MD5SUM: %s', new_update_md5sum)
        system.SystemInfo.update_md5sum = new_update_md5sum
        # Queue a system info refresh on the run queue.
        self.run_queue.put(self.update_system_info)

    updater.CheckForUpdateAsync(
        handle_check_for_update,
        self.test_list.options.shopfloor_timeout_secs)
| 881 | |
def cancel_pending_tests(self):
    '''Cancels any queued tests by asking run_tests() to run nothing.'''
    nothing_to_run = []
    self.run_tests(nothing_to_run)
| 885 | |
def run_tests(self, subtrees, untested_only=False):
    '''
    Queues the leaf tests under the given subtree(s) and starts running.

    self.tests_to_run is replaced by a new queue holding the leaf tests
    found by walking each subtree, in walk order; run_next_test() is then
    called to start them.

    @param subtrees: Node or nodes containing tests to run (may either be
      a single test or a list).  Duplicates will be ignored.
    @param untested_only: If True, only tests whose status is UNTESTED are
      queued.
    '''
    # isinstance() rather than an exact type comparison, so that list
    # subclasses are treated as a list of nodes and not as a single node.
    if not isinstance(subtrees, list):
        subtrees = [subtrees]

    # Nodes we've seen so far, to avoid duplicates.
    seen = set()

    self.tests_to_run = deque()
    for subtree in subtrees:
        for test in subtree.walk():
            if test in seen:
                continue
            seen.add(test)

            if not test.is_leaf():
                continue
            if (untested_only and
                    test.get_state().status != TestState.UNTESTED):
                continue
            self.tests_to_run.append(test)
    self.run_next_test()
Hung-Te Lin | f2f78f7 | 2012-02-08 19:27:11 +0800 | [diff] [blame] | 917 | |
def reap_completed_tests(self):
    '''
    Removes completed tests from the set of active tests.

    Each completed invocation has its final state written back and is
    dropped from self.invocations.  A test is started again when it passed
    with iterations left, or failed with retries left.  With the
    stop_on_failure option set, a failure empties the run queue.

    Also updates the visible test if it was reaped.
    '''
    test_completed = False
    # Iterate over a snapshot: entries are deleted below, and _run_test()
    # puts re-run tests back into self.invocations.
    for t, v in list(self.invocations.items()):
        if not v.is_completed():
            continue

        test_completed = True
        new_state = t.update_state(**v.update_state_on_completion)
        del self.invocations[t]

        # Stop on failure if flag is true.
        if (self.test_list.options.stop_on_failure and
                new_state.status == TestState.FAILED):
            # Clean all the tests to cause goofy to stop.  The queue stays
            # a deque, since other methods call popleft()/clear() on it.
            self.tests_to_run = deque()
            factory.console.info("Stop on failure triggered. Empty the queue.")

        if new_state.iterations_left and new_state.status == TestState.PASSED:
            # Play it again, Sam!
            self._run_test(t)
        # new_state.retries_left is obtained after update.
        # For retries_left == 0, test can still be run for the last time.
        # A retries_left of None is treated as "no retries".
        elif (new_state.retries_left is not None and
              new_state.retries_left >= 0 and
              new_state.status == TestState.FAILED):
            # Still have to retry, Sam!
            self._run_test(t)

    if test_completed:
        self.log_watcher.KickWatchThread()

    if (self.visible_test is None or
            self.visible_test not in self.invocations):
        self.set_visible_test(None)
        # Make the first running test, if any, the visible test
        for t in self.test_list.walk():
            if t in self.invocations:
                self.set_visible_test(t)
                break
| 959 | |
def kill_active_tests(self, abort, root=None, reason=None):
    '''
    Kills and waits for all active tests.

    Args:
      abort: True to leave killed tests in the state recorded by their
        invocation, False to reset them to UNTESTED afterwards.
      root: If set, only kills tests with root as an ancestor.
      reason: Passed to each invocation's abort_and_join().
    '''
    self.reap_completed_tests()

    for test, invoc in list(self.invocations.items()):
        in_scope = not root or test.has_ancestor(root)
        if not in_scope:
            continue

        factory.console.info('Killing active test %s...' % test.path)
        invoc.abort_and_join(reason)
        factory.console.info('Killed %s' % test.path)

        final_state = invoc.update_state_on_completion
        test.update_state(**final_state)
        del self.invocations[test]

        if not abort:
            test.update_state(status=TestState.UNTESTED)

    self.reap_completed_tests()
| 983 | |
def stop(self, root=None, fail=False, reason=None):
    '''
    Stops active and queued tests, then resumes with what is left.

    Args:
      root: If set, only tests with root as an ancestor are stopped;
        otherwise everything is stopped and the run queue is emptied.
      fail: Passed to kill_active_tests() as its abort argument.
      reason: Passed to kill_active_tests().
    '''
    self.kill_active_tests(fail, root, reason)

    # Remove any tests in the run queue under the root.
    remaining = deque()
    for queued in self.tests_to_run:
        if root and not queued.has_ancestor(root):
            remaining.append(queued)
    self.tests_to_run = remaining

    self.run_next_test()
Jon Salz | 0697cbf | 2012-07-04 15:14:04 +0800 | [diff] [blame] | 990 | |
def clear_state(self, root=None):
    '''
    Stops tests and resets leaf tests to UNTESTED.

    Args:
      root: Subtree to clear.  If None (the default), everything is
        stopped and the whole of self.test_list is cleared.
    '''
    self.stop(root, reason='Clearing test state')
    # Without this fallback the default root=None would fail on
    # None.walk().
    subtree = self.test_list if root is None else root
    for f in subtree.walk():
        if f.is_leaf():
            f.update_state(status=TestState.UNTESTED)
| 996 | |
def abort_active_tests(self, reason=None):
    '''
    Kills all active tests, with the abort flag set.

    Args:
      reason: Passed on to kill_active_tests().
    '''
    abort = True
    self.kill_active_tests(abort, reason=reason)
Jon Salz | 0697cbf | 2012-07-04 15:14:04 +0800 | [diff] [blame] | 999 | |
def main(self):
    '''
    Initializes goofy and then runs it.

    The outcome of init() is recorded in the event log as 'goofy_init'.
    An exception during initialization is re-raised after a best-effort
    attempt to log it.
    '''
    syslog.openlog('goofy')

    try:
        self.init()
        self.event_log.Log('goofy_init', success=True)
    except:
        # The event log may not exist if init() failed early, and logging
        # the failure must never hide the failure itself.
        if self.event_log:
            try:
                self.event_log.Log(
                    'goofy_init',
                    success=False,
                    trace=traceback.format_exc())
            except:  # pylint: disable=W0702
                pass
        raise

    syslog.syslog('Goofy (factory test harness) starting')
    self.run()
| 1019 | |
def update_system_info(self):
    '''
    Publishes a fresh snapshot of the system info.

    The attribute dict of a new system.SystemInfo object is stored as the
    'system_info' shared data, posted in a SYSTEM_INFO event and logged.
    '''
    info = system.SystemInfo().__dict__
    self.state_instance.set_shared_data('system_info', info)
    self.event_client.post_event(
        Event(Event.Type.SYSTEM_INFO, system_info=info))
    logging.info('System info: %r', info)
| 1027 | |
def update_factory(self, auto_run_on_restart=False, post_update_hook=None):
    '''Commences updating factory software.

    Active tests are killed (and reset to untested) and pending tests are
    cancelled before the update is attempted.

    Args:
      auto_run_on_restart: Auto-run when the machine comes back up.
      post_update_hook: Code to call after update but immediately before
        restart.

    Returns:
      Never if the update was successful (we just reboot).
      False if the update was unnecessary (no update available).
    '''
    self.kill_active_tests(False, reason='Factory software update')
    self.cancel_pending_tests()

    def pre_update_hook():
        if auto_run_on_restart:
            self.state_instance.set_shared_data('tests_after_shutdown',
                                                FORCE_AUTO_RUN)
        self.state_instance.close()

    if not updater.TryUpdate(pre_update_hook=pre_update_hook):
        # Return False explicitly, as documented, instead of falling off
        # the end of the function with None.
        return False

    if post_update_hook:
        post_update_hook()
    self.env.shutdown('reboot')
Jon Salz | 0697cbf | 2012-07-04 15:14:04 +0800 | [diff] [blame] | 1053 | |
def handle_sigint(self, dummy_signum, dummy_frame):
    '''
    Handles SIGINT: queues None on the run queue and interrupts.

    Args:
      dummy_signum: Unused.
      dummy_frame: Unused.

    Raises:
      KeyboardInterrupt: always.
    '''
    logging.error('Received SIGINT')
    # None on the run queue is also what run_next_test() posts once a
    # shutdown is under way.
    self.run_queue.put(None)
    raise KeyboardInterrupt
| 1058 | |
def find_kcrashes(self):
    """Finds kcrash files, logs them, and marks them as seen.

    Regular files in /var/spool/crash that are not yet listed in the
    'seen_crashes' shared data are logged, both to the log and to the
    event log.  The contents of .kcrash and .meta files are logged as
    well (up to MAX_CRASH_FILE_SIZE) and those files are copied to the
    factory 'kcrash' directory.
    """
    previously_seen = self.state_instance.get_shared_data(
        'seen_crashes', optional=True)
    seen_crashes = set(previously_seen or [])

    for path in glob.glob('/var/spool/crash/*'):
        if not os.path.isfile(path) or path in seen_crashes:
            continue

        try:
            stat = os.stat(path)
            mtime = utils.TimeString(stat.st_mtime)
            logging.info(
                'Found new crash file %s (%d bytes at %s)',
                path, stat.st_size, mtime)
            extra_log_args = {}

            try:
                ext = os.path.splitext(path)[1]
                if ext in ['.kcrash', '.meta']:
                    ext = ext.replace('.', '')
                    with open(path) as f:
                        data = f.read(MAX_CRASH_FILE_SIZE)
                        tell = f.tell()

                    if tell == stat.st_size:
                        truncation_note = ''
                    else:
                        truncation_note = ('(truncated to %d bytes)' %
                                           MAX_CRASH_FILE_SIZE)
                    # Every line of the dump gets an "<ext>> " prefix.
                    prefixed = ('\n' + data).replace(
                        '\n', '\n ' + ext + '> ')
                    logging.info('Contents of %s%s:%s',
                                 path, truncation_note, prefixed)
                    extra_log_args['data'] = data

                    # Copy to /var/factory/kcrash for posterity
                    kcrash_dir = factory.get_factory_root('kcrash')
                    utils.TryMakeDirs(kcrash_dir)
                    shutil.copy(path, kcrash_dir)
                    copied_to = os.path.join(kcrash_dir,
                                             os.path.basename(path))
                    logging.info('Copied to %s', copied_to)
            finally:
                # Even if something goes wrong with the above, still try
                # to log to event log
                self.event_log.Log('crash_file',
                                   path=path, size=stat.st_size,
                                   mtime=mtime, **extra_log_args)
        except:  # pylint: disable=W0702
            logging.exception('Unable to handle crash files %s', path)
        seen_crashes.add(path)

    self.state_instance.set_shared_data('seen_crashes', list(seen_crashes))
| 1110 | |
def GetTestList(self, test_list_id):
  """Looks up a test list by its ID.

  Args:
    test_list_id: Key into self.test_lists.

  Returns:
    The entry of self.test_lists stored under test_list_id.

  Raises:
    TestListError: The test list ID is not valid.
  """
  try:
    found = self.test_lists[test_list_id]
  except KeyError:
    # List the known IDs in the message to help spot typos.
    available_ids = ', '.join(sorted(self.test_lists.keys()))
    raise test_lists.TestListError(
        '%r is not a valid test list ID (available IDs are [%s])' % (
            test_list_id, available_ids))
  return found
| 1123 | |
def InitTestLists(self):
  """Builds all test lists and selects the active one as self.test_list.

  The test list named by self.options.test_list is used; when that option
  is empty it is first filled in from test_lists.GetActiveTestListId().  A
  value containing a path separator is read as an old-style test list
  file; anything else is looked up by ID.
  """
  self.test_lists = test_lists.BuildAllTestLists()

  requested = self.options.test_list
  if not requested:
    requested = test_lists.GetActiveTestListId()
    self.options.test_list = requested

  if os.sep not in requested:
    self.test_list = self.GetTestList(requested)
  else:
    # It's a path pointing to an old-style test list; use it.
    self.test_list = factory.read_test_list(requested)

  logging.info('Active test list: %s', self.test_list.test_list_id)

  if isinstance(self.test_list, test_lists.OldStyleTestList):
    # Actually load it in.  (See OldStyleTestList for an explanation
    # of why this is necessary.)
    self.test_list = self.test_list.Load()

  self.test_list.state_instance = self.state_instance
| 1145 | |
def init(self, args=None, env=None):
  '''Initializes Goofy.

  In order: installs the SIGINT handler, parses command-line options,
  sets up logging and the event log, chooses the test environment, starts
  the state server, loads the test lists, starts the optional helpers
  selected by the test list options, runs the startup hook, brings up the
  UI, and finally queues any tests that should run.

  Args:
    args: A list of command-line arguments.  Uses sys.argv if
      args is None.
    env: An Environment instance to use (or None to choose
      FakeChrootEnvironment or DUTEnvironment as appropriate).
  '''
  signal.signal(signal.SIGINT, self.handle_sigint)

  parser = OptionParser()
  parser.add_option('-v', '--verbose', dest='verbose',
                    action='store_true',
                    help='Enable debug logging')
  parser.add_option('--print_test_list', dest='print_test_list',
                    metavar='FILE',
                    help='Read and print test list FILE, and exit')
  parser.add_option('--restart', dest='restart',
                    action='store_true',
                    help='Clear all test state')
  parser.add_option('--ui', dest='ui', type='choice',
                    choices=['none', 'gtk', 'chrome'],
                    default='chrome',
                    help='UI to use')
  parser.add_option('--ui_scale_factor', dest='ui_scale_factor',
                    type='int', default=1,
                    help=('Factor by which to scale UI '
                          '(Chrome UI only)'))
  parser.add_option('--test_list', dest='test_list',
                    metavar='FILE',
                    help='Use FILE as test list')
  parser.add_option('--dummy_shopfloor', action='store_true',
                    help='Use a dummy shopfloor server')
  parser.add_option('--automation', dest='automation',
                    action='store_true',
                    help='Enable automation on running factory test')
  parser.add_option('--one_pixel_less', dest='one_pixel_less',
                    action='store_true',
                    help=('Start Chrome one pixel less than the full screen.'
                          'Needed by Exynos platform to run GTK.'))
  (self.options, self.args) = parser.parse_args(args)

  # Make sure factory directories exist.
  factory.get_log_root()
  factory.get_state_root()
  factory.get_test_data_root()

  # Logging is initialized at most once per process, tracked by a
  # module-level flag.
  global _inited_logging  # pylint: disable=W0603
  if not _inited_logging:
    factory.init_logging('goofy', verbose=self.options.verbose)
    _inited_logging = True

  # --print_test_list: dump the given test list and exit without starting up.
  if self.options.print_test_list:
    print factory.read_test_list(
        self.options.print_test_list).__repr__(recursive=True)
    sys.exit(0)

  event_log.IncrementBootSequence()
  # Don't defer logging the initial event, so we can make sure
  # that device_id, reimage_id, etc. are all set up.
  self.event_log = EventLog('goofy', defer=False)

  if (not suppress_chroot_warning and
      factory.in_chroot() and
      self.options.ui == 'gtk' and
      os.environ.get('DISPLAY') in [None, '', ':0', ':0.0']):
    # That's not going to work!  Tell the user how to run
    # this way.
    logging.warn(GOOFY_IN_CHROOT_WARNING)
    time.sleep(1)

  # An explicitly passed environment wins; otherwise choose by whether we
  # are running in the chroot.
  if env:
    self.env = env
  elif factory.in_chroot():
    self.env = test_environment.FakeChrootEnvironment()
    logging.warn(
        'Using chroot environment: will not actually run autotests')
  else:
    self.env = test_environment.DUTEnvironment()
  self.env.goofy = self

  if self.options.restart:
    state.clear_state()

  if self.options.ui_scale_factor != 1 and utils.in_qemu():
    logging.warn(
        'In QEMU; ignoring ui_scale_factor argument')
    self.options.ui_scale_factor = 1

  logging.info('Started')

  self.start_state_server()
  self.state_instance.set_shared_data('hwid_cfg', get_hwid_cfg())
  self.state_instance.set_shared_data('ui_scale_factor',
                                      self.options.ui_scale_factor)
  self.state_instance.set_shared_data('one_pixel_less',
                                      self.options.one_pixel_less)
  # Remember the recorded shutdown time (if any), then clear it along with
  # any startup error left in shared data.
  self.last_shutdown_time = (
      self.state_instance.get_shared_data('shutdown_time', optional=True))
  self.state_instance.del_shared_data('shutdown_time', optional=True)
  self.state_instance.del_shared_data('startup_error', optional=True)

  try:
    self.InitTestLists()
  except:  # pylint: disable=W0702
    logging.exception('Unable to initialize test lists')
    # Record the failure in shared data under 'startup_error'.
    self.state_instance.set_shared_data(
        'startup_error',
        'Unable to initialize test lists\n%s' % (
            traceback.format_exc()))
    if self.options.ui == 'chrome':
      # Create an empty test list with default options so that the rest of
      # startup can proceed.
      self.test_list = factory.FactoryTestList(
          [], self.state_instance, factory.Options())
    else:
      # Bail with an error; no point in starting up.
      sys.exit('No valid test list; exiting.')

  if self.test_list.options.clear_state_on_start:
    self.state_instance.clear_test_state()

  # A missing firmware version outside the chroot is reported as netboot
  # firmware.  Note that this overwrites any 'startup_error' set above.
  if system.SystemInfo().firmware_version is None and not utils.in_chroot():
    self.state_instance.set_shared_data('startup_error',
        'Netboot firmware detected\n'
        'Connect Ethernet and reboot to re-image.\n'
        u'侦测到网路开机固件\n'
        u'请连接乙太网并重启')

  # Only seed ui_lang from the test list if shared data has no value yet.
  if not self.state_instance.has_shared_data('ui_lang'):
    self.state_instance.set_shared_data('ui_lang',
                                        self.test_list.options.ui_lang)
  self.state_instance.set_shared_data(
      'test_list_options',
      self.test_list.options.__dict__)
  self.state_instance.test_list = self.test_list

  if not utils.in_chroot() and self.test_list.options.disable_log_rotation:
    # Create (or truncate) the marker file; presumably the log cleanup job
    # checks for it -- TODO confirm.
    open('/var/lib/cleanup_logs_paused', 'w').close()

  if self.options.dummy_shopfloor:
    # Point the shopfloor environment variable at localhost and spawn a
    # dummy shopfloor server.
    os.environ[shopfloor.SHOPFLOOR_SERVER_ENV_VAR_NAME] = (
        'http://localhost:%d/' % shopfloor.DEFAULT_SERVER_PORT)
    self.dummy_shopfloor = Spawn(
        [os.path.join(factory.FACTORY_PATH, 'bin', 'shopfloor_server'),
         '--dummy'])
  elif self.test_list.options.shopfloor_server_url:
    shopfloor.set_server_url(self.test_list.options.shopfloor_server_url)
    shopfloor.set_enabled(True)

  if self.test_list.options.time_sanitizer and not utils.in_chroot():
    self.time_sanitizer = time_sanitizer.TimeSanitizer(
        base_time=time_sanitizer.GetBaseTimeFromFile(
            # lsb-factory is written by the factory install shim during
            # installation, so it should have a good time obtained from
            # the mini-Omaha server.  If it's not available, we'll use
            # /etc/lsb-release (which will be much older, but reasonably
            # sane) and rely on a shopfloor sync to set a more accurate
            # time.
            '/usr/local/etc/lsb-factory',
            '/etc/lsb-release'))
    self.time_sanitizer.RunOnce()

  if self.test_list.options.check_cpu_usage_period_secs:
    # Run the CPU usage monitor as a separate process, with the factory
    # path as its working directory.
    self.cpu_usage_watcher = Spawn(['py/tools/cpu_usage_monitor.py',
        '-p', str(self.test_list.options.check_cpu_usage_period_secs)],
        cwd=factory.FACTORY_PATH)

  self.init_states()
  self.start_event_server()
  self.connection_manager = self.env.create_connection_manager(
      self.test_list.options.wlans,
      self.test_list.options.scan_wifi_period_secs)
  # Note that we create a log watcher even if
  # sync_event_log_period_secs isn't set (no background
  # syncing), since we may use it to flush event logs as well.
  self.log_watcher = EventLogWatcher(
      self.test_list.options.sync_event_log_period_secs,
      event_log_db_file=None,
      handle_event_logs_callback=self.handle_event_logs)
  if self.test_list.options.sync_event_log_period_secs:
    self.log_watcher.StartWatchThread()

  # The system log manager (and its sync thread) is only created when
  # enable_sync_log is set in the test list options.
  if self.test_list.options.enable_sync_log:
    self.system_log_manager = SystemLogManager(
        sync_log_paths=self.test_list.options.sync_log_paths,
        sync_period_sec=self.test_list.options.sync_log_period_secs,
        clear_log_paths=self.test_list.options.clear_log_paths)
    self.system_log_manager.StartSyncThread()

  self.update_system_info()

  # min_charge_pct and max_charge_pct must be either both set or both unset.
  assert ((self.test_list.options.min_charge_pct is None) ==
          (self.test_list.options.max_charge_pct is None))
  if utils.in_chroot():
    logging.info('In chroot, ignoring charge manager and charge state')
  elif self.test_list.options.min_charge_pct is not None:
    self.charge_manager = ChargeManager(self.test_list.options.min_charge_pct,
                                        self.test_list.options.max_charge_pct)
    system.SystemStatus.charge_manager = self.charge_manager
  else:
    # Goofy should set charger state to charge if charge_manager is disabled.
    try:
      system.GetBoard().SetChargeState(Board.ChargeState.CHARGE)
    except BoardException:
      logging.exception('Unable to set charge state on this board')

  self.core_dump_manager = CoreDumpManager(
      self.test_list.options.core_dump_watchlist)

  os.environ['CROS_FACTORY'] = '1'
  os.environ['CROS_DISABLE_SITE_SYSINFO'] = '1'

  # Set CROS_UI since some behaviors in ui.py depend on the
  # particular UI in use.  TODO(jsalz): Remove this (and all
  # places it is used) when the GTK UI is removed.
  os.environ['CROS_UI'] = self.options.ui

  # Initialize hooks.  hooks_class is a dotted "module.Class" path; import
  # the module and instantiate the class.
  module, cls = self.test_list.options.hooks_class.rsplit('.', 1)
  self.hooks = getattr(__import__(module, fromlist=[cls]), cls)()
  assert isinstance(self.hooks, factory.Hooks), (
      "hooks should be of type Hooks but is %r" % type(self.hooks))
  self.hooks.test_list = self.test_list

  if not utils.in_chroot():
    self.cpufreq_manager = CpufreqManager(event_log=self.event_log)

  # Call startup hook.
  self.hooks.OnStartup()
  # Startup hooks may want to skip some tests.
  self.update_skipped_tests()

  self.find_kcrashes()

  if self.options.ui == 'chrome':
    self.env.launch_chrome()
    logging.info('Waiting for a web socket connection')
    self.web_socket_manager.wait()

    # Wait for the test widget size to be set; this is done in
    # an asynchronous RPC so there is a small chance that the
    # web socket might be opened first.
    for _ in range(100):  # 10 s
      try:
        if self.state_instance.get_shared_data('test_widget_size'):
          break
      except KeyError:
        pass  # Retry
      time.sleep(0.1)  # 100 ms
    else:
      # for/else: reached only if the loop never hit "break".
      logging.warn('Never received test_widget_size from UI')

    # Send Chrome a Tab to get focus to the factory UI
    # (http://crosbug.com/p/19444).  TODO(jsalz): remove this hack
    # and figure out the right way to get the focus to Chrome.
    if not utils.in_chroot():
      Spawn(
          [os.path.join(factory.FACTORY_PATH, 'bin', 'send_key'), 'Tab'],
          check_call=True, log=True)
  elif self.options.ui == 'gtk':
    self.start_ui()

  # Create download path for autotest beforehand or autotests run at
  # the same time might fail due to race condition.
  if not factory.in_chroot():
    utils.TryMakeDirs(os.path.join('/usr/local/autotest', 'tests',
                                   'download'))

  # Post a STATE_CHANGE event whenever the test list reports a state change.
  def state_change_callback(test, test_state):
    self.event_client.post_event(
        Event(Event.Type.STATE_CHANGE,
              path=test.path, state=test_state))
  self.test_list.state_change_callback = state_change_callback

  for handler in self.on_ui_startup:
    handler()

  self.prespawner = Prespawner()
  self.prespawner.start()

  try:
    tests_after_shutdown = self.state_instance.get_shared_data(
        'tests_after_shutdown')
  except KeyError:
    tests_after_shutdown = None

  # 'tests_after_shutdown' is None, the FORCE_AUTO_RUN marker (as set by
  # update_factory), or an iterable of test paths to resume.
  force_auto_run = (tests_after_shutdown == FORCE_AUTO_RUN)
  if not force_auto_run and tests_after_shutdown is not None:
    logging.info('Resuming tests after shutdown: %s',
                 tests_after_shutdown)
    self.tests_to_run.extend(
        self.test_list.lookup_path(t) for t in tests_after_shutdown)
    self.run_queue.put(self.run_next_test)
  else:
    if force_auto_run or self.test_list.options.auto_run_on_start:
      self.run_queue.put(
          lambda: self.run_tests(self.test_list, untested_only=True))
  # Reset the stored value now that it has been consumed.
  self.state_instance.set_shared_data('tests_after_shutdown', None)

  self.may_disable_cros_shortcut_keys()
| 1452 | |
def may_disable_cros_shortcut_keys(self):
  '''Starts a KeyFilter if the test list options ask for one.

  Does nothing unless disable_cros_shortcut_keys is set in the test list
  options.  Otherwise a KeyFilter configured from the caps-lock options is
  stored in self.key_filter and started.
  '''
  options = self.test_list.options
  if not options.disable_cros_shortcut_keys:
    return

  logging.info('Filter ChromeOS shortcut keys.')
  self.key_filter = KeyFilter(
      unmap_caps_lock=options.disable_caps_lock,
      caps_lock_keycode=options.caps_lock_keycode)
  self.key_filter.Start()
| 1461 | |
def run(self):
  '''Runs Goofy's event loop until a shutdown is requested.'''
  # Keep processing (blocking for events) until run_once() says to stop.
  keep_going = True
  while keep_going:
    keep_going = self.run_once(True)
Jon Salz | 73e0fd0 | 2012-04-04 11:46:38 +0800 | [diff] [blame] | 1467 | |
def run_once(self, block=False):
  '''Runs all items pending in the event loop.

  While the run queue is empty, self._run_queue_idle() is invoked; in
  blocking mode this repeats every RUN_QUEUE_TIMEOUT_SECS until an item
  arrives.

  Args:
    block: If true, block until at least one event is processed.

  Returns:
    True to keep going or False to shut down.
  '''
  pending = utils.DrainQueue(self.run_queue)
  while not pending:
    # Nothing on the run queue.
    self._run_queue_idle()
    if not block:
      break
    # Block for at least one event...
    try:
      first = self.run_queue.get(timeout=RUN_QUEUE_TIMEOUT_SECS)
    except Queue.Empty:
      # Timed out; go around again (calling _run_queue_idle() once more).
      continue
    pending.append(first)
    # ...and grab anything else that showed up at the same time.
    pending.extend(utils.DrainQueue(self.run_queue))

  for callback in pending:
    if not callback:
      # Shutdown request.
      self.run_queue.task_done()
      return False

    try:
      callback()
    except:  # pylint: disable=W0702
      logging.exception('Error in event loop')
      exc_type, exc_value = sys.exc_info()[:2]
      self.record_exception(
          traceback.format_exception_only(exc_type, exc_value))
      # But keep going
    finally:
      self.run_queue.task_done()
  return True
Jon Salz | 0405ab5 | 2012-03-16 15:26:52 +0800 | [diff] [blame] | 1511 | |
def _should_sync_time(self, foreground=False):
  '''Decides whether a time sync with shopfloor should be attempted.

  Args:
    foreground: If True, synchronizes even if background syncing
      is disabled (e.g., in explicit sync requests from the
      SyncShopfloor test).

  Returns:
    A true value only if a sync is wanted (foreground, or
    sync_time_period_secs is set), a time sanitizer exists, time has not
    been synced yet, and we are not in the chroot.
  '''
  sync_wanted = (
      foreground or self.test_list.options.sync_time_period_secs)
  return (sync_wanted and
          self.time_sanitizer and
          not self.time_synced and
          not factory.in_chroot())
| 1525 | |
def sync_time_with_shopfloor_server(self, foreground=False):
  '''Syncs time with shopfloor server, if not yet synced.

  Args:
    foreground: If True, synchronizes even if background syncing
      is disabled (e.g., in explicit sync requests from the
      SyncShopfloor test).

  Returns:
    False if no time sanitizer is available, or True if this sync (or a
    previous sync) succeeded.

  Raises:
    Exception if unable to contact the shopfloor server.
  '''
  if not self._should_sync_time(foreground):
    # Nothing to do; report whatever state we are already in.
    return self.time_synced

  self.time_sanitizer.SyncWithShopfloor()
  self.time_synced = True
  return self.time_synced
| 1545 | |
def log_disk_space_stats(self):
  '''Logs disk usage at most once per log_disk_space_period_secs.

  Does nothing in the chroot or when log_disk_space_period_secs is unset.
  If usage of the stateful or encrypted stateful partition exceeds
  stateful_usage_threshold, a 'stateful_partition_usage' event is logged,
  event logs are scanned, and the configured above-threshold action (if
  any) is spawned.  The usage summary is written to the log only when it
  differs from the last one logged.  Any failure is logged and otherwise
  ignored.
  '''
  if utils.in_chroot():
    return
  options = self.test_list.options
  period_secs = options.log_disk_space_period_secs
  if not period_secs:
    return

  now = time.time()
  last_time = self.last_log_disk_space_time
  if last_time and now - last_time < period_secs:
    return
  self.last_log_disk_space_time = now

  def usage_dict(usage):
    # Rounded byte/inode usage percentages for one partition.
    return {
        'bytes_used_pct': FloatDigit(usage.bytes_used_pct, 2),
        'inodes_used_pct': FloatDigit(usage.inodes_used_pct, 2)}

  # Upload event if stateful partition usage is above threshold.
  # Stateful partition is mounted on /usr/local, while
  # encrypted stateful partition is mounted on /var.
  # If there are too many logs in the factory process,
  # these two partitions might get full.
  try:
    vfs_infos = disk_space.GetAllVFSInfo()
    stateful_info = None
    encrypted_info = None
    for info in vfs_infos.values():
      if '/usr/local' in info.mount_points:
        stateful_info = info
      if '/var' in info.mount_points:
        encrypted_info = info

    stateful = disk_space.GetPartitionUsage(stateful_info)
    encrypted = disk_space.GetPartitionUsage(encrypted_info)

    threshold = options.stateful_usage_threshold
    above_threshold = (
        threshold and
        max(stateful.bytes_used_pct,
            stateful.inodes_used_pct,
            encrypted.bytes_used_pct,
            encrypted.inodes_used_pct) > threshold)

    if above_threshold:
      self.event_log.Log('stateful_partition_usage',
                         partitions={
                             'stateful': usage_dict(stateful),
                             'encrypted_stateful': usage_dict(encrypted)})
      self.log_watcher.ScanEventLogs()
      if not utils.in_chroot():
        action = options.stateful_usage_above_threshold_action
        if action:
          Spawn(action, call=True)

    message = disk_space.FormatSpaceUsedAll(vfs_infos)
    if message != self.last_log_disk_space_message:
      # Escalate to a warning when usage is above the threshold.
      emit = logging.warning if above_threshold else logging.info
      emit(message)
      self.last_log_disk_space_message = message
  except:  # pylint: disable=W0702
    logging.exception('Unable to get disk space used')
| 1608 | |
def check_battery(self):
  '''Periodically inspects the battery and reports low-charge conditions.

  Does nothing when the check_battery_period_secs option is unset, or when
  the previous check happened less than that many seconds ago.

  Otherwise a status message (charge level and AC state, or a note that no
  battery is present) is built and logged whenever it differs from the last
  message logged by this method.

  If the charge is not above critical_low_battery_pct, the disks are synced,
  unless the charge is not above MIN_BATTERY_LEVEL_FOR_DISK_SYNC.  If the
  level is critical, or AC is disconnected and the charge is at or below
  warning_low_battery_pct, a 'low_battery' event is recorded and the log
  watcher (and the system log manager, if there is one) is kicked.

  Any failure while querying the battery is logged and swallowed.
  '''
  options = self.test_list.options
  period_secs = options.check_battery_period_secs
  if not period_secs:
    return

  now = time.time()
  previous_check = self.last_check_battery_time
  if previous_check and now - previous_check < period_secs:
    # Checked recently enough; try again on a later idle pass.
    return
  self.last_check_battery_time = now

  message = ''
  log_level = logging.INFO
  try:
    power = system.GetBoard().power
    if not power.CheckBatteryPresent():
      message = 'Battery is not present'
      # The finally clause below still logs the message.
      return

    ac_present = power.CheckACPresent()
    charge_pct = power.GetChargePct(get_float=True)
    charger_state = 'connected' if ac_present else 'disconnected'
    message = ('Current battery level %.1f%%, AC charger is %s' %
               (charge_pct, charger_state))

    critical_low_battery = not (
        charge_pct > options.critical_low_battery_pct)
    if critical_low_battery:
      # Flush data to disk so it can be analyzed offline if the shopfloor
      # server cannot be reached, but only while the battery still has
      # enough charge left to do so.
      if charge_pct > MIN_BATTERY_LEVEL_FOR_DISK_SYNC:
        logging.warning('disk syncing for critical low battery situation')
        os.system('sync; sync; sync')
      else:
        logging.warning('disk syncing is cancelled '
                        'because battery level is lower than %.1f',
                        MIN_BATTERY_LEVEL_FOR_DISK_SYNC)

    # Notify shopfloor server.
    if (critical_low_battery or
        (not ac_present and
         charge_pct <= options.warning_low_battery_pct)):
      log_level = logging.WARNING
      self.event_log.Log('low_battery',
                         battery_level=charge_pct,
                         charger_connected=ac_present,
                         critical=critical_low_battery)
      self.log_watcher.KickWatchThread()
      if self.system_log_manager:
        self.system_log_manager.KickSyncThread()
  except:  # pylint: disable=W0702
    logging.exception('Unable to check battery or notify shopfloor')
  finally:
    # Only log when the status text has changed, to avoid flooding the log.
    if message != self.last_check_battery_message:
      logging.log(log_level, message)
      self.last_check_battery_message = message
| 1672 | |
def check_core_dump(self):
  '''Looks for core dump files and reports them to the server.

  Asks the core dump manager to scan for files.  When it returns any, and
  at least kick_sync_min_interval_secs have elapsed since the last report,
  a 'core_dumped' event is logged, the log watcher is kicked, and (if a
  system log manager exists) a sync of those files is requested with the
  core dump manager's ClearFiles passed as the second argument.
  '''
  core_dump_files = self.core_dump_manager.ScanFiles()
  if not core_dump_files:
    return

  now = time.time()
  previous_kick = self.last_kick_sync_time
  min_interval = self.test_list.options.kick_sync_min_interval_secs
  if previous_kick and now - previous_kick < min_interval:
    # Too soon since the last sync request.
    return
  self.last_kick_sync_time = now

  # Sends event to server.
  self.event_log.Log('core_dumped', files=core_dump_files)
  self.log_watcher.KickWatchThread()

  # Syncs files to server.
  if self.system_log_manager:
    self.system_log_manager.KickSyncThread(
        core_dump_files, self.core_dump_manager.ClearFiles)
Cheng-Yi Chiang | cdfa418 | 2013-05-05 03:20:19 +0800 | [diff] [blame] | 1696 | |
def sync_time_in_background(self):
  '''Saves the current time, then syncs the clock in a background thread.

  Nothing happens when there is no time sanitizer.  Otherwise the current
  time is saved through it.  If _should_sync_time() allows it and at least
  sync_time_period_secs have passed since the last attempt, a daemon thread
  is started that calls sync_time_with_shopfloor_server(); a failure there
  is logged at info level without a traceback.
  '''
  sanitizer = self.time_sanitizer
  if not sanitizer:
    return

  # Write out the current time.
  sanitizer.SaveTime()

  if not self._should_sync_time():
    return

  now = time.time()
  previous_sync = self.last_sync_time
  if previous_sync:
    if now - previous_sync < self.test_list.options.sync_time_period_secs:
      # Not yet time for another check.
      return
  self.last_sync_time = now

  def sync_worker():
    try:
      self.sync_time_with_shopfloor_server()
    except:  # pylint: disable=W0702
      # Oh well.  Log an error (but no trace).
      logging.info(
          'Unable to get time from shopfloor server: %s',
          utils.FormatExceptionOnly())

  worker = threading.Thread(target=sync_worker)
  worker.daemon = True
  worker.start()
| 1728 | |
def _run_queue_idle(self):
  '''Performs periodic housekeeping when the run queue has no events.

  Runs at most once every (RUN_QUEUE_TIMEOUT_SECS - 1) seconds; calls
  arriving sooner return immediately.

  This method must not raise exception.
  '''
  now = time.time()
  if self.last_idle:
    earliest_next_run = self.last_idle + RUN_QUEUE_TIMEOUT_SECS - 1
    if now < earliest_next_run:
      return

  self.last_idle = now

  # Housekeeping tasks, looked up and invoked one at a time, in this order.
  for task_name in ('check_exclusive',
                    'check_for_updates',
                    'sync_time_in_background',
                    'log_disk_space_stats',
                    'check_battery',
                    'check_core_dump'):
    getattr(self, task_name)()
Jon Salz | 57717ca | 2012-04-04 16:47:25 +0800 | [diff] [blame] | 1749 | |
def handle_event_logs(self, chunks):
  '''Callback for event watcher; uploads event logs to the shopfloor server.

  When the sync_event_log option is off, the chunks are only mentioned in
  an info log message and nothing is uploaded.

  Args:
    chunks: A list of Chunk objects.

  Raises:
    Exception: if uploading one or more chunks failed.  The message names
      the number of failures (when more than one) and the first failure.
  '''
  options = self.test_list.options
  if not options.sync_event_log:
    logging.info('Skipped syncing event logs %s',
                 ', '.join(str(chunk) for chunk in chunks))
    return

  failure_count = 0
  first_failure = None

  for chunk in chunks:
    try:
      description = 'event logs (%s)' % str(chunk)
      started_at = time.time()
      client = shopfloor.get_instance(
          detect=True,
          timeout=options.shopfloor_timeout_secs)
      remote_name = chunk.log_name + "." + event_log.GetReimageId()
      client.UploadEvent(remote_name, Binary(chunk.chunk))
      logging.info(
          'Successfully synced %s in %.03f s',
          description, time.time() - started_at)
    except:  # pylint: disable=W0702
      # Keep going with the remaining chunks; remember only the first error.
      if not first_failure:
        first_failure = chunk.log_name + ': ' + utils.FormatExceptionOnly()
      failure_count += 1

  if not failure_count:
    return

  if failure_count == 1:
    msg = 'Log upload failed: %s' % first_failure
  else:
    msg = '%d log upload failed; first is: %s' % (
        failure_count, first_failure)
  raise Exception(msg)
| 1791 | |
Jon Salz | 57717ca | 2012-04-04 16:47:25 +0800 | [diff] [blame] | 1792 | |
def run_tests_with_status(self, statuses_to_run, starting_at=None,
                          root=None):
  '''Runs all top-level tests whose status is one of the given statuses.

  All active tests, plus any tests to re-run, are reset to UNTESTED (along
  with every test beneath them) after the active tests have been aborted.

  Args:
    statuses_to_run: Collection of statuses; a top-level test is run if its
      current status is in this collection.
    starting_at: If provided, only top-level tests from this test onwards
      are considered.  Must be a factory.FactoryTest.
    root: The test whose top-level tests are examined; defaults to the
      whole test list.
  '''
  if not root:
    root = self.test_list

  if starting_at:
    # Make sure they passed a test, not a string.
    assert isinstance(starting_at, factory.FactoryTest)

  reset_candidates = []
  run_candidates = []

  # With no starting_at, every top-level test is eligible from the start.
  reached_start = not starting_at

  for top_level_test in root.get_top_level_tests():
    if not reached_start:
      if top_level_test == starting_at:
        # We've found starting_at; consider it and all subsequent tests.
        reached_start = True
      else:
        # Don't start this guy yet.
        continue

    status = top_level_test.get_state().status
    wanted = status in statuses_to_run
    if wanted or status == TestState.ACTIVE:
      # Reset the test (later; we will need to abort all active tests
      # first).
      reset_candidates.append(top_level_test)
    if wanted:
      run_candidates.append(top_level_test)

  self.abort_active_tests('Operator requested run/re-run of certain tests')

  # Reset all statuses of the tests to run (in case any tests were active;
  # we want them to be run again).
  for candidate in reset_candidates:
    for descendant in candidate.walk():
      descendant.update_state(status=TestState.UNTESTED)

  self.run_tests(run_candidates, untested_only=True)
Jon Salz | 0405ab5 | 2012-03-16 15:26:52 +0800 | [diff] [blame] | 1841 | |
def restart_tests(self, root=None):
  '''Aborts active tests, resets everything under root, and runs root.

  Args:
    root: The test to restart; defaults to the whole test list.
  '''
  if not root:
    root = self.test_list

  self.abort_active_tests('Operator requested restart of certain tests')

  # Mark every test in the subtree as untested before running it again.
  for node in root.walk():
    node.update_state(status=TestState.UNTESTED)

  self.run_tests(root)
Hung-Te Lin | 9663236 | 2012-03-20 21:14:18 +0800 | [diff] [blame] | 1850 | |
def auto_run(self, starting_at=None, root=None):
  '''"Auto-runs" tests that are currently untested or active.

  Args:
    starting_at: If provided, only auto-runs tests beginning with
      this test.
    root: The test whose top-level tests are considered; defaults to the
      whole test list.
  '''
  if not root:
    root = self.test_list

  statuses = [TestState.UNTESTED, TestState.ACTIVE]
  self.run_tests_with_status(statuses, starting_at=starting_at, root=root)
Jon Salz | 968e90b | 2012-03-18 16:12:43 +0800 | [diff] [blame] | 1862 | |
def re_run_failed(self, root=None):
  '''Runs again every top-level test under root whose status is FAILED.

  Args:
    root: The test whose top-level tests are considered; defaults to the
      whole test list.
  '''
  if not root:
    root = self.test_list

  failed_only = [TestState.FAILED]
  self.run_tests_with_status(failed_only, root=root)
Jon Salz | 57717ca | 2012-04-04 16:47:25 +0800 | [diff] [blame] | 1867 | |
def show_review_information(self):
  '''Event handler for showing the review information screen.

  The information screen itself is rendered by the main UI program (ui.py).
  On the goofy side all that is needed is to stop whatever is running:
  active tests are killed and pending tests are cancelled.
  '''
  # Kill active tests first, then drop whatever is still queued.
  self.kill_active_tests(False)
  self.cancel_pending_tests()
Jon Salz | 57717ca | 2012-04-04 16:47:25 +0800 | [diff] [blame] | 1877 | |
def handle_switch_test(self, event):
  '''Switches to a particular test.

  If the test is already running and is backgroundable, it is simply made
  the visible test.  Otherwise all active tests are aborted, the requested
  test and everything beneath it are reset to UNTESTED, and the test is run
  (via auto_run starting at that test when the auto_run_on_keypress option
  is set, via run_tests otherwise).

  Args:
    event: The SWITCH_TEST event.  Its 'path' attribute is the path of the
      test to switch to.
  '''
  test = self.test_list.lookup_path(event.path)
  if not test:
    # Report the path that was actually looked up.  (This used to read
    # event.key, which is not the attribute used for the lookup and raised
    # AttributeError for events carrying only a path.)
    logging.error('Unknown test %r', event.path)
    return

  invoc = self.invocations.get(test)
  if invoc and test.backgroundable:
    # Already running: just bring to the front if it has a UI.
    logging.info('Setting visible test to %s', test.path)
    self.set_visible_test(test)
    return

  self.abort_active_tests('Operator requested abort (switch_test)')
  for t in test.walk():
    t.update_state(status=TestState.UNTESTED)

  if self.test_list.options.auto_run_on_keypress:
    self.auto_run(starting_at=test)
  else:
    self.run_tests(test)
Jon Salz | 73e0fd0 | 2012-04-04 11:46:38 +0800 | [diff] [blame] | 1904 | |
def wait(self):
  '''Waits for all pending invocations.

  Repeatedly joins the thread of every invocation currently registered in
  self.invocations and then calls reap_completed_tests(), until
  self.invocations is empty.

  Useful for testing.
  '''
  while self.invocations:
    # Iterate over a snapshot: join() may block for a long time, and a live
    # dict iterator breaks if an entry is removed in the meantime.  Unlike
    # iteritems(), this form also works on Python 3.
    for test, invocation in list(self.invocations.items()):
      logging.info('Waiting for %s to complete...', test)
      invocation.thread.join()
    self.reap_completed_tests()
Jon Salz | 0697cbf | 2012-07-04 15:14:04 +0800 | [diff] [blame] | 1915 | |
def check_exceptions(self):
  '''Raises an error if any exceptions were recorded for invocation threads.

  Raises:
    RuntimeError: if self.exceptions is non-empty; the message includes the
      recorded entries.
  '''
  recorded = self.exceptions
  if not recorded:
    return
  raise RuntimeError('Exception in invocation thread: %r' % recorded)
| 1922 | |
def record_exception(self, msg):
  '''Records an exception that occurred in an invocation thread.

  The message is appended to self.exceptions, which check_exceptions()
  later reports by raising.

  Args:
    msg: The message describing the exception.
  '''
  recorded = self.exceptions
  recorded.append(msg)
Jon Salz | 73e0fd0 | 2012-04-04 11:46:38 +0800 | [diff] [blame] | 1929 | |
Hung-Te Lin | f2f78f7 | 2012-02-08 19:27:11 +0800 | [diff] [blame] | 1930 | |
if __name__ == '__main__':
  # Script entry point: run Goofy's main loop and always tear it down.
  goofy = Goofy()
  try:
    try:
      goofy.main()
    except SystemExit:
      # A graceful exit: propagate it without logging.
      raise
    except:  # pylint: disable=W0702
      # Anything else is logged before shutdown is attempted, then
      # re-raised.
      logging.exception('Error in main loop')
      raise
  finally:
    goofy.destroy()