blob: 632cece3dca9e63fcbbc81435978bf0e82a80c1a [file] [log] [blame]
Hung-Te Linf2f78f72012-02-08 19:27:11 +08001#!/usr/bin/python -u
Hung-Te Linf2f78f72012-02-08 19:27:11 +08002# -*- coding: utf-8 -*-
3#
Jon Salz37eccbd2012-05-25 16:06:52 +08004# Copyright (c) 2012 The Chromium OS Authors. All rights reserved.
Hung-Te Linf2f78f72012-02-08 19:27:11 +08005# Use of this source code is governed by a BSD-style license that can be
6# found in the LICENSE file.
7
8'''
9The main factory flow that runs the factory test and finalizes a device.
10'''
11
Jon Salze12c2b32013-06-25 16:24:34 +080012import glob
Jon Salz0405ab52012-03-16 15:26:52 +080013import logging
14import os
Jon Salz73e0fd02012-04-04 11:46:38 +080015import Queue
Jon Salze12c2b32013-06-25 16:24:34 +080016import shutil
Jon Salz77c151e2012-08-28 07:20:37 +080017import signal
Jon Salz0405ab52012-03-16 15:26:52 +080018import sys
Jon Salzeff94182013-06-19 15:06:28 +080019import syslog
Jon Salz0405ab52012-03-16 15:26:52 +080020import threading
21import time
22import traceback
Jon Salz258a40c2012-04-19 12:34:01 +080023import uuid
Jon Salzb10cf512012-08-09 17:29:21 +080024from xmlrpclib import Binary
Hung-Te Linf2f78f72012-02-08 19:27:11 +080025from collections import deque
26from optparse import OptionParser
Hung-Te Linf2f78f72012-02-08 19:27:11 +080027
Jon Salz0697cbf2012-07-04 15:14:04 +080028import factory_common # pylint: disable=W0611
jcliangcd688182012-08-20 21:01:26 +080029from cros.factory import event_log
30from cros.factory import system
Cheng-Yi Chiangd0406522013-04-01 15:40:18 +080031from cros.factory.event_log import EventLog, FloatDigit
Tom Wai-Hong Tamd33723e2013-04-10 21:14:37 +080032from cros.factory.event_log_watcher import EventLogWatcher
jcliangcd688182012-08-20 21:01:26 +080033from cros.factory.goofy import test_environment
34from cros.factory.goofy import time_sanitizer
Jon Salz83591782012-06-26 11:09:58 +080035from cros.factory.goofy import updater
jcliangcd688182012-08-20 21:01:26 +080036from cros.factory.goofy.goofy_rpc import GoofyRPC
Jon Salz885dcac2013-07-23 16:39:50 +080037from cros.factory.goofy.invocation import TestArgEnv
jcliangcd688182012-08-20 21:01:26 +080038from cros.factory.goofy.invocation import TestInvocation
39from cros.factory.goofy.prespawner import Prespawner
Cheng-Yi Chiang344b10f2013-05-03 16:44:03 +080040from cros.factory.goofy.system_log_manager import SystemLogManager
jcliangcd688182012-08-20 21:01:26 +080041from cros.factory.goofy.web_socket_manager import WebSocketManager
Cheng-Yi Chiangd8186952013-04-04 23:41:14 +080042from cros.factory.system.board import Board, BoardException
jcliangcd688182012-08-20 21:01:26 +080043from cros.factory.system.charge_manager import ChargeManager
Cheng-Yi Chiangcdfa4182013-05-05 03:20:19 +080044from cros.factory.system.core_dump_manager import CoreDumpManager
Jon Salzce6a7f82013-06-10 18:22:54 +080045from cros.factory.system.cpufreq_manager import CpufreqManager
Jon Salzb92c5112012-09-21 15:40:11 +080046from cros.factory.system import disk_space
jcliangcd688182012-08-20 21:01:26 +080047from cros.factory.test import factory
48from cros.factory.test import state
Jon Salz51528e12012-07-02 18:54:45 +080049from cros.factory.test import shopfloor
Jon Salz83591782012-06-26 11:09:58 +080050from cros.factory.test import utils
Jon Salz128b0932013-07-03 16:55:26 +080051from cros.factory.test.test_lists import test_lists
Jon Salz83591782012-06-26 11:09:58 +080052from cros.factory.test.event import Event
53from cros.factory.test.event import EventClient
54from cros.factory.test.event import EventServer
jcliangcd688182012-08-20 21:01:26 +080055from cros.factory.test.factory import TestState
Jon Salzd7550792013-07-12 05:49:27 +080056from cros.factory.test.utils import Enum
Dean Liao592e4d52013-01-10 20:06:39 +080057from cros.factory.tools.key_filter import KeyFilter
Jon Salz2af235d2013-06-24 14:47:21 +080058from cros.factory.utils import file_utils
Jon Salz78c32392012-07-25 14:18:29 +080059from cros.factory.utils.process_utils import Spawn
Hung-Te Linf2f78f72012-02-08 19:27:11 +080060
61
# File holding the HWID config tag; get_hwid_cfg() reads it when the
# CROS_HWID environment variable is not set.
HWID_CFG_PATH = '/usr/local/share/chromeos-hwid/cfg'
# The "caches" directory underneath the factory state root.
CACHES_DIR = os.path.join(factory.get_state_root(), "caches")

# NOTE(review): presumably a marker file whose presence pauses log cleanup;
# the code that uses it is not in this part of the file -- confirm.
CLEANUP_LOGS_PAUSED = '/var/lib/cleanup_logs_paused'

# File that suppresses reboot if present (e.g., for development).
NO_REBOOT_FILE = '/var/log/factory.noreboot'

# Value for tests_after_shutdown that forces auto-run (e.g., after
# a factory update, when the available set of tests might change).
FORCE_AUTO_RUN = 'force_auto_run'

# NOTE(review): presumably the timeout, in seconds, used when waiting on the
# run queue; the consumer is not in this part of the file -- confirm.
RUN_QUEUE_TIMEOUT_SECS = 10

# Only sync disks when the battery level is higher than this value.
# Otherwise, a power loss in the middle of the sync operation could lead to
# an even worse outcome than not syncing at all.
MIN_BATTERY_LEVEL_FOR_DISK_SYNC = 1.0

# 64 KiB.
# NOTE(review): presumably an upper bound, in bytes, applied to crash files;
# the code that enforces it is not in this part of the file -- confirm.
MAX_CRASH_FILE_SIZE = 64*1024

# Banner text explaining how to run Goofy inside the chroot, framed above and
# below by a row of 70 asterisks.
GOOFY_IN_CHROOT_WARNING = '\n' + ('*' * 70) + '''
You are running Goofy inside the chroot. Autotests are not supported.

To use Goofy in the chroot, first install an Xvnc server:

 sudo apt-get install tightvncserver

...and then start a VNC X server outside the chroot:

 vncserver :10 &
 vncviewer :10

...and run Goofy as follows:

 env --unset=XAUTHORITY DISPLAY=localhost:10 python goofy.py
''' + ('*' * 70)
# NOTE(review): presumably set to True to keep the banner above from being
# shown; the code that checks it is not in this part of the file -- confirm.
suppress_chroot_warning = False

# Lifecycle states of a Goofy instance.  Goofy.__init__ starts in
# UNINITIALIZED; Goofy.destroy moves through TERMINATING to TERMINATED.
Status = Enum(['UNINITIALIZED', 'INITIALIZING', 'RUNNING',
               'TERMINATING', 'TERMINATED'])
102
def get_hwid_cfg():
  '''Looks up the HWID config tag.

  The CROS_HWID environment variable wins when it is set (even if it is
  empty); otherwise the stripped contents of HWID_CFG_PATH are used.

  Returns:
    The HWID config tag, or an empty string if neither source exists.
  '''
  hwid_from_env = os.environ.get('CROS_HWID')
  if hwid_from_env is not None:
    return hwid_from_env

  if not os.path.exists(HWID_CFG_PATH):
    return ''

  with open(HWID_CFG_PATH, 'rt') as cfg_file:
    return cfg_file.read().strip()
Hung-Te Linf2f78f72012-02-08 19:27:11 +0800113
114
# NOTE(review): presumably records whether logging has already been set up so
# that it is only initialized once; the code that reads and updates this flag
# is not in this part of the file -- confirm.
_inited_logging = False
Hung-Te Linf2f78f72012-02-08 19:27:11 +0800116
117class Goofy(object):
Jon Salz0697cbf2012-07-04 15:14:04 +0800118 '''
119 The main factory flow.
120
121 Note that all methods in this class must be invoked from the main
122 (event) thread. Other threads, such as callbacks and TestInvocation
123 methods, should instead post events on the run queue.
124
125 TODO: Unit tests. (chrome-os-partner:7409)
126
127 Properties:
128 uuid: A unique UUID for this invocation of Goofy.
129 state_instance: An instance of FactoryState.
130 state_server: The FactoryState XML/RPC server.
131 state_server_thread: A thread running state_server.
132 event_server: The EventServer socket server.
133 event_server_thread: A thread running event_server.
134 event_client: A client to the event server.
135 connection_manager: The connection_manager object.
Cheng-Yi Chiang835f2682013-05-06 22:15:48 +0800136 system_log_manager: The SystemLogManager object.
137 core_dump_manager: The CoreDumpManager object.
Jon Salz0697cbf2012-07-04 15:14:04 +0800138 ui_process: The factory ui process object.
139 run_queue: A queue of callbacks to invoke from the main thread.
140 invocations: A map from FactoryTest objects to the corresponding
141 TestInvocations objects representing active tests.
142 tests_to_run: A deque of tests that should be run when the current
143 test(s) complete.
144 options: Command-line options.
145 args: Command-line args.
146 test_list: The test list.
Jon Salz128b0932013-07-03 16:55:26 +0800147 test_lists: All new-style test lists.
Jon Salz0697cbf2012-07-04 15:14:04 +0800148 event_handlers: Map of Event.Type to the method used to handle that
149 event. If the method has an 'event' argument, the event is passed
150 to the handler.
151 exceptions: Exceptions encountered in invocation threads.
Jon Salz3c493bb2013-02-07 17:24:58 +0800152 last_log_disk_space_message: The last message we logged about disk space
153 (to avoid duplication).
Cheng-Yi Chiangcdfa4182013-05-05 03:20:19 +0800154 last_kick_sync_time: The last time to kick system_log_manager to sync
155 because of core dump files (to avoid kicking too soon then abort the
156 sync.)
Jon Salz416f9cc2013-05-10 18:32:50 +0800157 hooks: A Hooks object containing hooks for various Goofy actions.
Jon Salzd7550792013-07-12 05:49:27 +0800158 status: The current Goofy status (a member of the Status enum).
Jon Salz0697cbf2012-07-04 15:14:04 +0800159 '''
160 def __init__(self):
161 self.uuid = str(uuid.uuid4())
162 self.state_instance = None
163 self.state_server = None
164 self.state_server_thread = None
Jon Salz16d10542012-07-23 12:18:45 +0800165 self.goofy_rpc = None
Jon Salz0697cbf2012-07-04 15:14:04 +0800166 self.event_server = None
167 self.event_server_thread = None
168 self.event_client = None
169 self.connection_manager = None
Vic Yang4953fc12012-07-26 16:19:53 +0800170 self.charge_manager = None
Jon Salz8fa8e832012-07-13 19:04:09 +0800171 self.time_sanitizer = None
172 self.time_synced = False
Jon Salz0697cbf2012-07-04 15:14:04 +0800173 self.log_watcher = None
Cheng-Yi Chiang344b10f2013-05-03 16:44:03 +0800174 self.system_log_manager = None
Cheng-Yi Chiang835f2682013-05-06 22:15:48 +0800175 self.core_dump_manager = None
Jon Salz0697cbf2012-07-04 15:14:04 +0800176 self.event_log = None
177 self.prespawner = None
178 self.ui_process = None
Jon Salzc79a9982012-08-30 04:42:01 +0800179 self.dummy_shopfloor = None
Jon Salz0697cbf2012-07-04 15:14:04 +0800180 self.run_queue = Queue.Queue()
181 self.invocations = {}
182 self.tests_to_run = deque()
183 self.visible_test = None
184 self.chrome = None
Jon Salz416f9cc2013-05-10 18:32:50 +0800185 self.hooks = None
Vic Yangd8990da2013-06-27 16:57:43 +0800186 self.cpu_usage_watcher = None
Jon Salz0697cbf2012-07-04 15:14:04 +0800187
188 self.options = None
189 self.args = None
190 self.test_list = None
Jon Salz128b0932013-07-03 16:55:26 +0800191 self.test_lists = None
Jon Salz0697cbf2012-07-04 15:14:04 +0800192 self.on_ui_startup = []
193 self.env = None
Jon Salzb22d1172012-08-06 10:38:57 +0800194 self.last_idle = None
Jon Salz0697cbf2012-07-04 15:14:04 +0800195 self.last_shutdown_time = None
cychiang21886742012-07-05 15:16:32 +0800196 self.last_update_check = None
Jon Salz8fa8e832012-07-13 19:04:09 +0800197 self.last_sync_time = None
Jon Salzb92c5112012-09-21 15:40:11 +0800198 self.last_log_disk_space_time = None
Jon Salz3c493bb2013-02-07 17:24:58 +0800199 self.last_log_disk_space_message = None
Justin Chuang83813982013-05-13 01:26:32 +0800200 self.last_check_battery_time = None
201 self.last_check_battery_message = None
Cheng-Yi Chiangcdfa4182013-05-05 03:20:19 +0800202 self.last_kick_sync_time = None
Vic Yang311ddb82012-09-26 12:08:28 +0800203 self.exclusive_items = set()
Jon Salz0f996602012-10-03 15:26:48 +0800204 self.event_log = None
Dean Liao592e4d52013-01-10 20:06:39 +0800205 self.key_filter = None
Jon Salzce6a7f82013-06-10 18:22:54 +0800206 self.cpufreq_manager = None
Jon Salzd7550792013-07-12 05:49:27 +0800207 self.status = Status.UNINITIALIZED
Jon Salz0697cbf2012-07-04 15:14:04 +0800208
Jon Salz85a39882012-07-05 16:45:04 +0800209 def test_or_root(event, parent_or_group=True):
210 '''Returns the test affected by a particular event.
211
212 Args:
213 event: The event containing an optional 'path' attribute.
214 parent_on_group: If True, returns the top-level parent for a test (the
215 root node of the tests that need to be run together if the given test
216 path is to be run).
217 '''
Jon Salz0697cbf2012-07-04 15:14:04 +0800218 try:
219 path = event.path
220 except AttributeError:
221 path = None
222
223 if path:
Jon Salz85a39882012-07-05 16:45:04 +0800224 test = self.test_list.lookup_path(path)
225 if parent_or_group:
226 test = test.get_top_level_parent_or_group()
227 return test
Jon Salz0697cbf2012-07-04 15:14:04 +0800228 else:
229 return self.test_list
230
231 self.event_handlers = {
232 Event.Type.SWITCH_TEST: self.handle_switch_test,
233 Event.Type.SHOW_NEXT_ACTIVE_TEST:
234 lambda event: self.show_next_active_test(),
235 Event.Type.RESTART_TESTS:
236 lambda event: self.restart_tests(root=test_or_root(event)),
237 Event.Type.AUTO_RUN:
238 lambda event: self.auto_run(root=test_or_root(event)),
239 Event.Type.RE_RUN_FAILED:
240 lambda event: self.re_run_failed(root=test_or_root(event)),
241 Event.Type.RUN_TESTS_WITH_STATUS:
242 lambda event: self.run_tests_with_status(
243 event.status,
244 root=test_or_root(event)),
245 Event.Type.REVIEW:
246 lambda event: self.show_review_information(),
247 Event.Type.UPDATE_SYSTEM_INFO:
248 lambda event: self.update_system_info(),
Jon Salz0697cbf2012-07-04 15:14:04 +0800249 Event.Type.STOP:
Jon Salz85a39882012-07-05 16:45:04 +0800250 lambda event: self.stop(root=test_or_root(event, False),
Jon Salz6dc031d2013-06-19 13:06:23 +0800251 fail=getattr(event, 'fail', False),
252 reason=getattr(event, 'reason', None)),
Jon Salz36fbbb52012-07-05 13:45:06 +0800253 Event.Type.SET_VISIBLE_TEST:
254 lambda event: self.set_visible_test(
255 self.test_list.lookup_path(event.path)),
Jon Salz4712ac72013-02-07 17:12:05 +0800256 Event.Type.CLEAR_STATE:
257 lambda event: self.clear_state(self.test_list.lookup_path(event.path)),
Jon Salz0697cbf2012-07-04 15:14:04 +0800258 }
259
260 self.exceptions = []
261 self.web_socket_manager = None
262
def destroy(self):
  '''Stops every helper that is currently set and marks Goofy terminated.

  Each resource is only touched if its attribute is set, so this is safe to
  call on a partially started instance.  The status is TERMINATING while the
  teardown runs and becomes TERMINATED only if check_exceptions() returns
  normally.
  '''
  self.status = Status.TERMINATING
  # Helper processes first.
  if self.chrome:
    self.chrome.kill()
    self.chrome = None
  if self.dummy_shopfloor:
    self.dummy_shopfloor.kill()
    self.dummy_shopfloor = None
  if self.ui_process:
    utils.kill_process_tree(self.ui_process, 'ui')
    self.ui_process = None
  if self.web_socket_manager:
    logging.info('Stopping web sockets')
    self.web_socket_manager.close()
    self.web_socket_manager = None
  if self.state_server_thread:
    logging.info('Stopping state server')
    # Ask the serving loop to stop, wait for its thread, then close the
    # server.
    self.state_server.shutdown()
    self.state_server_thread.join()
    self.state_server.server_close()
    self.state_server_thread = None
  # Unlike most attributes here, state_instance is not reset to None.
  if self.state_instance:
    self.state_instance.close()
  if self.event_server_thread:
    logging.info('Stopping event server')
    self.event_server.shutdown() # pylint: disable=E1101
    self.event_server_thread.join()
    self.event_server.server_close()
    self.event_server_thread = None
  if self.log_watcher:
    if self.log_watcher.IsThreadStarted():
      self.log_watcher.StopWatchThread()
    self.log_watcher = None
  if self.system_log_manager:
    if self.system_log_manager.IsThreadRunning():
      self.system_log_manager.StopSyncThread()
    self.system_log_manager = None
  if self.prespawner:
    logging.info('Stopping prespawner')
    self.prespawner.stop()
    self.prespawner = None
  if self.event_client:
    logging.info('Closing event client')
    self.event_client.close()
    self.event_client = None
  # cpufreq_manager, key_filter and cpu_usage_watcher are stopped but their
  # attributes are left set.
  if self.cpufreq_manager:
    self.cpufreq_manager.Stop()
  if self.event_log:
    self.event_log.Close()
    self.event_log = None
  if self.key_filter:
    self.key_filter.Stop()
  if self.cpu_usage_watcher:
    self.cpu_usage_watcher.terminate()

  self.check_exceptions()
  logging.info('Done destroying Goofy')
  self.status = Status.TERMINATED
Jon Salz0697cbf2012-07-04 15:14:04 +0800321
def start_state_server(self):
  '''Creates the state server and serves it from a background thread.

  Also creates the GoofyRPC object and registers its methods on the new
  state instance.
  '''
  # The stateful partitions must be remounted with no commit flag before
  # the state server starts: the default commit time (commit=600) makes
  # corruption too likely.
  file_utils.ResetCommitTime()

  instance, server = state.create_server(bind_address='0.0.0.0')
  self.state_instance = instance
  self.state_server = server

  self.goofy_rpc = GoofyRPC(self)
  self.goofy_rpc.RegisterMethods(instance)

  logging.info('Starting state server')
  server_thread = threading.Thread(target=server.serve_forever,
                                   name='StateServer')
  self.state_server_thread = server_thread
  server_thread.start()
337
def start_event_server(self):
  '''Starts the event server, its client and the web socket manager.

  The event server is served from its own thread.  The event client
  delivers events to handle_event() via the run queue, and the web socket
  manager is attached to the state server under "/event".
  '''
  server = EventServer()
  self.event_server = server
  logging.info('Starting factory event server')
  server_thread = threading.Thread(
      target=server.serve_forever,
      name='EventServer') # pylint: disable=E1101
  self.event_server_thread = server_thread
  server_thread.start()

  self.event_client = EventClient(
      callback=self.handle_event, event_loop=self.run_queue)

  sockets = WebSocketManager(self.uuid)
  self.web_socket_manager = sockets
  self.state_server.add_handler("/event", sockets.handle_web_socket)
352
def start_ui(self):
  '''Spawns the UI process and blocks until it reports UI_READY.'''
  ui_script = os.path.join(factory.FACTORY_PACKAGE_PATH, 'test', 'ui.py')
  ui_proc_args = [ui_script, self.options.test_list]
  if self.options.verbose:
    ui_proc_args.append('-v')

  logging.info('Starting ui %s', ui_proc_args)
  self.ui_process = Spawn(ui_proc_args)

  def is_ui_ready(event):
    return event.type == Event.Type.UI_READY

  logging.info('Waiting for UI to come up...')
  self.event_client.wait(is_ui_ready)
  logging.info('UI has started')
365
def set_visible_test(self, test):
  '''Makes the given test the visible one.

  Nothing happens if the test is already visible, or if it has no UI.
  Otherwise the new test (if any) is marked visible, the previously visible
  test (if any) is marked not visible, and self.visible_test is updated.

  Args:
    test: The test to show, or None to show no test.
  '''
  previous = self.visible_test
  if previous == test:
    return

  if test:
    if not test.has_ui:
      return
    test.update_state(visible=True)

  if previous:
    previous.update_state(visible=False)
  self.visible_test = test
377
def _log_startup_messages(self):
  '''Logs /var/log/messages, mosys, EC console and EC panic information.

  Does nothing inside the chroot.  Each of the four sources is fetched
  independently; a failure in one is logged and the others still run.
  '''
  # TODO(jsalz): This is mostly a copy-and-paste of code in init_states,
  # for factory-3004.B only. Consolidate and merge back to ToT.
  if utils.in_chroot():
    return

  try:
    messages_tail = utils.var_log_messages_before_reboot()
    logging.info(
        'Tail of /var/log/messages before last reboot:\n%s',
        '\n'.join(' ' + line for line in messages_tail))
  except: # pylint: disable=W0702
    logging.exception('Unable to grok /var/log/messages')

  try:
    mosys_process = utils.Spawn(
        ['mosys', 'eventlog', 'list'],
        read_stdout=True, log_stderr_on_error=True)
    logging.info('System eventlog from mosys:\n%s\n',
                 mosys_process.stdout_data)
  except: # pylint: disable=W0702
    logging.exception('Unable to read mosys eventlog')

  try:
    console_log = system.GetBoard().GetECConsoleLog()
    logging.info('EC console log after reboot:\n%s\n', console_log)
  except: # pylint: disable=W0702
    logging.exception('Error retrieving EC console log')

  try:
    panic_info = system.GetBoard().GetECPanicInfo()
    logging.info('EC panic info after reboot:\n%s\n', panic_info)
  except: # pylint: disable=W0702
    logging.exception('Error retrieving EC panic info')
416
def handle_shutdown_complete(self, test, test_state):
  '''Handles the case where a shutdown was detected during a shutdown step.

  Increments the step's shutdown count and then either records a final
  result (pass or fail) or queues another reboot to run once the UI is up.
  Every outcome is reported through log_and_update_state, so each one
  produces a 'rebooted' event-log entry.

  @param test: The ShutdownStep.
  @param test_state: The test state. It is replaced straight away by the
      state returned from incrementing the shutdown count.
  '''
  test_state = test.update_state(increment_shutdown_count=1)
  logging.info('Detected shutdown (%d of %d)',
               test_state.shutdown_count, test.iterations)

  def log_and_update_state(status, error_msg, **kw):
    '''Records the outcome in the event log, the log and the test state.'''
    self.event_log.Log('rebooted',
                       status=status, error_msg=error_msg, **kw)
    logging.info('Rebooted: status=%s, %s', status,
                 (('error_msg=%s' % error_msg) if error_msg else None))
    test.update_state(status=status, error_msg=error_msg)

  if not self.last_shutdown_time:
    log_and_update_state(status=TestState.FAILED,
                         error_msg='Unable to read shutdown_time')
    return

  now = time.time()
  logging.info('%.03f s passed since reboot',
               now - self.last_shutdown_time)

  if self.last_shutdown_time > now:
    # Use the shared helper like every other branch, so that this failure
    # is also written to the event log.
    log_and_update_state(status=TestState.FAILED,
                         error_msg='Time moved backward during reboot')
  elif (isinstance(test, factory.RebootStep) and
        self.test_list.options.max_reboot_time_secs and
        (now - self.last_shutdown_time >
         self.test_list.options.max_reboot_time_secs)):
    # A reboot took too long; fail.  (We don't check this for
    # HaltSteps, because the machine could be halted for a
    # very long time, and even unplugged with battery backup,
    # thus hosing the clock.)
    log_and_update_state(
        status=TestState.FAILED,
        error_msg=('More than %d s elapsed during reboot '
                   '(%.03f s, from %s to %s)' % (
                       self.test_list.options.max_reboot_time_secs,
                       now - self.last_shutdown_time,
                       utils.TimeString(self.last_shutdown_time),
                       utils.TimeString(now))),
        duration=(now-self.last_shutdown_time))
    self._log_startup_messages()
  elif test_state.shutdown_count == test.iterations:
    # Good!
    log_and_update_state(status=TestState.PASSED,
                         duration=(now - self.last_shutdown_time),
                         error_msg='')
  elif test_state.shutdown_count > test.iterations:
    # Shut down too many times
    log_and_update_state(status=TestState.FAILED,
                         error_msg='Too many shutdowns')
    self._log_startup_messages()
  elif utils.are_shift_keys_depressed():
    logging.info('Shift keys are depressed; cancelling restarts')
    # Abort shutdown
    log_and_update_state(
        status=TestState.FAILED,
        error_msg='Shutdown aborted with double shift keys')
    self.cancel_pending_tests()
  else:
    def handler():
      '''Gives the operator a chance to cancel, then reboots again.'''
      if self._prompt_cancel_shutdown(
          test, test_state.shutdown_count + 1):
        factory.console.info('Shutdown aborted by operator')
        log_and_update_state(
            status=TestState.FAILED,
            error_msg='Shutdown aborted by operator')
        self.cancel_pending_tests()
        return

      # Time to shutdown again
      log_and_update_state(
          status=TestState.ACTIVE,
          error_msg='',
          iteration=test_state.shutdown_count)

      self.event_log.Log('shutdown', operation='reboot')
      self.state_instance.set_shared_data('shutdown_time',
                                          time.time())
      self.env.shutdown('reboot')

    # More iterations remain; the handler is queued on on_ui_startup rather
    # than run here.
    self.on_ui_startup.append(handler)
Hung-Te Linf2f78f72012-02-08 19:27:11 +0800505
Jon Salz0697cbf2012-07-04 15:14:04 +0800506 def _prompt_cancel_shutdown(self, test, iteration):
507 if self.options.ui != 'chrome':
508 return False
Hung-Te Linf2f78f72012-02-08 19:27:11 +0800509
Jon Salz0697cbf2012-07-04 15:14:04 +0800510 pending_shutdown_data = {
511 'delay_secs': test.delay_secs,
512 'time': time.time() + test.delay_secs,
513 'operation': test.operation,
514 'iteration': iteration,
515 'iterations': test.iterations,
516 }
Hung-Te Linf2f78f72012-02-08 19:27:11 +0800517
Jon Salz0697cbf2012-07-04 15:14:04 +0800518 # Create a new (threaded) event client since we
519 # don't want to use the event loop for this.
520 with EventClient() as event_client:
521 event_client.post_event(Event(Event.Type.PENDING_SHUTDOWN,
522 **pending_shutdown_data))
523 aborted = event_client.wait(
524 lambda event: event.type == Event.Type.CANCEL_SHUTDOWN,
525 timeout=test.delay_secs) is not None
526 if aborted:
527 event_client.post_event(Event(Event.Type.PENDING_SHUTDOWN))
528 return aborted
Jon Salz258a40c2012-04-19 12:34:01 +0800529
def init_states(self):
  '''Initializes all test states on startup.

  Registers every test with the state server, then resolves each leaf test
  that is still marked active: shutdown steps are passed to
  handle_shutdown_complete(), and any other test is failed as an unexpected
  shutdown.  Finally the skipped states are refreshed.
  '''
  for test in self.test_list.get_all_tests():
    # Make sure the state server knows about all the tests,
    # defaulting to an untested state.
    test.update_state(update_parent=False, visible=False)

  # Diagnostics are gathered lazily, the first time an unexpected shutdown
  # is found.
  messages_tail = None
  mosys_events = None
  ec_console = None
  ec_panic = None

  # Any 'active' tests should be marked as failed now.
  for test in self.test_list.walk():
    if not test.is_leaf():
      # Don't bother with parents; they will be updated when their
      # children are updated.
      continue

    test_state = test.get_state()
    if test_state.status != TestState.ACTIVE:
      continue

    if isinstance(test, factory.ShutdownStep):
      # Shutdown while the test was active - that's good.
      self.handle_shutdown_complete(test, test_state)
      continue

    # Unexpected shutdown.  Grab /var/log/messages for context.
    if messages_tail is None:
      try:
        messages_tail = utils.var_log_messages_before_reboot()
        # Write it to the log, to make it easier to
        # correlate with /var/log/messages.
        logging.info(
            'Unexpected shutdown.  '
            'Tail of /var/log/messages before last reboot:\n%s',
            '\n'.join(' ' + x for x in messages_tail))
      except: # pylint: disable=W0702
        logging.exception('Unable to grok /var/log/messages')
        messages_tail = []

    if mosys_events is None and not utils.in_chroot():
      try:
        mosys_events = utils.Spawn(
            ['mosys', 'eventlog', 'list'],
            read_stdout=True, log_stderr_on_error=True).stdout_data
        # Write it to the log also.
        logging.info('System eventlog from mosys:\n%s\n', mosys_events)
      except: # pylint: disable=W0702
        logging.exception('Unable to read mosys eventlog')

    if ec_console is None:
      try:
        board = system.GetBoard()
        ec_console = board.GetECConsoleLog()
        logging.info('EC console log after reboot:\n%s\n', ec_console)
      except: # pylint: disable=W0702
        logging.exception('Error retrieving EC console log')

    if ec_panic is None:
      try:
        board = system.GetBoard()
        ec_panic = board.GetECPanicInfo()
        logging.info('EC panic info after reboot:\n%s\n', ec_panic)
      except: # pylint: disable=W0702
        logging.exception('Error retrieving EC panic info')

    error_msg = 'Unexpected shutdown while test was running'
    self.event_log.Log('end_test',
                       path=test.path,
                       status=TestState.FAILED,
                       invocation=test.get_state().invocation,
                       error_msg=error_msg,
                       var_log_messages='\n'.join(messages_tail),
                       mosys_log=mosys_events)
    test.update_state(
        status=TestState.FAILED,
        error_msg=error_msg)

    if not test.never_fails:
      # For "never_fails" tests (such as "Start"), don't cancel
      # pending tests, since reboot is expected.
      factory.console.info('Unexpected shutdown while test %s '
                           'running; cancelling any pending tests',
                           test.path)
      self.state_instance.set_shared_data('tests_after_shutdown', [])

  self.update_skipped_tests()
621
def update_skipped_tests(self):
  '''Updates skipped states based on run_if.

  Only leaf tests that have a run_if expression or a run_if table are
  considered.  A test whose run_if value cannot be determined is never
  skipped.
  '''
  env = TestArgEnv()
  for t in self.test_list.walk():
    if not (t.is_leaf() and (t.run_if_table_name or t.run_if_expr)):
      continue

    value = None
    if t.run_if_expr:
      try:
        value = t.run_if_expr(env)
      except: # pylint: disable=W0702
        logging.exception('Unable to evaluate run_if expression for %s',
                          t.path)
        # But keep going; we have no choice.  This will end up
        # always activating the test.
    else:
      try:
        aux = shopfloor.get_selected_aux_data(t.run_if_table_name)
        value = aux.get(t.run_if_col)
      except ValueError:
        # Not available; assume it shouldn't be skipped
        pass

    skip = False if value is None else ((not value) ^ t.run_if_not)

    test_state = t.get_state()
    if skip or not (test_state.status == TestState.PASSED and
                    test_state.error_msg == TestState.SKIPPED_MSG):
      t.update_state(skip=skip)
    else:
      # It was marked as skipped before, but now we need to run it.
      # Mark as untested.
      t.update_state(skip=skip, status=TestState.UNTESTED, error_msg='')
661
def show_next_active_test(self):
  '''Rotates to the next visible active test.

  Completed tests are reaped first.  If the currently visible test is not
  among the active leaf tests, the first active test is chosen; with no
  active tests at all, nothing changes.
  '''
  self.reap_completed_tests()

  def is_active_leaf(t):
    return t.is_leaf() and t.get_state().status == TestState.ACTIVE

  active_tests = [t for t in self.test_list.walk() if is_active_leaf(t)]
  if not active_tests:
    return

  try:
    current = active_tests.index(self.visible_test)
  except ValueError: # visible_test not present in active_tests
    next_test = active_tests[0]
  else:
    next_test = active_tests[(current + 1) % len(active_tests)]

  self.set_visible_test(next_test)
Jon Salz4f6c7172012-06-11 20:45:36 +0800680
def handle_event(self, event):
  '''
  Dispatches an event from the event server to its registered handler.

  Args:
    event: The event; its "type" attribute selects the handler in
      self.event_handlers.
  '''
  callback = self.event_handlers.get(event.type)
  if not callback:
    # Handlers are not registered for every event type; such events are
    # simply ignored.
    logging.debug('Unbound event type %s', event.type)
    return
  callback(event)
Jon Salz4f6c7172012-06-11 20:45:36 +0800692
def check_critical_factory_note(self):
  '''
  Returns True if the last factory note is critical.

  Returns:
    True if the 'factory_note' shared data holds at least one note and the
    most recent (last) one has level 'CRITICAL'; False otherwise, including
    when there are no notes at all.
  '''
  notes = self.state_instance.get_shared_data('factory_note', True)
  if not notes:
    # Missing or empty note list: report a real boolean rather than
    # leaking None/[] to the caller.
    return False
  return notes[-1]['level'] == 'CRITICAL'
699
def run_next_test(self):
  '''
  Starts as many tests from the head of self.tests_to_run as may run now.

  Completed tests are reaped first.  If the last factory note is critical
  the queue is emptied and nothing is started.  Otherwise tests are taken
  from the front of the queue until one has to wait (it is already running,
  something it requires is still active, or it cannot share the machine
  with the tests currently running) or the queue is empty.  Skipped tests
  are passed without running, tests whose requirements are unmet are
  failed (except in engineering mode), and shutdown steps are handled
  inline.
  '''
  self.reap_completed_tests()
  if self.tests_to_run and self.check_critical_factory_note():
    self.tests_to_run.clear()
    return

  while self.tests_to_run:
    logging.debug('Tests to run: %s',
                  [queued.path for queued in self.tests_to_run])

    test = self.tests_to_run[0]

    if test in self.invocations:
      logging.info('Next test %s is already running', test.path)
      self.tests_to_run.popleft()
      return

    # Wait while anything under a required test is still running.
    for requirement in test.require_run:
      for node in requirement.test.walk():
        if node.get_state().status == TestState.ACTIVE:
          logging.info('Waiting for active test %s to complete '
                       'before running %s', node.path, test.path)
          return

    if self.invocations:
      # Tests may only overlap when the candidate and every running test
      # are backgroundable.
      can_overlap = test.backgroundable and all(
          [running.backgroundable for running in self.invocations])
      if not can_overlap:
        logging.debug('Waiting for non-backgroundable tests to '
                      'complete before running %s', test.path)
        return

    if test.get_state().skip:
      factory.console.info('Skipping test %s', test.path)
      test.update_state(status=TestState.PASSED,
                        error_msg=TestState.SKIPPED_MSG)
      self.tests_to_run.popleft()
      continue

    self.tests_to_run.popleft()

    # For each requirement, record the first prerequisite (in walk order,
    # up to this test itself) that has not been run, or has not passed
    # when the requirement demands a pass.
    unmet = set()
    for requirement in test.require_run:
      for node in requirement.test.walk():
        if node == test:
          # Reached this test itself; stop checking this requirement.
          break
        never_run = node.get_state().status == TestState.UNTESTED
        if never_run or (requirement.passed and
                         node.get_state().status != TestState.PASSED):
          unmet.add(node)
          break

    if unmet:
      unmet_paths = ', '.join(sorted([node.path for node in unmet]))
      if not self.state_instance.get_shared_data('engineering_mode',
                                                 optional=True):
        # Not in engineering mode; mark it failed.
        error_msg = ('Required tests [%s] have not been run yet'
                     % unmet_paths)
        factory.console.error('Not running %s: %s',
                              test.path, error_msg)
        test.update_state(status=TestState.FAILED,
                          error_msg=error_msg)
        continue
      # In engineering mode the test is allowed to run anyway.
      factory.console.warn('In engineering mode; running '
                           '%s even though required tests '
                           '[%s] have not completed',
                           test.path, unmet_paths)

    if isinstance(test, factory.ShutdownStep):
      if os.path.exists(NO_REBOOT_FILE):
        test.update_state(
            status=TestState.FAILED, increment_count=1,
            error_msg=('Skipped shutdown since %s is present' %
                       NO_REBOOT_FILE))
        continue

      test.update_state(status=TestState.ACTIVE, increment_count=1,
                        error_msg='', shutdown_count=0)
      if self._prompt_cancel_shutdown(test, 1):
        self.event_log.Log('reboot_cancelled')
        test.update_state(
            status=TestState.FAILED, increment_count=1,
            error_msg='Shutdown aborted by operator',
            shutdown_count=0)
        continue

      # Persist what is still queued, plus the shutdown time, in the
      # state server.
      pending_paths = [queued.path for queued in self.tests_to_run]
      self.state_instance.set_shared_data('tests_after_shutdown',
                                          pending_paths)
      self.state_instance.set_shared_data('shutdown_time',
                                          time.time())

      with self.env.lock:
        self.event_log.Log('shutdown', operation=test.operation)
        shutdown_result = self.env.shutdown(test.operation)
      if shutdown_result:
        # Really shutting down: post None to the run queue and stop.
        self.run_queue.put(None)
        return

      # No real shutdown happened (e.g., in the chroot); just pass.
      test.update_state(status=TestState.PASSED)
      self.state_instance.set_shared_data(
          'tests_after_shutdown', None)
      # An event with no fields indicates that there is no longer a
      # pending shutdown.
      self.event_client.post_event(Event(
          Event.Type.PENDING_SHUTDOWN))
      continue

    self._run_test(test, test.iterations, test.retries)
Jon Salz1acc8742012-07-17 17:45:55 +0800819
def _run_test(self, test, iterations_left=None, retries_left=None):
  '''
  Creates, registers and starts an invocation of a single test.

  Args:
    test: The test to run.
    iterations_left: Stored in the test state as iterations_left.
    retries_left: Stored in the test state as retries_left.
  '''
  invocation = TestInvocation(self, test, on_completion=self.run_next_test)
  state = test.update_state(
      status=TestState.ACTIVE,
      increment_count=1,
      error_msg='',
      invocation=invocation.uuid,
      iterations_left=iterations_left,
      retries_left=retries_left,
      visible=(self.visible_test == test))
  invocation.count = state.count

  self.invocations[test] = invocation
  # With nothing on screen yet, show this test if it has a UI.
  if self.visible_test is None and test.has_ui:
    self.set_visible_test(test)
  self.check_exclusive()
  invocation.start()
Jon Salz5f2a0672012-05-22 17:14:06 +0800834
def check_exclusive(self):
  '''
  Applies the exclusive-resource requests of the running tests.

  Works out which EXCLUSIVE_OPTIONS are claimed by at least one running
  invocation, compares that with self.exclusive_items from the previous
  call, and reacts to the changes: networking is disabled or re-enabled,
  cpufreq services are toggled, and the charge state is adjusted unless a
  test has claimed the charger.
  '''
  # Alias, since the full name is really long.
  EXCL_OPT = factory.FactoryTest.EXCLUSIVE_OPTIONS

  claimed = set()
  for option in EXCL_OPT:
    if any([test.is_exclusive(option) for test in self.invocations]):
      claimed.add(option)

  newly_claimed = claimed - self.exclusive_items
  newly_released = self.exclusive_items - claimed

  if EXCL_OPT.NETWORKING in newly_claimed:
    logging.info('Disabling network')
    self.connection_manager.DisableNetworking()
  if EXCL_OPT.CHARGER in newly_claimed:
    logging.info('Stop controlling charger')

  if EXCL_OPT.NETWORKING in newly_released:
    logging.info('Re-enabling network')
    self.connection_manager.EnableNetworking()
  if EXCL_OPT.CHARGER in newly_released:
    logging.info('Start controlling charger')

  if self.cpufreq_manager:
    enabled = EXCL_OPT.CPUFREQ not in claimed
    try:
      self.cpufreq_manager.SetEnabled(enabled)
    except:  # pylint: disable=W0702
      logging.exception('Unable to %s cpufreq services',
                        'enable' if enabled else 'disable')

  # Leave the charge state alone while a test holds the charger, and
  # always when running in the chroot.
  if EXCL_OPT.CHARGER not in claimed and not utils.in_chroot():
    if self.charge_manager:
      self.charge_manager.AdjustChargeState()
    else:
      try:
        system.GetBoard().SetChargeState(Board.ChargeState.CHARGE)
      except BoardException:
        logging.exception('Unable to set charge state on this board')

  self.exclusive_items = claimed
Jon Salz5da61e62012-05-31 13:06:22 +0800877
def check_for_updates(self):
  '''
  Schedules an asynchronous check for updates if one is due.

  Nothing happens when the test list's update_period_secs option is unset,
  or when less than that many seconds have passed since the last check.
  Otherwise the check time is recorded and updater.CheckForUpdateAsync is
  started; if the shopfloor was reached and the reported update MD5SUM
  changed, a system info refresh is put on the run queue.
  '''
  period_secs = self.test_list.options.update_period_secs
  if not period_secs:
    # Not enabled.
    return

  now = time.time()
  if self.last_update_check and (now - self.last_update_check < period_secs):
    # Not yet time for another check.
    return

  self.last_update_check = now

  def on_update_checked(reached_shopfloor, md5sum, needs_update):
    if not reached_shopfloor:
      return
    # No MD5SUM is recorded when no update is needed.
    new_update_md5sum = md5sum if needs_update else None
    if system.SystemInfo.update_md5sum != new_update_md5sum:
      logging.info('Received new update MD5SUM: %s', new_update_md5sum)
      system.SystemInfo.update_md5sum = new_update_md5sum
      self.run_queue.put(self.update_system_info)

  updater.CheckForUpdateAsync(
      on_update_checked,
      self.test_list.options.shopfloor_timeout_secs)
906
def cancel_pending_tests(self):
  '''Cancels any queued tests by asking run_tests() to run nothing.'''
  nothing_to_run = []
  self.run_tests(nothing_to_run)
910
def run_tests(self, subtrees, untested_only=False):
  '''
  Runs tests under subtree.

  The tests are run in order unless one fails (then stops).
  Backgroundable tests are run simultaneously; when a foreground test is
  encountered, we wait for all active tests to finish before continuing.

  The run queue (self.tests_to_run) is replaced by the leaf tests found
  under the given subtrees, and run_next_test() is then called.

  @param subtrees: Node or nodes containing tests to run (may either be
    a single test or a list/tuple of tests).  Duplicates will be ignored.
  @param untested_only: If true, only tests whose status is UNTESTED are
    queued.
  '''
  # isinstance (rather than an exact type comparison) so that list
  # subclasses and tuples are treated as collections of nodes too.
  if not isinstance(subtrees, (list, tuple)):
    subtrees = [subtrees]

  # Nodes we've seen so far, to avoid duplicates.
  seen = set()

  self.tests_to_run = deque()
  for subtree in subtrees:
    for test in subtree.walk():
      if test in seen:
        continue
      seen.add(test)

      if not test.is_leaf():
        continue
      if (untested_only and
          test.get_state().status != TestState.UNTESTED):
        continue
      self.tests_to_run.append(test)
  self.run_next_test()
Hung-Te Linf2f78f72012-02-08 19:27:11 +0800942
def reap_completed_tests(self):
  '''
  Removes completed tests from the set of active tests.

  For each completed invocation the test's state is updated with the
  invocation's update_state_on_completion values and the invocation is
  dropped from self.invocations.  A test that passed with iterations left,
  or failed with retries left, is started again.  If any test completed,
  the event log watcher is kicked.

  Also updates the visible test if it was reaped.
  '''
  test_completed = False
  # Iterate over a snapshot: entries are deleted from, and (on re-runs)
  # added to, self.invocations inside the loop.
  for t, v in list(self.invocations.items()):
    if v.is_completed():
      test_completed = True
      new_state = t.update_state(**v.update_state_on_completion)
      del self.invocations[t]

      # Stop on failure if flag is true.
      if (self.test_list.options.stop_on_failure and
          new_state.status == TestState.FAILED):
        # Clean all the tests to cause goofy to stop.  Keep the queue a
        # deque, as everywhere else, so popleft()/clear() stay usable.
        self.tests_to_run = deque()
        factory.console.info("Stop on failure triggered. Empty the queue.")

      if new_state.iterations_left and new_state.status == TestState.PASSED:
        # Play it again, Sam!
        self._run_test(t)
      # new_state.retries_left is obtained after update.
      # For retries_left == 0, test can still be run for the last time.
      elif (new_state.retries_left >= 0 and
            new_state.status == TestState.FAILED):
        # Still have to retry, Sam!
        self._run_test(t)

  if test_completed:
    self.log_watcher.KickWatchThread()

  if (self.visible_test is None or
      self.visible_test not in self.invocations):
    self.set_visible_test(None)
    # Make the first running test, if any, the visible test
    for t in self.test_list.walk():
      if t in self.invocations:
        self.set_visible_test(t)
        break
984
def kill_active_tests(self, abort, root=None, reason=None):
  '''
  Kills and waits for all active tests.

  Completed tests are reaped before and after the kill.

  Args:
    abort: True to keep the state reported by the killed invocation
      (FAILED, per the original documentation); False to reset each
      killed test to UNTESTED.
    root: If set, only kills tests with root as an ancestor.
    reason: Passed to each killed invocation's abort_and_join().
  '''
  self.reap_completed_tests()
  # Iterate over a snapshot, since entries are deleted from
  # self.invocations inside the loop.
  for test, invoc in list(self.invocations.items()):
    if root and not test.has_ancestor(root):
      continue

    factory.console.info('Killing active test %s...' % test.path)
    invoc.abort_and_join(reason)
    factory.console.info('Killed %s' % test.path)
    test.update_state(**invoc.update_state_on_completion)
    del self.invocations[test]

    if not abort:
      test.update_state(status=TestState.UNTESTED)
  self.reap_completed_tests()
1008
def stop(self, root=None, fail=False, reason=None):
  '''
  Kills active tests and drops queued ones, then runs whatever is left.

  Args:
    root: If set, only tests with root as an ancestor are killed and
      removed from the run queue; otherwise the whole queue is emptied.
    fail: Passed to kill_active_tests() as its "abort" argument.
    reason: Passed through to kill_active_tests().
  '''
  self.kill_active_tests(fail, root, reason)

  # Keep only the queued tests that are not under the root; without a root
  # nothing is kept.
  survivors = deque()
  for queued in self.tests_to_run:
    if root and not queued.has_ancestor(root):
      survivors.append(queued)
  self.tests_to_run = survivors

  self.run_next_test()
Jon Salz0697cbf2012-07-04 15:14:04 +08001015
def clear_state(self, root=None):
  '''
  Stops the tests under root and resets every leaf test there to UNTESTED.

  Args:
    root: Subtree to clear; the whole test list when None.
  '''
  subtree = self.test_list if root is None else root
  self.stop(subtree, reason='Clearing test state')
  for node in subtree.walk():
    if not node.is_leaf():
      continue
    node.update_state(status=TestState.UNTESTED)
1023
def abort_active_tests(self, reason=None):
  '''
  Kills all active tests with the "abort" flag set.

  Args:
    reason: Passed through to kill_active_tests().
  '''
  abort = True
  self.kill_active_tests(abort, reason=reason)
Jon Salz0697cbf2012-07-04 15:14:04 +08001026
def main(self):
  '''
  Initializes Goofy and then enters self.run().

  The outcome of initialization is recorded as a 'goofy_init' event.  If
  initialization fails, the failure is logged on a best-effort basis (with
  the traceback) and the exception is re-raised.
  '''
  syslog.openlog('goofy')

  try:
    self.status = Status.INITIALIZING
    self.init()
    self.event_log.Log('goofy_init',
                       success=True)
  except:
    if self.event_log:
      try:
        failure_trace = traceback.format_exc()
        self.event_log.Log('goofy_init',
                           success=False,
                           trace=failure_trace)
      except:  # pylint: disable=W0702
        # Failing to log must not get in the way of the re-raise below.
        pass
    raise

  self.status = Status.RUNNING
  syslog.syslog('Goofy (factory test harness) starting')
  self.run()
1048
def update_system_info(self):
  '''Collects system info and publishes it.

  The attributes of a fresh system.SystemInfo are stored as the
  'system_info' shared data, posted in a SYSTEM_INFO event, and logged.
  '''
  info_dict = system.SystemInfo().__dict__
  self.state_instance.set_shared_data('system_info', info_dict)
  info_event = Event(Event.Type.SYSTEM_INFO, system_info=info_dict)
  self.event_client.post_event(info_event)
  logging.info('System info: %r', info_dict)
1056
def update_factory(self, auto_run_on_restart=False, post_update_hook=None):
  '''Commences updating factory software.

  Active tests are killed (and reset to UNTESTED) and pending tests are
  cancelled before the update is attempted.

  Args:
    auto_run_on_restart: Auto-run when the machine comes back up.
    post_update_hook: Code to call after update but immediately before
      restart.

  Returns:
    Never if the update was successful (we just reboot).
    False if the update was unnecessary (no update available).
  '''
  self.kill_active_tests(False, reason='Factory software update')
  self.cancel_pending_tests()

  def pre_update_hook():
    if auto_run_on_restart:
      self.state_instance.set_shared_data('tests_after_shutdown',
                                          FORCE_AUTO_RUN)
    self.state_instance.close()

  if not updater.TryUpdate(pre_update_hook=pre_update_hook):
    # Nothing was updated; say so explicitly, as documented, instead of
    # falling off the end and returning None.
    return False

  if post_update_hook:
    post_update_hook()
  self.env.shutdown('reboot')
Jon Salz0697cbf2012-07-04 15:14:04 +08001082
def handle_sigint(self, dummy_signum, dummy_frame):
  '''
  Signal handler for SIGINT.

  Logs the signal, puts None on the run queue, and raises
  KeyboardInterrupt.  Both arguments are ignored.
  '''
  logging.error('Received SIGINT')
  self.run_queue.put(None)
  raise KeyboardInterrupt
1087
def find_kcrashes(self):
  """Logs crash files that have not been seen before and remembers them.

  Every regular file in /var/spool/crash whose path is not in the
  'seen_crashes' shared data is logged and reported as a 'crash_file'
  event.  For .kcrash and .meta files the contents (up to
  MAX_CRASH_FILE_SIZE) are logged and attached to the event as well, and
  the file is copied into the factory 'kcrash' directory.  Each path is
  recorded as seen even if handling it failed.
  """
  previously_seen = self.state_instance.get_shared_data(
      'seen_crashes', optional=True)
  seen_crashes = set(previously_seen or [])

  for path in glob.glob('/var/spool/crash/*'):
    if not os.path.isfile(path) or path in seen_crashes:
      continue

    try:
      info = os.stat(path)
      mtime = utils.TimeString(info.st_mtime)
      logging.info(
          'Found new crash file %s (%d bytes at %s)',
          path, info.st_size, mtime)
      extra_log_args = {}

      try:
        suffix = os.path.splitext(path)[1]
        if suffix in ['.kcrash', '.meta']:
          tag = suffix.replace('.', '')
          with open(path) as crash_file:
            data = crash_file.read(MAX_CRASH_FILE_SIZE)
            bytes_read = crash_file.tell()

          if bytes_read == info.st_size:
            truncation_note = ''
          else:
            truncation_note = (
                '(truncated to %d bytes)' % MAX_CRASH_FILE_SIZE)
          # Every line of the dump is prefixed with "<tag>> ".
          logging.info(
              'Contents of %s%s:%s',
              path,
              truncation_note,
              ('\n' + data).replace('\n', '\n ' + tag + '> '))
          extra_log_args['data'] = data

          # Keep a copy under the factory root for posterity.
          kcrash_dir = factory.get_factory_root('kcrash')
          utils.TryMakeDirs(kcrash_dir)
          shutil.copy(path, kcrash_dir)
          logging.info('Copied to %s',
                       os.path.join(kcrash_dir, os.path.basename(path)))
      finally:
        # Whatever went wrong above, still try to get the crash into the
        # event log.
        self.event_log.Log('crash_file',
                           path=path, size=info.st_size, mtime=mtime,
                           **extra_log_args)
    except:  # pylint: disable=W0702
      logging.exception('Unable to handle crash files %s', path)
    seen_crashes.add(path)

  self.state_instance.set_shared_data('seen_crashes', list(seen_crashes))
1139
def GetTestList(self, test_list_id):
  """Looks up one of the loaded test lists by ID.

  Args:
    test_list_id: Key into self.test_lists.

  Returns:
    The test list stored under that ID.

  Raises:
    TestListError: The test list ID is not valid.  The message lists the
      available IDs.
  """
  try:
    found = self.test_lists[test_list_id]
  except KeyError:
    available_ids = ', '.join(sorted(self.test_lists.keys()))
    raise test_lists.TestListError(
        '%r is not a valid test list ID (available IDs are [%s])' % (
            test_list_id, available_ids))
  return found
1152
def InitTestLists(self):
  """Loads all test lists and selects the active one into self.test_list.

  The test list named by the test_list option is used, defaulting to the
  active test list ID.  A value containing a path separator is read as an
  old-style test list file; anything else is looked up by ID.
  """
  self.test_lists = test_lists.BuildAllTestLists()
  logging.info('Loaded test lists: [%s]',
               test_lists.DescribeTestLists(self.test_lists))

  if not self.options.test_list:
    self.options.test_list = test_lists.GetActiveTestListId()
  selected = self.options.test_list

  # A path separator means a path to an old-style test list, not an ID.
  self.test_list = (factory.read_test_list(selected)
                    if os.sep in selected
                    else self.GetTestList(selected))

  logging.info('Active test list: %s', self.test_list.test_list_id)

  if isinstance(self.test_list, test_lists.OldStyleTestList):
    # Actually load it in.  (See OldStyleTestList for an explanation of
    # why this is necessary.)
    self.test_list = self.test_list.Load()

  self.test_list.state_instance = self.state_instance
1176
def init_hooks(self):
  """Creates the hooks object named by the test list options.

  The hooks_class option is a dotted "module.Class" path; the class is
  imported, instantiated with no arguments, given the test list, and its
  OnCreatedTestList() is called.

  Must run after self.test_list is ready.
  """
  module_name, class_name = (
      self.test_list.options.hooks_class.rsplit('.', 1))
  hooks_module = __import__(module_name, fromlist=[class_name])
  hooks_class = getattr(hooks_module, class_name)
  self.hooks = hooks_class()
  assert isinstance(self.hooks, factory.Hooks), (
      "hooks should be of type Hooks but is %r" % type(self.hooks))
  self.hooks.test_list = self.test_list
  self.hooks.OnCreatedTestList()
Shuo-Peng Liao52b90da2013-06-30 17:00:06 +08001188
Jon Salz0697cbf2012-07-04 15:14:04 +08001189 def init(self, args=None, env=None):
1190 '''Initializes Goofy.
1191
1192 Args:
1193 args: A list of command-line arguments. Uses sys.argv if
1194 args is None.
1195 env: An Environment instance to use (or None to choose
1196 FakeChrootEnvironment or DUTEnvironment as appropriate).
1197 '''
Jon Salz77c151e2012-08-28 07:20:37 +08001198 signal.signal(signal.SIGINT, self.handle_sigint)
1199
Jon Salz0697cbf2012-07-04 15:14:04 +08001200 parser = OptionParser()
1201 parser.add_option('-v', '--verbose', dest='verbose',
Jon Salz8fa8e832012-07-13 19:04:09 +08001202 action='store_true',
1203 help='Enable debug logging')
Jon Salz0697cbf2012-07-04 15:14:04 +08001204 parser.add_option('--print_test_list', dest='print_test_list',
Jon Salz8fa8e832012-07-13 19:04:09 +08001205 metavar='FILE',
1206 help='Read and print test list FILE, and exit')
Jon Salz0697cbf2012-07-04 15:14:04 +08001207 parser.add_option('--restart', dest='restart',
Jon Salz8fa8e832012-07-13 19:04:09 +08001208 action='store_true',
1209 help='Clear all test state')
Jon Salz0697cbf2012-07-04 15:14:04 +08001210 parser.add_option('--ui', dest='ui', type='choice',
Jon Salz8fa8e832012-07-13 19:04:09 +08001211 choices=['none', 'gtk', 'chrome'],
Jon Salz2f881df2013-02-01 17:00:35 +08001212 default='chrome',
Jon Salz8fa8e832012-07-13 19:04:09 +08001213 help='UI to use')
Jon Salz0697cbf2012-07-04 15:14:04 +08001214 parser.add_option('--ui_scale_factor', dest='ui_scale_factor',
Jon Salz8fa8e832012-07-13 19:04:09 +08001215 type='int', default=1,
1216 help=('Factor by which to scale UI '
1217 '(Chrome UI only)'))
Jon Salz0697cbf2012-07-04 15:14:04 +08001218 parser.add_option('--test_list', dest='test_list',
Jon Salz8fa8e832012-07-13 19:04:09 +08001219 metavar='FILE',
1220 help='Use FILE as test list')
Jon Salzc79a9982012-08-30 04:42:01 +08001221 parser.add_option('--dummy_shopfloor', action='store_true',
1222 help='Use a dummy shopfloor server')
chungyiafe8f772012-08-15 19:36:29 +08001223 parser.add_option('--automation', dest='automation',
1224 action='store_true',
1225 help='Enable automation on running factory test')
Jon Salz0697cbf2012-07-04 15:14:04 +08001226 (self.options, self.args) = parser.parse_args(args)
1227
Jon Salz46b89562012-07-05 11:49:22 +08001228 # Make sure factory directories exist.
1229 factory.get_log_root()
1230 factory.get_state_root()
1231 factory.get_test_data_root()
1232
Jon Salz0697cbf2012-07-04 15:14:04 +08001233 global _inited_logging # pylint: disable=W0603
1234 if not _inited_logging:
1235 factory.init_logging('goofy', verbose=self.options.verbose)
1236 _inited_logging = True
Jon Salz8fa8e832012-07-13 19:04:09 +08001237
Jon Salz0f996602012-10-03 15:26:48 +08001238 if self.options.print_test_list:
1239 print factory.read_test_list(
1240 self.options.print_test_list).__repr__(recursive=True)
1241 sys.exit(0)
1242
Jon Salzee85d522012-07-17 14:34:46 +08001243 event_log.IncrementBootSequence()
Jon Salzd15bbcf2013-05-21 17:33:57 +08001244 # Don't defer logging the initial event, so we can make sure
1245 # that device_id, reimage_id, etc. are all set up.
1246 self.event_log = EventLog('goofy', defer=False)
Jon Salz0697cbf2012-07-04 15:14:04 +08001247
1248 if (not suppress_chroot_warning and
1249 factory.in_chroot() and
1250 self.options.ui == 'gtk' and
1251 os.environ.get('DISPLAY') in [None, '', ':0', ':0.0']):
1252 # That's not going to work! Tell the user how to run
1253 # this way.
1254 logging.warn(GOOFY_IN_CHROOT_WARNING)
1255 time.sleep(1)
1256
1257 if env:
1258 self.env = env
1259 elif factory.in_chroot():
1260 self.env = test_environment.FakeChrootEnvironment()
1261 logging.warn(
1262 'Using chroot environment: will not actually run autotests')
1263 else:
1264 self.env = test_environment.DUTEnvironment()
1265 self.env.goofy = self
1266
1267 if self.options.restart:
1268 state.clear_state()
1269
Jon Salz0697cbf2012-07-04 15:14:04 +08001270 if self.options.ui_scale_factor != 1 and utils.in_qemu():
1271 logging.warn(
1272 'In QEMU; ignoring ui_scale_factor argument')
1273 self.options.ui_scale_factor = 1
1274
1275 logging.info('Started')
1276
1277 self.start_state_server()
1278 self.state_instance.set_shared_data('hwid_cfg', get_hwid_cfg())
1279 self.state_instance.set_shared_data('ui_scale_factor',
Ricky Liang09216dc2013-02-22 17:26:45 +08001280 self.options.ui_scale_factor)
Jon Salz0697cbf2012-07-04 15:14:04 +08001281 self.last_shutdown_time = (
1282 self.state_instance.get_shared_data('shutdown_time', optional=True))
1283 self.state_instance.del_shared_data('shutdown_time', optional=True)
Jon Salzb19ea072013-02-07 16:35:00 +08001284 self.state_instance.del_shared_data('startup_error', optional=True)
Jon Salz0697cbf2012-07-04 15:14:04 +08001285
Jon Salz128b0932013-07-03 16:55:26 +08001286 try:
1287 self.InitTestLists()
1288 except: # pylint: disable=W0702
1289 logging.exception('Unable to initialize test lists')
1290 self.state_instance.set_shared_data(
1291 'startup_error',
1292 'Unable to initialize test lists\n%s' % (
1293 traceback.format_exc()))
Jon Salzb19ea072013-02-07 16:35:00 +08001294 if self.options.ui == 'chrome':
1295 # Create an empty test list with default options so that the rest of
1296 # startup can proceed.
1297 self.test_list = factory.FactoryTestList(
1298 [], self.state_instance, factory.Options())
1299 else:
1300 # Bail with an error; no point in starting up.
1301 sys.exit('No valid test list; exiting.')
1302
Shuo-Peng Liao268b40b2013-07-01 15:58:59 +08001303 self.init_hooks()
1304
Jon Salz822838b2013-03-25 17:32:33 +08001305 if self.test_list.options.clear_state_on_start:
1306 self.state_instance.clear_test_state()
1307
Vic Yang3e1cf5d2013-06-05 18:50:24 +08001308 if system.SystemInfo().firmware_version is None and not utils.in_chroot():
Vic Yang9bd4f772013-06-04 17:34:00 +08001309 self.state_instance.set_shared_data('startup_error',
1310 'Netboot firmware detected\n'
1311 'Connect Ethernet and reboot to re-image.\n'
1312 u'侦测到网路开机固件\n'
1313 u'请连接乙太网并重启')
1314
Jon Salz0697cbf2012-07-04 15:14:04 +08001315 if not self.state_instance.has_shared_data('ui_lang'):
1316 self.state_instance.set_shared_data('ui_lang',
1317 self.test_list.options.ui_lang)
1318 self.state_instance.set_shared_data(
1319 'test_list_options',
1320 self.test_list.options.__dict__)
1321 self.state_instance.test_list = self.test_list
1322
Cheng-Yi Chiang39d32ad2013-07-23 15:02:38 +08001323 self.check_log_rotation()
Jon Salz83ef34b2012-11-01 19:46:35 +08001324
Jon Salz23926422012-09-01 03:38:13 +08001325 if self.options.dummy_shopfloor:
1326 os.environ[shopfloor.SHOPFLOOR_SERVER_ENV_VAR_NAME] = (
1327 'http://localhost:%d/' % shopfloor.DEFAULT_SERVER_PORT)
1328 self.dummy_shopfloor = Spawn(
1329 [os.path.join(factory.FACTORY_PATH, 'bin', 'shopfloor_server'),
1330 '--dummy'])
1331 elif self.test_list.options.shopfloor_server_url:
1332 shopfloor.set_server_url(self.test_list.options.shopfloor_server_url)
Jon Salz2bf2f6b2013-03-28 18:49:26 +08001333 shopfloor.set_enabled(True)
Jon Salz23926422012-09-01 03:38:13 +08001334
Jon Salz0f996602012-10-03 15:26:48 +08001335 if self.test_list.options.time_sanitizer and not utils.in_chroot():
Jon Salz8fa8e832012-07-13 19:04:09 +08001336 self.time_sanitizer = time_sanitizer.TimeSanitizer(
1337 base_time=time_sanitizer.GetBaseTimeFromFile(
1338 # lsb-factory is written by the factory install shim during
1339 # installation, so it should have a good time obtained from
Jon Salz54882d02012-08-31 01:57:54 +08001340 # the mini-Omaha server. If it's not available, we'll use
1341 # /etc/lsb-factory (which will be much older, but reasonably
1342 # sane) and rely on a shopfloor sync to set a more accurate
1343 # time.
1344 '/usr/local/etc/lsb-factory',
1345 '/etc/lsb-release'))
Jon Salz8fa8e832012-07-13 19:04:09 +08001346 self.time_sanitizer.RunOnce()
1347
Vic Yangd8990da2013-06-27 16:57:43 +08001348 if self.test_list.options.check_cpu_usage_period_secs:
1349 self.cpu_usage_watcher = Spawn(['py/tools/cpu_usage_monitor.py',
1350 '-p', str(self.test_list.options.check_cpu_usage_period_secs)],
1351 cwd=factory.FACTORY_PATH)
1352
Jon Salz0697cbf2012-07-04 15:14:04 +08001353 self.init_states()
1354 self.start_event_server()
1355 self.connection_manager = self.env.create_connection_manager(
Tai-Hsu Lin371351a2012-08-27 14:17:14 +08001356 self.test_list.options.wlans,
1357 self.test_list.options.scan_wifi_period_secs)
Jon Salz0697cbf2012-07-04 15:14:04 +08001358 # Note that we create a log watcher even if
1359 # sync_event_log_period_secs isn't set (no background
1360 # syncing), since we may use it to flush event logs as well.
1361 self.log_watcher = EventLogWatcher(
1362 self.test_list.options.sync_event_log_period_secs,
Jon Salzd15bbcf2013-05-21 17:33:57 +08001363 event_log_db_file=None,
Jon Salz16d10542012-07-23 12:18:45 +08001364 handle_event_logs_callback=self.handle_event_logs)
Jon Salz0697cbf2012-07-04 15:14:04 +08001365 if self.test_list.options.sync_event_log_period_secs:
1366 self.log_watcher.StartWatchThread()
1367
Cheng-Yi Chiang344b10f2013-05-03 16:44:03 +08001368 # Note that we create a system log manager even if
1369 # sync_log_period_secs isn't set (no background
1370 # syncing), since we may kick it to sync logs in its
1371 # thread.
Cheng-Yi Chiangd3516a32013-07-17 15:30:47 +08001372 if self.test_list.options.enable_sync_log:
1373 self.system_log_manager = SystemLogManager(
1374 sync_log_paths=self.test_list.options.sync_log_paths,
1375 sync_period_sec=self.test_list.options.sync_log_period_secs,
1376 clear_log_paths=self.test_list.options.clear_log_paths)
1377 self.system_log_manager.StartSyncThread()
Cheng-Yi Chiang344b10f2013-05-03 16:44:03 +08001378
Jon Salz0697cbf2012-07-04 15:14:04 +08001379 self.update_system_info()
1380
Vic Yang4953fc12012-07-26 16:19:53 +08001381 assert ((self.test_list.options.min_charge_pct is None) ==
1382 (self.test_list.options.max_charge_pct is None))
Vic Yange83d9a12013-04-19 20:00:20 +08001383 if utils.in_chroot():
1384 logging.info('In chroot, ignoring charge manager and charge state')
1385 elif self.test_list.options.min_charge_pct is not None:
Vic Yang4953fc12012-07-26 16:19:53 +08001386 self.charge_manager = ChargeManager(self.test_list.options.min_charge_pct,
1387 self.test_list.options.max_charge_pct)
Jon Salzad7353b2012-10-15 16:22:46 +08001388 system.SystemStatus.charge_manager = self.charge_manager
Cheng-Yi Chiangd8186952013-04-04 23:41:14 +08001389 else:
1390 # Goofy should set charger state to charge if charge_manager is disabled.
1391 try:
1392 system.GetBoard().SetChargeState(Board.ChargeState.CHARGE)
1393 except BoardException:
1394 logging.exception('Unable to set charge state on this board')
Vic Yang4953fc12012-07-26 16:19:53 +08001395
Cheng-Yi Chiangcdfa4182013-05-05 03:20:19 +08001396 self.core_dump_manager = CoreDumpManager(
1397 self.test_list.options.core_dump_watchlist)
1398
Jon Salz0697cbf2012-07-04 15:14:04 +08001399 os.environ['CROS_FACTORY'] = '1'
1400 os.environ['CROS_DISABLE_SITE_SYSINFO'] = '1'
1401
1402 # Set CROS_UI since some behaviors in ui.py depend on the
1403 # particular UI in use. TODO(jsalz): Remove this (and all
1404 # places it is used) when the GTK UI is removed.
1405 os.environ['CROS_UI'] = self.options.ui
1406
Shuo-Peng Liao1ff502e2013-06-30 18:37:02 +08001407 if not utils.in_chroot() and self.test_list.options.use_cpufreq_manager:
Jon Salzddf0d052013-06-18 12:52:44 +08001408 self.cpufreq_manager = CpufreqManager(event_log=self.event_log)
Jon Salzce6a7f82013-06-10 18:22:54 +08001409
Justin Chuang31b02432013-06-27 15:16:51 +08001410 # Startup hooks may want to skip some tests.
1411 self.update_skipped_tests()
Jon Salz416f9cc2013-05-10 18:32:50 +08001412
Jon Salze12c2b32013-06-25 16:24:34 +08001413 self.find_kcrashes()
1414
Shuo-Peng Liao268b40b2013-07-01 15:58:59 +08001415 # Should not move earlier.
1416 self.hooks.OnStartup()
1417
Jon Salz0697cbf2012-07-04 15:14:04 +08001418 if self.options.ui == 'chrome':
1419 self.env.launch_chrome()
1420 logging.info('Waiting for a web socket connection')
Cheng-Yi Chiangfd8ed392013-03-08 21:37:31 +08001421 self.web_socket_manager.wait()
Jon Salz0697cbf2012-07-04 15:14:04 +08001422
1423 # Wait for the test widget size to be set; this is done in
1424 # an asynchronous RPC so there is a small chance that the
1425 # web socket might be opened first.
1426 for _ in range(100): # 10 s
1427 try:
1428 if self.state_instance.get_shared_data('test_widget_size'):
1429 break
Hung-Te Linf2f78f72012-02-08 19:27:11 +08001430 except KeyError:
Jon Salz0697cbf2012-07-04 15:14:04 +08001431 pass # Retry
1432 time.sleep(0.1) # 100 ms
1433 else:
1434 logging.warn('Never received test_widget_size from UI')
Jon Salz45297282013-05-18 14:31:47 +08001435
1436 # Send Chrome a Tab to get focus to the factory UI
1437 # (http://crosbug.com/p/19444). TODO(jsalz): remove this hack
1438 # and figure out the right way to get the focus to Chrome.
1439 if not utils.in_chroot():
Ricky Liangb97f3652013-08-20 17:30:28 +08001440 utils.SendKey('Tab')
Jon Salz0697cbf2012-07-04 15:14:04 +08001441 elif self.options.ui == 'gtk':
1442 self.start_ui()
Hung-Te Linf2f78f72012-02-08 19:27:11 +08001443
Ricky Liang650f6bf2012-09-28 13:22:54 +08001444 # Create download path for autotest beforehand or autotests run at
1445 # the same time might fail due to race condition.
1446 if not factory.in_chroot():
1447 utils.TryMakeDirs(os.path.join('/usr/local/autotest', 'tests',
1448 'download'))
1449
Jon Salz0697cbf2012-07-04 15:14:04 +08001450 def state_change_callback(test, test_state):
1451 self.event_client.post_event(
1452 Event(Event.Type.STATE_CHANGE,
1453 path=test.path, state=test_state))
1454 self.test_list.state_change_callback = state_change_callback
Jon Salz73e0fd02012-04-04 11:46:38 +08001455
Jon Salza6711d72012-07-18 14:33:03 +08001456 for handler in self.on_ui_startup:
1457 handler()
1458
1459 self.prespawner = Prespawner()
1460 self.prespawner.start()
1461
Jon Salz0697cbf2012-07-04 15:14:04 +08001462 try:
1463 tests_after_shutdown = self.state_instance.get_shared_data(
1464 'tests_after_shutdown')
1465 except KeyError:
1466 tests_after_shutdown = None
Jon Salz57717ca2012-04-04 16:47:25 +08001467
Jon Salz5c344f62012-07-13 14:31:16 +08001468 force_auto_run = (tests_after_shutdown == FORCE_AUTO_RUN)
1469 if not force_auto_run and tests_after_shutdown is not None:
Jon Salz0697cbf2012-07-04 15:14:04 +08001470 logging.info('Resuming tests after shutdown: %s',
1471 tests_after_shutdown)
Jon Salz0697cbf2012-07-04 15:14:04 +08001472 self.tests_to_run.extend(
1473 self.test_list.lookup_path(t) for t in tests_after_shutdown)
1474 self.run_queue.put(self.run_next_test)
1475 else:
Jon Salz5c344f62012-07-13 14:31:16 +08001476 if force_auto_run or self.test_list.options.auto_run_on_start:
Jon Salz0697cbf2012-07-04 15:14:04 +08001477 self.run_queue.put(
1478 lambda: self.run_tests(self.test_list, untested_only=True))
Jon Salz5c344f62012-07-13 14:31:16 +08001479 self.state_instance.set_shared_data('tests_after_shutdown', None)
Hung-Te Linf2f78f72012-02-08 19:27:11 +08001480
Dean Liao592e4d52013-01-10 20:06:39 +08001481 self.may_disable_cros_shortcut_keys()
1482
def may_disable_cros_shortcut_keys(self):
  '''Starts a key filter if the test list disables ChromeOS shortcut keys.

  Does nothing unless test_list.options.disable_cros_shortcut_keys is
  set. Otherwise a KeyFilter is built from the disable_caps_lock and
  caps_lock_keycode options, stored in self.key_filter, and started.
  '''
  options = self.test_list.options
  if not options.disable_cros_shortcut_keys:
    return

  logging.info('Filter ChromeOS shortcut keys.')
  # Store the filter on self before starting it, so the attribute is set
  # even if Start() fails.
  self.key_filter = KeyFilter(
      unmap_caps_lock=options.disable_caps_lock,
      caps_lock_keycode=options.caps_lock_keycode)
  self.key_filter.Start()
1491
def run(self):
  '''Runs Goofy's event loop until run_once() asks to shut down.'''
  # Each pass calls run_once() in blocking mode; a false return value
  # ends the loop.
  keep_going = True
  while keep_going:
    keep_going = self.run_once(True)
Jon Salz73e0fd02012-04-04 11:46:38 +08001497
def run_once(self, block=False):
  '''Runs every item currently pending on the run queue.

  Args:
    block: If true, keep waiting (running the idle hook between
      waits) until at least one item has been taken from the queue.

  Returns:
    True to keep going, or False if a shutdown request (a false item)
    was found on the queue.
  '''
  pending = utils.DrainQueue(self.run_queue)
  while not pending:
    # Nothing queued: give the idle hook a chance to run.
    self._run_queue_idle()
    if not block:
      break
    try:
      first = self.run_queue.get(timeout=RUN_QUEUE_TIMEOUT_SECS)
    except Queue.Empty:
      # Timed out; loop around so that _run_queue_idle() runs again.
      continue
    pending.append(first)
    # Also pick up whatever else arrived in the meantime.
    pending.extend(utils.DrainQueue(self.run_queue))

  for callback in pending:
    if not callback:
      # A false item is the shutdown request.
      self.run_queue.task_done()
      return False

    try:
      callback()
    except:  # pylint: disable=W0702
      # Log and record the failure, then carry on with the next item.
      logging.exception('Error in event loop')
      exc_type, exc_value = sys.exc_info()[:2]
      self.record_exception(
          traceback.format_exception_only(exc_type, exc_value))
    finally:
      self.run_queue.task_done()
  return True
Jon Salz0405ab52012-03-16 15:26:52 +08001541
def _should_sync_time(self, foreground=False):
  '''Tells whether a time sync with shopfloor should be attempted.

  Args:
    foreground: If True, the sync_time_period_secs option is not
      required to be set (e.g., for explicit sync requests from the
      SyncShopfloor test).

  Returns:
    A true value only when syncing is requested (foreground, or
    sync_time_period_secs is set), a time sanitizer exists, time has
    not been synced yet, and we are not in the chroot.
  '''
  sync_requested = (foreground or
                    self.test_list.options.sync_time_period_secs)
  return (sync_requested and
          self.time_sanitizer and
          (not self.time_synced) and
          (not factory.in_chroot()))
1555
def sync_time_with_shopfloor_server(self, foreground=False):
  '''Syncs time with the shopfloor server unless that is not needed.

  Whether a sync is attempted is decided by _should_sync_time().

  Args:
    foreground: Passed through to _should_sync_time(); if True, the
      sync is attempted even if background syncing is disabled.

  Returns:
    The value of self.time_synced, which is set to True once a sync
    has completed.

  Raises:
    Whatever the time sanitizer's SyncWithShopfloor() raises (e.g.,
    if the shopfloor server cannot be contacted).
  '''
  if not self._should_sync_time(foreground):
    return self.time_synced

  self.time_sanitizer.SyncWithShopfloor()
  # Only reached if the sync above did not raise.
  self.time_synced = True
  return self.time_synced
1575
def log_disk_space_stats(self):
  '''Periodically logs disk usage and reports nearly-full partitions.

  Does nothing in the chroot, when log_disk_space_period_secs is unset,
  or when less than that period has passed since the last run. Any
  failure is logged and swallowed.
  '''
  options = self.test_list.options
  if utils.in_chroot() or not options.log_disk_space_period_secs:
    return

  now = time.time()
  previous = self.last_log_disk_space_time
  if previous and now - previous < options.log_disk_space_period_secs:
    return
  self.last_log_disk_space_time = now

  # Upload an event if stateful partition usage is above the threshold.
  # The stateful partition is mounted on /usr/local, while the
  # encrypted stateful partition is mounted on /var. If the factory
  # process produces too many logs, these two partitions might fill up.
  try:
    vfs_infos = disk_space.GetAllVFSInfo()
    stateful_info = None
    encrypted_info = None
    for info in vfs_infos.values():
      if '/usr/local' in info.mount_points:
        stateful_info = info
      if '/var' in info.mount_points:
        encrypted_info = info

    stateful = disk_space.GetPartitionUsage(stateful_info)
    encrypted = disk_space.GetPartitionUsage(encrypted_info)

    # A false threshold disables the check entirely.
    above_threshold = (
        options.stateful_usage_threshold and
        max(stateful.bytes_used_pct,
            stateful.inodes_used_pct,
            encrypted.bytes_used_pct,
            encrypted.inodes_used_pct) >
        options.stateful_usage_threshold)

    if above_threshold:
      usage = {
          'stateful': {
              'bytes_used_pct': FloatDigit(stateful.bytes_used_pct, 2),
              'inodes_used_pct': FloatDigit(stateful.inodes_used_pct, 2)},
          'encrypted_stateful': {
              'bytes_used_pct': FloatDigit(encrypted.bytes_used_pct, 2),
              'inodes_used_pct': FloatDigit(encrypted.inodes_used_pct, 2)}
      }
      self.event_log.Log('stateful_partition_usage', partitions=usage)
      self.log_watcher.ScanEventLogs()
      # Run the configured action (if any), but never in the chroot.
      if not utils.in_chroot():
        if options.stateful_usage_above_threshold_action:
          Spawn(options.stateful_usage_above_threshold_action, call=True)

    # Log the usage summary only when it differs from the previous one.
    message = disk_space.FormatSpaceUsedAll(vfs_infos)
    if message != self.last_log_disk_space_message:
      emit = logging.warning if above_threshold else logging.info
      emit(message)
      self.last_log_disk_space_message = message
  except:  # pylint: disable=W0702
    logging.exception('Unable to get disk space used')
1638
def check_battery(self):
  '''Periodically checks and logs the battery status.

  Does nothing when check_battery_period_secs is unset or when less
  than that period has passed since the last check.

  The battery level and AC state are logged whenever the message
  differs from the previous one. When the charge is not above
  critical_low_battery_pct, disks are synced (provided the charge is
  still above MIN_BATTERY_LEVEL_FOR_DISK_SYNC). When the level is
  critical, or AC is absent and the charge is at or below
  warning_low_battery_pct, a 'low_battery' event is logged and the log
  watcher and system log manager (if any) are kicked. Any failure is
  logged and swallowed.
  '''
  options = self.test_list.options
  if not options.check_battery_period_secs:
    return

  now = time.time()
  previous = self.last_check_battery_time
  if previous and now - previous < options.check_battery_period_secs:
    return
  self.last_check_battery_time = now

  message = ''
  log_level = logging.INFO
  try:
    power = system.GetBoard().power
    if power.CheckBatteryPresent():
      ac_present = power.CheckACPresent()
      charge_pct = power.GetChargePct(get_float=True)
      charger_state = 'connected' if ac_present else 'disconnected'
      message = ('Current battery level %.1f%%, AC charger is %s' %
                 (charge_pct, charger_state))

      critical_low_battery = not (
          charge_pct > options.critical_low_battery_pct)
      if critical_low_battery:
        # Only sync disks when battery level is still above minimum
        # value. This can be used for offline analysis when shopfloor
        # cannot be connected.
        if charge_pct > MIN_BATTERY_LEVEL_FOR_DISK_SYNC:
          logging.warning('disk syncing for critical low battery situation')
          os.system('sync; sync; sync')
        else:
          logging.warning('disk syncing is cancelled '
                          'because battery level is lower than %.1f',
                          MIN_BATTERY_LEVEL_FOR_DISK_SYNC)

      # Notify shopfloor server.
      if (critical_low_battery or
          (not ac_present and
           charge_pct <= options.warning_low_battery_pct)):
        log_level = logging.WARNING

        self.event_log.Log('low_battery',
                           battery_level=charge_pct,
                           charger_connected=ac_present,
                           critical=critical_low_battery)
        self.log_watcher.KickWatchThread()
        if self.system_log_manager:
          self.system_log_manager.KickSyncThread()
    else:
      message = 'Battery is not present'
  except:  # pylint: disable=W0702
    logging.exception('Unable to check battery or notify shopfloor')
  finally:
    # Runs on success and on failure; skip messages that repeat.
    if message != self.last_check_battery_message:
      logging.log(log_level, message)
      self.last_check_battery_message = message
1702
def check_core_dump(self):
  '''Reports core dump files found by the core dump manager.

  When ScanFiles() returns files, a 'core_dumped' event is logged, the
  log watcher thread is kicked and, if a system log manager exists, it
  is kicked with the files and the core dump manager's ClearFiles as
  its callback. Reports are at least kick_sync_min_interval_secs apart.
  '''
  core_dump_files = self.core_dump_manager.ScanFiles()
  if not core_dump_files:
    return

  now = time.time()
  if self.last_kick_sync_time:
    elapsed = now - self.last_kick_sync_time
    if elapsed < self.test_list.options.kick_sync_min_interval_secs:
      # Too soon since the last report.
      return
  self.last_kick_sync_time = now

  # Sends event to server.
  self.event_log.Log('core_dumped', files=core_dump_files)
  self.log_watcher.KickWatchThread()

  # Syncs files to server.
  log_manager = self.system_log_manager
  if log_manager:
    log_manager.KickSyncThread(
        core_dump_files, self.core_dump_manager.ClearFiles)
Cheng-Yi Chiangcdfa4182013-05-05 03:20:19 +08001726
def check_log_rotation(self):
  '''Makes the log-rotation pause file match the test list option.

  Touches CLEANUP_LOGS_PAUSED if test_list.options.disable_log_rotation
  is true and deletes it otherwise. This must be done in the idle loop
  because the autotest client touches the file each time it runs an
  autotest. Does nothing in the chroot; failures are only logged.
  '''
  if utils.in_chroot():
    return

  try:
    if self.test_list.options.disable_log_rotation:
      # Create (or truncate) the file; its contents do not matter.
      with open(CLEANUP_LOGS_PAUSED, 'w'):
        pass
    else:
      file_utils.TryUnlink(CLEANUP_LOGS_PAUSED)
  except:  # pylint: disable=W0702
    # Oh well. Log an error (but no trace).
    action = ('touch' if self.test_list.options.disable_log_rotation
              else 'delete')
    logging.info(
        'Unable to %s %s: %s',
        action, CLEANUP_LOGS_PAUSED, utils.FormatExceptionOnly())
1748
def sync_time_in_background(self):
  '''Saves the current time and starts a background shopfloor sync.

  Does nothing without a time sanitizer. The time is saved on every
  call; a sync is started only when _should_sync_time() agrees and at
  least sync_time_period_secs have passed since the last attempt.
  '''
  sanitizer = self.time_sanitizer
  if not sanitizer:
    return

  # Write out the current time.
  sanitizer.SaveTime()

  if not self._should_sync_time():
    return

  now = time.time()
  if self.last_sync_time:
    elapsed = now - self.last_sync_time
    if elapsed < self.test_list.options.sync_time_period_secs:
      # Not yet time for another check.
      return
  self.last_sync_time = now

  def sync_quietly():
    '''Runs the sync, logging any failure without a traceback.'''
    try:
      self.sync_time_with_shopfloor_server()
    except:  # pylint: disable=W0702
      # Oh well. Log an error (but no trace).
      logging.info(
          'Unable to get time from shopfloor server: %s',
          utils.FormatExceptionOnly())

  worker = threading.Thread(target=sync_quietly)
  worker.daemon = True
  worker.start()
1780
def _run_queue_idle(self):
  '''Runs the periodic housekeeping checks when the run queue is empty.

  This method must not raise an exception.
  '''
  now = time.time()
  if self.last_idle:
    # Don't run more often than once every (RUN_QUEUE_TIMEOUT_SECS - 1)
    # seconds.
    earliest_next_run = self.last_idle + RUN_QUEUE_TIMEOUT_SECS - 1
    if now < earliest_next_run:
      return

  self.last_idle = now

  # The checks run one after another, in this order.
  for check_name in ('check_exclusive',
                     'check_for_updates',
                     'sync_time_in_background',
                     'log_disk_space_stats',
                     'check_battery',
                     'check_core_dump',
                     'check_log_rotation'):
    getattr(self, check_name)()
Jon Salz57717ca2012-04-04 16:47:25 +08001802
def handle_event_logs(self, chunks):
  '''Callback for the event log watcher.

  Attempts to upload each chunk to the shopfloor server. A failing
  chunk does not stop the remaining chunks from being tried.

  Args:
    chunks: A list of Chunk objects.

  Raises:
    Exception: If one or more uploads failed. The message carries the
      first failure and, for several failures, their count.
  '''
  first_failure = None
  failure_count = 0

  for chunk in chunks:
    try:
      description = 'event logs (%s)' % str(chunk)
      started = time.time()
      client = shopfloor.get_instance(
          detect=True,
          timeout=self.test_list.options.shopfloor_timeout_secs)
      event_name = chunk.log_name + "." + event_log.GetReimageId()
      client.UploadEvent(event_name, Binary(chunk.chunk))
      logging.info(
          'Successfully synced %s in %.03f s',
          description, time.time() - started)
    except:  # pylint: disable=W0702
      # Remember only the first failure; just count the rest.
      if not first_failure:
        first_failure = chunk.log_name + ': ' + utils.FormatExceptionOnly()
      failure_count += 1

  if not failure_count:
    return

  if failure_count == 1:
    msg = 'Log upload failed: %s' % first_failure
  else:
    msg = '%d log upload failed; first is: %s' % (
        failure_count, first_failure)
  raise Exception(msg)
1839
Jon Salz57717ca2012-04-04 16:47:25 +08001840
def run_tests_with_status(self, statuses_to_run, starting_at=None,
                          root=None):
  '''Runs all top-level tests with a particular status.

  All active tests, plus any tests to re-run, are reset to UNTESTED
  (together with everything below them) after the active tests have
  been aborted.

  Args:
    statuses_to_run: Statuses for which a top-level test is run.
    starting_at: If provided, only tests from this test onwards are
      considered. Must be a FactoryTest, not a path string.
    root: The test whose top-level tests are examined; defaults to
      the whole test list.
  '''
  root = root or self.test_list

  if starting_at:
    # Make sure they passed a test, not a string.
    assert isinstance(starting_at, factory.FactoryTest)

  tests_to_reset = []
  tests_to_run = []
  found_starting_at = False

  for test in root.get_top_level_tests():
    if starting_at:
      if test == starting_at:
        # Found starting_at; this and all later tests are eligible.
        found_starting_at = True
      if not found_starting_at:
        # Still before starting_at; skip.
        continue

    status = test.get_state().status
    selected = status in statuses_to_run
    if selected or status == TestState.ACTIVE:
      # Reset later: all active tests must be aborted first.
      tests_to_reset.append(test)
    if selected:
      tests_to_run.append(test)

  self.abort_active_tests('Operator requested run/re-run of certain tests')

  # Reset the status of every collected test and its descendants (in
  # case any tests were active; we want them to be run again).
  for top_level_test in tests_to_reset:
    for descendant in top_level_test.walk():
      descendant.update_state(status=TestState.UNTESTED)

  self.run_tests(tests_to_run, untested_only=True)
Jon Salz0405ab52012-03-16 15:26:52 +08001889
def restart_tests(self, root=None):
  '''Restarts all tests under root (by default, the whole test list).

  Active tests are aborted, every test found by walking root is reset
  to UNTESTED, and root is then run.
  '''
  subtree = root or self.test_list

  self.abort_active_tests('Operator requested restart of certain tests')
  for node in subtree.walk():
    node.update_state(status=TestState.UNTESTED)
  self.run_tests(subtree)
Hung-Te Lin96632362012-03-20 21:14:18 +08001898
def auto_run(self, starting_at=None, root=None):
  '''"Auto-runs" tests whose status is UNTESTED or ACTIVE.

  Args:
    starting_at: If provided, only auto-runs tests beginning with
      this test.
    root: The test to look under; defaults to the whole test list.
  '''
  subtree = root or self.test_list
  statuses = [TestState.UNTESTED, TestState.ACTIVE]
  self.run_tests_with_status(statuses,
                             starting_at=starting_at,
                             root=subtree)
Jon Salz968e90b2012-03-18 16:12:43 +08001910
def re_run_failed(self, root=None):
  '''Re-runs the FAILED tests under root (default: the whole test list).'''
  subtree = root or self.test_list
  failed_only = [TestState.FAILED]
  self.run_tests_with_status(failed_only, root=subtree)
Jon Salz57717ca2012-04-04 16:47:25 +08001915
def show_review_information(self):
  '''Event handler for showing the review information screen.

  The information screen is rendered by the main UI program (ui.py),
  so Goofy itself only kills the active tests and cancels the pending
  ones.
  '''
  # Kill whatever is running first, then cancel what is still queued.
  self.kill_active_tests(False)
  self.cancel_pending_tests()
Jon Salz57717ca2012-04-04 16:47:25 +08001925
def handle_switch_test(self, event):
  '''Switches to a particular test.

  If the test is already running and is backgroundable, it is just
  made the visible test. Otherwise all active tests are aborted, the
  test and everything below it are reset to UNTESTED, and the test is
  run: via auto_run() starting at it when the auto_run_on_keypress
  option is set, or on its own via run_tests() otherwise.

  Args:
    event: The SWITCH_TEST event; event.path identifies the test.
  '''
  test = self.test_list.lookup_path(event.path)
  if not test:
    # Report the path that was looked up. The event is only known to
    # carry 'path' here, so reading any other attribute could raise
    # instead of logging the problem.
    logging.error('Unknown test %r', event.path)
    return

  invoc = self.invocations.get(test)
  if invoc and test.backgroundable:
    # Already running: just bring to the front if it has a UI.
    logging.info('Setting visible test to %s', test.path)
    self.set_visible_test(test)
    return

  self.abort_active_tests('Operator requested abort (switch_test)')
  for t in test.walk():
    t.update_state(status=TestState.UNTESTED)

  if self.test_list.options.auto_run_on_keypress:
    self.auto_run(starting_at=test)
  else:
    self.run_tests(test)
Jon Salz73e0fd02012-04-04 11:46:38 +08001952
def wait(self):
  '''Waits until no invocations are left.

  Joins the thread of every current invocation, then reaps completed
  tests, repeating for as long as self.invocations is non-empty.

  Useful for testing.
  '''
  while self.invocations:
    for test, invocation in self.invocations.iteritems():
      logging.info('Waiting for %s to complete...', test)
      invocation.thread.join()
    # Reap once per pass, after every thread above has been joined.
    self.reap_completed_tests()
Jon Salz0697cbf2012-07-04 15:14:04 +08001963
def check_exceptions(self):
  '''Raises an error if any exceptions have been recorded.

  Raises:
    RuntimeError: If self.exceptions is non-empty; the message
      includes the recorded exceptions.
  '''
  if not self.exceptions:
    return
  raise RuntimeError('Exception in invocation thread: %r' %
                     self.exceptions)
1970
def record_exception(self, msg):
  '''Records an exception that occurred in an invocation thread.

  The message is appended to self.exceptions; check_exceptions()
  raises an error if anything has been recorded there.

  Args:
    msg: Description of the exception to remember.
  '''
  self.exceptions.append(msg)
Jon Salz73e0fd02012-04-04 11:46:38 +08001977
Hung-Te Linf2f78f72012-02-08 19:27:11 +08001978
if __name__ == '__main__':
  # Script entry point: run Goofy and always destroy it afterwards.
  goofy = Goofy()
  try:
    goofy.main()
  except:  # pylint: disable=W0702
    # Log the error before trying to shut down, unless it is a
    # SystemExit (a graceful exit), which propagates without logging.
    if not issubclass(sys.exc_info()[0], SystemExit):
      logging.exception('Error in main loop')
    raise
  finally:
    goofy.destroy()