blob: c0025881b0d6ea1c244fbc32639d10d508db8bf4 [file] [log] [blame]
Hung-Te Linf2f78f72012-02-08 19:27:11 +08001#!/usr/bin/python -u
Hung-Te Linf2f78f72012-02-08 19:27:11 +08002# -*- coding: utf-8 -*-
3#
Jon Salz37eccbd2012-05-25 16:06:52 +08004# Copyright (c) 2012 The Chromium OS Authors. All rights reserved.
Hung-Te Linf2f78f72012-02-08 19:27:11 +08005# Use of this source code is governed by a BSD-style license that can be
6# found in the LICENSE file.
7
8'''
9The main factory flow that runs the factory test and finalizes a device.
10'''
11
Jon Salze12c2b32013-06-25 16:24:34 +080012import glob
Jon Salz0405ab52012-03-16 15:26:52 +080013import logging
14import os
Jon Salz73e0fd02012-04-04 11:46:38 +080015import Queue
Jon Salze12c2b32013-06-25 16:24:34 +080016import shutil
Jon Salz77c151e2012-08-28 07:20:37 +080017import signal
Jon Salz0405ab52012-03-16 15:26:52 +080018import sys
Jon Salzeff94182013-06-19 15:06:28 +080019import syslog
Jon Salz0405ab52012-03-16 15:26:52 +080020import threading
21import time
22import traceback
Jon Salz258a40c2012-04-19 12:34:01 +080023import uuid
Jon Salzb10cf512012-08-09 17:29:21 +080024from xmlrpclib import Binary
Hung-Te Linf2f78f72012-02-08 19:27:11 +080025from collections import deque
26from optparse import OptionParser
Hung-Te Linf2f78f72012-02-08 19:27:11 +080027
Jon Salz0697cbf2012-07-04 15:14:04 +080028import factory_common # pylint: disable=W0611
jcliangcd688182012-08-20 21:01:26 +080029from cros.factory import event_log
30from cros.factory import system
Cheng-Yi Chiangd0406522013-04-01 15:40:18 +080031from cros.factory.event_log import EventLog, FloatDigit
Tom Wai-Hong Tamd33723e2013-04-10 21:14:37 +080032from cros.factory.event_log_watcher import EventLogWatcher
jcliangcd688182012-08-20 21:01:26 +080033from cros.factory.goofy import test_environment
34from cros.factory.goofy import time_sanitizer
Jon Salz83591782012-06-26 11:09:58 +080035from cros.factory.goofy import updater
jcliangcd688182012-08-20 21:01:26 +080036from cros.factory.goofy.goofy_rpc import GoofyRPC
Jon Salz885dcac2013-07-23 16:39:50 +080037from cros.factory.goofy.invocation import TestArgEnv
jcliangcd688182012-08-20 21:01:26 +080038from cros.factory.goofy.invocation import TestInvocation
39from cros.factory.goofy.prespawner import Prespawner
Cheng-Yi Chiang344b10f2013-05-03 16:44:03 +080040from cros.factory.goofy.system_log_manager import SystemLogManager
jcliangcd688182012-08-20 21:01:26 +080041from cros.factory.goofy.web_socket_manager import WebSocketManager
Cheng-Yi Chiangd8186952013-04-04 23:41:14 +080042from cros.factory.system.board import Board, BoardException
jcliangcd688182012-08-20 21:01:26 +080043from cros.factory.system.charge_manager import ChargeManager
Cheng-Yi Chiangcdfa4182013-05-05 03:20:19 +080044from cros.factory.system.core_dump_manager import CoreDumpManager
Jon Salzce6a7f82013-06-10 18:22:54 +080045from cros.factory.system.cpufreq_manager import CpufreqManager
Jon Salzb92c5112012-09-21 15:40:11 +080046from cros.factory.system import disk_space
jcliangcd688182012-08-20 21:01:26 +080047from cros.factory.test import factory
48from cros.factory.test import state
Jon Salz51528e12012-07-02 18:54:45 +080049from cros.factory.test import shopfloor
Jon Salz83591782012-06-26 11:09:58 +080050from cros.factory.test import utils
Jon Salz128b0932013-07-03 16:55:26 +080051from cros.factory.test.test_lists import test_lists
Jon Salz83591782012-06-26 11:09:58 +080052from cros.factory.test.event import Event
53from cros.factory.test.event import EventClient
54from cros.factory.test.event import EventServer
jcliangcd688182012-08-20 21:01:26 +080055from cros.factory.test.factory import TestState
Jon Salzd7550792013-07-12 05:49:27 +080056from cros.factory.test.utils import Enum
Dean Liao592e4d52013-01-10 20:06:39 +080057from cros.factory.tools.key_filter import KeyFilter
Jon Salz2af235d2013-06-24 14:47:21 +080058from cros.factory.utils import file_utils
Jon Salz78c32392012-07-25 14:18:29 +080059from cros.factory.utils.process_utils import Spawn
Hung-Te Linf2f78f72012-02-08 19:27:11 +080060
61
# File from which get_hwid_cfg() reads the HWID config tag.
HWID_CFG_PATH = '/usr/local/share/chromeos-hwid/cfg'
# The "caches" directory directly under the factory state root.
CACHES_DIR = os.path.join(factory.get_state_root(), 'caches')

CLEANUP_LOGS_PAUSED = '/var/lib/cleanup_logs_paused'

# When this file is present, reboots are suppressed (e.g., for development).
NO_REBOOT_FILE = '/var/log/factory.noreboot'

# tests_after_shutdown value that forces an auto-run (e.g., after a factory
# update, when the set of available tests might have changed).
FORCE_AUTO_RUN = 'force_auto_run'

RUN_QUEUE_TIMEOUT_SECS = 10

# Disks are synced only while the battery level is higher than this value;
# losing power in the middle of a sync may leave things even worse off.
MIN_BATTERY_LEVEL_FOR_DISK_SYNC = 1.0

MAX_CRASH_FILE_SIZE = 64 * 1024
81
# Banner describing how to run Goofy inside the chroot, framed above and
# below by a rule of 70 asterisks.
# NOTE(review): the whitespace inside these lines is reproduced exactly as it
# appears in this copy of the file; confirm it against the upstream layout.
GOOFY_IN_CHROOT_WARNING = '\n'.join([
    '',
    '*' * 70,
    'You are running Goofy inside the chroot. Autotests are not supported.',
    '',
    'To use Goofy in the chroot, first install an Xvnc server:',
    '',
    ' sudo apt-get install tightvncserver',
    '',
    '...and then start a VNC X server outside the chroot:',
    '',
    ' vncserver :10 &',
    ' vncviewer :10',
    '',
    '...and run Goofy as follows:',
    '',
    ' env --unset=XAUTHORITY DISPLAY=localhost:10 python goofy.py',
    '*' * 70,
])
# Module-level switch, off by default.
# NOTE(review): presumably silences the banner above when set; the code that
# reads it is not visible here -- confirm.
suppress_chroot_warning = False
Hung-Te Linf2f78f72012-02-08 19:27:11 +080099
# The states that Goofy.status can take; a new Goofy object starts out as
# UNINITIALIZED.
Status = Enum([
    'UNINITIALIZED',
    'INITIALIZING',
    'RUNNING',
    'TERMINATING',
    'TERMINATED',
])
102
def get_hwid_cfg():
  '''
  Looks up the HWID config tag.

  The CROS_HWID environment variable wins whenever it is set (even to an
  empty string). Otherwise the tag is the content of HWID_CFG_PATH with
  surrounding whitespace stripped.

  Returns:
    The tag, or an empty string if neither source is available.
  '''
  env_tag = os.environ.get('CROS_HWID')
  if env_tag is not None:
    return env_tag

  if not os.path.exists(HWID_CFG_PATH):
    return ''

  with open(HWID_CFG_PATH, 'rt') as cfg_file:
    return cfg_file.read().strip()
Hung-Te Linf2f78f72012-02-08 19:27:11 +0800113
114
# Module-level flag, False at import time.
# NOTE(review): presumably flipped once logging has been set up so that the
# setup runs only once; the code that reads it is not visible here -- confirm.
_inited_logging = False
Hung-Te Linf2f78f72012-02-08 19:27:11 +0800116
117class Goofy(object):
Jon Salz0697cbf2012-07-04 15:14:04 +0800118 '''
119 The main factory flow.
120
121 Note that all methods in this class must be invoked from the main
122 (event) thread. Other threads, such as callbacks and TestInvocation
123 methods, should instead post events on the run queue.
124
125 TODO: Unit tests. (chrome-os-partner:7409)
126
127 Properties:
128 uuid: A unique UUID for this invocation of Goofy.
129 state_instance: An instance of FactoryState.
130 state_server: The FactoryState XML/RPC server.
131 state_server_thread: A thread running state_server.
132 event_server: The EventServer socket server.
133 event_server_thread: A thread running event_server.
134 event_client: A client to the event server.
135 connection_manager: The connection_manager object.
Cheng-Yi Chiang835f2682013-05-06 22:15:48 +0800136 system_log_manager: The SystemLogManager object.
137 core_dump_manager: The CoreDumpManager object.
Jon Salz0697cbf2012-07-04 15:14:04 +0800138 ui_process: The factory ui process object.
139 run_queue: A queue of callbacks to invoke from the main thread.
140 invocations: A map from FactoryTest objects to the corresponding
141 TestInvocations objects representing active tests.
142 tests_to_run: A deque of tests that should be run when the current
143 test(s) complete.
144 options: Command-line options.
145 args: Command-line args.
146 test_list: The test list.
Jon Salz128b0932013-07-03 16:55:26 +0800147 test_lists: All new-style test lists.
Jon Salz0697cbf2012-07-04 15:14:04 +0800148 event_handlers: Map of Event.Type to the method used to handle that
149 event. If the method has an 'event' argument, the event is passed
150 to the handler.
151 exceptions: Exceptions encountered in invocation threads.
Jon Salz3c493bb2013-02-07 17:24:58 +0800152 last_log_disk_space_message: The last message we logged about disk space
153 (to avoid duplication).
Cheng-Yi Chiangcdfa4182013-05-05 03:20:19 +0800154 last_kick_sync_time: The last time to kick system_log_manager to sync
155 because of core dump files (to avoid kicking too soon then abort the
156 sync.)
Jon Salz416f9cc2013-05-10 18:32:50 +0800157 hooks: A Hooks object containing hooks for various Goofy actions.
Jon Salzd7550792013-07-12 05:49:27 +0800158 status: The current Goofy status (a member of the Status enum).
Jon Salz0697cbf2012-07-04 15:14:04 +0800159 '''
def __init__(self):
  '''
  Gives every attribute its initial value and builds event_handlers.

  This only assigns attributes: handles to servers, threads, managers and
  child processes start out as None, containers start out empty, and
  status starts out as Status.UNINITIALIZED.
  '''
  self.uuid = str(uuid.uuid4())

  # Servers, clients, managers and child processes.
  self.state_instance = None
  self.state_server = None
  self.state_server_thread = None
  self.goofy_rpc = None
  self.event_server = None
  self.event_server_thread = None
  self.event_client = None
  self.connection_manager = None
  self.charge_manager = None
  self.time_sanitizer = None
  self.time_synced = False
  self.log_watcher = None
  self.system_log_manager = None
  self.core_dump_manager = None
  self.event_log = None
  self.prespawner = None
  self.ui_process = None
  self.dummy_shopfloor = None
  self.run_queue = Queue.Queue()
  self.invocations = {}
  self.tests_to_run = deque()
  self.visible_test = None
  self.chrome = None
  self.hooks = None
  self.cpu_usage_watcher = None

  # Command line, test lists and bookkeeping timestamps/messages.
  self.options = None
  self.args = None
  self.test_list = None
  self.test_lists = None
  self.on_ui_startup = []
  self.env = None
  self.last_idle = None
  self.last_shutdown_time = None
  self.last_update_check = None
  self.last_sync_time = None
  self.last_log_disk_space_time = None
  self.last_log_disk_space_message = None
  self.last_check_battery_time = None
  self.last_check_battery_message = None
  self.last_kick_sync_time = None
  self.exclusive_items = set()
  self.key_filter = None
  self.cpufreq_manager = None
  self.status = Status.UNINITIALIZED

  def test_or_root(event, parent_or_group=True):
    '''Returns the test affected by a particular event.

    Args:
      event: The event containing an optional 'path' attribute.
      parent_or_group: If True, returns the top-level parent for a test (the
        root node of the tests that need to be run together if the given
        test path is to be run).

    Returns:
      The test looked up from the event's path (or its top-level parent or
      group), or the whole test list if the event has no path or an empty
      one.
    '''
    path = getattr(event, 'path', None)
    if not path:
      return self.test_list

    test = self.test_list.lookup_path(path)
    if parent_or_group:
      test = test.get_top_level_parent_or_group()
    return test

  # Every handler takes the event; handle_event() looks handlers up by
  # event.type.
  self.event_handlers = {
    Event.Type.SWITCH_TEST: self.handle_switch_test,
    Event.Type.SHOW_NEXT_ACTIVE_TEST:
      lambda event: self.show_next_active_test(),
    Event.Type.RESTART_TESTS:
      lambda event: self.restart_tests(root=test_or_root(event)),
    Event.Type.AUTO_RUN:
      lambda event: self.auto_run(root=test_or_root(event)),
    Event.Type.RE_RUN_FAILED:
      lambda event: self.re_run_failed(root=test_or_root(event)),
    Event.Type.RUN_TESTS_WITH_STATUS:
      lambda event: self.run_tests_with_status(
        event.status,
        root=test_or_root(event)),
    Event.Type.REVIEW:
      lambda event: self.show_review_information(),
    Event.Type.UPDATE_SYSTEM_INFO:
      lambda event: self.update_system_info(),
    Event.Type.STOP:
      # STOP acts on the exact test named by the event, not on its
      # top-level parent or group.
      lambda event: self.stop(root=test_or_root(event, False),
                              fail=getattr(event, 'fail', False),
                              reason=getattr(event, 'reason', None)),
    Event.Type.SET_VISIBLE_TEST:
      lambda event: self.set_visible_test(
        self.test_list.lookup_path(event.path)),
    Event.Type.CLEAR_STATE:
      lambda event: self.clear_state(self.test_list.lookup_path(event.path)),
  }

  self.exceptions = []
  self.web_socket_manager = None
262
def destroy(self):
  '''
  Shuts down whatever parts of Goofy are currently set, in a fixed order.

  status is TERMINATING while this runs and TERMINATED once it finishes.
  Attributes that are unset (falsy) are skipped, and check_exceptions() is
  called after everything has been stopped.
  '''
  self.status = Status.TERMINATING

  # Child processes.
  browser = self.chrome
  if browser:
    browser.kill()
    self.chrome = None
  shopfloor_process = self.dummy_shopfloor
  if shopfloor_process:
    shopfloor_process.kill()
    self.dummy_shopfloor = None
  if self.ui_process:
    utils.kill_process_tree(self.ui_process, 'ui')
    self.ui_process = None

  # Web sockets, then the state server and the state it serves.
  sockets = self.web_socket_manager
  if sockets:
    logging.info('Stopping web sockets')
    sockets.close()
    self.web_socket_manager = None
  if self.state_server_thread:
    logging.info('Stopping state server')
    state_server = self.state_server
    state_server.shutdown()
    self.state_server_thread.join()
    state_server.server_close()
    self.state_server_thread = None
  if self.state_instance:
    self.state_instance.close()

  # Event server.
  if self.event_server_thread:
    logging.info('Stopping event server')
    event_server = self.event_server
    event_server.shutdown()  # pylint: disable=E1101
    self.event_server_thread.join()
    event_server.server_close()
    self.event_server_thread = None

  # Background threads are only stopped if they report being started.
  watcher = self.log_watcher
  if watcher:
    if watcher.IsThreadStarted():
      watcher.StopWatchThread()
    self.log_watcher = None
  log_manager = self.system_log_manager
  if log_manager:
    if log_manager.IsThreadRunning():
      log_manager.StopSyncThread()
    self.system_log_manager = None

  if self.prespawner:
    logging.info('Stopping prespawner')
    self.prespawner.stop()
    self.prespawner = None
  if self.event_client:
    logging.info('Closing event client')
    self.event_client.close()
    self.event_client = None
  if self.cpufreq_manager:
    self.cpufreq_manager.Stop()
  if self.event_log:
    self.event_log.Close()
    self.event_log = None
  if self.key_filter:
    self.key_filter.Stop()
  if self.cpu_usage_watcher:
    self.cpu_usage_watcher.terminate()

  self.check_exceptions()
  logging.info('Done destroying Goofy')
  self.status = Status.TERMINATED
Jon Salz0697cbf2012-07-04 15:14:04 +0800321
def start_state_server(self):
  '''
  Creates the state server and starts serving it on a 'StateServer' thread.

  Sets state_instance, state_server, goofy_rpc and state_server_thread.
  '''
  # Before starting state server, remount stateful partitions with
  # no commit flag. The default commit time (commit=600) makes corruption
  # too likely.
  file_utils.ResetCommitTime()

  # The server is bound to 0.0.0.0.
  instance, server = state.create_server(bind_address='0.0.0.0')
  self.state_instance = instance
  self.state_server = server

  rpc = GoofyRPC(self)
  self.goofy_rpc = rpc
  rpc.RegisterMethods(instance)

  logging.info('Starting state server')
  server_thread = threading.Thread(target=server.serve_forever,
                                   name='StateServer')
  self.state_server_thread = server_thread
  server_thread.start()
337
def start_event_server(self):
  '''
  Starts the event server thread, the event client and the web sockets.

  Sets event_server, event_server_thread, event_client and
  web_socket_manager. self.state_server must already be set, because the
  web socket handler is registered on it under "/event".
  '''
  server = EventServer()
  self.event_server = server
  logging.info('Starting factory event server')
  server_thread = threading.Thread(
      target=server.serve_forever,  # pylint: disable=E1101
      name='EventServer')
  self.event_server_thread = server_thread
  server_thread.start()

  # Events are delivered to handle_event through the run queue.
  self.event_client = EventClient(
      callback=self.handle_event, event_loop=self.run_queue)

  sockets = WebSocketManager(self.uuid)
  self.web_socket_manager = sockets
  self.state_server.add_handler('/event', sockets.handle_web_socket)
352
def start_ui(self):
  '''
  Spawns the UI process and blocks until it posts a UI_READY event.

  The command is test/ui.py under the factory package path, followed by
  the test list option and, in verbose mode, '-v'.
  '''
  ui_script = os.path.join(factory.FACTORY_PACKAGE_PATH, 'test', 'ui.py')
  command = [ui_script, self.options.test_list]
  if self.options.verbose:
    command.append('-v')

  logging.info('Starting ui %s', command)
  self.ui_process = Spawn(command)

  def is_ui_ready(event):
    return event.type == Event.Type.UI_READY

  logging.info('Waiting for UI to come up...')
  self.event_client.wait(is_ui_ready)
  logging.info('UI has started')
365
def set_visible_test(self, test):
  '''
  Makes the given test the visible one.

  Nothing happens if the test is already the visible one, or if it is a
  test without a UI. Otherwise the new test (if any) is marked visible,
  the previously visible test (if any) is marked not visible, and
  visible_test is updated.

  Args:
    test: The test to show, or None to show no test.
  '''
  previous = self.visible_test
  if previous == test or (test and not test.has_ui):
    return

  if test:
    test.update_state(visible=True)
  if previous:
    previous.update_state(visible=False)
  self.visible_test = test
377
def _log_startup_messages(self):
  '''
  Logs post-reboot diagnostics; does nothing inside the chroot.

  Four things are logged, each on a best-effort basis: the tail of
  /var/log/messages from before the last reboot, the mosys event log, the
  EC console log and the EC panic info. A step that fails is reported with
  logging.exception() and the remaining steps still run.
  '''
  # TODO(jsalz): This is mostly a copy-and-paste of code in init_states,
  # for factory-3004.B only. Consolidate and merge back to ToT.
  if utils.in_chroot():
    return

  def log_var_log_messages():
    tail = utils.var_log_messages_before_reboot()
    logging.info(
        'Tail of /var/log/messages before last reboot:\n%s',
        '\n'.join(' ' + line for line in tail))

  def log_mosys_eventlog():
    eventlog = utils.Spawn(
        ['mosys', 'eventlog', 'list'],
        read_stdout=True, log_stderr_on_error=True).stdout_data
    logging.info('System eventlog from mosys:\n%s\n', eventlog)

  def log_ec_console():
    console_log = system.GetBoard().GetECConsoleLog()
    logging.info('EC console log after reboot:\n%s\n', console_log)

  def log_ec_panic_info():
    panic_info = system.GetBoard().GetECPanicInfo()
    logging.info('EC panic info after reboot:\n%s\n', panic_info)

  # (step, message logged if the step raises), in the order they run.
  steps = (
      (log_var_log_messages, 'Unable to grok /var/log/messages'),
      (log_mosys_eventlog, 'Unable to read mosys eventlog'),
      (log_ec_console, 'Error retrieving EC console log'),
      (log_ec_panic_info, 'Error retrieving EC panic info'),
  )
  for step, failure_message in steps:
    try:
      step()
    except:  # pylint: disable=W0702
      logging.exception(failure_message)
416
def handle_shutdown_complete(self, test, test_state):
  '''
  Handles the case where a shutdown was detected during a shutdown step.

  The step's shutdown count is incremented, and then the step is either
  failed, passed, or (if more iterations remain) queued to shut down again
  once the UI has started. Every outcome is recorded through the
  'rebooted' event-log entry.

  @param test: The ShutdownStep.
  @param test_state: The test state. Its incoming value is not used; it is
    replaced by the state returned from incrementing the shutdown count.
  '''
  test_state = test.update_state(increment_shutdown_count=1)
  logging.info('Detected shutdown (%d of %d)',
               test_state.shutdown_count, test.iterations)

  def log_and_update_state(status, error_msg, **kw):
    # Records the outcome in the event log and the regular log, then
    # stores it in the test's state.
    self.event_log.Log('rebooted',
                       status=status, error_msg=error_msg, **kw)
    logging.info('Rebooted: status=%s, %s', status,
                 (('error_msg=%s' % error_msg) if error_msg else None))
    test.update_state(status=status, error_msg=error_msg)

  if not self.last_shutdown_time:
    log_and_update_state(status=TestState.FAILED,
                         error_msg='Unable to read shutdown_time')
    return

  now = time.time()
  elapsed = now - self.last_shutdown_time
  logging.info('%.03f s passed since reboot', elapsed)

  max_reboot_time_secs = self.test_list.options.max_reboot_time_secs

  if self.last_shutdown_time > now:
    # Goes through log_and_update_state like every other outcome, so that
    # this failure is written to the event log as well.
    log_and_update_state(status=TestState.FAILED,
                         error_msg='Time moved backward during reboot')
  elif (isinstance(test, factory.RebootStep) and
        max_reboot_time_secs and
        elapsed > max_reboot_time_secs):
    # A reboot took too long; fail. (We don't check this for
    # HaltSteps, because the machine could be halted for a
    # very long time, and even unplugged with battery backup,
    # thus hosing the clock.)
    log_and_update_state(
        status=TestState.FAILED,
        error_msg=('More than %d s elapsed during reboot '
                   '(%.03f s, from %s to %s)' % (
                       max_reboot_time_secs,
                       elapsed,
                       utils.TimeString(self.last_shutdown_time),
                       utils.TimeString(now))),
        duration=elapsed)
    self._log_startup_messages()
  elif test_state.shutdown_count == test.iterations:
    # Good!
    log_and_update_state(status=TestState.PASSED,
                         duration=elapsed,
                         error_msg='')
  elif test_state.shutdown_count > test.iterations:
    # Shut down too many times
    log_and_update_state(status=TestState.FAILED,
                         error_msg='Too many shutdowns')
    self._log_startup_messages()
  elif utils.are_shift_keys_depressed():
    logging.info('Shift keys are depressed; cancelling restarts')
    # Abort shutdown
    log_and_update_state(
        status=TestState.FAILED,
        error_msg='Shutdown aborted with double shift keys')
    self.cancel_pending_tests()
  else:
    # More iterations remain: queue a handler in on_ui_startup that lets
    # the operator cancel and otherwise shuts down again.
    def handler():
      if self._prompt_cancel_shutdown(
          test, test_state.shutdown_count + 1):
        factory.console.info('Shutdown aborted by operator')
        log_and_update_state(
            status=TestState.FAILED,
            error_msg='Shutdown aborted by operator')
        self.cancel_pending_tests()
        return

      # Time to shutdown again
      log_and_update_state(
          status=TestState.ACTIVE,
          error_msg='',
          iteration=test_state.shutdown_count)

      self.event_log.Log('shutdown', operation='reboot')
      self.state_instance.set_shared_data('shutdown_time',
                                          time.time())
      self.env.shutdown('reboot')

    self.on_ui_startup.append(handler)
Hung-Te Linf2f78f72012-02-08 19:27:11 +0800505
def _prompt_cancel_shutdown(self, test, iteration):
  '''
  Announces a pending shutdown and waits to see whether it is cancelled.

  A PENDING_SHUTDOWN event describing the shutdown is posted, then this
  waits up to test.delay_secs for a CANCEL_SHUTDOWN event. Only the
  'chrome' UI is supported; with any other UI this returns False at once.

  Args:
    test: The shutdown step; delay_secs, operation and iterations are read.
    iteration: The iteration number reported in the event.

  Returns:
    True if a CANCEL_SHUTDOWN event arrived before the timeout.
  '''
  if self.options.ui != 'chrome':
    return False

  shutdown_info = dict(
      delay_secs=test.delay_secs,
      time=time.time() + test.delay_secs,
      operation=test.operation,
      iteration=iteration,
      iterations=test.iterations)

  def is_cancel(event):
    return event.type == Event.Type.CANCEL_SHUTDOWN

  # Create a new (threaded) event client since we
  # don't want to use the event loop for this.
  with EventClient() as client:
    client.post_event(Event(Event.Type.PENDING_SHUTDOWN, **shutdown_info))
    cancel_event = client.wait(is_cancel, timeout=test.delay_secs)
    if cancel_event is None:
      return False
    # A PENDING_SHUTDOWN event without data follows a cancellation.
    # NOTE(review): presumably this dismisses the prompt in the UI -- confirm.
    client.post_event(Event(Event.Type.PENDING_SHUTDOWN))
    return True
Jon Salz258a40c2012-04-19 12:34:01 +0800529
def init_states(self):
  '''
  Initializes all states on startup.

  Every test is first registered with the state server. Leaf tests still
  marked ACTIVE are then resolved: shutdown steps go to
  handle_shutdown_complete(), and any other test is failed as an unexpected
  shutdown, with diagnostics logged for context. Finally the skipped
  states are refreshed.
  '''
  for known_test in self.test_list.get_all_tests():
    # Make sure the state server knows about all the tests,
    # defaulting to an untested state.
    known_test.update_state(update_parent=False, visible=False)

  # Diagnostics are fetched lazily, when a test interrupted by an
  # unexpected shutdown is found. Anything still None at that point is
  # fetched (again) for the next such test.
  var_log_messages = None
  mosys_log = None
  ec_console_log = None
  ec_panic_info = None

  # Any 'active' tests should be marked as failed now.
  for test in self.test_list.walk():
    # Don't bother with parents; they will be updated when their
    # children are updated.
    if not test.is_leaf():
      continue

    test_state = test.get_state()
    if test_state.status != TestState.ACTIVE:
      continue

    if isinstance(test, factory.ShutdownStep):
      # Shutdown while the test was active - that's good.
      self.handle_shutdown_complete(test, test_state)
      continue

    # Unexpected shutdown. Grab /var/log/messages for context.
    if var_log_messages is None:
      try:
        var_log_messages = utils.var_log_messages_before_reboot()
        # Write it to the log, to make it easier to
        # correlate with /var/log/messages.
        logging.info(
            'Unexpected shutdown. '
            'Tail of /var/log/messages before last reboot:\n%s',
            '\n'.join(' ' + line for line in var_log_messages))
      except:  # pylint: disable=W0702
        logging.exception('Unable to grok /var/log/messages')
        var_log_messages = []

    if mosys_log is None and not utils.in_chroot():
      try:
        mosys_log = utils.Spawn(
            ['mosys', 'eventlog', 'list'],
            read_stdout=True, log_stderr_on_error=True).stdout_data
        # Write it to the log also.
        logging.info('System eventlog from mosys:\n%s\n', mosys_log)
      except:  # pylint: disable=W0702
        logging.exception('Unable to read mosys eventlog')

    if ec_console_log is None:
      try:
        ec_console_log = system.GetBoard().GetECConsoleLog()
        logging.info('EC console log after reboot:\n%s\n', ec_console_log)
      except:  # pylint: disable=W0702
        logging.exception('Error retrieving EC console log')

    if ec_panic_info is None:
      try:
        ec_panic_info = system.GetBoard().GetECPanicInfo()
        logging.info('EC panic info after reboot:\n%s\n', ec_panic_info)
      except:  # pylint: disable=W0702
        logging.exception('Error retrieving EC panic info')

    # Record the failure in the event log, then in the test's own state.
    error_msg = 'Unexpected shutdown while test was running'
    self.event_log.Log('end_test',
                       path=test.path,
                       status=TestState.FAILED,
                       invocation=test.get_state().invocation,
                       error_msg=error_msg,
                       var_log_messages='\n'.join(var_log_messages),
                       mosys_log=mosys_log)
    test.update_state(status=TestState.FAILED, error_msg=error_msg)

    if test.never_fails:
      # For "never_fails" tests (such as "Start"), don't cancel
      # pending tests, since reboot is expected.
      continue
    factory.console.info('Unexpected shutdown while test %s '
                         'running; cancelling any pending tests',
                         test.path)
    self.state_instance.set_shared_data('tests_after_shutdown', [])

  self.update_skipped_tests()
621
def update_skipped_tests(self):
  '''
  Updates skipped states based on run_if.

  Only leaf tests that have a run_if expression or a run_if table name are
  touched. A test whose run_if value cannot be determined is not skipped.
  A test that was passed-as-skipped earlier but should run now is reset to
  untested.
  '''
  env = TestArgEnv()
  for t in self.test_list.walk():
    if not t.is_leaf():
      continue
    if not (t.run_if_table_name or t.run_if_expr):
      continue

    value = None
    if t.run_if_expr:
      try:
        value = t.run_if_expr(env)
      except:  # pylint: disable=W0702
        # But keep going; we have no choice. This will end up
        # always activating the test.
        logging.exception('Unable to evaluate run_if expression for %s',
                          t.path)
    else:
      try:
        aux_data = shopfloor.get_selected_aux_data(t.run_if_table_name)
        value = aux_data.get(t.run_if_col)
      except ValueError:
        # Not available; assume it shouldn't be skipped
        pass

    # run_if_not inverts the decision whenever a value is available.
    skip = False if value is None else (not value) ^ t.run_if_not

    current = t.get_state()
    previously_skipped = ((not skip) and
                          (current.status == TestState.PASSED) and
                          (current.error_msg == TestState.SKIPPED_MSG))
    if previously_skipped:
      # It was marked as skipped before, but now we need to run it.
      # Mark as untested.
      t.update_state(skip=skip, status=TestState.UNTESTED, error_msg='')
    else:
      t.update_state(skip=skip)
661
def show_next_active_test(self):
  '''
  Rotates to the next visible active test.

  Completed tests are reaped first. The active leaf tests are taken in
  walk order; the one after the currently visible test is shown next,
  wrapping around at the end. If the visible test is not among them, the
  first active test is shown. Nothing happens when no test is active.
  '''
  self.reap_completed_tests()

  candidates = []
  for node in self.test_list.walk():
    if node.is_leaf() and node.get_state().status == TestState.ACTIVE:
      candidates.append(node)
  if not candidates:
    return

  if self.visible_test in candidates:
    position = candidates.index(self.visible_test)
    successor = candidates[(position + 1) % len(candidates)]
  else:
    # visible_test not present in the active tests
    successor = candidates[0]

  self.set_visible_test(successor)
Jon Salz4f6c7172012-06-11 20:45:36 +0800680
def handle_event(self, event):
  '''
  Dispatches an event to the handler registered for its type.

  Args:
    event: An object with a "type" attribute, used as the key into
      self.event_handlers.
  '''
  callback = self.event_handlers.get(event.type)
  if not callback:
    # Handlers are not registered for every event type; events without
    # one are simply ignored.
    logging.debug('Unbound event type %s', event.type)
    return
  callback(event)
Jon Salz4f6c7172012-06-11 20:45:36 +0800692
def check_critical_factory_note(self):
  '''
  Tells whether the most recent factory note is critical.

  Reads the 'factory_note' shared data item (passing True as the second
  argument of get_shared_data, as the original code does).

  Returns:
    True if there is at least one note and the last one has level
    'CRITICAL'; False otherwise. The result is always a bool, including
    when there are no notes.
  '''
  notes = self.state_instance.get_shared_data('factory_note', True)
  if not notes:
    return False
  return bool(notes[-1]['level'] == 'CRITICAL')
699
def run_next_test(self):
  '''
  Starts the test(s) at the head of self.tests_to_run that may run now.

  Returns as soon as the head of the queue has to wait (it is already
  running, a test it requires is still active, or non-backgroundable
  tests are in flight), when a shutdown has been initiated, or when the
  queue is empty. If the last factory note is critical, the queue is
  cleared and nothing is run.
  '''
  self.reap_completed_tests()
  if self.tests_to_run and self.check_critical_factory_note():
    self.tests_to_run.clear()
    return

  while self.tests_to_run:
    logging.debug('Tests to run: %s',
                  [queued.path for queued in self.tests_to_run])

    test = self.tests_to_run[0]

    if test in self.invocations:
      logging.info('Next test %s is already running', test.path)
      self.tests_to_run.popleft()
      return

    # Hold off while anything this test requires is still running.
    for requirement in test.require_run:
      for required in requirement.test.walk():
        if required.get_state().status == TestState.ACTIVE:
          logging.info('Waiting for active test %s to complete '
                       'before running %s', required.path, test.path)
          return

    # Tests may only overlap when both the candidate and every running
    # test are backgroundable.
    if self.invocations:
      can_overlap = test.backgroundable and all(
          running.backgroundable for running in self.invocations)
      if not can_overlap:
        logging.debug('Waiting for non-backgroundable tests to '
                      'complete before running %s', test.path)
        return

    if test.get_state().skip:
      factory.console.info('Skipping test %s', test.path)
      test.update_state(status=TestState.PASSED,
                        error_msg=TestState.SKIPPED_MSG)
      self.tests_to_run.popleft()
      continue

    self.tests_to_run.popleft()

    # For each requirement, record the first test (walking up to, but not
    # including, this test itself) that is untested, or that has not
    # passed when the requirement demands a pass.
    unmet = set()
    for requirement in test.require_run:
      for required in requirement.test.walk():
        if required == test:
          # Reached this test itself; stop checking this requirement.
          break
        status = required.get_state().status
        if (status == TestState.UNTESTED or
            (requirement.passed and status != TestState.PASSED)):
          unmet.add(required)
          break

    if unmet:
      untested_paths = ', '.join(sorted(x.path for x in unmet))
      in_engineering_mode = self.state_instance.get_shared_data(
          'engineering_mode', optional=True)
      if in_engineering_mode:
        # Engineering mode lets the test run regardless.
        factory.console.warn('In engineering mode; running '
                             '%s even though required tests '
                             '[%s] have not completed',
                             test.path, untested_paths)
      else:
        # Outside engineering mode the test is marked failed instead.
        error_msg = ('Required tests [%s] have not been run yet'
                     % untested_paths)
        factory.console.error('Not running %s: %s',
                              test.path, error_msg)
        test.update_state(status=TestState.FAILED,
                          error_msg=error_msg)
        continue

    if isinstance(test, factory.ShutdownStep):
      if os.path.exists(NO_REBOOT_FILE):
        test.update_state(
            status=TestState.FAILED, increment_count=1,
            error_msg=('Skipped shutdown since %s is present' %
                       NO_REBOOT_FILE))
        continue

      test.update_state(status=TestState.ACTIVE, increment_count=1,
                        error_msg='', shutdown_count=0)
      if self._prompt_cancel_shutdown(test, 1):
        self.event_log.Log('reboot_cancelled')
        test.update_state(
            status=TestState.FAILED, increment_count=1,
            error_msg='Shutdown aborted by operator',
            shutdown_count=0)
        continue

      # Persist the remaining queue and the shutdown time in the state
      # server before shutting down.
      remaining_paths = [queued.path for queued in self.tests_to_run]
      self.state_instance.set_shared_data('tests_after_shutdown',
                                          remaining_paths)
      self.state_instance.set_shared_data('shutdown_time', time.time())

      with self.env.lock:
        self.event_log.Log('shutdown', operation=test.operation)
        shutdown_result = self.env.shutdown(test.operation)

      if shutdown_result:
        # That's all, folks!
        self.run_queue.put(None)
        return

      # The environment did not shut down (e.g., in the chroot): just
      # pass the step.
      test.update_state(status=TestState.PASSED)
      self.state_instance.set_shared_data('tests_after_shutdown', None)
      # An event with no fields signals that no shutdown is pending any
      # longer.
      self.event_client.post_event(Event(Event.Type.PENDING_SHUTDOWN))
      continue

    self._run_test(test, test.iterations, test.retries)
Jon Salz1acc8742012-07-17 17:45:55 +0800819
def _run_test(self, test, iterations_left=None, retries_left=None):
  '''
  Creates, registers and starts a TestInvocation for the given test.

  Args:
    test: The test to run.
    iterations_left: Passed through to test.update_state.
    retries_left: Passed through to test.update_state.
  '''
  invocation = TestInvocation(self, test, on_completion=self.run_next_test)
  is_visible = (self.visible_test == test)
  started_state = test.update_state(
      status=TestState.ACTIVE,
      increment_count=1,
      error_msg='',
      invocation=invocation.uuid,
      iterations_left=iterations_left,
      retries_left=retries_left,
      visible=is_visible)
  invocation.count = started_state.count

  self.invocations[test] = invocation
  # With nothing on screen yet, a test that has a UI becomes the visible
  # one.
  if self.visible_test is None and test.has_ui:
    self.set_visible_test(test)
  self.check_exclusive()
  invocation.start()
Jon Salz5f2a0672012-05-22 17:14:06 +0800834
def check_exclusive(self):
  '''
  Reconciles exclusive resources with the currently running tests.

  Works out which EXCLUSIVE_OPTIONS items are claimed by any test in
  self.invocations, disables/enables networking for items that were
  newly claimed/released, updates the cpufreq manager and the charge
  state, and stores the result in self.exclusive_items.
  '''
  # Short alias for a long name.
  EXCL_OPT = factory.FactoryTest.EXCLUSIVE_OPTIONS

  claimed_now = set(
      item for item in EXCL_OPT
      if any(test.is_exclusive(item) for test in self.invocations))

  newly_claimed = claimed_now - self.exclusive_items
  if EXCL_OPT.NETWORKING in newly_claimed:
    logging.info('Disabling network')
    self.connection_manager.DisableNetworking()
  if EXCL_OPT.CHARGER in newly_claimed:
    logging.info('Stop controlling charger')

  newly_released = self.exclusive_items - claimed_now
  if EXCL_OPT.NETWORKING in newly_released:
    logging.info('Re-enabling network')
    self.connection_manager.EnableNetworking()
  if EXCL_OPT.CHARGER in newly_released:
    logging.info('Start controlling charger')

  if self.cpufreq_manager:
    enabled = EXCL_OPT.CPUFREQ not in claimed_now
    try:
      self.cpufreq_manager.SetEnabled(enabled)
    except:  # pylint: disable=W0702
      if enabled:
        action = 'enable'
      else:
        action = 'disable'
      logging.exception('Unable to %s cpufreq services', action)

  # The charge state is only touched when no running test claims the
  # charger, and never inside the chroot.
  charger_is_free = EXCL_OPT.CHARGER not in claimed_now
  if charger_is_free and not utils.in_chroot():
    if self.charge_manager:
      self.charge_manager.AdjustChargeState()
    else:
      try:
        system.GetBoard().SetChargeState(Board.ChargeState.CHARGE)
      except BoardException:
        logging.exception('Unable to set charge state on this board')

  self.exclusive_items = claimed_now
Jon Salz5da61e62012-05-31 13:06:22 +0800877
def check_for_updates(self):
  '''
  Kicks off an asynchronous update check when one is due.

  Nothing happens if update_period_secs is unset in the test list
  options, or if less than that many seconds have elapsed since
  self.last_update_check.
  '''
  period_secs = self.test_list.options.update_period_secs
  if not period_secs:
    # Update checking is not enabled.
    return

  now = time.time()
  if self.last_update_check and (now - self.last_update_check < period_secs):
    # Too soon since the previous check.
    return

  self.last_update_check = now

  def handle_check_for_update(reached_shopfloor, md5sum, needs_update):
    # Callback for updater.CheckForUpdateAsync. When the recorded MD5SUM
    # changes, store it and queue a system-info refresh on the run queue.
    if not reached_shopfloor:
      return
    if needs_update:
      new_update_md5sum = md5sum
    else:
      new_update_md5sum = None
    if system.SystemInfo.update_md5sum != new_update_md5sum:
      logging.info('Received new update MD5SUM: %s', new_update_md5sum)
      system.SystemInfo.update_md5sum = new_update_md5sum
      self.run_queue.put(self.update_system_info)

  updater.CheckForUpdateAsync(
      handle_check_for_update,
      self.test_list.options.shopfloor_timeout_secs)
906
def cancel_pending_tests(self):
  '''Empties the queue of tests to run by calling run_tests with no subtrees.'''
  no_subtrees = []
  self.run_tests(no_subtrees)
910
def run_tests(self, subtrees, untested_only=False):
  '''
  Replaces the run queue with the leaf tests under subtrees and runs them.

  The queue is rebuilt from scratch (as a deque, in walk order) and
  run_next_test is then called to start whatever may run.

  Args:
    subtrees: Node or nodes containing tests to run. May be a single
      node or a list/tuple of nodes (including subclasses of those
      types). Duplicates are ignored.
    untested_only: If True, only tests whose status is
      TestState.UNTESTED are queued.
  '''
  # isinstance (rather than an exact type comparison) so that list
  # subclasses and tuples are treated as collections of nodes instead of
  # being wrapped as if they were a single node.
  if not isinstance(subtrees, (list, tuple)):
    subtrees = [subtrees]

  # Nodes visited so far, to avoid queueing duplicates.
  seen = set()

  self.tests_to_run = deque()
  for subtree in subtrees:
    for test in subtree.walk():
      if test in seen:
        continue
      seen.add(test)

      if not test.is_leaf():
        continue
      if (untested_only and
          test.get_state().status != TestState.UNTESTED):
        continue
      self.tests_to_run.append(test)
  self.run_next_test()
Hung-Te Linf2f78f72012-02-08 19:27:11 +0800942
def reap_completed_tests(self):
  '''
  Removes completed tests from the set of active tests.

  For each completed invocation the test's state is updated from
  update_state_on_completion and the invocation is dropped. A test is
  started again if it passed with iterations left, or failed with
  retries left. If the stop_on_failure option is set and a test failed,
  the run queue is emptied.

  Also kicks the event log watcher if anything completed, and updates
  the visible test if it was reaped.
  '''
  test_completed = False
  # Iterate over a snapshot: entries are deleted, and _run_test may add
  # new ones, while looping.
  for t, v in list(self.invocations.items()):
    if not v.is_completed():
      continue

    test_completed = True
    new_state = t.update_state(**v.update_state_on_completion)
    del self.invocations[t]

    # Stop on failure if flag is true.
    if (self.test_list.options.stop_on_failure and
        new_state.status == TestState.FAILED):
      # Clean all the tests to cause goofy to stop. The queue must stay
      # a deque: other methods call popleft()/clear() on it.
      self.tests_to_run = deque()
      factory.console.info("Stop on failure triggered. Empty the queue.")

    if new_state.iterations_left and new_state.status == TestState.PASSED:
      # Play it again, Sam!
      self._run_test(t)
    # new_state.retries_left is obtained after update.
    # For retries_left == 0, test can still be run for the last time.
    # The explicit None check keeps an unset retries_left from being
    # compared with an integer.
    elif (new_state.retries_left is not None and
          new_state.retries_left >= 0 and
          new_state.status == TestState.FAILED):
      # Still have to retry, Sam!
      self._run_test(t)

  if test_completed:
    self.log_watcher.KickWatchThread()

  if (self.visible_test is None or
      self.visible_test not in self.invocations):
    self.set_visible_test(None)
    # Make the first running test, if any, the visible test
    for t in self.test_list.walk():
      if t in self.invocations:
        self.set_visible_test(t)
        break
984
def kill_active_tests(self, abort, root=None, reason=None):
  '''
  Aborts every running test (optionally only those under root) and waits.

  Args:
    abort: If False, each killed test is reset to UNTESTED after its
      completion state has been applied; if True, the completion state
      is left as is.
    root: If set, only tests that have root as an ancestor are killed.
    reason: Passed to the invocation's abort_and_join.
  '''
  self.reap_completed_tests()
  # Snapshot the mapping, since entries are deleted inside the loop.
  for test, invocation in list(self.invocations.items()):
    in_scope = (not root) or test.has_ancestor(root)
    if not in_scope:
      continue

    factory.console.info('Killing active test %s...' % test.path)
    invocation.abort_and_join(reason)
    factory.console.info('Killed %s' % test.path)
    test.update_state(**invocation.update_state_on_completion)
    del self.invocations[test]

    if not abort:
      test.update_state(status=TestState.UNTESTED)
  self.reap_completed_tests()
1008
def stop(self, root=None, fail=False, reason=None):
  '''
  Kills active tests and drops queued tests under root, then continues.

  Args:
    root: Subtree to stop. Queued tests that do not have root as an
      ancestor are kept; if root is unset, the whole queue is emptied.
    fail: Passed to kill_active_tests as its first (abort) argument.
    reason: Passed to kill_active_tests.
  '''
  self.kill_active_tests(fail, root, reason)
  # Keep only the queued tests that are outside the stopped subtree.
  if root:
    survivors = deque(
        queued for queued in self.tests_to_run
        if not queued.has_ancestor(root))
  else:
    survivors = deque()
  self.tests_to_run = survivors
  self.run_next_test()
Jon Salz0697cbf2012-07-04 15:14:04 +08001015
def clear_state(self, root=None):
  '''
  Stops tests under root and resets all of its leaf tests to UNTESTED.

  Args:
    root: Subtree to clear; defaults to the whole test list.
  '''
  target = self.test_list if root is None else root
  self.stop(target, reason='Clearing test state')
  leaves = (node for node in target.walk() if node.is_leaf())
  for leaf in leaves:
    leaf.update_state(status=TestState.UNTESTED)
1023
def abort_active_tests(self, reason=None):
  '''Kills all active tests, calling kill_active_tests with abort=True.

  Args:
    reason: Passed through to kill_active_tests.
  '''
  abort = True
  self.kill_active_tests(abort, reason=reason)
Jon Salz0697cbf2012-07-04 15:14:04 +08001026
def main(self):
  '''
  Initializes Goofy, records the outcome in the event log, and runs it.

  Any exception raised during initialization is re-raised after a
  best-effort attempt to log it.
  '''
  syslog.openlog('goofy')

  try:
    self.status = Status.INITIALIZING
    self.init()
    self.event_log.Log('goofy_init', success=True)
  except:
    # Record the failure if an event log is available; errors while
    # logging are swallowed so the original exception propagates.
    if self.event_log:
      try:
        trace = traceback.format_exc()
        self.event_log.Log('goofy_init', success=False, trace=trace)
      except:  # pylint: disable=W0702
        pass
    raise

  self.status = Status.RUNNING
  syslog.syslog('Goofy (factory test harness) starting')
  self.run()
1048
def update_system_info(self):
  '''Collects system info, stores it as shared data, posts it, and logs it.'''
  info = system.SystemInfo().__dict__
  self.state_instance.set_shared_data('system_info', info)
  info_event = Event(Event.Type.SYSTEM_INFO, system_info=info)
  self.event_client.post_event(info_event)
  logging.info('System info: %r', info)
1056
def update_factory(self, auto_run_on_restart=False, post_update_hook=None):
  '''Commences updating factory software.

  Active tests are killed (without being marked failed) and pending
  tests are cancelled before the update is attempted.

  Args:
    auto_run_on_restart: If set, 'tests_after_shutdown' is set to
      FORCE_AUTO_RUN before the update.
    post_update_hook: Optional callable invoked after a successful
      update, immediately before the reboot is requested.

  Returns:
    Nothing explicitly. When updater.TryUpdate reports success, a reboot
    is requested through self.env.shutdown('reboot').
  '''
  self.kill_active_tests(False, reason='Factory software update')
  self.cancel_pending_tests()

  def pre_update_hook():
    # Optionally arrange for tests to auto-run after the restart, then
    # close the state instance.
    if auto_run_on_restart:
      self.state_instance.set_shared_data('tests_after_shutdown',
                                          FORCE_AUTO_RUN)
    self.state_instance.close()

  updated = updater.TryUpdate(pre_update_hook=pre_update_hook)
  if not updated:
    return
  if post_update_hook:
    post_update_hook()
  self.env.shutdown('reboot')
Jon Salz0697cbf2012-07-04 15:14:04 +08001082
def handle_sigint(self, dummy_signum, dummy_frame):
  '''Signal handler for SIGINT.

  Logs the signal, puts None on the run queue, and raises
  KeyboardInterrupt. Both arguments are ignored.
  '''
  logging.error('Received SIGINT')
  stop_marker = None
  self.run_queue.put(stop_marker)
  raise KeyboardInterrupt()
1087
def find_kcrashes(self):
  """Finds new files in /var/spool/crash, logs them, and marks them seen.

  Paths already listed in the 'seen_crashes' shared data item are
  skipped. For .kcrash and .meta files, up to MAX_CRASH_FILE_SIZE bytes
  of content are logged and the file is copied to the factory 'kcrash'
  directory. A 'crash_file' event is logged for each new file.
  """
  previously_seen = self.state_instance.get_shared_data(
      'seen_crashes', optional=True)
  seen_crashes = set(previously_seen or [])

  for path in glob.glob('/var/spool/crash/*'):
    if not os.path.isfile(path) or path in seen_crashes:
      continue
    try:
      stat = os.stat(path)
      mtime = utils.TimeString(stat.st_mtime)
      logging.info(
          'Found new crash file %s (%d bytes at %s)',
          path, stat.st_size, mtime)
      extra_log_args = {}

      try:
        ext = os.path.splitext(path)[1]
        if ext in ('.kcrash', '.meta'):
          ext = ext.replace('.', '')
          with open(path) as f:
            data = f.read(MAX_CRASH_FILE_SIZE)
            tell = f.tell()

          if tell == stat.st_size:
            truncation_note = ''
          else:
            truncation_note = (
                '(truncated to %d bytes)' % MAX_CRASH_FILE_SIZE)
          # Prefix every line of the content with the file kind.
          prefixed = ('\n' + data).replace('\n', '\n ' + ext + '> ')
          logging.info('Contents of %s%s:%s',
                       path, truncation_note, prefixed)
          extra_log_args['data'] = data

          # Keep a copy under the factory 'kcrash' directory.
          kcrash_dir = factory.get_factory_root('kcrash')
          utils.TryMakeDirs(kcrash_dir)
          shutil.copy(path, kcrash_dir)
          copied_to = os.path.join(kcrash_dir, os.path.basename(path))
          logging.info('Copied to %s', copied_to)
      finally:
        # Whatever happened above, still try to record the file in the
        # event log.
        self.event_log.Log('crash_file',
                           path=path, size=stat.st_size, mtime=mtime,
                           **extra_log_args)
    except:  # pylint: disable=W0702
      logging.exception('Unable to handle crash files %s', path)
    seen_crashes.add(path)

  self.state_instance.set_shared_data('seen_crashes', list(seen_crashes))
1139
def GetTestList(self, test_list_id):
  """Looks up a test list by ID in self.test_lists.

  Args:
    test_list_id: Key into self.test_lists.

  Returns:
    The test list stored under test_list_id.

  Raises:
    TestListError: The test list ID is not valid.
  """
  try:
    found = self.test_lists[test_list_id]
  except KeyError:
    available_ids = ', '.join(sorted(self.test_lists.keys()))
    raise test_lists.TestListError(
        '%r is not a valid test list ID (available IDs are [%s])' % (
            test_list_id, available_ids))
  else:
    return found
1152
def InitTestLists(self):
  """Builds all test lists and selects the active one as self.test_list.

  The ID comes from self.options.test_list, falling back to
  test_lists.GetActiveTestListId(). A value containing a path separator
  is read as an old-style test list file instead of being looked up.
  """
  self.test_lists = test_lists.BuildAllTestLists()
  logging.info('Loaded test lists: [%s]',
               test_lists.DescribeTestLists(self.test_lists))

  if not self.options.test_list:
    self.options.test_list = test_lists.GetActiveTestListId()

  selected = self.options.test_list
  if os.sep in selected:
    # A path to an old-style test list; read it directly.
    self.test_list = factory.read_test_list(selected)
  else:
    self.test_list = self.GetTestList(selected)

  logging.info('Active test list: %s', self.test_list.test_list_id)

  if isinstance(self.test_list, test_lists.OldStyleTestList):
    # Replace the OldStyleTestList with what its Load() returns (see
    # OldStyleTestList for why this is necessary).
    self.test_list = self.test_list.Load()

  self.test_list.state_instance = self.state_instance
1176
def init_hook(self):
  """Instantiates the hooks class named in the test list options.

  The dotted name in options.hooks_class is split into module and class,
  the class is imported and instantiated as self.hooks, given the test
  list, and its OnStartup() is called.
  """
  dotted_name = self.test_list.options.hooks_class
  module_name, class_name = dotted_name.rsplit('.', 1)
  # A non-empty fromlist makes __import__ return the named module itself.
  hooks_module = __import__(module_name, fromlist=[class_name])
  hooks_class = getattr(hooks_module, class_name)
  self.hooks = hooks_class()
  assert isinstance(self.hooks, factory.Hooks), (
      "hooks should be of type Hooks but is %r" % type(self.hooks))
  self.hooks.test_list = self.test_list
  self.hooks.OnStartup()
1185
Jon Salz0697cbf2012-07-04 15:14:04 +08001186 def init(self, args=None, env=None):
1187 '''Initializes Goofy.
1188
1189 Args:
1190 args: A list of command-line arguments. Uses sys.argv if
1191 args is None.
1192 env: An Environment instance to use (or None to choose
1193 FakeChrootEnvironment or DUTEnvironment as appropriate).
1194 '''
Jon Salz77c151e2012-08-28 07:20:37 +08001195 signal.signal(signal.SIGINT, self.handle_sigint)
1196
Jon Salz0697cbf2012-07-04 15:14:04 +08001197 parser = OptionParser()
1198 parser.add_option('-v', '--verbose', dest='verbose',
Jon Salz8fa8e832012-07-13 19:04:09 +08001199 action='store_true',
1200 help='Enable debug logging')
Jon Salz0697cbf2012-07-04 15:14:04 +08001201 parser.add_option('--print_test_list', dest='print_test_list',
Jon Salz8fa8e832012-07-13 19:04:09 +08001202 metavar='FILE',
1203 help='Read and print test list FILE, and exit')
Jon Salz0697cbf2012-07-04 15:14:04 +08001204 parser.add_option('--restart', dest='restart',
Jon Salz8fa8e832012-07-13 19:04:09 +08001205 action='store_true',
1206 help='Clear all test state')
Jon Salz0697cbf2012-07-04 15:14:04 +08001207 parser.add_option('--ui', dest='ui', type='choice',
Jon Salz8fa8e832012-07-13 19:04:09 +08001208 choices=['none', 'gtk', 'chrome'],
Jon Salz2f881df2013-02-01 17:00:35 +08001209 default='chrome',
Jon Salz8fa8e832012-07-13 19:04:09 +08001210 help='UI to use')
Jon Salz0697cbf2012-07-04 15:14:04 +08001211 parser.add_option('--ui_scale_factor', dest='ui_scale_factor',
Jon Salz8fa8e832012-07-13 19:04:09 +08001212 type='int', default=1,
1213 help=('Factor by which to scale UI '
1214 '(Chrome UI only)'))
Jon Salz0697cbf2012-07-04 15:14:04 +08001215 parser.add_option('--test_list', dest='test_list',
Jon Salz8fa8e832012-07-13 19:04:09 +08001216 metavar='FILE',
1217 help='Use FILE as test list')
Jon Salzc79a9982012-08-30 04:42:01 +08001218 parser.add_option('--dummy_shopfloor', action='store_true',
1219 help='Use a dummy shopfloor server')
chungyiafe8f772012-08-15 19:36:29 +08001220 parser.add_option('--automation', dest='automation',
1221 action='store_true',
1222 help='Enable automation on running factory test')
Ricky Liang09216dc2013-02-22 17:26:45 +08001223 parser.add_option('--one_pixel_less', dest='one_pixel_less',
1224 action='store_true',
1225 help=('Start Chrome one pixel less than the full screen.'
1226 'Needed by Exynos platform to run GTK.'))
Jon Salz0697cbf2012-07-04 15:14:04 +08001227 (self.options, self.args) = parser.parse_args(args)
1228
Jon Salz46b89562012-07-05 11:49:22 +08001229 # Make sure factory directories exist.
1230 factory.get_log_root()
1231 factory.get_state_root()
1232 factory.get_test_data_root()
1233
Jon Salz0697cbf2012-07-04 15:14:04 +08001234 global _inited_logging # pylint: disable=W0603
1235 if not _inited_logging:
1236 factory.init_logging('goofy', verbose=self.options.verbose)
1237 _inited_logging = True
Jon Salz8fa8e832012-07-13 19:04:09 +08001238
Jon Salz0f996602012-10-03 15:26:48 +08001239 if self.options.print_test_list:
1240 print factory.read_test_list(
1241 self.options.print_test_list).__repr__(recursive=True)
1242 sys.exit(0)
1243
Jon Salzee85d522012-07-17 14:34:46 +08001244 event_log.IncrementBootSequence()
Jon Salzd15bbcf2013-05-21 17:33:57 +08001245 # Don't defer logging the initial event, so we can make sure
1246 # that device_id, reimage_id, etc. are all set up.
1247 self.event_log = EventLog('goofy', defer=False)
Jon Salz0697cbf2012-07-04 15:14:04 +08001248
1249 if (not suppress_chroot_warning and
1250 factory.in_chroot() and
1251 self.options.ui == 'gtk' and
1252 os.environ.get('DISPLAY') in [None, '', ':0', ':0.0']):
1253 # That's not going to work! Tell the user how to run
1254 # this way.
1255 logging.warn(GOOFY_IN_CHROOT_WARNING)
1256 time.sleep(1)
1257
1258 if env:
1259 self.env = env
1260 elif factory.in_chroot():
1261 self.env = test_environment.FakeChrootEnvironment()
1262 logging.warn(
1263 'Using chroot environment: will not actually run autotests')
1264 else:
1265 self.env = test_environment.DUTEnvironment()
1266 self.env.goofy = self
1267
1268 if self.options.restart:
1269 state.clear_state()
1270
Jon Salz0697cbf2012-07-04 15:14:04 +08001271 if self.options.ui_scale_factor != 1 and utils.in_qemu():
1272 logging.warn(
1273 'In QEMU; ignoring ui_scale_factor argument')
1274 self.options.ui_scale_factor = 1
1275
1276 logging.info('Started')
1277
1278 self.start_state_server()
1279 self.state_instance.set_shared_data('hwid_cfg', get_hwid_cfg())
1280 self.state_instance.set_shared_data('ui_scale_factor',
Ricky Liang09216dc2013-02-22 17:26:45 +08001281 self.options.ui_scale_factor)
1282 self.state_instance.set_shared_data('one_pixel_less',
1283 self.options.one_pixel_less)
Jon Salz0697cbf2012-07-04 15:14:04 +08001284 self.last_shutdown_time = (
1285 self.state_instance.get_shared_data('shutdown_time', optional=True))
1286 self.state_instance.del_shared_data('shutdown_time', optional=True)
Jon Salzb19ea072013-02-07 16:35:00 +08001287 self.state_instance.del_shared_data('startup_error', optional=True)
Jon Salz0697cbf2012-07-04 15:14:04 +08001288
Jon Salz128b0932013-07-03 16:55:26 +08001289 try:
1290 self.InitTestLists()
1291 except: # pylint: disable=W0702
1292 logging.exception('Unable to initialize test lists')
1293 self.state_instance.set_shared_data(
1294 'startup_error',
1295 'Unable to initialize test lists\n%s' % (
1296 traceback.format_exc()))
Jon Salzb19ea072013-02-07 16:35:00 +08001297 if self.options.ui == 'chrome':
1298 # Create an empty test list with default options so that the rest of
1299 # startup can proceed.
1300 self.test_list = factory.FactoryTestList(
1301 [], self.state_instance, factory.Options())
1302 else:
1303 # Bail with an error; no point in starting up.
1304 sys.exit('No valid test list; exiting.')
1305
Jon Salz822838b2013-03-25 17:32:33 +08001306 if self.test_list.options.clear_state_on_start:
1307 self.state_instance.clear_test_state()
1308
Vic Yang3e1cf5d2013-06-05 18:50:24 +08001309 if system.SystemInfo().firmware_version is None and not utils.in_chroot():
Vic Yang9bd4f772013-06-04 17:34:00 +08001310 self.state_instance.set_shared_data('startup_error',
1311 'Netboot firmware detected\n'
1312 'Connect Ethernet and reboot to re-image.\n'
1313 u'侦测到网路开机固件\n'
1314 u'请连接乙太网并重启')
1315
Jon Salz0697cbf2012-07-04 15:14:04 +08001316 if not self.state_instance.has_shared_data('ui_lang'):
1317 self.state_instance.set_shared_data('ui_lang',
1318 self.test_list.options.ui_lang)
1319 self.state_instance.set_shared_data(
1320 'test_list_options',
1321 self.test_list.options.__dict__)
1322 self.state_instance.test_list = self.test_list
1323
Cheng-Yi Chiang39d32ad2013-07-23 15:02:38 +08001324 self.check_log_rotation()
Jon Salz83ef34b2012-11-01 19:46:35 +08001325
Shuo-Peng Liao52b90da2013-06-30 17:00:06 +08001326 self.init_hook()
1327
Jon Salz23926422012-09-01 03:38:13 +08001328 if self.options.dummy_shopfloor:
1329 os.environ[shopfloor.SHOPFLOOR_SERVER_ENV_VAR_NAME] = (
1330 'http://localhost:%d/' % shopfloor.DEFAULT_SERVER_PORT)
1331 self.dummy_shopfloor = Spawn(
1332 [os.path.join(factory.FACTORY_PATH, 'bin', 'shopfloor_server'),
1333 '--dummy'])
1334 elif self.test_list.options.shopfloor_server_url:
1335 shopfloor.set_server_url(self.test_list.options.shopfloor_server_url)
Jon Salz2bf2f6b2013-03-28 18:49:26 +08001336 shopfloor.set_enabled(True)
Jon Salz23926422012-09-01 03:38:13 +08001337
Jon Salz0f996602012-10-03 15:26:48 +08001338 if self.test_list.options.time_sanitizer and not utils.in_chroot():
Jon Salz8fa8e832012-07-13 19:04:09 +08001339 self.time_sanitizer = time_sanitizer.TimeSanitizer(
1340 base_time=time_sanitizer.GetBaseTimeFromFile(
1341 # lsb-factory is written by the factory install shim during
1342 # installation, so it should have a good time obtained from
Jon Salz54882d02012-08-31 01:57:54 +08001343 # the mini-Omaha server. If it's not available, we'll use
1344 # /etc/lsb-factory (which will be much older, but reasonably
1345 # sane) and rely on a shopfloor sync to set a more accurate
1346 # time.
1347 '/usr/local/etc/lsb-factory',
1348 '/etc/lsb-release'))
Jon Salz8fa8e832012-07-13 19:04:09 +08001349 self.time_sanitizer.RunOnce()
1350
Vic Yangd8990da2013-06-27 16:57:43 +08001351 if self.test_list.options.check_cpu_usage_period_secs:
1352 self.cpu_usage_watcher = Spawn(['py/tools/cpu_usage_monitor.py',
1353 '-p', str(self.test_list.options.check_cpu_usage_period_secs)],
1354 cwd=factory.FACTORY_PATH)
1355
Jon Salz0697cbf2012-07-04 15:14:04 +08001356 self.init_states()
1357 self.start_event_server()
1358 self.connection_manager = self.env.create_connection_manager(
Tai-Hsu Lin371351a2012-08-27 14:17:14 +08001359 self.test_list.options.wlans,
1360 self.test_list.options.scan_wifi_period_secs)
Jon Salz0697cbf2012-07-04 15:14:04 +08001361 # Note that we create a log watcher even if
1362 # sync_event_log_period_secs isn't set (no background
1363 # syncing), since we may use it to flush event logs as well.
1364 self.log_watcher = EventLogWatcher(
1365 self.test_list.options.sync_event_log_period_secs,
Jon Salzd15bbcf2013-05-21 17:33:57 +08001366 event_log_db_file=None,
Jon Salz16d10542012-07-23 12:18:45 +08001367 handle_event_logs_callback=self.handle_event_logs)
Jon Salz0697cbf2012-07-04 15:14:04 +08001368 if self.test_list.options.sync_event_log_period_secs:
1369 self.log_watcher.StartWatchThread()
1370
Cheng-Yi Chiang344b10f2013-05-03 16:44:03 +08001371 # Note that we create a system log manager even if
1372 # sync_log_period_secs isn't set (no background
1373 # syncing), since we may kick it to sync logs in its
1374 # thread.
Cheng-Yi Chiangd3516a32013-07-17 15:30:47 +08001375 if self.test_list.options.enable_sync_log:
1376 self.system_log_manager = SystemLogManager(
1377 sync_log_paths=self.test_list.options.sync_log_paths,
1378 sync_period_sec=self.test_list.options.sync_log_period_secs,
1379 clear_log_paths=self.test_list.options.clear_log_paths)
1380 self.system_log_manager.StartSyncThread()
Cheng-Yi Chiang344b10f2013-05-03 16:44:03 +08001381
Jon Salz0697cbf2012-07-04 15:14:04 +08001382 self.update_system_info()
1383
Vic Yang4953fc12012-07-26 16:19:53 +08001384 assert ((self.test_list.options.min_charge_pct is None) ==
1385 (self.test_list.options.max_charge_pct is None))
Vic Yange83d9a12013-04-19 20:00:20 +08001386 if utils.in_chroot():
1387 logging.info('In chroot, ignoring charge manager and charge state')
1388 elif self.test_list.options.min_charge_pct is not None:
Vic Yang4953fc12012-07-26 16:19:53 +08001389 self.charge_manager = ChargeManager(self.test_list.options.min_charge_pct,
1390 self.test_list.options.max_charge_pct)
Jon Salzad7353b2012-10-15 16:22:46 +08001391 system.SystemStatus.charge_manager = self.charge_manager
Cheng-Yi Chiangd8186952013-04-04 23:41:14 +08001392 else:
1393 # Goofy should set charger state to charge if charge_manager is disabled.
1394 try:
1395 system.GetBoard().SetChargeState(Board.ChargeState.CHARGE)
1396 except BoardException:
1397 logging.exception('Unable to set charge state on this board')
Vic Yang4953fc12012-07-26 16:19:53 +08001398
Cheng-Yi Chiangcdfa4182013-05-05 03:20:19 +08001399 self.core_dump_manager = CoreDumpManager(
1400 self.test_list.options.core_dump_watchlist)
1401
Jon Salz0697cbf2012-07-04 15:14:04 +08001402 os.environ['CROS_FACTORY'] = '1'
1403 os.environ['CROS_DISABLE_SITE_SYSINFO'] = '1'
1404
1405 # Set CROS_UI since some behaviors in ui.py depend on the
1406 # particular UI in use. TODO(jsalz): Remove this (and all
1407 # places it is used) when the GTK UI is removed.
1408 os.environ['CROS_UI'] = self.options.ui
1409
Jon Salzce6a7f82013-06-10 18:22:54 +08001410 if not utils.in_chroot():
Jon Salzddf0d052013-06-18 12:52:44 +08001411 self.cpufreq_manager = CpufreqManager(event_log=self.event_log)
Jon Salzce6a7f82013-06-10 18:22:54 +08001412
Justin Chuang31b02432013-06-27 15:16:51 +08001413 # Startup hooks may want to skip some tests.
1414 self.update_skipped_tests()
Jon Salz416f9cc2013-05-10 18:32:50 +08001415
Jon Salze12c2b32013-06-25 16:24:34 +08001416 self.find_kcrashes()
1417
Jon Salz0697cbf2012-07-04 15:14:04 +08001418 if self.options.ui == 'chrome':
1419 self.env.launch_chrome()
1420 logging.info('Waiting for a web socket connection')
Cheng-Yi Chiangfd8ed392013-03-08 21:37:31 +08001421 self.web_socket_manager.wait()
Jon Salz0697cbf2012-07-04 15:14:04 +08001422
1423 # Wait for the test widget size to be set; this is done in
1424 # an asynchronous RPC so there is a small chance that the
1425 # web socket might be opened first.
1426 for _ in range(100): # 10 s
1427 try:
1428 if self.state_instance.get_shared_data('test_widget_size'):
1429 break
Hung-Te Linf2f78f72012-02-08 19:27:11 +08001430 except KeyError:
Jon Salz0697cbf2012-07-04 15:14:04 +08001431 pass # Retry
1432 time.sleep(0.1) # 100 ms
1433 else:
1434 logging.warn('Never received test_widget_size from UI')
Jon Salz45297282013-05-18 14:31:47 +08001435
1436 # Send Chrome a Tab to get focus to the factory UI
1437 # (http://crosbug.com/p/19444). TODO(jsalz): remove this hack
1438 # and figure out the right way to get the focus to Chrome.
1439 if not utils.in_chroot():
1440 Spawn(
1441 [os.path.join(factory.FACTORY_PATH, 'bin', 'send_key'), 'Tab'],
1442 check_call=True, log=True)
Jon Salz0697cbf2012-07-04 15:14:04 +08001443 elif self.options.ui == 'gtk':
1444 self.start_ui()
Hung-Te Linf2f78f72012-02-08 19:27:11 +08001445
Ricky Liang650f6bf2012-09-28 13:22:54 +08001446 # Create download path for autotest beforehand or autotests run at
1447 # the same time might fail due to race condition.
1448 if not factory.in_chroot():
1449 utils.TryMakeDirs(os.path.join('/usr/local/autotest', 'tests',
1450 'download'))
1451
Jon Salz0697cbf2012-07-04 15:14:04 +08001452 def state_change_callback(test, test_state):
1453 self.event_client.post_event(
1454 Event(Event.Type.STATE_CHANGE,
1455 path=test.path, state=test_state))
1456 self.test_list.state_change_callback = state_change_callback
Jon Salz73e0fd02012-04-04 11:46:38 +08001457
Jon Salza6711d72012-07-18 14:33:03 +08001458 for handler in self.on_ui_startup:
1459 handler()
1460
1461 self.prespawner = Prespawner()
1462 self.prespawner.start()
1463
Jon Salz0697cbf2012-07-04 15:14:04 +08001464 try:
1465 tests_after_shutdown = self.state_instance.get_shared_data(
1466 'tests_after_shutdown')
1467 except KeyError:
1468 tests_after_shutdown = None
Jon Salz57717ca2012-04-04 16:47:25 +08001469
Jon Salz5c344f62012-07-13 14:31:16 +08001470 force_auto_run = (tests_after_shutdown == FORCE_AUTO_RUN)
1471 if not force_auto_run and tests_after_shutdown is not None:
Jon Salz0697cbf2012-07-04 15:14:04 +08001472 logging.info('Resuming tests after shutdown: %s',
1473 tests_after_shutdown)
Jon Salz0697cbf2012-07-04 15:14:04 +08001474 self.tests_to_run.extend(
1475 self.test_list.lookup_path(t) for t in tests_after_shutdown)
1476 self.run_queue.put(self.run_next_test)
1477 else:
Jon Salz5c344f62012-07-13 14:31:16 +08001478 if force_auto_run or self.test_list.options.auto_run_on_start:
Jon Salz0697cbf2012-07-04 15:14:04 +08001479 self.run_queue.put(
1480 lambda: self.run_tests(self.test_list, untested_only=True))
Jon Salz5c344f62012-07-13 14:31:16 +08001481 self.state_instance.set_shared_data('tests_after_shutdown', None)
Hung-Te Linf2f78f72012-02-08 19:27:11 +08001482
Dean Liao592e4d52013-01-10 20:06:39 +08001483 self.may_disable_cros_shortcut_keys()
1484
def may_disable_cros_shortcut_keys(self):
  '''Starts a key filter when the test list disables CrOS shortcut keys.

  Does nothing unless test_list.options.disable_cros_shortcut_keys is
  set.  Otherwise a KeyFilter is built from the caps-lock related
  options, stored in self.key_filter and started.
  '''
  options = self.test_list.options
  if not options.disable_cros_shortcut_keys:
    return

  logging.info('Filter ChromeOS shortcut keys.')
  key_filter = KeyFilter(
      unmap_caps_lock=options.disable_caps_lock,
      caps_lock_keycode=options.caps_lock_keycode)
  self.key_filter = key_filter
  key_filter.Start()
1493
def run(self):
  '''Runs Goofy: processes events until run_once() asks to stop.'''
  keep_going = True
  while keep_going:
    # Always block so that we wait for work instead of spinning.
    keep_going = self.run_once(True)
Jon Salz73e0fd02012-04-04 11:46:38 +08001499
def run_once(self, block=False):
  '''Runs all items pending in the event loop.

  Args:
    block: If true, block until at least one event is processed.

  Returns:
    True to keep going or False to shut down.
  '''
  pending = utils.DrainQueue(self.run_queue)
  while not pending:
    # Nothing on the run queue: give the idle hook a chance to run.
    self._run_queue_idle()
    if not block:
      break
    try:
      # Block for at least one event...
      first = self.run_queue.get(timeout=RUN_QUEUE_TIMEOUT_SECS)
    except Queue.Empty:
      # Timed out; loop around so _run_queue_idle() is called again.
      continue
    pending.append(first)
    # ...and grab anything else that showed up at the same time.
    pending.extend(utils.DrainQueue(self.run_queue))

  for callback in pending:
    if not callback:
      # A false item on the queue is a shutdown request.
      self.run_queue.task_done()
      return False

    try:
      callback()
    except:  # pylint: disable=W0702
      logging.exception('Error in event loop')
      exc_type, exc_value = sys.exc_info()[:2]
      self.record_exception(
          traceback.format_exception_only(exc_type, exc_value))
      # But keep going with the remaining events.
    finally:
      self.run_queue.task_done()
  return True
Jon Salz0405ab52012-03-16 15:26:52 +08001543
def _should_sync_time(self, foreground=False):
  '''Returns a true value if we should attempt syncing time with shopfloor.

  Syncing is attempted only when all of these hold: it was requested
  (foreground, or test_list.options.sync_time_period_secs is set), a time
  sanitizer exists, time has not been synced yet, and we are not in the
  chroot.

  Args:
    foreground: If True, synchronizes even if background syncing
      is disabled (e.g., in explicit sync requests from the
      SyncShopfloor test).
  '''
  requested = foreground or self.test_list.options.sync_time_period_secs
  if not requested:
    return requested
  if not self.time_sanitizer:
    return self.time_sanitizer
  if self.time_synced:
    return False
  return not factory.in_chroot()
1557
def sync_time_with_shopfloor_server(self, foreground=False):
  '''Syncs time with shopfloor server, if not yet synced.

  Args:
    foreground: If True, synchronizes even if background syncing
      is disabled (e.g., in explicit sync requests from the
      SyncShopfloor test).

  Returns:
    The current value of self.time_synced: True if this sync (or a
    previous sync) succeeded, otherwise whatever unsynced value it
    holds (e.g. when no time sanitizer is available).

  Raises:
    Exception if unable to contact the shopfloor server.
  '''
  if not self._should_sync_time(foreground):
    return self.time_synced

  self.time_sanitizer.SyncWithShopfloor()
  # Only reached when SyncWithShopfloor() did not raise.
  self.time_synced = True
  return self.time_synced
1577
def log_disk_space_stats(self):
  '''Periodically logs disk usage and reports nearly-full partitions.

  Runs at most once every test_list.options.log_disk_space_period_secs
  seconds, and never in the chroot.  If usage of the partitions mounted
  on /usr/local or /var exceeds stateful_usage_threshold, an event is
  logged and the optional stateful_usage_above_threshold_action command
  is run.  The usage summary is written to the log only when it differs
  from the previously logged one.  Any failure is logged and swallowed.
  '''
  options = self.test_list.options
  if utils.in_chroot() or not options.log_disk_space_period_secs:
    return

  now = time.time()
  last_time = self.last_log_disk_space_time
  if last_time and now - last_time < options.log_disk_space_period_secs:
    # Not yet time for another check.
    return
  self.last_log_disk_space_time = now

  # Upload event if stateful partition usage is above threshold.
  # Stateful partition is mounted on /usr/local, while
  # encrypted stateful partition is mounted on /var.
  # If there are too many logs in the factory process,
  # these two partitions might get full.
  try:
    vfs_infos = disk_space.GetAllVFSInfo()
    stateful_info = encrypted_info = None
    for vfs_info in vfs_infos.values():
      mount_points = vfs_info.mount_points
      if '/usr/local' in mount_points:
        stateful_info = vfs_info
      if '/var' in mount_points:
        encrypted_info = vfs_info

    stateful = disk_space.GetPartitionUsage(stateful_info)
    encrypted = disk_space.GetPartitionUsage(encrypted_info)

    # Falsy threshold disables the check; otherwise compare the worst
    # of the four usage percentages against it.
    above_threshold = (
        options.stateful_usage_threshold and
        max(stateful.bytes_used_pct,
            stateful.inodes_used_pct,
            encrypted.bytes_used_pct,
            encrypted.inodes_used_pct) > options.stateful_usage_threshold)

    if above_threshold:
      usage = {
          'stateful': {
              'bytes_used_pct': FloatDigit(stateful.bytes_used_pct, 2),
              'inodes_used_pct': FloatDigit(stateful.inodes_used_pct, 2)},
          'encrypted_stateful': {
              'bytes_used_pct': FloatDigit(encrypted.bytes_used_pct, 2),
              'inodes_used_pct': FloatDigit(encrypted.inodes_used_pct, 2)}}
      self.event_log.Log('stateful_partition_usage', partitions=usage)
      self.log_watcher.ScanEventLogs()
      if (not utils.in_chroot() and
          options.stateful_usage_above_threshold_action):
        Spawn(options.stateful_usage_above_threshold_action, call=True)

    message = disk_space.FormatSpaceUsedAll(vfs_infos)
    if message != self.last_log_disk_space_message:
      # Escalate to a warning when over the threshold.
      emit = logging.warning if above_threshold else logging.info
      emit(message)
      self.last_log_disk_space_message = message
  except:  # pylint: disable=W0702
    logging.exception('Unable to get disk space used')
1640
def check_battery(self):
  '''Checks the current battery status.

  Logs the current battery charge level and AC status.  If the battery
  level is at or below warning_low_battery_pct while AC is disconnected,
  or at or below critical_low_battery_pct, a low_battery event is logged
  and the log sync threads are kicked so shopfloor is notified.  In the
  critical case disks are also flushed, provided the level is still
  above MIN_BATTERY_LEVEL_FOR_DISK_SYNC.

  Runs at most once every test_list.options.check_battery_period_secs
  seconds; does nothing if that option is not set.
  '''
  options = self.test_list.options
  if not options.check_battery_period_secs:
    return

  now = time.time()
  if (self.last_check_battery_time and
      now - self.last_check_battery_time <
      options.check_battery_period_secs):
    # Not yet time for another check.
    return
  self.last_check_battery_time = now

  message = ''
  log_level = logging.INFO
  try:
    power = system.GetBoard().power
    if power.CheckBatteryPresent():
      ac_present = power.CheckACPresent()
      charge_pct = power.GetChargePct(get_float=True)
      message = ('Current battery level %.1f%%, AC charger is %s' %
                 (charge_pct, 'connected' if ac_present else 'disconnected'))

      critical_low_battery = not (
          charge_pct > options.critical_low_battery_pct)
      if critical_low_battery:
        # Only sync disks when battery level is still above minimum
        # value. This can be used for offline analysis when shopfloor
        # cannot be connected.
        if charge_pct > MIN_BATTERY_LEVEL_FOR_DISK_SYNC:
          logging.warning('disk syncing for critical low battery situation')
          os.system('sync; sync; sync')
        else:
          logging.warning(
              'disk syncing is cancelled because battery level is lower '
              'than %.1f', MIN_BATTERY_LEVEL_FOR_DISK_SYNC)

      # Notify shopfloor server
      if (critical_low_battery or
          (not ac_present and
           charge_pct <= options.warning_low_battery_pct)):
        log_level = logging.WARNING

        self.event_log.Log('low_battery',
                           battery_level=charge_pct,
                           charger_connected=ac_present,
                           critical=critical_low_battery)
        self.log_watcher.KickWatchThread()
        if self.system_log_manager:
          self.system_log_manager.KickSyncThread()
    else:
      message = 'Battery is not present'
  except:  # pylint: disable=W0702
    logging.exception('Unable to check battery or notify shopfloor')
  finally:
    # Only log when the status text changed since the last check.
    if message != self.last_check_battery_message:
      logging.log(log_level, message)
      self.last_check_battery_message = message
1704
def check_core_dump(self):
  '''Checks if there is any core dumped file.

  Asks the core dump manager to scan for files.  If any are returned,
  logs a core_dumped event and kicks the log syncing threads, but no
  more often than once every kick_sync_min_interval_secs seconds.  The
  system log manager, when present, is handed the files together with
  the core dump manager's ClearFiles callback.
  '''
  core_dump_files = self.core_dump_manager.ScanFiles()
  if not core_dump_files:
    return

  now = time.time()
  last_kick = self.last_kick_sync_time
  if last_kick and (
      now - last_kick < self.test_list.options.kick_sync_min_interval_secs):
    # Kicked too recently; try again on a later idle pass.
    return
  self.last_kick_sync_time = now

  # Sends event to server
  self.event_log.Log('core_dumped', files=core_dump_files)
  self.log_watcher.KickWatchThread()

  # Syncs files to server
  log_manager = self.system_log_manager
  if log_manager:
    log_manager.KickSyncThread(
        core_dump_files, self.core_dump_manager.ClearFiles)
Cheng-Yi Chiangcdfa4182013-05-05 03:20:19 +08001728
def check_log_rotation(self):
  '''Checks log rotation file presence/absence according to test_list option.

  Touch CLEANUP_LOGS_PAUSED if test_list.options.disable_log_rotation
  is True, delete it otherwise. This must be done in idle loop because
  autotest client will touch that file each time it runs an autotest.
  Does nothing in the chroot; failures are logged, never raised.
  '''
  if utils.in_chroot():
    return

  try:
    if not self.test_list.options.disable_log_rotation:
      file_utils.TryUnlink(CLEANUP_LOGS_PAUSED)
    else:
      # Create (or truncate) the marker file.
      open(CLEANUP_LOGS_PAUSED, 'w').close()
  except:  # pylint: disable=W0702
    # Oh well. Logs an error (but no trace)
    if self.test_list.options.disable_log_rotation:
      action = 'touch'
    else:
      action = 'delete'
    logging.info('Unable to %s %s: %s',
                 action, CLEANUP_LOGS_PAUSED, utils.FormatExceptionOnly())
1750
def sync_time_in_background(self):
  '''Writes out current time and tries to sync with shopfloor server.

  Does nothing without a time sanitizer.  The current time is always
  saved; the shopfloor sync itself is attempted in a daemon thread, at
  most once every test_list.options.sync_time_period_secs seconds, and
  only while _should_sync_time() says so.
  '''
  sanitizer = self.time_sanitizer
  if not sanitizer:
    return

  # Write out the current time.
  sanitizer.SaveTime()

  if not self._should_sync_time():
    return

  now = time.time()
  if self.last_sync_time:
    elapsed = now - self.last_sync_time
    if elapsed < self.test_list.options.sync_time_period_secs:
      # Not yet time for another check.
      return
  self.last_sync_time = now

  def sync_quietly():
    try:
      self.sync_time_with_shopfloor_server()
    except:  # pylint: disable=W0702
      # Oh well. Log an error (but no trace)
      logging.info(
          'Unable to get time from shopfloor server: %s',
          utils.FormatExceptionOnly())

  worker = threading.Thread(target=sync_quietly)
  worker.daemon = True
  worker.start()
1782
def _run_queue_idle(self):
  '''Invoked when the run queue has no events.

  Runs the periodic housekeeping checks, rate-limited so they execute
  no more often than once every (RUN_QUEUE_TIMEOUT_SECS - 1) seconds.

  This method must not raise exception.
  '''
  now = time.time()
  if self.last_idle:
    earliest_next_run = self.last_idle + RUN_QUEUE_TIMEOUT_SECS - 1
    if now < earliest_next_run:
      # Ran too recently; skip this idle pass.
      return

  self.last_idle = now

  # Housekeeping chores, in the order they must run.
  chores = (
      self.check_exclusive,
      self.check_for_updates,
      self.sync_time_in_background,
      self.log_disk_space_stats,
      self.check_battery,
      self.check_core_dump,
      self.check_log_rotation,
  )
  for chore in chores:
    chore()
Jon Salz57717ca2012-04-04 16:47:25 +08001804
def handle_event_logs(self, chunks):
  '''Callback for event watcher.

  Attempts to upload the event logs to the shopfloor server.  Every
  chunk is attempted even if an earlier one fails.

  Args:
    chunks: A list of Chunk objects.

  Raises:
    Exception: if at least one chunk failed to upload; the message
      carries the failure count and the first failure.
  '''
  first_failure = None
  failure_count = 0

  for chunk in chunks:
    try:
      description = 'event logs (%s)' % str(chunk)
      start_time = time.time()
      shopfloor_client = shopfloor.get_instance(
          detect=True,
          timeout=self.test_list.options.shopfloor_timeout_secs)
      shopfloor_client.UploadEvent(
          chunk.log_name + "." + event_log.GetReimageId(),
          Binary(chunk.chunk))
      elapsed = time.time() - start_time
      logging.info('Successfully synced %s in %.03f s', description, elapsed)
    except:  # pylint: disable=W0702
      # Remember only the first failure; just count the rest.
      if not first_failure:
        first_failure = chunk.log_name + ': ' + utils.FormatExceptionOnly()
      failure_count += 1

  if not failure_count:
    return

  if failure_count == 1:
    msg = 'Log upload failed: %s' % first_failure
  else:
    msg = '%d log upload failed; first is: %s' % (
        failure_count, first_failure)
  raise Exception(msg)
1841
Jon Salz57717ca2012-04-04 16:47:25 +08001842
def run_tests_with_status(self, statuses_to_run, starting_at=None,
                          root=None):
  '''Runs all top-level tests with a particular status.

  All active tests, plus any tests to re-run, are reset.

  Args:
    statuses_to_run: Collection of test statuses; top-level tests whose
      status is in it are reset and run.
    starting_at: If provided, only auto-runs tests beginning with
      this test.
    root: Test whose top-level tests are considered; defaults to the
      whole test list.
  '''
  if not root:
    root = self.test_list

  if starting_at:
    # Make sure they passed a test, not a string.
    assert isinstance(starting_at, factory.FactoryTest)

  tests_to_reset, tests_to_run = [], []
  reached_start = False

  for test in root.get_top_level_tests():
    if starting_at:
      if test == starting_at:
        # We've found starting_at; do auto-run on all subsequent tests.
        reached_start = True
      elif not reached_start:
        # Don't start this guy yet
        continue

    status = test.get_state().status
    selected = status in statuses_to_run
    if selected or status == TestState.ACTIVE:
      # Reset the test (later; we will need to abort all active tests
      # first).
      tests_to_reset.append(test)
    if selected:
      tests_to_run.append(test)

  self.abort_active_tests('Operator requested run/re-run of certain tests')

  # Reset all statuses of the tests to run (in case any tests were active;
  # we want them to be run again).
  for top_level_test in tests_to_reset:
    for subtest in top_level_test.walk():
      subtest.update_state(status=TestState.UNTESTED)

  self.run_tests(tests_to_run, untested_only=True)
Jon Salz0405ab52012-03-16 15:26:52 +08001891
def restart_tests(self, root=None):
  '''Restarts all tests under root (default: the whole test list).

  Active tests are aborted, every test under root is marked untested,
  and root is then run.
  '''
  if not root:
    root = self.test_list

  self.abort_active_tests('Operator requested restart of certain tests')
  for node in root.walk():
    node.update_state(status=TestState.UNTESTED)
  self.run_tests(root)
Hung-Te Lin96632362012-03-20 21:14:18 +08001900
def auto_run(self, starting_at=None, root=None):
  '''"Auto-runs" tests that have not been run yet.

  Tests whose status is UNTESTED or ACTIVE are selected.

  Args:
    starting_at: If provided, only auto-runs tests beginning with
      this test.
    root: Test whose top-level tests are considered; defaults to the
      whole test list.
  '''
  if not root:
    root = self.test_list
  statuses = [TestState.UNTESTED, TestState.ACTIVE]
  self.run_tests_with_status(statuses, starting_at=starting_at, root=root)
Jon Salz968e90b2012-03-18 16:12:43 +08001912
def re_run_failed(self, root=None):
  '''Re-runs the failed tests under root (default: the whole test list).'''
  if not root:
    root = self.test_list
  failed_only = [TestState.FAILED]
  self.run_tests_with_status(failed_only, root=root)
Jon Salz57717ca2012-04-04 16:47:25 +08001917
def show_review_information(self):
  '''Event handler for showing review information screen.

  The information screen is rendered by main UI program (ui.py), so in
  goofy we only need to kill all active tests, set them as untested, and
  clear remaining tests.
  '''
  # Stop whatever is running first, then drop everything still queued.
  self.kill_active_tests(False)
  self.cancel_pending_tests()
Jon Salz57717ca2012-04-04 16:47:25 +08001927
def handle_switch_test(self, event):
  '''Switches to a particular test.

  If the test is already running and is backgroundable, it is simply
  made the visible test.  Otherwise all active tests are aborted, the
  requested test (and everything below it) is reset to untested, and
  it is run -- via auto_run() from that test onwards when
  test_list.options.auto_run_on_keypress is set, else on its own.

  Args:
    event: The SWITCH_TEST event; event.path is the path of the test
      to switch to.
  '''
  test = self.test_list.lookup_path(event.path)
  if not test:
    # Report the path that was actually looked up.
    logging.error('Unknown test %r', event.path)
    return

  invoc = self.invocations.get(test)
  if invoc and test.backgroundable:
    # Already running: just bring to the front if it
    # has a UI.
    logging.info('Setting visible test to %s', test.path)
    self.set_visible_test(test)
    return

  self.abort_active_tests('Operator requested abort (switch_test)')
  for t in test.walk():
    t.update_state(status=TestState.UNTESTED)

  if self.test_list.options.auto_run_on_keypress:
    self.auto_run(starting_at=test)
  else:
    self.run_tests(test)
Jon Salz73e0fd02012-04-04 11:46:38 +08001954
def wait(self):
  '''Waits for all pending invocations.

  Joins the thread of every current invocation, reaps the completed
  tests, and repeats until no invocations are left.

  Useful for testing.
  '''
  while self.invocations:
    for test, invocation in self.invocations.iteritems():
      logging.info('Waiting for %s to complete...', test)
      invocation.thread.join()
    # Reaping is what removes finished entries from self.invocations.
    self.reap_completed_tests()
Jon Salz0697cbf2012-07-04 15:14:04 +08001965
def check_exceptions(self):
  '''Raises an error if any exceptions have been recorded.

  Raises:
    RuntimeError: if self.exceptions is non-empty; the message includes
      the recorded exceptions.
  '''
  if not self.exceptions:
    return
  raise RuntimeError(
      'Exception in invocation thread: %r' % self.exceptions)
1972
def record_exception(self, msg):
  '''Records an exception that occurred in an invocation thread.

  The message is appended to self.exceptions; check_exceptions() raises
  an error while that list is non-empty.

  Args:
    msg: Description of the exception to remember.
  '''
  recorded = self.exceptions
  recorded.append(msg)
Jon Salz73e0fd02012-04-04 11:46:38 +08001979
Hung-Te Linf2f78f72012-02-08 19:27:11 +08001980
if __name__ == '__main__':
  # Script entry point: run Goofy and always tear it down afterwards.
  goofy = Goofy()
  try:
    goofy.main()
  except:  # pylint: disable=W0702
    # Log the error before trying to shut down, unless it is a graceful
    # exit (SystemExit), which is propagated without logging.
    if not isinstance(sys.exc_info()[1], SystemExit):
      logging.exception('Error in main loop')
    raise
  finally:
    goofy.destroy()