blob: 51dcdab71cd97e5cd747fe6e6f7065e06c5c1423 [file] [log] [blame]
Hung-Te Linf2f78f72012-02-08 19:27:11 +08001#!/usr/bin/python -u
Hung-Te Linf2f78f72012-02-08 19:27:11 +08002# -*- coding: utf-8 -*-
3#
Jon Salz37eccbd2012-05-25 16:06:52 +08004# Copyright (c) 2012 The Chromium OS Authors. All rights reserved.
Hung-Te Linf2f78f72012-02-08 19:27:11 +08005# Use of this source code is governed by a BSD-style license that can be
6# found in the LICENSE file.
7
8'''
9The main factory flow that runs the factory test and finalizes a device.
10'''
11
Jon Salze12c2b32013-06-25 16:24:34 +080012import glob
Jon Salz0405ab52012-03-16 15:26:52 +080013import logging
14import os
Jon Salz73e0fd02012-04-04 11:46:38 +080015import Queue
Jon Salze12c2b32013-06-25 16:24:34 +080016import shutil
Jon Salz77c151e2012-08-28 07:20:37 +080017import signal
Jon Salz0405ab52012-03-16 15:26:52 +080018import sys
Jon Salzeff94182013-06-19 15:06:28 +080019import syslog
Jon Salz0405ab52012-03-16 15:26:52 +080020import threading
21import time
22import traceback
Jon Salz258a40c2012-04-19 12:34:01 +080023import uuid
Jon Salzb10cf512012-08-09 17:29:21 +080024from xmlrpclib import Binary
Hung-Te Linf2f78f72012-02-08 19:27:11 +080025from collections import deque
26from optparse import OptionParser
Hung-Te Linf2f78f72012-02-08 19:27:11 +080027
Jon Salz0697cbf2012-07-04 15:14:04 +080028import factory_common # pylint: disable=W0611
jcliangcd688182012-08-20 21:01:26 +080029from cros.factory import event_log
30from cros.factory import system
Cheng-Yi Chiangd0406522013-04-01 15:40:18 +080031from cros.factory.event_log import EventLog, FloatDigit
Tom Wai-Hong Tamd33723e2013-04-10 21:14:37 +080032from cros.factory.event_log_watcher import EventLogWatcher
jcliangcd688182012-08-20 21:01:26 +080033from cros.factory.goofy import test_environment
34from cros.factory.goofy import time_sanitizer
Jon Salz83591782012-06-26 11:09:58 +080035from cros.factory.goofy import updater
jcliangcd688182012-08-20 21:01:26 +080036from cros.factory.goofy.goofy_rpc import GoofyRPC
Jon Salz885dcac2013-07-23 16:39:50 +080037from cros.factory.goofy.invocation import TestArgEnv
jcliangcd688182012-08-20 21:01:26 +080038from cros.factory.goofy.invocation import TestInvocation
39from cros.factory.goofy.prespawner import Prespawner
Cheng-Yi Chiang344b10f2013-05-03 16:44:03 +080040from cros.factory.goofy.system_log_manager import SystemLogManager
jcliangcd688182012-08-20 21:01:26 +080041from cros.factory.goofy.web_socket_manager import WebSocketManager
Cheng-Yi Chiangd8186952013-04-04 23:41:14 +080042from cros.factory.system.board import Board, BoardException
jcliangcd688182012-08-20 21:01:26 +080043from cros.factory.system.charge_manager import ChargeManager
Cheng-Yi Chiangcdfa4182013-05-05 03:20:19 +080044from cros.factory.system.core_dump_manager import CoreDumpManager
Jon Salzce6a7f82013-06-10 18:22:54 +080045from cros.factory.system.cpufreq_manager import CpufreqManager
Jon Salzb92c5112012-09-21 15:40:11 +080046from cros.factory.system import disk_space
jcliangcd688182012-08-20 21:01:26 +080047from cros.factory.test import factory
48from cros.factory.test import state
Jon Salz51528e12012-07-02 18:54:45 +080049from cros.factory.test import shopfloor
Jon Salz83591782012-06-26 11:09:58 +080050from cros.factory.test import utils
Jon Salz128b0932013-07-03 16:55:26 +080051from cros.factory.test.test_lists import test_lists
Jon Salz83591782012-06-26 11:09:58 +080052from cros.factory.test.event import Event
53from cros.factory.test.event import EventClient
54from cros.factory.test.event import EventServer
jcliangcd688182012-08-20 21:01:26 +080055from cros.factory.test.factory import TestState
Jon Salzd7550792013-07-12 05:49:27 +080056from cros.factory.test.utils import Enum
Dean Liao592e4d52013-01-10 20:06:39 +080057from cros.factory.tools.key_filter import KeyFilter
Jon Salz2af235d2013-06-24 14:47:21 +080058from cros.factory.utils import file_utils
Jon Salz78c32392012-07-25 14:18:29 +080059from cros.factory.utils.process_utils import Spawn
Hung-Te Linf2f78f72012-02-08 19:27:11 +080060
61
# File whose contents get_hwid_cfg() returns as the HWID config tag when the
# CROS_HWID environment variable is not set.
HWID_CFG_PATH = '/usr/local/share/chromeos-hwid/cfg'
# "caches" directory directly under the factory state root.
CACHES_DIR = os.path.join(factory.get_state_root(), "caches")

# NOTE(review): presumably a marker file that pauses log cleanup while it
# exists; the code that uses it is not in this part of the file -- confirm.
CLEANUP_LOGS_PAUSED = '/var/lib/cleanup_logs_paused'

# File that suppresses reboot if present (e.g., for development).
NO_REBOOT_FILE = '/var/log/factory.noreboot'

# Value for tests_after_shutdown that forces auto-run (e.g., after
# a factory update, when the available set of tests might change).
FORCE_AUTO_RUN = 'force_auto_run'

# NOTE(review): presumably the timeout, in seconds, used when waiting on the
# run queue; the code that uses it is not in this part of the file -- confirm.
RUN_QUEUE_TIMEOUT_SECS = 10

# Sync disks when battery level is higher than this value.
# Otherwise, power loss during disk sync operation may incur even worse outcome.
MIN_BATTERY_LEVEL_FOR_DISK_SYNC = 1.0

# 64 KiB, expressed in bytes.
MAX_CRASH_FILE_SIZE = 64*1024
81
Jon Salz758e6cc2012-04-03 15:47:07 +080082GOOFY_IN_CHROOT_WARNING = '\n' + ('*' * 70) + '''
83You are running Goofy inside the chroot. Autotests are not supported.
84
85To use Goofy in the chroot, first install an Xvnc server:
86
Jon Salz0697cbf2012-07-04 15:14:04 +080087 sudo apt-get install tightvncserver
Jon Salz758e6cc2012-04-03 15:47:07 +080088
89...and then start a VNC X server outside the chroot:
90
Jon Salz0697cbf2012-07-04 15:14:04 +080091 vncserver :10 &
92 vncviewer :10
Jon Salz758e6cc2012-04-03 15:47:07 +080093
94...and run Goofy as follows:
95
Jon Salz0697cbf2012-07-04 15:14:04 +080096 env --unset=XAUTHORITY DISPLAY=localhost:10 python goofy.py
Jon Salz758e6cc2012-04-03 15:47:07 +080097''' + ('*' * 70)
Jon Salz73e0fd02012-04-04 11:46:38 +080098suppress_chroot_warning = False
Hung-Te Linf2f78f72012-02-08 19:27:11 +080099
Jon Salzd7550792013-07-12 05:49:27 +0800100Status = Enum(['UNINITIALIZED', 'INITIALIZING', 'RUNNING',
101 'TERMINATING', 'TERMINATED'])
102
def get_hwid_cfg():
  '''
  Looks up the HWID config tag.

  The CROS_HWID environment variable wins if it is set (even when empty).
  Otherwise the stripped contents of HWID_CFG_PATH are used when that file
  exists.

  Returns:
    The tag, or an empty string if neither source is available.
  '''
  tag_from_env = os.environ.get('CROS_HWID')
  if tag_from_env is not None:
    return tag_from_env

  if not os.path.exists(HWID_CFG_PATH):
    return ''

  with open(HWID_CFG_PATH, 'rt') as cfg_file:
    contents = cfg_file.read()
  return contents.strip()
Hung-Te Linf2f78f72012-02-08 19:27:11 +0800113
114
Jon Salz73e0fd02012-04-04 11:46:38 +0800115_inited_logging = False
Hung-Te Linf2f78f72012-02-08 19:27:11 +0800116
117class Goofy(object):
Jon Salz0697cbf2012-07-04 15:14:04 +0800118 '''
119 The main factory flow.
120
121 Note that all methods in this class must be invoked from the main
122 (event) thread. Other threads, such as callbacks and TestInvocation
123 methods, should instead post events on the run queue.
124
125 TODO: Unit tests. (chrome-os-partner:7409)
126
127 Properties:
128 uuid: A unique UUID for this invocation of Goofy.
129 state_instance: An instance of FactoryState.
130 state_server: The FactoryState XML/RPC server.
131 state_server_thread: A thread running state_server.
132 event_server: The EventServer socket server.
133 event_server_thread: A thread running event_server.
134 event_client: A client to the event server.
135 connection_manager: The connection_manager object.
Cheng-Yi Chiang835f2682013-05-06 22:15:48 +0800136 system_log_manager: The SystemLogManager object.
137 core_dump_manager: The CoreDumpManager object.
Jon Salz0697cbf2012-07-04 15:14:04 +0800138 ui_process: The factory ui process object.
139 run_queue: A queue of callbacks to invoke from the main thread.
140 invocations: A map from FactoryTest objects to the corresponding
141 TestInvocations objects representing active tests.
142 tests_to_run: A deque of tests that should be run when the current
143 test(s) complete.
144 options: Command-line options.
145 args: Command-line args.
146 test_list: The test list.
Jon Salz128b0932013-07-03 16:55:26 +0800147 test_lists: All new-style test lists.
Jon Salz0697cbf2012-07-04 15:14:04 +0800148 event_handlers: Map of Event.Type to the method used to handle that
149 event. If the method has an 'event' argument, the event is passed
150 to the handler.
151 exceptions: Exceptions encountered in invocation threads.
Jon Salz3c493bb2013-02-07 17:24:58 +0800152 last_log_disk_space_message: The last message we logged about disk space
153 (to avoid duplication).
Cheng-Yi Chiangcdfa4182013-05-05 03:20:19 +0800154 last_kick_sync_time: The last time to kick system_log_manager to sync
155 because of core dump files (to avoid kicking too soon then abort the
156 sync.)
Jon Salz416f9cc2013-05-10 18:32:50 +0800157 hooks: A Hooks object containing hooks for various Goofy actions.
Jon Salzd7550792013-07-12 05:49:27 +0800158 status: The current Goofy status (a member of the Status enum).
Jon Salz0697cbf2012-07-04 15:14:04 +0800159 '''
160 def __init__(self):
161 self.uuid = str(uuid.uuid4())
162 self.state_instance = None
163 self.state_server = None
164 self.state_server_thread = None
Jon Salz16d10542012-07-23 12:18:45 +0800165 self.goofy_rpc = None
Jon Salz0697cbf2012-07-04 15:14:04 +0800166 self.event_server = None
167 self.event_server_thread = None
168 self.event_client = None
169 self.connection_manager = None
Vic Yang4953fc12012-07-26 16:19:53 +0800170 self.charge_manager = None
Jon Salz8fa8e832012-07-13 19:04:09 +0800171 self.time_sanitizer = None
172 self.time_synced = False
Jon Salz0697cbf2012-07-04 15:14:04 +0800173 self.log_watcher = None
Cheng-Yi Chiang344b10f2013-05-03 16:44:03 +0800174 self.system_log_manager = None
Cheng-Yi Chiang835f2682013-05-06 22:15:48 +0800175 self.core_dump_manager = None
Jon Salz0697cbf2012-07-04 15:14:04 +0800176 self.event_log = None
177 self.prespawner = None
178 self.ui_process = None
Jon Salzc79a9982012-08-30 04:42:01 +0800179 self.dummy_shopfloor = None
Jon Salz0697cbf2012-07-04 15:14:04 +0800180 self.run_queue = Queue.Queue()
181 self.invocations = {}
182 self.tests_to_run = deque()
183 self.visible_test = None
184 self.chrome = None
Jon Salz416f9cc2013-05-10 18:32:50 +0800185 self.hooks = None
Vic Yangd8990da2013-06-27 16:57:43 +0800186 self.cpu_usage_watcher = None
Jon Salz0697cbf2012-07-04 15:14:04 +0800187
188 self.options = None
189 self.args = None
190 self.test_list = None
Jon Salz128b0932013-07-03 16:55:26 +0800191 self.test_lists = None
Jon Salz0697cbf2012-07-04 15:14:04 +0800192 self.on_ui_startup = []
193 self.env = None
Jon Salzb22d1172012-08-06 10:38:57 +0800194 self.last_idle = None
Jon Salz0697cbf2012-07-04 15:14:04 +0800195 self.last_shutdown_time = None
cychiang21886742012-07-05 15:16:32 +0800196 self.last_update_check = None
Jon Salz8fa8e832012-07-13 19:04:09 +0800197 self.last_sync_time = None
Jon Salzb92c5112012-09-21 15:40:11 +0800198 self.last_log_disk_space_time = None
Jon Salz3c493bb2013-02-07 17:24:58 +0800199 self.last_log_disk_space_message = None
Justin Chuang83813982013-05-13 01:26:32 +0800200 self.last_check_battery_time = None
201 self.last_check_battery_message = None
Cheng-Yi Chiangcdfa4182013-05-05 03:20:19 +0800202 self.last_kick_sync_time = None
Vic Yang311ddb82012-09-26 12:08:28 +0800203 self.exclusive_items = set()
Jon Salz0f996602012-10-03 15:26:48 +0800204 self.event_log = None
Dean Liao592e4d52013-01-10 20:06:39 +0800205 self.key_filter = None
Jon Salzce6a7f82013-06-10 18:22:54 +0800206 self.cpufreq_manager = None
Jon Salzd7550792013-07-12 05:49:27 +0800207 self.status = Status.UNINITIALIZED
Jon Salz0697cbf2012-07-04 15:14:04 +0800208
Jon Salz85a39882012-07-05 16:45:04 +0800209 def test_or_root(event, parent_or_group=True):
210 '''Returns the test affected by a particular event.
211
212 Args:
213 event: The event containing an optional 'path' attribute.
214 parent_on_group: If True, returns the top-level parent for a test (the
215 root node of the tests that need to be run together if the given test
216 path is to be run).
217 '''
Jon Salz0697cbf2012-07-04 15:14:04 +0800218 try:
219 path = event.path
220 except AttributeError:
221 path = None
222
223 if path:
Jon Salz85a39882012-07-05 16:45:04 +0800224 test = self.test_list.lookup_path(path)
225 if parent_or_group:
226 test = test.get_top_level_parent_or_group()
227 return test
Jon Salz0697cbf2012-07-04 15:14:04 +0800228 else:
229 return self.test_list
230
231 self.event_handlers = {
232 Event.Type.SWITCH_TEST: self.handle_switch_test,
233 Event.Type.SHOW_NEXT_ACTIVE_TEST:
234 lambda event: self.show_next_active_test(),
235 Event.Type.RESTART_TESTS:
236 lambda event: self.restart_tests(root=test_or_root(event)),
237 Event.Type.AUTO_RUN:
238 lambda event: self.auto_run(root=test_or_root(event)),
239 Event.Type.RE_RUN_FAILED:
240 lambda event: self.re_run_failed(root=test_or_root(event)),
241 Event.Type.RUN_TESTS_WITH_STATUS:
242 lambda event: self.run_tests_with_status(
243 event.status,
244 root=test_or_root(event)),
245 Event.Type.REVIEW:
246 lambda event: self.show_review_information(),
247 Event.Type.UPDATE_SYSTEM_INFO:
248 lambda event: self.update_system_info(),
Jon Salz0697cbf2012-07-04 15:14:04 +0800249 Event.Type.STOP:
Jon Salz85a39882012-07-05 16:45:04 +0800250 lambda event: self.stop(root=test_or_root(event, False),
Jon Salz6dc031d2013-06-19 13:06:23 +0800251 fail=getattr(event, 'fail', False),
252 reason=getattr(event, 'reason', None)),
Jon Salz36fbbb52012-07-05 13:45:06 +0800253 Event.Type.SET_VISIBLE_TEST:
254 lambda event: self.set_visible_test(
255 self.test_list.lookup_path(event.path)),
Jon Salz4712ac72013-02-07 17:12:05 +0800256 Event.Type.CLEAR_STATE:
257 lambda event: self.clear_state(self.test_list.lookup_path(event.path)),
Jon Salz0697cbf2012-07-04 15:14:04 +0800258 }
259
260 self.exceptions = []
261 self.web_socket_manager = None
262
  def destroy(self):
    '''Shuts down everything Goofy started and marks it as terminated.

    Each resource is torn down only if its handle is set, so this is safe to
    call on a partially initialized instance.  The status is TERMINATING
    while teardown is in progress and TERMINATED once it has finished.

    The order of the steps below is deliberate; do not reorder them without
    checking the dependencies between the resources.
    '''
    self.status = Status.TERMINATING
    if self.chrome:
      self.chrome.kill()
      self.chrome = None
    if self.dummy_shopfloor:
      self.dummy_shopfloor.kill()
      self.dummy_shopfloor = None
    if self.ui_process:
      utils.kill_process_tree(self.ui_process, 'ui')
      self.ui_process = None
    if self.web_socket_manager:
      logging.info('Stopping web sockets')
      self.web_socket_manager.close()
      self.web_socket_manager = None
    if self.state_server_thread:
      logging.info('Stopping state server')
      # Ask the server loop to exit, wait for its thread to finish, and
      # only then close the server.
      self.state_server.shutdown()
      self.state_server_thread.join()
      self.state_server.server_close()
      self.state_server_thread = None
    if self.state_instance:
      # Note: the state_instance handle is closed but not cleared.
      self.state_instance.close()
    if self.event_server_thread:
      logging.info('Stopping event server')
      self.event_server.shutdown()  # pylint: disable=E1101
      self.event_server_thread.join()
      self.event_server.server_close()
      self.event_server_thread = None
    if self.log_watcher:
      if self.log_watcher.IsThreadStarted():
        self.log_watcher.StopWatchThread()
      self.log_watcher = None
    if self.system_log_manager:
      if self.system_log_manager.IsThreadRunning():
        self.system_log_manager.StopSyncThread()
      self.system_log_manager = None
    if self.prespawner:
      logging.info('Stopping prespawner')
      self.prespawner.stop()
      self.prespawner = None
    if self.event_client:
      logging.info('Closing event client')
      self.event_client.close()
      self.event_client = None
    # The next handles (cpufreq_manager, key_filter, cpu_usage_watcher) are
    # stopped but, unlike the ones above, not reset to None.
    if self.cpufreq_manager:
      self.cpufreq_manager.Stop()
    if self.event_log:
      self.event_log.Close()
      self.event_log = None
    if self.key_filter:
      self.key_filter.Stop()
    if self.cpu_usage_watcher:
      self.cpu_usage_watcher.terminate()

    self.check_exceptions()
    logging.info('Done destroying Goofy')
    self.status = Status.TERMINATED
Jon Salz0697cbf2012-07-04 15:14:04 +0800321
322 def start_state_server(self):
Jon Salz2af235d2013-06-24 14:47:21 +0800323 # Before starting state server, remount stateful partitions with
324 # no commit flag. The default commit time (commit=600) makes corruption
325 # too likely.
326 file_utils.ResetCommitTime()
327
Jon Salz0697cbf2012-07-04 15:14:04 +0800328 self.state_instance, self.state_server = (
329 state.create_server(bind_address='0.0.0.0'))
Jon Salz16d10542012-07-23 12:18:45 +0800330 self.goofy_rpc = GoofyRPC(self)
331 self.goofy_rpc.RegisterMethods(self.state_instance)
Jon Salz0697cbf2012-07-04 15:14:04 +0800332 logging.info('Starting state server')
333 self.state_server_thread = threading.Thread(
334 target=self.state_server.serve_forever,
335 name='StateServer')
336 self.state_server_thread.start()
337
338 def start_event_server(self):
339 self.event_server = EventServer()
340 logging.info('Starting factory event server')
341 self.event_server_thread = threading.Thread(
342 target=self.event_server.serve_forever,
343 name='EventServer') # pylint: disable=E1101
344 self.event_server_thread.start()
345
346 self.event_client = EventClient(
347 callback=self.handle_event, event_loop=self.run_queue)
348
349 self.web_socket_manager = WebSocketManager(self.uuid)
350 self.state_server.add_handler("/event",
351 self.web_socket_manager.handle_web_socket)
352
353 def start_ui(self):
354 ui_proc_args = [
355 os.path.join(factory.FACTORY_PACKAGE_PATH, 'test', 'ui.py'),
356 self.options.test_list]
357 if self.options.verbose:
358 ui_proc_args.append('-v')
359 logging.info('Starting ui %s', ui_proc_args)
Jon Salz78c32392012-07-25 14:18:29 +0800360 self.ui_process = Spawn(ui_proc_args)
Jon Salz0697cbf2012-07-04 15:14:04 +0800361 logging.info('Waiting for UI to come up...')
362 self.event_client.wait(
363 lambda event: event.type == Event.Type.UI_READY)
364 logging.info('UI has started')
365
366 def set_visible_test(self, test):
367 if self.visible_test == test:
368 return
Jon Salz2f2d42c2012-07-30 12:30:34 +0800369 if test and not test.has_ui:
370 return
Jon Salz0697cbf2012-07-04 15:14:04 +0800371
372 if test:
373 test.update_state(visible=True)
374 if self.visible_test:
375 self.visible_test.update_state(visible=False)
376 self.visible_test = test
377
Jon Salzd4306c82012-11-30 15:16:36 +0800378 def _log_startup_messages(self):
379 '''Logs the tail of var/log/messages and mosys and EC console logs.'''
380 # TODO(jsalz): This is mostly a copy-and-paste of code in init_states,
381 # for factory-3004.B only. Consolidate and merge back to ToT.
382 if utils.in_chroot():
383 return
384
385 try:
386 var_log_messages = (
387 utils.var_log_messages_before_reboot())
388 logging.info(
389 'Tail of /var/log/messages before last reboot:\n'
390 '%s', ('\n'.join(
391 ' ' + x for x in var_log_messages)))
392 except: # pylint: disable=W0702
393 logging.exception('Unable to grok /var/log/messages')
394
395 try:
396 mosys_log = utils.Spawn(
397 ['mosys', 'eventlog', 'list'],
398 read_stdout=True, log_stderr_on_error=True).stdout_data
399 logging.info('System eventlog from mosys:\n%s\n', mosys_log)
400 except: # pylint: disable=W0702
401 logging.exception('Unable to read mosys eventlog')
402
403 try:
Vic Yang8341dde2013-01-29 16:48:52 +0800404 board = system.GetBoard()
405 ec_console_log = board.GetECConsoleLog()
Jon Salzd4306c82012-11-30 15:16:36 +0800406 logging.info('EC console log after reboot:\n%s\n', ec_console_log)
407 except: # pylint: disable=W0702
408 logging.exception('Error retrieving EC console log')
409
Vic Yang079f9872013-07-01 11:32:00 +0800410 try:
411 board = system.GetBoard()
412 ec_panic_info = board.GetECPanicInfo()
413 logging.info('EC panic info after reboot:\n%s\n', ec_panic_info)
414 except: # pylint: disable=W0702
415 logging.exception('Error retrieving EC panic info')
416
Jon Salz0697cbf2012-07-04 15:14:04 +0800417 def handle_shutdown_complete(self, test, test_state):
Hung-Te Linf2f78f72012-02-08 19:27:11 +0800418 '''
Jon Salz0697cbf2012-07-04 15:14:04 +0800419 Handles the case where a shutdown was detected during a shutdown step.
Hung-Te Linf2f78f72012-02-08 19:27:11 +0800420
Jon Salz0697cbf2012-07-04 15:14:04 +0800421 @param test: The ShutdownStep.
422 @param test_state: The test state.
Hung-Te Linf2f78f72012-02-08 19:27:11 +0800423 '''
Jon Salz0697cbf2012-07-04 15:14:04 +0800424 test_state = test.update_state(increment_shutdown_count=1)
425 logging.info('Detected shutdown (%d of %d)',
426 test_state.shutdown_count, test.iterations)
Hung-Te Linf2f78f72012-02-08 19:27:11 +0800427
Jon Salz0697cbf2012-07-04 15:14:04 +0800428 def log_and_update_state(status, error_msg, **kw):
429 self.event_log.Log('rebooted',
430 status=status, error_msg=error_msg, **kw)
Jon Salzd4306c82012-11-30 15:16:36 +0800431 logging.info('Rebooted: status=%s, %s', status,
432 (('error_msg=%s' % error_msg) if error_msg else None))
Jon Salz0697cbf2012-07-04 15:14:04 +0800433 test.update_state(status=status, error_msg=error_msg)
Hung-Te Linf2f78f72012-02-08 19:27:11 +0800434
Jon Salz0697cbf2012-07-04 15:14:04 +0800435 if not self.last_shutdown_time:
436 log_and_update_state(status=TestState.FAILED,
437 error_msg='Unable to read shutdown_time')
438 return
Jon Salz258a40c2012-04-19 12:34:01 +0800439
Jon Salz0697cbf2012-07-04 15:14:04 +0800440 now = time.time()
441 logging.info('%.03f s passed since reboot',
442 now - self.last_shutdown_time)
Jon Salz258a40c2012-04-19 12:34:01 +0800443
Jon Salz0697cbf2012-07-04 15:14:04 +0800444 if self.last_shutdown_time > now:
445 test.update_state(status=TestState.FAILED,
446 error_msg='Time moved backward during reboot')
447 elif (isinstance(test, factory.RebootStep) and
448 self.test_list.options.max_reboot_time_secs and
449 (now - self.last_shutdown_time >
450 self.test_list.options.max_reboot_time_secs)):
451 # A reboot took too long; fail. (We don't check this for
452 # HaltSteps, because the machine could be halted for a
453 # very long time, and even unplugged with battery backup,
454 # thus hosing the clock.)
455 log_and_update_state(
456 status=TestState.FAILED,
457 error_msg=('More than %d s elapsed during reboot '
458 '(%.03f s, from %s to %s)' % (
459 self.test_list.options.max_reboot_time_secs,
460 now - self.last_shutdown_time,
461 utils.TimeString(self.last_shutdown_time),
462 utils.TimeString(now))),
463 duration=(now-self.last_shutdown_time))
Jon Salzd4306c82012-11-30 15:16:36 +0800464 self._log_startup_messages()
Jon Salz0697cbf2012-07-04 15:14:04 +0800465 elif test_state.shutdown_count == test.iterations:
466 # Good!
467 log_and_update_state(status=TestState.PASSED,
468 duration=(now - self.last_shutdown_time),
469 error_msg='')
470 elif test_state.shutdown_count > test.iterations:
471 # Shut down too many times
472 log_and_update_state(status=TestState.FAILED,
473 error_msg='Too many shutdowns')
Jon Salzd4306c82012-11-30 15:16:36 +0800474 self._log_startup_messages()
Jon Salz0697cbf2012-07-04 15:14:04 +0800475 elif utils.are_shift_keys_depressed():
476 logging.info('Shift keys are depressed; cancelling restarts')
477 # Abort shutdown
478 log_and_update_state(
479 status=TestState.FAILED,
480 error_msg='Shutdown aborted with double shift keys')
Jon Salza6711d72012-07-18 14:33:03 +0800481 self.cancel_pending_tests()
Jon Salz0697cbf2012-07-04 15:14:04 +0800482 else:
483 def handler():
484 if self._prompt_cancel_shutdown(
485 test, test_state.shutdown_count + 1):
Jon Salza6711d72012-07-18 14:33:03 +0800486 factory.console.info('Shutdown aborted by operator')
Jon Salz0697cbf2012-07-04 15:14:04 +0800487 log_and_update_state(
488 status=TestState.FAILED,
489 error_msg='Shutdown aborted by operator')
Jon Salza6711d72012-07-18 14:33:03 +0800490 self.cancel_pending_tests()
Jon Salz0697cbf2012-07-04 15:14:04 +0800491 return
Jon Salz0405ab52012-03-16 15:26:52 +0800492
Jon Salz0697cbf2012-07-04 15:14:04 +0800493 # Time to shutdown again
494 log_and_update_state(
495 status=TestState.ACTIVE,
496 error_msg='',
497 iteration=test_state.shutdown_count)
Jon Salz73e0fd02012-04-04 11:46:38 +0800498
Jon Salz0697cbf2012-07-04 15:14:04 +0800499 self.event_log.Log('shutdown', operation='reboot')
500 self.state_instance.set_shared_data('shutdown_time',
501 time.time())
502 self.env.shutdown('reboot')
Hung-Te Linf2f78f72012-02-08 19:27:11 +0800503
Jon Salz0697cbf2012-07-04 15:14:04 +0800504 self.on_ui_startup.append(handler)
Hung-Te Linf2f78f72012-02-08 19:27:11 +0800505
Jon Salz0697cbf2012-07-04 15:14:04 +0800506 def _prompt_cancel_shutdown(self, test, iteration):
507 if self.options.ui != 'chrome':
508 return False
Hung-Te Linf2f78f72012-02-08 19:27:11 +0800509
Jon Salz0697cbf2012-07-04 15:14:04 +0800510 pending_shutdown_data = {
511 'delay_secs': test.delay_secs,
512 'time': time.time() + test.delay_secs,
513 'operation': test.operation,
514 'iteration': iteration,
515 'iterations': test.iterations,
516 }
Hung-Te Linf2f78f72012-02-08 19:27:11 +0800517
Jon Salz0697cbf2012-07-04 15:14:04 +0800518 # Create a new (threaded) event client since we
519 # don't want to use the event loop for this.
520 with EventClient() as event_client:
521 event_client.post_event(Event(Event.Type.PENDING_SHUTDOWN,
522 **pending_shutdown_data))
523 aborted = event_client.wait(
524 lambda event: event.type == Event.Type.CANCEL_SHUTDOWN,
525 timeout=test.delay_secs) is not None
526 if aborted:
527 event_client.post_event(Event(Event.Type.PENDING_SHUTDOWN))
528 return aborted
Jon Salz258a40c2012-04-19 12:34:01 +0800529
Jon Salz0697cbf2012-07-04 15:14:04 +0800530 def init_states(self):
531 '''
532 Initializes all states on startup.
533 '''
534 for test in self.test_list.get_all_tests():
535 # Make sure the state server knows about all the tests,
536 # defaulting to an untested state.
537 test.update_state(update_parent=False, visible=False)
Hung-Te Linf2f78f72012-02-08 19:27:11 +0800538
Jon Salz0697cbf2012-07-04 15:14:04 +0800539 var_log_messages = None
Vic Yanga9c32212012-08-16 20:07:54 +0800540 mosys_log = None
Vic Yange4c275d2012-08-28 01:50:20 +0800541 ec_console_log = None
Vic Yang079f9872013-07-01 11:32:00 +0800542 ec_panic_info = None
Hung-Te Linf2f78f72012-02-08 19:27:11 +0800543
Jon Salz0697cbf2012-07-04 15:14:04 +0800544 # Any 'active' tests should be marked as failed now.
545 for test in self.test_list.walk():
Jon Salza6711d72012-07-18 14:33:03 +0800546 if not test.is_leaf():
547 # Don't bother with parents; they will be updated when their
548 # children are updated.
549 continue
550
Jon Salz0697cbf2012-07-04 15:14:04 +0800551 test_state = test.get_state()
552 if test_state.status != TestState.ACTIVE:
553 continue
554 if isinstance(test, factory.ShutdownStep):
555 # Shutdown while the test was active - that's good.
556 self.handle_shutdown_complete(test, test_state)
557 else:
558 # Unexpected shutdown. Grab /var/log/messages for context.
559 if var_log_messages is None:
560 try:
561 var_log_messages = (
562 utils.var_log_messages_before_reboot())
563 # Write it to the log, to make it easier to
564 # correlate with /var/log/messages.
565 logging.info(
566 'Unexpected shutdown. '
567 'Tail of /var/log/messages before last reboot:\n'
568 '%s', ('\n'.join(
569 ' ' + x for x in var_log_messages)))
570 except: # pylint: disable=W0702
571 logging.exception('Unable to grok /var/log/messages')
572 var_log_messages = []
Hung-Te Linf2f78f72012-02-08 19:27:11 +0800573
Jon Salz008f4ea2012-08-28 05:39:45 +0800574 if mosys_log is None and not utils.in_chroot():
575 try:
576 mosys_log = utils.Spawn(
577 ['mosys', 'eventlog', 'list'],
578 read_stdout=True, log_stderr_on_error=True).stdout_data
579 # Write it to the log also.
580 logging.info('System eventlog from mosys:\n%s\n', mosys_log)
581 except: # pylint: disable=W0702
582 logging.exception('Unable to read mosys eventlog')
Vic Yanga9c32212012-08-16 20:07:54 +0800583
Vic Yange4c275d2012-08-28 01:50:20 +0800584 if ec_console_log is None:
585 try:
Vic Yang8341dde2013-01-29 16:48:52 +0800586 board = system.GetBoard()
587 ec_console_log = board.GetECConsoleLog()
Vic Yange4c275d2012-08-28 01:50:20 +0800588 logging.info('EC console log after reboot:\n%s\n', ec_console_log)
Jon Salzfe1f6652012-09-07 05:40:14 +0800589 except: # pylint: disable=W0702
Vic Yange4c275d2012-08-28 01:50:20 +0800590 logging.exception('Error retrieving EC console log')
591
Vic Yang079f9872013-07-01 11:32:00 +0800592 if ec_panic_info is None:
593 try:
594 board = system.GetBoard()
595 ec_panic_info = board.GetECPanicInfo()
596 logging.info('EC panic info after reboot:\n%s\n', ec_panic_info)
597 except: # pylint: disable=W0702
598 logging.exception('Error retrieving EC panic info')
599
Jon Salz0697cbf2012-07-04 15:14:04 +0800600 error_msg = 'Unexpected shutdown while test was running'
601 self.event_log.Log('end_test',
602 path=test.path,
603 status=TestState.FAILED,
604 invocation=test.get_state().invocation,
605 error_msg=error_msg,
Vic Yanga9c32212012-08-16 20:07:54 +0800606 var_log_messages='\n'.join(var_log_messages),
607 mosys_log=mosys_log)
Jon Salz0697cbf2012-07-04 15:14:04 +0800608 test.update_state(
609 status=TestState.FAILED,
610 error_msg=error_msg)
Hung-Te Linf2f78f72012-02-08 19:27:11 +0800611
Jon Salz50efe942012-07-26 11:54:10 +0800612 if not test.never_fails:
613 # For "never_fails" tests (such as "Start"), don't cancel
614 # pending tests, since reboot is expected.
615 factory.console.info('Unexpected shutdown while test %s '
616 'running; cancelling any pending tests',
617 test.path)
618 self.state_instance.set_shared_data('tests_after_shutdown', [])
Jon Salz69806bb2012-07-20 18:05:02 +0800619
Jon Salz008f4ea2012-08-28 05:39:45 +0800620 self.update_skipped_tests()
621
622 def update_skipped_tests(self):
623 '''
624 Updates skipped states based on run_if.
625 '''
Jon Salz885dcac2013-07-23 16:39:50 +0800626 env = TestArgEnv()
Jon Salz008f4ea2012-08-28 05:39:45 +0800627 for t in self.test_list.walk():
Jon Salz885dcac2013-07-23 16:39:50 +0800628 if t.is_leaf() and (t.run_if_table_name or t.run_if_expr):
629 value = None
630
631 if t.run_if_expr:
632 try:
633 value = t.run_if_expr(env)
634 except: # pylint: disable=W0702
635 logging.exception('Unable to evaluate run_if expression for %s',
636 t.path)
637 # But keep going; we have no choice. This will end up
638 # always activating the test.
639 else:
640 try:
641 aux = shopfloor.get_selected_aux_data(t.run_if_table_name)
642 value = aux.get(t.run_if_col)
643 except ValueError:
644 # Not available; assume it shouldn't be skipped
645 pass
646
647 if value is None:
648 skip = False
649 else:
650 skip = (not value) ^ t.run_if_not
Jon Salz008f4ea2012-08-28 05:39:45 +0800651
652 test_state = t.get_state()
653 if ((not skip) and
654 (test_state.status == TestState.PASSED) and
655 (test_state.error_msg == TestState.SKIPPED_MSG)):
656 # It was marked as skipped before, but now we need to run it.
657 # Mark as untested.
658 t.update_state(skip=skip, status=TestState.UNTESTED, error_msg='')
659 else:
660 t.update_state(skip=skip)
661
def show_next_active_test(self):
  '''
  Makes the active leaf test after the currently visible one visible.

  Wraps around at the end of the list of active tests; if the visible test
  is not among them, the first active test is shown.  Does nothing when no
  test is active.
  '''
  self.reap_completed_tests()

  running = []
  for node in self.test_list.walk():
    if node.is_leaf() and node.get_state().status == TestState.ACTIVE:
      running.append(node)
  if not running:
    return

  try:
    current_index = running.index(self.visible_test)
  except ValueError:
    # The visible test is not active (or there is none); start at the top.
    candidate = running[0]
  else:
    candidate = running[(current_index + 1) % len(running)]

  self.set_visible_test(candidate)
Jon Salz4f6c7172012-06-11 20:45:36 +0800680
def handle_event(self, event):
  '''
  Dispatches an event to the handler registered for its type.

  Events whose type has no entry in self.event_handlers are only logged at
  debug level.
  '''
  callback = self.event_handlers.get(event.type)
  if not callback:
    # Not every event type has a handler; silently drop the rest.
    logging.debug('Unbound event type %s', event.type)
    return
  callback(event)
Jon Salz4f6c7172012-06-11 20:45:36 +0800692
def check_critical_factory_note(self):
  '''
  Returns True if the last factory note is critical.

  Reads the optional 'factory_note' shared data from the state instance
  and inspects the 'level' field of its last entry.

  Returns:
    True if there is at least one note and the last one has level
    'CRITICAL'; False otherwise (including when there are no notes).
  '''
  notes = self.state_instance.get_shared_data('factory_note', True)
  # bool() keeps the result a real boolean instead of leaking None or [].
  return bool(notes) and notes[-1]['level'] == 'CRITICAL'
699
def run_next_test(self):
  '''
  Runs the next eligible test (or tests) in self.tests_to_run.

  Tests are taken from the left of the queue.  The method returns without
  starting anything when the head of the queue has to wait (it is already
  running, a require_run test is still active, or a non-backgroundable
  test is in flight), and it empties the queue outright when the last
  factory note is critical.  ShutdownStep tests are handled inline here
  rather than through _run_test.
  '''
  self.reap_completed_tests()
  if self.tests_to_run and self.check_critical_factory_note():
    # A critical factory note blocks all further testing.
    self.tests_to_run.clear()
    return
  while self.tests_to_run:
    logging.debug('Tests to run: %s',
                  [x.path for x in self.tests_to_run])

    # Peek only; the test is popped once we know what to do with it.
    test = self.tests_to_run[0]

    if test in self.invocations:
      logging.info('Next test %s is already running', test.path)
      self.tests_to_run.popleft()
      return

    # Wait while any test this one depends on is still running.
    for requirement in test.require_run:
      for i in requirement.test.walk():
        if i.get_state().status == TestState.ACTIVE:
          logging.info('Waiting for active test %s to complete '
                       'before running %s', i.path, test.path)
          return

    # Tests may only overlap when the new test and every running test are
    # all backgroundable.
    if self.invocations and not (test.backgroundable and all(
        [x.backgroundable for x in self.invocations])):
      logging.debug('Waiting for non-backgroundable tests to '
                    'complete before running %s', test.path)
      return

    if test.get_state().skip:
      # Skipped tests are recorded as PASSED with a marker message so that
      # update_skipped_tests can recognize them later.
      factory.console.info('Skipping test %s', test.path)
      test.update_state(status=TestState.PASSED,
                        error_msg=TestState.SKIPPED_MSG)
      self.tests_to_run.popleft()
      continue

    self.tests_to_run.popleft()

    # Collect, per requirement, the first prerequisite that has not been
    # run (or has not passed, when the requirement demands a pass).
    untested = set()
    for requirement in test.require_run:
      for i in requirement.test.walk():
        if i == test:
          # We've hit this test itself; stop checking
          break
        if ((i.get_state().status == TestState.UNTESTED) or
            (requirement.passed and i.get_state().status !=
             TestState.PASSED)):
          # Found an untested test; move on to the next
          # element in require_run.
          untested.add(i)
          break

    if untested:
      untested_paths = ', '.join(sorted([x.path for x in untested]))
      if self.state_instance.get_shared_data('engineering_mode',
                                             optional=True):
        # In engineering mode, we'll let it go.
        factory.console.warn('In engineering mode; running '
                             '%s even though required tests '
                             '[%s] have not completed',
                             test.path, untested_paths)
      else:
        # Not in engineering mode; mark it failed.
        error_msg = ('Required tests [%s] have not been run yet'
                     % untested_paths)
        factory.console.error('Not running %s: %s',
                              test.path, error_msg)
        test.update_state(status=TestState.FAILED,
                          error_msg=error_msg)
        continue

    if isinstance(test, factory.ShutdownStep):
      if os.path.exists(NO_REBOOT_FILE):
        # The presence of this file vetoes any shutdown/reboot step.
        test.update_state(
            status=TestState.FAILED, increment_count=1,
            error_msg=('Skipped shutdown since %s is present' %
                       NO_REBOOT_FILE))
        continue

      test.update_state(status=TestState.ACTIVE, increment_count=1,
                        error_msg='', shutdown_count=0)
      if self._prompt_cancel_shutdown(test, 1):
        self.event_log.Log('reboot_cancelled')
        test.update_state(
            status=TestState.FAILED, increment_count=1,
            error_msg='Shutdown aborted by operator',
            shutdown_count=0)
        continue

      # Save pending test list in the state server
      self.state_instance.set_shared_data(
          'tests_after_shutdown',
          [t.path for t in self.tests_to_run])
      # Save shutdown time
      self.state_instance.set_shared_data('shutdown_time',
                                          time.time())

      # NOTE(review): the extent of this "with" block was reconstructed
      # from an unindented listing -- confirm that only the two statements
      # below are meant to run under env.lock.
      with self.env.lock:
        self.event_log.Log('shutdown', operation=test.operation)
        shutdown_result = self.env.shutdown(test.operation)
      if shutdown_result:
        # That's all, folks!
        self.run_queue.put(None)
        return
      else:
        # Just pass (e.g., in the chroot).
        test.update_state(status=TestState.PASSED)
        self.state_instance.set_shared_data(
            'tests_after_shutdown', None)
        # Send event with no fields to indicate that there is no
        # longer a pending shutdown.
        self.event_client.post_event(Event(
            Event.Type.PENDING_SHUTDOWN))
        continue

    # Ordinary test: start it and loop, so that further backgroundable
    # tests at the head of the queue can be started as well.
    self._run_test(test, test.iterations, test.retries)
Jon Salz1acc8742012-07-17 17:45:55 +0800819
def _run_test(self, test, iterations_left=None, retries_left=None):
  '''
  Creates and starts a TestInvocation for a single test.

  Marks the test ACTIVE, registers the invocation in self.invocations,
  makes the test visible if nothing is visible yet and it has a UI, then
  re-evaluates exclusive resources before starting the invocation.

  Args:
    test: The test to run.
    iterations_left: Passed through to test.update_state().
    retries_left: Passed through to test.update_state().
  '''
  invocation = TestInvocation(self, test, on_completion=self.run_next_test)
  is_visible = (self.visible_test == test)
  state = test.update_state(
      status=TestState.ACTIVE,
      increment_count=1,
      error_msg='',
      invocation=invocation.uuid,
      iterations_left=iterations_left,
      retries_left=retries_left,
      visible=is_visible)
  invocation.count = state.count
  self.invocations[test] = invocation

  if self.visible_test is None and test.has_ui:
    self.set_visible_test(test)

  # Must run after the invocation is registered so that this test's
  # exclusivity is taken into account.
  self.check_exclusive()
  invocation.start()
Jon Salz5f2a0672012-05-22 17:14:06 +0800834
def check_exclusive(self):
  '''
  Reconciles exclusive resources with the set of running tests.

  Computes which EXCLUSIVE_OPTIONS items are currently claimed by at least
  one test in self.invocations, compares that with the previously recorded
  self.exclusive_items, and toggles networking, cpufreq management and
  charge control accordingly.  The newly computed set is stored back in
  self.exclusive_items.
  '''
  # alias since this is really long
  EXCL_OPT = factory.FactoryTest.EXCLUSIVE_OPTIONS

  current_exclusive_items = set([
      item for item in EXCL_OPT
      if any([test.is_exclusive(item) for test in self.invocations])])

  # Items that have just become exclusive.
  new_exclusive_items = current_exclusive_items - self.exclusive_items
  if EXCL_OPT.NETWORKING in new_exclusive_items:
    logging.info('Disabling network')
    self.connection_manager.DisableNetworking()
  if EXCL_OPT.CHARGER in new_exclusive_items:
    # Only logged here; the actual effect is that the charge adjustment
    # further down is skipped while the charger is exclusive.
    logging.info('Stop controlling charger')

  # Items that have just stopped being exclusive.
  new_non_exclusive_items = self.exclusive_items - current_exclusive_items
  if EXCL_OPT.NETWORKING in new_non_exclusive_items:
    logging.info('Re-enabling network')
    self.connection_manager.EnableNetworking()
  if EXCL_OPT.CHARGER in new_non_exclusive_items:
    logging.info('Start controlling charger')

  if self.cpufreq_manager:
    # Unlike networking, this is applied on every call, not only on a
    # change of state.
    enabled = EXCL_OPT.CPUFREQ not in current_exclusive_items
    try:
      self.cpufreq_manager.SetEnabled(enabled)
    except:  # pylint: disable=W0702
      logging.exception('Unable to %s cpufreq services',
                        'enable' if enabled else 'disable')

  # Only adjust charge state if not excluded
  if (EXCL_OPT.CHARGER not in current_exclusive_items and
      not utils.in_chroot()):
    if self.charge_manager:
      self.charge_manager.AdjustChargeState()
    else:
      # Without a charge manager, fall back to plain charging.
      try:
        system.GetBoard().SetChargeState(Board.ChargeState.CHARGE)
      except BoardException:
        logging.exception('Unable to set charge state on this board')

  self.exclusive_items = current_exclusive_items
Jon Salz5da61e62012-05-31 13:06:22 +0800877
def check_for_updates(self):
  '''
  Kicks off an asynchronous update check when one is due.

  Nothing happens if update_period_secs is unset in the test list options,
  or if less than that many seconds have passed since the last check.
  When the check reaches the shopfloor and reports a different update
  MD5SUM, it is recorded on system.SystemInfo and a system-info refresh is
  put on the run queue.
  '''
  period_secs = self.test_list.options.update_period_secs
  if not period_secs:
    # Periodic update checks are disabled.
    return

  current_time = time.time()
  previous_check = self.last_update_check
  if previous_check and (current_time - previous_check < period_secs):
    # Too soon since the last check.
    return

  self.last_update_check = current_time

  def handle_check_for_update(reached_shopfloor, md5sum, needs_update):
    if not reached_shopfloor:
      return
    new_update_md5sum = md5sum if needs_update else None
    if system.SystemInfo.update_md5sum == new_update_md5sum:
      return
    logging.info('Received new update MD5SUM: %s', new_update_md5sum)
    system.SystemInfo.update_md5sum = new_update_md5sum
    self.run_queue.put(self.update_system_info)

  updater.CheckForUpdateAsync(
      handle_check_for_update,
      self.test_list.options.shopfloor_timeout_secs)
906
def cancel_pending_tests(self):
  '''Empties the queue of pending tests by scheduling an empty selection.'''
  nothing_to_run = []
  self.run_tests(nothing_to_run)
910
def run_tests(self, subtrees, untested_only=False):
  '''
  Runs tests under subtree.

  Replaces self.tests_to_run with the leaf tests found under the given
  subtrees (in walk order) and then calls run_next_test() to start them.

  Backgroundable tests are run simultaneously; when a foreground test is
  encountered, we wait for all active tests to finish before continuing.

  @param subtrees: Node or nodes containing tests to run (may either be
    a single test or a list).  Duplicates will be ignored.
  @param untested_only: If true, only leaf tests whose current status is
    TestState.UNTESTED are queued.
  '''
  # isinstance (rather than an exact type comparison) so that list
  # subclasses are treated as lists too instead of as a single node.
  if not isinstance(subtrees, list):
    subtrees = [subtrees]

  # Nodes we've seen so far, to avoid duplicates.
  seen = set()

  self.tests_to_run = deque()
  for subtree in subtrees:
    for test in subtree.walk():
      if test in seen:
        continue
      seen.add(test)

      if not test.is_leaf():
        # Only leaves are runnable; inner nodes are just containers.
        continue
      if (untested_only and
          test.get_state().status != TestState.UNTESTED):
        continue
      self.tests_to_run.append(test)
  self.run_next_test()
Hung-Te Linf2f78f72012-02-08 19:27:11 +0800942
def reap_completed_tests(self):
  '''
  Removes completed tests from the set of active tests.

  For each completed invocation the test state is updated from the
  invocation's update_state_on_completion, and the test is re-run if it
  passed with iterations left or failed with retries left.  If the
  stop_on_failure option is set and a test failed, the queue of pending
  tests is emptied.

  Also updates the visible test if it was reaped.
  '''
  test_completed = False
  # Iterate over a snapshot, since entries are deleted (and possibly
  # re-added by _run_test) while looping.
  for t, v in list(self.invocations.items()):
    if not v.is_completed():
      continue

    test_completed = True
    new_state = t.update_state(**v.update_state_on_completion)
    del self.invocations[t]

    # Stop on failure if flag is true.
    if (self.test_list.options.stop_on_failure and
        new_state.status == TestState.FAILED):
      # Clean all the tests to cause goofy to stop.  This must stay a
      # deque: the rest of the class calls popleft()/clear() on it.
      self.tests_to_run = deque()
      factory.console.info("Stop on failure triggered. Empty the queue.")

    if new_state.iterations_left and new_state.status == TestState.PASSED:
      # Play it again, Sam!
      self._run_test(t)
    # new_state.retries_left is obtained after update.
    # For retries_left == 0, test can still be run for the last time.
    # The explicit None check spells out what the bare ">= 0" comparison
    # already evaluates to for None under Python 2 (False).
    elif (new_state.retries_left is not None and
          new_state.retries_left >= 0 and
          new_state.status == TestState.FAILED):
      # Still have to retry, Sam!
      self._run_test(t)

  if test_completed:
    self.log_watcher.KickWatchThread()

  if (self.visible_test is None or
      self.visible_test not in self.invocations):
    self.set_visible_test(None)
    # Make the first running test, if any, the visible test
    for t in self.test_list.walk():
      if t in self.invocations:
        self.set_visible_test(t)
        break
984
def kill_active_tests(self, abort, root=None, reason=None):
  '''
  Aborts every running test (optionally only those under root) and waits
  for each of them to finish.

  Args:
    abort: True to leave killed tests in the state reported by their
      invocation; False to reset them to UNTESTED afterwards.
    root: If set, only tests that have root as an ancestor are killed.
    reason: Passed to each invocation's abort_and_join().
  '''
  self.reap_completed_tests()

  # Work on a snapshot because entries are removed while looping.
  for active_test, invocation in list(self.invocations.items()):
    outside_root = root and not active_test.has_ancestor(root)
    if outside_root:
      continue

    factory.console.info('Killing active test %s...' % active_test.path)
    invocation.abort_and_join(reason)
    factory.console.info('Killed %s' % active_test.path)

    active_test.update_state(**invocation.update_state_on_completion)
    del self.invocations[active_test]

    if abort:
      continue
    active_test.update_state(status=TestState.UNTESTED)

  self.reap_completed_tests()
1008
def stop(self, root=None, fail=False, reason=None):
  '''
  Stops running and pending tests, then resumes with whatever is left.

  Args:
    root: If set, only tests under root are killed and dequeued.  If not
      set, all active tests are killed and the whole queue is dropped.
    fail: Passed to kill_active_tests() as its abort argument.
    reason: Passed on to kill_active_tests().
  '''
  self.kill_active_tests(fail, root, reason)

  # Keep only queued tests that are outside the root being stopped.
  remaining = deque()
  for queued in self.tests_to_run:
    if root and not queued.has_ancestor(root):
      remaining.append(queued)
  self.tests_to_run = remaining

  self.run_next_test()
Jon Salz0697cbf2012-07-04 15:14:04 +08001015
def clear_state(self, root=None):
  '''
  Stops everything under root and resets its leaf tests to UNTESTED.

  Args:
    root: Subtree to clear; defaults to the whole test list.
  '''
  target = self.test_list if root is None else root
  self.stop(target, reason='Clearing test state')
  for node in target.walk():
    if not node.is_leaf():
      continue
    node.update_state(status=TestState.UNTESTED)
1023
def abort_active_tests(self, reason=None):
  '''Kills all active tests with abort set, passing reason along.'''
  self.kill_active_tests(abort=True, reason=reason)
Jon Salz0697cbf2012-07-04 15:14:04 +08001026
def main(self):
  '''
  Entry point: initializes Goofy, then runs it.

  The outcome of initialization is recorded as a 'goofy_init' event.  Any
  exception raised during initialization is re-raised after an attempt to
  log it.
  '''
  syslog.openlog('goofy')

  try:
    self.status = Status.INITIALIZING
    self.init()
    self.event_log.Log('goofy_init',
                       success=True)
  except:
    # The event log may not exist yet if init() failed early.
    if self.event_log:
      try:
        self.event_log.Log('goofy_init',
                           success=False,
                           trace=traceback.format_exc())
      except:  # pylint: disable=W0702
        # Best effort only; the original exception is what matters and is
        # re-raised below.
        pass
    raise

  self.status = Status.RUNNING
  syslog.syslog('Goofy (factory test harness) starting')
  self.run()
1048
def update_system_info(self):
  '''
  Takes a fresh system-info snapshot and publishes it.

  The snapshot is stored as 'system_info' shared data, posted as a
  SYSTEM_INFO event and written to the log.
  '''
  info = system.SystemInfo().__dict__
  self.state_instance.set_shared_data('system_info', info)
  info_event = Event(Event.Type.SYSTEM_INFO, system_info=info)
  self.event_client.post_event(info_event)
  logging.info('System info: %r', info)
1056
def update_factory(self, auto_run_on_restart=False, post_update_hook=None):
  '''Commences updating factory software.

  Active tests are killed (and reset to untested) and pending tests are
  cancelled before the update is attempted.

  Args:
    auto_run_on_restart: Auto-run when the machine comes back up.
    post_update_hook: Code to call after update but immediately before
      restart.

  Returns:
    Never if the update was successful (we just reboot).
    False if the update was unnecessary (no update available).
  '''
  self.kill_active_tests(False, reason='Factory software update')
  self.cancel_pending_tests()

  def pre_update_hook():
    if auto_run_on_restart:
      self.state_instance.set_shared_data('tests_after_shutdown',
                                          FORCE_AUTO_RUN)
    self.state_instance.close()

  if not updater.TryUpdate(pre_update_hook=pre_update_hook):
    # Return False explicitly, as documented, instead of falling through
    # and returning None.
    return False

  if post_update_hook:
    post_update_hook()
  self.env.shutdown('reboot')
Jon Salz0697cbf2012-07-04 15:14:04 +08001082
def handle_sigint(self, dummy_signum, dummy_frame):
  '''
  SIGINT handler: logs the signal, puts None on the run queue and raises
  KeyboardInterrupt.

  Args:
    dummy_signum: Unused.
    dummy_frame: Unused.
  '''
  logging.error('Received SIGINT')
  queue_marker = None
  self.run_queue.put(queue_marker)
  raise KeyboardInterrupt()
1087
def find_kcrashes(self):
  """Finds kcrash files, logs them, and marks them as seen.

  Scans regular files in /var/spool/crash that are not already listed in
  the 'seen_crashes' shared data.  Each new file is logged, and reported
  to the event log as a 'crash_file' event.  Every file visited is added
  to 'seen_crashes', even if handling it failed.
  """
  seen_crashes = set(
      self.state_instance.get_shared_data('seen_crashes', optional=True)
      or [])

  for path in glob.glob('/var/spool/crash/*'):
    if not os.path.isfile(path):
      continue
    if path in seen_crashes:
      continue
    try:
      stat = os.stat(path)
      mtime = utils.TimeString(stat.st_mtime)
      logging.info(
          'Found new crash file %s (%d bytes at %s)',
          path, stat.st_size, mtime)
      extra_log_args = {}

      try:
        _, ext = os.path.splitext(path)
        if ext in ['.kcrash', '.meta']:
          ext = ext.replace('.', '')
          with open(path) as f:
            # Read at most MAX_CRASH_FILE_SIZE; the file position is used
            # below to tell whether the whole file was read.
            data = f.read(MAX_CRASH_FILE_SIZE)
            tell = f.tell()
          # Each line of the contents is prefixed with "<ext>> " in the
          # log output.
          logging.info(
              'Contents of %s%s:%s',
              path,
              ('' if tell == stat.st_size
               else '(truncated to %d bytes)' % MAX_CRASH_FILE_SIZE),
              ('\n' + data).replace('\n', '\n ' + ext + '> '))
          extra_log_args['data'] = data

          # NOTE(review): nesting reconstructed from an unindented
          # listing -- confirm that the copy below belongs inside the
          # extension check above.
          # Copy to /var/factory/kcrash for posterity
          kcrash_dir = factory.get_factory_root('kcrash')
          utils.TryMakeDirs(kcrash_dir)
          shutil.copy(path, kcrash_dir)
          logging.info('Copied to %s',
                       os.path.join(kcrash_dir, os.path.basename(path)))
      finally:
        # Even if something goes wrong with the above, still try to
        # log to event log
        self.event_log.Log('crash_file',
                           path=path, size=stat.st_size, mtime=mtime,
                           **extra_log_args)
    except:  # pylint: disable=W0702
      logging.exception('Unable to handle crash files %s', path)
    # Mark as seen regardless of success so that the file is not
    # processed again on the next scan.
    seen_crashes.add(path)

  self.state_instance.set_shared_data('seen_crashes', list(seen_crashes))
1139
def GetTestList(self, test_list_id):
  """Looks up a loaded test list by its ID.

  Args:
    test_list_id: Key into self.test_lists.

  Returns:
    The entry of self.test_lists stored under test_list_id.

  Raises:
    TestListError: The test list ID is not valid.
  """
  if test_list_id in self.test_lists:
    return self.test_lists[test_list_id]

  available_ids = ', '.join(sorted(self.test_lists.keys()))
  raise test_lists.TestListError(
      '%r is not a valid test list ID (available IDs are [%s])' % (
          test_list_id, available_ids))
1152
def InitTestLists(self):
  """Reads in all test lists and sets the active test list.

  Populates self.test_lists and self.test_list.  If self.options.test_list
  is not set, it is filled in from test_lists.GetActiveTestListId().  A
  value containing a path separator is read as an old-style test list
  file; anything else is looked up by ID via GetTestList().
  """
  self.test_lists = test_lists.BuildAllTestLists()
  logging.info('Loaded test lists: [%s]',
               test_lists.DescribeTestLists(self.test_lists))

  if not self.options.test_list:
    self.options.test_list = test_lists.GetActiveTestListId()

  if os.sep in self.options.test_list:
    # It's a path pointing to an old-style test list; use it.
    self.test_list = factory.read_test_list(self.options.test_list)
  else:
    self.test_list = self.GetTestList(self.options.test_list)

  logging.info('Active test list: %s', self.test_list.test_list_id)

  if isinstance(self.test_list, test_lists.OldStyleTestList):
    # Actually load it in.  (See OldStyleTestList for an explanation
    # of why this is necessary.)
    self.test_list = self.test_list.Load()

  # Give the active test list access to the state instance.
  self.test_list.state_instance = self.state_instance
1176
def init_hooks(self):
  """Instantiates the hooks class named in the test list options.

  The hooks_class option is a dotted path; everything before the last dot
  is imported as a module and the final component is looked up in it and
  instantiated with no arguments.  The instance is given the test list and
  its OnCreatedTestList() is called.

  Must run after self.test_list ready.
  """
  hooks_path = self.test_list.options.hooks_class
  module_name, class_name = hooks_path.rsplit('.', 1)
  hooks_module = __import__(module_name, fromlist=[class_name])
  hooks_class = getattr(hooks_module, class_name)

  self.hooks = hooks_class()
  assert isinstance(self.hooks, factory.Hooks), (
      "hooks should be of type Hooks but is %r" % type(self.hooks))
  self.hooks.test_list = self.test_list
  self.hooks.OnCreatedTestList()
Shuo-Peng Liao52b90da2013-06-30 17:00:06 +08001188
Jon Salz0697cbf2012-07-04 15:14:04 +08001189 def init(self, args=None, env=None):
1190 '''Initializes Goofy.
1191
1192 Args:
1193 args: A list of command-line arguments. Uses sys.argv if
1194 args is None.
1195 env: An Environment instance to use (or None to choose
1196 FakeChrootEnvironment or DUTEnvironment as appropriate).
1197 '''
Jon Salz77c151e2012-08-28 07:20:37 +08001198 signal.signal(signal.SIGINT, self.handle_sigint)
1199
Jon Salz0697cbf2012-07-04 15:14:04 +08001200 parser = OptionParser()
1201 parser.add_option('-v', '--verbose', dest='verbose',
Jon Salz8fa8e832012-07-13 19:04:09 +08001202 action='store_true',
1203 help='Enable debug logging')
Jon Salz0697cbf2012-07-04 15:14:04 +08001204 parser.add_option('--print_test_list', dest='print_test_list',
Jon Salz8fa8e832012-07-13 19:04:09 +08001205 metavar='FILE',
1206 help='Read and print test list FILE, and exit')
Jon Salz0697cbf2012-07-04 15:14:04 +08001207 parser.add_option('--restart', dest='restart',
Jon Salz8fa8e832012-07-13 19:04:09 +08001208 action='store_true',
1209 help='Clear all test state')
Jon Salz0697cbf2012-07-04 15:14:04 +08001210 parser.add_option('--ui', dest='ui', type='choice',
Jon Salz8fa8e832012-07-13 19:04:09 +08001211 choices=['none', 'gtk', 'chrome'],
Jon Salz2f881df2013-02-01 17:00:35 +08001212 default='chrome',
Jon Salz8fa8e832012-07-13 19:04:09 +08001213 help='UI to use')
Jon Salz0697cbf2012-07-04 15:14:04 +08001214 parser.add_option('--ui_scale_factor', dest='ui_scale_factor',
Jon Salz8fa8e832012-07-13 19:04:09 +08001215 type='int', default=1,
1216 help=('Factor by which to scale UI '
1217 '(Chrome UI only)'))
Jon Salz0697cbf2012-07-04 15:14:04 +08001218 parser.add_option('--test_list', dest='test_list',
Jon Salz8fa8e832012-07-13 19:04:09 +08001219 metavar='FILE',
1220 help='Use FILE as test list')
Jon Salzc79a9982012-08-30 04:42:01 +08001221 parser.add_option('--dummy_shopfloor', action='store_true',
1222 help='Use a dummy shopfloor server')
chungyiafe8f772012-08-15 19:36:29 +08001223 parser.add_option('--automation', dest='automation',
1224 action='store_true',
1225 help='Enable automation on running factory test')
Ricky Liang09216dc2013-02-22 17:26:45 +08001226 parser.add_option('--one_pixel_less', dest='one_pixel_less',
1227 action='store_true',
1228 help=('Start Chrome one pixel less than the full screen.'
1229 'Needed by Exynos platform to run GTK.'))
Jon Salz0697cbf2012-07-04 15:14:04 +08001230 (self.options, self.args) = parser.parse_args(args)
1231
Jon Salz46b89562012-07-05 11:49:22 +08001232 # Make sure factory directories exist.
1233 factory.get_log_root()
1234 factory.get_state_root()
1235 factory.get_test_data_root()
1236
Jon Salz0697cbf2012-07-04 15:14:04 +08001237 global _inited_logging # pylint: disable=W0603
1238 if not _inited_logging:
1239 factory.init_logging('goofy', verbose=self.options.verbose)
1240 _inited_logging = True
Jon Salz8fa8e832012-07-13 19:04:09 +08001241
Jon Salz0f996602012-10-03 15:26:48 +08001242 if self.options.print_test_list:
1243 print factory.read_test_list(
1244 self.options.print_test_list).__repr__(recursive=True)
1245 sys.exit(0)
1246
Jon Salzee85d522012-07-17 14:34:46 +08001247 event_log.IncrementBootSequence()
Jon Salzd15bbcf2013-05-21 17:33:57 +08001248 # Don't defer logging the initial event, so we can make sure
1249 # that device_id, reimage_id, etc. are all set up.
1250 self.event_log = EventLog('goofy', defer=False)
Jon Salz0697cbf2012-07-04 15:14:04 +08001251
1252 if (not suppress_chroot_warning and
1253 factory.in_chroot() and
1254 self.options.ui == 'gtk' and
1255 os.environ.get('DISPLAY') in [None, '', ':0', ':0.0']):
1256 # That's not going to work! Tell the user how to run
1257 # this way.
1258 logging.warn(GOOFY_IN_CHROOT_WARNING)
1259 time.sleep(1)
1260
1261 if env:
1262 self.env = env
1263 elif factory.in_chroot():
1264 self.env = test_environment.FakeChrootEnvironment()
1265 logging.warn(
1266 'Using chroot environment: will not actually run autotests')
1267 else:
1268 self.env = test_environment.DUTEnvironment()
1269 self.env.goofy = self
1270
1271 if self.options.restart:
1272 state.clear_state()
1273
Jon Salz0697cbf2012-07-04 15:14:04 +08001274 if self.options.ui_scale_factor != 1 and utils.in_qemu():
1275 logging.warn(
1276 'In QEMU; ignoring ui_scale_factor argument')
1277 self.options.ui_scale_factor = 1
1278
1279 logging.info('Started')
1280
1281 self.start_state_server()
1282 self.state_instance.set_shared_data('hwid_cfg', get_hwid_cfg())
1283 self.state_instance.set_shared_data('ui_scale_factor',
Ricky Liang09216dc2013-02-22 17:26:45 +08001284 self.options.ui_scale_factor)
1285 self.state_instance.set_shared_data('one_pixel_less',
1286 self.options.one_pixel_less)
Jon Salz0697cbf2012-07-04 15:14:04 +08001287 self.last_shutdown_time = (
1288 self.state_instance.get_shared_data('shutdown_time', optional=True))
1289 self.state_instance.del_shared_data('shutdown_time', optional=True)
Jon Salzb19ea072013-02-07 16:35:00 +08001290 self.state_instance.del_shared_data('startup_error', optional=True)
Jon Salz0697cbf2012-07-04 15:14:04 +08001291
Jon Salz128b0932013-07-03 16:55:26 +08001292 try:
1293 self.InitTestLists()
1294 except: # pylint: disable=W0702
1295 logging.exception('Unable to initialize test lists')
1296 self.state_instance.set_shared_data(
1297 'startup_error',
1298 'Unable to initialize test lists\n%s' % (
1299 traceback.format_exc()))
Jon Salzb19ea072013-02-07 16:35:00 +08001300 if self.options.ui == 'chrome':
1301 # Create an empty test list with default options so that the rest of
1302 # startup can proceed.
1303 self.test_list = factory.FactoryTestList(
1304 [], self.state_instance, factory.Options())
1305 else:
1306 # Bail with an error; no point in starting up.
1307 sys.exit('No valid test list; exiting.')
1308
Shuo-Peng Liao268b40b2013-07-01 15:58:59 +08001309 self.init_hooks()
1310
Jon Salz822838b2013-03-25 17:32:33 +08001311 if self.test_list.options.clear_state_on_start:
1312 self.state_instance.clear_test_state()
1313
Vic Yang3e1cf5d2013-06-05 18:50:24 +08001314 if system.SystemInfo().firmware_version is None and not utils.in_chroot():
Vic Yang9bd4f772013-06-04 17:34:00 +08001315 self.state_instance.set_shared_data('startup_error',
1316 'Netboot firmware detected\n'
1317 'Connect Ethernet and reboot to re-image.\n'
1318 u'侦测到网路开机固件\n'
1319 u'请连接乙太网并重启')
1320
Jon Salz0697cbf2012-07-04 15:14:04 +08001321 if not self.state_instance.has_shared_data('ui_lang'):
1322 self.state_instance.set_shared_data('ui_lang',
1323 self.test_list.options.ui_lang)
1324 self.state_instance.set_shared_data(
1325 'test_list_options',
1326 self.test_list.options.__dict__)
1327 self.state_instance.test_list = self.test_list
1328
Cheng-Yi Chiang39d32ad2013-07-23 15:02:38 +08001329 self.check_log_rotation()
Jon Salz83ef34b2012-11-01 19:46:35 +08001330
Jon Salz23926422012-09-01 03:38:13 +08001331 if self.options.dummy_shopfloor:
1332 os.environ[shopfloor.SHOPFLOOR_SERVER_ENV_VAR_NAME] = (
1333 'http://localhost:%d/' % shopfloor.DEFAULT_SERVER_PORT)
1334 self.dummy_shopfloor = Spawn(
1335 [os.path.join(factory.FACTORY_PATH, 'bin', 'shopfloor_server'),
1336 '--dummy'])
1337 elif self.test_list.options.shopfloor_server_url:
1338 shopfloor.set_server_url(self.test_list.options.shopfloor_server_url)
Jon Salz2bf2f6b2013-03-28 18:49:26 +08001339 shopfloor.set_enabled(True)
Jon Salz23926422012-09-01 03:38:13 +08001340
Jon Salz0f996602012-10-03 15:26:48 +08001341 if self.test_list.options.time_sanitizer and not utils.in_chroot():
Jon Salz8fa8e832012-07-13 19:04:09 +08001342 self.time_sanitizer = time_sanitizer.TimeSanitizer(
1343 base_time=time_sanitizer.GetBaseTimeFromFile(
1344 # lsb-factory is written by the factory install shim during
1345 # installation, so it should have a good time obtained from
Jon Salz54882d02012-08-31 01:57:54 +08001346 # the mini-Omaha server. If it's not available, we'll use
1347 # /etc/lsb-factory (which will be much older, but reasonably
1348 # sane) and rely on a shopfloor sync to set a more accurate
1349 # time.
1350 '/usr/local/etc/lsb-factory',
1351 '/etc/lsb-release'))
Jon Salz8fa8e832012-07-13 19:04:09 +08001352 self.time_sanitizer.RunOnce()
1353
Vic Yangd8990da2013-06-27 16:57:43 +08001354 if self.test_list.options.check_cpu_usage_period_secs:
1355 self.cpu_usage_watcher = Spawn(['py/tools/cpu_usage_monitor.py',
1356 '-p', str(self.test_list.options.check_cpu_usage_period_secs)],
1357 cwd=factory.FACTORY_PATH)
1358
Jon Salz0697cbf2012-07-04 15:14:04 +08001359 self.init_states()
1360 self.start_event_server()
1361 self.connection_manager = self.env.create_connection_manager(
Tai-Hsu Lin371351a2012-08-27 14:17:14 +08001362 self.test_list.options.wlans,
1363 self.test_list.options.scan_wifi_period_secs)
Jon Salz0697cbf2012-07-04 15:14:04 +08001364 # Note that we create a log watcher even if
1365 # sync_event_log_period_secs isn't set (no background
1366 # syncing), since we may use it to flush event logs as well.
1367 self.log_watcher = EventLogWatcher(
1368 self.test_list.options.sync_event_log_period_secs,
Jon Salzd15bbcf2013-05-21 17:33:57 +08001369 event_log_db_file=None,
Jon Salz16d10542012-07-23 12:18:45 +08001370 handle_event_logs_callback=self.handle_event_logs)
Jon Salz0697cbf2012-07-04 15:14:04 +08001371 if self.test_list.options.sync_event_log_period_secs:
1372 self.log_watcher.StartWatchThread()
1373
Cheng-Yi Chiang344b10f2013-05-03 16:44:03 +08001374 # Note that we create a system log manager even if
1375 # sync_log_period_secs isn't set (no background
1376 # syncing), since we may kick it to sync logs in its
1377 # thread.
Cheng-Yi Chiangd3516a32013-07-17 15:30:47 +08001378 if self.test_list.options.enable_sync_log:
1379 self.system_log_manager = SystemLogManager(
1380 sync_log_paths=self.test_list.options.sync_log_paths,
1381 sync_period_sec=self.test_list.options.sync_log_period_secs,
1382 clear_log_paths=self.test_list.options.clear_log_paths)
1383 self.system_log_manager.StartSyncThread()
Cheng-Yi Chiang344b10f2013-05-03 16:44:03 +08001384
Jon Salz0697cbf2012-07-04 15:14:04 +08001385 self.update_system_info()
1386
Vic Yang4953fc12012-07-26 16:19:53 +08001387 assert ((self.test_list.options.min_charge_pct is None) ==
1388 (self.test_list.options.max_charge_pct is None))
Vic Yange83d9a12013-04-19 20:00:20 +08001389 if utils.in_chroot():
1390 logging.info('In chroot, ignoring charge manager and charge state')
1391 elif self.test_list.options.min_charge_pct is not None:
Vic Yang4953fc12012-07-26 16:19:53 +08001392 self.charge_manager = ChargeManager(self.test_list.options.min_charge_pct,
1393 self.test_list.options.max_charge_pct)
Jon Salzad7353b2012-10-15 16:22:46 +08001394 system.SystemStatus.charge_manager = self.charge_manager
Cheng-Yi Chiangd8186952013-04-04 23:41:14 +08001395 else:
1396 # Goofy should set charger state to charge if charge_manager is disabled.
1397 try:
1398 system.GetBoard().SetChargeState(Board.ChargeState.CHARGE)
1399 except BoardException:
1400 logging.exception('Unable to set charge state on this board')
Vic Yang4953fc12012-07-26 16:19:53 +08001401
Cheng-Yi Chiangcdfa4182013-05-05 03:20:19 +08001402 self.core_dump_manager = CoreDumpManager(
1403 self.test_list.options.core_dump_watchlist)
1404
Jon Salz0697cbf2012-07-04 15:14:04 +08001405 os.environ['CROS_FACTORY'] = '1'
1406 os.environ['CROS_DISABLE_SITE_SYSINFO'] = '1'
1407
1408 # Set CROS_UI since some behaviors in ui.py depend on the
1409 # particular UI in use. TODO(jsalz): Remove this (and all
1410 # places it is used) when the GTK UI is removed.
1411 os.environ['CROS_UI'] = self.options.ui
1412
Shuo-Peng Liao1ff502e2013-06-30 18:37:02 +08001413 if not utils.in_chroot() and self.test_list.options.use_cpufreq_manager:
Jon Salzddf0d052013-06-18 12:52:44 +08001414 self.cpufreq_manager = CpufreqManager(event_log=self.event_log)
Jon Salzce6a7f82013-06-10 18:22:54 +08001415
Justin Chuang31b02432013-06-27 15:16:51 +08001416 # Startup hooks may want to skip some tests.
1417 self.update_skipped_tests()
Jon Salz416f9cc2013-05-10 18:32:50 +08001418
Jon Salze12c2b32013-06-25 16:24:34 +08001419 self.find_kcrashes()
1420
Shuo-Peng Liao268b40b2013-07-01 15:58:59 +08001421 # Should not move earlier.
1422 self.hooks.OnStartup()
1423
Jon Salz0697cbf2012-07-04 15:14:04 +08001424 if self.options.ui == 'chrome':
1425 self.env.launch_chrome()
1426 logging.info('Waiting for a web socket connection')
Cheng-Yi Chiangfd8ed392013-03-08 21:37:31 +08001427 self.web_socket_manager.wait()
Jon Salz0697cbf2012-07-04 15:14:04 +08001428
1429 # Wait for the test widget size to be set; this is done in
1430 # an asynchronous RPC so there is a small chance that the
1431 # web socket might be opened first.
1432 for _ in range(100): # 10 s
1433 try:
1434 if self.state_instance.get_shared_data('test_widget_size'):
1435 break
Hung-Te Linf2f78f72012-02-08 19:27:11 +08001436 except KeyError:
Jon Salz0697cbf2012-07-04 15:14:04 +08001437 pass # Retry
1438 time.sleep(0.1) # 100 ms
1439 else:
1440 logging.warn('Never received test_widget_size from UI')
Jon Salz45297282013-05-18 14:31:47 +08001441
1442 # Send Chrome a Tab to get focus to the factory UI
1443 # (http://crosbug.com/p/19444). TODO(jsalz): remove this hack
1444 # and figure out the right way to get the focus to Chrome.
1445 if not utils.in_chroot():
1446 Spawn(
1447 [os.path.join(factory.FACTORY_PATH, 'bin', 'send_key'), 'Tab'],
1448 check_call=True, log=True)
Jon Salz0697cbf2012-07-04 15:14:04 +08001449 elif self.options.ui == 'gtk':
1450 self.start_ui()
Hung-Te Linf2f78f72012-02-08 19:27:11 +08001451
Ricky Liang650f6bf2012-09-28 13:22:54 +08001452 # Create download path for autotest beforehand or autotests run at
1453 # the same time might fail due to race condition.
1454 if not factory.in_chroot():
1455 utils.TryMakeDirs(os.path.join('/usr/local/autotest', 'tests',
1456 'download'))
1457
Jon Salz0697cbf2012-07-04 15:14:04 +08001458 def state_change_callback(test, test_state):
1459 self.event_client.post_event(
1460 Event(Event.Type.STATE_CHANGE,
1461 path=test.path, state=test_state))
1462 self.test_list.state_change_callback = state_change_callback
Jon Salz73e0fd02012-04-04 11:46:38 +08001463
Jon Salza6711d72012-07-18 14:33:03 +08001464 for handler in self.on_ui_startup:
1465 handler()
1466
1467 self.prespawner = Prespawner()
1468 self.prespawner.start()
1469
Jon Salz0697cbf2012-07-04 15:14:04 +08001470 try:
1471 tests_after_shutdown = self.state_instance.get_shared_data(
1472 'tests_after_shutdown')
1473 except KeyError:
1474 tests_after_shutdown = None
Jon Salz57717ca2012-04-04 16:47:25 +08001475
Jon Salz5c344f62012-07-13 14:31:16 +08001476 force_auto_run = (tests_after_shutdown == FORCE_AUTO_RUN)
1477 if not force_auto_run and tests_after_shutdown is not None:
Jon Salz0697cbf2012-07-04 15:14:04 +08001478 logging.info('Resuming tests after shutdown: %s',
1479 tests_after_shutdown)
Jon Salz0697cbf2012-07-04 15:14:04 +08001480 self.tests_to_run.extend(
1481 self.test_list.lookup_path(t) for t in tests_after_shutdown)
1482 self.run_queue.put(self.run_next_test)
1483 else:
Jon Salz5c344f62012-07-13 14:31:16 +08001484 if force_auto_run or self.test_list.options.auto_run_on_start:
Jon Salz0697cbf2012-07-04 15:14:04 +08001485 self.run_queue.put(
1486 lambda: self.run_tests(self.test_list, untested_only=True))
Jon Salz5c344f62012-07-13 14:31:16 +08001487 self.state_instance.set_shared_data('tests_after_shutdown', None)
Hung-Te Linf2f78f72012-02-08 19:27:11 +08001488
Dean Liao592e4d52013-01-10 20:06:39 +08001489 self.may_disable_cros_shortcut_keys()
1490
def may_disable_cros_shortcut_keys(self):
  '''Starts a key filter if the test list asks for shortcut keys to be
  disabled.

  Does nothing unless test_list.options.disable_cros_shortcut_keys is
  set.  Otherwise a KeyFilter is built from the disable_caps_lock and
  caps_lock_keycode options, stored in self.key_filter, and started.
  '''
  options = self.test_list.options
  if not options.disable_cros_shortcut_keys:
    return

  logging.info('Filter ChromeOS shortcut keys.')
  key_filter = KeyFilter(
      unmap_caps_lock=options.disable_caps_lock,
      caps_lock_keycode=options.caps_lock_keycode)
  self.key_filter = key_filter
  key_filter.Start()
1499
def run(self):
  '''Runs Goofy's event loop.

  Calls run_once() in blocking mode over and over, and returns as soon
  as run_once() reports (with a false value) that it is time to shut
  down.
  '''
  keep_going = True
  while keep_going:
    keep_going = self.run_once(True)
Jon Salz73e0fd02012-04-04 11:46:38 +08001505
def run_once(self, block=False):
  '''Runs every item currently pending in the event loop.

  While nothing is pending, _run_queue_idle() is invoked; in blocking
  mode the method then waits up to RUN_QUEUE_TIMEOUT_SECS for an item
  and retries (calling _run_queue_idle() again) on timeout.

  Args:
    block: If true, block until at least one event is processed.

  Returns:
    True to keep going or False to shut down (a false item on the
    queue is treated as a shutdown request).
  '''
  pending = utils.DrainQueue(self.run_queue)
  while not pending:
    # Nothing on the run queue.
    self._run_queue_idle()
    if not block:
      break
    # Block for at least one event...
    try:
      first = self.run_queue.get(timeout=RUN_QUEUE_TIMEOUT_SECS)
    except Queue.Empty:
      # Timed out; go around again so that _run_queue_idle() gets
      # another chance to run.
      continue
    pending.append(first)
    # ...and grab anything else that showed up at the same time.
    pending.extend(utils.DrainQueue(self.run_queue))

  for callback in pending:
    if not callback:
      # Shutdown request.
      self.run_queue.task_done()
      return False

    try:
      callback()
    except:  # pylint: disable=W0702
      logging.exception('Error in event loop')
      exc_type, exc_value = sys.exc_info()[:2]
      self.record_exception(
          traceback.format_exception_only(exc_type, exc_value))
      # But keep going
    finally:
      self.run_queue.task_done()
  return True
Jon Salz0405ab52012-03-16 15:26:52 +08001549
def _should_sync_time(self, foreground=False):
  '''Tells whether a time sync with the shopfloor server should be tried.

  The result is truthy only when a sync is wanted (explicitly, or
  because test_list.options.sync_time_period_secs is set), a time
  sanitizer exists, time has not been synced yet, and we are not in
  the chroot.  The checks short-circuit, so a falsy result is whichever
  falsy value was hit first (e.g. None), not necessarily False.

  Args:
    foreground: If True, synchronizes even if background syncing
      is disabled (e.g., in explicit sync requests from the
      SyncShopfloor test).
  '''
  sync_wanted = foreground or self.test_list.options.sync_time_period_secs
  return (sync_wanted and
          self.time_sanitizer and
          (not self.time_synced) and
          (not factory.in_chroot()))
1563
def sync_time_with_shopfloor_server(self, foreground=False):
  '''Syncs time with the shopfloor server unless that is already done.

  The sync is attempted only when _should_sync_time(foreground) says
  so; on success self.time_synced is set to True.

  Args:
    foreground: If True, synchronizes even if background syncing
      is disabled (e.g., in explicit sync requests from the
      SyncShopfloor test).

  Returns:
    The current value of self.time_synced: True if this sync (or a
    previous sync) succeeded; otherwise the flag is returned unchanged
    (e.g., when no time sanitizer is available).

  Raises:
    Whatever time_sanitizer.SyncWithShopfloor() raises, e.g. when the
    shopfloor server cannot be contacted.
  '''
  if not self._should_sync_time(foreground):
    return self.time_synced

  self.time_sanitizer.SyncWithShopfloor()
  self.time_synced = True
  return self.time_synced
1583
def log_disk_space_stats(self):
  '''Periodically logs disk usage and reports high stateful usage.

  Skipped in the chroot, when log_disk_space_period_secs is unset, or
  when the previous run was less than that many seconds ago.

  When stateful_usage_threshold is set and any of the byte/inode usage
  percentages of the partitions mounted on /usr/local or /var exceeds
  it, a 'stateful_partition_usage' event is logged, event logs are
  scanned, and the optional stateful_usage_above_threshold_action
  command is run.  The formatted usage message is logged only when it
  differs from the previously logged one (as a warning if above the
  threshold).  Any failure is logged and swallowed.
  '''
  if utils.in_chroot():
    return
  options = self.test_list.options
  period_secs = options.log_disk_space_period_secs
  if not period_secs:
    return

  now = time.time()
  last_time = self.last_log_disk_space_time
  if last_time and now - last_time < period_secs:
    return
  self.last_log_disk_space_time = now

  # Upload event if stateful partition usage is above threshold.
  # Stateful partition is mounted on /usr/local, while
  # encrypted stateful partition is mounted on /var.
  # If there are too many logs in the factory process,
  # these two partitions might get full.
  try:
    vfs_infos = disk_space.GetAllVFSInfo()
    stateful_info = None
    encrypted_info = None
    for info in vfs_infos.values():
      if '/usr/local' in info.mount_points:
        stateful_info = info
      if '/var' in info.mount_points:
        encrypted_info = info

    stateful = disk_space.GetPartitionUsage(stateful_info)
    encrypted = disk_space.GetPartitionUsage(encrypted_info)

    # Falsy (and so never "above") when no threshold is configured.
    above_threshold = (
        options.stateful_usage_threshold and
        max(stateful.bytes_used_pct,
            stateful.inodes_used_pct,
            encrypted.bytes_used_pct,
            encrypted.inodes_used_pct) >
        options.stateful_usage_threshold)

    if above_threshold:
      def usage_pcts(usage):
        # Two-digit usage percentages for one partition.
        return {
            'bytes_used_pct': FloatDigit(usage.bytes_used_pct, 2),
            'inodes_used_pct': FloatDigit(usage.inodes_used_pct, 2)}

      self.event_log.Log(
          'stateful_partition_usage',
          partitions={
              'stateful': usage_pcts(stateful),
              'encrypted_stateful': usage_pcts(encrypted)})
      self.log_watcher.ScanEventLogs()
      if (not utils.in_chroot() and
          options.stateful_usage_above_threshold_action):
        Spawn(options.stateful_usage_above_threshold_action, call=True)

    message = disk_space.FormatSpaceUsedAll(vfs_infos)
    if message != self.last_log_disk_space_message:
      log_message = logging.warning if above_threshold else logging.info
      log_message(message)
      self.last_log_disk_space_message = message
  except:  # pylint: disable=W0702
    logging.exception('Unable to get disk space used')
1646
def check_battery(self):
  '''Checks the current battery status.

  Skipped when check_battery_period_secs is unset or when the previous
  check was less than that many seconds ago.

  Builds a message with the battery charge level and AC charger state.
  If the level is not above critical_low_battery_pct, disks are synced
  (only while the level is still above MIN_BATTERY_LEVEL_FOR_DISK_SYNC).
  In that critical case, or when running without AC at or below
  warning_low_battery_pct, a 'low_battery' event is logged and the log
  watcher (and system log manager, if any) is kicked.  The message is
  logged only when it differs from the previously logged one.  Any
  failure is logged and swallowed.
  '''
  options = self.test_list.options
  period_secs = options.check_battery_period_secs
  if not period_secs:
    return

  now = time.time()
  last_time = self.last_check_battery_time
  if last_time and now - last_time < period_secs:
    return
  self.last_check_battery_time = now

  message = ''
  log_level = logging.INFO
  try:
    power = system.GetBoard().power
    if power.CheckBatteryPresent():
      ac_present = power.CheckACPresent()
      charge_pct = power.GetChargePct(get_float=True)
      charger_state = 'connected' if ac_present else 'disconnected'
      message = ('Current battery level %.1f%%, AC charger is %s' %
                 (charge_pct, charger_state))

      critical_low_battery = not (
          charge_pct > options.critical_low_battery_pct)
      if critical_low_battery:
        # Only sync disks when battery level is still above minimum
        # value. This can be used for offline analysis when shopfloor
        # cannot be connected.
        if charge_pct > MIN_BATTERY_LEVEL_FOR_DISK_SYNC:
          logging.warning('disk syncing for critical low battery situation')
          os.system('sync; sync; sync')
        else:
          logging.warning('disk syncing is cancelled '
                          'because battery level is lower than %.1f',
                          MIN_BATTERY_LEVEL_FOR_DISK_SYNC)

      # Notify shopfloor server
      if (critical_low_battery or
          (not ac_present and
           charge_pct <= options.warning_low_battery_pct)):
        log_level = logging.WARNING

        self.event_log.Log('low_battery',
                           battery_level=charge_pct,
                           charger_connected=ac_present,
                           critical=critical_low_battery)
        self.log_watcher.KickWatchThread()
        if self.system_log_manager:
          self.system_log_manager.KickSyncThread()
    else:
      message = 'Battery is not present'
  except:  # pylint: disable=W0702
    logging.exception('Unable to check battery or notify shopfloor')
  finally:
    # Avoid repeating the same status line on every check.
    if message != self.last_check_battery_message:
      logging.log(log_level, message)
      self.last_check_battery_message = message
1710
def check_core_dump(self):
  '''Checks for core dump files and reports them.

  Asks the core dump manager to scan for files.  If it returns any,
  and the last report was not within kick_sync_min_interval_secs, a
  'core_dumped' event is logged, the log watcher is kicked and, when a
  system log manager exists, it is kicked to sync the files with the
  core dump manager's ClearFiles passed as the callback.
  '''
  core_dump_files = self.core_dump_manager.ScanFiles()
  if not core_dump_files:
    return

  now = time.time()
  last_kick = self.last_kick_sync_time
  if (last_kick and
      now - last_kick < self.test_list.options.kick_sync_min_interval_secs):
    # Too soon after the previous kick.
    return
  self.last_kick_sync_time = now

  # Sends event to server
  self.event_log.Log('core_dumped', files=core_dump_files)
  self.log_watcher.KickWatchThread()

  # Syncs files to server
  log_manager = self.system_log_manager
  if log_manager:
    log_manager.KickSyncThread(
        core_dump_files, self.core_dump_manager.ClearFiles)
Cheng-Yi Chiangcdfa4182013-05-05 03:20:19 +08001734
def check_log_rotation(self):
  '''Makes the log-rotation pause file match the test list option.

  Touches CLEANUP_LOGS_PAUSED if test_list.options.disable_log_rotation
  is set, and deletes it otherwise.  Per the original author's note
  this has to happen in the idle loop because the autotest client
  touches the file each time it runs an autotest.  Does nothing in the
  chroot; failures are logged (without a trace) and swallowed.
  '''
  if utils.in_chroot():
    return
  try:
    if self.test_list.options.disable_log_rotation:
      # Create (or truncate) the file, i.e. "touch" it.
      with open(CLEANUP_LOGS_PAUSED, 'w'):
        pass
    else:
      file_utils.TryUnlink(CLEANUP_LOGS_PAUSED)
  except:  # pylint: disable=W0702
    # Oh well. Logs an error (but no trace)
    action = (
        'touch' if self.test_list.options.disable_log_rotation else 'delete')
    logging.info(
        'Unable to %s %s: %s',
        action, CLEANUP_LOGS_PAUSED, utils.FormatExceptionOnly())
1756
def sync_time_in_background(self):
  '''Saves the current time and tries a background shopfloor time sync.

  Does nothing without a time sanitizer.  Otherwise the current time
  is always saved; then, if _should_sync_time() agrees and the last
  attempt was not within sync_time_period_secs, a daemon thread is
  started that calls sync_time_with_shopfloor_server() and logs (but
  does not propagate) any failure.
  '''
  sanitizer = self.time_sanitizer
  if not sanitizer:
    return

  # Write out the current time.
  sanitizer.SaveTime()

  if not self._should_sync_time():
    return

  now = time.time()
  previous = self.last_sync_time
  if previous and (
      now - previous < self.test_list.options.sync_time_period_secs):
    # Not yet time for another check.
    return
  self.last_sync_time = now

  def sync_quietly():
    try:
      self.sync_time_with_shopfloor_server()
    except:  # pylint: disable=W0702
      # Oh well.  Log an error (but no trace)
      logging.info(
          'Unable to get time from shopfloor server: %s',
          utils.FormatExceptionOnly())

  worker = threading.Thread(target=sync_quietly)
  worker.daemon = True
  worker.start()
1788
def _run_queue_idle(self):
  '''Invoked when the run queue has no events.

  Runs the periodic housekeeping checks, but not more often than once
  every (RUN_QUEUE_TIMEOUT_SECS - 1) seconds.

  This method must not raise exception.
  '''
  now = time.time()
  previous = self.last_idle
  if previous and now < (previous + RUN_QUEUE_TIMEOUT_SECS - 1):
    # Ran too recently.
    return

  self.last_idle = now

  periodic_checks = (
      self.check_exclusive,
      self.check_for_updates,
      self.sync_time_in_background,
      self.log_disk_space_stats,
      self.check_battery,
      self.check_core_dump,
      self.check_log_rotation,
  )
  for periodic_check in periodic_checks:
    periodic_check()
Jon Salz57717ca2012-04-04 16:47:25 +08001810
def handle_event_logs(self, chunks):
  '''Callback for event watcher.

  Attempts to upload each chunk of event logs to the shopfloor server.
  A failed chunk does not stop the remaining ones from being tried.

  Args:
    chunks: A list of Chunk objects.

  Raises:
    Exception: if at least one upload failed; the message carries the
      failure count (when more than one) and the first failure.
  '''
  first_failure = None
  failure_count = 0

  for chunk in chunks:
    try:
      description = 'event logs (%s)' % str(chunk)
      start_time = time.time()
      shopfloor_client = shopfloor.get_instance(
          detect=True,
          timeout=self.test_list.options.shopfloor_timeout_secs)
      upload_name = chunk.log_name + "." + event_log.GetReimageId()
      shopfloor_client.UploadEvent(upload_name, Binary(chunk.chunk))
      logging.info(
          'Successfully synced %s in %.03f s',
          description, time.time() - start_time)
    except:  # pylint: disable=W0702
      # Only the first failure is described; later ones are just counted.
      if not first_failure:
        first_failure = chunk.log_name + ': ' + utils.FormatExceptionOnly()
      failure_count += 1

  if not failure_count:
    return

  if failure_count == 1:
    msg = 'Log upload failed: %s' % first_failure
  else:
    msg = '%d log upload failed; first is: %s' % (
        failure_count, first_failure)
  raise Exception(msg)
1847
Jon Salz57717ca2012-04-04 16:47:25 +08001848
def run_tests_with_status(self, statuses_to_run, starting_at=None,
                          root=None):
  '''Runs all top-level tests with a particular status.

  All active tests, plus any tests to re-run, are reset.

  Args:
    statuses_to_run: Collection of statuses; top-level tests whose
      current status is in it are run.
    starting_at: If provided, only auto-runs tests beginning with
      this test.
    root: Object whose get_top_level_tests() supplies the candidate
      tests; defaults to self.test_list.
  '''
  root = root or self.test_list

  if starting_at:
    # Make sure they passed a test, not a string.
    assert isinstance(starting_at, factory.FactoryTest)

  tests_to_reset = []
  tests_to_run = []

  # True while we are still skipping tests that precede starting_at.
  skipping = bool(starting_at)

  for test in root.get_top_level_tests():
    if skipping:
      if test == starting_at:
        # We've found starting_at; do auto-run on it and all
        # subsequent tests.
        skipping = False
      else:
        # Don't start this guy yet
        continue

    status = test.get_state().status
    should_run = status in statuses_to_run
    if should_run or status == TestState.ACTIVE:
      # Reset the test (later; we will need to abort
      # all active tests first).
      tests_to_reset.append(test)
    if should_run:
      tests_to_run.append(test)

  self.abort_active_tests('Operator requested run/re-run of certain tests')

  # Reset all statuses of the tests to run (in case any tests were active;
  # we want them to be run again).
  for subtree in tests_to_reset:
    for test in subtree.walk():
      test.update_state(status=TestState.UNTESTED)

  self.run_tests(tests_to_run, untested_only=True)
Jon Salz0405ab52012-03-16 15:26:52 +08001897
def restart_tests(self, root=None):
  '''Restarts all tests under root.

  Aborts the active tests, marks every test reached by root.walk() as
  untested, and then runs root.

  Args:
    root: The test (sub)tree to restart; defaults to self.test_list.
  '''
  if not root:
    root = self.test_list

  self.abort_active_tests('Operator requested restart of certain tests')
  for node in root.walk():
    node.update_state(status=TestState.UNTESTED)
  self.run_tests(root)
Hung-Te Lin96632362012-03-20 21:14:18 +08001906
def auto_run(self, starting_at=None, root=None):
  '''"Auto-runs" tests that have not been run yet.

  Delegates to run_tests_with_status() with the UNTESTED and ACTIVE
  statuses.

  Args:
    starting_at: If provided, only auto-runs tests beginning with
      this test.
    root: The test (sub)tree to consider; defaults to self.test_list.
  '''
  if not root:
    root = self.test_list
  statuses = [TestState.UNTESTED, TestState.ACTIVE]
  self.run_tests_with_status(statuses, starting_at=starting_at, root=root)
Jon Salz968e90b2012-03-18 16:12:43 +08001918
def re_run_failed(self, root=None):
  '''Re-runs failed tests.

  Delegates to run_tests_with_status() with the FAILED status.

  Args:
    root: The test (sub)tree to consider; defaults to self.test_list.
  '''
  if not root:
    root = self.test_list
  self.run_tests_with_status([TestState.FAILED], root=root)
Jon Salz57717ca2012-04-04 16:47:25 +08001923
def show_review_information(self):
  '''Event handler for showing the review information screen.

  Per the original author's note, the information screen itself is
  rendered by the main UI program (ui.py), so all Goofy has to do here
  is kill the active tests (passing False to kill_active_tests) and
  cancel the pending ones.
  '''
  # Stop whatever is running first, then drop what was queued behind it.
  self.kill_active_tests(False)
  self.cancel_pending_tests()
Jon Salz57717ca2012-04-04 16:47:25 +08001933
def handle_switch_test(self, event):
  '''Switches to a particular test.

  If the test is unknown, an error is logged and nothing else happens.
  If the test already has an invocation and is backgroundable, it is
  just made the visible test.  Otherwise the active tests are aborted,
  the test and everything under it is reset to untested, and it is
  run: via auto_run() starting at the test when the
  auto_run_on_keypress option is set, or on its own otherwise.

  Args:
    event: The SWITCH_TEST event; its path attribute names the test.
  '''
  test = self.test_list.lookup_path(event.path)
  if not test:
    # Report the path that was looked up.  (This used to read
    # event.key, an attribute this handler never otherwise uses, so an
    # unknown path could raise instead of being logged.)
    logging.error('Unknown test %r', event.path)
    return

  invoc = self.invocations.get(test)
  if invoc and test.backgroundable:
    # Already running: just bring to the front if it
    # has a UI.
    logging.info('Setting visible test to %s', test.path)
    self.set_visible_test(test)
    return

  self.abort_active_tests('Operator requested abort (switch_test)')
  for t in test.walk():
    t.update_state(status=TestState.UNTESTED)

  if self.test_list.options.auto_run_on_keypress:
    self.auto_run(starting_at=test)
  else:
    self.run_tests(test)
Jon Salz73e0fd02012-04-04 11:46:38 +08001960
def wait(self):
  '''Waits for all pending invocations.

  As long as self.invocations is non-empty, joins the thread of every
  invocation in it and then reaps the completed tests.

  Useful for testing.
  '''
  while self.invocations:
    for test, invocation in self.invocations.iteritems():
      logging.info('Waiting for %s to complete...', test)
      invocation.thread.join()
    # Reaping is what eventually empties self.invocations.
    self.reap_completed_tests()
Jon Salz0697cbf2012-07-04 15:14:04 +08001971
def check_exceptions(self):
  '''Raises an error if any exceptions have been recorded.

  Raises:
    RuntimeError: if self.exceptions is non-empty; the message
      includes the recorded exceptions.
  '''
  if not self.exceptions:
    return
  raise RuntimeError(
      'Exception in invocation thread: %r' % self.exceptions)
1978
def record_exception(self, msg):
  '''Records an exception so that it can be reported later.

  The message is appended to self.exceptions; check_exceptions()
  raises if anything has been recorded there.

  Args:
    msg: Description of the exception to remember.
  '''
  recorded = self.exceptions
  recorded.append(msg)
Jon Salz73e0fd02012-04-04 11:46:38 +08001985
Hung-Te Linf2f78f72012-02-08 19:27:11 +08001986
if __name__ == '__main__':
  # Script entry point: build a Goofy instance, run its main(), and
  # always destroy it afterwards.
  goofy = Goofy()
  try:
    goofy.main()
  except SystemExit:
    # Propagate SystemExit without logging.  This clause must stay ahead
    # of the bare "except" below, which would otherwise catch it too.
    raise
  except:
    # Log the error before trying to shut down (unless it's a graceful
    # exit).
    logging.exception('Error in main loop')
    raise
  finally:
    # Runs whether main() returned normally or raised.
    goofy.destroy()