blob: 3fdc8bf6fabe0fa6c0d9314aae596658c30d39f7 [file] [log] [blame]
# Copyright (c) 2013 The Chromium OS Authors. All rights reserved.
# Use of this source code is governed by a BSD-style license that can be
# found in the LICENSE file.
4
5import logging
6import os
Dennis Jeffreyc42fd302013-04-17 11:57:51 -07007import pprint
Simran Basi833814b2013-01-29 13:13:43 -08008import re
9import StringIO
10
11import common
12from autotest_lib.client.common_lib import error, utils
13from autotest_lib.client.common_lib.cros import dev_server
14
15
# Telemetry entry-point scripts. Each path is joined onto the telemetry
# source root (TelemetryRunner._telemetry_path) before being executed.
TELEMETRY_RUN_BENCHMARKS_SCRIPT = 'tools/perf/run_benchmark'
TELEMETRY_RUN_TESTS_SCRIPT = 'tools/telemetry/run_tests'
TELEMETRY_RUN_CROS_TESTS_SCRIPT = 'chrome/test/telemetry/run_cros_tests'
# Upper bound for a single telemetry invocation; converted to seconds when
# it is handed to utils.run() as the timeout.
TELEMETRY_TIMEOUT_MINS = 60

# Result Statuses
SUCCESS_STATUS = 'SUCCESS'
WARNING_STATUS = 'WARNING'
FAILED_STATUS = 'FAILED'

# Regex for the RESULT output lines understood by chrome buildbot.
# Keep in sync with chromium/tools/build/scripts/slave/process_log_utils.py.
#
# Named groups:
#   IMPORTANT - optional leading '*'.
#   GRAPH     - text between 'RESULT ' and the first ': '.
#   TRACE     - text between ': ' and '= '.
#   VALUE     - a number, a '[..]' list or a '{..}' pair; may carry a
#               trailing space, so callers should strip() it.
#   UNITS     - optional remainder of the line.
#
# Every fragment is a raw string so the backslash escapes reach the regex
# engine untouched (non-raw '\d', '\[' ... are invalid string escapes in
# Python 3).
RESULTS_REGEX = re.compile(r'(?P<IMPORTANT>\*)?RESULT '
                           r'(?P<GRAPH>[^:]*): (?P<TRACE>[^=]*)= '
                           r'(?P<VALUE>[\{\[]?[-\d\., ]+[\}\]]?)('
                           r' ?(?P<UNITS>.+))?')
32
Simran Basi833814b2013-01-29 13:13:43 -080033
class TelemetryResult(object):
    """Class to represent the results of a telemetry run.

    This class represents the results of a telemetry run, whether it ran
    successfully, failed or had warnings.
    """


    def __init__(self, exit_code=0, stdout='', stderr=''):
        """Initializes this TelemetryResult instance.

        @param exit_code: Exit code of the telemetry run. 0 sets the status
                          to SUCCESS_STATUS, anything else to FAILED_STATUS.
        @param stdout: Stdout of the telemetry run.
        @param stderr: Stderr of the telemetry run.
        """
        if exit_code == 0:
            self.status = SUCCESS_STATUS
        else:
            self.status = FAILED_STATUS

        # A list of perf values, e.g.
        # [{'graph': 'graphA', 'trace': 'page_load_time',
        #   'units': 'secs', 'value':0.5}, ...]
        self.perf_data = []
        self._stdout = stdout
        self._stderr = stderr
        self.output = '\n'.join([stdout, stderr])


    def _cleanup_perf_string(self, str):
        """Clean up a perf-related string by removing illegal characters.

        Perf keys stored in the chromeOS database may contain only letters,
        numbers, underscores, periods, and dashes. Transform an inputted
        string so that any illegal characters are replaced by underscores.

        @param str: The perf string to clean up.

        @return The cleaned-up perf string.
        """
        # The allowed set is spelled out instead of using \w: on unicode
        # strings (always, under Python 3) \w also accepts non-ASCII letters
        # and digits, which are not legal in perf keys.
        return re.sub(r'[^A-Za-z0-9_.-]', '_', str)


    def _cleanup_units_string(self, units):
        """Cleanup a units string.

        Given a string representing units for a perf measurement, clean it up
        by replacing certain illegal characters with meaningful alternatives.
        Any other illegal characters should then be replaced with underscores.

        Examples:
            count/time -> count_per_time
            % -> percent
            units! --> units_
            score (bigger is better) -> score__bigger_is_better_
            score (runs/s) -> score__runs_per_s_

        @param units: The units string to clean up.

        @return The cleaned-up units string.
        """
        # str.replace() is a no-op when the character is absent, so no
        # membership test is needed first.
        units = units.replace('%', 'percent').replace('/', '_per_')
        return self._cleanup_perf_string(units)


    def _parse_perf_value(self, value):
        """Convert the VALUE component of a RESULT line into a number.

        @param value: The stripped VALUE string, e.g. "6343", "8.86528",
                      "[12,15,8,7,16]" or "{34.2,2.15}".

        @return An int when the string is a plain run of digits, otherwise a
                float. A bracketed list yields the average of its entries; a
                braced pair yields its first entry.

        @raises ValueError: If a numeric component cannot be parsed.
        """
        if value.startswith('['):
            # A list of values, e.g., "[12,15,8,7,16]". Extract just the
            # numbers, compute the average and use that. In this example,
            # we'd get 12+15+8+7+16 / 5 --> 11.6.
            value_list = [float(x) for x in value.strip('[],').split(',')]
            return sum(value_list) / len(value_list)
        if value.startswith('{'):
            # A single value along with a standard deviation, e.g.,
            # "{34.2,2.15}". Extract just the value itself and use that.
            # In this example, we'd get 34.2.
            value_list = [float(x) for x in value.strip('{},').split(',')]
            return value_list[0]  # Position 0 is the value.
        if re.search(r'^\d+$', value):
            return int(value)
        return float(value)


    def parse_benchmark_results(self):
        """Parse the results of a telemetry benchmark run.

        Stdout has the output in RESULT block format below.

        The lines of interest start with the substring "RESULT". These are
        specially-formatted perf data lines that are interpreted by chrome
        buildbot (when the Telemetry tests run for chrome desktop) and are
        parsed to extract perf data that can then be displayed on a perf
        dashboard. This format is documented in the docstring of class
        GraphingLogProcessor in this file in the chrome tree:

        chromium/tools/build/scripts/slave/process_log_utils.py

        Example RESULT output lines:
        RESULT average_commit_time_by_url: http___www.ebay.com= 8.86528 ms
        RESULT CodeLoad: CodeLoad= 6343 score (bigger is better)
        RESULT ai-astar: ai-astar= [614,527,523,471,530,523,577,625,614,538] ms

        Each RESULT line is split into its graph, trace, value and units
        components. The graph, trace and units strings are cleaned up so
        that they contain only letters, numbers, dashes, periods and
        underscores, and one dictionary per line is appended to
        self.perf_data:

        {'graph': ..., 'trace': ..., 'units': ..., 'value': ...}

        A line without units gets the placeholder 'units'. A RESULT line
        whose value cannot be converted to a number is logged and skipped,
        so that a single malformed line does not discard the remaining data.

        Status handling:
        - Empty stdout marks the run as FAILED_STATUS.
        - A run that already has SUCCESS_STATUS (exit code 0) keeps it;
          stderr is not inspected in that case.
        - Otherwise the run is FAILED_STATUS if any stderr line starts with
          'Traceback', and WARNING_STATUS if none does.
        """
        if not self._stdout:
            # Nothing in stdout implies a test failure.
            logging.error('No stdout, test failed.')
            self.status = FAILED_STATUS
            return

        for line in self._stdout.splitlines():
            results_match = RESULTS_REGEX.search(line)
            if not results_match:
                continue

            match_dict = results_match.groupdict()
            raw_value = match_dict['VALUE'].strip()
            try:
                value = self._parse_perf_value(raw_value)
            except ValueError:
                # The regex accepts some strings that are not numbers (e.g.
                # "[ ]" or "1 2"); drop just this line rather than aborting.
                logging.warning('Skipping RESULT line with unparsable value '
                                '%r: %s', raw_value, line)
                continue

            graph_name = self._cleanup_perf_string(match_dict['GRAPH'].strip())
            trace_name = self._cleanup_perf_string(match_dict['TRACE'].strip())
            units = self._cleanup_units_string(
                    (match_dict['UNITS'] or 'units').strip())

            self.perf_data.append({'graph':graph_name, 'trace': trace_name,
                                   'units': units, 'value': value})

        logging.debug('Perf values: %s',
                      pprint.pformat(self.perf_data, indent=2))

        # Compare by value: identity ("is") only holds when both sides happen
        # to be the very same string object.
        if self.status == SUCCESS_STATUS:
            return

        # Otherwise check if simply a Warning occurred or a Failure,
        # i.e. a Traceback is listed.
        has_traceback = any(stderr_line.startswith('Traceback')
                            for stderr_line in self._stderr.splitlines())
        self.status = FAILED_STATUS if has_traceback else WARNING_STATUS
194
195
class TelemetryRunner(object):
    """Class responsible for telemetry for a given build.

    This class will extract and install telemetry on the devserver and is
    responsible for executing the telemetry benchmarks and returning their
    output to the caller.
    """

    def __init__(self, host, local=False):
        """Initializes this telemetry runner instance.

        If telemetry is not installed for this build, it will be.

        @param host: Host where the test will be run.
        @param local: If set, no devserver will be used, test will be run
                      locally.
        """
        self._host = host

        # TODO (llozano crbug.com/324964). Remove conditional code.
        # Use a class hierarchy instead.
        if local:
            self._setup_local_telemetry()
        else:
            self._setup_devserver_telemetry()

        logging.debug('Telemetry Path: %s', self._telemetry_path)


    def _setup_devserver_telemetry(self):
        """Setup Telemetry to use the devserver.

        Sets self._devserver and self._telemetry_path.

        @raises error.AutotestError: If the host reports no build.
        """
        logging.debug('Setting up telemetry for devserver testing')
        logging.debug('Grabbing build from AFE.')

        build = self._host.get_build()
        if not build:
            logging.error('Unable to locate build label for host: %s.',
                          self._host.hostname)
            raise error.AutotestError('Failed to grab build for host %s.' %
                                      self._host.hostname)

        logging.debug('Setting up telemetry for build: %s', build)

        self._devserver = dev_server.ImageServer.resolve(build)
        self._telemetry_path = self._devserver.setup_telemetry(build=build)


    def _setup_local_telemetry(self):
        """Setup Telemetry to use local path to its sources.

        Candidate chrome source roots are probed in this order and the first
        one that exists wins:
          1. $CHROME_ROOT, when that environment variable is set.
          2. ~/chrome_root/chrome-src-internal, ~/chrome_root/chrome-src.
          3. chrome-src-internal, then chrome-src, under
             /var/cache/chromeos-cache/distfiles/target/.

        Sets self._telemetry_path to the 'src' directory below the chosen
        root and self._devserver to None.

        @raises error.TestError: If none of the candidates exists.
        """
        TELEMETRY_DIR = 'src'
        CHROME_LOCAL_SRC = '/var/cache/chromeos-cache/distfiles/target/'
        # os.path.exists() does not expand '~', so resolve the home directory
        # up front; otherwise these candidates could never match.
        CHROME_EXTERNAL_SRC = os.path.expanduser('~/chrome_root/')

        logging.debug('Setting up telemetry for local testing')

        sources_list = ('chrome-src-internal', 'chrome-src')
        dir_list = [os.path.join(CHROME_EXTERNAL_SRC, x) for x in sources_list]
        dir_list.extend(
                [os.path.join(CHROME_LOCAL_SRC, x) for x in sources_list])
        if 'CHROME_ROOT' in os.environ:
            dir_list.insert(0, os.environ['CHROME_ROOT'])

        for candidate in dir_list:
            if os.path.exists(candidate):
                telemetry_src = os.path.join(candidate, TELEMETRY_DIR)
                break
        else:
            raise error.TestError('Telemetry source directory not found.')

        self._devserver = None
        self._telemetry_path = telemetry_src


    def _get_telemetry_cmd(self, script, test_or_benchmark):
        """Build command to execute telemetry based on script and benchmark.

        When a devserver is in use the command is prefixed with
        'ssh <devserver hostname>'.

        @param script: Telemetry script we want to run. For example:
                       [path_to_telemetry_src]/src/tools/telemetry/run_tests.
        @param test_or_benchmark: Name of the test or benchmark we want to run,
                                  with the page_set (if required) as part of
                                  the string.
        @returns Full telemetry command to execute the script, as a list of
                 arguments.
        """
        telemetry_cmd = []
        if self._devserver:
            # Reduce the devserver URL to its bare hostname: drop the scheme
            # (whatever it is), then any path, then the port. Splitting on a
            # literal 'http://' would raise IndexError for https URLs.
            netloc = self._devserver.url().split('://', 1)[-1].split('/', 1)[0]
            devserver_hostname = netloc.split(':', 1)[0]
            telemetry_cmd.extend(['ssh', devserver_hostname])

        telemetry_cmd.extend(
                ['python',
                 script,
                 '--browser=cros-chrome',
                 '--remote=%s' % self._host.hostname,
                 test_or_benchmark])
        return telemetry_cmd


    def _run_telemetry(self, script, test_or_benchmark):
        """Runs telemetry on a dut.

        @param script: Telemetry script we want to run. For example:
                       [path_to_telemetry_src]/src/tools/telemetry/run_tests.
        @param test_or_benchmark: Name of the test or benchmark we want to run,
                                 with the page_set (if required) as part of the
                                 string.

        @returns A TelemetryResult Instance with the results of this telemetry
                 execution.
        """
        # TODO (sbasi crbug.com/239933) add support for incognito mode.

        telemetry_cmd = self._get_telemetry_cmd(script, test_or_benchmark)
        logging.debug('Running Telemetry: %s', ' '.join(telemetry_cmd))

        output = StringIO.StringIO()
        error_output = StringIO.StringIO()
        exit_code = 0
        try:
            result = utils.run(' '.join(telemetry_cmd), stdout_tee=output,
                               stderr_tee=error_output,
                               timeout=TELEMETRY_TIMEOUT_MINS*60)
            exit_code = result.exit_status
        except error.CmdError as e:
            # Telemetry returned a return code of not 0; for benchmarks this
            # can be due to a timeout on one of the pages of the page set and
            # we may still have data on the rest. For a test however this
            # indicates failure.
            logging.debug('Error occurred executing telemetry.')
            exit_code = e.result_obj.exit_status

        stdout = output.getvalue()
        stderr = error_output.getvalue()
        logging.debug('Telemetry completed with exit code: %d.\nstdout:%s\n'
                      'stderr:%s', exit_code, stdout, stderr)

        return TelemetryResult(exit_code=exit_code, stdout=stdout,
                               stderr=stderr)


    def _run_test(self, script, test):
        """Runs a telemetry test on a dut.

        @param script: Which telemetry test script we want to run. Can be
                       telemetry's base test script or the Chrome OS specific
                       test script.
        @param test: Telemetry test we want to run.

        @returns A TelemetryResult Instance with the results of this telemetry
                 execution.

        @raises error.TestFail: If the run ends with FAILED_STATUS.
        """
        logging.debug('Running telemetry test: %s', test)
        telemetry_script = os.path.join(self._telemetry_path, script)
        result = self._run_telemetry(telemetry_script, test)
        if result.status == FAILED_STATUS:
            # Format the message here: exception constructors, unlike the
            # logging calls, do not interpolate extra arguments.
            raise error.TestFail('Telemetry test: %s failed.' % test)
        return result


    def run_telemetry_test(self, test):
        """Runs a telemetry test on a dut.

        @param test: Telemetry test we want to run.

        @returns A TelemetryResult Instance with the results of this telemetry
                 execution.
        """
        return self._run_test(TELEMETRY_RUN_TESTS_SCRIPT, test)


    def run_cros_telemetry_test(self, test):
        """Runs a cros specific telemetry test on a dut.

        @param test: Telemetry test we want to run.

        @returns A TelemetryResult instance with the results of this telemetry
                 execution.
        """
        return self._run_test(TELEMETRY_RUN_CROS_TESTS_SCRIPT, test)


    @staticmethod
    def _output_perf_value(perf_value_writer, perf_data):
        """Output perf values to result dir.

        The perf values will be output to the result dir and
        be subsequently uploaded to perf dashboard.

        @param perf_value_writer: Should be an instance with the function
                                  output_perf_value(), if None, no perf value
                                  will be written. Typically this will be the
                                  job object from an autotest test.
        @param perf_data: A list of perf values, each value is
                          a dictionary that looks like
                          {'graph':'GraphA', 'trace':'metric1',
                           'units':'secs', 'value':0.5}
        """
        # Honour the documented "None means write nothing" contract here as
        # well, instead of relying on every caller to check first.
        if not perf_value_writer:
            return

        for perf_value in perf_data:
            perf_value_writer.output_perf_value(
                    description=perf_value['trace'],
                    value=perf_value['value'],
                    units=perf_value['units'],
                    graph=perf_value['graph'])


    def run_telemetry_benchmark(self, benchmark, perf_value_writer=None):
        """Runs a telemetry benchmark on a dut.

        Parsed perf values are handed to perf_value_writer before the final
        status is checked, so they are written even when the run ends with a
        warning or a failure.

        @param benchmark: Benchmark we want to run.
        @param perf_value_writer: Should be an instance with the function
                                  output_perf_value(), if None, no perf value
                                  will be written. Typically this will be the
                                  job object from an autotest test.

        @returns A TelemetryResult Instance with the results of this telemetry
                 execution.

        @raises error.TestWarn: If the run ends with WARNING_STATUS.
        @raises error.TestFail: If the run ends with FAILED_STATUS.
        """
        logging.debug('Running telemetry benchmark: %s', benchmark)
        telemetry_script = os.path.join(self._telemetry_path,
                                        TELEMETRY_RUN_BENCHMARKS_SCRIPT)
        result = self._run_telemetry(telemetry_script, benchmark)
        result.parse_benchmark_results()

        if perf_value_writer:
            self._output_perf_value(perf_value_writer, result.perf_data)

        # Statuses are plain strings; compare by value, not identity.
        if result.status == WARNING_STATUS:
            raise error.TestWarn('Telemetry Benchmark: %s'
                                 ' exited with Warnings.' % benchmark)
        if result.status == FAILED_STATUS:
            raise error.TestFail('Telemetry Benchmark: %s'
                                 ' failed to run.' % benchmark)

        return result
435 return result