Blame - server/cros/telemetry_runner.py - chromium.googlesource.com/chromiumos/platform/tauto

2013-01-29 13:13:43 -0800

[diff] [blame]

1

2

# Use of this source code is governed by a BSD-style license that can be

3

# found in the LICENSE file.

4

5

import logging

6

import os

Dennis Jeffrey

2013-04-17 11:57:51 -0700

[diff] [blame]

7

import pprint

Simran Basi

2013-01-29 13:13:43 -0800

[diff] [blame]

import re

import StringIO

import common

from autotest_lib.client.common_lib import error, utils

13

from autotest_lib.client.common_lib.cros import dev_server

14

15

Dave Tu

2013-11-05 15:54:48 -0800

[diff] [blame]

16

# Telemetry entry-point scripts. Each is joined onto the telemetry path
# returned by the devserver before being executed.
TELEMETRY_RUN_BENCHMARKS_SCRIPT = 'tools/perf/run_benchmark'
TELEMETRY_RUN_TESTS_SCRIPT = 'tools/telemetry/run_tests'
TELEMETRY_RUN_CROS_TESTS_SCRIPT = 'chrome/test/telemetry/run_cros_tests'
# Timeout for one telemetry invocation, in minutes (converted to seconds at
# the call site).
TELEMETRY_TIMEOUT_MINS = 60

# Result Statuses
SUCCESS_STATUS = 'SUCCESS'
WARNING_STATUS = 'WARNING'
FAILED_STATUS = 'FAILED'

# Regex for the RESULT output lines understood by chrome buildbot.
# Keep in sync with chromium/tools/build/scripts/slave/process_log_utils.py.
# Every fragment is a raw string so that the regex escapes (\d, \[, \{ ...)
# are not interpreted as (invalid) Python string escapes.
RESULTS_REGEX = re.compile(r'(?P<IMPORTANT>\*)?RESULT '
                           r'(?P<GRAPH>[^:]*): (?P<TRACE>[^=]*)= '
                           r'(?P<VALUE>[\{\[]?[-\d\., ]+[\}\]]?)('
                           r' ?(?P<UNITS>.+))?')

32

Simran Basi

2013-01-29 13:13:43 -0800

[diff] [blame]

33

34

class TelemetryResult(object):
    """Class to represent the results of a telemetry run.

    This class represents the results of a telemetry run, whether it ran
    successfully, failed or had warnings.
    """


    def __init__(self, exit_code=0, stdout='', stderr=''):
        """Initializes this TelemetryResult instance.

        @param exit_code: Exit code of the telemetry run. 0 is recorded as
                          SUCCESS_STATUS, anything else as FAILED_STATUS.
        @param stdout: Stdout of the telemetry run.
        @param stderr: Stderr of the telemetry run.
        """
        if exit_code == 0:
            self.status = SUCCESS_STATUS
        else:
            self.status = FAILED_STATUS

        # A list of perf values, e.g.
        # [{'graph': 'graphA', 'trace': 'page_load_time',
        #   'units': 'secs', 'value':0.5}, ...]
        self.perf_data = []
        self._stdout = stdout
        self._stderr = stderr
        self.output = '\n'.join([stdout, stderr])


    def _cleanup_perf_string(self, str):
        """Clean up a perf-related string by removing illegal characters.

        Perf keys stored in the chromeOS database may contain only letters,
        numbers, underscores, periods, and dashes.  Transform an inputted
        string so that any illegal characters are replaced by underscores.

        @param str: The perf string to clean up.

        @return The cleaned-up perf string.
        """
        return re.sub(r'[^\w.-]', '_', str)


    def _cleanup_units_string(self, units):
        """Cleanup a units string.

        Given a string representing units for a perf measurement, clean it up
        by replacing certain illegal characters with meaningful alternatives.
        Any other illegal characters should then be replaced with underscores.

        Examples:
            count/time -> count_per_time
            % -> percent
            units! --> units_
            score (bigger is better) -> score__bigger_is_better_
            score (runs/s) -> score__runs_per_s_

        @param units: The units string to clean up.

        @return The cleaned-up units string.
        """
        # str.replace is a no-op when the substring is absent, so no
        # membership checks are needed first.
        units = units.replace('%', 'percent').replace('/', '_per_')
        return self._cleanup_perf_string(units)


    @staticmethod
    def _parse_value(value):
        """Convert the VALUE field of a RESULT line into a number.

        @param value: The stripped VALUE text: a plain number ("6343",
                      "8.86528"), a list of samples ("[12,15,8,7,16]") or a
                      value with its standard deviation ("{34.2,2.15}").

        @return The mean for a list of samples, the first component for a
                value/deviation pair, an int for an all-digit string and a
                float otherwise.

        @raises ValueError: If any component cannot be parsed as a number.
        """
        if value.startswith('['):
            # A list of values, e.g., "[12,15,8,7,16]".  Extract just the
            # numbers, compute the average and use that.  In this example,
            # we'd get 12+15+8+7+16 / 5 --> 11.6.
            value_list = [float(x) for x in value.strip('[],').split(',')]
            return float(sum(value_list)) / len(value_list)
        if value.startswith('{'):
            # A single value along with a standard deviation, e.g.,
            # "{34.2,2.15}".  Extract just the value itself and use that.
            # In this example, we'd get 34.2.
            value_list = [float(x) for x in value.strip('{},').split(',')]
            return value_list[0]  # Position 0 is the value.
        if re.search(r'^\d+$', value):
            return int(value)
        return float(value)


    def parse_benchmark_results(self):
        """Parse the results of a telemetry benchmark run.

        Stdout has the output in RESULT block format below.

        The lines of interest start with the substring "RESULT".  These are
        specially-formatted perf data lines that are interpreted by chrome
        buildbot (when the Telemetry tests run for chrome desktop) and are
        parsed to extract perf data that can then be displayed on a perf
        dashboard.  This format is documented in the docstring of class
        GraphingLogProcessor in this file in the chrome tree:

        chromium/tools/build/scripts/slave/process_log_utils.py

        Example RESULT output lines:
        RESULT average_commit_time_by_url: http___www.ebay.com= 8.86528 ms
        RESULT CodeLoad: CodeLoad= 6343 score (bigger is better)
        RESULT ai-astar: ai-astar= [614,527,523,471,530,523,577,625,614,538] ms

        Each matching line is split into graph, trace, units and value.  The
        graph, trace and units strings are cleaned up so that they contain
        only letters, numbers, dashes, periods, and underscores, and the
        resulting dictionary is appended to self.perf_data.  A line whose
        value cannot be converted to a number is skipped with a warning
        rather than aborting the parse of the remaining lines.

        Stderr has the format of Warnings/Tracebacks.  There is always a
        default warning of the display environment setting, followed by
        warnings of page timeouts or a traceback.

        If the run did not exit successfully, it is flagged as a warning,
        unless stderr contains a traceback, in which case it is a failure.
        Empty stdout is always treated as a failure.
        """
        if not self._stdout:
            # Nothing in stdout implies a test failure.
            logging.error('No stdout, test failed.')
            self.status = FAILED_STATUS
            return

        for line in self._stdout.splitlines():
            results_match = RESULTS_REGEX.search(line)
            if not results_match:
                continue

            match_dict = results_match.groupdict()
            try:
                value = self._parse_value(match_dict['VALUE'].strip())
            except ValueError:
                # One malformed line must not discard every other perf
                # value of the run.
                logging.warning('Skipping RESULT line with unparseable '
                                'value: %s', line)
                continue

            graph_name = self._cleanup_perf_string(match_dict['GRAPH'].strip())
            trace_name = self._cleanup_perf_string(match_dict['TRACE'].strip())
            units = self._cleanup_units_string(
                    (match_dict['UNITS'] or 'units').strip())

            self.perf_data.append({'graph':graph_name, 'trace': trace_name,
                                   'units': units, 'value': value})

        pp = pprint.PrettyPrinter(indent=2)
        logging.debug('Perf values: %s', pp.pformat(self.perf_data))

        # Compare by value: identity of equal strings is not guaranteed.
        if self.status == SUCCESS_STATUS:
            return

        # Otherwise check if simply a Warning occurred or a Failure,
        # i.e. a Traceback is listed.
        self.status = WARNING_STATUS
        for line in self._stderr.splitlines():
            if line.startswith('Traceback'):
                self.status = FAILED_STATUS
                break

194

195

196

class TelemetryRunner(object):

197

"""Class responsible for telemetry for a given build.

198

199

This class will extract and install telemetry on the devserver and is

200

responsible for executing the telemetry benchmarks and returning their

201

output to the caller.

202

"""

203

204

def __init__(self, host):
    """Sets up a telemetry runner for the build running on |host|.

    Looks up the build of the host, resolves the devserver responsible for
    that build and asks it to set up telemetry, remembering the path the
    devserver reports back.

    @param host: Host object of the dut; must provide get_build() and a
                 hostname attribute.

    @raises error.AutotestError: If no build can be determined for the host.
    """
    self._host = host

    logging.debug('Grabbing build from AFE.')
    build_label = host.get_build()
    if not build_label:
        # Without a build there is nothing to fetch telemetry for.
        logging.error('Unable to locate build label for host: %s.',
                      host.hostname)
        failure = 'Failed to grab build for host %s.' % host.hostname
        raise error.AutotestError(failure)

    logging.debug('Setting up telemetry for build: %s', build_label)
    devserver = dev_server.ImageServer.resolve(build_label)
    self._devserver = devserver
    self._telemetry_path = devserver.setup_telemetry(build=build_label)
    logging.debug('Telemetry Path: %s', self._telemetry_path)

224

225

226

def _run_telemetry(self, script, test_or_benchmark):
    """Executes a telemetry script against the dut via the devserver.

    The script is launched with python over ssh on the devserver host and
    pointed at the dut through the --remote flag.

    @param script: Telemetry script we want to run. For example:
                   [path_to_telemetry_src]/src/tools/telemetry/run_tests
    @param test_or_benchmark: Name of the test or benchmark we want to run,
                              with the page_set (if required) as part of the
                              string.

    @returns A TelemetryResult Instance built from the exit code, stdout
             and stderr of this telemetry execution.
    """
    # The devserver url looks like http://<hostname>:<port>; keep only the
    # hostname part.
    url_without_scheme = self._devserver.url().split('http://')[1]
    devserver_hostname = url_without_scheme.split(':')[0]

    # TODO (sbasi crbug.com/239933) add support for incognito mode.
    command = ' '.join(['ssh',
                        devserver_hostname,
                        'python',
                        script,
                        '--browser=cros-chrome',
                        '--remote=%s' % self._host.hostname,
                        test_or_benchmark])
    logging.debug('Running Telemetry: %s', command)

    stdout_buffer = StringIO.StringIO()
    stderr_buffer = StringIO.StringIO()
    try:
        exit_code = utils.run(command,
                              stdout_tee=stdout_buffer,
                              stderr_tee=stderr_buffer,
                              timeout=TELEMETRY_TIMEOUT_MINS*60).exit_status
    except error.CmdError as e:
        # Telemetry returned a return code of not 0; for benchmarks this
        # can be due to a timeout on one of the pages of the page set and
        # we may still have data on the rest. For a test however this
        # indicates failure.
        logging.debug('Error occurred executing telemetry.')
        exit_code = e.result_obj.exit_status

    stdout = stdout_buffer.getvalue()
    stderr = stderr_buffer.getvalue()
    logging.debug('Telemetry completed with exit code: %d.\nstdout:%s\n'
                  'stderr:%s', exit_code, stdout, stderr)

    return TelemetryResult(exit_code=exit_code, stdout=stdout,
                           stderr=stderr)

Simran Basi

2013-05-02 10:11:02 -0700

[diff] [blame]

275

def _run_test(self, script, test):
    """Runs a telemetry test on a dut.

    @param script: Which telemetry test script we want to run. Can be
                   telemetry's base test script or the Chrome OS specific
                   test script. It is joined onto the telemetry path.
    @param test: Telemetry test we want to run.

    @returns A TelemetryResult Instance with the results of this telemetry
             execution.

    @raises error.TestFail: If the telemetry run reports a failed status.
    """
    logging.debug('Running telemetry test: %s', test)
    telemetry_script = os.path.join(self._telemetry_path, script)
    result = self._run_telemetry(telemetry_script, test)
    # Compare by value: identity of equal strings is not guaranteed.
    if result.status == FAILED_STATUS:
        # Format the message here; exceptions do not interpolate extra
        # positional arguments the way logging calls do.
        raise error.TestFail('Telemetry test: %s failed.' % test)
    return result

Simran Basi

2013-01-29 13:13:43 -0800

[diff] [blame]

295

def run_telemetry_test(self, test):
    """Runs |test| with telemetry's base test script on a dut.

    @param test: Telemetry test we want to run.

    @returns A TelemetryResult Instance with the results of this telemetry
             execution.
    """
    script = TELEMETRY_RUN_TESTS_SCRIPT
    return self._run_test(script, test)

304

305

306

def run_cros_telemetry_test(self, test):
    """Runs |test| with the Chrome OS specific telemetry test script.

    @param test: Telemetry test we want to run.

    @returns A TelemetryResult instance with the results of this telemetry
             execution.
    """
    script = TELEMETRY_RUN_CROS_TESTS_SCRIPT
    return self._run_test(script, test)

Simran Basi

2013-01-29 13:13:43 -0800

[diff] [blame]

315

316

Fang Deng

2013-11-13 18:27:06 -0800

[diff] [blame]

317

@staticmethod
def _output_perf_value(perf_value_writer, perf_data):
    """Output perf values to result dir.

    The perf values will be output to the result dir and
    be subsequently uploaded to perf dashboard.

    @param perf_value_writer: Should be an instance with the function
                              output_perf_value(), if None, no perf value
                              will be written. Typically this will be the
                              job object from an autotest test.
    @param perf_data: A list of perf values, each value is
                      a dictionary that looks like
                      {'graph':'GraphA', 'trace':'metric1',
                       'units':'secs', 'value':0.5}
    """
    # Honor the documented contract: without a writer there is nothing to
    # do, instead of failing with an AttributeError on None.
    if perf_value_writer is None:
        return

    for perf_value in perf_data:
        perf_value_writer.output_perf_value(
                description=perf_value['trace'],
                value=perf_value['value'],
                units=perf_value['units'],
                graph=perf_value['graph'])

339

340

341

def run_telemetry_benchmark(self, benchmark, perf_value_writer=None):

Simran Basi

2013-01-29 13:13:43 -0800

[diff] [blame]

342

"""Runs a telemetry benchmark on a dut.

343

344

@param benchmark: Benchmark we want to run.

Fang Deng

2013-11-13 18:27:06 -0800

[diff] [blame]

345

@param perf_value_writer: Should be an instance with the function

346

output_perf_value(), if None, no perf value

347

will be written. Typically this will be the

348

job object from an autotest test.

Simran Basi

2013-01-29 13:13:43 -0800

[diff] [blame]

349

350

@returns A TelemetryResult Instance with the results of this telemetry

351

execution.

352

"""

Dave Tu

2013-11-05 15:54:48 -0800

[diff] [blame]

353

logging.debug('Running telemetry benchmark: %s', benchmark)

Simran Basi

2013-01-29 13:13:43 -0800

[diff] [blame]

354

telemetry_script = os.path.join(self._telemetry_path,

355

TELEMETRY_RUN_BENCHMARKS_SCRIPT)

Dave Tu

2013-11-05 15:54:48 -0800

[diff] [blame]

356

result = self._run_telemetry(telemetry_script, benchmark)

Simran Basi

2013-01-29 13:13:43 -0800

[diff] [blame]

357

result.parse_benchmark_results()

358

Fang Deng

2013-11-13 18:27:06 -0800

[diff] [blame]

359

if perf_value_writer:

360

self._output_perf_value(perf_value_writer, result.perf_data)

Simran Basi

2013-01-29 13:13:43 -0800

[diff] [blame]

361

362

if result.status is WARNING_STATUS:

Dave Tu

2013-11-05 15:54:48 -0800

[diff] [blame]

363

raise error.TestWarn('Telemetry Benchmark: %s'

364

' exited with Warnings.' % benchmark)

Simran Basi

2013-01-29 13:13:43 -0800

[diff] [blame]

365

if result.status is FAILED_STATUS:

Dave Tu

2013-11-05 15:54:48 -0800

[diff] [blame]

366

raise error.TestFail('Telemetry Benchmark: %s'

367

' failed to run.' % benchmark)

Simran Basi