Blame - server/cros/telemetry_runner.py - chromium.googlesource.com/chromiumos/platform/tauto

2013-01-29 13:13:43 -0800

[diff] [blame]

1

2

# Use of this source code is governed by a BSD-style license that can be

3

# found in the LICENSE file.

4

5

import logging

6

import os

Dennis Jeffrey

2013-04-17 11:57:51 -0700

[diff] [blame]

7

import pprint

Simran Basi

2013-01-29 13:13:43 -0800

[diff] [blame]

import re

import StringIO

import common

from autotest_lib.client.common_lib import error, utils

13

from autotest_lib.client.common_lib.cros import dev_server

14

15

Dave Tu

2013-11-05 15:54:48 -0800

[diff] [blame]

16

# Telemetry entry-point scripts, relative to the telemetry source root.
TELEMETRY_RUN_BENCHMARKS_SCRIPT = 'tools/perf/run_benchmark'
TELEMETRY_RUN_TESTS_SCRIPT = 'tools/telemetry/run_tests'
TELEMETRY_RUN_CROS_TESTS_SCRIPT = 'chrome/test/telemetry/run_cros_tests'
# Upper bound on a single telemetry invocation, in minutes.
TELEMETRY_TIMEOUT_MINS = 60

# Result Statuses
SUCCESS_STATUS = 'SUCCESS'
WARNING_STATUS = 'WARNING'
FAILED_STATUS = 'FAILED'

# Regex for the RESULT output lines understood by chrome buildbot.
# Keep in sync with chromium/tools/build/scripts/slave/process_log_utils.py.
# Every fragment is a raw string so that the regex escapes (\d, \., \[ ...)
# are never interpreted as (invalid) Python string escapes.
RESULTS_REGEX = re.compile(r'(?P<IMPORTANT>\*)?RESULT '
                           r'(?P<GRAPH>[^:]*): (?P<TRACE>[^=]*)= '
                           r'(?P<VALUE>[\{\[]?[-\d\., ]+[\}\]]?)('
                           r' ?(?P<UNITS>.+))?')

32

Simran Basi

2013-01-29 13:13:43 -0800

[diff] [blame]

33

34

class TelemetryResult(object):
    """Class to represent the results of a telemetry run.

    This class represents the results of a telemetry run, whether it ran
    successful, failed or had warnings.
    """


    def __init__(self, exit_code=0, stdout='', stderr=''):
        """Initializes this TelemetryResultObject instance.

        @param exit_code: Exit code of the telemetry run. 0 is recorded as
                          SUCCESS_STATUS, anything else as FAILED_STATUS.
        @param stdout: Stdout of the telemetry run.
        @param stderr: Stderr of the telemetry run.
        """
        if exit_code == 0:
            self.status = SUCCESS_STATUS
        else:
            self.status = FAILED_STATUS

        # A list of perf values, e.g.
        # [{'graph': 'graphA', 'trace': 'page_load_time',
        #   'units': 'secs', 'value':0.5}, ...]
        self.perf_data = []
        self._stdout = stdout
        self._stderr = stderr
        self.output = '\n'.join([stdout, stderr])


    def _cleanup_perf_string(self, str):
        """Clean up a perf-related string by removing illegal characters.

        Perf keys stored in the chromeOS database may contain only letters,
        numbers, underscores, periods, and dashes.  Transform an inputted
        string so that any illegal characters are replaced by underscores.

        @param str: The perf string to clean up.

        @return The cleaned-up perf string.
        """
        return re.sub(r'[^\w.-]', '_', str)


    def _cleanup_units_string(self, units):
        """Cleanup a units string.

        Given a string representing units for a perf measurement, clean it up
        by replacing certain illegal characters with meaningful alternatives.
        Any other illegal characters should then be replaced with underscores.

        Examples:
            count/time -> count_per_time
            % -> percent
            units! --> units_
            score (bigger is better) -> score__bigger_is_better_
            score (runs/s) -> score__runs_per_s_

        @param units: The units string to clean up.

        @return The cleaned-up units string.
        """
        units = units.replace('%', 'percent').replace('/', '_per_')
        return self._cleanup_perf_string(units)


    @staticmethod
    def _parse_perf_value(value):
        """Convert the VALUE field of a RESULT line into a number.

        @param value: Stripped VALUE text, in one of three forms:
                      "[12,15,8]"   a list of samples -> their average;
                      "{34.2,2.15}" value and std deviation -> the value;
                      "6343" / "8.86" a plain number -> int or float.

        @return The parsed int or float.

        @raises ValueError: If any component is not a valid number.
        """
        if value.startswith('['):
            # E.g. "[12,15,8,7,16]" --> (12+15+8+7+16) / 5 --> 11.6.
            samples = [float(x) for x in value.strip('[],').split(',')]
            return float(sum(samples)) / len(samples)
        if value.startswith('{'):
            # E.g. "{34.2,2.15}" --> 34.2; position 0 is the value.
            fields = [float(x) for x in value.strip('{},').split(',')]
            return fields[0]
        if re.search(r'^\d+$', value):
            return int(value)
        return float(value)


    def parse_benchmark_results(self):
        """Parse the results of a telemetry benchmark run.

        Stdout has the output in RESULT block format below.

        The lines of interest start with the substring "RESULT".  These are
        specially-formatted perf data lines that are interpreted by chrome
        buildbot (when the Telemetry tests run for chrome desktop) and are
        parsed to extract perf data that can then be displayed on a perf
        dashboard.  This format is documented in the docstring of class
        GraphingLogProcessor in this file in the chrome tree:

        chromium/tools/build/scripts/slave/process_log_utils.py

        Example RESULT output lines:
        RESULT average_commit_time_by_url: http___www.ebay.com= 8.86528 ms
        RESULT CodeLoad: CodeLoad= 6343 score (bigger is better)
        RESULT ai-astar: ai-astar= [614,527,523,471,530,523,577,625,614,538] ms

        Each matching line is appended to self.perf_data as a dictionary with
        the keys 'graph', 'trace', 'units' and 'value'.  The graph, trace and
        units strings are cleaned up so that they only contain letters,
        numbers, dashes, periods, and underscores.  A matching line whose
        value cannot be converted to a number is logged and skipped.

        Stderr has the format of Warnings/Tracebacks.  When the run did not
        exit successfully, the status becomes FAILED_STATUS if any stderr line
        starts with "Traceback" and WARNING_STATUS otherwise.  Empty stdout is
        always treated as a failure.
        """
        if not self._stdout:
            # Nothing in stdout implies a test failure.
            logging.error('No stdout, test failed.')
            self.status = FAILED_STATUS
            return

        for line in self._stdout.splitlines():
            results_match = RESULTS_REGEX.search(line)
            if not results_match:
                continue

            match_dict = results_match.groupdict()
            graph_name = self._cleanup_perf_string(match_dict['GRAPH'].strip())
            trace_name = self._cleanup_perf_string(match_dict['TRACE'].strip())
            units = self._cleanup_units_string(
                    (match_dict['UNITS'] or 'units').strip())
            try:
                value = self._parse_perf_value(match_dict['VALUE'].strip())
            except ValueError:
                # RESULTS_REGEX accepts any run of digits/dots/dashes/commas,
                # so e.g. "-" or "[ ]" can match without being a number.
                # One bad line should not discard the remaining perf data.
                logging.warning('Skipping RESULT line with unparseable '
                                'value: %s', line)
                continue

            self.perf_data.append({'graph':graph_name, 'trace': trace_name,
                                   'units': units, 'value': value})

        pp = pprint.PrettyPrinter(indent=2)
        logging.debug('Perf values: %s', pp.pformat(self.perf_data))

        # Compare by value: identity of equal strings is not guaranteed.
        if self.status == SUCCESS_STATUS:
            return

        # Otherwise check if simply a Warning occurred or a Failure,
        # i.e. a Traceback is listed.
        if any(line.startswith('Traceback')
               for line in self._stderr.splitlines()):
            self.status = FAILED_STATUS
        else:
            self.status = WARNING_STATUS

194

195

196

class TelemetryRunner(object):

197

"""Class responsible for telemetry for a given build.

198

199

This class will extract and install telemetry on the devserver and is

200

responsible for executing the telemetry benchmarks and returning their

201

output to the caller.

202

"""

203

Luis Lozano

2013-11-08 16:22:46 -0800

[diff] [blame]

204

def __init__(self, host, local=False):
    """Create a telemetry runner bound to |host|.

    Stores the host and runs exactly one of the two setup routines: the
    local one when |local| is set, the devserver one otherwise.  The
    resulting telemetry path is then logged.

    @param host: Host where the test will be run.
    @param local: If set, no devserver will be used, test will be run
                  locally.
    """
    self._host = host

    # TODO (llozano crbug.com/324964). Remove conditional code.
    # Use a class hierarchy instead.
    prepare = (self._setup_local_telemetry if local
               else self._setup_devserver_telemetry)
    prepare()

    logging.debug('Telemetry Path: %s', self._telemetry_path)

223

224

225

def _setup_devserver_telemetry(self):
    """Setup Telemetry to use the devserver.

    Asks the host for its build, resolves a devserver for that build and
    has it set up telemetry.  The devserver and the path it returns are
    stored on this instance.

    @raises error.AutotestError: If the host does not report a build.
    """
    logging.debug('Setting up telemetry for devserver testing')
    logging.debug('Grabbing build from AFE.')

    build = self._host.get_build()
    if build:
        logging.debug('Setting up telemetry for build: %s', build)

        devserver = dev_server.ImageServer.resolve(build)
        self._devserver = devserver
        self._telemetry_path = devserver.setup_telemetry(build=build)
        return

    # No build label: nothing can be staged, so report and bail out.
    logging.error('Unable to locate build label for host: %s.',
                  self._host.hostname)
    raise error.AutotestError('Failed to grab build for host %s.' %
                              self._host.hostname)

Luis Lozano

2013-11-08 16:22:46 -0800

[diff] [blame]

241

242

243

def _setup_local_telemetry(self):
    """Setup Telemetry to use local path to its sources.

    First look for chrome source root, either externally mounted, or inside
    the chroot. Prefer chrome-src-internal source tree to chrome-src.  A
    CHROME_ROOT environment variable, when present, is tried before both.

    Every candidate is passed through os.path.expanduser() before it is
    checked: os.path.exists() does not expand '~' on its own, so without
    this the '~/chrome_root/' location could never be found.

    On success self._devserver is set to None and self._telemetry_path to
    the 'src' directory below the first candidate that exists.

    @raises error.TestError: If none of the candidate directories exists.
    """
    TELEMETRY_DIR = 'src'
    CHROME_LOCAL_SRC = '/var/cache/chromeos-cache/distfiles/target/'
    CHROME_EXTERNAL_SRC = '~/chrome_root/'

    logging.debug('Setting up telemetry for local testing')

    sources_list = ('chrome-src-internal', 'chrome-src')
    dir_list = [os.path.join(CHROME_EXTERNAL_SRC, x) for x in sources_list]
    dir_list.extend(
            [os.path.join(CHROME_LOCAL_SRC, x) for x in sources_list])
    if 'CHROME_ROOT' in os.environ:
        dir_list.insert(0, os.environ['CHROME_ROOT'])

    for candidate in dir_list:
        candidate = os.path.expanduser(candidate)
        if os.path.exists(candidate):
            telemetry_src = os.path.join(candidate, TELEMETRY_DIR)
            break
    else:
        raise error.TestError('Telemetry source directory not found.')

    self._devserver = None
    self._telemetry_path = telemetry_src

272

273

274

def _get_telemetry_cmd(self, script, test_or_benchmark):
    """Build command to execute telemetry based on script and benchmark.

    When a devserver is in use the command is prefixed with
    'ssh <devserver hostname>'; otherwise the python invocation is returned
    on its own.

    @param script: Telemetry script we want to run. For example:
                   [path_to_telemetry_src]/src/tools/telemetry/run_tests.
    @param test_or_benchmark: Name of the test or benchmark we want to run,
                              with the page_set (if required) as part of
                              the string.
    @returns Full telemetry command to execute the script, as a list of
             arguments.
    """
    telemetry_cmd = []
    if self._devserver:
        # Reduce the devserver URL to its bare hostname.  Dropping an
        # optional '<scheme>://' prefix, any path and any ':port' suffix
        # also copes with https or scheme-less URLs, which a plain
        # split('http://')[1] would reject with an IndexError.
        netloc = self._devserver.url().split('://', 1)[-1].split('/', 1)[0]
        devserver_hostname = netloc.split(':', 1)[0]
        telemetry_cmd.extend(['ssh', devserver_hostname])

    telemetry_cmd.extend(
            ['python',
             script,
             '--browser=cros-chrome',
             '--remote=%s' % self._host.hostname,
             test_or_benchmark])
    return telemetry_cmd

Simran Basi

2013-01-29 13:13:43 -0800

[diff] [blame]

297

298

299

def _run_telemetry(self, script, test_or_benchmark):
    """Runs telemetry on a dut.

    Builds the telemetry command, runs it through utils.run() while
    capturing stdout and stderr, and wraps exit code and captured output
    in a TelemetryResult.  A non-zero exit (error.CmdError) is not
    propagated; its exit status is recorded in the result instead.

    @param script: Telemetry script we want to run. For example:
                   [path_to_telemetry_src]/src/tools/telemetry/run_tests.
    @param test_or_benchmark: Name of the test or benchmark we want to run,
                             with the page_set (if required) as part of the
                             string.

    @returns A TelemetryResult Instance with the results of this telemetry
             execution.
    """
    # TODO (sbasi crbug.com/239933) add support for incognito mode.

    command_line = ' '.join(self._get_telemetry_cmd(script,
                                                    test_or_benchmark))
    logging.debug('Running Telemetry: %s', command_line)

    stdout_buffer = StringIO.StringIO()
    stderr_buffer = StringIO.StringIO()
    try:
        run_result = utils.run(command_line, stdout_tee=stdout_buffer,
                               stderr_tee=stderr_buffer,
                               timeout=TELEMETRY_TIMEOUT_MINS*60)
    except error.CmdError as cmd_error:
        # Telemetry returned a return code of not 0; for benchmarks this
        # can be due to a timeout on one of the pages of the page set and
        # we may still have data on the rest. For a test however this
        # indicates failure.
        logging.debug('Error occurred executing telemetry.')
        exit_code = cmd_error.result_obj.exit_status
    else:
        exit_code = run_result.exit_status

    stdout = stdout_buffer.getvalue()
    stderr = stderr_buffer.getvalue()
    logging.debug('Telemetry completed with exit code: %d.\nstdout:%s\n'
                  'stderr:%s', exit_code, stdout, stderr)

    return TelemetryResult(exit_code=exit_code, stdout=stdout,
                           stderr=stderr)

Simran Basi

2013-05-02 10:11:02 -0700

[diff] [blame]

341

def _run_test(self, script, test):
    """Runs a telemetry test on a dut.

    @param script: Which telemetry test script we want to run. Can be
                   telemetry's base test script or the Chrome OS specific
                   test script.  Joined onto self._telemetry_path.
    @param test: Telemetry test we want to run.

    @returns A TelemetryResult Instance with the results of this telemetry
             execution.

    @raises error.TestFail: If the run finished with FAILED_STATUS.
    """
    logging.debug('Running telemetry test: %s', test)
    telemetry_script = os.path.join(self._telemetry_path, script)
    result = self._run_telemetry(telemetry_script, test)
    # Compare by value; identity of equal strings is not guaranteed.
    if result.status == FAILED_STATUS:
        # Format the message here: passing |test| as a second exception
        # argument would leave the '%s' placeholder unexpanded.
        raise error.TestFail('Telemetry test: %s failed.' % test)
    return result

Simran Basi

2013-01-29 13:13:43 -0800

[diff] [blame]

361

def run_telemetry_test(self, test):
    """Runs a telemetry test on a dut.

    Delegates to _run_test() with telemetry's base test script
    (TELEMETRY_RUN_TESTS_SCRIPT).

    @param test: Telemetry test we want to run.

    @returns A TelemetryResult Instance with the results of this telemetry
             execution.
    """
    script = TELEMETRY_RUN_TESTS_SCRIPT
    return self._run_test(script, test)

370

371

372

def run_cros_telemetry_test(self, test):
    """Runs a cros specific telemetry test on a dut.

    Delegates to _run_test() with the Chrome OS specific test script
    (TELEMETRY_RUN_CROS_TESTS_SCRIPT).

    @param test: Telemetry test we want to run.

    @returns A TelemetryResult instance with the results of this telemetry
             execution.
    """
    script = TELEMETRY_RUN_CROS_TESTS_SCRIPT
    return self._run_test(script, test)

Simran Basi

2013-01-29 13:13:43 -0800

[diff] [blame]

381

382

Fang Deng

2013-11-13 18:27:06 -0800

[diff] [blame]

383

@staticmethod
def _output_perf_value(perf_value_writer, perf_data):
    """Output perf values to result dir.

    The perf values will be output to the result dir and
    be subsequently uploaded to perf dashboard.

    @param perf_value_writer: Should be an instance with the function
                              output_perf_value(), if None, no perf value
                              will be written. Typically this will be the
                              job object from an autotest test.
    @param perf_data: A list of perf values, each value is
                      a dictionary that looks like
                      {'graph':'GraphA', 'trace':'metric1',
                       'units':'secs', 'value':0.5}
    """
    if perf_value_writer is None:
        # Honour the documented contract: without a writer there is
        # nowhere to send the values, so do nothing instead of failing.
        return

    for perf_value in perf_data:
        perf_value_writer.output_perf_value(
                description=perf_value['trace'],
                value=perf_value['value'],
                units=perf_value['units'],
                graph=perf_value['graph'])

405

406

407

def run_telemetry_benchmark(self, benchmark, perf_value_writer=None):

Simran Basi

2013-01-29 13:13:43 -0800

[diff] [blame]

408

"""Runs a telemetry benchmark on a dut.

409

410

@param benchmark: Benchmark we want to run.

Fang Deng

2013-11-13 18:27:06 -0800

[diff] [blame]

411

@param perf_value_writer: Should be an instance with the function

412

output_perf_value(), if None, no perf value

413

will be written. Typically this will be the

414

job object from an autotest test.

Simran Basi

2013-01-29 13:13:43 -0800

[diff] [blame]

415

416

@returns A TelemetryResult Instance with the results of this telemetry

417

execution.

418

"""

Dave Tu

2013-11-05 15:54:48 -0800

[diff] [blame]

419

logging.debug('Running telemetry benchmark: %s', benchmark)

Simran Basi

2013-01-29 13:13:43 -0800

[diff] [blame]

420

telemetry_script = os.path.join(self._telemetry_path,

421

TELEMETRY_RUN_BENCHMARKS_SCRIPT)

Dave Tu

2013-11-05 15:54:48 -0800

[diff] [blame]

422

result = self._run_telemetry(telemetry_script, benchmark)

Simran Basi

2013-01-29 13:13:43 -0800

[diff] [blame]

423

result.parse_benchmark_results()

424

Fang Deng

2013-11-13 18:27:06 -0800

[diff] [blame]

425

if perf_value_writer:

426

self._output_perf_value(perf_value_writer, result.perf_data)

Simran Basi

2013-01-29 13:13:43 -0800

[diff] [blame]

427

428

if result.status is WARNING_STATUS:

Dave Tu

2013-11-05 15:54:48 -0800

[diff] [blame]

429

raise error.TestWarn('Telemetry Benchmark: %s'

430

' exited with Warnings.' % benchmark)

Simran Basi

2013-01-29 13:13:43 -0800

[diff] [blame]

431

if result.status is FAILED_STATUS:

Dave Tu

2013-11-05 15:54:48 -0800

[diff] [blame]

432

raise error.TestFail('Telemetry Benchmark: %s'

433

' failed to run.' % benchmark)

Simran Basi