blob: 4af7eb3c4de72dace8771fb5479fbf4e48afd39c [file] [log] [blame]
Josip Sokcevic4de5dea2022-03-23 21:15:14 +00001#!/usr/bin/env python3
Edward Lemur32e3d1e2018-07-12 00:54:05 +00002# Copyright (c) 2018 The Chromium Authors. All rights reserved.
3# Use of this source code is governed by a BSD-style license that can be
4# found in the LICENSE file.
5
Edward Lemurc87d45b2018-07-26 17:43:11 +00006from __future__ import print_function
7
Edward Lemur03d6d112018-10-23 15:17:36 +00008import re
Edward Lesmes1e59a242021-04-30 18:38:25 +00009import os
Josip Sokcevic7958e302023-03-01 23:02:21 +000010import scm
Edward Lemur32e3d1e2018-07-12 00:54:05 +000011import subprocess2
12import sys
Raul Tambreb946b232019-03-26 14:48:46 +000013
14try:
15 import urlparse
16except ImportError: # For Py3 compatibility
17 import urllib.parse as urlparse
Edward Lemur32e3d1e2018-07-12 00:54:05 +000018
Edward Lemur32e3d1e2018-07-12 00:54:05 +000019
# Version of the metrics-recording scheme.
# Bump this whenever new metrics are added: users are then shown what changed
# and asked to opt in again.
CURRENT_VERSION = 2

# Endpoint of the metrics collection app.
APP_URL = 'https://cit-cli-metrics.appspot.com'

# Raw value of DEPOT_TOOLS_REPORT_BUILD (None when the variable is unset).
REPORT_BUILD = os.getenv('DEPOT_TOOLS_REPORT_BUILD')

# Collection is enabled unless either opt-out variable is set to exactly '0'.
COLLECT_METRICS = all(
    os.getenv(variable) != '0'
    for variable in ('DEPOT_TOOLS_COLLECT_METRICS', 'DEPOT_TOOLS_METRICS'))

SYNC_STATUS_SUCCESS = 'SYNC_STATUS_SUCCESS'
SYNC_STATUS_FAILURE = 'SYNC_STATUS_FAILURE'
34
Edward Lesmes1e59a242021-04-30 18:38:25 +000035
def get_notice_countdown_header(countdown):
    """Yield the header line of the metrics notice for |countdown|.

    A countdown of 0 announces that collection is happening now; any other
    value announces how many executions remain before it starts.
    """
    yield (' METRICS COLLECTION IS TAKING PLACE' if countdown == 0 else
           ' METRICS COLLECTION WILL START IN %d EXECUTIONS' % countdown)
Edward Lemur32e3d1e2018-07-12 00:54:05 +000041
def get_notice_version_change_header():
    """Yield the header lines shown when the metrics version has changed."""
    header = (
        ' WE ARE COLLECTING ADDITIONAL METRICS',
        '',
        ' Please review the changes and opt-in again.',
    )
    for text in header:
        yield text
46
def get_notice_footer():
    """Yield the footer lines explaining how to opt in or out of metrics."""
    footer = (
        'To suppress this message opt in or out using:',
        '$ gclient metrics [--opt-in] [--opt-out]',
        'For more information please see metrics.README.md',
        'in your depot_tools checkout or visit',
        'https://bit.ly/3MpLAYM.',
    )
    for text in footer:
        yield text
Samuel Huang98a7e802019-02-12 15:32:22 +000053
def get_change_notice(version):
    """Return the notice lines describing what metrics |version| added.

    Args:
      version: The metrics version number being announced.

    Returns:
      A list of strings, one per line of the notice. The list is empty for
      version 0 (nothing changed) and for any version without a notice, so
      the result can always be concatenated onto another list.
    """
    if version == 1:
        return [
            'We want to collect the Git version.',
            'We want to collect information about the HTTP',
            'requests that depot_tools makes, and the git and',
            'cipd commands it executes.',
            '',
            'We only collect known strings to make sure we',
            'don\'t record PII.',
        ]

    if version == 2:
        return [
            'We will start collecting metrics from bots.',
            'There are no changes for developers.',
            'If the DEPOT_TOOLS_REPORT_BUILD environment variable is set,',
            'we will report information about the current build',
            '(e.g. buildbucket project, bucket, builder and build id),',
            'and authenticate to the metrics collection server.',
            'This information will only be recorded for requests',
            'authenticated as bot service accounts.',
        ]

    # Version 0 has no changes. Unknown versions also get an empty list
    # instead of an implicit None, which would break list concatenation.
    return []
Edward Lemur48836262018-10-18 02:08:06 +000080
81
# Allow-lists of values that may be recorded. Only strings that appear in
# these collections are reported, so arbitrary user data is not collected.

# Project URLs that may be reported.
KNOWN_PROJECT_URLS = {
    'https://chrome-internal.googlesource.com/chrome/ios_internal',
    'https://chrome-internal.googlesource.com/infra/infra_internal',
    'https://chromium.googlesource.com/breakpad/breakpad',
    'https://chromium.googlesource.com/chromium/src',
    'https://chromium.googlesource.com/chromium/tools/depot_tools',
    'https://chromium.googlesource.com/crashpad/crashpad',
    'https://chromium.googlesource.com/external/gyp',
    'https://chromium.googlesource.com/external/naclports',
    'https://chromium.googlesource.com/infra/goma/client',
    'https://chromium.googlesource.com/infra/infra',
    'https://chromium.googlesource.com/native_client/',
    'https://chromium.googlesource.com/syzygy',
    'https://chromium.googlesource.com/v8/v8',
    'https://dart.googlesource.com/sdk',
    'https://pdfium.googlesource.com/pdfium',
    'https://skia.googlesource.com/buildbot',
    'https://skia.googlesource.com/skia',
    'https://webrtc.googlesource.com/src',
}

# Hosts of HTTP requests that may be reported.
KNOWN_HTTP_HOSTS = {
    'chrome-internal-review.googlesource.com',
    'chromium-review.googlesource.com',
    'dart-review.googlesource.com',
    'eu1-mirror-chromium-review.googlesource.com',
    'pdfium-review.googlesource.com',
    'skia-review.googlesource.com',
    'us1-mirror-chromium-review.googlesource.com',
    'us2-mirror-chromium-review.googlesource.com',
    'us3-mirror-chromium-review.googlesource.com',
    'webrtc-review.googlesource.com',
}

# HTTP methods that may be reported.
KNOWN_HTTP_METHODS = {'DELETE', 'GET', 'PATCH', 'POST', 'PUT'}

# Maps the reported path name to the regex a request path must match.
KNOWN_HTTP_PATHS = {
    'accounts': re.compile(r'(/a)?/accounts/.*'),
    'changes': re.compile(r'(/a)?/changes/([^/]+)?$'),
    'changes/abandon': re.compile(r'(/a)?/changes/.*/abandon'),
    'changes/comments': re.compile(r'(/a)?/changes/.*/comments'),
    'changes/detail': re.compile(r'(/a)?/changes/.*/detail'),
    'changes/edit': re.compile(r'(/a)?/changes/.*/edit'),
    'changes/message': re.compile(r'(/a)?/changes/.*/message'),
    'changes/restore': re.compile(r'(/a)?/changes/.*/restore'),
    'changes/reviewers': re.compile(r'(/a)?/changes/.*/reviewers/.*'),
    'changes/revisions/commit':
        re.compile(r'(/a)?/changes/.*/revisions/.*/commit'),
    'changes/revisions/review':
        re.compile(r'(/a)?/changes/.*/revisions/.*/review'),
    'changes/submit': re.compile(r'(/a)?/changes/.*/submit'),
    'projects/branches': re.compile(r'(/a)?/projects/.*/branches/.*'),
}

# Values of the o= query parameter that may be reported.
KNOWN_HTTP_ARGS = {
    'ALL_REVISIONS',
    'CURRENT_COMMIT',
    'CURRENT_REVISION',
    'DETAILED_ACCOUNTS',
    'LABELS',
}

# Matches the output of `git --version`, capturing major, minor and micro.
GIT_VERSION_RE = re.compile(r'git version (\d)\.(\d{0,2})\.(\d{0,2})')

# Subcommand arguments that may be reported.
KNOWN_SUBCOMMAND_ARGS = {
    'cc',
    'hashtag',
    'l=Auto-Submit+1',
    'l=Code-Review+1',
    'l=Code-Review+2',
    'l=Commit-Queue+1',
    'l=Commit-Queue+2',
    'label',
    'm',
    'notify=ALL',
    'notify=NONE',
    'private',
    'r',
    'ready',
    'topic',
    'wip',
}
183
Edward Lemur32e3d1e2018-07-12 00:54:05 +0000184
def get_python_version():
    """Return the running interpreter's version as 'major.minor.micro'."""
    major, minor, micro = sys.version_info[:3]
    return '%d.%d.%d' % (major, minor, micro)
188
189
def get_git_version():
    """Return the installed Git version as 'major.minor.micro'.

    Runs `git --version` and parses its stdout with GIT_VERSION_RE. Returns
    None when the output does not match that pattern.
    """
    proc = subprocess2.Popen(
        ['git', '--version'],
        stdout=subprocess2.PIPE,
        stderr=subprocess2.PIPE)
    output = proc.communicate()[0]
    found = GIT_VERSION_RE.match(output.decode('utf-8'))
    if found:
        return '.'.join(found.groups())
    return None
200
201
def get_bot_metrics():
    """Return build information parsed from REPORT_BUILD, or None.

    REPORT_BUILD must have exactly four '/'-separated parts
    (project/bucket/builder/build) with an integer build. If it is unset or
    does not have that shape, None is returned.
    """
    try:
        project, bucket, builder, build = REPORT_BUILD.split('/')
        build_id = int(build)
    except (AttributeError, ValueError):
        # AttributeError: REPORT_BUILD is None (variable not set).
        # ValueError: wrong number of parts, or a non-integer build id.
        return None

    builder_info = {
        'project': project,
        'bucket': bucket,
        'builder': builder,
    }
    return {
        'build_id': build_id,
        'builder': builder_info,
    }
Edward Lesmes1e59a242021-04-30 18:38:25 +0000215
216
217
def return_code_from_exception(exception):
    """Return the exit code that would result from raising the exception.

    Args:
      exception: None, or a sequence whose item at index 1 is the exception
        instance (presumably a sys.exc_info() tuple; verify against callers).

    Returns:
      An integer exit code: 0 when there is no exception, 130 for
      KeyboardInterrupt, the interpreter's exit status for SystemExit, and 1
      for anything else.
    """
    if exception is None:
        return 0
    error = exception[1]
    if isinstance(error, KeyboardInterrupt):
        return 130
    if isinstance(error, SystemExit):
        code = error.code
        # Mirror the interpreter's handling of SystemExit: no code means
        # success, an integer is used as-is, and any other object (e.g. a
        # message string) is printed and the process exits with status 1.
        if code is None:
            return 0
        if isinstance(code, int):
            return code
        return 1
    return 1
228
229
def extract_known_subcommand_args(args):
    """Return the sorted subset of |args| found in KNOWN_SUBCOMMAND_ARGS.

    An argument is kept verbatim when it is known as a whole. Otherwise only
    the part before the first '=' is considered, and that part is kept when
    it is known.
    """
    recognized = []
    for candidate in args:
        if candidate in KNOWN_SUBCOMMAND_ARGS:
            recognized.append(candidate)
            continue
        key = candidate.partition('=')[0]
        if key in KNOWN_SUBCOMMAND_ARGS:
            recognized.append(key)
    recognized.sort()
    return recognized
Edward Lemurfec80c42018-11-01 23:14:14 +0000241
242
def extract_http_metrics(request_uri, method, status, response_time):
    """Build the metrics dictionary for a single HTTP request.

    The status and response time are always reported. The method, host, path
    and arguments are reported only when they are found in the matching
    KNOWN_HTTP_* constant defined above.

    The path is reported as the name of the first KNOWN_HTTP_PATHS entry
    whose regex matches the path of |request_uri|.

    Arguments are the values of the o= URL parameter. In Gerrit, each o
    option requests additional fields, which costs extra database lookups and
    slows the response, so the known ones are collected.
    """
    metrics = {
        'status': status,
        'response_time': response_time,
    }

    if method in KNOWN_HTTP_METHODS:
        metrics['method'] = method

    url = urlparse.urlparse(request_uri)

    host = url.netloc
    if host in KNOWN_HTTP_HOSTS:
        metrics['host'] = host

    # Report the first known path pattern that matches, if any.
    path_name = next(
        (name for name, pattern in KNOWN_HTTP_PATHS.items()
         if pattern.match(url.path)),
        None)
    if path_name is not None:
        metrics['path'] = path_name

    # Keep only the known o-parameters from the query string.
    options = urlparse.parse_qs(url.query).get('o', [])
    known_options = [option for option in options if option in KNOWN_HTTP_ARGS]
    if known_options:
        metrics['arguments'] = known_options

    return metrics
289
290
def get_repo_timestamp(path_to_repo):
    """Get the timestamp of the latest commit upstream of |path_to_repo|.

    Runs `git log -n1 <upstream> --format=%at` in |path_to_repo|, where
    <upstream> is the upstream of the checked-out branch. HEAD is used when
    no upstream is reported or looking it up fails.

    Returns the stripped stdout of that command, or None if git exits with a
    non-zero status.
    """
    try:
        ref = scm.GIT.GetUpstreamBranch(path_to_repo) or 'HEAD'
    except subprocess2.CalledProcessError:
        ref = 'HEAD'

    command = ['git', '-C', path_to_repo, 'log', '-n1', ref, '--format=%at']
    proc = subprocess2.Popen(
        command, stdout=subprocess2.PIPE, stderr=subprocess2.PIPE)
    output = proc.communicate()[0]

    # A non-zero exit status means git failed; report nothing.
    return output.strip() if proc.returncode == 0 else None
Edward Lemur32e3d1e2018-07-12 00:54:05 +0000315
def print_boxed_text(out, min_width, lines):
    """Write |lines| surrounded by an ASCII box using |out|.

    Args:
      out: Callable taking one string; called once per output row.
      min_width: Minimum width of the text area inside the box.
      lines: Iterable of strings to print, one per row. May be empty, and may
        be a one-shot iterable such as a generator.
    """
    # Materialize once: the lines are needed for the width and for the rows.
    lines = list(lines)
    [EW, NS, SE, SW, NE, NW] = list('=|++++')
    # Folding min_width into the list keeps max() valid when lines is empty.
    width = max([min_width] + [len(line) for line in lines])
    out(SE + EW * (width + 2) + SW + '\n')
    for line in lines:
        out('%s %-*s %s\n' % (NS, width, line, NS))
    out(NE + EW * (width + 2) + NW + '\n')
Edward Lemur32e3d1e2018-07-12 00:54:05 +0000323
def print_notice(countdown):
    """Write the boxed metrics-collection status notice to stderr."""
    header = list(get_notice_countdown_header(countdown))
    footer = list(get_notice_footer())
    # A blank row separates the countdown header from the opt-in/out footer.
    print_boxed_text(sys.stderr.write, 49, header + [''] + footer)
Edward Lemur48836262018-10-18 02:08:06 +0000330
def print_version_change(config_version):
    """Write a boxed notice to stderr listing newly collected metrics.

    Includes the change notice of every version after |config_version|, up to
    and including CURRENT_VERSION, each preceded by a blank row.
    """
    notice = list(get_notice_version_change_header())
    first_new_version = config_version + 1
    for version in range(first_new_version, CURRENT_VERSION + 1):
        notice.append('')
        notice.extend(get_change_notice(version))
    print_boxed_text(sys.stderr.write, 49, notice)
Hans Wennborg24b5f902019-03-15 18:51:27 +0000337 print_boxed_text(sys.stderr.write, 49, lines)