Takuto Ikuta | 9af233a | 2018-11-29 03:53:53 +0000 | [diff] [blame] | 1 | #!/usr/bin/env python |
| 2 | # Copyright 2018 The Chromium Authors. All rights reserved. |
| 3 | # Use of this source code is governed by a BSD-style license that can be |
| 4 | # found in the LICENSE file. |
Takuto Ikuta | 9af233a | 2018-11-29 03:53:53 +0000 | [diff] [blame] | 5 | """ |
| 6 | This script uploads the ninja_log from a Googler's machine. |
| 7 | |
| 8 | Server side implementation is in |
| 9 | https://cs.chromium.org/chromium/infra/go/src/infra/appengine/chromium_build_stats/ |
| 10 | |
| 11 | The uploaded ninjalog is stored in a BigQuery table with the following schema: |
| 12 | https://cs.chromium.org/chromium/infra/go/src/infra/appengine/chromium_build_stats/ninjaproto/ninjalog.proto |
| 13 | |
| 14 | The log will be used to analyze user side build performance. |
| 15 | """ |
| 16 | |
| 17 | import argparse |
| 18 | import cStringIO |
| 19 | import gzip |
| 20 | import json |
| 21 | import logging |
| 22 | import multiprocessing |
| 23 | import os |
| 24 | import platform |
Takuto Ikuta | 96fdf7c | 2018-12-03 09:18:39 +0000 | [diff] [blame] | 25 | import subprocess |
Takuto Ikuta | 9af233a | 2018-11-29 03:53:53 +0000 | [diff] [blame] | 26 | import sys |
Takuto Ikuta | 36248fc | 2019-01-11 03:02:32 +0000 | [diff] [blame] | 27 | import time |
Takuto Ikuta | 9af233a | 2018-11-29 03:53:53 +0000 | [diff] [blame] | 28 | |
Edward Lesmes | 1961043 | 2020-01-07 03:30:49 +0000 | [diff] [blame] | 29 | import httplib2 |
Takuto Ikuta | 9af233a | 2018-11-29 03:53:53 +0000 | [diff] [blame] | 30 | |
# These build configs affect build performance a lot.
# TODO(https://crbug.com/900161): Add 'blink_symbol_level' and
# 'enable_js_type_check'.
#
# ParseGNArgs() keeps only the GN args whose name appears in this tuple and
# skips every other arg.
WHITELISTED_CONFIGS = ('symbol_level', 'use_goma', 'is_debug',
                       'is_component_build', 'enable_nacl', 'host_os',
                       'host_cpu', 'target_os', 'target_cpu')
| 37 | |
Takuto Ikuta | c8069af | 2019-01-09 06:24:56 +0000 | [diff] [blame] | 38 | |
def IsGoogler(server):
    """Return True when `server` says this machine should upload its log.

    Sends a GET request to https://<server>/should-upload and answers True
    only when the response body is exactly 'Success'. An httplib2 error
    while making the request is answered with False.
    """
    url = 'https://' + server + '/should-upload'
    try:
        response_body = httplib2.Http().request(url, 'GET')[1]
    except httplib2.HttpLib2Error:
        return False
    return response_body == 'Success'
| 47 | |
Takuto Ikuta | 9af233a | 2018-11-29 03:53:53 +0000 | [diff] [blame] | 48 | |
def ParseGNArgs(gn_args):
    """Pick the whitelisted build configs out of JSON-formatted gn args.

    Args:
        gn_args: JSON text holding a list of objects. Each object has a
            "name", and the ones that are kept must have a 'default' entry
            or a 'current' entry carrying a 'value'.

    Returns:
        Dict mapping every arg name listed in WHITELISTED_CONFIGS to its
        'current' value when that entry exists, otherwise to its 'default'
        value.
    """
    selected = {}
    for entry in json.loads(gn_args):
        name = entry["name"]
        if name in WHITELISTED_CONFIGS:
            # An explicitly set value takes precedence over the default.
            source = 'current' if 'current' in entry else 'default'
            selected[name] = entry[source]['value']
    return selected
| 64 | |
Takuto Ikuta | 96fdf7c | 2018-12-03 09:18:39 +0000 | [diff] [blame] | 65 | |
def GetBuildTargetFromCommandLine(cmdline):
    """Get build targets from commandline.

    Args:
        cmdline: ninja command line as a list of strings. cmdline[0] is
            taken to be the program name and is skipped.

    Returns:
        List of the arguments that are neither a recognized flag nor the
        value of a flag, in their original order.
    """
    # Flags that take a value, either as the following argument ('-j 8') or
    # attached to the flag itself ('-j8').
    onearg_flags = ('-C', '-f', '-j', '-k', '-l', '-d', '-t', '-w')
    # Flags that take no value. The long spellings and the help flags are
    # listed too so that they are not mistaken for build targets.
    zeroarg_flags = ('--version', '-n', '-v', '--verbose', '--quiet', '-h',
                     '--help')

    targets = []

    # Skip argv0.
    idx = 1
    while idx < len(cmdline):
        arg = cmdline[idx]
        if arg in onearg_flags:
            # Separate form: skip the flag and the value that follows it.
            idx += 2
            continue

        idx += 1
        if arg[:2] in onearg_flags or arg in zeroarg_flags:
            # Attached-value form ('-j8') or a flag without a value.
            continue

        targets.append(arg)

    return targets
| 92 | |
Takuto Ikuta | cf56a4b | 2018-12-18 05:47:26 +0000 | [diff] [blame] | 93 | |
def GetJflag(cmdline):
    """Return the job count passed to ninja with -j, if any.

    Both the separate form ('-j', '8') and the attached form ('-j8') are
    understood. Arguments are scanned in order and the first -j carrying an
    all-digit value wins.

    Returns:
        The job count as an int, or None when no -j with a numeric value is
        found.
    """
    for pos, arg in enumerate(cmdline):
        if arg == '-j':
            # Separate form: the candidate value is the next argument.
            value = cmdline[pos + 1] if pos + 1 < len(cmdline) else ''
        elif arg.startswith('-j'):
            # Attached form: the candidate value follows the flag directly.
            value = arg[len('-j'):]
        else:
            continue

        if value.isdigit():
            return int(value)

    return None
Takuto Ikuta | c8069af | 2019-01-09 06:24:56 +0000 | [diff] [blame] | 104 | |
Takuto Ikuta | 96fdf7c | 2018-12-03 09:18:39 +0000 | [diff] [blame] | 105 | |
def GetMetadata(cmdline, ninjalog):
    """Get metadata for uploaded ninjalog.

    Returned metadata has schema defined in
    https://cs.chromium.org?q="type+Metadata+struct+%7B"+file:%5Einfra/go/src/infra/appengine/chromium_build_stats/ninjalog/

    Args:
        cmdline: ninja command line as a list of strings.
        ninjalog: path to the ninja log file. The directory containing it is
            passed to `gn args` as the build directory.

    Returns:
        Dict with 'platform', 'cpu_core', 'build_configs' (every value
        converted to str) and 'targets', plus 'jobs' when the command line
        carries a numeric -j flag.

    TODO(tikuta): Collect GOMA_* env var.
    """
    # A bare file name has an empty dirname; that means the current directory.
    build_dir = os.path.dirname(ninjalog) or '.'

    args = ['gn', 'args', build_dir, '--list', '--short', '--json']
    if sys.platform == 'win32':
        # gn in PATH is bat file in windows environment (except cygwin).
        args = ['cmd', '/c'] + args

    try:
        gn_args = subprocess.check_output(args)
        build_configs = ParseGNArgs(gn_args)
    except (subprocess.CalledProcessError, OSError) as e:
        # Build configs are optional: a gn that exits non-zero, or that
        # cannot be started at all (OSError), must not abort the upload.
        logging.error("Failed to call gn %s", e)
        build_configs = {}

    # Stringify config.
    build_configs = {k: str(v) for k, v in build_configs.items()}

    metadata = {
        'platform': platform.system(),
        'cpu_core': multiprocessing.cpu_count(),
        'build_configs': build_configs,
        'targets': GetBuildTargetFromCommandLine(cmdline),
    }

    # 'jobs' is reported only when -j was given explicitly.
    jflag = GetJflag(cmdline)
    if jflag is not None:
        metadata['jobs'] = jflag

    return metadata
Takuto Ikuta | 9af233a | 2018-11-29 03:53:53 +0000 | [diff] [blame] | 147 | |
Takuto Ikuta | 9af233a | 2018-11-29 03:53:53 +0000 | [diff] [blame] | 148 | |
def GetNinjalog(cmdline):
    """Return the .ninja_log path implied by the ninja command line.

    The log is looked for in the directory named by the last -C flag, given
    either as '-C dir' or as '-Cdir'. Without such a flag the current working
    directory is used.
    """
    flag = '-C'
    build_dir = '.'

    remaining = iter(cmdline)
    for arg in remaining:
        if arg == flag:
            # Separate form: consume the next argument as the directory. A
            # trailing '-C' with nothing after it leaves the directory as is.
            build_dir = next(remaining, build_dir)
        elif arg.startswith(flag):
            # Attached form; arg is longer than the bare flag here.
            build_dir = arg[len(flag):]

    return os.path.join(build_dir, '.ninja_log')
| 167 | |
Takuto Ikuta | 9af233a | 2018-11-29 03:53:53 +0000 | [diff] [blame] | 168 | |
def main():
    """Upload the ninja log of the build that just finished.

    Parses the command line, asks the server whether this machine should
    upload, and if so POSTs the gzip-compressed ninja log followed by a JSON
    metadata record.

    Returns:
        Exit code for the process. 0 when the upload succeeded or was
        skipped (the server declined, or the log was not modified within the
        last 2 seconds). 1 when the log file is missing, the upload request
        raised an httplib2 error, or the server answered with a status other
        than 200.
    """
    parser = argparse.ArgumentParser()
    parser.add_argument('--server',
                        default='chromium-build-stats.appspot.com',
                        help='server to upload ninjalog file.')
    parser.add_argument('--ninjalog', help='ninjalog file to upload.')
    parser.add_argument('--verbose',
                        action='store_true',
                        help='Enable verbose logging.')
    parser.add_argument('--cmdline',
                        required=True,
                        nargs=argparse.REMAINDER,
                        help='command line args passed to ninja.')

    args = parser.parse_args()

    if args.verbose:
        logging.basicConfig(level=logging.INFO)
    else:
        # Disable logging.
        logging.disable(logging.CRITICAL)

    if not IsGoogler(args.server):
        return 0

    # An explicit --ninjalog wins; otherwise derive the path from ninja's -C.
    ninjalog = args.ninjalog or GetNinjalog(args.cmdline)
    if not os.path.isfile(ninjalog):
        logging.warning("ninjalog is not found in %s", ninjalog)
        return 1

    # We assume that each ninja invocation interval takes at least 2 seconds.
    # This is not to have duplicate entry in server when current build is no-op.
    if os.stat(ninjalog).st_mtime < time.time() - 2:
        logging.info("ninjalog is not updated recently %s", ninjalog)
        return 0

    output = cStringIO.StringIO()

    # Payload layout: the raw log, a marker line, then the JSON metadata, all
    # inside a single gzip stream.
    with open(ninjalog) as f:
        with gzip.GzipFile(fileobj=output, mode='wb') as g:
            g.write(f.read())
            g.write('# end of ninja log\n')

            metadata = GetMetadata(args.cmdline, ninjalog)
            logging.info('send metadata: %s', json.dumps(metadata))
            g.write(json.dumps(metadata))

    h = httplib2.Http()
    try:
        resp_headers, content = h.request('https://' + args.server +
                                          '/upload_ninja_log/',
                                          'POST',
                                          body=output.getvalue(),
                                          headers={'Content-Encoding': 'gzip'})
    except httplib2.HttpLib2Error as e:
        # Report a failed upload through the exit code, as IsGoogler() does
        # for its own request, instead of ending in a traceback.
        logging.warning("failed to upload ninjalog: %s", e)
        return 1

    if resp_headers.status != 200:
        logging.warning("unexpected status code for response: %s",
                        resp_headers.status)
        return 1

    logging.info('response header: %s', resp_headers)
    logging.info('response content: %s', content)
    return 0
| 230 | |
| 231 | |
# Run the uploader only when this file is executed as a script; the value
# returned by main() becomes the process exit code.
if __name__ == '__main__':
    sys.exit(main())