|
| 1 | +#!/usr/bin/env python3 |
| 2 | +""" |
| 3 | +This script: |
| 4 | +- Builds clang with user-defined flags |
| 5 | +- Uses that clang to build an instrumented clang, which can be used to collect |
| 6 | + PGO samples |
| 7 | +- Builds a user-defined set of sources (default: clang) to act as a |
| 8 | + "benchmark" to generate a PGO profile |
| 9 | +- Builds clang once more with the PGO profile generated above |
| 10 | +
|
| 11 | +This is a total of four clean builds of clang (by default). This may take a |
| 12 | +while. :) |
| 13 | +""" |
| 14 | + |
| 15 | +import argparse |
| 16 | +import collections |
| 17 | +import multiprocessing |
| 18 | +import os |
| 19 | +import shlex |
| 20 | +import shutil |
| 21 | +import subprocess |
| 22 | +import sys |
| 23 | + |
| 24 | +### User configuration |
| 25 | + |
| 26 | + |
| 27 | +# If you want to use a different 'benchmark' than building clang, make this |
| 28 | +# function do what you want. out_dir is the build directory for clang, so all |
| 29 | +# of the clang binaries will live under "${out_dir}/bin/". Using clang in |
| 30 | +# ${out_dir} will magically have the profiles go to the right place. |
| 31 | +# |
| 32 | +# You may assume that out_dir is a freshly-built directory that you can reach |
| 33 | +# in to build more things, if you'd like. |
| 34 | +def _run_benchmark(env, out_dir, include_debug_info): |
| 35 | + """The 'benchmark' we run to generate profile data.""" |
| 36 | + target_dir = env.output_subdir('instrumentation_run') |
| 37 | + |
| 38 | + # `check-llvm` and `check-clang` are cheap ways to increase coverage. The |
| 39 | + # former lets us touch on the non-x86 backends a bit if configured, and the |
| 40 | + # latter gives us more C to chew on (and will send us through diagnostic |
| 41 | + # paths a fair amount, though the `if (stuff_is_broken) { diag() ... }` |
| 42 | + # branches should still heavily be weighted in the not-taken direction, |
| 43 | + # since we built all of LLVM/etc). |
| 44 | + _build_things_in(env, target_dir, what=['check-llvm', 'check-clang']) |
| 45 | + |
| 46 | + # Building tblgen gets us coverage; don't skip it. (out_dir may also not |
| 47 | + # have them anyway, but that's less of an issue) |
| 48 | + cmake = _get_cmake_invocation_for_bootstrap_from( |
| 49 | + env, out_dir, skip_tablegens=False) |
| 50 | + |
| 51 | + if include_debug_info: |
| 52 | + cmake.add_flag('CMAKE_BUILD_TYPE', 'RelWithDebInfo') |
| 53 | + |
| 54 | + _run_fresh_cmake(env, cmake, target_dir) |
| 55 | + |
| 56 | + # Just build all the things. The more data we have, the better. |
| 57 | + _build_things_in(env, target_dir, what=['all']) |
| 58 | + |
| 59 | + |
| 60 | +### Script |
| 61 | + |
| 62 | + |
| 63 | +class CmakeInvocation: |
| 64 | + _cflags = ['CMAKE_C_FLAGS', 'CMAKE_CXX_FLAGS'] |
| 65 | + _ldflags = [ |
| 66 | + 'CMAKE_EXE_LINKER_FLAGS', |
| 67 | + 'CMAKE_MODULE_LINKER_FLAGS', |
| 68 | + 'CMAKE_SHARED_LINKER_FLAGS', |
| 69 | + ] |
| 70 | + |
| 71 | + def __init__(self, cmake, maker, cmake_dir): |
| 72 | + self._prefix = [cmake, '-G', maker, cmake_dir] |
| 73 | + |
| 74 | + # Map of str -> (list|str). |
| 75 | + self._flags = {} |
| 76 | + for flag in CmakeInvocation._cflags + CmakeInvocation._ldflags: |
| 77 | + self._flags[flag] = [] |
| 78 | + |
| 79 | + def add_new_flag(self, key, value): |
| 80 | + self.add_flag(key, value, allow_overwrites=False) |
| 81 | + |
| 82 | + def add_flag(self, key, value, allow_overwrites=True): |
| 83 | + if key not in self._flags: |
| 84 | + self._flags[key] = value |
| 85 | + return |
| 86 | + |
| 87 | + existing_value = self._flags[key] |
| 88 | + if isinstance(existing_value, list): |
| 89 | + existing_value.append(value) |
| 90 | + return |
| 91 | + |
| 92 | + if not allow_overwrites: |
| 93 | + raise ValueError('Invalid overwrite of %s requested' % key) |
| 94 | + |
| 95 | + self._flags[key] = value |
| 96 | + |
| 97 | + def add_cflags(self, flags): |
| 98 | + # No, I didn't intend to append ['-', 'O', '2'] to my flags, thanks :) |
| 99 | + assert not isinstance(flags, str) |
| 100 | + for f in CmakeInvocation._cflags: |
| 101 | + self._flags[f].extend(flags) |
| 102 | + |
| 103 | + def add_ldflags(self, flags): |
| 104 | + assert not isinstance(flags, str) |
| 105 | + for f in CmakeInvocation._ldflags: |
| 106 | + self._flags[f].extend(flags) |
| 107 | + |
| 108 | + def to_args(self): |
| 109 | + args = self._prefix.copy() |
| 110 | + for key, value in sorted(self._flags.items()): |
| 111 | + if isinstance(value, list): |
| 112 | + # We preload all of the list-y values (cflags, ...). If we've |
| 113 | + # nothing to add, don't. |
| 114 | + if not value: |
| 115 | + continue |
| 116 | + value = ' '.join(value) |
| 117 | + |
| 118 | + arg = '-D' + key |
| 119 | + if value != '': |
| 120 | + arg += '=' + value |
| 121 | + args.append(arg) |
| 122 | + return args |
| 123 | + |
| 124 | + |
| 125 | +class Env: |
| 126 | + def __init__(self, llvm_dir, use_make, output_dir, default_cmake_args, |
| 127 | + dry_run): |
| 128 | + self.llvm_dir = llvm_dir |
| 129 | + self.use_make = use_make |
| 130 | + self.output_dir = output_dir |
| 131 | + self.default_cmake_args = default_cmake_args.copy() |
| 132 | + self.dry_run = dry_run |
| 133 | + |
| 134 | + def get_default_cmake_args_kv(self): |
| 135 | + return self.default_cmake_args.items() |
| 136 | + |
| 137 | + def get_cmake_maker(self): |
| 138 | + return 'Ninja' if not self.use_make else 'Unix Makefiles' |
| 139 | + |
| 140 | + def get_make_command(self): |
| 141 | + if self.use_make: |
| 142 | + return ['make', '-j{}'.format(multiprocessing.cpu_count())] |
| 143 | + return ['ninja'] |
| 144 | + |
| 145 | + def output_subdir(self, name): |
| 146 | + return os.path.join(self.output_dir, name) |
| 147 | + |
| 148 | + def has_llvm_subproject(self, name): |
| 149 | + if name == 'compiler-rt': |
| 150 | + subdir = 'projects/compiler-rt' |
| 151 | + elif name == 'clang': |
| 152 | + subdir = 'tools/clang' |
| 153 | + else: |
| 154 | + raise ValueError('Unknown subproject: %s' % name) |
| 155 | + |
| 156 | + return os.path.isdir(os.path.join(self.llvm_dir, subdir)) |
| 157 | + |
| 158 | + # Note that we don't allow capturing stdout/stderr. This works quite nicely |
| 159 | + # with dry_run. |
| 160 | + def run_command(self, |
| 161 | + cmd, |
| 162 | + cwd=None, |
| 163 | + check=False, |
| 164 | + silent_unless_error=False): |
| 165 | + cmd_str = ' '.join(shlex.quote(s) for s in cmd) |
| 166 | + print( |
| 167 | + 'Running `%s` in %s' % (cmd_str, shlex.quote(cwd or os.getcwd()))) |
| 168 | + |
| 169 | + if self.dry_run: |
| 170 | + return |
| 171 | + |
| 172 | + if silent_unless_error: |
| 173 | + stdout, stderr = subprocess.PIPE, subprocess.STDOUT |
| 174 | + else: |
| 175 | + stdout, stderr = None, None |
| 176 | + |
| 177 | + # Don't use subprocess.run because it's >= py3.5 only, and it's not too |
| 178 | + # much extra effort to get what it gives us anyway. |
| 179 | + popen = subprocess.Popen( |
| 180 | + cmd, |
| 181 | + stdin=subprocess.DEVNULL, |
| 182 | + stdout=stdout, |
| 183 | + stderr=stderr, |
| 184 | + cwd=cwd) |
| 185 | + stdout, _ = popen.communicate() |
| 186 | + return_code = popen.wait(timeout=0) |
| 187 | + |
| 188 | + if not return_code: |
| 189 | + return |
| 190 | + |
| 191 | + if silent_unless_error: |
| 192 | + print(stdout.decode('utf-8', 'ignore')) |
| 193 | + |
| 194 | + if check: |
| 195 | + raise subprocess.CalledProcessError( |
| 196 | + returncode=return_code, cmd=cmd, output=stdout, stderr=None) |
| 197 | + |
| 198 | + |
| 199 | +def _get_default_cmake_invocation(env): |
| 200 | + inv = CmakeInvocation( |
| 201 | + cmake='cmake', maker=env.get_cmake_maker(), cmake_dir=env.llvm_dir) |
| 202 | + for key, value in env.get_default_cmake_args_kv(): |
| 203 | + inv.add_new_flag(key, value) |
| 204 | + return inv |
| 205 | + |
| 206 | + |
| 207 | +def _get_cmake_invocation_for_bootstrap_from(env, out_dir, |
| 208 | + skip_tablegens=True): |
| 209 | + clang = os.path.join(out_dir, 'bin', 'clang') |
| 210 | + cmake = _get_default_cmake_invocation(env) |
| 211 | + cmake.add_new_flag('CMAKE_C_COMPILER', clang) |
| 212 | + cmake.add_new_flag('CMAKE_CXX_COMPILER', clang + '++') |
| 213 | + |
| 214 | + # We often get no value out of building new tblgens; the previous build |
| 215 | + # should have them. It's still correct to build them, just slower. |
| 216 | + def add_tablegen(key, binary): |
| 217 | + path = os.path.join(out_dir, 'bin', binary) |
| 218 | + |
| 219 | + # Check that this exists, since the user's allowed to specify their own |
| 220 | + # stage1 directory (which is generally where we'll source everything |
| 221 | + # from). Dry runs should hope for the best from our user, as well. |
| 222 | + if env.dry_run or os.path.exists(path): |
| 223 | + cmake.add_new_flag(key, path) |
| 224 | + |
| 225 | + if skip_tablegens: |
| 226 | + add_tablegen('LLVM_TABLEGEN', 'llvm-tblgen') |
| 227 | + add_tablegen('CLANG_TABLEGEN', 'clang-tblgen') |
| 228 | + |
| 229 | + return cmake |
| 230 | + |
| 231 | + |
| 232 | +def _build_things_in(env, target_dir, what): |
| 233 | + cmd = env.get_make_command() + what |
| 234 | + env.run_command(cmd, cwd=target_dir, check=True) |
| 235 | + |
| 236 | + |
| 237 | +def _run_fresh_cmake(env, cmake, target_dir): |
| 238 | + if not env.dry_run: |
| 239 | + try: |
| 240 | + shutil.rmtree(target_dir) |
| 241 | + except FileNotFoundError: |
| 242 | + pass |
| 243 | + |
| 244 | + os.makedirs(target_dir, mode=0o755) |
| 245 | + |
| 246 | + cmake_args = cmake.to_args() |
| 247 | + env.run_command( |
| 248 | + cmake_args, cwd=target_dir, check=True, silent_unless_error=True) |
| 249 | + |
| 250 | + |
| 251 | +def _build_stage1_clang(env): |
| 252 | + target_dir = env.output_subdir('stage1') |
| 253 | + cmake = _get_default_cmake_invocation(env) |
| 254 | + _run_fresh_cmake(env, cmake, target_dir) |
| 255 | + |
| 256 | + # FIXME: The full build here is somewhat unfortunate. It's primarily |
| 257 | + # because I don't know what to call libclang_rt.profile for arches that |
| 258 | + # aren't x86_64 (and even then, it's in a subdir that contains clang's |
| 259 | + # current version). It would be nice to figure out what target I can |
| 260 | + # request to magically have libclang_rt.profile built for ${host} |
| 261 | + _build_things_in(env, target_dir, what=['all']) |
| 262 | + return target_dir |
| 263 | + |
| 264 | + |
| 265 | +def _generate_instrumented_clang_profile(env, stage1_dir, profile_dir, |
| 266 | + output_file): |
| 267 | + llvm_profdata = os.path.join(stage1_dir, 'bin', 'llvm-profdata') |
| 268 | + if env.dry_run: |
| 269 | + profiles = [os.path.join(profile_dir, '*.profraw')] |
| 270 | + else: |
| 271 | + profiles = [ |
| 272 | + os.path.join(profile_dir, f) for f in os.listdir(profile_dir) |
| 273 | + if f.endswith('.profraw') |
| 274 | + ] |
| 275 | + cmd = [llvm_profdata, 'merge', '-output=' + output_file] + profiles |
| 276 | + env.run_command(cmd, check=True) |
| 277 | + |
| 278 | + |
| 279 | +def _build_instrumented_clang(env, stage1_dir): |
| 280 | + assert os.path.isabs(stage1_dir) |
| 281 | + |
| 282 | + target_dir = os.path.join(env.output_dir, 'instrumented') |
| 283 | + cmake = _get_cmake_invocation_for_bootstrap_from(env, stage1_dir) |
| 284 | + cmake.add_new_flag('LLVM_BUILD_INSTRUMENTED', 'IR') |
| 285 | + |
| 286 | + # libcxx's configure step messes with our link order: we'll link |
| 287 | + # libclang_rt.profile after libgcc, and the former requires atexit from the |
| 288 | + # latter. So, configure checks fail. |
| 289 | + # |
| 290 | + # Since we don't need libcxx or compiler-rt anyway, just disable them. |
| 291 | + cmake.add_new_flag('LLVM_BUILD_RUNTIME', 'No') |
| 292 | + |
| 293 | + _run_fresh_cmake(env, cmake, target_dir) |
| 294 | + _build_things_in(env, target_dir, what=['clang', 'lld']) |
| 295 | + |
| 296 | + profiles_dir = os.path.join(target_dir, 'profiles') |
| 297 | + return target_dir, profiles_dir |
| 298 | + |
| 299 | + |
| 300 | +def _build_optimized_clang(env, stage1_dir, profdata_file): |
| 301 | + if not env.dry_run and not os.path.exists(profdata_file): |
| 302 | + raise ValueError('Looks like the profdata file at %s doesn\'t exist' % |
| 303 | + profdata_file) |
| 304 | + |
| 305 | + target_dir = os.path.join(env.output_dir, 'optimized') |
| 306 | + cmake = _get_cmake_invocation_for_bootstrap_from(env, stage1_dir) |
| 307 | + cmake.add_new_flag('LLVM_PROFDATA_FILE', os.path.abspath(profdata_file)) |
| 308 | + |
| 309 | + # We'll get complaints about hash mismatches in `main` in tools/etc. Ignore |
| 310 | + # it. |
| 311 | + cmake.add_cflags(['-Wno-backend-plugin']) |
| 312 | + _run_fresh_cmake(env, cmake, target_dir) |
| 313 | + _build_things_in(env, target_dir, what=['clang']) |
| 314 | + return target_dir |
| 315 | + |
| 316 | + |
| 317 | +Args = collections.namedtuple('Args', [ |
| 318 | + 'do_optimized_build', |
| 319 | + 'include_debug_info', |
| 320 | + 'profile_location', |
| 321 | + 'stage1_dir', |
| 322 | +]) |
| 323 | + |
| 324 | + |
| 325 | +def _parse_args(): |
| 326 | + parser = argparse.ArgumentParser( |
| 327 | + description='Builds LLVM and Clang with instrumentation, collects ' |
| 328 | + 'instrumentation profiles for them, and (optionally) builds things' |
| 329 | + 'with these PGO profiles. By default, it\'s assumed that you\'re ' |
| 330 | + 'running this from your LLVM root, and all build artifacts will be ' |
| 331 | + 'saved to $PWD/out.') |
| 332 | + parser.add_argument( |
| 333 | + '--cmake-extra-arg', |
| 334 | + action='append', |
| 335 | + default=[], |
| 336 | + help='an extra arg to pass to all cmake invocations. Note that this ' |
| 337 | + 'is interpreted as a -D argument, e.g. --cmake-extra-arg FOO=BAR will ' |
| 338 | + 'be passed as -DFOO=BAR. This may be specified multiple times.') |
| 339 | + parser.add_argument( |
| 340 | + '--dry-run', |
| 341 | + action='store_true', |
| 342 | + help='print commands instead of running them') |
| 343 | + parser.add_argument( |
| 344 | + '--llvm-dir', |
| 345 | + default='.', |
| 346 | + help='directory containing an LLVM checkout (default: $PWD)') |
| 347 | + parser.add_argument( |
| 348 | + '--no-optimized-build', |
| 349 | + action='store_true', |
| 350 | + help='disable the final, PGO-optimized build') |
| 351 | + parser.add_argument( |
| 352 | + '--out-dir', |
| 353 | + help='directory to write artifacts to (default: $llvm_dir/out)') |
| 354 | + parser.add_argument( |
| 355 | + '--profile-output', |
| 356 | + help='where to output the profile (default is $out/pgo_profile.prof)') |
| 357 | + parser.add_argument( |
| 358 | + '--stage1-dir', |
| 359 | + help='instead of having an initial build of everything, use the given ' |
| 360 | + 'directory. It is expected that this directory will have clang, ' |
| 361 | + 'llvm-profdata, and the appropriate libclang_rt.profile already built') |
| 362 | + parser.add_argument( |
| 363 | + '--use-debug-info-in-benchmark', |
| 364 | + action='store_true', |
| 365 | + help='use a regular build instead of RelWithDebInfo in the benchmark. ' |
| 366 | + 'This increases benchmark execution time and disk space requirements, ' |
| 367 | + 'but gives more coverage over debuginfo bits in LLVM and clang.') |
| 368 | + parser.add_argument( |
| 369 | + '--use-make', |
| 370 | + action='store_true', |
| 371 | + default=shutil.which('ninja') is None, |
| 372 | + help='use Makefiles instead of ninja') |
| 373 | + |
| 374 | + args = parser.parse_args() |
| 375 | + |
| 376 | + llvm_dir = os.path.abspath(args.llvm_dir) |
| 377 | + if args.out_dir is None: |
| 378 | + output_dir = os.path.join(llvm_dir, 'out') |
| 379 | + else: |
| 380 | + output_dir = os.path.abspath(args.out_dir) |
| 381 | + |
| 382 | + extra_args = {'CMAKE_BUILD_TYPE': 'Release'} |
| 383 | + for arg in args.cmake_extra_arg: |
| 384 | + if arg.startswith('-D'): |
| 385 | + arg = arg[2:] |
| 386 | + elif arg.startswith('-'): |
| 387 | + raise ValueError('Unknown not- -D arg encountered; you may need ' |
| 388 | + 'to tweak the source...') |
| 389 | + split = arg.split('=', 1) |
| 390 | + if len(split) == 1: |
| 391 | + key, val = split[0], '' |
| 392 | + else: |
| 393 | + key, val = split |
| 394 | + extra_args[key] = val |
| 395 | + |
| 396 | + env = Env( |
| 397 | + default_cmake_args=extra_args, |
| 398 | + dry_run=args.dry_run, |
| 399 | + llvm_dir=llvm_dir, |
| 400 | + output_dir=output_dir, |
| 401 | + use_make=args.use_make, |
| 402 | + ) |
| 403 | + |
| 404 | + if args.profile_output is not None: |
| 405 | + profile_location = args.profile_output |
| 406 | + else: |
| 407 | + profile_location = os.path.join(env.output_dir, 'pgo_profile.prof') |
| 408 | + |
| 409 | + result_args = Args( |
| 410 | + do_optimized_build=not args.no_optimized_build, |
| 411 | + include_debug_info=args.use_debug_info_in_benchmark, |
| 412 | + profile_location=profile_location, |
| 413 | + stage1_dir=args.stage1_dir, |
| 414 | + ) |
| 415 | + |
| 416 | + return env, result_args |
| 417 | + |
| 418 | + |
| 419 | +def _looks_like_llvm_dir(directory): |
| 420 | + """Arbitrary set of heuristics to determine if `directory` is an llvm dir. |
| 421 | +
|
| 422 | + Errs on the side of false-positives.""" |
| 423 | + |
| 424 | + contents = set(os.listdir(directory)) |
| 425 | + expected_contents = [ |
| 426 | + 'CODE_OWNERS.TXT', |
| 427 | + 'cmake', |
| 428 | + 'docs', |
| 429 | + 'include', |
| 430 | + 'utils', |
| 431 | + ] |
| 432 | + |
| 433 | + if not all(c in contents for c in expected_contents): |
| 434 | + return False |
| 435 | + |
| 436 | + try: |
| 437 | + include_listing = os.listdir(os.path.join(directory, 'include')) |
| 438 | + except NotADirectoryError: |
| 439 | + return False |
| 440 | + |
| 441 | + return 'llvm' in include_listing |
| 442 | + |
| 443 | + |
| 444 | +def _die(*args, **kwargs): |
| 445 | + kwargs['file'] = sys.stderr |
| 446 | + print(*args, **kwargs) |
| 447 | + sys.exit(1) |
| 448 | + |
| 449 | + |
| 450 | +def _main(): |
| 451 | + env, args = _parse_args() |
| 452 | + |
| 453 | + if not _looks_like_llvm_dir(env.llvm_dir): |
| 454 | + _die('Looks like %s isn\'t an LLVM directory; please see --help' % |
| 455 | + env.llvm_dir) |
| 456 | + if not env.has_llvm_subproject('clang'): |
| 457 | + _die('Need a clang checkout at tools/clang') |
| 458 | + if not env.has_llvm_subproject('compiler-rt'): |
| 459 | + _die('Need a compiler-rt checkout at projects/compiler-rt') |
| 460 | + |
| 461 | + def status(*args): |
| 462 | + print(*args, file=sys.stderr) |
| 463 | + |
| 464 | + if args.stage1_dir is None: |
| 465 | + status('*** Building stage1 clang...') |
| 466 | + stage1_out = _build_stage1_clang(env) |
| 467 | + else: |
| 468 | + stage1_out = args.stage1_dir |
| 469 | + |
| 470 | + status('*** Building instrumented clang...') |
| 471 | + instrumented_out, profile_dir = _build_instrumented_clang(env, stage1_out) |
| 472 | + status('*** Running profdata benchmarks...') |
| 473 | + _run_benchmark(env, instrumented_out, args.include_debug_info) |
| 474 | + status('*** Generating profile...') |
| 475 | + _generate_instrumented_clang_profile(env, stage1_out, profile_dir, |
| 476 | + args.profile_location) |
| 477 | + |
| 478 | + print('Final profile:', args.profile_location) |
| 479 | + if args.do_optimized_build: |
| 480 | + status('*** Building PGO-optimized binaries...') |
| 481 | + optimized_out = _build_optimized_clang(env, stage1_out, |
| 482 | + args.profile_location) |
| 483 | + print('Final build directory:', optimized_out) |
| 484 | + |
| 485 | + |
| 486 | +if __name__ == '__main__': |
| 487 | + _main() |
0 commit comments