Index: clang/docs/ClangCommandLineReference.rst =================================================================== --- clang/docs/ClangCommandLineReference.rst +++ clang/docs/ClangCommandLineReference.rst @@ -1331,6 +1331,10 @@ .. option:: -fautolink, -fno-autolink +.. option:: -fbasic-block-sections=labels, -fbasic-block-sections=all, -fbasic-block-sections=list=<arg>, -fbasic-block-sections=none + +Generate labels for each basic block or place each basic block or a subset of basic blocks in its own section + .. option:: -fblocks, -fno-blocks Enable the 'blocks' language feature Index: clang/docs/UsersManual.rst =================================================================== --- clang/docs/UsersManual.rst +++ clang/docs/UsersManual.rst @@ -1698,6 +1698,16 @@ $ cd $P/bar && clang -c -funique-internal-linkage-names name_conflict.c $ cd $P && clang foo/name_conflict.o && bar/name_conflict.o +**-fbasic-block-sections=[labels, all, list=<arg>, none]** + + Controls whether Clang emits a label for each basic block. Further, with + values "all" and "list=arg", each basic block or a subset of basic blocks + can be placed in its own unique section. + + Basic block sections allow the linker to reorder basic blocks and enable + link-time optimizations like whole program inter-procedural basic block + reordering. + Profile Guided Optimization --------------------------- Index: clang/include/clang/Basic/CodeGenOptions.h =================================================================== --- clang/include/clang/Basic/CodeGenOptions.h +++ clang/include/clang/Basic/CodeGenOptions.h @@ -110,6 +110,22 @@ Embed_Marker // Embed a marker as a placeholder for bitcode. }; + // This field stores one of the allowed values for the option + // -fbasic-block-sections=. The allowed values with this option are: + // {"labels", "all", "list=<file>", "none"}. + // + // "labels": Only generate basic block symbols (labels) for all basic + // blocks, do not generate unique sections for basic blocks. 
+ // Use the machine basic block id in the symbol name to + // associate profile info from virtual address to machine + // basic block. + // "all" : Generate basic block sections for all basic blocks. + // "list=<file>": Generate basic block sections for a subset of basic blocks. + // The functions and the machine basic block ids are specified + // in the file. + // "none": Disable sections/labels for basic blocks. + std::string BBSections; + enum class FramePointerKind { None, // Omit all frame pointers. NonLeaf, // Keep non-leaf frame pointers. Index: clang/include/clang/Basic/CodeGenOptions.def =================================================================== --- clang/include/clang/Basic/CodeGenOptions.def +++ clang/include/clang/Basic/CodeGenOptions.def @@ -46,6 +46,9 @@ ///< aliases to base ctors when possible. CODEGENOPT(DataSections , 1, 0) ///< Set when -fdata-sections is enabled. CODEGENOPT(UniqueSectionNames, 1, 1) ///< Set for -funique-section-names. +CODEGENOPT(UniqueBasicBlockSectionNames, 1, 1) ///< Set for -funique-basic-block-section-names, + ///< Produce unique section names with + ///< basic block sections. ENUM_CODEGENOPT(FramePointer, FramePointerKind, 2, FramePointerKind::None) /// frame-pointer: all,non-leaf,none CODEGENOPT(DisableFree , 1, 0) ///< Don't free memory. 
Index: clang/include/clang/Driver/Options.td =================================================================== --- clang/include/clang/Driver/Options.td +++ clang/include/clang/Driver/Options.td @@ -1988,6 +1988,9 @@ Flags<[CC1Option]>, HelpText<"Place each function in its own section">; def fno_function_sections : Flag<["-"], "fno-function-sections">, Group<f_Group>; +def fbasic_block_sections_EQ : Joined<["-"], "fbasic-block-sections=">, Group<f_Group>, + Flags<[CC1Option, CC1AsOption]>, + HelpText<"Place each function's basic blocks in unique sections (ELF Only) : all | labels | none | list=<file>">; def fdata_sections : Flag <["-"], "fdata-sections">, Group<f_Group>, Flags<[CC1Option]>, HelpText<"Place each data in its own section">; def fno_data_sections : Flag <["-"], "fno-data-sections">, Group<f_Group>; @@ -2002,6 +2005,12 @@ def fno_unique_section_names : Flag <["-"], "fno-unique-section-names">, Group<f_Group>, Flags<[CC1Option]>; +def funique_basic_block_section_names : Flag <["-"], "funique-basic-block-section-names">, + Group<f_Group>, Flags<[CC1Option]>, + HelpText<"Use unique names for basic block sections (ELF Only)">; +def fno_unique_basic_block_section_names : Flag <["-"], "fno-unique-basic-block-section-names">, + Group<f_Group>; + def funique_internal_linkage_names : Flag <["-"], "funique-internal-linkage-names">, Group<f_Group>, Flags<[CC1Option]>, HelpText<"Uniqueify Internal Linkage Symbol Names by appending the MD5 hash of the module path">; Index: clang/lib/CodeGen/BackendUtil.cpp =================================================================== --- clang/lib/CodeGen/BackendUtil.cpp +++ clang/lib/CodeGen/BackendUtil.cpp @@ -487,9 +487,30 @@ Options.NoZerosInBSS = CodeGenOpts.NoZeroInitializedInBSS; Options.UnsafeFPMath = CodeGenOpts.UnsafeFPMath; Options.StackAlignmentOverride = CodeGenOpts.StackAlignment; + + Options.BBSections = + llvm::StringSwitch<llvm::BasicBlockSection>(CodeGenOpts.BBSections) + .Case("all", llvm::BasicBlockSection::All) + .Case("labels", llvm::BasicBlockSection::Labels) + .StartsWith("list=", 
llvm::BasicBlockSection::List) + .Case("none", llvm::BasicBlockSection::None) + .Default(llvm::BasicBlockSection::None); + + if (Options.BBSections == llvm::BasicBlockSection::List) { + ErrorOr<std::unique_ptr<MemoryBuffer>> MBOrErr = + MemoryBuffer::getFile(CodeGenOpts.BBSections.substr(5)); + if (!MBOrErr) + errs() << "Error loading basic block sections function list file: " + << MBOrErr.getError().message() << "\n"; + else + Options.BBSectionsFuncListBuf = std::move(*MBOrErr); + } + Options.FunctionSections = CodeGenOpts.FunctionSections; Options.DataSections = CodeGenOpts.DataSections; Options.UniqueSectionNames = CodeGenOpts.UniqueSectionNames; + Options.UniqueBasicBlockSectionNames = + CodeGenOpts.UniqueBasicBlockSectionNames; Options.TLSSize = CodeGenOpts.TLSSize; Options.EmulatedTLS = CodeGenOpts.EmulatedTLS; Options.ExplicitEmulatedTLS = CodeGenOpts.ExplicitEmulatedTLS; Index: clang/lib/Driver/ToolChains/Clang.cpp =================================================================== --- clang/lib/Driver/ToolChains/Clang.cpp +++ clang/lib/Driver/ToolChains/Clang.cpp @@ -4252,10 +4252,13 @@ options::OPT_fno_function_sections, options::OPT_fdata_sections, options::OPT_fno_data_sections, + options::OPT_fbasic_block_sections_EQ, options::OPT_funique_internal_linkage_names, options::OPT_fno_unique_internal_linkage_names, options::OPT_funique_section_names, options::OPT_fno_unique_section_names, + options::OPT_funique_basic_block_section_names, + options::OPT_fno_unique_basic_block_section_names, options::OPT_mrestrict_it, options::OPT_mno_restrict_it, options::OPT_mstackrealign, @@ -4871,6 +4874,16 @@ CmdArgs.push_back("-ffunction-sections"); } + if (Arg *A = Args.getLastArg(options::OPT_fbasic_block_sections_EQ)) { + StringRef Val = A->getValue(); + if (Val != "all" && Val != "labels" && Val != "none" && + !(Val.startswith("list=") && llvm::sys::fs::exists(Val.substr(5)))) + D.Diag(diag::err_drv_invalid_value) + << A->getAsString(Args) << A->getValue(); + else + A->render(Args, CmdArgs); + } 
+ if (Args.hasFlag(options::OPT_fdata_sections, options::OPT_fno_data_sections, UseSeparateSections)) { CmdArgs.push_back("-fdata-sections"); @@ -4884,6 +4897,10 @@ options::OPT_fno_unique_internal_linkage_names, false)) CmdArgs.push_back("-funique-internal-linkage-names"); + if (Args.hasFlag(options::OPT_funique_basic_block_section_names, + options::OPT_fno_unique_basic_block_section_names, false)) + CmdArgs.push_back("-funique-basic-block-section-names"); + Args.AddLastArg(CmdArgs, options::OPT_finstrument_functions, options::OPT_finstrument_functions_after_inlining, options::OPT_finstrument_function_entry_bare); Index: clang/lib/Frontend/CompilerInvocation.cpp =================================================================== --- clang/lib/Frontend/CompilerInvocation.cpp +++ clang/lib/Frontend/CompilerInvocation.cpp @@ -953,10 +953,19 @@ Opts.TrapFuncName = std::string(Args.getLastArgValue(OPT_ftrap_function_EQ)); Opts.UseInitArray = !Args.hasArg(OPT_fno_use_init_array); - Opts.FunctionSections = Args.hasArg(OPT_ffunction_sections); + Opts.BBSections = + std::string(Args.getLastArgValue(OPT_fbasic_block_sections_EQ, "none")); + + // Basic Block Sections implies Function Sections. 
+ Opts.FunctionSections = + Args.hasArg(OPT_ffunction_sections) || + (Opts.BBSections != "none" && Opts.BBSections != "labels"); + Opts.DataSections = Args.hasArg(OPT_fdata_sections); Opts.StackSizeSection = Args.hasArg(OPT_fstack_size_section); Opts.UniqueSectionNames = !Args.hasArg(OPT_fno_unique_section_names); + Opts.UniqueBasicBlockSectionNames = + Args.hasArg(OPT_funique_basic_block_section_names); Opts.UniqueInternalLinkageNames = Args.hasArg(OPT_funique_internal_linkage_names); Index: clang/test/CodeGen/basic-block-sections.c =================================================================== --- /dev/null +++ clang/test/CodeGen/basic-block-sections.c @@ -0,0 +1,47 @@ +// REQUIRES: x86-registered-target + +// RUN: %clang_cc1 -triple x86_64-pc-linux-gnu -S -o - < %s | FileCheck %s --check-prefix=PLAIN +// RUN: %clang_cc1 -triple x86_64-pc-linux-gnu -S -fbasic-block-sections=all -fbasic-block-sections=none -o - < %s | FileCheck %s --check-prefix=PLAIN + +// RUN: %clang_cc1 -triple x86_64-pc-linux-gnu -S -fbasic-block-sections=labels -o - < %s | FileCheck %s --check-prefix=BB_LABELS +// RUN: %clang_cc1 -triple x86_64-pc-linux-gnu -S -fbasic-block-sections=all -o - < %s | FileCheck %s --check-prefix=BB_WORLD --check-prefix=BB_ALL +// RUN: %clang_cc1 -triple x86_64-pc-linux-gnu -S -fbasic-block-sections=list=%S/basic-block-sections.funcnames -o - < %s | FileCheck %s --check-prefix=BB_WORLD --check-prefix=BB_LIST +// RUN: %clang_cc1 -triple x86_64-pc-linux-gnu -S -fbasic-block-sections=all -funique-basic-block-section-names -o - < %s | FileCheck %s --check-prefix=UNIQUE + +int world(int a) { + if (a > 10) + return 10; + else if (a > 5) + return 5; + else + return 0; +} + +int another(int a) { + if (a > 10) + return 20; + return 0; +} + +// PLAIN-NOT: section +// PLAIN: world: +// +// BB_LABELS-NOT: section +// BB_LABELS: world: +// BB_LABELS: a.BB.world: +// BB_LABELS: aa.BB.world: +// BB_LABELS: a.BB.another: +// +// BB_WORLD: .section 
.text.world,"ax",@progbits{{$}} +// BB_WORLD: world: +// BB_WORLD: .section .text.world,"ax",@progbits,unique +// BB_WORLD: world.1: +// BB_WORLD: .section .text.another,"ax",@progbits +// BB_ALL: .section .text.another,"ax",@progbits,unique +// BB_ALL: another.1: +// BB_LIST-NOT: .section .text.another,"ax",@progbits,unique +// BB_LIST: another: +// BB_LIST-NOT: another.1: +// +// UNIQUE: .section .text.world.world.1, +// UNIQUE: .section .text.another.another.1, Index: clang/test/CodeGen/basic-block-sections.funcnames =================================================================== --- /dev/null +++ clang/test/CodeGen/basic-block-sections.funcnames @@ -0,0 +1 @@ +!world Index: clang/test/Driver/fbasic-block-sections.c =================================================================== --- /dev/null +++ clang/test/Driver/fbasic-block-sections.c @@ -0,0 +1,9 @@ +// RUN: %clang -### -fbasic-block-sections=none %s -S 2>&1 | FileCheck -check-prefix=CHECK-OPT-NONE %s +// RUN: %clang -### -fbasic-block-sections=all %s -S 2>&1 | FileCheck -check-prefix=CHECK-OPT-ALL %s +// RUN: %clang -### -fbasic-block-sections=list=%s %s -S 2>&1 | FileCheck -check-prefix=CHECK-OPT-LIST %s +// RUN: %clang -### -fbasic-block-sections=labels %s -S 2>&1 | FileCheck -check-prefix=CHECK-OPT-LABELS %s +// +// CHECK-OPT-NONE: "-fbasic-block-sections=none" +// CHECK-OPT-ALL: "-fbasic-block-sections=all" +// CHECK-OPT-LIST: "-fbasic-block-sections={{[^ ]*}}fbasic-block-sections.c" +// CHECK-OPT-LABELS: "-fbasic-block-sections=labels" Index: clang/test/Driver/funique-basic-block-section-names.c =================================================================== --- /dev/null +++ clang/test/Driver/funique-basic-block-section-names.c @@ -0,0 +1,4 @@ +// RUN: %clang -### -funique-basic-block-section-names %s -S 2>&1 | FileCheck -check-prefix=CHECK-OPT %s +// RUN: %clang -### -funique-basic-block-section-names -fno-unique-basic-block-section-names %s -S 2>&1 | FileCheck -check-prefix=CHECK-NOOPT 
%s +// CHECK-OPT: "-funique-basic-block-section-names" +// CHECK-NOOPT-NOT: "-funique-basic-block-section-names" Index: lld/ELF/Config.h =================================================================== --- lld/ELF/Config.h +++ lld/ELF/Config.h @@ -169,7 +169,7 @@ bool ltoDebugPassManager; bool ltoEmitAsm; bool ltoNewPassManager; - bool ltoUniqueBBSectionNames; + bool ltoUniqueBasicBlockSectionNames; bool ltoWholeProgramVisibility; bool mergeArmExidx; bool mipsN32Abi = false; Index: lld/ELF/Driver.cpp =================================================================== --- lld/ELF/Driver.cpp +++ lld/ELF/Driver.cpp @@ -930,7 +930,7 @@ config->ltoSampleProfile = args.getLastArgValue(OPT_lto_sample_profile); config->ltoBasicBlockSections = args.getLastArgValue(OPT_lto_basicblock_sections); - config->ltoUniqueBBSectionNames = + config->ltoUniqueBasicBlockSectionNames = args.hasFlag(OPT_lto_unique_bb_section_names, OPT_no_lto_unique_bb_section_names, false); config->mapFile = args.getLastArgValue(OPT_Map); Index: lld/ELF/LTO.cpp =================================================================== --- lld/ELF/LTO.cpp +++ lld/ELF/LTO.cpp @@ -79,7 +79,7 @@ // Check if basic block sections must be used. // Allowed values for --lto-basicblock-sections are "all", "labels", // "<file name specifying basic block ids>", or none. This is the equivalent - // of -fbasicblock-sections= flag in clang. + // of -fbasic-block-sections= flag in clang. 
if (!config->ltoBasicBlockSections.empty()) { if (config->ltoBasicBlockSections == "all") { c.Options.BBSections = BasicBlockSection::All; @@ -100,7 +100,8 @@ } } - c.Options.UniqueBBSectionNames = config->ltoUniqueBBSectionNames; + c.Options.UniqueBasicBlockSectionNames = + config->ltoUniqueBasicBlockSectionNames; if (auto relocModel = getRelocModelFromCMModel()) c.RelocModel = *relocModel; Index: llvm/include/llvm/CodeGen/CommandFlags.h =================================================================== --- llvm/include/llvm/CodeGen/CommandFlags.h +++ llvm/include/llvm/CodeGen/CommandFlags.h @@ -104,7 +104,7 @@ bool getUniqueSectionNames(); -bool getUniqueBBSectionNames(); +bool getUniqueBasicBlockSectionNames(); llvm::EABI getEABIVersion(); Index: llvm/include/llvm/CodeGen/Passes.h =================================================================== --- llvm/include/llvm/CodeGen/Passes.h +++ llvm/include/llvm/CodeGen/Passes.h @@ -44,7 +44,7 @@ FunctionPass *createUnreachableBlockEliminationPass(); /// createBBSectionsPrepare Pass - This pass assigns sections to machine basic - /// blocks and is enabled with -fbasicblock-sections. + /// blocks and is enabled with -fbasic-block-sections. /// Buf is a memory buffer that contains the list of functions and basic /// block ids to selectively enable basic block sections. MachineFunctionPass *createBBSectionsPreparePass(const MemoryBuffer *Buf); Index: llvm/include/llvm/Target/TargetMachine.h =================================================================== --- llvm/include/llvm/Target/TargetMachine.h +++ llvm/include/llvm/Target/TargetMachine.h @@ -246,7 +246,9 @@ bool getUniqueSectionNames() const { return Options.UniqueSectionNames; } /// Return true if unique basic block section names must be generated. 
- bool getUniqueBBSectionNames() const { return Options.UniqueBBSectionNames; } + bool getUniqueBasicBlockSectionNames() const { + return Options.UniqueBasicBlockSectionNames; + } /// Return true if data objects should be emitted into their own section, /// corresponds to -fdata-sections. @@ -261,7 +263,7 @@ } /// If basic blocks should be emitted into their own section, - /// corresponding to -fbasicblock-sections. + /// corresponding to -fbasic-block-sections. llvm::BasicBlockSection getBBSectionsType() const { return Options.BBSections; } Index: llvm/include/llvm/Target/TargetOptions.h =================================================================== --- llvm/include/llvm/Target/TargetOptions.h +++ llvm/include/llvm/Target/TargetOptions.h @@ -121,7 +121,7 @@ EnableFastISel(false), EnableGlobalISel(false), UseInitArray(false), DisableIntegratedAS(false), RelaxELFRelocations(false), FunctionSections(false), DataSections(false), - UniqueSectionNames(true), UniqueBBSectionNames(false), + UniqueSectionNames(true), UniqueBasicBlockSectionNames(false), TrapUnreachable(false), NoTrapAfterNoreturn(false), TLSSize(0), EmulatedTLS(false), ExplicitEmulatedTLS(false), EnableIPRA(false), EmitStackSizeSection(false), EnableMachineOutliner(false), @@ -234,7 +234,7 @@ unsigned UniqueSectionNames : 1; /// Use unique names for basic block sections. - unsigned UniqueBBSectionNames : 1; + unsigned UniqueBasicBlockSectionNames : 1; /// Emit target-specific trap instruction for 'unreachable' IR instructions. unsigned TrapUnreachable : 1; Index: llvm/lib/CodeGen/BBSectionsPrepare.cpp =================================================================== --- llvm/lib/CodeGen/BBSectionsPrepare.cpp +++ llvm/lib/CodeGen/BBSectionsPrepare.cpp @@ -9,15 +9,15 @@ // BBSectionsPrepare implementation. // // The purpose of this pass is to assign sections to basic blocks when -// -fbasicblock-sections= option is used. 
Further, with profile information only -// the subset of basic blocks with profiles are placed in separate sections and -// the rest are grouped in a cold section. The exception handling blocks are +// -fbasic-block-sections= option is used. Further, with profile information +// only the subset of basic blocks with profiles are placed in separate sections +// and the rest are grouped in a cold section. The exception handling blocks are // treated specially to ensure they are all in one seciton. // // Basic Block Sections // ==================== // -// With option, -fbasicblock-sections=list, every function may be split into +// With option, -fbasic-block-sections=list, every function may be split into // clusters of basic blocks. Every cluster will be emitted into a separate // section with its basic blocks sequenced in the given order. To get the // optimized performance, the clusters must form an optimal BB layout for the @@ -48,7 +48,7 @@ // Basic Block Labels // ================== // -// With -fbasicblock-sections=labels, or when a basic block is placed in a +// With -fbasic-block-sections=labels, or when a basic block is placed in a // unique section, it is labelled with a symbol. This allows easy mapping of // virtual addresses from PMU profiles back to the corresponding basic blocks. 
// Since the number of basic blocks is large, the labeling bloats the symbol Index: llvm/lib/CodeGen/CommandFlags.cpp =================================================================== --- llvm/lib/CodeGen/CommandFlags.cpp +++ llvm/lib/CodeGen/CommandFlags.cpp @@ -74,7 +74,7 @@ CGOPT(unsigned, TLSSize) CGOPT(bool, EmulatedTLS) CGOPT(bool, UniqueSectionNames) -CGOPT(bool, UniqueBBSectionNames) +CGOPT(bool, UniqueBasicBlockSectionNames) CGOPT(EABI, EABIVersion) CGOPT(DebuggerKind, DebuggerTuningOpt) CGOPT(bool, EnableStackSizeSection) @@ -346,11 +346,11 @@ cl::init(true)); CGBINDOPT(UniqueSectionNames); - static cl::opt<bool> UniqueBBSectionNames( + static cl::opt<bool> UniqueBasicBlockSectionNames( "unique-bb-section-names", cl::desc("Give unique names to every basic block section"), cl::init(false)); - CGBINDOPT(UniqueBBSectionNames); + CGBINDOPT(UniqueBasicBlockSectionNames); static cl::opt<llvm::EABI> EABIVersion( "meabi", cl::desc("Set EABI type (default depends on triple):"), @@ -456,7 +456,7 @@ Options.FunctionSections = getFunctionSections(); Options.BBSections = getBBSectionsMode(Options); Options.UniqueSectionNames = getUniqueSectionNames(); - Options.UniqueBBSectionNames = getUniqueBBSectionNames(); + Options.UniqueBasicBlockSectionNames = getUniqueBasicBlockSectionNames(); Options.TLSSize = getTLSSize(); Options.EmulatedTLS = getEmulatedTLS(); Options.ExplicitEmulatedTLS = EmulatedTLSView->getNumOccurrences() > 0; Index: llvm/lib/CodeGen/MachineFunction.cpp =================================================================== --- llvm/lib/CodeGen/MachineFunction.cpp +++ llvm/lib/CodeGen/MachineFunction.cpp @@ -340,7 +340,7 @@ MBBNumbering.resize(BlockNo); } -/// This is used with -fbasicblock-sections or -fbasicblock-labels option. +/// This is used with the -fbasic-block-sections= option, including its "labels" mode. /// A unary encoding of basic block labels is done to keep ".strtab" sizes /// small. 
void MachineFunction::createBBLabels() { Index: llvm/lib/CodeGen/TargetLoweringObjectFileImpl.cpp =================================================================== --- llvm/lib/CodeGen/TargetLoweringObjectFileImpl.cpp +++ llvm/lib/CodeGen/TargetLoweringObjectFileImpl.cpp @@ -875,7 +875,7 @@ Name += MBB.getParent()->getName(); } else { Name += MBB.getParent()->getSection()->getName(); - if (TM.getUniqueBBSectionNames()) { + if (TM.getUniqueBasicBlockSectionNames()) { Name += "."; Name += MBB.getSymbol()->getName(); } else {