Diff 263783

llvm/lib/Transforms/IPO/OpenMPOpt.cpp

Show All 12 Lines
//===----------------------------------------------------------------------===//		//===----------------------------------------------------------------------===//

#include "llvm/Transforms/IPO/OpenMPOpt.h"		#include "llvm/Transforms/IPO/OpenMPOpt.h"

#include "llvm/ADT/EnumeratedArray.h"		#include "llvm/ADT/EnumeratedArray.h"
#include "llvm/ADT/Statistic.h"		#include "llvm/ADT/Statistic.h"
#include "llvm/Analysis/CallGraph.h"		#include "llvm/Analysis/CallGraph.h"
#include "llvm/Analysis/CallGraphSCCPass.h"		#include "llvm/Analysis/CallGraphSCCPass.h"
		#include "llvm/Analysis/OptimizationRemarkEmitter.h"
#include "llvm/Frontend/OpenMP/OMPConstants.h"		#include "llvm/Frontend/OpenMP/OMPConstants.h"
#include "llvm/Frontend/OpenMP/OMPIRBuilder.h"		#include "llvm/Frontend/OpenMP/OMPIRBuilder.h"
#include "llvm/InitializePasses.h"		#include "llvm/InitializePasses.h"
#include "llvm/Support/CommandLine.h"		#include "llvm/Support/CommandLine.h"
#include "llvm/Transforms/IPO.h"		#include "llvm/Transforms/IPO.h"
#include "llvm/Transforms/Utils/CallGraphUpdater.h"		#include "llvm/Transforms/Utils/CallGraphUpdater.h"

using namespace llvm;		using namespace llvm;
		jdoerfertUnsubmitted Not Done Reply Inline Actions Nit: probably not needed. jdoerfert: Nit: probably not needed.
using namespace omp;		using namespace omp;
using namespace types;		using namespace types;

#define DEBUG_TYPE "openmp-opt"		#define DEBUG_TYPE "openmp-opt"

static cl::opt<bool> DisableOpenMPOptimizations(		static cl::opt<bool> DisableOpenMPOptimizations(
"openmp-opt-disable", cl::ZeroOrMore,		"openmp-opt-disable", cl::ZeroOrMore,
cl::desc("Disable OpenMP specific optimizations."), cl::Hidden,		cl::desc("Disable OpenMP specific optimizations."), cl::Hidden,
cl::init(false));		cl::init(false));

STATISTIC(NumOpenMPRuntimeCallsDeduplicated,		STATISTIC(NumOpenMPRuntimeCallsDeduplicated,
"Number of OpenMP runtime calls deduplicated");		"Number of OpenMP runtime calls deduplicated");
STATISTIC(NumOpenMPRuntimeFunctionsIdentified,		STATISTIC(NumOpenMPRuntimeFunctionsIdentified,
"Number of OpenMP runtime functions identified");		"Number of OpenMP runtime functions identified");
STATISTIC(NumOpenMPRuntimeFunctionUsesIdentified,		STATISTIC(NumOpenMPRuntimeFunctionUsesIdentified,
"Number of OpenMP runtime function uses identified");		"Number of OpenMP runtime function uses identified");

#if !defined(NDEBUG)		#if !defined(NDEBUG)
static constexpr auto TAG = "[" DEBUG_TYPE "]";		static constexpr auto TAG = "[" DEBUG_TYPE "]";
#endif		#endif

namespace {		namespace {
struct OpenMPOpt {		struct OpenMPOpt {

		using OptimizationRemarkGetter =
		function_ref<OptimizationRemarkEmitter &(Function *)>;

OpenMPOpt(SmallVectorImpl<Function *> &SCC,		OpenMPOpt(SmallVectorImpl<Function *> &SCC,
SmallPtrSetImpl<Function *> &ModuleSlice,		SmallPtrSetImpl<Function *> &ModuleSlice,
CallGraphUpdater &CGUpdater)		CallGraphUpdater &CGUpdater, OptimizationRemarkGetter OREGetter)
: M((SCC.begin())->getParent()), SCC(SCC), ModuleSlice(ModuleSlice),		: M((SCC.begin())->getParent()), SCC(SCC), ModuleSlice(ModuleSlice),
		jdoerfertUnsubmitted Not Done Reply Inline Actions Just copy the getter (=function_ref) jdoerfert: Just copy the getter (=function_ref)
OMPBuilder(M), CGUpdater(CGUpdater) {		OMPBuilder(M), CGUpdater(CGUpdater), OREGetter(OREGetter) {
initializeTypes(M);		initializeTypes(M);
initializeRuntimeFunctions();		initializeRuntimeFunctions();
OMPBuilder.initialize();		OMPBuilder.initialize();
}		}

/// Generic information that describes a runtime function		/// Generic information that describes a runtime function
struct RuntimeFunctionInfo {		struct RuntimeFunctionInfo {

▲ Show 20 Lines • Show All 107 Lines • ▼ Show 20 Lines	auto DeleteCallCB = [&](Use &U, Function &) {
return false;		return false;
if (!Fn->onlyReadsMemory())		if (!Fn->onlyReadsMemory())
return false;		return false;
if (!Fn->hasFnAttribute(Attribute::WillReturn))		if (!Fn->hasFnAttribute(Attribute::WillReturn))
return false;		return false;

LLVM_DEBUG(dbgs() << TAG << "Delete read-only parallel region in "		LLVM_DEBUG(dbgs() << TAG << "Delete read-only parallel region in "
<< CI->getCaller()->getName() << "\n");		<< CI->getCaller()->getName() << "\n");

		auto Remark = [&](OptimizationRemark OR) {
		return OR << "Parallel region in "
		<< ore::NV("OpenMPParallelDelete", CI->getCaller()->getName())
		<< " deleted";
		};
		emitRemark<OptimizationRemark>(CI, "OpenMPParallelRegionDeletion",
		Remark);

CGUpdater.removeCallSite(*CI);		CGUpdater.removeCallSite(*CI);
CI->eraseFromParent();		CI->eraseFromParent();
Changed = true;		Changed = true;
return true;		return true;
};		};

RFI.foreachUse(DeleteCallCB);		RFI.foreachUse(DeleteCallCB);

▲ Show 20 Lines • Show All 123 Lines • ▼ Show 20 Lines	auto CanBeMoved = [](CallBase &CB) {
return true;		return true;
};		};

if (!ReplVal) {		if (!ReplVal) {
for (Use U : UV)		for (Use U : UV)
if (CallInst CI = getCallIfRegularCall(U, &RFI)) {		if (CallInst CI = getCallIfRegularCall(U, &RFI)) {
if (!CanBeMoved(*CI))		if (!CanBeMoved(*CI))
continue;		continue;

		auto Remark = [&](OptimizationRemark OR) {
		auto newLoc = &*F.getEntryBlock().getFirstInsertionPt();
		return OR << "OpenMP runtime call "
		hfinkelUnsubmitted Not Done Reply Inline Actions Why doesn't RFI.Name have a ore::NV field name. Tools might certainly be interested in what functions are being optimized. hfinkel: Why doesn't RFI.Name have a ore::NV field name. Tools might certainly be interested in what…
		<< ore::NV("OpenMPOptRuntime", RFI.Name) << " moved to "
		<< ore::NV("OpenMPRuntimeMoves", newLoc->getDebugLoc());
		};
		emitRemark<OptimizationRemark>(CI, "OpenMPRuntimeCodeMotion", Remark);

CI->moveBefore(&*F.getEntryBlock().getFirstInsertionPt());		CI->moveBefore(&*F.getEntryBlock().getFirstInsertionPt());
ReplVal = CI;		ReplVal = CI;
break;		break;
}		}
if (!ReplVal)		if (!ReplVal)
return false;		return false;
}		}

Show All 10 Lines	bool deduplicateRuntimeCalls(Function &F, RuntimeFunctionInfo &RFI,
}		}

bool Changed = false;		bool Changed = false;
auto ReplaceAndDeleteCB = [&](Use &U, Function &Caller) {		auto ReplaceAndDeleteCB = [&](Use &U, Function &Caller) {
CallInst *CI = getCallIfRegularCall(U, &RFI);		CallInst *CI = getCallIfRegularCall(U, &RFI);
if (!CI \|\| CI == ReplVal \|\| &F != &Caller)		if (!CI \|\| CI == ReplVal \|\| &F != &Caller)
return false;		return false;
assert(CI->getCaller() == &F && "Unexpected call!");		assert(CI->getCaller() == &F && "Unexpected call!");

		auto Remark = [&](OptimizationRemark OR) {
		return OR << "OpenMP runtime call "
		hfinkelUnsubmitted Not Done Reply Inline Actions Same here: a NV for RFI.Name seems useful. hfinkel: Same here: a NV for RFI.Name seems useful.
		<< ore::NV("OpenMPOptRuntime", RFI.Name) << " deduplicated";
		};
		emitRemark<OptimizationRemark>(CI, "OpenMPRuntimeDeduplicated", Remark);

CGUpdater.removeCallSite(*CI);		CGUpdater.removeCallSite(*CI);
CI->replaceAllUsesWith(ReplVal);		CI->replaceAllUsesWith(ReplVal);
CI->eraseFromParent();		CI->eraseFromParent();
++NumOpenMPRuntimeCallsDeduplicated;		++NumOpenMPRuntimeCallsDeduplicated;
Changed = true;		Changed = true;
return true;		return true;
};		};
RFI.foreachUse(ReplaceAndDeleteCB);		RFI.foreachUse(ReplaceAndDeleteCB);
▲ Show 20 Lines • Show All 149 Lines • ▼ Show 20 Lines	if (declMatchesRTFTypes(F, _ReturnType, ArgsTypes)) { \
}); \		}); \
} \		} \
}		}
#include "llvm/Frontend/OpenMP/OMPKinds.def"		#include "llvm/Frontend/OpenMP/OMPKinds.def"

// TODO: We should attach the attributes defined in OMPKinds.def.		// TODO: We should attach the attributes defined in OMPKinds.def.
}		}

		/// Emit a remark generically
		///
		/// This template function can be used to generically emit a remark. The
		/// RemarkKind should be one of the following:
		/// - OptimizationRemark to indicate a successful optimization attempt
		/// - OptimizationRemarkMissed to report a failed optimization attempt
		/// - OptimizationRemarkAnalysis to provide additional information about an
		/// optimization attempt
		///
		/// The remark is built using a callback function provided by the caller that
		/// takes a RemarkKind as input and returns a RemarkKind.
		template <typename RemarkKind,
		typename RemarkCallBack = function_ref<RemarkKind(RemarkKind &&)>>
		void emitRemark(Instruction *Inst, StringRef RemarkName,
		RemarkCallBack &&RemarkCB) {
		Function *F = Inst->getParent()->getParent();
		auto &ORE = OREGetter(F);

		ORE.emit([&]() {
		return RemarkCB(RemarkKind(DEBUG_TYPE, RemarkName, Inst));
		});
		jdoerfertUnsubmitted Not Done Reply Inline Actions Nit: getFunction() auto & or auto , please. Do you need a default for the callback type? jdoerfert:* Nit: getFunction() auto & or auto *, please. Do you need a default for the callback type?
		jhuber6AuthorUnsubmitted Done Reply Inline Actions I changed the OREGetter to return a reference. I'm not exactly sure what you mean by default for the callback type. Do you mean a default implementation or are you talking about just the template parameter. jhuber6: I changed the OREGetter to return a reference. I'm not exactly sure what you mean by default…
		jdoerfertUnsubmitted Not Done Reply Inline Actions The latter. Doesn't this work: template <typename RemarkKind, typename RemarkCallBack> jdoerfert: The latter. Doesn't this work: ``` template <typename RemarkKind, typename RemarkCallBack> ```
		jhuber6AuthorUnsubmitted Done Reply Inline Actions I was just using that template to rename the type inside the function. I was pretty much just using it as this: using RemarkCallBack = function_ref<RemarkKind(RemarkKind &&)>>; Should I change that? jhuber6: I was just using that template to rename the type inside the function. I was pretty much just…
		jdoerfertUnsubmitted Not Done Reply Inline Actions I don't get the last comment but I guess we can just leave it as is. jdoerfert: I don't get the last comment but I guess we can just leave it as is.
		}

/// The underyling module.		/// The underyling module.
Module &M;		Module &M;

/// The SCC we are operating on.		/// The SCC we are operating on.
SmallVectorImpl<Function *> &SCC;		SmallVectorImpl<Function *> &SCC;

/// The slice of the module we are allowed to look at.		/// The slice of the module we are allowed to look at.
SmallPtrSetImpl<Function *> &ModuleSlice;		SmallPtrSetImpl<Function *> &ModuleSlice;

/// An OpenMP-IR-Builder instance		/// An OpenMP-IR-Builder instance
OpenMPIRBuilder OMPBuilder;		OpenMPIRBuilder OMPBuilder;

/// Callback to update the call graph, the first argument is a removed call,		/// Callback to update the call graph, the first argument is a removed call,
/// the second an optional replacement call.		/// the second an optional replacement call.
CallGraphUpdater &CGUpdater;		CallGraphUpdater &CGUpdater;

		/// Callback to get an OptimizationRemarkEmitter from a Function *
		OptimizationRemarkGetter OREGetter;

/// Map from runtime function kind to the runtime function description.		/// Map from runtime function kind to the runtime function description.
EnumeratedArray<RuntimeFunctionInfo, RuntimeFunction,		EnumeratedArray<RuntimeFunctionInfo, RuntimeFunction,
RuntimeFunction::OMPRTL___last>		RuntimeFunction::OMPRTL___last>
RFIs;		RFIs;
};		};
} // namespace		} // namespace

PreservedAnalyses OpenMPOptPass::run(LazyCallGraph::SCC &C,		PreservedAnalyses OpenMPOptPass::run(LazyCallGraph::SCC &C,
Show All 10 Lines	PreservedAnalyses OpenMPOptPass::run(LazyCallGraph::SCC &C,
for (LazyCallGraph::Node &N : C) {		for (LazyCallGraph::Node &N : C) {
SCC.push_back(&N.getFunction());		SCC.push_back(&N.getFunction());
ModuleSlice.insert(SCC.back());		ModuleSlice.insert(SCC.back());
}		}

if (SCC.empty())		if (SCC.empty())
return PreservedAnalyses::all();		return PreservedAnalyses::all();

		auto OREGetter = [&C, &CG, &AM](Function *F) -> OptimizationRemarkEmitter & {
		FunctionAnalysisManager &FAM =
		AM.getResult<FunctionAnalysisManagerCGSCCProxy>(C, CG).getManager();
		return FAM.getResult<OptimizationRemarkEmitterAnalysis>(*F);
		};

		jdoerfertUnsubmitted Not Done Reply Inline Actions I don't think it's a good idea to move the result here. Just return a reference. jdoerfert: I don't think it's a good idea to move the result here. Just return a reference.
		jhuber6AuthorUnsubmitted Done Reply Inline Actions Yeah, I did this initially because I was having issues getting both the legacy and new versions to return a reference without memory leaks so I just did it by returning a unique_ptr. The std::move just cast it to an rvalue to avoid using the deleted constructor in the ORE class. I found another file that did something similar that had a single unique_ptr object to an ORE that's captured by reference. Then you just return a reference to that, so I'll change it to use that method because it's probably much more efficient. jhuber6: Yeah, I did this initially because I was having issues getting both the legacy and new versions…
CallGraphUpdater CGUpdater;		CallGraphUpdater CGUpdater;
CGUpdater.initialize(CG, C, AM, UR);		CGUpdater.initialize(CG, C, AM, UR);
// TODO: Compute the module slice we are allowed to look at.		// TODO: Compute the module slice we are allowed to look at.
OpenMPOpt OMPOpt(SCC, ModuleSlice, CGUpdater);		OpenMPOpt OMPOpt(SCC, ModuleSlice, CGUpdater, OREGetter);
bool Changed = OMPOpt.run();		bool Changed = OMPOpt.run();
(void)Changed;		(void)Changed;
return PreservedAnalyses::all();		return PreservedAnalyses::all();
}		}

namespace {		namespace {

struct OpenMPOptLegacyPass : public CallGraphSCCPass {		struct OpenMPOptLegacyPass : public CallGraphSCCPass {
Show All 31 Lines	for (CallGraphNode *CGN : CGSCC)
}		}

if (SCC.empty())		if (SCC.empty())
return false;		return false;

CallGraph &CG = getAnalysis<CallGraphWrapperPass>().getCallGraph();		CallGraph &CG = getAnalysis<CallGraphWrapperPass>().getCallGraph();
CGUpdater.initialize(CG, CGSCC);		CGUpdater.initialize(CG, CGSCC);

		// Maintain a map of functions to avoid rebuilding the ORE
		DenseMap<Function *, std::unique_ptr<OptimizationRemarkEmitter>> OREMap;
		auto OREGetter = [&OREMap](Function *F) -> OptimizationRemarkEmitter & {
		jdoerfertUnsubmitted Not Done Reply Inline Actions Call getAnalysis here? jdoerfert: Call getAnalysis here?
		jhuber6AuthorUnsubmitted Done Reply Inline Actions I tried using the getAnalysis method but it caused it to seg-fault. I'm not exactly confident why but some other passes generate the ORE this way so I figured it was okay. jhuber6: I tried using the getAnalysis method but it caused it to seg-fault. I'm not exactly confident…
		jdoerfertUnsubmitted Not Done Reply Inline Actions Oh, right. Yeah, so, the old PM CGSCC pass is bad at requiring function passes. Long story short, it doesn't work. We should do what the inliner does, create an ORE whenever we need one for a function. Since we would also like hotness information in the new pass manager (which I think we should get automatically via the pass), we should not always create a new ORE but only in the old PM. That said, the ORE constructor says it can be expensive if hotness filtering is requested as block frequency is computed. Thus, in the old PM we can cache the OREs ourselves. So, we keep a map from function to ORE and in the OREGetter we lookup the ORE, if not there create it, and return it. WDYT? jdoerfert: Oh, right. Yeah, so, the old PM CGSCC pass is bad at requiring function passes. Long story…
		jhuber6AuthorUnsubmitted Done Reply Inline Actions I was thinking about adding a cache previously since the function being worked on might not change often. It might be somewhat difficult to bake that functionality into the callback but I'll see what I can do in the morning. jhuber6: I was thinking about adding a cache previously since the function being worked on might not…
		jhuber6AuthorUnsubmitted Done Reply Inline Actions I just noticed I could probably have used try_emplace() rather than checking and inserting manually. jhuber6: I just noticed I could probably have used try_emplace() rather than checking and inserting…
		std::unique_ptr<OptimizationRemarkEmitter> &ORE = OREMap[F];
		if (!ORE)
		ORE = std::make_unique<OptimizationRemarkEmitter>(F);
		return *ORE;
		jdoerfertUnsubmitted Not Done Reply Inline Actions I usually prefer: std::make_unique<OptimizationRemarkEmitter> &ORE = OREMap[F]; if(!ORE) ORE = ... return ORE; Your code has 3 lookups into the map, mine only one. jdoerfert: I usually prefer: ``` std::make_unique<OptimizationRemarkEmitter> &ORE = OREMap[F]; if(!
		};

// TODO: Compute the module slice we are allowed to look at.		// TODO: Compute the module slice we are allowed to look at.
OpenMPOpt OMPOpt(SCC, ModuleSlice, CGUpdater);		OpenMPOpt OMPOpt(SCC, ModuleSlice, CGUpdater, OREGetter);
return OMPOpt.run();		return OMPOpt.run();
}		}

bool doFinalization(CallGraph &CG) override { return CGUpdater.finalize(); }		bool doFinalization(CallGraph &CG) override { return CGUpdater.finalize(); }
};		};

} // end anonymous namespace		} // end anonymous namespace

Show All 20 Lines

llvm/test/Transforms/OpenMP/deduplication_remarks.ll

This file was added.

				; RUN: opt -openmpopt -pass-remarks=openmp-opt -disable-output < %s 2>&1 \| FileCheck %s
				; RUN: opt -passes=openmpopt -pass-remarks=openmp-opt -disable-output < %s 2>&1 \| FileCheck %s
				; ModuleID = 'deduplication_remarks.c'
				source_filename = "deduplication_remarks.c"
				target datalayout = "e-m:e-p270:32:32-p271:32:32-p272:64:64-i64:64-f80:128-n8:16:32:64-S128"
				target triple = "x86_64-pc-linux-gnu"

				%struct.ident_t = type { i32, i32, i32, i32, i8* }

				@0 = private unnamed_addr global %struct.ident_t { i32 0, i32 34, i32 0, i32 0, i8* getelementptr inbounds ([23 x i8], [23 x i8]* @.str0, i32 0, i32 0) }, align 8
				@.str0 = private unnamed_addr constant [23 x i8] c";unknown;unknown;0;0;;\00", align 1

				; CHECK: remark: deduplication_remarks.c:9:10: OpenMP runtime call __kmpc_global_thread_num moved to deduplication_remarks.c:5:10
				; CHECK: remark: deduplication_remarks.c:7:10: OpenMP runtime call __kmpc_global_thread_num deduplicated
				; CHECK: remark: deduplication_remarks.c:5:10: OpenMP runtime call __kmpc_global_thread_num deduplicated
				define dso_local void @deduplicate() local_unnamed_addr !dbg !14 {
				%1 = tail call i32 @__kmpc_global_thread_num(%struct.ident_t* nonnull @0), !dbg !21
				call void @useI32(i32 %1), !dbg !23
				%2 = tail call i32 @__kmpc_global_thread_num(%struct.ident_t* nonnull @0), !dbg !24
				call void @useI32(i32 %2), !dbg !25
				%3 = tail call i32 @__kmpc_global_thread_num(%struct.ident_t* nonnull @0), !dbg !26
				call void @useI32(i32 %3), !dbg !27
				ret void, !dbg !28
				}

				declare i32 @__kmpc_global_thread_num(%struct.ident_t*)

				declare !dbg !4 void @useI32(i32) local_unnamed_addr

				declare void @llvm.dbg.value(metadata, metadata, metadata)

				!llvm.dbg.cu = !{!0}
				!llvm.module.flags = !{!8, !9, !10, !11, !12}
				!llvm.ident = !{!13}

				!0 = distinct !DICompileUnit(language: DW_LANG_C99, file: !1, producer: "clang version 10.0.0 ", isOptimized: true, runtimeVersion: 0, emissionKind: FullDebug, enums: !2, retainedTypes: !3, splitDebugInlining: false, nameTableKind: None)
				!1 = !DIFile(filename: "deduplication_remarks.c", directory: "/tmp")
				!2 = !{}
				!3 = !{!4}
				!4 = !DISubprogram(name: "useI32", scope: !1, file: !1, line: 1, type: !5, flags: DIFlagPrototyped, spFlags: DISPFlagOptimized, retainedNodes: !2)
				!5 = !DISubroutineType(types: !6)
				!6 = !{null, !7}
				!7 = !DIBasicType(name: "int", size: 32, encoding: DW_ATE_signed)
				!8 = !{i32 7, !"Dwarf Version", i32 4}
				!9 = !{i32 2, !"Debug Info Version", i32 3}
				!10 = !{i32 1, !"wchar_size", i32 4}
				!11 = !{i32 7, !"PIC Level", i32 2}
				!12 = !{i32 7, !"PIE Level", i32 2}
				!13 = !{!"clang version 10.0.0 "}
				!14 = distinct !DISubprogram(name: "deduplicate", scope: !1, file: !1, line: 4, type: !15, scopeLine: 4, flags: DIFlagAllCallsDescribed, spFlags: DISPFlagDefinition \| DISPFlagOptimized, unit: !0, retainedNodes: !17)
				!15 = !DISubroutineType(types: !16)
				!16 = !{null}
				!17 = !{!18, !19, !20}
				!18 = !DILocalVariable(name: "x", scope: !14, file: !1, line: 5, type: !7)
				!19 = !DILocalVariable(name: "y", scope: !14, file: !1, line: 7, type: !7)
				!20 = !DILocalVariable(name: "z", scope: !14, file: !1, line: 9, type: !7)
				!21 = !DILocation(line: 5, column: 10, scope: !14)
				!22 = !DILocation(line: 0, scope: !14)
				!23 = !DILocation(line: 6, column: 2, scope: !14)
				!24 = !DILocation(line: 7, column: 10, scope: !14)
				!25 = !DILocation(line: 8, column: 2, scope: !14)
				!26 = !DILocation(line: 9, column: 10, scope: !14)
				!27 = !DILocation(line: 10, column: 2, scope: !14)
				!28 = !DILocation(line: 13, column: 1, scope: !14)

llvm/test/Transforms/OpenMP/parallel_deletion_remarks.ll

This file was added.

				; RUN: opt -S -pass-remarks=openmp-opt -attributor -openmpopt -disable-output < %s 2>&1 \| FileCheck %s
				; RUN: opt -S -pass-remarks=openmp-opt -passes='attributor,cgscc(openmpopt)' -disable-output < %s 2>&1 \| FileCheck %s
				; ModuleID = 'parallel_deletion_remarks.ll'
				source_filename = "parallel_deletion_remarks.c"
				target datalayout = "e-m:e-p270:32:32-p271:32:32-p272:64:64-i64:64-f80:128-n8:16:32:64-S128"
				target triple = "x86_64-pc-linux-gnu"

				%struct.ident_t = type { i32, i32, i32, i32, i8* }

				@.str = private unnamed_addr constant [23 x i8] c";unknown;unknown;0;0;;\00", align 1
				@0 = private unnamed_addr constant %struct.ident_t { i32 0, i32 2, i32 0, i32 0, i8* getelementptr inbounds ([23 x i8], [23 x i8]* @.str, i32 0, i32 0) }, align 8

				; void delete_parallel(void) {
				; #pragma omp parallel
				; { unknown_willreturn(); }
				; #pragma omp parallel
				; { readonly_willreturn(); }
				; #pragma omp parallel
				; { readnone_willreturn(); }
				; #pragma omp parallel
				; {}
				; }
				;
				; This will delete all but the first parallel region

				; CHECK: remark: parallel_deletion_remarks.c:14:1: Parallel region in delete_parallel deleted
				; CHECK: remark: parallel_deletion_remarks.c:12:1: Parallel region in delete_parallel deleted
				; CHECK: remark: parallel_deletion_remarks.c:10:1: Parallel region in delete_parallel deleted
				define dso_local void @delete_parallel() local_unnamed_addr !dbg !15 {
				call void (%struct.ident_t, i32, void (i32, i32, ...), ...) @__kmpc_fork_call(%struct.ident_t* nonnull @0, i32 0, void (i32, i32, ...)* bitcast (void (i32, i32)* @.omp_outlined. to void (i32, i32, ...)*)), !dbg !18
				call void (%struct.ident_t, i32, void (i32, i32, ...), ...) @__kmpc_fork_call(%struct.ident_t* nonnull @0, i32 0, void (i32, i32, ...)* bitcast (void (i32, i32)* @.omp_outlined..2 to void (i32, i32, ...)*)), !dbg !19
				call void (%struct.ident_t, i32, void (i32, i32, ...), ...) @__kmpc_fork_call(%struct.ident_t* nonnull @0, i32 0, void (i32, i32, ...)* bitcast (void (i32, i32)* @.omp_outlined..4 to void (i32, i32, ...)*)), !dbg !20
				call void (%struct.ident_t, i32, void (i32, i32, ...), ...) @__kmpc_fork_call(%struct.ident_t* nonnull @0, i32 0, void (i32, i32, ...)* bitcast (void (i32, i32)* @.omp_outlined..6 to void (i32, i32, ...)*)), !dbg !21
				ret void, !dbg !22
				}

				declare !callback !23 void @__kmpc_fork_call(%struct.ident_t, i32, void (i32, i32, ...), ...) local_unnamed_addr

				; Function Attrs: willreturn
				declare !dbg !4 void @unknown_willreturn(...) #0

				; Function Attrs: readonly willreturn
				declare !dbg !7 void @readonly_willreturn(...) #1

				; Function Attrs: readnone willreturn
				declare !dbg !8 void @readnone_willreturn(...) #2

				define internal void @.omp_outlined.(i32* noalias nocapture readnone %0, i32* noalias nocapture readnone %1) !dbg !25 {
				call void (...) @unknown_willreturn(), !dbg !36
				ret void, !dbg !36
				}

				define internal void @.omp_outlined..2(i32* noalias nocapture readnone %0, i32* noalias nocapture readnone %1) !dbg !37 {
				call void (...) @readonly_willreturn(), !dbg !41
				ret void, !dbg !41
				}

				define internal void @.omp_outlined..4(i32* noalias nocapture readnone %0, i32* noalias nocapture readnone %1) !dbg !42 {
				call void (...) @readnone_willreturn(), !dbg !46
				ret void, !dbg !46
				}

				define internal void @.omp_outlined..6(i32* noalias nocapture %0, i32* noalias nocapture %1) !dbg !47 {
				ret void, !dbg !51
				}

				attributes #0 = { willreturn }
				attributes #1 = { readonly willreturn }
				attributes #2 = { readnone willreturn }

				!llvm.dbg.cu = !{!0}
				!llvm.module.flags = !{!9, !10, !11, !12, !13}
				!llvm.ident = !{!14}

				!0 = distinct !DICompileUnit(language: DW_LANG_C99, file: !1, producer: "clang version 10.0.0 ", isOptimized: true, runtimeVersion: 0, emissionKind: FullDebug, enums: !2, retainedTypes: !3, splitDebugInlining: false, nameTableKind: None)
				!1 = !DIFile(filename: "parallel_deletion_remarks.c", directory: "/tmp")
				!2 = !{}
				!3 = !{!4, !7, !8}
				!4 = !DISubprogram(name: "unknown_willreturn", scope: !1, file: !1, line: 3, type: !5, spFlags: DISPFlagOptimized, retainedNodes: !2)
				!5 = !DISubroutineType(types: !6)
				!6 = !{null, null}
				!7 = !DISubprogram(name: "readonly_willreturn", scope: !1, file: !1, line: 4, type: !5, spFlags: DISPFlagOptimized, retainedNodes: !2)
				!8 = !DISubprogram(name: "readnone_willreturn", scope: !1, file: !1, line: 5, type: !5, spFlags: DISPFlagOptimized, retainedNodes: !2)
				!9 = !{i32 7, !"Dwarf Version", i32 4}
				!10 = !{i32 2, !"Debug Info Version", i32 3}
				!11 = !{i32 1, !"wchar_size", i32 4}
				!12 = !{i32 7, !"PIC Level", i32 2}
				!13 = !{i32 7, !"PIE Level", i32 2}
				!14 = !{!"clang version 10.0.0 "}
				!15 = distinct !DISubprogram(name: "delete_parallel", scope: !1, file: !1, line: 7, type: !16, scopeLine: 7, flags: DIFlagPrototyped \| DIFlagAllCallsDescribed, spFlags: DISPFlagDefinition \| DISPFlagOptimized, unit: !0, retainedNodes: !2)
				!16 = !DISubroutineType(types: !17)
				!17 = !{null}
				!18 = !DILocation(line: 8, column: 1, scope: !15)
				!19 = !DILocation(line: 10, column: 1, scope: !15)
				!20 = !DILocation(line: 12, column: 1, scope: !15)
				!21 = !DILocation(line: 14, column: 1, scope: !15)
				!22 = !DILocation(line: 16, column: 1, scope: !15)
				!23 = !{!24}
				!24 = !{i64 2, i64 -1, i64 -1, i1 true}
				!25 = distinct !DISubprogram(name: ".omp_outlined.", scope: !1, file: !1, line: 9, type: !26, scopeLine: 9, flags: DIFlagPrototyped \| DIFlagAllCallsDescribed, spFlags: DISPFlagLocalToUnit \| DISPFlagDefinition \| DISPFlagOptimized, unit: !0, retainedNodes: !33)
				!26 = !DISubroutineType(types: !27)
				!27 = !{null, !28, !28}
				!28 = !DIDerivedType(tag: DW_TAG_const_type, baseType: !29)
				!29 = !DIDerivedType(tag: DW_TAG_restrict_type, baseType: !30)
				!30 = !DIDerivedType(tag: DW_TAG_pointer_type, baseType: !31, size: 64)
				!31 = !DIDerivedType(tag: DW_TAG_const_type, baseType: !32)
				!32 = !DIBasicType(name: "int", size: 32, encoding: DW_ATE_signed)
				!33 = !{!34, !35}
				!34 = !DILocalVariable(name: ".global_tid.", arg: 1, scope: !25, type: !28, flags: DIFlagArtificial)
				!35 = !DILocalVariable(name: ".bound_tid.", arg: 2, scope: !25, type: !28, flags: DIFlagArtificial)
				!36 = !DILocation(line: 9, column: 2, scope: !25)
				!37 = distinct !DISubprogram(name: ".omp_outlined..2", scope: !1, file: !1, line: 11, type: !26, scopeLine: 11, flags: DIFlagPrototyped \| DIFlagAllCallsDescribed, spFlags: DISPFlagLocalToUnit \| DISPFlagDefinition \| DISPFlagOptimized, unit: !0, retainedNodes: !38)
				!38 = !{!39, !40}
				!39 = !DILocalVariable(name: ".global_tid.", arg: 1, scope: !37, type: !28, flags: DIFlagArtificial)
				!40 = !DILocalVariable(name: ".bound_tid.", arg: 2, scope: !37, type: !28, flags: DIFlagArtificial)
				!41 = !DILocation(line: 11, column: 2, scope: !37)
				!42 = distinct !DISubprogram(name: ".omp_outlined..4", scope: !1, file: !1, line: 13, type: !26, scopeLine: 13, flags: DIFlagPrototyped \| DIFlagAllCallsDescribed, spFlags: DISPFlagLocalToUnit \| DISPFlagDefinition \| DISPFlagOptimized, unit: !0, retainedNodes: !43)
				!43 = !{!44, !45}
				!44 = !DILocalVariable(name: ".global_tid.", arg: 1, scope: !42, type: !28, flags: DIFlagArtificial)
				!45 = !DILocalVariable(name: ".bound_tid.", arg: 2, scope: !42, type: !28, flags: DIFlagArtificial)
				!46 = !DILocation(line: 13, column: 2, scope: !42)
				!47 = distinct !DISubprogram(name: ".omp_outlined..6", scope: !1, file: !1, line: 15, type: !26, scopeLine: 15, flags: DIFlagPrototyped \| DIFlagAllCallsDescribed, spFlags: DISPFlagLocalToUnit \| DISPFlagDefinition \| DISPFlagOptimized, unit: !0, retainedNodes: !48)
				!48 = !{!49, !50}
				!49 = !DILocalVariable(name: ".global_tid.", arg: 1, scope: !47, type: !28, flags: DIFlagArtificial)
				!50 = !DILocalVariable(name: ".bound_tid.", arg: 2, scope: !47, type: !28, flags: DIFlagArtificial)
				!51 = !DILocation(line: 15, column: 2, scope: !47)

This is an archive of the discontinued LLVM Phabricator instance.

OpenMPOpt Remarks Support
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 263783

llvm/lib/Transforms/IPO/OpenMPOpt.cpp

llvm/test/Transforms/OpenMP/deduplication_remarks.ll

llvm/test/Transforms/OpenMP/parallel_deletion_remarks.ll

This is an archive of the discontinued LLVM Phabricator instance.

OpenMPOpt Remarks SupportClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 263783

llvm/lib/Transforms/IPO/OpenMPOpt.cpp

llvm/test/Transforms/OpenMP/deduplication_remarks.ll

llvm/test/Transforms/OpenMP/parallel_deletion_remarks.ll

OpenMPOpt Remarks Support
ClosedPublic