Diff 171127

include/clang/AST/StmtOpenMP.h

Show First 20 Lines • Show All 386 Lines • ▼ Show 20 Lines	enum {
PrevEnsureUpperBoundOffset = 20,		PrevEnsureUpperBoundOffset = 20,
CombinedLowerBoundVariableOffset = 21,		CombinedLowerBoundVariableOffset = 21,
CombinedUpperBoundVariableOffset = 22,		CombinedUpperBoundVariableOffset = 22,
CombinedEnsureUpperBoundOffset = 23,		CombinedEnsureUpperBoundOffset = 23,
CombinedInitOffset = 24,		CombinedInitOffset = 24,
CombinedConditionOffset = 25,		CombinedConditionOffset = 25,
CombinedNextLowerBoundOffset = 26,		CombinedNextLowerBoundOffset = 26,
CombinedNextUpperBoundOffset = 27,		CombinedNextUpperBoundOffset = 27,
		CombinedDistConditionOffset = 28,
		CombinedParForInDistConditionOffset = 29,
// Offset to the end (and start of the following counters/updates/finals		// Offset to the end (and start of the following counters/updates/finals
// arrays) for combined distribute loop directives.		// arrays) for combined distribute loop directives.
CombinedDistributeEnd = 28,		CombinedDistributeEnd = 30,
};		};

/// Get the counters storage.		/// Get the counters storage.
MutableArrayRef<Expr *> getCounters() {		MutableArrayRef<Expr *> getCounters() {
Expr **Storage = reinterpret_cast<Expr **>(		Expr **Storage = reinterpret_cast<Expr **>(
&(*(std::next(child_begin(), getArraysOffset(getDirectiveKind())))));		&(*(std::next(child_begin(), getArraysOffset(getDirectiveKind())))));
return MutableArrayRef<Expr *>(Storage, CollapsedNum);		return MutableArrayRef<Expr *>(Storage, CollapsedNum);
}		}
▲ Show 20 Lines • Show All 194 Lines • ▼ Show 20 Lines	assert(isOpenMPLoopBoundSharingDirective(getDirectiveKind()) &&
"expected loop bound sharing directive");		"expected loop bound sharing directive");
*std::next(child_begin(), CombinedNextLowerBoundOffset) = CombNLB;		*std::next(child_begin(), CombinedNextLowerBoundOffset) = CombNLB;
}		}
void setCombinedNextUpperBound(Expr *CombNUB) {		void setCombinedNextUpperBound(Expr *CombNUB) {
assert(isOpenMPLoopBoundSharingDirective(getDirectiveKind()) &&		assert(isOpenMPLoopBoundSharingDirective(getDirectiveKind()) &&
"expected loop bound sharing directive");		"expected loop bound sharing directive");
*std::next(child_begin(), CombinedNextUpperBoundOffset) = CombNUB;		*std::next(child_begin(), CombinedNextUpperBoundOffset) = CombNUB;
}		}
		/// Stores \p CombDistCond in the child slot located at
		/// CombinedDistConditionOffset. Only valid for loop bound sharing
		/// directives (checked by the assertion).
		void setCombinedDistCond(Expr *CombDistCond) {
		  assert(isOpenMPLoopBoundSharingDirective(getDirectiveKind()) &&
		         "expected loop bound distribute sharing directive");
		  // Locate the slot first, then overwrite it with the new condition.
		  auto Slot = std::next(child_begin(), CombinedDistConditionOffset);
		  *Slot = CombDistCond;
		}
		/// Stores \p CombParForInDistCond in the child slot located at
		/// CombinedParForInDistConditionOffset. Only valid for loop bound sharing
		/// directives (checked by the assertion).
		void setCombinedParForInDistCond(Expr *CombParForInDistCond) {
		  assert(isOpenMPLoopBoundSharingDirective(getDirectiveKind()) &&
		         "expected loop bound distribute sharing directive");
		  // Locate the slot first, then overwrite it with the new condition.
		  auto Slot =
		      std::next(child_begin(), CombinedParForInDistConditionOffset);
		  *Slot = CombParForInDistCond;
		}
void setCounters(ArrayRef<Expr *> A);		void setCounters(ArrayRef<Expr *> A);
void setPrivateCounters(ArrayRef<Expr *> A);		void setPrivateCounters(ArrayRef<Expr *> A);
void setInits(ArrayRef<Expr *> A);		void setInits(ArrayRef<Expr *> A);
void setUpdates(ArrayRef<Expr *> A);		void setUpdates(ArrayRef<Expr *> A);
void setFinals(ArrayRef<Expr *> A);		void setFinals(ArrayRef<Expr *> A);

public:		public:
/// The expressions built to support OpenMP loops in combined/composite		/// The expressions built to support OpenMP loops in combined/composite
Show All 16 Lines	struct DistCombinedHelperExprs {
/// with 'omp for' in a same construct		/// with 'omp for' in a same construct
Expr *Cond;		Expr *Cond;
/// Update of LowerBound for statically scheduled omp loops for		/// Update of LowerBound for statically scheduled omp loops for
/// outer loop in combined constructs (e.g. 'distribute parallel for')		/// outer loop in combined constructs (e.g. 'distribute parallel for')
Expr *NLB;		Expr *NLB;
/// Update of UpperBound for statically scheduled omp loops for		/// Update of UpperBound for statically scheduled omp loops for
/// outer loop in combined constructs (e.g. 'distribute parallel for')		/// outer loop in combined constructs (e.g. 'distribute parallel for')
Expr *NUB;		Expr *NUB;
		/// Distribute loop condition used when composing 'omp distribute'
		/// with 'omp for' in the same construct when the schedule is chunked.
		Expr *DistCond;
		/// 'omp parallel for' loop condition used when composed with
		/// 'omp distribute' in the same construct and when schedule is
		/// chunked and the chunk size is 1.
		Expr *ParForInDistCond;
};		};

/// The expressions built for the OpenMP loop CodeGen for the		/// The expressions built for the OpenMP loop CodeGen for the
/// whole collapsed loop nest.		/// whole collapsed loop nest.
struct HelperExprs {		struct HelperExprs {
/// Loop iteration variable.		/// Loop iteration variable.
Expr *IterationVarRef;		Expr *IterationVarRef;
/// Loop last iteration number.		/// Loop last iteration number.
▲ Show 20 Lines • Show All 101 Lines • ▼ Show 20 Lines	void clear(unsigned Size) {
PreInits = nullptr;		PreInits = nullptr;
DistCombinedFields.LB = nullptr;		DistCombinedFields.LB = nullptr;
DistCombinedFields.UB = nullptr;		DistCombinedFields.UB = nullptr;
DistCombinedFields.EUB = nullptr;		DistCombinedFields.EUB = nullptr;
DistCombinedFields.Init = nullptr;		DistCombinedFields.Init = nullptr;
DistCombinedFields.Cond = nullptr;		DistCombinedFields.Cond = nullptr;
DistCombinedFields.NLB = nullptr;		DistCombinedFields.NLB = nullptr;
DistCombinedFields.NUB = nullptr;		DistCombinedFields.NUB = nullptr;
		DistCombinedFields.DistCond = nullptr;
		DistCombinedFields.ParForInDistCond = nullptr;
}		}
};		};

/// Get number of collapsed loops.		/// Get number of collapsed loops.
unsigned getCollapsedNumber() const { return CollapsedNum; }		unsigned getCollapsedNumber() const { return CollapsedNum; }

Expr *getIterationVariable() const {		Expr *getIterationVariable() const {
return const_cast<Expr >(reinterpret_cast<const Expr >(		return const_cast<Expr >(reinterpret_cast<const Expr >(
▲ Show 20 Lines • Show All 152 Lines • ▼ Show 20 Lines	return const_cast<Expr >(reinterpret_cast<const Expr >(
*std::next(child_begin(), CombinedNextLowerBoundOffset)));		*std::next(child_begin(), CombinedNextLowerBoundOffset)));
}		}
Expr *getCombinedNextUpperBound() const {		Expr *getCombinedNextUpperBound() const {
assert(isOpenMPLoopBoundSharingDirective(getDirectiveKind()) &&		assert(isOpenMPLoopBoundSharingDirective(getDirectiveKind()) &&
"expected loop bound sharing directive");		"expected loop bound sharing directive");
return const_cast<Expr *>(reinterpret_cast<const Expr *>(		return const_cast<Expr *>(reinterpret_cast<const Expr *>(
*std::next(child_begin(), CombinedNextUpperBoundOffset)));		*std::next(child_begin(), CombinedNextUpperBoundOffset)));
}		}
		/// Returns the expression stored in the child slot at
		/// CombinedDistConditionOffset (the slot written by setCombinedDistCond).
		/// Only valid for loop bound sharing directives (checked by the assertion).
		Expr *getCombinedDistCond() const {
		  assert(isOpenMPLoopBoundSharingDirective(getDirectiveKind()) &&
		         "expected loop bound distribute sharing directive");
		  // View the child slot as a const expression pointer, then drop the
		  // constness so the result matches the declared 'Expr *' return type.
		  return const_cast<Expr *>(reinterpret_cast<const Expr *>(
		      *std::next(child_begin(), CombinedDistConditionOffset)));
		}
		/// Returns the expression stored in the child slot at
		/// CombinedParForInDistConditionOffset (the slot written by
		/// setCombinedParForInDistCond). Only valid for loop bound sharing
		/// directives (checked by the assertion).
		Expr *getCombinedParForInDistCond() const {
		  assert(isOpenMPLoopBoundSharingDirective(getDirectiveKind()) &&
		         "expected loop bound distribute sharing directive");
		  // View the child slot as a const expression pointer, then drop the
		  // constness so the result matches the declared 'Expr *' return type.
		  return const_cast<Expr *>(reinterpret_cast<const Expr *>(
		      *std::next(child_begin(), CombinedParForInDistConditionOffset)));
		}
const Stmt *getBody() const {		const Stmt *getBody() const {
// This relies on the loop form having already been checked by Sema.		// This relies on the loop form having already been checked by Sema.
const Stmt *Body =		const Stmt *Body =
getInnermostCapturedStmt()->getCapturedStmt()->IgnoreContainers();		getInnermostCapturedStmt()->getCapturedStmt()->IgnoreContainers();
Body = cast<ForStmt>(Body)->getBody();		Body = cast<ForStmt>(Body)->getBody();
for (unsigned Cnt = 1; Cnt < CollapsedNum; ++Cnt) {		for (unsigned Cnt = 1; Cnt < CollapsedNum; ++Cnt) {
Body = Body->IgnoreContainers();		Body = Body->IgnoreContainers();
Body = cast<ForStmt>(Body)->getBody();		Body = cast<ForStmt>(Body)->getBody();
▲ Show 20 Lines • Show All 3,117 Lines • Show Last 20 Lines

lib/AST/StmtOpenMP.cpp

Show First 20 Lines • Show All 1,073 Lines • ▼ Show 20 Lines	OMPDistributeParallelForDirective *OMPDistributeParallelForDirective::Create(
Dir->setPreInits(Exprs.PreInits);		Dir->setPreInits(Exprs.PreInits);
Dir->setCombinedLowerBoundVariable(Exprs.DistCombinedFields.LB);		Dir->setCombinedLowerBoundVariable(Exprs.DistCombinedFields.LB);
Dir->setCombinedUpperBoundVariable(Exprs.DistCombinedFields.UB);		Dir->setCombinedUpperBoundVariable(Exprs.DistCombinedFields.UB);
Dir->setCombinedEnsureUpperBound(Exprs.DistCombinedFields.EUB);		Dir->setCombinedEnsureUpperBound(Exprs.DistCombinedFields.EUB);
Dir->setCombinedInit(Exprs.DistCombinedFields.Init);		Dir->setCombinedInit(Exprs.DistCombinedFields.Init);
Dir->setCombinedCond(Exprs.DistCombinedFields.Cond);		Dir->setCombinedCond(Exprs.DistCombinedFields.Cond);
Dir->setCombinedNextLowerBound(Exprs.DistCombinedFields.NLB);		Dir->setCombinedNextLowerBound(Exprs.DistCombinedFields.NLB);
Dir->setCombinedNextUpperBound(Exprs.DistCombinedFields.NUB);		Dir->setCombinedNextUpperBound(Exprs.DistCombinedFields.NUB);
		Dir->setCombinedDistCond(Exprs.DistCombinedFields.DistCond);
		Dir->setCombinedParForInDistCond(Exprs.DistCombinedFields.ParForInDistCond);
Dir->HasCancel = HasCancel;		Dir->HasCancel = HasCancel;
return Dir;		return Dir;
}		}

OMPDistributeParallelForDirective *		OMPDistributeParallelForDirective *
OMPDistributeParallelForDirective::CreateEmpty(const ASTContext &C,		OMPDistributeParallelForDirective::CreateEmpty(const ASTContext &C,
unsigned NumClauses,		unsigned NumClauses,
unsigned CollapsedNum,		unsigned CollapsedNum,
▲ Show 20 Lines • Show All 50 Lines • ▼ Show 20 Lines	OMPDistributeParallelForSimdDirective::Create(
Dir->setPreInits(Exprs.PreInits);		Dir->setPreInits(Exprs.PreInits);
Dir->setCombinedLowerBoundVariable(Exprs.DistCombinedFields.LB);		Dir->setCombinedLowerBoundVariable(Exprs.DistCombinedFields.LB);
Dir->setCombinedUpperBoundVariable(Exprs.DistCombinedFields.UB);		Dir->setCombinedUpperBoundVariable(Exprs.DistCombinedFields.UB);
Dir->setCombinedEnsureUpperBound(Exprs.DistCombinedFields.EUB);		Dir->setCombinedEnsureUpperBound(Exprs.DistCombinedFields.EUB);
Dir->setCombinedInit(Exprs.DistCombinedFields.Init);		Dir->setCombinedInit(Exprs.DistCombinedFields.Init);
Dir->setCombinedCond(Exprs.DistCombinedFields.Cond);		Dir->setCombinedCond(Exprs.DistCombinedFields.Cond);
Dir->setCombinedNextLowerBound(Exprs.DistCombinedFields.NLB);		Dir->setCombinedNextLowerBound(Exprs.DistCombinedFields.NLB);
Dir->setCombinedNextUpperBound(Exprs.DistCombinedFields.NUB);		Dir->setCombinedNextUpperBound(Exprs.DistCombinedFields.NUB);
		Dir->setCombinedDistCond(Exprs.DistCombinedFields.DistCond);
		Dir->setCombinedParForInDistCond(Exprs.DistCombinedFields.ParForInDistCond);
return Dir;		return Dir;
}		}

OMPDistributeParallelForSimdDirective *		OMPDistributeParallelForSimdDirective *
OMPDistributeParallelForSimdDirective::CreateEmpty(const ASTContext &C,		OMPDistributeParallelForSimdDirective::CreateEmpty(const ASTContext &C,
unsigned NumClauses,		unsigned NumClauses,
unsigned CollapsedNum,		unsigned CollapsedNum,
EmptyShell) {		EmptyShell) {
▲ Show 20 Lines • Show All 296 Lines • ▼ Show 20 Lines	OMPTeamsDistributeParallelForSimdDirective::Create(
Dir->setPreInits(Exprs.PreInits);		Dir->setPreInits(Exprs.PreInits);
Dir->setCombinedLowerBoundVariable(Exprs.DistCombinedFields.LB);		Dir->setCombinedLowerBoundVariable(Exprs.DistCombinedFields.LB);
Dir->setCombinedUpperBoundVariable(Exprs.DistCombinedFields.UB);		Dir->setCombinedUpperBoundVariable(Exprs.DistCombinedFields.UB);
Dir->setCombinedEnsureUpperBound(Exprs.DistCombinedFields.EUB);		Dir->setCombinedEnsureUpperBound(Exprs.DistCombinedFields.EUB);
Dir->setCombinedInit(Exprs.DistCombinedFields.Init);		Dir->setCombinedInit(Exprs.DistCombinedFields.Init);
Dir->setCombinedCond(Exprs.DistCombinedFields.Cond);		Dir->setCombinedCond(Exprs.DistCombinedFields.Cond);
Dir->setCombinedNextLowerBound(Exprs.DistCombinedFields.NLB);		Dir->setCombinedNextLowerBound(Exprs.DistCombinedFields.NLB);
Dir->setCombinedNextUpperBound(Exprs.DistCombinedFields.NUB);		Dir->setCombinedNextUpperBound(Exprs.DistCombinedFields.NUB);
		Dir->setCombinedDistCond(Exprs.DistCombinedFields.DistCond);
		Dir->setCombinedParForInDistCond(Exprs.DistCombinedFields.ParForInDistCond);
return Dir;		return Dir;
}		}

OMPTeamsDistributeParallelForSimdDirective *		OMPTeamsDistributeParallelForSimdDirective *
OMPTeamsDistributeParallelForSimdDirective::CreateEmpty(const ASTContext &C,		OMPTeamsDistributeParallelForSimdDirective::CreateEmpty(const ASTContext &C,
unsigned NumClauses,		unsigned NumClauses,
unsigned CollapsedNum,		unsigned CollapsedNum,
EmptyShell) {		EmptyShell) {
▲ Show 20 Lines • Show All 51 Lines • ▼ Show 20 Lines	OMPTeamsDistributeParallelForDirective::Create(
Dir->setPreInits(Exprs.PreInits);		Dir->setPreInits(Exprs.PreInits);
Dir->setCombinedLowerBoundVariable(Exprs.DistCombinedFields.LB);		Dir->setCombinedLowerBoundVariable(Exprs.DistCombinedFields.LB);
Dir->setCombinedUpperBoundVariable(Exprs.DistCombinedFields.UB);		Dir->setCombinedUpperBoundVariable(Exprs.DistCombinedFields.UB);
Dir->setCombinedEnsureUpperBound(Exprs.DistCombinedFields.EUB);		Dir->setCombinedEnsureUpperBound(Exprs.DistCombinedFields.EUB);
Dir->setCombinedInit(Exprs.DistCombinedFields.Init);		Dir->setCombinedInit(Exprs.DistCombinedFields.Init);
Dir->setCombinedCond(Exprs.DistCombinedFields.Cond);		Dir->setCombinedCond(Exprs.DistCombinedFields.Cond);
Dir->setCombinedNextLowerBound(Exprs.DistCombinedFields.NLB);		Dir->setCombinedNextLowerBound(Exprs.DistCombinedFields.NLB);
Dir->setCombinedNextUpperBound(Exprs.DistCombinedFields.NUB);		Dir->setCombinedNextUpperBound(Exprs.DistCombinedFields.NUB);
		Dir->setCombinedDistCond(Exprs.DistCombinedFields.DistCond);
		Dir->setCombinedParForInDistCond(Exprs.DistCombinedFields.ParForInDistCond);
Dir->HasCancel = HasCancel;		Dir->HasCancel = HasCancel;
return Dir;		return Dir;
}		}

OMPTeamsDistributeParallelForDirective *		OMPTeamsDistributeParallelForDirective *
OMPTeamsDistributeParallelForDirective::CreateEmpty(const ASTContext &C,		OMPTeamsDistributeParallelForDirective::CreateEmpty(const ASTContext &C,
unsigned NumClauses,		unsigned NumClauses,
unsigned CollapsedNum,		unsigned CollapsedNum,
▲ Show 20 Lines • Show All 130 Lines • ▼ Show 20 Lines	OMPTargetTeamsDistributeParallelForDirective::Create(
Dir->setPreInits(Exprs.PreInits);		Dir->setPreInits(Exprs.PreInits);
Dir->setCombinedLowerBoundVariable(Exprs.DistCombinedFields.LB);		Dir->setCombinedLowerBoundVariable(Exprs.DistCombinedFields.LB);
Dir->setCombinedUpperBoundVariable(Exprs.DistCombinedFields.UB);		Dir->setCombinedUpperBoundVariable(Exprs.DistCombinedFields.UB);
Dir->setCombinedEnsureUpperBound(Exprs.DistCombinedFields.EUB);		Dir->setCombinedEnsureUpperBound(Exprs.DistCombinedFields.EUB);
Dir->setCombinedInit(Exprs.DistCombinedFields.Init);		Dir->setCombinedInit(Exprs.DistCombinedFields.Init);
Dir->setCombinedCond(Exprs.DistCombinedFields.Cond);		Dir->setCombinedCond(Exprs.DistCombinedFields.Cond);
Dir->setCombinedNextLowerBound(Exprs.DistCombinedFields.NLB);		Dir->setCombinedNextLowerBound(Exprs.DistCombinedFields.NLB);
Dir->setCombinedNextUpperBound(Exprs.DistCombinedFields.NUB);		Dir->setCombinedNextUpperBound(Exprs.DistCombinedFields.NUB);
		Dir->setCombinedDistCond(Exprs.DistCombinedFields.DistCond);
		Dir->setCombinedParForInDistCond(Exprs.DistCombinedFields.ParForInDistCond);
Dir->HasCancel = HasCancel;		Dir->HasCancel = HasCancel;
return Dir;		return Dir;
}		}

OMPTargetTeamsDistributeParallelForDirective *		OMPTargetTeamsDistributeParallelForDirective *
OMPTargetTeamsDistributeParallelForDirective::CreateEmpty(const ASTContext &C,		OMPTargetTeamsDistributeParallelForDirective::CreateEmpty(const ASTContext &C,
unsigned NumClauses,		unsigned NumClauses,
unsigned CollapsedNum,		unsigned CollapsedNum,
▲ Show 20 Lines • Show All 55 Lines • ▼ Show 20 Lines	OMPTargetTeamsDistributeParallelForSimdDirective::Create(
Dir->setPreInits(Exprs.PreInits);		Dir->setPreInits(Exprs.PreInits);
Dir->setCombinedLowerBoundVariable(Exprs.DistCombinedFields.LB);		Dir->setCombinedLowerBoundVariable(Exprs.DistCombinedFields.LB);
Dir->setCombinedUpperBoundVariable(Exprs.DistCombinedFields.UB);		Dir->setCombinedUpperBoundVariable(Exprs.DistCombinedFields.UB);
Dir->setCombinedEnsureUpperBound(Exprs.DistCombinedFields.EUB);		Dir->setCombinedEnsureUpperBound(Exprs.DistCombinedFields.EUB);
Dir->setCombinedInit(Exprs.DistCombinedFields.Init);		Dir->setCombinedInit(Exprs.DistCombinedFields.Init);
Dir->setCombinedCond(Exprs.DistCombinedFields.Cond);		Dir->setCombinedCond(Exprs.DistCombinedFields.Cond);
Dir->setCombinedNextLowerBound(Exprs.DistCombinedFields.NLB);		Dir->setCombinedNextLowerBound(Exprs.DistCombinedFields.NLB);
Dir->setCombinedNextUpperBound(Exprs.DistCombinedFields.NUB);		Dir->setCombinedNextUpperBound(Exprs.DistCombinedFields.NUB);
		Dir->setCombinedDistCond(Exprs.DistCombinedFields.DistCond);
		Dir->setCombinedParForInDistCond(Exprs.DistCombinedFields.ParForInDistCond);
return Dir;		return Dir;
}		}

OMPTargetTeamsDistributeParallelForSimdDirective *		OMPTargetTeamsDistributeParallelForSimdDirective *
OMPTargetTeamsDistributeParallelForSimdDirective::CreateEmpty(		OMPTargetTeamsDistributeParallelForSimdDirective::CreateEmpty(
const ASTContext &C, unsigned NumClauses, unsigned CollapsedNum,		const ASTContext &C, unsigned NumClauses, unsigned CollapsedNum,
EmptyShell) {		EmptyShell) {
auto Size =		auto Size =
▲ Show 20 Lines • Show All 65 Lines • Show Last 20 Lines

lib/CodeGen/CGOpenMPRuntime.h

Show First 20 Lines • Show All 884 Lines • ▼ Show 20 Lines	public:
/// Check if the specified \a ScheduleKind is static non-chunked.		/// Check if the specified \a ScheduleKind is static non-chunked.
/// This kind of distribute directive is emitted without outer loop.		/// This kind of distribute directive is emitted without outer loop.
/// \param ScheduleKind Schedule kind specified in the 'dist_schedule' clause.		/// \param ScheduleKind Schedule kind specified in the 'dist_schedule' clause.
/// \param Chunked True if chunk is specified in the clause.		/// \param Chunked True if chunk is specified in the clause.
///		///
virtual bool isStaticNonchunked(OpenMPDistScheduleClauseKind ScheduleKind,		virtual bool isStaticNonchunked(OpenMPDistScheduleClauseKind ScheduleKind,
bool Chunked) const;		bool Chunked) const;

		/// Check if the specified \a ScheduleKind is static chunked.
		/// \param ScheduleKind Schedule kind specified in the 'schedule' clause.
		/// \param Chunked True if chunk is specified in the clause.
		///
		virtual bool isStaticChunked(OpenMPScheduleClauseKind ScheduleKind,
		bool Chunked) const;

		/// Check if the specified \a ScheduleKind is static chunked.
		/// \param ScheduleKind Schedule kind specified in the 'dist_schedule' clause.
		/// \param Chunked True if chunk is specified in the clause.
		///
		virtual bool isStaticChunked(OpenMPDistScheduleClauseKind ScheduleKind,
		ABataevUnsubmitted Done Reply Inline Actions I'd rename this into `isDistStaticChunked` ABataev: I'd rename this into `isDistStaticChunked`
		gtberceaAuthorUnsubmitted Not Done Reply Inline Actions I've used the same naming convention as the isStaticNonchunked function for consistency. gtbercea: I've used the same naming convention as the isStaticNonchunked function for consistency.
		ABataevUnsubmitted Not Done Reply Inline Actions What about this? ABataev: What about this?
		bool Chunked) const;

/// Check if the specified \a ScheduleKind is dynamic.		/// Check if the specified \a ScheduleKind is dynamic.
/// This kind of worksharing directive is emitted without outer loop.		/// This kind of worksharing directive is emitted without outer loop.
/// \param ScheduleKind Schedule Kind specified in the 'schedule' clause.		/// \param ScheduleKind Schedule Kind specified in the 'schedule' clause.
///		///
virtual bool isDynamic(OpenMPScheduleClauseKind ScheduleKind) const;		virtual bool isDynamic(OpenMPScheduleClauseKind ScheduleKind) const;

/// struct with the values to be passed to the dispatch runtime function		/// struct with the values to be passed to the dispatch runtime function
struct DispatchRTInput {		struct DispatchRTInput {
▲ Show 20 Lines • Show All 600 Lines • ▼ Show 20 Lines	public:
virtual void getDefaultDistScheduleAndChunk(CodeGenFunction &CGF,		virtual void getDefaultDistScheduleAndChunk(CodeGenFunction &CGF,
const OMPLoopDirective &S, OpenMPDistScheduleClauseKind &ScheduleKind,		const OMPLoopDirective &S, OpenMPDistScheduleClauseKind &ScheduleKind,
llvm::Value *&Chunk) const {}		llvm::Value *&Chunk) const {}

/// Choose default schedule type and chunk value for the		/// Choose default schedule type and chunk value for the
/// schedule clause.		/// schedule clause.
virtual void getDefaultScheduleAndChunk(CodeGenFunction &CGF,		virtual void getDefaultScheduleAndChunk(CodeGenFunction &CGF,
const OMPLoopDirective &S, OpenMPScheduleClauseKind &ScheduleKind,		const OMPLoopDirective &S, OpenMPScheduleClauseKind &ScheduleKind,
llvm::Value *&Chunk) const {}		const Expr *&ChunkExpr) const {}

/// Emits call of the outlined function with the provided arguments,		/// Emits call of the outlined function with the provided arguments,
/// translating these arguments to correct target-specific arguments.		/// translating these arguments to correct target-specific arguments.
virtual void		virtual void
emitOutlinedFunctionCall(CodeGenFunction &CGF, SourceLocation Loc,		emitOutlinedFunctionCall(CodeGenFunction &CGF, SourceLocation Loc,
llvm::Value *OutlinedFn,		llvm::Value *OutlinedFn,
ArrayRef<llvm::Value *> Args = llvm::None) const;		ArrayRef<llvm::Value *> Args = llvm::None) const;

▲ Show 20 Lines • Show All 583 Lines • Show Last 20 Lines

lib/CodeGen/CGOpenMPRuntime.cpp

This file is larger than 256 KB, so syntax highlighting is disabled by default.

	Show First 20 Lines • Show All 3,286 Lines • ▼ Show 20 Lines
	}			}

	bool CGOpenMPRuntime::isStaticNonchunked(			bool CGOpenMPRuntime::isStaticNonchunked(
	OpenMPDistScheduleClauseKind ScheduleKind, bool Chunked) const {			OpenMPDistScheduleClauseKind ScheduleKind, bool Chunked) const {
	OpenMPSchedType Schedule = getRuntimeSchedule(ScheduleKind, Chunked);			OpenMPSchedType Schedule = getRuntimeSchedule(ScheduleKind, Chunked);
	return Schedule == OMP_dist_sch_static;			return Schedule == OMP_dist_sch_static;
	}			}

				/// Returns true when the runtime schedule computed from \p ScheduleKind
				/// and \p Chunked, with ordering disabled, is OMP_sch_static_chunked.
				bool CGOpenMPRuntime::isStaticChunked(OpenMPScheduleClauseKind ScheduleKind,
				                                      bool Chunked) const {
				  // The third argument is always false here; the inline comment names it.
				  OpenMPSchedType Schedule =
				      getRuntimeSchedule(ScheduleKind, Chunked, /*Ordered=*/false);
				  return Schedule == OMP_sch_static_chunked;
				}

				/// Returns true when the runtime schedule computed from the distribute
				/// schedule kind \p ScheduleKind and \p Chunked is
				/// OMP_dist_sch_static_chunked.
				bool CGOpenMPRuntime::isStaticChunked(
				    OpenMPDistScheduleClauseKind ScheduleKind, bool Chunked) const {
				  return getRuntimeSchedule(ScheduleKind, Chunked) ==
				         OMP_dist_sch_static_chunked;
				}

	bool CGOpenMPRuntime::isDynamic(OpenMPScheduleClauseKind ScheduleKind) const {			bool CGOpenMPRuntime::isDynamic(OpenMPScheduleClauseKind ScheduleKind) const {
	OpenMPSchedType Schedule =			OpenMPSchedType Schedule =
	getRuntimeSchedule(ScheduleKind, /*Chunked=*/false, /*Ordered=*/false);			getRuntimeSchedule(ScheduleKind, /*Chunked=*/false, /*Ordered=*/false);
	assert(Schedule != OMP_sch_static_chunked && "cannot be chunked here");			assert(Schedule != OMP_sch_static_chunked && "cannot be chunked here");
	return Schedule != OMP_sch_static;			return Schedule != OMP_sch_static;
	}			}

	▲ Show 20 Lines • Show All 6,222 Lines • Show Last 20 Lines

lib/CodeGen/CGOpenMPRuntimeNVPTX.h

Show First 20 Lines • Show All 342 Lines • ▼ Show 20 Lines	public:
/// Choose a default value for the dist_schedule clause.		/// Choose a default value for the dist_schedule clause.
void getDefaultDistScheduleAndChunk(CodeGenFunction &CGF,		void getDefaultDistScheduleAndChunk(CodeGenFunction &CGF,
const OMPLoopDirective &S, OpenMPDistScheduleClauseKind &ScheduleKind,		const OMPLoopDirective &S, OpenMPDistScheduleClauseKind &ScheduleKind,
llvm::Value *&Chunk) const override;		llvm::Value *&Chunk) const override;

/// Choose a default value for the schedule clause.		/// Choose a default value for the schedule clause.
void getDefaultScheduleAndChunk(CodeGenFunction &CGF,		void getDefaultScheduleAndChunk(CodeGenFunction &CGF,
const OMPLoopDirective &S, OpenMPScheduleClauseKind &ScheduleKind,		const OMPLoopDirective &S, OpenMPScheduleClauseKind &ScheduleKind,
llvm::Value *&Chunk) const override;		const Expr *&ChunkExpr) const override;

private:		private:
/// Track the execution mode when codegening directives within a target		/// Track the execution mode when codegening directives within a target
/// region. The appropriate mode (SPMD/NON-SPMD) is set on entry to the		/// region. The appropriate mode (SPMD/NON-SPMD) is set on entry to the
/// target region and used by containing directives such as 'parallel'		/// target region and used by containing directives such as 'parallel'
/// to emit optimized code.		/// to emit optimized code.
ExecutionMode CurrentExecutionMode = EM_Unknown;		ExecutionMode CurrentExecutionMode = EM_Unknown;

▲ Show 20 Lines • Show All 57 Lines • Show Last 20 Lines

lib/CodeGen/CGOpenMPRuntimeNVPTX.cpp

Show First 20 Lines • Show All 4,240 Lines • ▼ Show 20 Lines	if (getExecutionMode() == CGOpenMPRuntimeNVPTX::EM_SPMD) {
return;		return;
}		}
CGOpenMPRuntime::getDefaultDistScheduleAndChunk(		CGOpenMPRuntime::getDefaultDistScheduleAndChunk(
CGF, S, ScheduleKind, Chunk);		CGF, S, ScheduleKind, Chunk);
}		}

void CGOpenMPRuntimeNVPTX::getDefaultScheduleAndChunk(		void CGOpenMPRuntimeNVPTX::getDefaultScheduleAndChunk(
CodeGenFunction &CGF, const OMPLoopDirective &S,		CodeGenFunction &CGF, const OMPLoopDirective &S,
OpenMPScheduleClauseKind &ScheduleKind,		OpenMPScheduleClauseKind &ScheduleKind,
		ABataevUnsubmitted Done Reply Inline Actions If the `ChunkOne` field is not required, you need to restore original code here ABataev: If the `ChunkOne` field is not required, you need to restore original code here
llvm::Value *&Chunk) const {		const Expr *&ChunkExpr) const {
ScheduleKind = OMPC_SCHEDULE_static;		ScheduleKind = OMPC_SCHEDULE_static;
Chunk = CGF.Builder.getIntN(CGF.getContext().getTypeSize(		// Chunk size is 1 in this case.
S.getIterationVariable()->getType()), 1);		llvm::APInt ChunkSize(32, 1);
		ChunkExpr = IntegerLiteral::Create(CGF.getContext(), ChunkSize,
		CGF.getContext().getIntTypeForBitwidth(32, /*Signed=*/0),
		SourceLocation());
}		}

lib/CodeGen/CGStmtOpenMP.cpp

Show First 20 Lines • Show All 2,000 Lines • ▼ Show 20 Lines	void CodeGenFunction::EmitOMPDistributeOuterLoop(
const bool IVSigned = IVExpr->getType()->hasSignedIntegerRepresentation();		const bool IVSigned = IVExpr->getType()->hasSignedIntegerRepresentation();

CGOpenMPRuntime::StaticRTInput StaticInit(		CGOpenMPRuntime::StaticRTInput StaticInit(
IVSize, IVSigned, /* Ordered = */ false, LoopArgs.IL, LoopArgs.LB,		IVSize, IVSigned, /* Ordered = */ false, LoopArgs.IL, LoopArgs.LB,
LoopArgs.UB, LoopArgs.ST, LoopArgs.Chunk);		LoopArgs.UB, LoopArgs.ST, LoopArgs.Chunk);
RT.emitDistributeStaticInit(*this, S.getBeginLoc(), ScheduleKind, StaticInit);		RT.emitDistributeStaticInit(*this, S.getBeginLoc(), ScheduleKind, StaticInit);

// for combined 'distribute' and 'for' the increment expression of distribute		// for combined 'distribute' and 'for' the increment expression of distribute
// is store in DistInc. For 'distribute' alone, it is in Inc.		// is stored in DistInc. For 'distribute' alone, it is in Inc.
Expr *IncExpr;		Expr *IncExpr;
if (isOpenMPLoopBoundSharingDirective(S.getDirectiveKind()))		if (isOpenMPLoopBoundSharingDirective(S.getDirectiveKind()))
IncExpr = S.getDistInc();		IncExpr = S.getDistInc();
else		else
IncExpr = S.getInc();		IncExpr = S.getInc();

// this routine is shared by 'omp distribute parallel for' and		// this routine is shared by 'omp distribute parallel for' and
// 'omp distribute': select the right EUB expression depending on the		// 'omp distribute': select the right EUB expression depending on the
▲ Show 20 Lines • Show All 275 Lines • ▼ Show 20 Lines	// Emit 'then' code.
EmitOMPPrivateClause(S, LoopScope);		EmitOMPPrivateClause(S, LoopScope);
HasLastprivateClause = EmitOMPLastprivateClauseInit(S, LoopScope);		HasLastprivateClause = EmitOMPLastprivateClauseInit(S, LoopScope);
EmitOMPReductionClauseInit(S, LoopScope);		EmitOMPReductionClauseInit(S, LoopScope);
EmitOMPPrivateLoopCounters(S, LoopScope);		EmitOMPPrivateLoopCounters(S, LoopScope);
EmitOMPLinearClause(S, LoopScope);		EmitOMPLinearClause(S, LoopScope);
(void)LoopScope.Privatize();		(void)LoopScope.Privatize();

// Detect the loop schedule kind and chunk.		// Detect the loop schedule kind and chunk.
llvm::Value *Chunk = nullptr;		const Expr *ChunkExpr = nullptr;
OpenMPScheduleTy ScheduleKind;		OpenMPScheduleTy ScheduleKind;
if (const auto *C = S.getSingleClause<OMPScheduleClause>()) {		if (const auto *C = S.getSingleClause<OMPScheduleClause>()) {
ScheduleKind.Schedule = C->getScheduleKind();		ScheduleKind.Schedule = C->getScheduleKind();
ScheduleKind.M1 = C->getFirstScheduleModifier();		ScheduleKind.M1 = C->getFirstScheduleModifier();
ScheduleKind.M2 = C->getSecondScheduleModifier();		ScheduleKind.M2 = C->getSecondScheduleModifier();
if (const Expr *Ch = C->getChunkSize()) {		ChunkExpr = C->getChunkSize();
Chunk = EmitScalarExpr(Ch);
Chunk = EmitScalarConversion(Chunk, Ch->getType(),
S.getIterationVariable()->getType(),
S.getBeginLoc());
}
} else {		} else {
// Default behaviour for schedule clause.		// Default behaviour for schedule clause.
CGM.getOpenMPRuntime().getDefaultScheduleAndChunk(		CGM.getOpenMPRuntime().getDefaultScheduleAndChunk(
*this, S, ScheduleKind.Schedule, Chunk);		*this, S, ScheduleKind.Schedule, ChunkExpr);
		}
		bool HasChunkSizeOne = false;
		llvm::Value *Chunk = nullptr;
		if (ChunkExpr) {
		Chunk = EmitScalarExpr(ChunkExpr);
		Chunk = EmitScalarConversion(Chunk, ChunkExpr->getType(),
		S.getIterationVariable()->getType(),
		S.getBeginLoc());
		llvm::APSInt EvaluatedChunk;
		if (ChunkExpr->EvaluateAsInt(EvaluatedChunk, getContext()))
		HasChunkSizeOne = (EvaluatedChunk.getLimitedValue() == 1);
}		}
const unsigned IVSize = getContext().getTypeSize(IVExpr->getType());		const unsigned IVSize = getContext().getTypeSize(IVExpr->getType());
const bool IVSigned = IVExpr->getType()->hasSignedIntegerRepresentation();		const bool IVSigned = IVExpr->getType()->hasSignedIntegerRepresentation();
// OpenMP 4.5, 2.7.1 Loop Construct, Description.		// OpenMP 4.5, 2.7.1 Loop Construct, Description.
// If the static schedule kind is specified or if the ordered clause is		// If the static schedule kind is specified or if the ordered clause is
// specified, and if no monotonic modifier is specified, the effect will		// specified, and if no monotonic modifier is specified, the effect will
// be as if the monotonic modifier was specified.		// be as if the monotonic modifier was specified.
if (RT.isStaticNonchunked(ScheduleKind.Schedule,		bool StaticChunkedOne = RT.isStaticChunked(ScheduleKind.Schedule,
/* Chunked */ Chunk != nullptr) &&		/* Chunked */ Chunk != nullptr) && HasChunkSizeOne &&
		isOpenMPLoopBoundSharingDirective(S.getDirectiveKind());
		if ((RT.isStaticNonchunked(ScheduleKind.Schedule,
		/* Chunked */ Chunk != nullptr) \|\|
		StaticChunkedOne) &&
!Ordered) {		!Ordered) {
if (isOpenMPSimdDirective(S.getDirectiveKind()))		if (isOpenMPSimdDirective(S.getDirectiveKind()))
EmitOMPSimdInit(S, /*IsMonotonic=*/true);		EmitOMPSimdInit(S, /*IsMonotonic=*/true);
// OpenMP [2.7.1, Loop Construct, Description, table 2-1]		// OpenMP [2.7.1, Loop Construct, Description, table 2-1]
// When no chunk_size is specified, the iteration space is divided into		// When no chunk_size is specified, the iteration space is divided into
// chunks that are approximately equal in size, and at most one chunk is		// chunks that are approximately equal in size, and at most one chunk is
// distributed to each thread. Note that the size of the chunks is		// distributed to each thread. Note that the size of the chunks is
// unspecified in this case.		// unspecified in this case.
CGOpenMPRuntime::StaticRTInput StaticInit(		CGOpenMPRuntime::StaticRTInput StaticInit(
IVSize, IVSigned, Ordered, IL.getAddress(), LB.getAddress(),		IVSize, IVSigned, Ordered, IL.getAddress(), LB.getAddress(),
UB.getAddress(), ST.getAddress());		UB.getAddress(), ST.getAddress(),
		StaticChunkedOne ? Chunk : nullptr);
RT.emitForStaticInit(*this, S.getBeginLoc(), S.getDirectiveKind(),		RT.emitForStaticInit(*this, S.getBeginLoc(), S.getDirectiveKind(),
ScheduleKind, StaticInit);		ScheduleKind, StaticInit);
JumpDest LoopExit =		JumpDest LoopExit =
getJumpDestInCurrentScope(createBasicBlock("omp.loop.exit"));		getJumpDestInCurrentScope(createBasicBlock("omp.loop.exit"));
// UB = min(UB, GlobalUB);		// UB = min(UB, GlobalUB);
		if (!StaticChunkedOne)
EmitIgnoredExpr(S.getEnsureUpperBound());		EmitIgnoredExpr(S.getEnsureUpperBound());
// IV = LB;		// IV = LB;
EmitIgnoredExpr(S.getInit());		EmitIgnoredExpr(S.getInit());
// while (idx <= UB) { BODY; ++idx; }		// For unchunked static schedule generate:
EmitOMPInnerLoop(S, LoopScope.requiresCleanups(), S.getCond(),		//
S.getInc(),		// while (idx <= UB) {
		// BODY;
		// ++idx;
		// }
		//
		// For static schedule with chunk one:
		//
		// while (IV <= PrevUB) {
		// BODY;
		// IV += ST;
		// }
		EmitOMPInnerLoop(S, LoopScope.requiresCleanups(),
		StaticChunkedOne ? S.getCombinedParForInDistCond() : S.getCond(),
		StaticChunkedOne ? S.getDistInc() : S.getInc(),
[&S, LoopExit](CodeGenFunction &CGF) {		[&S, LoopExit](CodeGenFunction &CGF) {
CGF.EmitOMPLoopBody(S, LoopExit);		CGF.EmitOMPLoopBody(S, LoopExit);
CGF.EmitStopPoint(&S);		CGF.EmitStopPoint(&S);
},		},
[](CodeGenFunction &) {});		[](CodeGenFunction &) {});
EmitBlock(LoopExit.getBlock());		EmitBlock(LoopExit.getBlock());
// Tell the runtime we are done.		// Tell the runtime we are done.
auto &&CodeGen = [&S](CodeGenFunction &CGF) {		auto &&CodeGen = [&S](CodeGenFunction &CGF) {
CGF.CGM.getOpenMPRuntime().emitForStaticFinish(CGF, S.getEndLoc(),		CGF.CGM.getOpenMPRuntime().emitForStaticFinish(CGF, S.getEndLoc(),
S.getDirectiveKind());		S.getDirectiveKind());
};		};
OMPCancelStack.emitExit(*this, S.getDirectiveKind(), CodeGen);		OMPCancelStack.emitExit(*this, S.getDirectiveKind(), CodeGen);
} else {		} else {
		ABataevUnsubmitted Done Reply Inline Actions This whole code is very similar to the unchunked case. Could you merge it? ABataev: This whole code is very similar to the unchunked case. Could you merge it?
		ABataevUnsubmitted Not Done Reply Inline Actions What about this? ABataev: What about this?
const bool IsMonotonic =		const bool IsMonotonic =
Ordered \|\| ScheduleKind.Schedule == OMPC_SCHEDULE_static \|\|		Ordered \|\| ScheduleKind.Schedule == OMPC_SCHEDULE_static \|\|
		ABataevUnsubmitted Done Reply Inline Actions It allows you to check only the implicit case, what about if the user explicitly specifies that `chunk` is `1`? ABataev: It allows you to check only the implicit case, what about if the user explicitly specifies that…
ScheduleKind.Schedule == OMPC_SCHEDULE_unknown \|\|		ScheduleKind.Schedule == OMPC_SCHEDULE_unknown \|\|
ScheduleKind.M1 == OMPC_SCHEDULE_MODIFIER_monotonic \|\|		ScheduleKind.M1 == OMPC_SCHEDULE_MODIFIER_monotonic \|\|
ScheduleKind.M2 == OMPC_SCHEDULE_MODIFIER_monotonic;		ScheduleKind.M2 == OMPC_SCHEDULE_MODIFIER_monotonic;
// Emit the outer loop, which requests its work chunk [LB..UB] from		// Emit the outer loop, which requests its work chunk [LB..UB] from
// runtime and runs the inner loop to process it.		// runtime and runs the inner loop to process it.
const OMPLoopArguments LoopArguments(LB.getAddress(), UB.getAddress(),		const OMPLoopArguments LoopArguments(LB.getAddress(), UB.getAddress(),
ST.getAddress(), IL.getAddress(),		ST.getAddress(), IL.getAddress(),
Chunk, EUB);		Chunk, EUB);
▲ Show 20 Lines • Show All 969 Lines • ▼ Show 20 Lines	// Emit 'then' code.
// OpenMP [2.10.8, distribute Construct, Description]		// OpenMP [2.10.8, distribute Construct, Description]
// If dist_schedule is specified, kind must be static. If specified,		// If dist_schedule is specified, kind must be static. If specified,
// iterations are divided into chunks of size chunk_size, chunks are		// iterations are divided into chunks of size chunk_size, chunks are
// assigned to the teams of the league in a round-robin fashion in the		// assigned to the teams of the league in a round-robin fashion in the
// order of the team number. When no chunk_size is specified, the		// order of the team number. When no chunk_size is specified, the
// iteration space is divided into chunks that are approximately equal		// iteration space is divided into chunks that are approximately equal
// in size, and at most one chunk is distributed to each team of the		// in size, and at most one chunk is distributed to each team of the
// league. The size of the chunks is unspecified in this case.		// league. The size of the chunks is unspecified in this case.
		bool StaticChunked = RT.isStaticChunked(
		ScheduleKind, /* Chunked */ Chunk != nullptr) &&
		isOpenMPLoopBoundSharingDirective(S.getDirectiveKind());
if (RT.isStaticNonchunked(ScheduleKind,		if (RT.isStaticNonchunked(ScheduleKind,
/* Chunked */ Chunk != nullptr)) {		/* Chunked */ Chunk != nullptr) \|\|
		StaticChunked) {
if (isOpenMPSimdDirective(S.getDirectiveKind()))		if (isOpenMPSimdDirective(S.getDirectiveKind()))
EmitOMPSimdInit(S, /IsMonotonic=/true);		EmitOMPSimdInit(S, /IsMonotonic=/true);
CGOpenMPRuntime::StaticRTInput StaticInit(		CGOpenMPRuntime::StaticRTInput StaticInit(
IVSize, IVSigned, /* Ordered = */ false, IL.getAddress(),		IVSize, IVSigned, /* Ordered = */ false, IL.getAddress(),
LB.getAddress(), UB.getAddress(), ST.getAddress());		LB.getAddress(), UB.getAddress(), ST.getAddress(),
		StaticChunked ? Chunk : nullptr);
RT.emitDistributeStaticInit(*this, S.getBeginLoc(), ScheduleKind,		RT.emitDistributeStaticInit(*this, S.getBeginLoc(), ScheduleKind,
StaticInit);		StaticInit);
JumpDest LoopExit =		JumpDest LoopExit =
getJumpDestInCurrentScope(createBasicBlock("omp.loop.exit"));		getJumpDestInCurrentScope(createBasicBlock("omp.loop.exit"));
// UB = min(UB, GlobalUB);		// UB = min(UB, GlobalUB);
EmitIgnoredExpr(isOpenMPLoopBoundSharingDirective(S.getDirectiveKind())		EmitIgnoredExpr(isOpenMPLoopBoundSharingDirective(S.getDirectiveKind())
		ABataevUnsubmitted Done Reply Inline Actions Restore the original code here, the logic can be simplified ABataev: Restore the original code here, the logic can be simplified
? S.getCombinedEnsureUpperBound()		? S.getCombinedEnsureUpperBound()
: S.getEnsureUpperBound());		: S.getEnsureUpperBound());
// IV = LB;		// IV = LB;
EmitIgnoredExpr(isOpenMPLoopBoundSharingDirective(S.getDirectiveKind())		EmitIgnoredExpr(isOpenMPLoopBoundSharingDirective(S.getDirectiveKind())
		ABataevUnsubmitted Done Reply Inline Actions The same ABataev: The same
? S.getCombinedInit()		? S.getCombinedInit()
: S.getInit());		: S.getInit());

const Expr *Cond =		const Expr *Cond =
isOpenMPLoopBoundSharingDirective(S.getDirectiveKind())		isOpenMPLoopBoundSharingDirective(S.getDirectiveKind())
? S.getCombinedCond()		? S.getCombinedCond()
: S.getCond();		: S.getCond();

// for distribute alone, codegen		if (StaticChunked)
// while (idx <= UB) { BODY; ++idx; }		Cond = S.getCombinedDistCond();
// when combined with 'for' (e.g. as in 'distribute parallel for')
// while (idx <= UB) { <CodeGen rest of pragma>; idx += ST; }		// For static unchunked schedules generate:
		//
		// 1. For distribute alone, codegen
		// while (idx <= UB) {
		// BODY;
		// ++idx;
		// }
		//
		// 2. When combined with 'for' (e.g. as in 'distribute parallel for')
		// while (idx <= UB) {
		// <CodeGen rest of pragma>(LB, UB);
		// idx += ST;
		// }
		//
		// For static chunked schedules on loop bound sharing directives generate:
		//
		// while (IV <= GlobalUB) {
		// <CodeGen rest of pragma>(LB, UB);
		// LB += ST;
		// UB += ST;
		// UB = min(UB, GlobalUB);
		// IV = LB;
		// }
		//
EmitOMPInnerLoop(S, LoopScope.requiresCleanups(), Cond, IncExpr,		EmitOMPInnerLoop(S, LoopScope.requiresCleanups(), Cond, IncExpr,
[&S, LoopExit, &CodeGenLoop](CodeGenFunction &CGF) {		[&S, LoopExit, &CodeGenLoop](CodeGenFunction &CGF) {
CodeGenLoop(CGF, S, LoopExit);		CodeGenLoop(CGF, S, LoopExit);
},		},
[](CodeGenFunction &) {});		[&S, StaticChunked](CodeGenFunction &CGF) {
		if (StaticChunked) {
		CGF.EmitIgnoredExpr(S.getCombinedNextLowerBound());
		CGF.EmitIgnoredExpr(S.getCombinedNextUpperBound());
		CGF.EmitIgnoredExpr(S.getCombinedEnsureUpperBound());
		CGF.EmitIgnoredExpr(S.getCombinedInit());
		}
		});
EmitBlock(LoopExit.getBlock());		EmitBlock(LoopExit.getBlock());
// Tell the runtime we are done.		// Tell the runtime we are done.
RT.emitForStaticFinish(*this, S.getBeginLoc(), S.getDirectiveKind());		RT.emitForStaticFinish(*this, S.getBeginLoc(), S.getDirectiveKind());
} else {		} else {
		ABataevUnsubmitted Done Reply Inline Actions Again, very similar to the unchunked code. Merge it. ABataev: Again, very similar to the unchunked code. Merge it.
		ABataevUnsubmitted Not Done Reply Inline Actions ? ABataev: ?
// Emit the outer loop, which requests its work chunk [LB..UB] from		// Emit the outer loop, which requests its work chunk [LB..UB] from
// runtime and runs the inner loop to process it.		// runtime and runs the inner loop to process it.
const OMPLoopArguments LoopArguments = {		const OMPLoopArguments LoopArguments = {
LB.getAddress(), UB.getAddress(), ST.getAddress(), IL.getAddress(),		LB.getAddress(), UB.getAddress(), ST.getAddress(), IL.getAddress(),
Chunk};		Chunk};
EmitOMPDistributeOuterLoop(ScheduleKind, S, LoopScope, LoopArguments,		EmitOMPDistributeOuterLoop(ScheduleKind, S, LoopScope, LoopArguments,
CodeGenLoop);		CodeGenLoop);
}		}
if (isOpenMPSimdDirective(S.getDirectiveKind())) {		if (isOpenMPSimdDirective(S.getDirectiveKind())) {
EmitOMPSimdFinal(S, [IL, &S](CodeGenFunction &CGF) {		EmitOMPSimdFinal(S, [IL, &S](CodeGenFunction &CGF) {
return CGF.Builder.CreateIsNotNull(		return CGF.Builder.CreateIsNotNull(
CGF.EmitLoadOfScalar(IL, S.getBeginLoc()));		CGF.EmitLoadOfScalar(IL, S.getBeginLoc()));
});		});
}		}
if (isOpenMPSimdDirective(S.getDirectiveKind()) &&		if (isOpenMPSimdDirective(S.getDirectiveKind()) &&
!isOpenMPParallelDirective(S.getDirectiveKind()) &&		!isOpenMPParallelDirective(S.getDirectiveKind()) &&
!isOpenMPTeamsDirective(S.getDirectiveKind())) {		!isOpenMPTeamsDirective(S.getDirectiveKind())) {
EmitOMPReductionClauseFinal(S, OMPD_simd);		EmitOMPReductionClauseFinal(S, OMPD_simd);
// Emit post-update of the reduction variables if IsLastIter != 0.		// Emit post-update of the reduction variables if IsLastIter != 0.
emitPostUpdateForReductionClause(		emitPostUpdateForReductionClause(
*this, S, [IL, &S](CodeGenFunction &CGF) {		*this, S, [IL, &S](CodeGenFunction &CGF) {
return CGF.Builder.CreateIsNotNull(		return CGF.Builder.CreateIsNotNull(
CGF.EmitLoadOfScalar(IL, S.getBeginLoc()));		CGF.EmitLoadOfScalar(IL, S.getBeginLoc()));
});		});
}		}
// Emit final copy of the lastprivate variables if IsLastIter != 0.		// Emit final copy of the lastprivate variables if IsLastIter != 0.
if (HasLastprivateClause) {		if (HasLastprivateClause) {
EmitOMPLastprivateClauseFinal(		EmitOMPLastprivateClauseFinal(
S, /NoFinals=/false,		S, /NoFinals=/false,
Builder.CreateIsNotNull(EmitLoadOfScalar(IL, S.getBeginLoc())));		Builder.CreateIsNotNull(EmitLoadOfScalar(IL, S.getBeginLoc())));
}		}
}		}

// We're now done with the loop, so jump to the continuation block.		// We're now done with the loop, so jump to the continuation block.
if (ContBlock) {		if (ContBlock) {
EmitBranch(ContBlock);		EmitBranch(ContBlock);
		ABataevUnsubmitted Done Reply Inline Actions Please, simplify this ABataev: Please, simplify this
EmitBlock(ContBlock, true);		EmitBlock(ContBlock, true);
}		}
}		}
}		}

void CodeGenFunction::EmitOMPDistributeDirective(		void CodeGenFunction::EmitOMPDistributeDirective(
const OMPDistributeDirective &S) {		const OMPDistributeDirective &S) {
auto &&CodeGen = [&S](CodeGenFunction &CGF, PrePostActionTy &) {		auto &&CodeGen = [&S](CodeGenFunction &CGF, PrePostActionTy &) {
▲ Show 20 Lines • Show All 1,557 Lines • Show Last 20 Lines

lib/Sema/SemaOpenMP.cpp

This file is larger than 256 KB, so syntax highlighting is disabled by default.

Show First 20 Lines • Show All 348 Lines • ▼ Show 20 Lines	OpenMPDirectiveKind getDirective(unsigned Level) const {
return Stack.back().first[Level].Directive;		return Stack.back().first[Level].Directive;
}		}
/// Returns parent directive.		/// Returns parent directive.
OpenMPDirectiveKind getParentDirective() const {		OpenMPDirectiveKind getParentDirective() const {
if (isStackEmpty() \|\| Stack.back().first.size() == 1)		if (isStackEmpty() \|\| Stack.back().first.size() == 1)
return OMPD_unknown;		return OMPD_unknown;
return std::next(Stack.back().first.rbegin())->Directive;		return std::next(Stack.back().first.rbegin())->Directive;
}		}

/// Add requires decl to internal vector		/// Add requires decl to internal vector
void addRequiresDecl(OMPRequiresDecl *RD) {		void addRequiresDecl(OMPRequiresDecl *RD) {
RequiresDecls.push_back(RD);		RequiresDecls.push_back(RD);
}		}

/// Checks for a duplicate clause amongst previously declared requires		/// Checks for a duplicate clause amongst previously declared requires
/// directives		/// directives
bool hasDuplicateRequiresClause(ArrayRef<OMPClause *> ClauseList) const {		bool hasDuplicateRequiresClause(ArrayRef<OMPClause *> ClauseList) const {
Show All 10 Lines	for (OMPClause *CNew : ClauseList) {
<< getOpenMPClauseName(CPrev->getClauseKind());		<< getOpenMPClauseName(CPrev->getClauseKind());
IsDuplicate = true;		IsDuplicate = true;
}		}
}		}
}		}
}		}
return IsDuplicate;		return IsDuplicate;
}		}

/// Set default data sharing attribute to none.		/// Set default data sharing attribute to none.
void setDefaultDSANone(SourceLocation Loc) {		void setDefaultDSANone(SourceLocation Loc) {
assert(!isStackEmpty());		assert(!isStackEmpty());
Stack.back().first.back().DefaultAttr = DSA_none;		Stack.back().first.back().DefaultAttr = DSA_none;
Stack.back().first.back().DefaultAttrLoc = Loc;		Stack.back().first.back().DefaultAttrLoc = Loc;
}		}
/// Set default data sharing attribute to shared.		/// Set default data sharing attribute to shared.
void setDefaultDSAShared(SourceLocation Loc) {		void setDefaultDSAShared(SourceLocation Loc) {
▲ Show 20 Lines • Show All 4,803 Lines • ▼ Show 20 Lines	checkOpenMPLoop(OpenMPDirectiveKind DKind, Expr *CollapseLoopCountExpr,
// Loop condition (IV < NumIterations) or (IV <= UB) for worksharing loops.		// Loop condition (IV < NumIterations) or (IV <= UB) for worksharing loops.
SourceLocation CondLoc = AStmt->getBeginLoc();		SourceLocation CondLoc = AStmt->getBeginLoc();
ExprResult Cond =		ExprResult Cond =
(isOpenMPWorksharingDirective(DKind) \|\|		(isOpenMPWorksharingDirective(DKind) \|\|
isOpenMPTaskLoopDirective(DKind) \|\| isOpenMPDistributeDirective(DKind))		isOpenMPTaskLoopDirective(DKind) \|\| isOpenMPDistributeDirective(DKind))
? SemaRef.BuildBinOp(CurScope, CondLoc, BO_LE, IV.get(), UB.get())		? SemaRef.BuildBinOp(CurScope, CondLoc, BO_LE, IV.get(), UB.get())
: SemaRef.BuildBinOp(CurScope, CondLoc, BO_LT, IV.get(),		: SemaRef.BuildBinOp(CurScope, CondLoc, BO_LT, IV.get(),
NumIterations.get());		NumIterations.get());
		ExprResult CombDistCond;
		if (isOpenMPLoopBoundSharingDirective(DKind)) {
		CombDistCond =
		SemaRef.BuildBinOp(CurScope, CondLoc, BO_LE, IV.get(), NumIterations.get());
		ABataevUnsubmitted Done Reply Inline Actions Seems to me, you need to use `NumIterations` instead of `LastIteration` ABataev: Seems to me, you need to use `NumIterations` instead of `LastIteration`
		ABataevUnsubmitted Not Done Reply Inline Actions Add the tests for the collapsed loops. ABataev: Add the tests for the collapsed loops.
		}

ExprResult CombCond;		ExprResult CombCond;
if (isOpenMPLoopBoundSharingDirective(DKind)) {		if (isOpenMPLoopBoundSharingDirective(DKind)) {
CombCond =		CombCond =
SemaRef.BuildBinOp(CurScope, CondLoc, BO_LE, IV.get(), CombUB.get());		SemaRef.BuildBinOp(CurScope, CondLoc, BO_LE, IV.get(), CombUB.get());
}		}
// Loop increment (IV = IV + 1)		// Loop increment (IV = IV + 1)
SourceLocation IncLoc = AStmt->getBeginLoc();		SourceLocation IncLoc = AStmt->getBeginLoc();
ExprResult Inc =		ExprResult Inc =
▲ Show 20 Lines • Show All 58 Lines • ▼ Show 20 Lines	if (isOpenMPWorksharingDirective(DKind) \|\| isOpenMPTaskLoopDirective(DKind) \|\|
}		}
}		}

// Create increment expression for distribute loop when combined in a same		// Create increment expression for distribute loop when combined in a same
// directive with for as IV = IV + ST; ensure upper bound expression based		// directive with for as IV = IV + ST; ensure upper bound expression based
// on PrevUB instead of NumIterations - used to implement 'for' when found		// on PrevUB instead of NumIterations - used to implement 'for' when found
// in combination with 'distribute', like in 'distribute parallel for'		// in combination with 'distribute', like in 'distribute parallel for'
SourceLocation DistIncLoc = AStmt->getBeginLoc();		SourceLocation DistIncLoc = AStmt->getBeginLoc();
ExprResult DistCond, DistInc, PrevEUB;		ExprResult DistCond, DistInc, PrevEUB, ParForInDistCond;
if (isOpenMPLoopBoundSharingDirective(DKind)) {		if (isOpenMPLoopBoundSharingDirective(DKind)) {
DistCond = SemaRef.BuildBinOp(CurScope, CondLoc, BO_LE, IV.get(), UB.get());		DistCond = SemaRef.BuildBinOp(CurScope, CondLoc, BO_LE, IV.get(), UB.get());
assert(DistCond.isUsable() && "distribute cond expr was not built");		assert(DistCond.isUsable() && "distribute cond expr was not built");

DistInc =		DistInc =
SemaRef.BuildBinOp(CurScope, DistIncLoc, BO_Add, IV.get(), ST.get());		SemaRef.BuildBinOp(CurScope, DistIncLoc, BO_Add, IV.get(), ST.get());
assert(DistInc.isUsable() && "distribute inc expr was not built");		assert(DistInc.isUsable() && "distribute inc expr was not built");
DistInc = SemaRef.BuildBinOp(CurScope, DistIncLoc, BO_Assign, IV.get(),		DistInc = SemaRef.BuildBinOp(CurScope, DistIncLoc, BO_Assign, IV.get(),
DistInc.get());		DistInc.get());
DistInc = SemaRef.ActOnFinishFullExpr(DistInc.get());		DistInc = SemaRef.ActOnFinishFullExpr(DistInc.get());
assert(DistInc.isUsable() && "distribute inc expr was not built");		assert(DistInc.isUsable() && "distribute inc expr was not built");

// Build expression: UB = min(UB, prevUB) for #for in composite or combined		// Build expression: UB = min(UB, prevUB) for #for in composite or combined
// construct		// construct
SourceLocation DistEUBLoc = AStmt->getBeginLoc();		SourceLocation DistEUBLoc = AStmt->getBeginLoc();
ExprResult IsUBGreater =		ExprResult IsUBGreater =
SemaRef.BuildBinOp(CurScope, DistEUBLoc, BO_GT, UB.get(), PrevUB.get());		SemaRef.BuildBinOp(CurScope, DistEUBLoc, BO_GT, UB.get(), PrevUB.get());
ExprResult CondOp = SemaRef.ActOnConditionalOp(		ExprResult CondOp = SemaRef.ActOnConditionalOp(
DistEUBLoc, DistEUBLoc, IsUBGreater.get(), PrevUB.get(), UB.get());		DistEUBLoc, DistEUBLoc, IsUBGreater.get(), PrevUB.get(), UB.get());
PrevEUB = SemaRef.BuildBinOp(CurScope, DistIncLoc, BO_Assign, UB.get(),		PrevEUB = SemaRef.BuildBinOp(CurScope, DistIncLoc, BO_Assign, UB.get(),
CondOp.get());		CondOp.get());
PrevEUB = SemaRef.ActOnFinishFullExpr(PrevEUB.get());		PrevEUB = SemaRef.ActOnFinishFullExpr(PrevEUB.get());

		// Build IV <= PrevUB to be used when the parallel for is in combination with
		ABataevUnsubmitted Done Reply Inline Actions Fix the comment here ABataev: Fix the comment here
		// a distribute directive with schedule(static, 1)
		ParForInDistCond =
		SemaRef.BuildBinOp(CurScope, CondLoc, BO_LE, IV.get(), PrevUB.get());
}		}

// Build updates and final values of the loop counters.		// Build updates and final values of the loop counters.
bool HasErrors = false;		bool HasErrors = false;
Built.Counters.resize(NestedLoopCount);		Built.Counters.resize(NestedLoopCount);
Built.Inits.resize(NestedLoopCount);		Built.Inits.resize(NestedLoopCount);
Built.Updates.resize(NestedLoopCount);		Built.Updates.resize(NestedLoopCount);
Built.Finals.resize(NestedLoopCount);		Built.Finals.resize(NestedLoopCount);
▲ Show 20 Lines • Show All 107 Lines • ▼ Show 20 Lines	checkOpenMPLoop(OpenMPDirectiveKind DKind, Expr *CollapseLoopCountExpr,
Built.PrevEUB = PrevEUB.get();		Built.PrevEUB = PrevEUB.get();
Built.DistCombinedFields.LB = CombLB.get();		Built.DistCombinedFields.LB = CombLB.get();
Built.DistCombinedFields.UB = CombUB.get();		Built.DistCombinedFields.UB = CombUB.get();
Built.DistCombinedFields.EUB = CombEUB.get();		Built.DistCombinedFields.EUB = CombEUB.get();
Built.DistCombinedFields.Init = CombInit.get();		Built.DistCombinedFields.Init = CombInit.get();
Built.DistCombinedFields.Cond = CombCond.get();		Built.DistCombinedFields.Cond = CombCond.get();
Built.DistCombinedFields.NLB = CombNextLB.get();		Built.DistCombinedFields.NLB = CombNextLB.get();
Built.DistCombinedFields.NUB = CombNextUB.get();		Built.DistCombinedFields.NUB = CombNextUB.get();
		Built.DistCombinedFields.DistCond = CombDistCond.get();
		Built.DistCombinedFields.ParForInDistCond = ParForInDistCond.get();

return NestedLoopCount;		return NestedLoopCount;
}		}

static Expr getCollapseNumberExpr(ArrayRef<OMPClause > Clauses) {		static Expr getCollapseNumberExpr(ArrayRef<OMPClause > Clauses) {
auto CollapseClauses =		auto CollapseClauses =
OMPExecutableDirective::getClausesOfKind<OMPCollapseClause>(Clauses);		OMPExecutableDirective::getClausesOfKind<OMPCollapseClause>(Clauses);
if (CollapseClauses.begin() != CollapseClauses.end())		if (CollapseClauses.begin() != CollapseClauses.end())
▲ Show 20 Lines • Show All 8,111 Lines • Show Last 20 Lines

lib/Serialization/ASTReaderStmt.cpp

Show First 20 Lines • Show All 1,850 Lines • ▼ Show 20 Lines	if (isOpenMPLoopBoundSharingDirective(D->getDirectiveKind())) {
D->setPrevEnsureUpperBound(Record.readSubExpr());		D->setPrevEnsureUpperBound(Record.readSubExpr());
D->setCombinedLowerBoundVariable(Record.readSubExpr());		D->setCombinedLowerBoundVariable(Record.readSubExpr());
D->setCombinedUpperBoundVariable(Record.readSubExpr());		D->setCombinedUpperBoundVariable(Record.readSubExpr());
D->setCombinedEnsureUpperBound(Record.readSubExpr());		D->setCombinedEnsureUpperBound(Record.readSubExpr());
D->setCombinedInit(Record.readSubExpr());		D->setCombinedInit(Record.readSubExpr());
D->setCombinedCond(Record.readSubExpr());		D->setCombinedCond(Record.readSubExpr());
D->setCombinedNextLowerBound(Record.readSubExpr());		D->setCombinedNextLowerBound(Record.readSubExpr());
D->setCombinedNextUpperBound(Record.readSubExpr());		D->setCombinedNextUpperBound(Record.readSubExpr());
		D->setCombinedDistCond(Record.readSubExpr());
		D->setCombinedParForInDistCond(Record.readSubExpr());
}		}
SmallVector<Expr *, 4> Sub;		SmallVector<Expr *, 4> Sub;
unsigned CollapsedNum = D->getCollapsedNumber();		unsigned CollapsedNum = D->getCollapsedNumber();
Sub.reserve(CollapsedNum);		Sub.reserve(CollapsedNum);
for (unsigned i = 0; i < CollapsedNum; ++i)		for (unsigned i = 0; i < CollapsedNum; ++i)
Sub.push_back(Record.readSubExpr());		Sub.push_back(Record.readSubExpr());
D->setCounters(Sub);		D->setCounters(Sub);
Sub.clear();		Sub.clear();
▲ Show 20 Lines • Show All 1,407 Lines • Show Last 20 Lines

lib/Serialization/ASTWriterStmt.cpp

Show First 20 Lines • Show All 1,848 Lines • ▼ Show 20 Lines	if (isOpenMPLoopBoundSharingDirective(D->getDirectiveKind())) {
Record.AddStmt(D->getPrevEnsureUpperBound());		Record.AddStmt(D->getPrevEnsureUpperBound());
Record.AddStmt(D->getCombinedLowerBoundVariable());		Record.AddStmt(D->getCombinedLowerBoundVariable());
Record.AddStmt(D->getCombinedUpperBoundVariable());		Record.AddStmt(D->getCombinedUpperBoundVariable());
Record.AddStmt(D->getCombinedEnsureUpperBound());		Record.AddStmt(D->getCombinedEnsureUpperBound());
Record.AddStmt(D->getCombinedInit());		Record.AddStmt(D->getCombinedInit());
Record.AddStmt(D->getCombinedCond());		Record.AddStmt(D->getCombinedCond());
Record.AddStmt(D->getCombinedNextLowerBound());		Record.AddStmt(D->getCombinedNextLowerBound());
Record.AddStmt(D->getCombinedNextUpperBound());		Record.AddStmt(D->getCombinedNextUpperBound());
		Record.AddStmt(D->getCombinedDistCond());
		Record.AddStmt(D->getCombinedParForInDistCond());
}		}
for (auto I : D->counters()) {		for (auto I : D->counters()) {
Record.AddStmt(I);		Record.AddStmt(I);
}		}
for (auto I : D->private_counters()) {		for (auto I : D->private_counters()) {
Record.AddStmt(I);		Record.AddStmt(I);
}		}
for (auto I : D->inits()) {		for (auto I : D->inits()) {
▲ Show 20 Lines • Show All 432 Lines • Show Last 20 Lines

test/OpenMP/distribute_parallel_for_codegen.cpp

Show First 20 Lines • Show All 401 Lines • ▼ Show 20 Lines	a[i] = b[i] + c[i];
// LAMBDA: define{{.+}} void [[OFFLOADING_FUN_3]](		// LAMBDA: define{{.+}} void [[OFFLOADING_FUN_3]](
// LAMBDA: call {{.}}void {{.+}} @__kmpc_fork_teams({{.+}}, i32 5, {{.+}} [[OMP_OUTLINED_3:@.+]] to {{.+}})		// LAMBDA: call {{.}}void {{.+}} @__kmpc_fork_teams({{.+}}, i32 5, {{.+}} [[OMP_OUTLINED_3:@.+]] to {{.+}})

#pragma omp distribute parallel for dist_schedule(static, ch)		#pragma omp distribute parallel for dist_schedule(static, ch)
for (int i = 0; i < n; ++i) {		for (int i = 0; i < n; ++i) {
a[i] = b[i] + c[i];		a[i] = b[i] + c[i];
// LAMBDA: define{{.+}} void [[OMP_OUTLINED_3]](		// LAMBDA: define{{.+}} void [[OMP_OUTLINED_3]](
// LAMBDA-DAG: [[OMP_IV:%.omp.iv]] = alloca		// LAMBDA-DAG: [[OMP_IV:%.omp.iv]] = alloca
		// LAMBDA-DAG: [[OMP_CAPT_EXPR:%.capture_expr.1]] = alloca
		ABataevUnsubmitted Done Reply Inline Actions Bad check for names, you should not rely on them. ABataev: Bad check for names, you should not rely on them.
// LAMBDA-DAG: [[OMP_LB:%.omp.comb.lb]] = alloca		// LAMBDA-DAG: [[OMP_LB:%.omp.comb.lb]] = alloca
// LAMBDA-DAG: [[OMP_UB:%.omp.comb.ub]] = alloca		// LAMBDA-DAG: [[OMP_UB:%.omp.comb.ub]] = alloca
// LAMBDA-DAG: [[OMP_ST:%.omp.stride]] = alloca		// LAMBDA-DAG: [[OMP_ST:%.omp.stride]] = alloca

// unlike the previous tests, in this one we have an outer and inner loop for 'distribute'
// LAMBDA: call void @__kmpc_for_static_init_4({{.+}}, {{.+}}, i32 91,		// LAMBDA: call void @__kmpc_for_static_init_4({{.+}}, {{.+}}, i32 91,
// LAMBDA: br label %[[DIST_OUTER_LOOP_HEADER:.+]]

// LAMBDA: [[DIST_OUTER_LOOP_HEADER]]:
// check EUB for distribute		// check EUB for distribute
// LAMBDA-DAG: [[OMP_UB_VAL_1:%.+]] = load{{.+}} [[OMP_UB]],		// LAMBDA-DAG: [[OMP_UB_VAL_1:%.+]] = load{{.+}} [[OMP_UB]],
// LAMBDA: [[NUM_IT_1:%.+]] = load{{.+}},		// LAMBDA: [[NUM_IT_1:%.+]] = load{{.+}} [[OMP_CAPT_EXPR]],
// LAMBDA-DAG: [[CMP_UB_NUM_IT:%.+]] = icmp sgt {{.+}} [[OMP_UB_VAL_1]], [[NUM_IT_1]]		// LAMBDA-DAG: [[CMP_UB_NUM_IT:%.+]] = icmp sgt {{.+}} [[OMP_UB_VAL_1]], [[NUM_IT_1]]
// LAMBDA: br {{.+}} [[CMP_UB_NUM_IT]], label %[[EUB_TRUE:.+]], label %[[EUB_FALSE:.+]]		// LAMBDA: br {{.+}} [[CMP_UB_NUM_IT]], label %[[EUB_TRUE:.+]], label %[[EUB_FALSE:.+]]
// LAMBDA-DAG: [[EUB_TRUE]]:		// LAMBDA-DAG: [[EUB_TRUE]]:
// LAMBDA: [[NUM_IT_2:%.+]] = load{{.+}},		// LAMBDA: [[NUM_IT_2:%.+]] = load{{.+}},
// LAMBDA: br label %[[EUB_END:.+]]		// LAMBDA: br label %[[EUB_END:.+]]
// LAMBDA-DAG: [[EUB_FALSE]]:		// LAMBDA-DAG: [[EUB_FALSE]]:
// LAMBDA: [[OMP_UB_VAL2:%.+]] = load{{.+}} [[OMP_UB]],		// LAMBDA: [[OMP_UB_VAL2:%.+]] = load{{.+}} [[OMP_UB]],
// LAMBDA: br label %[[EUB_END]]		// LAMBDA: br label %[[EUB_END]]
// LAMBDA-DAG: [[EUB_END]]:		// LAMBDA-DAG: [[EUB_END]]:
// LAMBDA-DAG: [[EUB_RES:%.+]] = phi{{.+}} [ [[NUM_IT_2]], %[[EUB_TRUE]] ], [ [[OMP_UB_VAL2]], %[[EUB_FALSE]] ]		// LAMBDA-DAG: [[EUB_RES:%.+]] = phi{{.+}} [ [[NUM_IT_2]], %[[EUB_TRUE]] ], [ [[OMP_UB_VAL2]], %[[EUB_FALSE]] ]
// LAMBDA: store{{.+}} [[EUB_RES]], {{.+}}* [[OMP_UB]],		// LAMBDA: store{{.+}} [[EUB_RES]], {{.+}}* [[OMP_UB]],

// initialize omp.iv		// initialize omp.iv
// LAMBDA: [[OMP_LB_VAL_1:%.+]] = load{{.+}}, {{.+}}* [[OMP_LB]],		// LAMBDA: [[OMP_LB_VAL_1:%.+]] = load{{.+}}, {{.+}}* [[OMP_LB]],
// LAMBDA: store {{.+}} [[OMP_LB_VAL_1]], {{.+}}* [[OMP_IV]],		// LAMBDA: store {{.+}} [[OMP_LB_VAL_1]], {{.+}}* [[OMP_IV]],

// check exit condition		// check exit condition
// LAMBDA-DAG: [[OMP_IV_VAL_1:%.+]] = load {{.+}} [[OMP_IV]],		// LAMBDA-DAG: [[OMP_IV_VAL_1:%.+]] = load {{.+}} [[OMP_IV]],
// LAMBDA-DAG: [[OMP_UB_VAL_3:%.+]] = load {{.+}} [[OMP_UB]],		// LAMBDA-DAG: [[OMP_UB_VAL_3:%.+]] = load {{.+}} [[OMP_CAPT_EXPR]],
// LAMBDA: [[CMP_IV_UB:%.+]] = icmp sle {{.+}} [[OMP_IV_VAL_1]], [[OMP_UB_VAL_3]]		// LAMBDA-DAG: [[OMP_UB_VAL_3_PLUS_ONE:%.+]] = add {{.+}} [[OMP_UB_VAL_3]], 1
// LAMBDA: br {{.+}} [[CMP_IV_UB]], label %[[DIST_OUTER_LOOP_BODY:.+]], label %[[DIST_OUTER_LOOP_END:.+]]		// LAMBDA: [[CMP_IV_UB:%.+]] = icmp sle {{.+}} [[OMP_IV_VAL_1]], [[OMP_UB_VAL_3_PLUS_ONE]]
		// LAMBDA: br {{.+}} [[CMP_IV_UB]], label %[[DIST_INNER_LOOP_BODY:.+]], label %[[DIST_INNER_LOOP_END:.+]]
// LAMBDA: [[DIST_OUTER_LOOP_BODY]]:
// LAMBDA: br label %[[DIST_INNER_LOOP_HEADER:.+]]

// LAMBDA: [[DIST_INNER_LOOP_HEADER]]:
// LAMBDA-DAG: [[OMP_IV_VAL_2:%.+]] = load {{.+}} [[OMP_IV]],
// LAMBDA-DAG: [[OMP_UB_VAL_4:%.+]] = load {{.+}} [[OMP_UB]],
// LAMBDA: [[CMP_IV_UB_2:%.+]] = icmp sle {{.+}} [[OMP_IV_VAL_2]], [[OMP_UB_VAL_4]]
// LAMBDA: br{{.+}} [[CMP_IV_UB_2]], label %[[DIST_INNER_LOOP_BODY:.+]], label %[[DIST_INNER_LOOP_END:.+]]

// check that PrevLB and PrevUB are passed to the 'for'		// check that PrevLB and PrevUB are passed to the 'for'
// LAMBDA: [[DIST_INNER_LOOP_BODY]]:		// LAMBDA: [[DIST_INNER_LOOP_BODY]]:
// LAMBDA-DAG: [[OMP_PREV_LB:%.+]] = load {{.+}}, {{.+}} [[OMP_LB]],		// LAMBDA-DAG: [[OMP_PREV_LB:%.+]] = load {{.+}}, {{.+}} [[OMP_LB]],
// LAMBDA-64-DAG: [[OMP_PREV_LB_EXT:%.+]] = zext {{.+}} [[OMP_PREV_LB]] to {{.+}}		// LAMBDA-64-DAG: [[OMP_PREV_LB_EXT:%.+]] = zext {{.+}} [[OMP_PREV_LB]] to {{.+}}
// LAMBDA-DAG: [[OMP_PREV_UB:%.+]] = load {{.+}}, {{.+}} [[OMP_UB]],		// LAMBDA-DAG: [[OMP_PREV_UB:%.+]] = load {{.+}}, {{.+}} [[OMP_UB]],
// LAMBDA-64-DAG: [[OMP_PREV_UB_EXT:%.+]] = zext {{.+}} [[OMP_PREV_UB]] to {{.+}}		// LAMBDA-64-DAG: [[OMP_PREV_UB_EXT:%.+]] = zext {{.+}} [[OMP_PREV_UB]] to {{.+}}
// check that distlb and distub are properly passed to fork_call		// check that distlb and distub are properly passed to fork_call
// LAMBDA-64: call{{.+}} @__kmpc_fork_call({{.+}}, {{.+}}, {{.+}}[[OMP_PARFOR_OUTLINED_3:@.+]] to {{.+}}, i{{[0-9]+}} [[OMP_PREV_LB_EXT]], i{{[0-9]+}} [[OMP_PREV_UB_EXT]], {{.+}})		// LAMBDA-64: call{{.+}} @__kmpc_fork_call({{.+}}, {{.+}}, {{.+}}[[OMP_PARFOR_OUTLINED_3:@.+]] to {{.+}}, i{{[0-9]+}} [[OMP_PREV_LB_EXT]], i{{[0-9]+}} [[OMP_PREV_UB_EXT]], {{.+}})
// LAMBDA-32: call{{.+}} @__kmpc_fork_call({{.+}}, {{.+}}, {{.+}}[[OMP_PARFOR_OUTLINED_3:@.+]] to {{.+}}, i{{[0-9]+}} [[OMP_PREV_LB]], i{{[0-9]+}} [[OMP_PREV_UB]], {{.+}})		// LAMBDA-32: call{{.+}} @__kmpc_fork_call({{.+}}, {{.+}}, {{.+}}[[OMP_PARFOR_OUTLINED_3:@.+]] to {{.+}}, i{{[0-9]+}} [[OMP_PREV_LB]], i{{[0-9]+}} [[OMP_PREV_UB]], {{.+}})
// LAMBDA: br label %[[DIST_INNER_LOOP_INC:.+]]		// LAMBDA: br label %[[DIST_INNER_LOOP_INC:.+]]

// check DistInc		// check DistInc
// LAMBDA: [[DIST_INNER_LOOP_INC]]:		// LAMBDA: [[DIST_INNER_LOOP_INC]]:
// LAMBDA-DAG: [[OMP_IV_VAL_3:%.+]] = load {{.+}}, {{.+}}* [[OMP_IV]],		// LAMBDA-DAG: [[OMP_IV_VAL_3:%.+]] = load {{.+}}, {{.+}}* [[OMP_IV]],
// LAMBDA-DAG: [[OMP_ST_VAL_1:%.+]] = load {{.+}}, {{.+}}* [[OMP_ST]],		// LAMBDA-DAG: [[OMP_ST_VAL_1:%.+]] = load {{.+}}, {{.+}}* [[OMP_ST]],
// LAMBDA: [[OMP_IV_INC:%.+]] = add{{.+}} [[OMP_IV_VAL_3]], [[OMP_ST_VAL_1]]		// LAMBDA: [[OMP_IV_INC:%.+]] = add{{.+}} [[OMP_IV_VAL_3]], [[OMP_ST_VAL_1]]
// LAMBDA: store{{.+}} [[OMP_IV_INC]], {{.+}}* [[OMP_IV]],		// LAMBDA: store{{.+}} [[OMP_IV_INC]], {{.+}}* [[OMP_IV]],
// LAMBDA: br label %[[DIST_INNER_LOOP_HEADER]]

// LAMBDA: [[DIST_INNER_LOOP_END]]:
// LAMBDA: br label %[[DIST_OUTER_LOOP_INC:.+]]

// LAMBDA: [[DIST_OUTER_LOOP_INC]]:
// check NextLB and NextUB
// LAMBDA-DAG: [[OMP_LB_VAL_2:%.+]] = load{{.+}}, {{.+}} [[OMP_LB]],		// LAMBDA-DAG: [[OMP_LB_VAL_2:%.+]] = load{{.+}}, {{.+}} [[OMP_LB]],
// LAMBDA-DAG: [[OMP_ST_VAL_2:%.+]] = load{{.+}}, {{.+}} [[OMP_ST]],		// LAMBDA-DAG: [[OMP_ST_VAL_2:%.+]] = load{{.+}}, {{.+}} [[OMP_ST]],
// LAMBDA-DAG: [[OMP_LB_NEXT:%.+]] = add{{.+}} [[OMP_LB_VAL_2]], [[OMP_ST_VAL_2]]		// LAMBDA-DAG: [[OMP_LB_NEXT:%.+]] = add{{.+}} [[OMP_LB_VAL_2]], [[OMP_ST_VAL_2]]
// LAMBDA: store{{.+}} [[OMP_LB_NEXT]], {{.+}}* [[OMP_LB]],		// LAMBDA: store{{.+}} [[OMP_LB_NEXT]], {{.+}}* [[OMP_LB]],
// LAMBDA-DAG: [[OMP_UB_VAL_5:%.+]] = load{{.+}}, {{.+}} [[OMP_UB]],		// LAMBDA-DAG: [[OMP_UB_VAL_5:%.+]] = load{{.+}}, {{.+}} [[OMP_UB]],
// LAMBDA-DAG: [[OMP_ST_VAL_3:%.+]] = load{{.+}}, {{.+}} [[OMP_ST]],		// LAMBDA-DAG: [[OMP_ST_VAL_3:%.+]] = load{{.+}}, {{.+}} [[OMP_ST]],
// LAMBDA-DAG: [[OMP_UB_NEXT:%.+]] = add{{.+}} [[OMP_UB_VAL_5]], [[OMP_ST_VAL_3]]		// LAMBDA-DAG: [[OMP_UB_NEXT:%.+]] = add{{.+}} [[OMP_UB_VAL_5]], [[OMP_ST_VAL_3]]
// LAMBDA: store{{.+}} [[OMP_UB_NEXT]], {{.+}}* [[OMP_UB]],		// LAMBDA: store{{.+}} [[OMP_UB_NEXT]], {{.+}}* [[OMP_UB]],
// LAMBDA: br label %[[DIST_OUTER_LOOP_HEADER]]

// outer loop exit		// Update UB
// LAMBDA: [[DIST_OUTER_LOOP_END]]:		// LAMBDA-DAG: [[OMP_UB_VAL_6:%.+]] = load{{.+}}, {{.+}} [[OMP_UB]],
		// LAMBDA: [[OMP_EXPR_VAL:%.+]] = load{{.+}}, {{.+}} [[OMP_CAPT_EXPR]],
		// LAMBDA-DAG: [[CMP_UB_NUM_IT_1:%.+]] = icmp sgt {{.+}}[[OMP_UB_VAL_6]], [[OMP_EXPR_VAL]]
		// LAMBDA: br {{.+}} [[CMP_UB_NUM_IT_1]], label %[[EUB_TRUE_1:.+]], label %[[EUB_FALSE_1:.+]]
		// LAMBDA-DAG: [[EUB_TRUE_1]]:
		// LAMBDA: [[NUM_IT_3:%.+]] = load{{.+}} [[OMP_CAPT_EXPR]],
		// LAMBDA: br label %[[EUB_END_1:.+]]
		// LAMBDA-DAG: [[EUB_FALSE_1]]:
		// LAMBDA: [[OMP_UB_VAL3:%.+]] = load{{.+}} [[OMP_UB]],
		// LAMBDA: br label %[[EUB_END_1]]
		// LAMBDA-DAG: [[EUB_END_1]]:
		// LAMBDA-DAG: [[EUB_RES_1:%.+]] = phi{{.+}} [ [[NUM_IT_3]], %[[EUB_TRUE_1]] ], [ [[OMP_UB_VAL3]], %[[EUB_FALSE_1]] ]
		// LAMBDA: store{{.+}} [[EUB_RES_1]], {{.+}}* [[OMP_UB]],

		// Store LB in IV
		// LAMBDA-DAG: [[OMP_LB_VAL_3:%.+]] = load{{.+}}, {{.+}} [[OMP_LB]],
		// LAMBDA: store{{.+}} [[OMP_LB_VAL_3]], {{.+}}* [[OMP_IV]],

		// LAMBDA: [[DIST_INNER_LOOP_END]]:
		// LAMBDA: br label %[[LOOP_EXIT:.+]]

		// loop exit
		// LAMBDA: [[LOOP_EXIT]]:
// LAMBDA-DAG: call void @__kmpc_for_static_fini(		// LAMBDA-DAG: call void @__kmpc_for_static_fini(
// LAMBDA: ret		// LAMBDA: ret

// skip implementation of 'parallel for': using default scheduling and was tested above		// skip implementation of 'parallel for': using default scheduling and was tested above
[&]() {		[&]() {
a[i] = b[i] + c[i];		a[i] = b[i] + c[i];
}();		}();
}		}
▲ Show 20 Lines • Show All 653 Lines • ▼ Show 20 Lines	#else
// CHECK: define{{.+}} void [[OFFLOADING_FUN_3]](		// CHECK: define{{.+}} void [[OFFLOADING_FUN_3]](
// CHECK: call {{.}}void {{.+}} @__kmpc_fork_teams({{.+}}, i32 5, {{.+}} [[OMP_OUTLINED_3:@.+]] to {{.+}})		// CHECK: call {{.}}void {{.+}} @__kmpc_fork_teams({{.+}}, i32 5, {{.+}} [[OMP_OUTLINED_3:@.+]] to {{.+}})

#pragma omp distribute parallel for dist_schedule(static, ch)		#pragma omp distribute parallel for dist_schedule(static, ch)
for (int i = 0; i < n; ++i) {		for (int i = 0; i < n; ++i) {
a[i] = b[i] + c[i];		a[i] = b[i] + c[i];
// CHECK: define{{.+}} void [[OMP_OUTLINED_3]](		// CHECK: define{{.+}} void [[OMP_OUTLINED_3]](
// CHECK-DAG: [[OMP_IV:%.omp.iv]] = alloca		// CHECK-DAG: [[OMP_IV:%.omp.iv]] = alloca
		// CHECK-DAG: [[OMP_CAPT_EXPR:%.capture_expr.1]] = alloca
// CHECK-DAG: [[OMP_LB:%.omp.comb.lb]] = alloca		// CHECK-DAG: [[OMP_LB:%.omp.comb.lb]] = alloca
// CHECK-DAG: [[OMP_UB:%.omp.comb.ub]] = alloca		// CHECK-DAG: [[OMP_UB:%.omp.comb.ub]] = alloca
// CHECK-DAG: [[OMP_ST:%.omp.stride]] = alloca		// CHECK-DAG: [[OMP_ST:%.omp.stride]] = alloca

// unlike the previous tests, in this one we have a outer and inner loop for 'distribute'		// unlike the previous tests, in this one we have a outer and inner loop for 'distribute'
// CHECK: call void @__kmpc_for_static_init_4({{.+}}, {{.+}}, i32 91,		// CHECK: call void @__kmpc_for_static_init_4({{.+}}, {{.+}}, i32 91,
// CHECK: br label %[[DIST_OUTER_LOOP_HEADER:.+]]

// CHECK: [[DIST_OUTER_LOOP_HEADER]]:
// check EUB for distribute		// check EUB for distribute
// CHECK-DAG: [[OMP_UB_VAL_1:%.+]] = load{{.+}} [[OMP_UB]],		// CHECK-DAG: [[OMP_UB_VAL_1:%.+]] = load{{.+}} [[OMP_UB]],
// CHECK: [[NUM_IT_1:%.+]] = load{{.+}},		// CHECK: [[NUM_IT_1:%.+]] = load{{.+}} [[OMP_CAPT_EXPR]],
// CHECK-DAG: [[CMP_UB_NUM_IT:%.+]] = icmp sgt {{.+}} [[OMP_UB_VAL_1]], [[NUM_IT_1]]		// CHECK-DAG: [[CMP_UB_NUM_IT:%.+]] = icmp sgt {{.+}} [[OMP_UB_VAL_1]], [[NUM_IT_1]]
// CHECK: br {{.+}} [[CMP_UB_NUM_IT]], label %[[EUB_TRUE:.+]], label %[[EUB_FALSE:.+]]		// CHECK: br {{.+}} [[CMP_UB_NUM_IT]], label %[[EUB_TRUE:.+]], label %[[EUB_FALSE:.+]]
// CHECK-DAG: [[EUB_TRUE]]:		// CHECK-DAG: [[EUB_TRUE]]:
// CHECK: [[NUM_IT_2:%.+]] = load{{.+}},		// CHECK: [[NUM_IT_2:%.+]] = load{{.+}},
// CHECK: br label %[[EUB_END:.+]]		// CHECK: br label %[[EUB_END:.+]]
// CHECK-DAG: [[EUB_FALSE]]:		// CHECK-DAG: [[EUB_FALSE]]:
// CHECK: [[OMP_UB_VAL2:%.+]] = load{{.+}} [[OMP_UB]],		// CHECK: [[OMP_UB_VAL2:%.+]] = load{{.+}} [[OMP_UB]],
// CHECK: br label %[[EUB_END]]		// CHECK: br label %[[EUB_END]]
// CHECK-DAG: [[EUB_END]]:		// CHECK-DAG: [[EUB_END]]:
// CHECK-DAG: [[EUB_RES:%.+]] = phi{{.+}} [ [[NUM_IT_2]], %[[EUB_TRUE]] ], [ [[OMP_UB_VAL2]], %[[EUB_FALSE]] ]		// CHECK-DAG: [[EUB_RES:%.+]] = phi{{.+}} [ [[NUM_IT_2]], %[[EUB_TRUE]] ], [ [[OMP_UB_VAL2]], %[[EUB_FALSE]] ]
// CHECK: store{{.+}} [[EUB_RES]], {{.+}}* [[OMP_UB]],		// CHECK: store{{.+}} [[EUB_RES]], {{.+}}* [[OMP_UB]],

// initialize omp.iv		// initialize omp.iv
// CHECK: [[OMP_LB_VAL_1:%.+]] = load{{.+}}, {{.+}}* [[OMP_LB]],		// CHECK: [[OMP_LB_VAL_1:%.+]] = load{{.+}}, {{.+}}* [[OMP_LB]],
// CHECK: store {{.+}} [[OMP_LB_VAL_1]], {{.+}}* [[OMP_IV]],		// CHECK: store {{.+}} [[OMP_LB_VAL_1]], {{.+}}* [[OMP_IV]],

// check exit condition		// check exit condition
// CHECK-DAG: [[OMP_IV_VAL_1:%.+]] = load {{.+}} [[OMP_IV]],		// CHECK-DAG: [[OMP_IV_VAL_1:%.+]] = load {{.+}} [[OMP_IV]],
// CHECK-DAG: [[OMP_UB_VAL_3:%.+]] = load {{.+}} [[OMP_UB]],		// CHECK-DAG: [[OMP_UB_VAL_3:%.+]] = load {{.+}} [[OMP_CAPT_EXPR]],
// CHECK: [[CMP_IV_UB:%.+]] = icmp sle {{.+}} [[OMP_IV_VAL_1]], [[OMP_UB_VAL_3]]		// CHECK-DAG: [[OMP_UB_VAL_3_PLUS_ONE:%.+]] = add {{.+}} [[OMP_UB_VAL_3]], 1
// CHECK: br {{.+}} [[CMP_IV_UB]], label %[[DIST_OUTER_LOOP_BODY:.+]], label %[[DIST_OUTER_LOOP_END:.+]]		// CHECK: [[CMP_IV_UB:%.+]] = icmp sle {{.+}} [[OMP_IV_VAL_1]], [[OMP_UB_VAL_3_PLUS_ONE]]
		// CHECK: br {{.+}} [[CMP_IV_UB]], label %[[DIST_INNER_LOOP_BODY:.+]], label %[[DIST_INNER_LOOP_END:.+]]
// CHECK: [[DIST_OUTER_LOOP_BODY]]:
// CHECK: br label %[[DIST_INNER_LOOP_HEADER:.+]]

// CHECK: [[DIST_INNER_LOOP_HEADER]]:
// CHECK-DAG: [[OMP_IV_VAL_2:%.+]] = load {{.+}} [[OMP_IV]],
// CHECK-DAG: [[OMP_UB_VAL_4:%.+]] = load {{.+}} [[OMP_UB]],
// CHECK: [[CMP_IV_UB_2:%.+]] = icmp sle {{.+}} [[OMP_IV_VAL_2]], [[OMP_UB_VAL_4]]
// CHECK: br{{.+}} [[CMP_IV_UB_2]], label %[[DIST_INNER_LOOP_BODY:.+]], label %[[DIST_INNER_LOOP_END:.+]]

// check that PrevLB and PrevUB are passed to the 'for'		// check that PrevLB and PrevUB are passed to the 'for'
// CHECK: [[DIST_INNER_LOOP_BODY]]:		// CHECK: [[DIST_INNER_LOOP_BODY]]:
// CHECK-DAG: [[OMP_PREV_LB:%.+]] = load {{.+}}, {{.+}} [[OMP_LB]],		// CHECK-DAG: [[OMP_PREV_LB:%.+]] = load {{.+}}, {{.+}} [[OMP_LB]],
// CHECK-64-DAG: [[OMP_PREV_LB_EXT:%.+]] = zext {{.+}} [[OMP_PREV_LB]] to {{.+}}		// CHECK-64-DAG: [[OMP_PREV_LB_EXT:%.+]] = zext {{.+}} [[OMP_PREV_LB]] to {{.+}}
// CHECK-DAG: [[OMP_PREV_UB:%.+]] = load {{.+}}, {{.+}} [[OMP_UB]],		// CHECK-DAG: [[OMP_PREV_UB:%.+]] = load {{.+}}, {{.+}} [[OMP_UB]],
// CHECK-64-DAG: [[OMP_PREV_UB_EXT:%.+]] = zext {{.+}} [[OMP_PREV_UB]] to {{.+}}		// CHECK-64-DAG: [[OMP_PREV_UB_EXT:%.+]] = zext {{.+}} [[OMP_PREV_UB]] to {{.+}}
// check that distlb and distub are properly passed to fork_call		// check that distlb and distub are properly passed to fork_call
// CHECK-64: call{{.+}} @__kmpc_fork_call({{.+}}, {{.+}}, {{.+}}[[OMP_PARFOR_OUTLINED_3:@.+]] to {{.+}}, i{{[0-9]+}} [[OMP_PREV_LB_EXT]], i{{[0-9]+}} [[OMP_PREV_UB_EXT]], {{.+}})		// CHECK-64: call{{.+}} @__kmpc_fork_call({{.+}}, {{.+}}, {{.+}}[[OMP_PARFOR_OUTLINED_3:@.+]] to {{.+}}, i{{[0-9]+}} [[OMP_PREV_LB_EXT]], i{{[0-9]+}} [[OMP_PREV_UB_EXT]], {{.+}})
// CHECK-32: call{{.+}} @__kmpc_fork_call({{.+}}, {{.+}}, {{.+}}[[OMP_PARFOR_OUTLINED_3:@.+]] to {{.+}}, i{{[0-9]+}} [[OMP_PREV_LB]], i{{[0-9]+}} [[OMP_PREV_UB]], {{.+}})		// CHECK-32: call{{.+}} @__kmpc_fork_call({{.+}}, {{.+}}, {{.+}}[[OMP_PARFOR_OUTLINED_3:@.+]] to {{.+}}, i{{[0-9]+}} [[OMP_PREV_LB]], i{{[0-9]+}} [[OMP_PREV_UB]], {{.+}})
// CHECK: br label %[[DIST_INNER_LOOP_INC:.+]]		// CHECK: br label %[[DIST_INNER_LOOP_INC:.+]]

// check DistInc		// check DistInc
// CHECK: [[DIST_INNER_LOOP_INC]]:		// CHECK: [[DIST_INNER_LOOP_INC]]:
// CHECK-DAG: [[OMP_IV_VAL_3:%.+]] = load {{.+}}, {{.+}}* [[OMP_IV]],		// CHECK-DAG: [[OMP_IV_VAL_3:%.+]] = load {{.+}}, {{.+}}* [[OMP_IV]],
// CHECK-DAG: [[OMP_ST_VAL_1:%.+]] = load {{.+}}, {{.+}}* [[OMP_ST]],		// CHECK-DAG: [[OMP_ST_VAL_1:%.+]] = load {{.+}}, {{.+}}* [[OMP_ST]],
// CHECK: [[OMP_IV_INC:%.+]] = add{{.+}} [[OMP_IV_VAL_3]], [[OMP_ST_VAL_1]]		// CHECK: [[OMP_IV_INC:%.+]] = add{{.+}} [[OMP_IV_VAL_3]], [[OMP_ST_VAL_1]]
// CHECK: store{{.+}} [[OMP_IV_INC]], {{.+}}* [[OMP_IV]],		// CHECK: store{{.+}} [[OMP_IV_INC]], {{.+}}* [[OMP_IV]],
// CHECK: br label %[[DIST_INNER_LOOP_HEADER]]

// CHECK: [[DIST_INNER_LOOP_END]]:
// CHECK: br label %[[DIST_OUTER_LOOP_INC:.+]]

// CHECK: [[DIST_OUTER_LOOP_INC]]:
// check NextLB and NextUB
// CHECK-DAG: [[OMP_LB_VAL_2:%.+]] = load{{.+}}, {{.+}} [[OMP_LB]],		// CHECK-DAG: [[OMP_LB_VAL_2:%.+]] = load{{.+}}, {{.+}} [[OMP_LB]],
// CHECK-DAG: [[OMP_ST_VAL_2:%.+]] = load{{.+}}, {{.+}} [[OMP_ST]],		// CHECK-DAG: [[OMP_ST_VAL_2:%.+]] = load{{.+}}, {{.+}} [[OMP_ST]],
// CHECK-DAG: [[OMP_LB_NEXT:%.+]] = add{{.+}} [[OMP_LB_VAL_2]], [[OMP_ST_VAL_2]]		// CHECK-DAG: [[OMP_LB_NEXT:%.+]] = add{{.+}} [[OMP_LB_VAL_2]], [[OMP_ST_VAL_2]]
// CHECK: store{{.+}} [[OMP_LB_NEXT]], {{.+}}* [[OMP_LB]],		// CHECK: store{{.+}} [[OMP_LB_NEXT]], {{.+}}* [[OMP_LB]],
// CHECK-DAG: [[OMP_UB_VAL_5:%.+]] = load{{.+}}, {{.+}} [[OMP_UB]],		// CHECK-DAG: [[OMP_UB_VAL_5:%.+]] = load{{.+}}, {{.+}} [[OMP_UB]],
// CHECK-DAG: [[OMP_ST_VAL_3:%.+]] = load{{.+}}, {{.+}} [[OMP_ST]],		// CHECK-DAG: [[OMP_ST_VAL_3:%.+]] = load{{.+}}, {{.+}} [[OMP_ST]],
// CHECK-DAG: [[OMP_UB_NEXT:%.+]] = add{{.+}} [[OMP_UB_VAL_5]], [[OMP_ST_VAL_3]]		// CHECK-DAG: [[OMP_UB_NEXT:%.+]] = add{{.+}} [[OMP_UB_VAL_5]], [[OMP_ST_VAL_3]]
// CHECK: store{{.+}} [[OMP_UB_NEXT]], {{.+}}* [[OMP_UB]],		// CHECK: store{{.+}} [[OMP_UB_NEXT]], {{.+}}* [[OMP_UB]],
// CHECK: br label %[[DIST_OUTER_LOOP_HEADER]]

// outer loop exit		// Update UB
// CHECK: [[DIST_OUTER_LOOP_END]]:		// CHECK-DAG: [[OMP_UB_VAL_6:%.+]] = load{{.+}}, {{.+}} [[OMP_UB]],
		// CHECK: [[OMP_EXPR_VAL:%.+]] = load{{.+}}, {{.+}} [[OMP_CAPT_EXPR]],
		// CHECK-DAG: [[CMP_UB_NUM_IT_1:%.+]] = icmp sgt {{.+}}[[OMP_UB_VAL_6]], [[OMP_EXPR_VAL]]
		// CHECK: br {{.+}} [[CMP_UB_NUM_IT_1]], label %[[EUB_TRUE_1:.+]], label %[[EUB_FALSE_1:.+]]
		// CHECK-DAG: [[EUB_TRUE_1]]:
		// CHECK: [[NUM_IT_3:%.+]] = load{{.+}} [[OMP_CAPT_EXPR]],
		// CHECK: br label %[[EUB_END_1:.+]]
		// CHECK-DAG: [[EUB_FALSE_1]]:
		// CHECK: [[OMP_UB_VAL3:%.+]] = load{{.+}} [[OMP_UB]],
		// CHECK: br label %[[EUB_END_1]]
		// CHECK-DAG: [[EUB_END_1]]:
		// CHECK-DAG: [[EUB_RES_1:%.+]] = phi{{.+}} [ [[NUM_IT_3]], %[[EUB_TRUE_1]] ], [ [[OMP_UB_VAL3]], %[[EUB_FALSE_1]] ]
		// CHECK: store{{.+}} [[EUB_RES_1]], {{.+}}* [[OMP_UB]],

		// Store LB in IV
		// CHECK-DAG: [[OMP_LB_VAL_3:%.+]] = load{{.+}}, {{.+}} [[OMP_LB]],
		// CHECK: store{{.+}} [[OMP_LB_VAL_3]], {{.+}}* [[OMP_IV]],

		// CHECK: [[DIST_INNER_LOOP_END]]:
		// CHECK: br label %[[LOOP_EXIT:.+]]

		// loop exit
		// CHECK: [[LOOP_EXIT]]:
// CHECK-DAG: call void @__kmpc_for_static_fini(		// CHECK-DAG: call void @__kmpc_for_static_fini(
// CHECK: ret		// CHECK: ret

// skip implementation of 'parallel for': using default scheduling and was tested above		// skip implementation of 'parallel for': using default scheduling and was tested above
}		}

// schedule: static no chunk		// schedule: static no chunk
#pragma omp target		#pragma omp target
▲ Show 20 Lines • Show All 618 Lines • ▼ Show 20 Lines
// CHECK-DAG: call void @__kmpc_for_static_fini(		// CHECK-DAG: call void @__kmpc_for_static_fini(
// CHECK: ret		// CHECK: ret

// CHECK: define{{.+}} void [[OFFLOADING_FUN_3]](		// CHECK: define{{.+}} void [[OFFLOADING_FUN_3]](
// CHECK: call {{.}}void {{.+}} @__kmpc_fork_teams({{.+}}, i32 5, {{.+}} [[OMP_OUTLINED_3:@.+]] to {{.+}})		// CHECK: call {{.}}void {{.+}} @__kmpc_fork_teams({{.+}}, i32 5, {{.+}} [[OMP_OUTLINED_3:@.+]] to {{.+}})

// CHECK: define{{.+}} void [[OMP_OUTLINED_3]](		// CHECK: define{{.+}} void [[OMP_OUTLINED_3]](
// CHECK-DAG: [[OMP_IV:%.omp.iv]] = alloca		// CHECK-DAG: [[OMP_IV:%.omp.iv]] = alloca
		// CHECK-DAG: [[OMP_CAPT_EXPR:%.capture_expr.1]] = alloca
// CHECK-DAG: [[OMP_LB:%.omp.comb.lb]] = alloca		// CHECK-DAG: [[OMP_LB:%.omp.comb.lb]] = alloca
// CHECK-DAG: [[OMP_UB:%.omp.comb.ub]] = alloca		// CHECK-DAG: [[OMP_UB:%.omp.comb.ub]] = alloca
// CHECK-DAG: [[OMP_ST:%.omp.stride]] = alloca		// CHECK-DAG: [[OMP_ST:%.omp.stride]] = alloca

// unlike the previous tests, in this one we have a outer and inner loop for 'distribute'		// unlike the previous tests, in this one we have a outer and inner loop for 'distribute'
// CHECK: call void @__kmpc_for_static_init_4({{.+}}, {{.+}}, i32 91,		// CHECK: call void @__kmpc_for_static_init_4({{.+}}, {{.+}}, i32 91,
// CHECK: br label %[[DIST_OUTER_LOOP_HEADER:.+]]

// CHECK: [[DIST_OUTER_LOOP_HEADER]]:
// check EUB for distribute		// check EUB for distribute
// CHECK-DAG: [[OMP_UB_VAL_1:%.+]] = load{{.+}} [[OMP_UB]],		// CHECK-DAG: [[OMP_UB_VAL_1:%.+]] = load{{.+}} [[OMP_UB]],
// CHECK: [[NUM_IT_1:%.+]] = load{{.+}},		// CHECK: [[NUM_IT_1:%.+]] = load{{.+}} [[OMP_CAPT_EXPR]],
// CHECK-DAG: [[CMP_UB_NUM_IT:%.+]] = icmp sgt {{.+}} [[OMP_UB_VAL_1]], [[NUM_IT_1]]		// CHECK-DAG: [[CMP_UB_NUM_IT:%.+]] = icmp sgt {{.+}} [[OMP_UB_VAL_1]], [[NUM_IT_1]]
// CHECK: br {{.+}} [[CMP_UB_NUM_IT]], label %[[EUB_TRUE:.+]], label %[[EUB_FALSE:.+]]		// CHECK: br {{.+}} [[CMP_UB_NUM_IT]], label %[[EUB_TRUE:.+]], label %[[EUB_FALSE:.+]]
// CHECK-DAG: [[EUB_TRUE]]:		// CHECK-DAG: [[EUB_TRUE]]:
// CHECK: [[NUM_IT_2:%.+]] = load{{.+}},		// CHECK: [[NUM_IT_2:%.+]] = load{{.+}},
// CHECK: br label %[[EUB_END:.+]]		// CHECK: br label %[[EUB_END:.+]]
// CHECK-DAG: [[EUB_FALSE]]:		// CHECK-DAG: [[EUB_FALSE]]:
// CHECK: [[OMP_UB_VAL2:%.+]] = load{{.+}} [[OMP_UB]],		// CHECK: [[OMP_UB_VAL2:%.+]] = load{{.+}} [[OMP_UB]],
// CHECK: br label %[[EUB_END]]		// CHECK: br label %[[EUB_END]]
// CHECK-DAG: [[EUB_END]]:		// CHECK-DAG: [[EUB_END]]:
// CHECK-DAG: [[EUB_RES:%.+]] = phi{{.+}} [ [[NUM_IT_2]], %[[EUB_TRUE]] ], [ [[OMP_UB_VAL2]], %[[EUB_FALSE]] ]		// CHECK-DAG: [[EUB_RES:%.+]] = phi{{.+}} [ [[NUM_IT_2]], %[[EUB_TRUE]] ], [ [[OMP_UB_VAL2]], %[[EUB_FALSE]] ]
// CHECK: store{{.+}} [[EUB_RES]], {{.+}}* [[OMP_UB]],		// CHECK: store{{.+}} [[EUB_RES]], {{.+}}* [[OMP_UB]],

// initialize omp.iv		// initialize omp.iv
// CHECK: [[OMP_LB_VAL_1:%.+]] = load{{.+}}, {{.+}}* [[OMP_LB]],		// CHECK: [[OMP_LB_VAL_1:%.+]] = load{{.+}}, {{.+}}* [[OMP_LB]],
// CHECK: store {{.+}} [[OMP_LB_VAL_1]], {{.+}}* [[OMP_IV]],		// CHECK: store {{.+}} [[OMP_LB_VAL_1]], {{.+}}* [[OMP_IV]],

// check exit condition		// check exit condition
// CHECK-DAG: [[OMP_IV_VAL_1:%.+]] = load {{.+}} [[OMP_IV]],		// CHECK-DAG: [[OMP_IV_VAL_1:%.+]] = load {{.+}} [[OMP_IV]],
// CHECK-DAG: [[OMP_UB_VAL_3:%.+]] = load {{.+}} [[OMP_UB]],		// CHECK-DAG: [[OMP_UB_VAL_3:%.+]] = load {{.+}} [[OMP_CAPT_EXPR]],
// CHECK: [[CMP_IV_UB:%.+]] = icmp sle {{.+}} [[OMP_IV_VAL_1]], [[OMP_UB_VAL_3]]		// CHECK-DAG: [[OMP_UB_VAL_3_PLUS_ONE:%.+]] = add {{.+}} [[OMP_UB_VAL_3]], 1
// CHECK: br {{.+}} [[CMP_IV_UB]], label %[[DIST_OUTER_LOOP_BODY:.+]], label %[[DIST_OUTER_LOOP_END:.+]]		// CHECK: [[CMP_IV_UB:%.+]] = icmp sle {{.+}} [[OMP_IV_VAL_1]], [[OMP_UB_VAL_3_PLUS_ONE]]
		// CHECK: br {{.+}} [[CMP_IV_UB]], label %[[DIST_INNER_LOOP_BODY:.+]], label %[[DIST_INNER_LOOP_END:.+]]
// CHECK: [[DIST_OUTER_LOOP_BODY]]:
// CHECK: br label %[[DIST_INNER_LOOP_HEADER:.+]]

// CHECK: [[DIST_INNER_LOOP_HEADER]]:
// CHECK-DAG: [[OMP_IV_VAL_2:%.+]] = load {{.+}} [[OMP_IV]],
// CHECK-DAG: [[OMP_UB_VAL_4:%.+]] = load {{.+}} [[OMP_UB]],
// CHECK: [[CMP_IV_UB_2:%.+]] = icmp sle {{.+}} [[OMP_IV_VAL_2]], [[OMP_UB_VAL_4]]
// CHECK: br{{.+}} [[CMP_IV_UB_2]], label %[[DIST_INNER_LOOP_BODY:.+]], label %[[DIST_INNER_LOOP_END:.+]]

// check that PrevLB and PrevUB are passed to the 'for'		// check that PrevLB and PrevUB are passed to the 'for'
// CHECK: [[DIST_INNER_LOOP_BODY]]:		// CHECK: [[DIST_INNER_LOOP_BODY]]:
// CHECK-DAG: [[OMP_PREV_LB:%.+]] = load {{.+}}, {{.+}} [[OMP_LB]],		// CHECK-DAG: [[OMP_PREV_LB:%.+]] = load {{.+}}, {{.+}} [[OMP_LB]],
// CHECK-64-DAG: [[OMP_PREV_LB_EXT:%.+]] = zext {{.+}} [[OMP_PREV_LB]] to {{.+}}		// CHECK-64-DAG: [[OMP_PREV_LB_EXT:%.+]] = zext {{.+}} [[OMP_PREV_LB]] to {{.+}}
// CHECK-DAG: [[OMP_PREV_UB:%.+]] = load {{.+}}, {{.+}} [[OMP_UB]],		// CHECK-DAG: [[OMP_PREV_UB:%.+]] = load {{.+}}, {{.+}} [[OMP_UB]],
// CHECK-64-DAG: [[OMP_PREV_UB_EXT:%.+]] = zext {{.+}} [[OMP_PREV_UB]] to {{.+}}		// CHECK-64-DAG: [[OMP_PREV_UB_EXT:%.+]] = zext {{.+}} [[OMP_PREV_UB]] to {{.+}}
// check that distlb and distub are properly passed to fork_call		// check that distlb and distub are properly passed to fork_call
// CHECK-64: call{{.+}} @__kmpc_fork_call({{.+}}, {{.+}}, {{.+}}[[OMP_PARFOR_OUTLINED_3:@.+]] to {{.+}}, i{{[0-9]+}} [[OMP_PREV_LB_EXT]], i{{[0-9]+}} [[OMP_PREV_UB_EXT]], {{.+}})		// CHECK-64: call{{.+}} @__kmpc_fork_call({{.+}}, {{.+}}, {{.+}}[[OMP_PARFOR_OUTLINED_3:@.+]] to {{.+}}, i{{[0-9]+}} [[OMP_PREV_LB_EXT]], i{{[0-9]+}} [[OMP_PREV_UB_EXT]], {{.+}})
// CHECK-32: call{{.+}} @__kmpc_fork_call({{.+}}, {{.+}}, {{.+}}[[OMP_PARFOR_OUTLINED_3:@.+]] to {{.+}}, i{{[0-9]+}} [[OMP_PREV_LB]], i{{[0-9]+}} [[OMP_PREV_UB]], {{.+}})		// CHECK-32: call{{.+}} @__kmpc_fork_call({{.+}}, {{.+}}, {{.+}}[[OMP_PARFOR_OUTLINED_3:@.+]] to {{.+}}, i{{[0-9]+}} [[OMP_PREV_LB]], i{{[0-9]+}} [[OMP_PREV_UB]], {{.+}})
// CHECK: br label %[[DIST_INNER_LOOP_INC:.+]]		// CHECK: br label %[[DIST_INNER_LOOP_INC:.+]]

// check DistInc		// check DistInc
// CHECK: [[DIST_INNER_LOOP_INC]]:		// CHECK: [[DIST_INNER_LOOP_INC]]:
// CHECK-DAG: [[OMP_IV_VAL_3:%.+]] = load {{.+}}, {{.+}}* [[OMP_IV]],		// CHECK-DAG: [[OMP_IV_VAL_3:%.+]] = load {{.+}}, {{.+}}* [[OMP_IV]],
// CHECK-DAG: [[OMP_ST_VAL_1:%.+]] = load {{.+}}, {{.+}}* [[OMP_ST]],		// CHECK-DAG: [[OMP_ST_VAL_1:%.+]] = load {{.+}}, {{.+}}* [[OMP_ST]],
// CHECK: [[OMP_IV_INC:%.+]] = add{{.+}} [[OMP_IV_VAL_3]], [[OMP_ST_VAL_1]]		// CHECK: [[OMP_IV_INC:%.+]] = add{{.+}} [[OMP_IV_VAL_3]], [[OMP_ST_VAL_1]]
// CHECK: store{{.+}} [[OMP_IV_INC]], {{.+}}* [[OMP_IV]],		// CHECK: store{{.+}} [[OMP_IV_INC]], {{.+}}* [[OMP_IV]],
// CHECK: br label %[[DIST_INNER_LOOP_HEADER]]

// CHECK: [[DIST_INNER_LOOP_END]]:
// CHECK: br label %[[DIST_OUTER_LOOP_INC:.+]]

// CHECK: [[DIST_OUTER_LOOP_INC]]:
// check NextLB and NextUB
// CHECK-DAG: [[OMP_LB_VAL_2:%.+]] = load{{.+}}, {{.+}} [[OMP_LB]],		// CHECK-DAG: [[OMP_LB_VAL_2:%.+]] = load{{.+}}, {{.+}} [[OMP_LB]],
// CHECK-DAG: [[OMP_ST_VAL_2:%.+]] = load{{.+}}, {{.+}} [[OMP_ST]],		// CHECK-DAG: [[OMP_ST_VAL_2:%.+]] = load{{.+}}, {{.+}} [[OMP_ST]],
// CHECK-DAG: [[OMP_LB_NEXT:%.+]] = add{{.+}} [[OMP_LB_VAL_2]], [[OMP_ST_VAL_2]]		// CHECK-DAG: [[OMP_LB_NEXT:%.+]] = add{{.+}} [[OMP_LB_VAL_2]], [[OMP_ST_VAL_2]]
// CHECK: store{{.+}} [[OMP_LB_NEXT]], {{.+}}* [[OMP_LB]],		// CHECK: store{{.+}} [[OMP_LB_NEXT]], {{.+}}* [[OMP_LB]],
// CHECK-DAG: [[OMP_UB_VAL_5:%.+]] = load{{.+}}, {{.+}} [[OMP_UB]],		// CHECK-DAG: [[OMP_UB_VAL_5:%.+]] = load{{.+}}, {{.+}} [[OMP_UB]],
// CHECK-DAG: [[OMP_ST_VAL_3:%.+]] = load{{.+}}, {{.+}} [[OMP_ST]],		// CHECK-DAG: [[OMP_ST_VAL_3:%.+]] = load{{.+}}, {{.+}} [[OMP_ST]],
// CHECK-DAG: [[OMP_UB_NEXT:%.+]] = add{{.+}} [[OMP_UB_VAL_5]], [[OMP_ST_VAL_3]]		// CHECK-DAG: [[OMP_UB_NEXT:%.+]] = add{{.+}} [[OMP_UB_VAL_5]], [[OMP_ST_VAL_3]]
// CHECK: store{{.+}} [[OMP_UB_NEXT]], {{.+}}* [[OMP_UB]],		// CHECK: store{{.+}} [[OMP_UB_NEXT]], {{.+}}* [[OMP_UB]],
// CHECK: br label %[[DIST_OUTER_LOOP_HEADER]]

// outer loop exit		// Update UB
// CHECK: [[DIST_OUTER_LOOP_END]]:		// CHECK-DAG: [[OMP_UB_VAL_6:%.+]] = load{{.+}}, {{.+}} [[OMP_UB]],
		// CHECK: [[OMP_EXPR_VAL:%.+]] = load{{.+}}, {{.+}} [[OMP_CAPT_EXPR]],
		// CHECK-DAG: [[CMP_UB_NUM_IT_1:%.+]] = icmp sgt {{.+}}[[OMP_UB_VAL_6]], [[OMP_EXPR_VAL]]
		// CHECK: br {{.+}} [[CMP_UB_NUM_IT_1]], label %[[EUB_TRUE_1:.+]], label %[[EUB_FALSE_1:.+]]
		// CHECK-DAG: [[EUB_TRUE_1]]:
		// CHECK: [[NUM_IT_3:%.+]] = load{{.+}} [[OMP_CAPT_EXPR]],
		// CHECK: br label %[[EUB_END_1:.+]]
		// CHECK-DAG: [[EUB_FALSE_1]]:
		// CHECK: [[OMP_UB_VAL3:%.+]] = load{{.+}} [[OMP_UB]],
		// CHECK: br label %[[EUB_END_1]]
		// CHECK-DAG: [[EUB_END_1]]:
		// CHECK-DAG: [[EUB_RES_1:%.+]] = phi{{.+}} [ [[NUM_IT_3]], %[[EUB_TRUE_1]] ], [ [[OMP_UB_VAL3]], %[[EUB_FALSE_1]] ]
		// CHECK: store{{.+}} [[EUB_RES_1]], {{.+}}* [[OMP_UB]],

		// Store LB in IV
		// CHECK-DAG: [[OMP_LB_VAL_3:%.+]] = load{{.+}}, {{.+}} [[OMP_LB]],
		// CHECK: store{{.+}} [[OMP_LB_VAL_3]], {{.+}}* [[OMP_IV]],

		// CHECK: [[DIST_INNER_LOOP_END]]:
		// CHECK: br label %[[LOOP_EXIT:.+]]

		// loop exit
		// CHECK: [[LOOP_EXIT]]:
// CHECK-DAG: call void @__kmpc_for_static_fini(		// CHECK-DAG: call void @__kmpc_for_static_fini(
// CHECK: ret		// CHECK: ret

// skip implementation of 'parallel for': using default scheduling and was tested above		// skip implementation of 'parallel for': using default scheduling and was tested above

// CHECK: define{{.+}} void [[OFFLOADING_FUN_4]](		// CHECK: define{{.+}} void [[OFFLOADING_FUN_4]](
// CHECK: call {{.}}void {{.+}} @__kmpc_fork_teams({{.+}}, i32 4, {{.+}} [[OMP_OUTLINED_4:@.+]] to {{.+}})		// CHECK: call {{.}}void {{.+}} @__kmpc_fork_teams({{.+}}, i32 4, {{.+}} [[OMP_OUTLINED_4:@.+]] to {{.+}})

▲ Show 20 Lines • Show All 320 Lines • Show Last 20 Lines

test/OpenMP/distribute_parallel_for_simd_codegen.cpp

Show First 20 Lines • Show All 400 Lines • ▼ Show 20 Lines	a[i] = b[i] + c[i];
// LAMBDA: define{{.+}} void [[OFFLOADING_FUN_3]](		// LAMBDA: define{{.+}} void [[OFFLOADING_FUN_3]](
// LAMBDA: call {{.}}void {{.+}} @__kmpc_fork_teams({{.+}}, i32 5, {{.+}} [[OMP_OUTLINED_3:@.+]] to {{.+}})		// LAMBDA: call {{.}}void {{.+}} @__kmpc_fork_teams({{.+}}, i32 5, {{.+}} [[OMP_OUTLINED_3:@.+]] to {{.+}})

#pragma omp distribute parallel for simd dist_schedule(static, ch)		#pragma omp distribute parallel for simd dist_schedule(static, ch)
for (int i = 0; i < n; ++i) {		for (int i = 0; i < n; ++i) {
a[i] = b[i] + c[i];		a[i] = b[i] + c[i];
// LAMBDA: define{{.+}} void [[OMP_OUTLINED_3]](		// LAMBDA: define{{.+}} void [[OMP_OUTLINED_3]](
// LAMBDA-DAG: [[OMP_IV:%.omp.iv]] = alloca		// LAMBDA-DAG: [[OMP_IV:%.omp.iv]] = alloca
		// LAMBDA-DAG: [[OMP_CAPT_EXPR:%.capture_expr.1]] = alloca
// LAMBDA-DAG: [[OMP_LB:%.omp.comb.lb]] = alloca		// LAMBDA-DAG: [[OMP_LB:%.omp.comb.lb]] = alloca
// LAMBDA-DAG: [[OMP_UB:%.omp.comb.ub]] = alloca		// LAMBDA-DAG: [[OMP_UB:%.omp.comb.ub]] = alloca
// LAMBDA-DAG: [[OMP_ST:%.omp.stride]] = alloca		// LAMBDA-DAG: [[OMP_ST:%.omp.stride]] = alloca

// unlike the previous tests, in this one we have a outer and inner loop for 'distribute'
// LAMBDA: call void @__kmpc_for_static_init_4({{.+}}, {{.+}}, i32 91,		// LAMBDA: call void @__kmpc_for_static_init_4({{.+}}, {{.+}}, i32 91,
// LAMBDA: br label %[[DIST_OUTER_LOOP_HEADER:.+]]

// LAMBDA: [[DIST_OUTER_LOOP_HEADER]]:
// check EUB for distribute		// check EUB for distribute
// LAMBDA-DAG: [[OMP_UB_VAL_1:%.+]] = load{{.+}} [[OMP_UB]],		// LAMBDA-DAG: [[OMP_UB_VAL_1:%.+]] = load{{.+}} [[OMP_UB]],
// LAMBDA: [[NUM_IT_1:%.+]] = load{{.+}},		// LAMBDA: [[NUM_IT_1:%.+]] = load{{.+}} [[OMP_CAPT_EXPR]],
// LAMBDA-DAG: [[CMP_UB_NUM_IT:%.+]] = icmp sgt {{.+}} [[OMP_UB_VAL_1]], [[NUM_IT_1]]		// LAMBDA-DAG: [[CMP_UB_NUM_IT:%.+]] = icmp sgt {{.+}} [[OMP_UB_VAL_1]], [[NUM_IT_1]]
// LAMBDA: br {{.+}} [[CMP_UB_NUM_IT]], label %[[EUB_TRUE:.+]], label %[[EUB_FALSE:.+]]		// LAMBDA: br {{.+}} [[CMP_UB_NUM_IT]], label %[[EUB_TRUE:.+]], label %[[EUB_FALSE:.+]]
// LAMBDA-DAG: [[EUB_TRUE]]:		// LAMBDA-DAG: [[EUB_TRUE]]:
// LAMBDA: [[NUM_IT_2:%.+]] = load{{.+}},		// LAMBDA: [[NUM_IT_2:%.+]] = load{{.+}},
// LAMBDA: br label %[[EUB_END:.+]]		// LAMBDA: br label %[[EUB_END:.+]]
// LAMBDA-DAG: [[EUB_FALSE]]:		// LAMBDA-DAG: [[EUB_FALSE]]:
// LAMBDA: [[OMP_UB_VAL2:%.+]] = load{{.+}} [[OMP_UB]],		// LAMBDA: [[OMP_UB_VAL2:%.+]] = load{{.+}} [[OMP_UB]],
// LAMBDA: br label %[[EUB_END]]		// LAMBDA: br label %[[EUB_END]]
// LAMBDA-DAG: [[EUB_END]]:		// LAMBDA-DAG: [[EUB_END]]:
// LAMBDA-DAG: [[EUB_RES:%.+]] = phi{{.+}} [ [[NUM_IT_2]], %[[EUB_TRUE]] ], [ [[OMP_UB_VAL2]], %[[EUB_FALSE]] ]		// LAMBDA-DAG: [[EUB_RES:%.+]] = phi{{.+}} [ [[NUM_IT_2]], %[[EUB_TRUE]] ], [ [[OMP_UB_VAL2]], %[[EUB_FALSE]] ]
// LAMBDA: store{{.+}} [[EUB_RES]], {{.+}}* [[OMP_UB]],		// LAMBDA: store{{.+}} [[EUB_RES]], {{.+}}* [[OMP_UB]],

// initialize omp.iv		// initialize omp.iv
// LAMBDA: [[OMP_LB_VAL_1:%.+]] = load{{.+}}, {{.+}}* [[OMP_LB]],		// LAMBDA: [[OMP_LB_VAL_1:%.+]] = load{{.+}}, {{.+}}* [[OMP_LB]],
// LAMBDA: store {{.+}} [[OMP_LB_VAL_1]], {{.+}}* [[OMP_IV]],		// LAMBDA: store {{.+}} [[OMP_LB_VAL_1]], {{.+}}* [[OMP_IV]],

// check exit condition		// check exit condition
// LAMBDA-DAG: [[OMP_IV_VAL_1:%.+]] = load {{.+}} [[OMP_IV]],		// LAMBDA-DAG: [[OMP_IV_VAL_1:%.+]] = load {{.+}} [[OMP_IV]],
// LAMBDA-DAG: [[OMP_UB_VAL_3:%.+]] = load {{.+}} [[OMP_UB]],		// LAMBDA-DAG: [[OMP_UB_VAL_3:%.+]] = load {{.+}} [[OMP_CAPT_EXPR]],
// LAMBDA: [[CMP_IV_UB:%.+]] = icmp sle {{.+}} [[OMP_IV_VAL_1]], [[OMP_UB_VAL_3]]		// LAMBDA-DAG: [[OMP_UB_VAL_3_PLUS_ONE:%.+]] = add {{.+}} [[OMP_UB_VAL_3]], 1
// LAMBDA: br {{.+}} [[CMP_IV_UB]], label %[[DIST_OUTER_LOOP_BODY:.+]], label %[[DIST_OUTER_LOOP_END:.+]]		// LAMBDA: [[CMP_IV_UB:%.+]] = icmp sle {{.+}} [[OMP_IV_VAL_1]], [[OMP_UB_VAL_3_PLUS_ONE]]
		// LAMBDA: br {{.+}} [[CMP_IV_UB]], label %[[DIST_INNER_LOOP_BODY:.+]], label %[[DIST_INNER_LOOP_END:.+]]
// LAMBDA: [[DIST_OUTER_LOOP_BODY]]:
// LAMBDA: br label %[[DIST_INNER_LOOP_HEADER:.+]]

// LAMBDA: [[DIST_INNER_LOOP_HEADER]]:
// LAMBDA-DAG: [[OMP_IV_VAL_2:%.+]] = load {{.+}} [[OMP_IV]],
// LAMBDA-DAG: [[OMP_UB_VAL_4:%.+]] = load {{.+}} [[OMP_UB]],
// LAMBDA: [[CMP_IV_UB_2:%.+]] = icmp sle {{.+}} [[OMP_IV_VAL_2]], [[OMP_UB_VAL_4]]
// LAMBDA: br{{.+}} [[CMP_IV_UB_2]], label %[[DIST_INNER_LOOP_BODY:.+]], label %[[DIST_INNER_LOOP_END:.+]]

// check that PrevLB and PrevUB are passed to the 'for'		// check that PrevLB and PrevUB are passed to the 'for'
// LAMBDA: [[DIST_INNER_LOOP_BODY]]:		// LAMBDA: [[DIST_INNER_LOOP_BODY]]:
// LAMBDA-DAG: [[OMP_PREV_LB:%.+]] = load {{.+}}, {{.+}} [[OMP_LB]],		// LAMBDA-DAG: [[OMP_PREV_LB:%.+]] = load {{.+}}, {{.+}} [[OMP_LB]],
// LAMBDA-64-DAG: [[OMP_PREV_LB_EXT:%.+]] = zext {{.+}} [[OMP_PREV_LB]] to {{.+}}		// LAMBDA-64-DAG: [[OMP_PREV_LB_EXT:%.+]] = zext {{.+}} [[OMP_PREV_LB]] to {{.+}}
// LAMBDA-DAG: [[OMP_PREV_UB:%.+]] = load {{.+}}, {{.+}} [[OMP_UB]],		// LAMBDA-DAG: [[OMP_PREV_UB:%.+]] = load {{.+}}, {{.+}} [[OMP_UB]],
// LAMBDA-64-DAG: [[OMP_PREV_UB_EXT:%.+]] = zext {{.+}} [[OMP_PREV_UB]] to {{.+}}		// LAMBDA-64-DAG: [[OMP_PREV_UB_EXT:%.+]] = zext {{.+}} [[OMP_PREV_UB]] to {{.+}}
// check that distlb and distub are properly passed to fork_call		// check that distlb and distub are properly passed to fork_call
// LAMBDA-64: call{{.+}} @__kmpc_fork_call({{.+}}, {{.+}}, {{.+}}[[OMP_PARFOR_OUTLINED_3:@.+]] to {{.+}}, i{{[0-9]+}} [[OMP_PREV_LB_EXT]], i{{[0-9]+}} [[OMP_PREV_UB_EXT]], {{.+}})		// LAMBDA-64: call{{.+}} @__kmpc_fork_call({{.+}}, {{.+}}, {{.+}}[[OMP_PARFOR_OUTLINED_3:@.+]] to {{.+}}, i{{[0-9]+}} [[OMP_PREV_LB_EXT]], i{{[0-9]+}} [[OMP_PREV_UB_EXT]], {{.+}})
// LAMBDA-32: call{{.+}} @__kmpc_fork_call({{.+}}, {{.+}}, {{.+}}[[OMP_PARFOR_OUTLINED_3:@.+]] to {{.+}}, i{{[0-9]+}} [[OMP_PREV_LB]], i{{[0-9]+}} [[OMP_PREV_UB]], {{.+}})		// LAMBDA-32: call{{.+}} @__kmpc_fork_call({{.+}}, {{.+}}, {{.+}}[[OMP_PARFOR_OUTLINED_3:@.+]] to {{.+}}, i{{[0-9]+}} [[OMP_PREV_LB]], i{{[0-9]+}} [[OMP_PREV_UB]], {{.+}})
// LAMBDA: br label %[[DIST_INNER_LOOP_INC:.+]]		// LAMBDA: br label %[[DIST_INNER_LOOP_INC:.+]]

// check DistInc		// check DistInc
// LAMBDA: [[DIST_INNER_LOOP_INC]]:		// LAMBDA: [[DIST_INNER_LOOP_INC]]:
// LAMBDA-DAG: [[OMP_IV_VAL_3:%.+]] = load {{.+}}, {{.+}}* [[OMP_IV]],		// LAMBDA-DAG: [[OMP_IV_VAL_3:%.+]] = load {{.+}}, {{.+}}* [[OMP_IV]],
// LAMBDA-DAG: [[OMP_ST_VAL_1:%.+]] = load {{.+}}, {{.+}}* [[OMP_ST]],		// LAMBDA-DAG: [[OMP_ST_VAL_1:%.+]] = load {{.+}}, {{.+}}* [[OMP_ST]],
// LAMBDA: [[OMP_IV_INC:%.+]] = add{{.+}} [[OMP_IV_VAL_3]], [[OMP_ST_VAL_1]]		// LAMBDA: [[OMP_IV_INC:%.+]] = add{{.+}} [[OMP_IV_VAL_3]], [[OMP_ST_VAL_1]]
// LAMBDA: store{{.+}} [[OMP_IV_INC]], {{.+}}* [[OMP_IV]],		// LAMBDA: store{{.+}} [[OMP_IV_INC]], {{.+}}* [[OMP_IV]],
// LAMBDA: br label %[[DIST_INNER_LOOP_HEADER]]

// LAMBDA: [[DIST_INNER_LOOP_END]]:
// LAMBDA: br label %[[DIST_OUTER_LOOP_INC:.+]]

// LAMBDA: [[DIST_OUTER_LOOP_INC]]:
// check NextLB and NextUB
// LAMBDA-DAG: [[OMP_LB_VAL_2:%.+]] = load{{.+}}, {{.+}} [[OMP_LB]],		// LAMBDA-DAG: [[OMP_LB_VAL_2:%.+]] = load{{.+}}, {{.+}} [[OMP_LB]],
// LAMBDA-DAG: [[OMP_ST_VAL_2:%.+]] = load{{.+}}, {{.+}} [[OMP_ST]],		// LAMBDA-DAG: [[OMP_ST_VAL_2:%.+]] = load{{.+}}, {{.+}} [[OMP_ST]],
// LAMBDA-DAG: [[OMP_LB_NEXT:%.+]] = add{{.+}} [[OMP_LB_VAL_2]], [[OMP_ST_VAL_2]]		// LAMBDA-DAG: [[OMP_LB_NEXT:%.+]] = add{{.+}} [[OMP_LB_VAL_2]], [[OMP_ST_VAL_2]]
// LAMBDA: store{{.+}} [[OMP_LB_NEXT]], {{.+}}* [[OMP_LB]],		// LAMBDA: store{{.+}} [[OMP_LB_NEXT]], {{.+}}* [[OMP_LB]],
// LAMBDA-DAG: [[OMP_UB_VAL_5:%.+]] = load{{.+}}, {{.+}} [[OMP_UB]],		// LAMBDA-DAG: [[OMP_UB_VAL_5:%.+]] = load{{.+}}, {{.+}} [[OMP_UB]],
// LAMBDA-DAG: [[OMP_ST_VAL_3:%.+]] = load{{.+}}, {{.+}} [[OMP_ST]],		// LAMBDA-DAG: [[OMP_ST_VAL_3:%.+]] = load{{.+}}, {{.+}} [[OMP_ST]],
// LAMBDA-DAG: [[OMP_UB_NEXT:%.+]] = add{{.+}} [[OMP_UB_VAL_5]], [[OMP_ST_VAL_3]]		// LAMBDA-DAG: [[OMP_UB_NEXT:%.+]] = add{{.+}} [[OMP_UB_VAL_5]], [[OMP_ST_VAL_3]]
// LAMBDA: store{{.+}} [[OMP_UB_NEXT]], {{.+}}* [[OMP_UB]],		// LAMBDA: store{{.+}} [[OMP_UB_NEXT]], {{.+}}* [[OMP_UB]],
// LAMBDA: br label %[[DIST_OUTER_LOOP_HEADER]]

// outer loop exit		// Update UB
// LAMBDA: [[DIST_OUTER_LOOP_END]]:		// LAMBDA-DAG: [[OMP_UB_VAL_6:%.+]] = load{{.+}}, {{.+}} [[OMP_UB]],
		// LAMBDA: [[OMP_EXPR_VAL:%.+]] = load{{.+}}, {{.+}} [[OMP_CAPT_EXPR]],
		// LAMBDA-DAG: [[CMP_UB_NUM_IT_1:%.+]] = icmp sgt {{.+}}[[OMP_UB_VAL_6]], [[OMP_EXPR_VAL]]
		// LAMBDA: br {{.+}} [[CMP_UB_NUM_IT_1]], label %[[EUB_TRUE_1:.+]], label %[[EUB_FALSE_1:.+]]
		// LAMBDA-DAG: [[EUB_TRUE_1]]:
		// LAMBDA: [[NUM_IT_3:%.+]] = load{{.+}} [[OMP_CAPT_EXPR]],
		// LAMBDA: br label %[[EUB_END_1:.+]]
		// LAMBDA-DAG: [[EUB_FALSE_1]]:
		// LAMBDA: [[OMP_UB_VAL3:%.+]] = load{{.+}} [[OMP_UB]],
		// LAMBDA: br label %[[EUB_END_1]]
		// LAMBDA-DAG: [[EUB_END_1]]:
		// LAMBDA-DAG: [[EUB_RES_1:%.+]] = phi{{.+}} [ [[NUM_IT_3]], %[[EUB_TRUE_1]] ], [ [[OMP_UB_VAL3]], %[[EUB_FALSE_1]] ]
		// LAMBDA: store{{.+}} [[EUB_RES_1]], {{.+}}* [[OMP_UB]],

		// Store LB in IV
		// LAMBDA-DAG: [[OMP_LB_VAL_3:%.+]] = load{{.+}}, {{.+}} [[OMP_LB]],
		// LAMBDA: store{{.+}} [[OMP_LB_VAL_3]], {{.+}}* [[OMP_IV]],

		// LAMBDA: [[DIST_INNER_LOOP_END]]:
		// LAMBDA: br label %[[LOOP_EXIT:.+]]

		// loop exit
		// LAMBDA: [[LOOP_EXIT]]:
// LAMBDA-DAG: call void @__kmpc_for_static_fini(		// LAMBDA-DAG: call void @__kmpc_for_static_fini(
// LAMBDA: ret		// LAMBDA: ret

// skip implementation of 'parallel for': using default scheduling and was tested above		// skip implementation of 'parallel for': using default scheduling and was tested above
[&]() {		[&]() {
a[i] = b[i] + c[i];		a[i] = b[i] + c[i];
}();		}();
}		}
▲ Show 20 Lines • Show All 653 Lines • ▼ Show 20 Lines	#else
// CHECK: define{{.+}} void [[OFFLOADING_FUN_3]](		// CHECK: define{{.+}} void [[OFFLOADING_FUN_3]](
// CHECK: call {{.}}void {{.+}} @__kmpc_fork_teams({{.+}}, i32 5, {{.+}} [[OMP_OUTLINED_3:@.+]] to {{.+}})		// CHECK: call {{.}}void {{.+}} @__kmpc_fork_teams({{.+}}, i32 5, {{.+}} [[OMP_OUTLINED_3:@.+]] to {{.+}})

#pragma omp distribute parallel for simd dist_schedule(static, ch)		#pragma omp distribute parallel for simd dist_schedule(static, ch)
for (int i = 0; i < n; ++i) {		for (int i = 0; i < n; ++i) {
a[i] = b[i] + c[i];		a[i] = b[i] + c[i];
// CHECK: define{{.+}} void [[OMP_OUTLINED_3]](		// CHECK: define{{.+}} void [[OMP_OUTLINED_3]](
// CHECK-DAG: [[OMP_IV:%.omp.iv]] = alloca		// CHECK-DAG: [[OMP_IV:%.omp.iv]] = alloca
		// CHECK-DAG: [[OMP_CAPT_EXPR:%.capture_expr.1]] = alloca
// CHECK-DAG: [[OMP_LB:%.omp.comb.lb]] = alloca		// CHECK-DAG: [[OMP_LB:%.omp.comb.lb]] = alloca
// CHECK-DAG: [[OMP_UB:%.omp.comb.ub]] = alloca		// CHECK-DAG: [[OMP_UB:%.omp.comb.ub]] = alloca
// CHECK-DAG: [[OMP_ST:%.omp.stride]] = alloca		// CHECK-DAG: [[OMP_ST:%.omp.stride]] = alloca

// unlike the previous tests, in this one we have an outer and inner loop for 'distribute'		// unlike the previous tests, in this one we have an outer and inner loop for 'distribute'
// CHECK: call void @__kmpc_for_static_init_4({{.+}}, {{.+}}, i32 91,		// CHECK: call void @__kmpc_for_static_init_4({{.+}}, {{.+}}, i32 91,
// CHECK: br label %[[DIST_OUTER_LOOP_HEADER:.+]]

// CHECK: [[DIST_OUTER_LOOP_HEADER]]:
// check EUB for distribute		// check EUB for distribute
// CHECK-DAG: [[OMP_UB_VAL_1:%.+]] = load{{.+}} [[OMP_UB]],		// CHECK-DAG: [[OMP_UB_VAL_1:%.+]] = load{{.+}} [[OMP_UB]],
// CHECK: [[NUM_IT_1:%.+]] = load{{.+}},		// CHECK: [[NUM_IT_1:%.+]] = load{{.+}} [[OMP_CAPT_EXPR]],
// CHECK-DAG: [[CMP_UB_NUM_IT:%.+]] = icmp sgt {{.+}} [[OMP_UB_VAL_1]], [[NUM_IT_1]]		// CHECK-DAG: [[CMP_UB_NUM_IT:%.+]] = icmp sgt {{.+}} [[OMP_UB_VAL_1]], [[NUM_IT_1]]
// CHECK: br {{.+}} [[CMP_UB_NUM_IT]], label %[[EUB_TRUE:.+]], label %[[EUB_FALSE:.+]]		// CHECK: br {{.+}} [[CMP_UB_NUM_IT]], label %[[EUB_TRUE:.+]], label %[[EUB_FALSE:.+]]
// CHECK-DAG: [[EUB_TRUE]]:		// CHECK-DAG: [[EUB_TRUE]]:
// CHECK: [[NUM_IT_2:%.+]] = load{{.+}},		// CHECK: [[NUM_IT_2:%.+]] = load{{.+}},
// CHECK: br label %[[EUB_END:.+]]		// CHECK: br label %[[EUB_END:.+]]
// CHECK-DAG: [[EUB_FALSE]]:		// CHECK-DAG: [[EUB_FALSE]]:
// CHECK: [[OMP_UB_VAL2:%.+]] = load{{.+}} [[OMP_UB]],		// CHECK: [[OMP_UB_VAL2:%.+]] = load{{.+}} [[OMP_UB]],
// CHECK: br label %[[EUB_END]]		// CHECK: br label %[[EUB_END]]
// CHECK-DAG: [[EUB_END]]:		// CHECK-DAG: [[EUB_END]]:
// CHECK-DAG: [[EUB_RES:%.+]] = phi{{.+}} [ [[NUM_IT_2]], %[[EUB_TRUE]] ], [ [[OMP_UB_VAL2]], %[[EUB_FALSE]] ]		// CHECK-DAG: [[EUB_RES:%.+]] = phi{{.+}} [ [[NUM_IT_2]], %[[EUB_TRUE]] ], [ [[OMP_UB_VAL2]], %[[EUB_FALSE]] ]
// CHECK: store{{.+}} [[EUB_RES]], {{.+}}* [[OMP_UB]],		// CHECK: store{{.+}} [[EUB_RES]], {{.+}}* [[OMP_UB]],

// initialize omp.iv		// initialize omp.iv
// CHECK: [[OMP_LB_VAL_1:%.+]] = load{{.+}}, {{.+}}* [[OMP_LB]],		// CHECK: [[OMP_LB_VAL_1:%.+]] = load{{.+}}, {{.+}}* [[OMP_LB]],
// CHECK: store {{.+}} [[OMP_LB_VAL_1]], {{.+}}* [[OMP_IV]],		// CHECK: store {{.+}} [[OMP_LB_VAL_1]], {{.+}}* [[OMP_IV]],

// check exit condition		// check exit condition
// CHECK-DAG: [[OMP_IV_VAL_1:%.+]] = load {{.+}} [[OMP_IV]],		// CHECK-DAG: [[OMP_IV_VAL_1:%.+]] = load {{.+}} [[OMP_IV]],
// CHECK-DAG: [[OMP_UB_VAL_3:%.+]] = load {{.+}} [[OMP_UB]],		// CHECK-DAG: [[OMP_UB_VAL_3:%.+]] = load {{.+}} [[OMP_CAPT_EXPR]],
// CHECK: [[CMP_IV_UB:%.+]] = icmp sle {{.+}} [[OMP_IV_VAL_1]], [[OMP_UB_VAL_3]]		// CHECK-DAG: [[OMP_UB_VAL_3_PLUS_ONE:%.+]] = add {{.+}} [[OMP_UB_VAL_3]], 1
// CHECK: br {{.+}} [[CMP_IV_UB]], label %[[DIST_OUTER_LOOP_BODY:.+]], label %[[DIST_OUTER_LOOP_END:.+]]		// CHECK: [[CMP_IV_UB:%.+]] = icmp sle {{.+}} [[OMP_IV_VAL_1]], [[OMP_UB_VAL_3_PLUS_ONE]]
		// CHECK: br {{.+}} [[CMP_IV_UB]], label %[[DIST_INNER_LOOP_BODY:.+]], label %[[DIST_INNER_LOOP_END:.+]]
// CHECK: [[DIST_OUTER_LOOP_BODY]]:
// CHECK: br label %[[DIST_INNER_LOOP_HEADER:.+]]

// CHECK: [[DIST_INNER_LOOP_HEADER]]:
// CHECK-DAG: [[OMP_IV_VAL_2:%.+]] = load {{.+}} [[OMP_IV]],
// CHECK-DAG: [[OMP_UB_VAL_4:%.+]] = load {{.+}} [[OMP_UB]],
// CHECK: [[CMP_IV_UB_2:%.+]] = icmp sle {{.+}} [[OMP_IV_VAL_2]], [[OMP_UB_VAL_4]]
// CHECK: br{{.+}} [[CMP_IV_UB_2]], label %[[DIST_INNER_LOOP_BODY:.+]], label %[[DIST_INNER_LOOP_END:.+]]

// check that PrevLB and PrevUB are passed to the 'for'		// check that PrevLB and PrevUB are passed to the 'for'
// CHECK: [[DIST_INNER_LOOP_BODY]]:		// CHECK: [[DIST_INNER_LOOP_BODY]]:
// CHECK-DAG: [[OMP_PREV_LB:%.+]] = load {{.+}}, {{.+}} [[OMP_LB]],		// CHECK-DAG: [[OMP_PREV_LB:%.+]] = load {{.+}}, {{.+}} [[OMP_LB]],
// CHECK-64-DAG: [[OMP_PREV_LB_EXT:%.+]] = zext {{.+}} [[OMP_PREV_LB]] to {{.+}}		// CHECK-64-DAG: [[OMP_PREV_LB_EXT:%.+]] = zext {{.+}} [[OMP_PREV_LB]] to {{.+}}
// CHECK-DAG: [[OMP_PREV_UB:%.+]] = load {{.+}}, {{.+}} [[OMP_UB]],		// CHECK-DAG: [[OMP_PREV_UB:%.+]] = load {{.+}}, {{.+}} [[OMP_UB]],
// CHECK-64-DAG: [[OMP_PREV_UB_EXT:%.+]] = zext {{.+}} [[OMP_PREV_UB]] to {{.+}}		// CHECK-64-DAG: [[OMP_PREV_UB_EXT:%.+]] = zext {{.+}} [[OMP_PREV_UB]] to {{.+}}
// check that distlb and distub are properly passed to fork_call		// check that distlb and distub are properly passed to fork_call
// CHECK-64: call{{.+}} @__kmpc_fork_call({{.+}}, {{.+}}, {{.+}}[[OMP_PARFOR_OUTLINED_3:@.+]] to {{.+}}, i{{[0-9]+}} [[OMP_PREV_LB_EXT]], i{{[0-9]+}} [[OMP_PREV_UB_EXT]], {{.+}})		// CHECK-64: call{{.+}} @__kmpc_fork_call({{.+}}, {{.+}}, {{.+}}[[OMP_PARFOR_OUTLINED_3:@.+]] to {{.+}}, i{{[0-9]+}} [[OMP_PREV_LB_EXT]], i{{[0-9]+}} [[OMP_PREV_UB_EXT]], {{.+}})
// CHECK-32: call{{.+}} @__kmpc_fork_call({{.+}}, {{.+}}, {{.+}}[[OMP_PARFOR_OUTLINED_3:@.+]] to {{.+}}, i{{[0-9]+}} [[OMP_PREV_LB]], i{{[0-9]+}} [[OMP_PREV_UB]], {{.+}})		// CHECK-32: call{{.+}} @__kmpc_fork_call({{.+}}, {{.+}}, {{.+}}[[OMP_PARFOR_OUTLINED_3:@.+]] to {{.+}}, i{{[0-9]+}} [[OMP_PREV_LB]], i{{[0-9]+}} [[OMP_PREV_UB]], {{.+}})
// CHECK: br label %[[DIST_INNER_LOOP_INC:.+]]		// CHECK: br label %[[DIST_INNER_LOOP_INC:.+]]

// check DistInc		// check DistInc
// CHECK: [[DIST_INNER_LOOP_INC]]:		// CHECK: [[DIST_INNER_LOOP_INC]]:
// CHECK-DAG: [[OMP_IV_VAL_3:%.+]] = load {{.+}}, {{.+}}* [[OMP_IV]],		// CHECK-DAG: [[OMP_IV_VAL_3:%.+]] = load {{.+}}, {{.+}}* [[OMP_IV]],
// CHECK-DAG: [[OMP_ST_VAL_1:%.+]] = load {{.+}}, {{.+}}* [[OMP_ST]],		// CHECK-DAG: [[OMP_ST_VAL_1:%.+]] = load {{.+}}, {{.+}}* [[OMP_ST]],
// CHECK: [[OMP_IV_INC:%.+]] = add{{.+}} [[OMP_IV_VAL_3]], [[OMP_ST_VAL_1]]		// CHECK: [[OMP_IV_INC:%.+]] = add{{.+}} [[OMP_IV_VAL_3]], [[OMP_ST_VAL_1]]
// CHECK: store{{.+}} [[OMP_IV_INC]], {{.+}}* [[OMP_IV]],		// CHECK: store{{.+}} [[OMP_IV_INC]], {{.+}}* [[OMP_IV]],
// CHECK: br label %[[DIST_INNER_LOOP_HEADER]]

// CHECK: [[DIST_INNER_LOOP_END]]:
// CHECK: br label %[[DIST_OUTER_LOOP_INC:.+]]

// CHECK: [[DIST_OUTER_LOOP_INC]]:
// check NextLB and NextUB
// CHECK-DAG: [[OMP_LB_VAL_2:%.+]] = load{{.+}}, {{.+}} [[OMP_LB]],		// CHECK-DAG: [[OMP_LB_VAL_2:%.+]] = load{{.+}}, {{.+}} [[OMP_LB]],
// CHECK-DAG: [[OMP_ST_VAL_2:%.+]] = load{{.+}}, {{.+}} [[OMP_ST]],		// CHECK-DAG: [[OMP_ST_VAL_2:%.+]] = load{{.+}}, {{.+}} [[OMP_ST]],
// CHECK-DAG: [[OMP_LB_NEXT:%.+]] = add{{.+}} [[OMP_LB_VAL_2]], [[OMP_ST_VAL_2]]		// CHECK-DAG: [[OMP_LB_NEXT:%.+]] = add{{.+}} [[OMP_LB_VAL_2]], [[OMP_ST_VAL_2]]
// CHECK: store{{.+}} [[OMP_LB_NEXT]], {{.+}}* [[OMP_LB]],		// CHECK: store{{.+}} [[OMP_LB_NEXT]], {{.+}}* [[OMP_LB]],
// CHECK-DAG: [[OMP_UB_VAL_5:%.+]] = load{{.+}}, {{.+}} [[OMP_UB]],		// CHECK-DAG: [[OMP_UB_VAL_5:%.+]] = load{{.+}}, {{.+}} [[OMP_UB]],
// CHECK-DAG: [[OMP_ST_VAL_3:%.+]] = load{{.+}}, {{.+}} [[OMP_ST]],		// CHECK-DAG: [[OMP_ST_VAL_3:%.+]] = load{{.+}}, {{.+}} [[OMP_ST]],
// CHECK-DAG: [[OMP_UB_NEXT:%.+]] = add{{.+}} [[OMP_UB_VAL_5]], [[OMP_ST_VAL_3]]		// CHECK-DAG: [[OMP_UB_NEXT:%.+]] = add{{.+}} [[OMP_UB_VAL_5]], [[OMP_ST_VAL_3]]
// CHECK: store{{.+}} [[OMP_UB_NEXT]], {{.+}}* [[OMP_UB]],		// CHECK: store{{.+}} [[OMP_UB_NEXT]], {{.+}}* [[OMP_UB]],
// CHECK: br label %[[DIST_OUTER_LOOP_HEADER]]

// outer loop exit		// Update UB
// CHECK: [[DIST_OUTER_LOOP_END]]:		// CHECK-DAG: [[OMP_UB_VAL_6:%.+]] = load{{.+}}, {{.+}} [[OMP_UB]],
		// CHECK: [[OMP_EXPR_VAL:%.+]] = load{{.+}}, {{.+}} [[OMP_CAPT_EXPR]],
		// CHECK-DAG: [[CMP_UB_NUM_IT_1:%.+]] = icmp sgt {{.+}}[[OMP_UB_VAL_6]], [[OMP_EXPR_VAL]]
		// CHECK: br {{.+}} [[CMP_UB_NUM_IT_1]], label %[[EUB_TRUE_1:.+]], label %[[EUB_FALSE_1:.+]]
		// CHECK-DAG: [[EUB_TRUE_1]]:
		// CHECK: [[NUM_IT_3:%.+]] = load{{.+}} [[OMP_CAPT_EXPR]],
		// CHECK: br label %[[EUB_END_1:.+]]
		// CHECK-DAG: [[EUB_FALSE_1]]:
		// CHECK: [[OMP_UB_VAL3:%.+]] = load{{.+}} [[OMP_UB]],
		// CHECK: br label %[[EUB_END_1]]
		// CHECK-DAG: [[EUB_END_1]]:
		// CHECK-DAG: [[EUB_RES_1:%.+]] = phi{{.+}} [ [[NUM_IT_3]], %[[EUB_TRUE_1]] ], [ [[OMP_UB_VAL3]], %[[EUB_FALSE_1]] ]
		// CHECK: store{{.+}} [[EUB_RES_1]], {{.+}}* [[OMP_UB]],

		// Store LB in IV
		// CHECK-DAG: [[OMP_LB_VAL_3:%.+]] = load{{.+}}, {{.+}} [[OMP_LB]],
		// CHECK: store{{.+}} [[OMP_LB_VAL_3]], {{.+}}* [[OMP_IV]],

		// CHECK: [[DIST_INNER_LOOP_END]]:
		// CHECK: br label %[[LOOP_EXIT:.+]]

		// loop exit
		// CHECK: [[LOOP_EXIT]]:
// CHECK-DAG: call void @__kmpc_for_static_fini(		// CHECK-DAG: call void @__kmpc_for_static_fini(
// CHECK: ret		// CHECK: ret

// skip implementation of 'parallel for': using default scheduling and was tested above		// skip implementation of 'parallel for': using default scheduling and was tested above
}		}

// schedule: static no chunk		// schedule: static no chunk
#pragma omp target		#pragma omp target
▲ Show 20 Lines • Show All 618 Lines • ▼ Show 20 Lines
// CHECK-DAG: call void @__kmpc_for_static_fini(		// CHECK-DAG: call void @__kmpc_for_static_fini(
// CHECK: ret		// CHECK: ret

// CHECK: define{{.+}} void [[OFFLOADING_FUN_3]](		// CHECK: define{{.+}} void [[OFFLOADING_FUN_3]](
// CHECK: call {{.}}void {{.+}} @__kmpc_fork_teams({{.+}}, i32 5, {{.+}} [[OMP_OUTLINED_3:@.+]] to {{.+}})		// CHECK: call {{.}}void {{.+}} @__kmpc_fork_teams({{.+}}, i32 5, {{.+}} [[OMP_OUTLINED_3:@.+]] to {{.+}})

// CHECK: define{{.+}} void [[OMP_OUTLINED_3]](		// CHECK: define{{.+}} void [[OMP_OUTLINED_3]](
// CHECK-DAG: [[OMP_IV:%.omp.iv]] = alloca		// CHECK-DAG: [[OMP_IV:%.omp.iv]] = alloca
		// CHECK-DAG: [[OMP_CAPT_EXPR:%.capture_expr.1]] = alloca
// CHECK-DAG: [[OMP_LB:%.omp.comb.lb]] = alloca		// CHECK-DAG: [[OMP_LB:%.omp.comb.lb]] = alloca
// CHECK-DAG: [[OMP_UB:%.omp.comb.ub]] = alloca		// CHECK-DAG: [[OMP_UB:%.omp.comb.ub]] = alloca
// CHECK-DAG: [[OMP_ST:%.omp.stride]] = alloca		// CHECK-DAG: [[OMP_ST:%.omp.stride]] = alloca

// unlike the previous tests, in this one we have an outer and inner loop for 'distribute'		// unlike the previous tests, in this one we have an outer and inner loop for 'distribute'
// CHECK: call void @__kmpc_for_static_init_4({{.+}}, {{.+}}, i32 91,		// CHECK: call void @__kmpc_for_static_init_4({{.+}}, {{.+}}, i32 91,
// CHECK: br label %[[DIST_OUTER_LOOP_HEADER:.+]]

// CHECK: [[DIST_OUTER_LOOP_HEADER]]:
// check EUB for distribute		// check EUB for distribute
// CHECK-DAG: [[OMP_UB_VAL_1:%.+]] = load{{.+}} [[OMP_UB]],		// CHECK-DAG: [[OMP_UB_VAL_1:%.+]] = load{{.+}} [[OMP_UB]],
// CHECK: [[NUM_IT_1:%.+]] = load{{.+}},		// CHECK: [[NUM_IT_1:%.+]] = load{{.+}} [[OMP_CAPT_EXPR]],
// CHECK-DAG: [[CMP_UB_NUM_IT:%.+]] = icmp sgt {{.+}} [[OMP_UB_VAL_1]], [[NUM_IT_1]]		// CHECK-DAG: [[CMP_UB_NUM_IT:%.+]] = icmp sgt {{.+}} [[OMP_UB_VAL_1]], [[NUM_IT_1]]
// CHECK: br {{.+}} [[CMP_UB_NUM_IT]], label %[[EUB_TRUE:.+]], label %[[EUB_FALSE:.+]]		// CHECK: br {{.+}} [[CMP_UB_NUM_IT]], label %[[EUB_TRUE:.+]], label %[[EUB_FALSE:.+]]
// CHECK-DAG: [[EUB_TRUE]]:		// CHECK-DAG: [[EUB_TRUE]]:
// CHECK: [[NUM_IT_2:%.+]] = load{{.+}},		// CHECK: [[NUM_IT_2:%.+]] = load{{.+}},
// CHECK: br label %[[EUB_END:.+]]		// CHECK: br label %[[EUB_END:.+]]
// CHECK-DAG: [[EUB_FALSE]]:		// CHECK-DAG: [[EUB_FALSE]]:
// CHECK: [[OMP_UB_VAL2:%.+]] = load{{.+}} [[OMP_UB]],		// CHECK: [[OMP_UB_VAL2:%.+]] = load{{.+}} [[OMP_UB]],
// CHECK: br label %[[EUB_END]]		// CHECK: br label %[[EUB_END]]
// CHECK-DAG: [[EUB_END]]:		// CHECK-DAG: [[EUB_END]]:
// CHECK-DAG: [[EUB_RES:%.+]] = phi{{.+}} [ [[NUM_IT_2]], %[[EUB_TRUE]] ], [ [[OMP_UB_VAL2]], %[[EUB_FALSE]] ]		// CHECK-DAG: [[EUB_RES:%.+]] = phi{{.+}} [ [[NUM_IT_2]], %[[EUB_TRUE]] ], [ [[OMP_UB_VAL2]], %[[EUB_FALSE]] ]
// CHECK: store{{.+}} [[EUB_RES]], {{.+}}* [[OMP_UB]],		// CHECK: store{{.+}} [[EUB_RES]], {{.+}}* [[OMP_UB]],

// initialize omp.iv		// initialize omp.iv
// CHECK: [[OMP_LB_VAL_1:%.+]] = load{{.+}}, {{.+}}* [[OMP_LB]],		// CHECK: [[OMP_LB_VAL_1:%.+]] = load{{.+}}, {{.+}}* [[OMP_LB]],
// CHECK: store {{.+}} [[OMP_LB_VAL_1]], {{.+}}* [[OMP_IV]],		// CHECK: store {{.+}} [[OMP_LB_VAL_1]], {{.+}}* [[OMP_IV]],

// check exit condition		// check exit condition
// CHECK-DAG: [[OMP_IV_VAL_1:%.+]] = load {{.+}} [[OMP_IV]],		// CHECK-DAG: [[OMP_IV_VAL_1:%.+]] = load {{.+}} [[OMP_IV]],
// CHECK-DAG: [[OMP_UB_VAL_3:%.+]] = load {{.+}} [[OMP_UB]],		// CHECK-DAG: [[OMP_UB_VAL_3:%.+]] = load {{.+}} [[OMP_CAPT_EXPR]],
// CHECK: [[CMP_IV_UB:%.+]] = icmp sle {{.+}} [[OMP_IV_VAL_1]], [[OMP_UB_VAL_3]]		// CHECK-DAG: [[OMP_UB_VAL_3_PLUS_ONE:%.+]] = add {{.+}} [[OMP_UB_VAL_3]], 1
// CHECK: br {{.+}} [[CMP_IV_UB]], label %[[DIST_OUTER_LOOP_BODY:.+]], label %[[DIST_OUTER_LOOP_END:.+]]		// CHECK: [[CMP_IV_UB:%.+]] = icmp sle {{.+}} [[OMP_IV_VAL_1]], [[OMP_UB_VAL_3_PLUS_ONE]]
		// CHECK: br {{.+}} [[CMP_IV_UB]], label %[[DIST_INNER_LOOP_BODY:.+]], label %[[DIST_INNER_LOOP_END:.+]]
// CHECK: [[DIST_OUTER_LOOP_BODY]]:
// CHECK: br label %[[DIST_INNER_LOOP_HEADER:.+]]

// CHECK: [[DIST_INNER_LOOP_HEADER]]:
// CHECK-DAG: [[OMP_IV_VAL_2:%.+]] = load {{.+}} [[OMP_IV]],
// CHECK-DAG: [[OMP_UB_VAL_4:%.+]] = load {{.+}} [[OMP_UB]],
// CHECK: [[CMP_IV_UB_2:%.+]] = icmp sle {{.+}} [[OMP_IV_VAL_2]], [[OMP_UB_VAL_4]]
// CHECK: br{{.+}} [[CMP_IV_UB_2]], label %[[DIST_INNER_LOOP_BODY:.+]], label %[[DIST_INNER_LOOP_END:.+]]

// check that PrevLB and PrevUB are passed to the 'for'		// check that PrevLB and PrevUB are passed to the 'for'
// CHECK: [[DIST_INNER_LOOP_BODY]]:		// CHECK: [[DIST_INNER_LOOP_BODY]]:
// CHECK-DAG: [[OMP_PREV_LB:%.+]] = load {{.+}}, {{.+}} [[OMP_LB]],		// CHECK-DAG: [[OMP_PREV_LB:%.+]] = load {{.+}}, {{.+}} [[OMP_LB]],
// CHECK-64-DAG: [[OMP_PREV_LB_EXT:%.+]] = zext {{.+}} [[OMP_PREV_LB]] to {{.+}}		// CHECK-64-DAG: [[OMP_PREV_LB_EXT:%.+]] = zext {{.+}} [[OMP_PREV_LB]] to {{.+}}
// CHECK-DAG: [[OMP_PREV_UB:%.+]] = load {{.+}}, {{.+}} [[OMP_UB]],		// CHECK-DAG: [[OMP_PREV_UB:%.+]] = load {{.+}}, {{.+}} [[OMP_UB]],
// CHECK-64-DAG: [[OMP_PREV_UB_EXT:%.+]] = zext {{.+}} [[OMP_PREV_UB]] to {{.+}}		// CHECK-64-DAG: [[OMP_PREV_UB_EXT:%.+]] = zext {{.+}} [[OMP_PREV_UB]] to {{.+}}
// check that distlb and distub are properly passed to fork_call		// check that distlb and distub are properly passed to fork_call
// CHECK-64: call{{.+}} @__kmpc_fork_call({{.+}}, {{.+}}, {{.+}}[[OMP_PARFOR_OUTLINED_3:@.+]] to {{.+}}, i{{[0-9]+}} [[OMP_PREV_LB_EXT]], i{{[0-9]+}} [[OMP_PREV_UB_EXT]], {{.+}})		// CHECK-64: call{{.+}} @__kmpc_fork_call({{.+}}, {{.+}}, {{.+}}[[OMP_PARFOR_OUTLINED_3:@.+]] to {{.+}}, i{{[0-9]+}} [[OMP_PREV_LB_EXT]], i{{[0-9]+}} [[OMP_PREV_UB_EXT]], {{.+}})
// CHECK-32: call{{.+}} @__kmpc_fork_call({{.+}}, {{.+}}, {{.+}}[[OMP_PARFOR_OUTLINED_3:@.+]] to {{.+}}, i{{[0-9]+}} [[OMP_PREV_LB]], i{{[0-9]+}} [[OMP_PREV_UB]], {{.+}})		// CHECK-32: call{{.+}} @__kmpc_fork_call({{.+}}, {{.+}}, {{.+}}[[OMP_PARFOR_OUTLINED_3:@.+]] to {{.+}}, i{{[0-9]+}} [[OMP_PREV_LB]], i{{[0-9]+}} [[OMP_PREV_UB]], {{.+}})
// CHECK: br label %[[DIST_INNER_LOOP_INC:.+]]		// CHECK: br label %[[DIST_INNER_LOOP_INC:.+]]

// check DistInc		// check DistInc
// CHECK: [[DIST_INNER_LOOP_INC]]:		// CHECK: [[DIST_INNER_LOOP_INC]]:
// CHECK-DAG: [[OMP_IV_VAL_3:%.+]] = load {{.+}}, {{.+}}* [[OMP_IV]],		// CHECK-DAG: [[OMP_IV_VAL_3:%.+]] = load {{.+}}, {{.+}}* [[OMP_IV]],
// CHECK-DAG: [[OMP_ST_VAL_1:%.+]] = load {{.+}}, {{.+}}* [[OMP_ST]],		// CHECK-DAG: [[OMP_ST_VAL_1:%.+]] = load {{.+}}, {{.+}}* [[OMP_ST]],
// CHECK: [[OMP_IV_INC:%.+]] = add{{.+}} [[OMP_IV_VAL_3]], [[OMP_ST_VAL_1]]		// CHECK: [[OMP_IV_INC:%.+]] = add{{.+}} [[OMP_IV_VAL_3]], [[OMP_ST_VAL_1]]
// CHECK: store{{.+}} [[OMP_IV_INC]], {{.+}}* [[OMP_IV]],		// CHECK: store{{.+}} [[OMP_IV_INC]], {{.+}}* [[OMP_IV]],
// CHECK: br label %[[DIST_INNER_LOOP_HEADER]]

// CHECK: [[DIST_INNER_LOOP_END]]:
// CHECK: br label %[[DIST_OUTER_LOOP_INC:.+]]

// CHECK: [[DIST_OUTER_LOOP_INC]]:
// check NextLB and NextUB
// CHECK-DAG: [[OMP_LB_VAL_2:%.+]] = load{{.+}}, {{.+}} [[OMP_LB]],		// CHECK-DAG: [[OMP_LB_VAL_2:%.+]] = load{{.+}}, {{.+}} [[OMP_LB]],
// CHECK-DAG: [[OMP_ST_VAL_2:%.+]] = load{{.+}}, {{.+}} [[OMP_ST]],		// CHECK-DAG: [[OMP_ST_VAL_2:%.+]] = load{{.+}}, {{.+}} [[OMP_ST]],
// CHECK-DAG: [[OMP_LB_NEXT:%.+]] = add{{.+}} [[OMP_LB_VAL_2]], [[OMP_ST_VAL_2]]		// CHECK-DAG: [[OMP_LB_NEXT:%.+]] = add{{.+}} [[OMP_LB_VAL_2]], [[OMP_ST_VAL_2]]
// CHECK: store{{.+}} [[OMP_LB_NEXT]], {{.+}}* [[OMP_LB]],		// CHECK: store{{.+}} [[OMP_LB_NEXT]], {{.+}}* [[OMP_LB]],
// CHECK-DAG: [[OMP_UB_VAL_5:%.+]] = load{{.+}}, {{.+}} [[OMP_UB]],		// CHECK-DAG: [[OMP_UB_VAL_5:%.+]] = load{{.+}}, {{.+}} [[OMP_UB]],
// CHECK-DAG: [[OMP_ST_VAL_3:%.+]] = load{{.+}}, {{.+}} [[OMP_ST]],		// CHECK-DAG: [[OMP_ST_VAL_3:%.+]] = load{{.+}}, {{.+}} [[OMP_ST]],
// CHECK-DAG: [[OMP_UB_NEXT:%.+]] = add{{.+}} [[OMP_UB_VAL_5]], [[OMP_ST_VAL_3]]		// CHECK-DAG: [[OMP_UB_NEXT:%.+]] = add{{.+}} [[OMP_UB_VAL_5]], [[OMP_ST_VAL_3]]
// CHECK: store{{.+}} [[OMP_UB_NEXT]], {{.+}}* [[OMP_UB]],		// CHECK: store{{.+}} [[OMP_UB_NEXT]], {{.+}}* [[OMP_UB]],
// CHECK: br label %[[DIST_OUTER_LOOP_HEADER]]

// outer loop exit		// Update UB
// CHECK: [[DIST_OUTER_LOOP_END]]:		// CHECK-DAG: [[OMP_UB_VAL_6:%.+]] = load{{.+}}, {{.+}} [[OMP_UB]],
		// CHECK: [[OMP_EXPR_VAL:%.+]] = load{{.+}}, {{.+}} [[OMP_CAPT_EXPR]],
		// CHECK-DAG: [[CMP_UB_NUM_IT_1:%.+]] = icmp sgt {{.+}}[[OMP_UB_VAL_6]], [[OMP_EXPR_VAL]]
		// CHECK: br {{.+}} [[CMP_UB_NUM_IT_1]], label %[[EUB_TRUE_1:.+]], label %[[EUB_FALSE_1:.+]]
		// CHECK-DAG: [[EUB_TRUE_1]]:
		// CHECK: [[NUM_IT_3:%.+]] = load{{.+}} [[OMP_CAPT_EXPR]],
		// CHECK: br label %[[EUB_END_1:.+]]
		// CHECK-DAG: [[EUB_FALSE_1]]:
		// CHECK: [[OMP_UB_VAL3:%.+]] = load{{.+}} [[OMP_UB]],
		// CHECK: br label %[[EUB_END_1]]
		// CHECK-DAG: [[EUB_END_1]]:
		// CHECK-DAG: [[EUB_RES_1:%.+]] = phi{{.+}} [ [[NUM_IT_3]], %[[EUB_TRUE_1]] ], [ [[OMP_UB_VAL3]], %[[EUB_FALSE_1]] ]
		// CHECK: store{{.+}} [[EUB_RES_1]], {{.+}}* [[OMP_UB]],

		// Store LB in IV
		// CHECK-DAG: [[OMP_LB_VAL_3:%.+]] = load{{.+}}, {{.+}} [[OMP_LB]],
		// CHECK: store{{.+}} [[OMP_LB_VAL_3]], {{.+}}* [[OMP_IV]],

		// CHECK: [[DIST_INNER_LOOP_END]]:
		// CHECK: br label %[[LOOP_EXIT:.+]]

		// loop exit
		// CHECK: [[LOOP_EXIT]]:
// CHECK-DAG: call void @__kmpc_for_static_fini(		// CHECK-DAG: call void @__kmpc_for_static_fini(
// CHECK: ret		// CHECK: ret

// skip implementation of 'parallel for': using default scheduling and was tested above		// skip implementation of 'parallel for': using default scheduling and was tested above

// CHECK: define{{.+}} void [[OFFLOADING_FUN_4]](		// CHECK: define{{.+}} void [[OFFLOADING_FUN_4]](
// CHECK: call {{.}}void {{.+}} @__kmpc_fork_teams({{.+}}, i32 4, {{.+}} [[OMP_OUTLINED_4:@.+]] to {{.+}})		// CHECK: call {{.}}void {{.+}} @__kmpc_fork_teams({{.+}}, i32 4, {{.+}} [[OMP_OUTLINED_4:@.+]] to {{.+}})

▲ Show 20 Lines • Show All 322 Lines • Show Last 20 Lines

This is an archive of the discontinued LLVM Phabricator instance.

[OpenMP][NVPTX] Use single loops when generating code for distribute parallel for
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 171127

include/clang/AST/StmtOpenMP.h

lib/AST/StmtOpenMP.cpp

lib/CodeGen/CGOpenMPRuntime.h

lib/CodeGen/CGOpenMPRuntime.cpp

lib/CodeGen/CGOpenMPRuntimeNVPTX.h

lib/CodeGen/CGOpenMPRuntimeNVPTX.cpp

lib/CodeGen/CGStmtOpenMP.cpp

lib/Sema/SemaOpenMP.cpp

lib/Serialization/ASTReaderStmt.cpp

lib/Serialization/ASTWriterStmt.cpp

test/OpenMP/distribute_parallel_for_codegen.cpp

test/OpenMP/distribute_parallel_for_simd_codegen.cpp

This is an archive of the discontinued LLVM Phabricator instance.

[OpenMP][NVPTX] Use single loops when generating code for distribute parallel for
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 171127

include/clang/AST/StmtOpenMP.h

lib/AST/StmtOpenMP.cpp

lib/CodeGen/CGOpenMPRuntime.h

lib/CodeGen/CGOpenMPRuntime.cpp

lib/CodeGen/CGOpenMPRuntimeNVPTX.h

lib/CodeGen/CGOpenMPRuntimeNVPTX.cpp

lib/CodeGen/CGStmtOpenMP.cpp

lib/Sema/SemaOpenMP.cpp

lib/Serialization/ASTReaderStmt.cpp

lib/Serialization/ASTWriterStmt.cpp

test/OpenMP/distribute_parallel_for_codegen.cpp

test/OpenMP/distribute_parallel_for_simd_codegen.cpp

[OpenMP][NVPTX] Use single loops when generating code for distribute parallel for
ClosedPublic