Diff 324333

llvm/include/llvm/IR/Metadata.h

Show First 20 Lines • Show All 636 Lines • ▼ Show 20 Lines	public:
}		}
};		};

/// A collection of metadata nodes that might be associated with a		/// A collection of metadata nodes that might be associated with a
/// memory access used by the alias-analysis infrastructure.		/// memory access used by the alias-analysis infrastructure.
struct AAMDNodes {		struct AAMDNodes {
explicit AAMDNodes() = default;		explicit AAMDNodes() = default;
explicit AAMDNodes(MDNode T, MDNode TS, MDNode S, MDNode N)		explicit AAMDNodes(MDNode T, MDNode TS, MDNode S, MDNode N)
: TBAA(T), TBAAStruct(TS), Scope(S), NoAlias(N) {}		: TBAA(T), TBAAStruct(TS), Scope(S), NoAlias(N) {}
		jdoerfertUnsubmitted Done Reply Inline Actions Any reason to expose this? If not, maybe make them static members of the AAMDNodes struct, potentially hidden. jdoerfert: Any reason to expose this? If not, maybe make them static members of the AAMDNodes struct…
		wsmosesAuthorUnsubmitted Done Reply Inline Actions I can definitely see other users of such shifting, though if they always use AAMDNodes it will be encapsulated. A public static method seems good to me. wsmoses: I can definitely see other users of such shifting, though if they always use AAMDNodes it will…

bool operator==(const AAMDNodes &A) const {		bool operator==(const AAMDNodes &A) const {
return TBAA == A.TBAA && TBAAStruct == A.TBAAStruct && Scope == A.Scope &&		return TBAA == A.TBAA && TBAAStruct == A.TBAAStruct && Scope == A.Scope &&
NoAlias == A.NoAlias;		NoAlias == A.NoAlias;
}		}

bool operator!=(const AAMDNodes &A) const { return !(*this == A); }		bool operator!=(const AAMDNodes &A) const { return !(*this == A); }

explicit operator bool() const {		explicit operator bool() const {
return TBAA \|\| TBAAStruct \|\| Scope \|\| NoAlias;		return TBAA \|\| TBAAStruct \|\| Scope \|\| NoAlias;
}		}

/// The tag for type-based alias analysis.		/// The tag for type-based alias analysis.
MDNode *TBAA = nullptr;		MDNode *TBAA = nullptr;

/// The tag for type-based alias analysis (tbaa struct).		/// The tag for type-based alias analysis (tbaa struct).
MDNode *TBAAStruct = nullptr;		MDNode *TBAAStruct = nullptr;

/// The tag for alias scope specification (used with noalias).		/// The tag for alias scope specification (used with noalias).
MDNode *Scope = nullptr;		MDNode *Scope = nullptr;

/// The tag specifying the noalias scope.		/// The tag specifying the noalias scope.
MDNode *NoAlias = nullptr;		MDNode *NoAlias = nullptr;

		/// Shift the tbaa metadata node \p MD so that it describes an access
		/// starting \p Offset bytes later than the access it was written for.
		// NOTE(review): callers pass the MDNode * members and store the result in
		// them, so the types here are presumably MDNode *; the declarators appear
		// to be missing in this rendering -- confirm against the real header.
		static MDNode ShiftTBAA(MDNode MD, size_t Offset);

		/// Shift the tbaa.struct metadata node \p MD so that it describes an
		/// access starting \p Offset bytes later than the access it was written
		/// for.
		static MDNode ShiftTBAAStruct(MDNode MD, size_t Offset);

/// Given two sets of AAMDNodes that apply to the same pointer,		/// Given two sets of AAMDNodes that apply to the same pointer,
/// give the best AAMDNodes that are compatible with both (i.e. a set of		/// give the best AAMDNodes that are compatible with both (i.e. a set of
/// nodes whose allowable aliasing conclusions are a subset of those		/// nodes whose allowable aliasing conclusions are a subset of those
/// allowable by both of the inputs). However, for efficiency		/// allowable by both of the inputs). However, for efficiency
/// reasons, do not create any new MDNodes.		/// reasons, do not create any new MDNodes.
AAMDNodes intersect(const AAMDNodes &Other) {		AAMDNodes intersect(const AAMDNodes &Other) {
AAMDNodes Result;		AAMDNodes Result;
Result.TBAA = Other.TBAA == TBAA ? TBAA : nullptr;		Result.TBAA = Other.TBAA == TBAA ? TBAA : nullptr;
Result.TBAAStruct = Other.TBAAStruct == TBAAStruct ? TBAAStruct : nullptr;		Result.TBAAStruct = Other.TBAAStruct == TBAAStruct ? TBAAStruct : nullptr;
Result.Scope = Other.Scope == Scope ? Scope : nullptr;		Result.Scope = Other.Scope == Scope ? Scope : nullptr;
Result.NoAlias = Other.NoAlias == NoAlias ? NoAlias : nullptr;		Result.NoAlias = Other.NoAlias == NoAlias ? NoAlias : nullptr;
return Result;		return Result;
}		}

		/// Create the AAMDNodes that describe this access after its pointer has
		/// been advanced by the constant \p Offset (in bytes).
		///
		/// The TBAA and TBAAStruct tags, when present, are rebased through
		/// ShiftTBAA / ShiftTBAAStruct; Scope and NoAlias are copied unchanged.
		/// The receiver is not modified, hence the method is const.
		AAMDNodes shift(size_t Offset) const {
		  AAMDNodes Result;
		  // An absent tag stays absent; the shifting helpers are only invoked on
		  // tags that actually exist.
		  Result.TBAA = TBAA ? ShiftTBAA(TBAA, Offset) : nullptr;
		  Result.TBAAStruct =
		      TBAAStruct ? ShiftTBAAStruct(TBAAStruct, Offset) : nullptr;
		  // These two tags are forwarded as-is.
		  Result.Scope = Scope;
		  Result.NoAlias = NoAlias;
		  return Result;
		}
};		};

// Specialize DenseMapInfo for AAMDNodes.		// Specialize DenseMapInfo for AAMDNodes.
template<>		template<>
struct DenseMapInfo<AAMDNodes> {		struct DenseMapInfo<AAMDNodes> {
static inline AAMDNodes getEmptyKey() {		static inline AAMDNodes getEmptyKey() {
return AAMDNodes(DenseMapInfo<MDNode *>::getEmptyKey(),		return AAMDNodes(DenseMapInfo<MDNode *>::getEmptyKey(),
nullptr, nullptr, nullptr);		nullptr, nullptr, nullptr);
▲ Show 20 Lines • Show All 771 Lines • Show Last 20 Lines

llvm/include/llvm/IR/Operator.h

Show First 20 Lines • Show All 565 Lines • ▼ Show 20 Lines	public:
/// false and the value of the offset APInt is undefined (it is not		/// false and the value of the offset APInt is undefined (it is not
/// preserved!).		/// preserved!).
///		///
/// The APInt passed into this routine must be at exactly as wide as the		/// The APInt passed into this routine must be at exactly as wide as the
/// IntPtr type for the address space of the base GEP pointer.		/// IntPtr type for the address space of the base GEP pointer.
bool accumulateConstantOffset(		bool accumulateConstantOffset(
const DataLayout &DL, APInt &Offset,		const DataLayout &DL, APInt &Offset,
function_ref<bool(Value &, APInt &)> ExternalAnalysis = nullptr) const;		function_ref<bool(Value &, APInt &)> ExternalAnalysis = nullptr) const;

		/// Static form of accumulateConstantOffset that works from a GEP's source
		/// element type \p SourceType and its index operands \p Index instead of
		/// from an existing GEP object; the member overload forwards to this one
		/// with its own source element type and index operands.
		///
		/// \p Offset is accumulated into in place. \p ExternalAnalysis plays the
		/// same role as in the member overload.
		// NOTE(review): return-value contract presumably matches the member
		// overload documented above (false when the offset is not constant) --
		// confirm against the definition.
		static bool accumulateConstantOffset(
		Type SourceType, ArrayRef<const Value > Index, const DataLayout &DL,
		APInt &Offset,
		function_ref<bool(Value &, APInt &)> ExternalAnalysis = nullptr);
};		};

class PtrToIntOperator		class PtrToIntOperator
: public ConcreteOperator<Operator, Instruction::PtrToInt> {		: public ConcreteOperator<Operator, Instruction::PtrToInt> {
friend class PtrToInt;		friend class PtrToInt;
friend class ConstantExpr;		friend class ConstantExpr;

public:		public:
▲ Show 20 Lines • Show All 59 Lines • Show Last 20 Lines

llvm/lib/Analysis/TypeBasedAliasAnalysis.cpp

	Show First 20 Lines • Show All 731 Lines • ▼ Show 20 Lines
	bool TypeBasedAAWrapperPass::doFinalization(Module &M) {			bool TypeBasedAAWrapperPass::doFinalization(Module &M) {
	Result.reset();			Result.reset();
	return false;			return false;
	}			}

	void TypeBasedAAWrapperPass::getAnalysisUsage(AnalysisUsage &AU) const {			void TypeBasedAAWrapperPass::getAnalysisUsage(AnalysisUsage &AU) const {
	AU.setPreservesAll();			AU.setPreservesAll();
	}			}

				/// Rebase the tbaa access tag \p MD for an access that begins \p Offset
				/// bytes later than the access the tag was written for.
				///
				/// \returns \p MD itself when \p Offset is zero or when \p MD is not a
				/// struct-path tag; null when the tag no longer covers the shifted access
				/// (new format: tag offset + size <= \p Offset; old format: tag offset <
				/// \p Offset); otherwise a node obtained from MDNode::get with the adjusted
				/// operands.
				// NOTE(review): MD is dereferenced with -> and nullptr is returned below,
				// so the parameter and return type are presumably MDNode *; the
				// declarators appear to be missing in this rendering -- confirm.
				// NOTE(review): the lines starting with a reviewer handle inside this
				// body are inline review remarks captured together with the diff.
				MDNode AAMDNodes::ShiftTBAA(MDNode MD, size_t Offset) {
				// Fast path if there's no offset
				if (Offset == 0)
				return MD;
				// Fast path if there's no path tbaa node (and thus scalar)
				if (!isStructPathTBAA(MD))
				jdoerfertUnsubmitted Done Reply Inline Actions Style: No braces. `Offset` not `off`, same elsewhere. `MD` (or similar) not `M`, same elsewhere. jdoerfert: Style: No braces. `Offset` not `off`, same elsewhere. `MD` (or similar) not `M`, same elsewhere.
				return MD;

				// Tag is only consulted for isNewFormat() to pick the operand layout.
				TBAAStructTagNode Tag(MD);
				jdoerfertUnsubmitted Done Reply Inline Actions you push back up to 4 elements, let's go with 4 here too. jdoerfert: you push back up to 4 elements, let's go with 4 here too.
				SmallVector<Metadata *, 5> Sub;
				// Operands 0 and 1 are carried over unchanged; operand 2 is read as the
				// tag's offset, which is the value being rebased.
				Sub.push_back(MD->getOperand(0));
				Sub.push_back(MD->getOperand(1));
				ConstantInt *InnerOffset = mdconst::extract<ConstantInt>(MD->getOperand(2));

				if (Tag.isNewFormat()) {
				// In this layout operand 3 is read as the size of the tagged access.
				ConstantInt *InnerSize = mdconst::extract<ConstantInt>(MD->getOperand(3));

				// The tagged range ends at or before the new start: nothing is left.
				if (InnerOffset->getZExtValue() + InnerSize->getZExtValue() <= Offset) {
				return nullptr;
				}

				// NewOffset may wrap here when the tag starts before Offset; that case
				// is corrected right below by clamping the start to 0 and shrinking the
				// size by the number of bytes cut off the front.
				uint64_t NewSize = InnerSize->getZExtValue();
				uint64_t NewOffset = InnerOffset->getZExtValue() - Offset;
				if (InnerOffset->getZExtValue() < Offset) {
				NewOffset = 0;
				NewSize -= Offset - InnerOffset->getZExtValue();
				}

				Sub.push_back(ConstantAsMetadata::get(
				ConstantInt::get(InnerOffset->getType(), NewOffset)));

				Sub.push_back(ConstantAsMetadata::get(
				ConstantInt::get(InnerSize->getType(), NewSize)));

				// immutable type
				// (optional fifth operand, forwarded unchanged when present)
				if (MD->getNumOperands() >= 5)
				Sub.push_back(MD->getOperand(4));
				} else {
				// No size operand is read in this layout, so a tag that starts before
				// the new start cannot be trimmed and is dropped instead.
				if (InnerOffset->getZExtValue() < Offset)
				return nullptr;

				Sub.push_back(ConstantAsMetadata::get(ConstantInt::get(
				jeroen.dobbelaereUnsubmitted Done Reply Inline Actions What if the offset is inside the specified region instead of at the boundary ? Shouldn't we keep that with a 0 offset and adapted size ? Although keeping it is not strictly necessary, but then we will loose some tbaa information. jeroen.dobbelaere: What if the offset is inside the specified region instead of at the boundary ? Shouldn't we…
				wsmosesAuthorUnsubmitted Not Done Reply Inline Actions Good call, amended to include. wsmoses: Good call, amended to include.
				InnerOffset->getType(), InnerOffset->getZExtValue() - Offset)));

				// immutable type
				jdoerfertUnsubmitted Done Reply Inline Actions shouldn't we break at the end? jdoerfert: shouldn't we break at the end?
				wsmosesAuthorUnsubmitted Done Reply Inline Actions No, we want to extract all of the relevant TBAA.struct pieces. In essence TBAA.struct is a list of triples saying the offset, size, type. There therefore may be several relevant triples. wsmoses: No, we want to extract all of the relevant TBAA.struct pieces. In essence TBAA.struct is a list…
				// (optional fourth operand, forwarded unchanged when present)
				if (MD->getNumOperands() >= 4)
				Sub.push_back(MD->getOperand(3));
				}
				return MDNode::get(MD->getContext(), Sub);
				}

				MDNode AAMDNodes::ShiftTBAAStruct(MDNode MD, size_t Offset) {
				  // Rebase every (offset, size, type) triple of the tbaa.struct node MD so
				  // that it is expressed relative to a start Offset bytes later. Triples
				  // lying entirely before the new start are omitted; triples straddling it
				  // are clamped to begin at 0 with a correspondingly reduced size.
				  // NOTE(review): MD is dereferenced with -> below, so the parameter and
				  // return type are presumably MDNode * -- confirm against the real source.

				  // Nothing to rebase: hand the node back untouched.
				  if (Offset == 0)
				    return MD;

				  SmallVector<Metadata *, 3> Sub;
				  const size_t NumOperands = MD->getNumOperands();
				  for (size_t Idx = 0; Idx < NumOperands; Idx += 3) {
				    ConstantInt *InnerOffset =
				        mdconst::extract<ConstantInt>(MD->getOperand(Idx));
				    ConstantInt *InnerSize =
				        mdconst::extract<ConstantInt>(MD->getOperand(Idx + 1));
				    const uint64_t FieldBegin = InnerOffset->getZExtValue();
				    const uint64_t FieldSize = InnerSize->getZExtValue();

				    // Keep only triples that still reach past the new start.
				    if (FieldBegin + FieldSize > Offset) {
				      uint64_t NewOffset;
				      uint64_t NewSize;
				      if (FieldBegin < Offset) {
				        // Straddles the new start: trim the bytes in front of it.
				        NewOffset = 0;
				        NewSize = FieldSize - (Offset - FieldBegin);
				      } else {
				        // Lies wholly at or after the new start: just slide it down.
				        NewOffset = FieldBegin - Offset;
				        NewSize = FieldSize;
				      }

				      Sub.push_back(ConstantAsMetadata::get(
				          ConstantInt::get(InnerOffset->getType(), NewOffset)));
				      Sub.push_back(ConstantAsMetadata::get(
				          ConstantInt::get(InnerSize->getType(), NewSize)));
				      // The type operand of the triple is forwarded unchanged.
				      Sub.push_back(MD->getOperand(Idx + 2));
				    }
				  }
				  return MDNode::get(MD->getContext(), Sub);
				}
				No newline at end of file

llvm/lib/IR/Operator.cpp

Show First 20 Lines • Show All 55 Lines • ▼ Show 20 Lines	for (gep_type_iterator GTI = gep_type_begin(this), GTE = gep_type_end(this);
Result = Align(MinAlign(Offset, Result.value()));		Result = Align(MinAlign(Offset, Result.value()));
}		}
return Result;		return Result;
}		}

bool GEPOperator::accumulateConstantOffset(		bool GEPOperator::accumulateConstantOffset(
const DataLayout &DL, APInt &Offset,		const DataLayout &DL, APInt &Offset,
function_ref<bool(Value &, APInt &)> ExternalAnalysis) const {		function_ref<bool(Value &, APInt &)> ExternalAnalysis) const {
assert(Offset.getBitWidth() ==		assert(Offset.getBitWidth() ==
DL.getIndexSizeInBits(getPointerAddressSpace()) &&		DL.getIndexSizeInBits(getPointerAddressSpace()) &&
"The offset bit width does not match DL specification.");		"The offset bit width does not match DL specification.");
		SmallVector<const Value *> Index(value_op_begin() + 1, value_op_end());
		return GEPOperator::accumulateConstantOffset(getSourceElementType(), Index,
		DL, Offset, ExternalAnalysis);
		}

		bool GEPOperator::accumulateConstantOffset(
		Type SourceType, ArrayRef<const Value > Index, const DataLayout &DL,
		APInt &Offset, function_ref<bool(Value &, APInt &)> ExternalAnalysis) {
bool UsedExternalAnalysis = false;		bool UsedExternalAnalysis = false;
auto AccumulateOffset = [&](APInt Index, uint64_t Size) -> bool {		auto AccumulateOffset = [&](APInt Index, uint64_t Size) -> bool {
Index = Index.sextOrTrunc(Offset.getBitWidth());		Index = Index.sextOrTrunc(Offset.getBitWidth());
APInt IndexedSize = APInt(Offset.getBitWidth(), Size);		APInt IndexedSize = APInt(Offset.getBitWidth(), Size);
// For array or vector indices, scale the index by the size of the type.		// For array or vector indices, scale the index by the size of the type.
if (!UsedExternalAnalysis) {		if (!UsedExternalAnalysis) {
Offset += Index * IndexedSize;		Offset += Index * IndexedSize;
} else {		} else {
// External Analysis can return a result higher/lower than the value		// External Analysis can return a result higher/lower than the value
// represents. We need to detect overflow/underflow.		// represents. We need to detect overflow/underflow.
bool Overflow = false;		bool Overflow = false;
APInt OffsetPlus = Index.smul_ov(IndexedSize, Overflow);		APInt OffsetPlus = Index.smul_ov(IndexedSize, Overflow);
if (Overflow)		if (Overflow)
return false;		return false;
Offset = Offset.sadd_ov(OffsetPlus, Overflow);		Offset = Offset.sadd_ov(OffsetPlus, Overflow);
if (Overflow)		if (Overflow)
return false;		return false;
}		}
return true;		return true;
};		};
		auto begin = generic_gep_type_iterator<decltype(Index.begin())>::begin(
for (gep_type_iterator GTI = gep_type_begin(this), GTE = gep_type_end(this);		SourceType, Index.begin());
GTI != GTE; ++GTI) {		auto end = generic_gep_type_iterator<decltype(Index.end())>::end(Index.end());
		for (auto GTI = begin, GTE = end; GTI != GTE; ++GTI) {
// Scalable vectors are multiplied by a runtime constant.		// Scalable vectors are multiplied by a runtime constant.
bool ScalableType = false;		bool ScalableType = false;
if (isa<ScalableVectorType>(GTI.getIndexedType()))		if (isa<ScalableVectorType>(GTI.getIndexedType()))
ScalableType = true;		ScalableType = true;

Value *V = GTI.getOperand();		Value *V = GTI.getOperand();
StructType *STy = GTI.getStructTypeOrNull();		StructType *STy = GTI.getStructTypeOrNull();
// Handle ConstantInt if possible.		// Handle ConstantInt if possible.
Show All 39 Lines

llvm/lib/Transforms/Scalar/SROA.cpp

Show First 20 Lines • Show All 2,518 Lines • ▼ Show 20 Lines	if (VecTy) {
NewEndOffset == NewAllocaEndOffset &&		NewEndOffset == NewAllocaEndOffset &&
(canConvertValue(DL, NewAllocaTy, TargetTy) \|\|		(canConvertValue(DL, NewAllocaTy, TargetTy) \|\|
(IsLoadPastEnd && NewAllocaTy->isIntegerTy() &&		(IsLoadPastEnd && NewAllocaTy->isIntegerTy() &&
TargetTy->isIntegerTy()))) {		TargetTy->isIntegerTy()))) {
LoadInst *NewLI = IRB.CreateAlignedLoad(NewAI.getAllocatedType(), &NewAI,		LoadInst *NewLI = IRB.CreateAlignedLoad(NewAI.getAllocatedType(), &NewAI,
NewAI.getAlign(), LI.isVolatile(),		NewAI.getAlign(), LI.isVolatile(),
LI.getName());		LI.getName());
if (AATags)		if (AATags)
NewLI->setAAMetadata(AATags);		NewLI->setAAMetadata(AATags.shift(NewBeginOffset - BeginOffset));
if (LI.isVolatile())		if (LI.isVolatile())
NewLI->setAtomic(LI.getOrdering(), LI.getSyncScopeID());		NewLI->setAtomic(LI.getOrdering(), LI.getSyncScopeID());
if (NewLI->isAtomic())		if (NewLI->isAtomic())
NewLI->setAlignment(LI.getAlign());		NewLI->setAlignment(LI.getAlign());

// Any !nonnull metadata or !range metadata on the old load is also valid		// Any !nonnull metadata or !range metadata on the old load is also valid
// on the new load. This is even true in some cases even when the loads		// on the new load. This is even true in some cases even when the loads
// are different types, for example by mapping !nonnull metadata to		// are different types, for example by mapping !nonnull metadata to
Show All 22 Lines	if (VecTy) {
"endian_shift");		"endian_shift");
}		}
} else {		} else {
Type *LTy = TargetTy->getPointerTo(AS);		Type *LTy = TargetTy->getPointerTo(AS);
LoadInst *NewLI =		LoadInst *NewLI =
IRB.CreateAlignedLoad(TargetTy, getNewAllocaSlicePtr(IRB, LTy),		IRB.CreateAlignedLoad(TargetTy, getNewAllocaSlicePtr(IRB, LTy),
getSliceAlign(), LI.isVolatile(), LI.getName());		getSliceAlign(), LI.isVolatile(), LI.getName());
if (AATags)		if (AATags)
NewLI->setAAMetadata(AATags);		NewLI->setAAMetadata(AATags.shift(NewBeginOffset - BeginOffset));
if (LI.isVolatile())		if (LI.isVolatile())
NewLI->setAtomic(LI.getOrdering(), LI.getSyncScopeID());		NewLI->setAtomic(LI.getOrdering(), LI.getSyncScopeID());

V = NewLI;		V = NewLI;
IsPtrAdjusted = true;		IsPtrAdjusted = true;
}		}
V = convertValue(DL, IRB, V, TargetTy);		V = convertValue(DL, IRB, V, TargetTy);

▲ Show 20 Lines • Show All 46 Lines • ▼ Show 20 Lines	if (V->getType() != VecTy) {

// Mix in the existing elements.		// Mix in the existing elements.
Value *Old = IRB.CreateAlignedLoad(NewAI.getAllocatedType(), &NewAI,		Value *Old = IRB.CreateAlignedLoad(NewAI.getAllocatedType(), &NewAI,
NewAI.getAlign(), "load");		NewAI.getAlign(), "load");
V = insertVector(IRB, Old, V, BeginIndex, "vec");		V = insertVector(IRB, Old, V, BeginIndex, "vec");
}		}
StoreInst *Store = IRB.CreateAlignedStore(V, &NewAI, NewAI.getAlign());		StoreInst *Store = IRB.CreateAlignedStore(V, &NewAI, NewAI.getAlign());
if (AATags)		if (AATags)
Store->setAAMetadata(AATags);		Store->setAAMetadata(AATags.shift(NewBeginOffset - BeginOffset));
Pass.DeadInsts.push_back(&SI);		Pass.DeadInsts.push_back(&SI);

LLVM_DEBUG(dbgs() << " to: " << *Store << "\n");		LLVM_DEBUG(dbgs() << " to: " << *Store << "\n");
return true;		return true;
}		}

bool rewriteIntegerStore(Value *V, StoreInst &SI, AAMDNodes AATags) {		bool rewriteIntegerStore(Value *V, StoreInst &SI, AAMDNodes AATags) {
assert(IntTy && "We cannot extract an integer from the alloca");		assert(IntTy && "We cannot extract an integer from the alloca");
assert(!SI.isVolatile());		assert(!SI.isVolatile());
if (DL.getTypeSizeInBits(V->getType()).getFixedSize() !=		if (DL.getTypeSizeInBits(V->getType()).getFixedSize() !=
IntTy->getBitWidth()) {		IntTy->getBitWidth()) {
Value *Old = IRB.CreateAlignedLoad(NewAI.getAllocatedType(), &NewAI,		Value *Old = IRB.CreateAlignedLoad(NewAI.getAllocatedType(), &NewAI,
NewAI.getAlign(), "oldload");		NewAI.getAlign(), "oldload");
Old = convertValue(DL, IRB, Old, IntTy);		Old = convertValue(DL, IRB, Old, IntTy);
assert(BeginOffset >= NewAllocaBeginOffset && "Out of bounds offset");		assert(BeginOffset >= NewAllocaBeginOffset && "Out of bounds offset");
uint64_t Offset = BeginOffset - NewAllocaBeginOffset;		uint64_t Offset = BeginOffset - NewAllocaBeginOffset;
V = insertInteger(DL, IRB, Old, SI.getValueOperand(), Offset, "insert");		V = insertInteger(DL, IRB, Old, SI.getValueOperand(), Offset, "insert");
}		}
V = convertValue(DL, IRB, V, NewAllocaTy);		V = convertValue(DL, IRB, V, NewAllocaTy);
StoreInst *Store = IRB.CreateAlignedStore(V, &NewAI, NewAI.getAlign());		StoreInst *Store = IRB.CreateAlignedStore(V, &NewAI, NewAI.getAlign());
Store->copyMetadata(SI, {LLVMContext::MD_mem_parallel_loop_access,		Store->copyMetadata(SI, {LLVMContext::MD_mem_parallel_loop_access,
LLVMContext::MD_access_group});		LLVMContext::MD_access_group});
if (AATags)		if (AATags)
Store->setAAMetadata(AATags);		Store->setAAMetadata(AATags.shift(NewBeginOffset - BeginOffset));
Pass.DeadInsts.push_back(&SI);		Pass.DeadInsts.push_back(&SI);
LLVM_DEBUG(dbgs() << " to: " << *Store << "\n");		LLVM_DEBUG(dbgs() << " to: " << *Store << "\n");
return true;		return true;
}		}

bool visitStoreInst(StoreInst &SI) {		bool visitStoreInst(StoreInst &SI) {
LLVM_DEBUG(dbgs() << " original: " << SI << "\n");		LLVM_DEBUG(dbgs() << " original: " << SI << "\n");
Value *OldOp = SI.getOperand(1);		Value *OldOp = SI.getOperand(1);
▲ Show 20 Lines • Show All 53 Lines • ▼ Show 20 Lines	if (NewBeginOffset == NewAllocaBeginOffset &&
unsigned AS = SI.getPointerAddressSpace();		unsigned AS = SI.getPointerAddressSpace();
Value *NewPtr = getNewAllocaSlicePtr(IRB, V->getType()->getPointerTo(AS));		Value *NewPtr = getNewAllocaSlicePtr(IRB, V->getType()->getPointerTo(AS));
NewSI =		NewSI =
IRB.CreateAlignedStore(V, NewPtr, getSliceAlign(), SI.isVolatile());		IRB.CreateAlignedStore(V, NewPtr, getSliceAlign(), SI.isVolatile());
}		}
NewSI->copyMetadata(SI, {LLVMContext::MD_mem_parallel_loop_access,		NewSI->copyMetadata(SI, {LLVMContext::MD_mem_parallel_loop_access,
LLVMContext::MD_access_group});		LLVMContext::MD_access_group});
if (AATags)		if (AATags)
NewSI->setAAMetadata(AATags);		NewSI->setAAMetadata(AATags.shift(NewBeginOffset - BeginOffset));
if (SI.isVolatile())		if (SI.isVolatile())
NewSI->setAtomic(SI.getOrdering(), SI.getSyncScopeID());		NewSI->setAtomic(SI.getOrdering(), SI.getSyncScopeID());
if (NewSI->isAtomic())		if (NewSI->isAtomic())
NewSI->setAlignment(SI.getAlign());		NewSI->setAlignment(SI.getAlign());
Pass.DeadInsts.push_back(&SI);		Pass.DeadInsts.push_back(&SI);
deleteIfTriviallyDead(OldOp);		deleteIfTriviallyDead(OldOp);

LLVM_DEBUG(dbgs() << " to: " << *NewSI << "\n");		LLVM_DEBUG(dbgs() << " to: " << *NewSI << "\n");
▲ Show 20 Lines • Show All 79 Lines • ▼ Show 20 Lines	bool visitMemSetInst(MemSetInst &II) {
// a single value type, just emit a memset.		// a single value type, just emit a memset.
if (!CanContinue) {		if (!CanContinue) {
Type *SizeTy = II.getLength()->getType();		Type *SizeTy = II.getLength()->getType();
Constant *Size = ConstantInt::get(SizeTy, NewEndOffset - NewBeginOffset);		Constant *Size = ConstantInt::get(SizeTy, NewEndOffset - NewBeginOffset);
CallInst *New = IRB.CreateMemSet(		CallInst *New = IRB.CreateMemSet(
getNewAllocaSlicePtr(IRB, OldPtr->getType()), II.getValue(), Size,		getNewAllocaSlicePtr(IRB, OldPtr->getType()), II.getValue(), Size,
MaybeAlign(getSliceAlign()), II.isVolatile());		MaybeAlign(getSliceAlign()), II.isVolatile());
if (AATags)		if (AATags)
New->setAAMetadata(AATags);		New->setAAMetadata(AATags.shift(NewBeginOffset - BeginOffset));
LLVM_DEBUG(dbgs() << " to: " << *New << "\n");		LLVM_DEBUG(dbgs() << " to: " << *New << "\n");
return false;		return false;
}		}

// If we can represent this as a simple value, we have to build the actual		// If we can represent this as a simple value, we have to build the actual
// value to store, which requires expanding the byte present in memset to		// value to store, which requires expanding the byte present in memset to
// a sensible representation for the alloca type. This is essentially		// a sensible representation for the alloca type. This is essentially
// splatting the byte to a sufficiently wide integer, splatting it across		// splatting the byte to a sufficiently wide integer, splatting it across
▲ Show 20 Lines • Show All 52 Lines • ▼ Show 20 Lines	if (VecTy) {
V, cast<FixedVectorType>(AllocaVecTy)->getNumElements());		V, cast<FixedVectorType>(AllocaVecTy)->getNumElements());

V = convertValue(DL, IRB, V, AllocaTy);		V = convertValue(DL, IRB, V, AllocaTy);
}		}

StoreInst *New =		StoreInst *New =
IRB.CreateAlignedStore(V, &NewAI, NewAI.getAlign(), II.isVolatile());		IRB.CreateAlignedStore(V, &NewAI, NewAI.getAlign(), II.isVolatile());
if (AATags)		if (AATags)
New->setAAMetadata(AATags);		New->setAAMetadata(AATags.shift(NewBeginOffset - BeginOffset));
LLVM_DEBUG(dbgs() << " to: " << *New << "\n");		LLVM_DEBUG(dbgs() << " to: " << *New << "\n");
return !II.isVolatile();		return !II.isVolatile();
}		}

bool visitMemTransferInst(MemTransferInst &II) {		bool visitMemTransferInst(MemTransferInst &II) {
// Rewriting of memory transfer instructions can be a bit tricky. We break		// Rewriting of memory transfer instructions can be a bit tricky. We break
// them into two categories: split intrinsics and unsplit intrinsics.		// them into two categories: split intrinsics and unsplit intrinsics.

▲ Show 20 Lines • Show All 104 Lines • ▼ Show 20 Lines	if (EmitMemCpy) {
DestPtr = OtherPtr;		DestPtr = OtherPtr;
DestAlign = OtherAlign;		DestAlign = OtherAlign;
SrcPtr = OurPtr;		SrcPtr = OurPtr;
SrcAlign = SliceAlign;		SrcAlign = SliceAlign;
}		}
CallInst *New = IRB.CreateMemCpy(DestPtr, DestAlign, SrcPtr, SrcAlign,		CallInst *New = IRB.CreateMemCpy(DestPtr, DestAlign, SrcPtr, SrcAlign,
Size, II.isVolatile());		Size, II.isVolatile());
if (AATags)		if (AATags)
New->setAAMetadata(AATags);		New->setAAMetadata(AATags.shift(NewBeginOffset - BeginOffset));
LLVM_DEBUG(dbgs() << " to: " << *New << "\n");		LLVM_DEBUG(dbgs() << " to: " << *New << "\n");
return false;		return false;
}		}

bool IsWholeAlloca = NewBeginOffset == NewAllocaBeginOffset &&		bool IsWholeAlloca = NewBeginOffset == NewAllocaBeginOffset &&
NewEndOffset == NewAllocaEndOffset;		NewEndOffset == NewAllocaEndOffset;
uint64_t Size = NewEndOffset - NewBeginOffset;		uint64_t Size = NewEndOffset - NewBeginOffset;
unsigned BeginIndex = VecTy ? getIndex(NewBeginOffset) : 0;		unsigned BeginIndex = VecTy ? getIndex(NewBeginOffset) : 0;
Show All 37 Lines	if (VecTy && !IsWholeAlloca && !IsDest) {
NewAI.getAlign(), "load");		NewAI.getAlign(), "load");
Src = convertValue(DL, IRB, Src, IntTy);		Src = convertValue(DL, IRB, Src, IntTy);
uint64_t Offset = NewBeginOffset - NewAllocaBeginOffset;		uint64_t Offset = NewBeginOffset - NewAllocaBeginOffset;
Src = extractInteger(DL, IRB, Src, SubIntTy, Offset, "extract");		Src = extractInteger(DL, IRB, Src, SubIntTy, Offset, "extract");
} else {		} else {
LoadInst *Load = IRB.CreateAlignedLoad(OtherTy, SrcPtr, SrcAlign,		LoadInst *Load = IRB.CreateAlignedLoad(OtherTy, SrcPtr, SrcAlign,
II.isVolatile(), "copyload");		II.isVolatile(), "copyload");
if (AATags)		if (AATags)
Load->setAAMetadata(AATags);		Load->setAAMetadata(AATags.shift(NewBeginOffset - BeginOffset));
Src = Load;		Src = Load;
}		}

if (VecTy && !IsWholeAlloca && IsDest) {		if (VecTy && !IsWholeAlloca && IsDest) {
Value *Old = IRB.CreateAlignedLoad(NewAI.getAllocatedType(), &NewAI,		Value *Old = IRB.CreateAlignedLoad(NewAI.getAllocatedType(), &NewAI,
NewAI.getAlign(), "oldload");		NewAI.getAlign(), "oldload");
Src = insertVector(IRB, Old, Src, BeginIndex, "vec");		Src = insertVector(IRB, Old, Src, BeginIndex, "vec");
} else if (IntTy && !IsWholeAlloca && IsDest) {		} else if (IntTy && !IsWholeAlloca && IsDest) {
Value *Old = IRB.CreateAlignedLoad(NewAI.getAllocatedType(), &NewAI,		Value *Old = IRB.CreateAlignedLoad(NewAI.getAllocatedType(), &NewAI,
NewAI.getAlign(), "oldload");		NewAI.getAlign(), "oldload");
Old = convertValue(DL, IRB, Old, IntTy);		Old = convertValue(DL, IRB, Old, IntTy);
uint64_t Offset = NewBeginOffset - NewAllocaBeginOffset;		uint64_t Offset = NewBeginOffset - NewAllocaBeginOffset;
Src = insertInteger(DL, IRB, Old, Src, Offset, "insert");		Src = insertInteger(DL, IRB, Old, Src, Offset, "insert");
Src = convertValue(DL, IRB, Src, NewAllocaTy);		Src = convertValue(DL, IRB, Src, NewAllocaTy);
}		}

StoreInst *Store = cast<StoreInst>(		StoreInst *Store = cast<StoreInst>(
IRB.CreateAlignedStore(Src, DstPtr, DstAlign, II.isVolatile()));		IRB.CreateAlignedStore(Src, DstPtr, DstAlign, II.isVolatile()));
if (AATags)		if (AATags)
Store->setAAMetadata(AATags);		Store->setAAMetadata(AATags.shift(NewBeginOffset - BeginOffset));
LLVM_DEBUG(dbgs() << " to: " << *Store << "\n");		LLVM_DEBUG(dbgs() << " to: " << *Store << "\n");
return !II.isVolatile();		return !II.isVolatile();
}		}

bool visitIntrinsicInst(IntrinsicInst &II) {		bool visitIntrinsicInst(IntrinsicInst &II) {
assert((II.isLifetimeStartOrEnd() \|\| II.isDroppable()) &&		assert((II.isLifetimeStartOrEnd() \|\| II.isDroppable()) &&
"Unexpected intrinsic!");		"Unexpected intrinsic!");
LLVM_DEBUG(dbgs() << " original: " << II << "\n");		LLVM_DEBUG(dbgs() << " original: " << II << "\n");
▲ Show 20 Lines • Show All 284 Lines • ▼ Show 20 Lines	struct LoadOpSplitter : public OpSplitter<LoadOpSplitter> {
/// recursive emission to actually load values.		/// recursive emission to actually load values.
void emitFunc(Type Ty, Value &Agg, Align Alignment, const Twine &Name) {		void emitFunc(Type Ty, Value &Agg, Align Alignment, const Twine &Name) {
assert(Ty->isSingleValueType());		assert(Ty->isSingleValueType());
// Load the single value and insert it using the indices.		// Load the single value and insert it using the indices.
Value *GEP =		Value *GEP =
IRB.CreateInBoundsGEP(BaseTy, Ptr, GEPIndices, Name + ".gep");		IRB.CreateInBoundsGEP(BaseTy, Ptr, GEPIndices, Name + ".gep");
LoadInst *Load =		LoadInst *Load =
IRB.CreateAlignedLoad(Ty, GEP, Alignment, Name + ".load");		IRB.CreateAlignedLoad(Ty, GEP, Alignment, Name + ".load");
if (AATags)
Load->setAAMetadata(AATags);		APInt Offset(
		DL.getIndexSizeInBits(Ptr->getType()->getPointerAddressSpace()), 0);
		if (AATags &&
		GEPOperator::accumulateConstantOffset(BaseTy, GEPIndices, DL, Offset))
		jdoerfertUnsubmitted Done Reply Inline Actions No temporary GEPs, please. What is wrong with `GEP`? jdoerfert: No temporary GEPs, please. What is wrong with `GEP`?
		wsmosesAuthorUnsubmitted Done Reply Inline Actions The problem is that the GEP instruction itself may be constant folded by the IRBuilder (and thus why it only returns a value and not a gep instruction). wsmoses: The problem is that the GEP instruction itself may be constant folded by the IRBuilder (and…
		jdoerfertUnsubmitted Done Reply Inline Actions Hm, do we need this for anything other than struct types? jdoerfert: Hm, do we need this for anything other than struct types?
		wsmosesAuthorUnsubmitted Done Reply Inline Actions When you say struct types do you mean tbaa.struct (used in memcpy), tbaa struct path information, or something else? We definitely need this in tbaa.struct per the memcpy test case. I think we also want it for regular tbaa (e.g. you have a load which uses regular tbaa info and it should have its tbaa with the correct offset). Likewise I can imagine optimization passes other than SROA needing to do this sort of offset procedure (hence my inclination to make the API public for the shifting). wsmoses: When you say struct types do you mean tbaa.struct (used in memcpy), tbaa struct path…
		Load->setAAMetadata(AATags.shift(Offset.getZExtValue()));

Agg = IRB.CreateInsertValue(Agg, Load, Indices, Name + ".insert");		Agg = IRB.CreateInsertValue(Agg, Load, Indices, Name + ".insert");
LLVM_DEBUG(dbgs() << " to: " << *Load << "\n");		LLVM_DEBUG(dbgs() << " to: " << *Load << "\n");
}		}
};		};

bool visitLoadInst(LoadInst &LI) {		bool visitLoadInst(LoadInst &LI) {
assert(LI.getPointerOperand() == *U);		assert(LI.getPointerOperand() == *U);
if (!LI.isSimple() \|\| LI.getType()->isSingleValueType())		if (!LI.isSimple() \|\| LI.getType()->isSingleValueType())
Show All 29 Lines	void emitFunc(Type Ty, Value &Agg, Align Alignment, const Twine &Name) {
// The gep and extractvalue values are factored out of the CreateStore		// The gep and extractvalue values are factored out of the CreateStore
// call to make the output independent of the argument evaluation order.		// call to make the output independent of the argument evaluation order.
Value *ExtractValue =		Value *ExtractValue =
IRB.CreateExtractValue(Agg, Indices, Name + ".extract");		IRB.CreateExtractValue(Agg, Indices, Name + ".extract");
Value *InBoundsGEP =		Value *InBoundsGEP =
IRB.CreateInBoundsGEP(BaseTy, Ptr, GEPIndices, Name + ".gep");		IRB.CreateInBoundsGEP(BaseTy, Ptr, GEPIndices, Name + ".gep");
StoreInst *Store =		StoreInst *Store =
IRB.CreateAlignedStore(ExtractValue, InBoundsGEP, Alignment);		IRB.CreateAlignedStore(ExtractValue, InBoundsGEP, Alignment);
if (AATags)
Store->setAAMetadata(AATags);		APInt Offset(
		DL.getIndexSizeInBits(Ptr->getType()->getPointerAddressSpace()), 0);
		if (AATags &&
		GEPOperator::accumulateConstantOffset(BaseTy, GEPIndices, DL, Offset))
		jdoerfertUnsubmitted Done Reply Inline Actions No temporary GEPs, please. What is wrong with `InBoundsGEP`? jdoerfert: No temporary GEPs, please. What is wrong with `InBoundsGEP`?
		wsmosesAuthorUnsubmitted Done Reply Inline Actions Same reply as above. wsmoses: Same reply as above.
		Store->setAAMetadata(AATags.shift(Offset.getZExtValue()));

LLVM_DEBUG(dbgs() << " to: " << *Store << "\n");		LLVM_DEBUG(dbgs() << " to: " << *Store << "\n");
}		}
};		};

bool visitStoreInst(StoreInst &SI) {		bool visitStoreInst(StoreInst &SI) {
if (!SI.isSimple() || SI.getPointerOperand() != *U)		if (!SI.isSimple() || SI.getPointerOperand() != *U)
return false;		return false;
Value *V = SI.getValueOperand();		Value *V = SI.getValueOperand();
▲ Show 20 Lines • Show All 1,377 Lines • Show Last 20 Lines

llvm/test/Transforms/SROA/basictest.ll

	Show First 20 Lines • Show All 139 Lines • ▼ Show 20 Lines
	; CHECK-NEXT: %[[test3_a6:.*]] = alloca [7 x i8]			; CHECK-NEXT: %[[test3_a6:.*]] = alloca [7 x i8]
	; CHECK-NEXT: %[[test3_a7:.*]] = alloca [85 x i8]			; CHECK-NEXT: %[[test3_a7:.*]] = alloca [85 x i8]

	%b = getelementptr [300 x i8], [300 x i8]* %a, i64 0, i64 0			%b = getelementptr [300 x i8], [300 x i8]* %a, i64 0, i64 0
	call void @llvm.memcpy.p0i8.p0i8.i32(i8* %b, i8* align 8 %src, i32 300, i1 false), !tbaa !0			call void @llvm.memcpy.p0i8.p0i8.i32(i8* %b, i8* align 8 %src, i32 300, i1 false), !tbaa !0
	; CHECK-NEXT: %[[gep_dst:.*]] = getelementptr inbounds [42 x i8], [42 x i8]* %[[test3_a1]], i64 0, i64 0			; CHECK-NEXT: %[[gep_dst:.*]] = getelementptr inbounds [42 x i8], [42 x i8]* %[[test3_a1]], i64 0, i64 0
	; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %[[gep_dst]], i8* align 8 %src, i32 42, {{.*}}), !tbaa [[TAG_0:!.*]]			; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %[[gep_dst]], i8* align 8 %src, i32 42, {{.*}}), !tbaa [[TAG_0:!.*]]
	; CHECK-NEXT: %[[gep:.*]] = getelementptr inbounds i8, i8* %src, i64 42			; CHECK-NEXT: %[[gep:.*]] = getelementptr inbounds i8, i8* %src, i64 42
	; CHECK-NEXT: %[[test3_r1:.*]] = load i8, i8* %[[gep]], {{.*}}, !tbaa [[TAG_0]]			; CHECK-NEXT: %[[test3_r1:.*]] = load i8, i8* %[[gep]], {{.*}}, !tbaa [[TAG_0_M42:!.*]]
	; CHECK-NEXT: %[[gep_src:.*]] = getelementptr inbounds i8, i8* %src, i64 43			; CHECK-NEXT: %[[gep_src:.*]] = getelementptr inbounds i8, i8* %src, i64 43
	; CHECK-NEXT: %[[gep_dst:.*]] = getelementptr inbounds [99 x i8], [99 x i8]* %[[test3_a2]], i64 0, i64 0			; CHECK-NEXT: %[[gep_dst:.*]] = getelementptr inbounds [99 x i8], [99 x i8]* %[[test3_a2]], i64 0, i64 0
	; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %[[gep_dst]], i8* align 1 %[[gep_src]], i32 99, {{.*}}), !tbaa [[TAG_0:!.*]]			; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %[[gep_dst]], i8* align 1 %[[gep_src]], i32 99, {{.*}}), !tbaa [[TAG_0_M43:!.*]]
	; CHECK-NEXT: %[[gep_src:.*]] = getelementptr inbounds i8, i8* %src, i64 142			; CHECK-NEXT: %[[gep_src:.*]] = getelementptr inbounds i8, i8* %src, i64 142
	; CHECK-NEXT: %[[gep_dst:.*]] = getelementptr inbounds [16 x i8], [16 x i8]* %[[test3_a3]], i64 0, i64 0			; CHECK-NEXT: %[[gep_dst:.*]] = getelementptr inbounds [16 x i8], [16 x i8]* %[[test3_a3]], i64 0, i64 0
	; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %[[gep_dst]], i8* align 2 %[[gep_src]], i32 16, {{.*}}), !tbaa [[TAG_0:!.*]]			; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %[[gep_dst]], i8* align 2 %[[gep_src]], i32 16, {{.*}}), !tbaa [[TAG_0_M142:!.*]]
	; CHECK-NEXT: %[[gep_src:.*]] = getelementptr inbounds i8, i8* %src, i64 158			; CHECK-NEXT: %[[gep_src:.*]] = getelementptr inbounds i8, i8* %src, i64 158
	; CHECK-NEXT: %[[gep_dst:.*]] = getelementptr inbounds [42 x i8], [42 x i8]* %[[test3_a4]], i64 0, i64 0			; CHECK-NEXT: %[[gep_dst:.*]] = getelementptr inbounds [42 x i8], [42 x i8]* %[[test3_a4]], i64 0, i64 0
	; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %[[gep_dst]], i8* align 2 %[[gep_src]], i32 42, {{.*}}), !tbaa [[TAG_0:!.*]]			; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %[[gep_dst]], i8* align 2 %[[gep_src]], i32 42, {{.*}}), !tbaa [[TAG_0_M158:!.*]]
	; CHECK-NEXT: %[[gep_src:.*]] = getelementptr inbounds i8, i8* %src, i64 200			; CHECK-NEXT: %[[gep_src:.*]] = getelementptr inbounds i8, i8* %src, i64 200
	; CHECK-NEXT: %[[gep_dst:.*]] = getelementptr inbounds [7 x i8], [7 x i8]* %[[test3_a5]], i64 0, i64 0			; CHECK-NEXT: %[[gep_dst:.*]] = getelementptr inbounds [7 x i8], [7 x i8]* %[[test3_a5]], i64 0, i64 0
	; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %[[gep_dst]], i8* align 8 %[[gep_src]], i32 7, {{.*}}), !tbaa [[TAG_0:!.*]]			; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %[[gep_dst]], i8* align 8 %[[gep_src]], i32 7, {{.*}})
	; CHECK-NEXT: %[[gep:.*]] = getelementptr inbounds i8, i8* %src, i64 207			; CHECK-NEXT: %[[gep:.*]] = getelementptr inbounds i8, i8* %src, i64 207
	; CHECK-NEXT: %[[test3_r2:.*]] = load i8, i8* %[[gep]], {{.*}}, !tbaa [[TAG_0]]			; CHECK-NOT: %[[bad_test3_r2:.*]] = load i8, i8* %[[gep]], {{.*}}, !tbaa
				; CHECK-NEXT: %[[test3_r2:.*]] = load i8, i8* %[[gep]], {{.*}}
	; CHECK-NEXT: %[[gep_src:.*]] = getelementptr inbounds i8, i8* %src, i64 208			; CHECK-NEXT: %[[gep_src:.*]] = getelementptr inbounds i8, i8* %src, i64 208
	; CHECK-NEXT: %[[gep_dst:.*]] = getelementptr inbounds [7 x i8], [7 x i8]* %[[test3_a6]], i64 0, i64 0			; CHECK-NEXT: %[[gep_dst:.*]] = getelementptr inbounds [7 x i8], [7 x i8]* %[[test3_a6]], i64 0, i64 0
	; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %[[gep_dst]], i8* align 8 %[[gep_src]], i32 7, {{.*}}), !tbaa [[TAG_0:!.*]]			; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %[[gep_dst]], i8* align 8 %[[gep_src]], i32 7, {{.*}})
	; CHECK-NEXT: %[[gep_src:.*]] = getelementptr inbounds i8, i8* %src, i64 215			; CHECK-NEXT: %[[gep_src:.*]] = getelementptr inbounds i8, i8* %src, i64 215
	; CHECK-NEXT: %[[gep_dst:.*]] = getelementptr inbounds [85 x i8], [85 x i8]* %[[test3_a7]], i64 0, i64 0			; CHECK-NEXT: %[[gep_dst:.*]] = getelementptr inbounds [85 x i8], [85 x i8]* %[[test3_a7]], i64 0, i64 0
	; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %[[gep_dst]], i8* align 1 %[[gep_src]], i32 85, {{.*}}), !tbaa [[TAG_0:!.*]]			; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %[[gep_dst]], i8* align 1 %[[gep_src]], i32 85, {{.*}})

	; Clobber a single element of the array, this should be promotable, and be deleted.			; Clobber a single element of the array, this should be promotable, and be deleted.
	%c = getelementptr [300 x i8], [300 x i8]* %a, i64 0, i64 42			%c = getelementptr [300 x i8], [300 x i8]* %a, i64 0, i64 42
	store i8 0, i8* %c			store i8 0, i8* %c

	; Make a sequence of overlapping stores to the array. These overlap both in			; Make a sequence of overlapping stores to the array. These overlap both in
	; forward strides and in shrinking accesses.			; forward strides and in shrinking accesses.
	%overlap.1.i8 = getelementptr [300 x i8], [300 x i8]* %a, i64 0, i64 142			%overlap.1.i8 = getelementptr [300 x i8], [300 x i8]* %a, i64 0, i64 142
	▲ Show 20 Lines • Show All 128 Lines • ▼ Show 20 Lines
	; CHECK-NEXT: store i32 4, i32* %[[bitcast]], {{.}}, !tbaa [[TAG_49:!.]]			; CHECK-NEXT: store i32 4, i32* %[[bitcast]], {{.}}, !tbaa [[TAG_49:!.]]

	%overlap2.prefix = getelementptr i8, i8* %overlap2.1.1.i8, i64 -4			%overlap2.prefix = getelementptr i8, i8* %overlap2.1.1.i8, i64 -4
	call void @llvm.memcpy.p0i8.p0i8.i32(i8* %overlap2.prefix, i8* %src, i32 8, i1 false), !tbaa !51			call void @llvm.memcpy.p0i8.p0i8.i32(i8* %overlap2.prefix, i8* %src, i32 8, i1 false), !tbaa !51
	; CHECK-NEXT: %[[gep_dst:.]] = getelementptr inbounds [42 x i8], [42 x i8] %[[test3_a4]], i64 0, i64 39			; CHECK-NEXT: %[[gep_dst:.]] = getelementptr inbounds [42 x i8], [42 x i8] %[[test3_a4]], i64 0, i64 39
	; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %[[gep_dst]], i8* align 1 %src, i32 3, {{.}}), !tbaa [[TAG_51:!.]]			; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %[[gep_dst]], i8* align 1 %src, i32 3, {{.}}), !tbaa [[TAG_51:!.]]
	; CHECK-NEXT: %[[gep_src:.]] = getelementptr inbounds i8, i8 %src, i64 3			; CHECK-NEXT: %[[gep_src:.]] = getelementptr inbounds i8, i8 %src, i64 3
	; CHECK-NEXT: %[[gep_dst:.]] = getelementptr inbounds [7 x i8], [7 x i8] %[[test3_a5]], i64 0, i64 0			; CHECK-NEXT: %[[gep_dst:.]] = getelementptr inbounds [7 x i8], [7 x i8] %[[test3_a5]], i64 0, i64 0
	; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %[[gep_dst]], i8* align 1 %[[gep_src]], i32 5, {{.*}}), !tbaa [[TAG_51]]			; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %[[gep_dst]], i8* align 1 %[[gep_src]], i32 5, {{.*}})

	; Bridge between the overlapping areas			; Bridge between the overlapping areas
	call void @llvm.memset.p0i8.i32(i8* %overlap2.1.2.i8, i8 42, i32 8, i1 false), !tbaa !53			call void @llvm.memset.p0i8.i32(i8* %overlap2.1.2.i8, i8 42, i32 8, i1 false), !tbaa !53
	; CHECK-NEXT: %[[gep:.]] = getelementptr inbounds [7 x i8], [7 x i8] %[[test3_a5]], i64 0, i64 2			; CHECK-NEXT: %[[gep:.]] = getelementptr inbounds [7 x i8], [7 x i8] %[[test3_a5]], i64 0, i64 2
	; CHECK-NEXT: call void @llvm.memset.p0i8.i32(i8* align 1 %[[gep]], i8 42, i32 5, {{.}}), !tbaa [[TAG_53:!.]]			; CHECK-NEXT: call void @llvm.memset.p0i8.i32(i8* align 1 %[[gep]], i8 42, i32 5, {{.}}), !tbaa [[TAG_53:!.]]
	; ...promoted i8 store...			; ...promoted i8 store...
	; CHECK-NEXT: %[[gep:.]] = getelementptr inbounds [7 x i8], [7 x i8] %[[test3_a6]], i64 0, i64 0			; CHECK-NEXT: %[[gep:.]] = getelementptr inbounds [7 x i8], [7 x i8] %[[test3_a6]], i64 0, i64 0
	; CHECK-NEXT: call void @llvm.memset.p0i8.i32(i8* align 1 %[[gep]], i8 42, i32 2, {{.*}}), !tbaa [[TAG_53]]			; CHECK-NEXT: call void @llvm.memset.p0i8.i32(i8* align 1 %[[gep]], i8 42, i32 2, {{.*}})

	; Entirely within the second overlap.			; Entirely within the second overlap.
	call void @llvm.memcpy.p0i8.p0i8.i32(i8* %overlap2.2.1.i8, i8* %src, i32 5, i1 false), !tbaa !55			call void @llvm.memcpy.p0i8.p0i8.i32(i8* %overlap2.2.1.i8, i8* %src, i32 5, i1 false), !tbaa !55
	; CHECK-NEXT: %[[gep:.]] = getelementptr inbounds [7 x i8], [7 x i8] %[[test3_a6]], i64 0, i64 1			; CHECK-NEXT: %[[gep:.]] = getelementptr inbounds [7 x i8], [7 x i8] %[[test3_a6]], i64 0, i64 1
	; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %[[gep]], i8* align 1 %src, i32 5, {{.}}), !tbaa [[TAG_55:!.]]			; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %[[gep]], i8* align 1 %src, i32 5, {{.}}), !tbaa [[TAG_55:!.]]

	; Trailing past the second overlap.			; Trailing past the second overlap.
	call void @llvm.memcpy.p0i8.p0i8.i32(i8* %overlap2.2.2.i8, i8* %src, i32 8, i1 false), !tbaa !57			call void @llvm.memcpy.p0i8.p0i8.i32(i8* %overlap2.2.2.i8, i8* %src, i32 8, i1 false), !tbaa !57
	; CHECK-NEXT: %[[gep:.]] = getelementptr inbounds [7 x i8], [7 x i8] %[[test3_a6]], i64 0, i64 2			; CHECK-NEXT: %[[gep:.]] = getelementptr inbounds [7 x i8], [7 x i8] %[[test3_a6]], i64 0, i64 2
	; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %[[gep]], i8* align 1 %src, i32 5, {{.}}), !tbaa [[TAG_57:!.]]			; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %[[gep]], i8* align 1 %src, i32 5, {{.}}), !tbaa [[TAG_57:!.]]
	; CHECK-NEXT: %[[gep_src:.]] = getelementptr inbounds i8, i8 %src, i64 5			; CHECK-NEXT: %[[gep_src:.]] = getelementptr inbounds i8, i8 %src, i64 5
	; CHECK-NEXT: %[[gep_dst:.]] = getelementptr inbounds [85 x i8], [85 x i8] %[[test3_a7]], i64 0, i64 0			; CHECK-NEXT: %[[gep_dst:.]] = getelementptr inbounds [85 x i8], [85 x i8] %[[test3_a7]], i64 0, i64 0
	; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %[[gep_dst]], i8* align 1 %[[gep_src]], i32 3, {{.*}}), !tbaa [[TAG_57]]			; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %[[gep_dst]], i8* align 1 %[[gep_src]], i32 3, {{.*}})

	call void @llvm.memcpy.p0i8.p0i8.i32(i8* %dst, i8* %b, i32 300, i1 false), !tbaa !59			call void @llvm.memcpy.p0i8.p0i8.i32(i8* %dst, i8* %b, i32 300, i1 false), !tbaa !59
	; CHECK-NEXT: %[[gep:.]] = getelementptr inbounds [42 x i8], [42 x i8] %[[test3_a1]], i64 0, i64 0			; CHECK-NEXT: %[[gep:.]] = getelementptr inbounds [42 x i8], [42 x i8] %[[test3_a1]], i64 0, i64 0
	; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %dst, i8* align 1 %[[gep]], i32 42, {{.}}), !tbaa [[TAG_59:!.]]			; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %dst, i8* align 1 %[[gep]], i32 42, {{.}}), !tbaa [[TAG_59:!.]]
	; CHECK-NEXT: %[[gep:.]] = getelementptr inbounds i8, i8 %dst, i64 42			; CHECK-NEXT: %[[gep:.]] = getelementptr inbounds i8, i8 %dst, i64 42
	; CHECK-NEXT: store i8 0, i8* %[[gep]], {{.*}}, !tbaa [[TAG_59]]			; CHECK-NEXT: store i8 0, i8* %[[gep]], {{.*}}
	; CHECK-NEXT: %[[gep_dst:.]] = getelementptr inbounds i8, i8 %dst, i64 43			; CHECK-NEXT: %[[gep_dst:.]] = getelementptr inbounds i8, i8 %dst, i64 43
	; CHECK-NEXT: %[[gep_src:.]] = getelementptr inbounds [99 x i8], [99 x i8] %[[test3_a2]], i64 0, i64 0			; CHECK-NEXT: %[[gep_src:.]] = getelementptr inbounds [99 x i8], [99 x i8] %[[test3_a2]], i64 0, i64 0
	; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %[[gep_dst]], i8* align 1 %[[gep_src]], i32 99, {{.*}}), !tbaa [[TAG_59]]			; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %[[gep_dst]], i8* align 1 %[[gep_src]], i32 99, {{.*}})
	; CHECK-NEXT: %[[gep_dst:.]] = getelementptr inbounds i8, i8 %dst, i64 142			; CHECK-NEXT: %[[gep_dst:.]] = getelementptr inbounds i8, i8 %dst, i64 142
	; CHECK-NEXT: %[[gep_src:.]] = getelementptr inbounds [16 x i8], [16 x i8] %[[test3_a3]], i64 0, i64 0			; CHECK-NEXT: %[[gep_src:.]] = getelementptr inbounds [16 x i8], [16 x i8] %[[test3_a3]], i64 0, i64 0
	; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %[[gep_dst]], i8* align 1 %[[gep_src]], i32 16, {{.*}}), !tbaa [[TAG_59]]			; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %[[gep_dst]], i8* align 1 %[[gep_src]], i32 16, {{.*}})
	; CHECK-NEXT: %[[gep_dst:.]] = getelementptr inbounds i8, i8 %dst, i64 158			; CHECK-NEXT: %[[gep_dst:.]] = getelementptr inbounds i8, i8 %dst, i64 158
	; CHECK-NEXT: %[[gep_src:.]] = getelementptr inbounds [42 x i8], [42 x i8] %[[test3_a4]], i64 0, i64 0			; CHECK-NEXT: %[[gep_src:.]] = getelementptr inbounds [42 x i8], [42 x i8] %[[test3_a4]], i64 0, i64 0
	; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %[[gep_dst]], i8* align 1 %[[gep_src]], i32 42, {{.*}}), !tbaa [[TAG_59]]			; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %[[gep_dst]], i8* align 1 %[[gep_src]], i32 42, {{.*}})
	; CHECK-NEXT: %[[gep_dst:.]] = getelementptr inbounds i8, i8 %dst, i64 200			; CHECK-NEXT: %[[gep_dst:.]] = getelementptr inbounds i8, i8 %dst, i64 200
	; CHECK-NEXT: %[[gep_src:.]] = getelementptr inbounds [7 x i8], [7 x i8] %[[test3_a5]], i64 0, i64 0			; CHECK-NEXT: %[[gep_src:.]] = getelementptr inbounds [7 x i8], [7 x i8] %[[test3_a5]], i64 0, i64 0
	; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %[[gep_dst]], i8* align 1 %[[gep_src]], i32 7, {{.*}}), !tbaa [[TAG_59]]			; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %[[gep_dst]], i8* align 1 %[[gep_src]], i32 7, {{.*}})
	; CHECK-NEXT: %[[gep:.]] = getelementptr inbounds i8, i8 %dst, i64 207			; CHECK-NEXT: %[[gep:.]] = getelementptr inbounds i8, i8 %dst, i64 207
	; CHECK-NEXT: store i8 42, i8* %[[gep]], {{.*}}, !tbaa [[TAG_59]]			; CHECK-NEXT: store i8 42, i8* %[[gep]], {{.*}}
	; CHECK-NEXT: %[[gep_dst:.]] = getelementptr inbounds i8, i8 %dst, i64 208			; CHECK-NEXT: %[[gep_dst:.]] = getelementptr inbounds i8, i8 %dst, i64 208
	; CHECK-NEXT: %[[gep_src:.]] = getelementptr inbounds [7 x i8], [7 x i8] %[[test3_a6]], i64 0, i64 0			; CHECK-NEXT: %[[gep_src:.]] = getelementptr inbounds [7 x i8], [7 x i8] %[[test3_a6]], i64 0, i64 0
	; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %[[gep_dst]], i8* align 1 %[[gep_src]], i32 7, {{.*}}), !tbaa [[TAG_59]]			; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %[[gep_dst]], i8* align 1 %[[gep_src]], i32 7, {{.*}})
	; CHECK-NEXT: %[[gep_dst:.]] = getelementptr inbounds i8, i8 %dst, i64 215			; CHECK-NEXT: %[[gep_dst:.]] = getelementptr inbounds i8, i8 %dst, i64 215
	; CHECK-NEXT: %[[gep_src:.]] = getelementptr inbounds [85 x i8], [85 x i8] %[[test3_a7]], i64 0, i64 0			; CHECK-NEXT: %[[gep_src:.]] = getelementptr inbounds [85 x i8], [85 x i8] %[[test3_a7]], i64 0, i64 0
	; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %[[gep_dst]], i8* align 1 %[[gep_src]], i32 85, {{.*}}), !tbaa [[TAG_59]]			; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %[[gep_dst]], i8* align 1 %[[gep_src]], i32 85, {{.*}})

	ret void			ret void
	}			}

	define void @test4(i8* %dst, i8* %src) {			define void @test4(i8* %dst, i8* %src) {
	; CHECK-LABEL: @test4(			; CHECK-LABEL: @test4(

	entry:			entry:
	%a = alloca [100 x i8]			%a = alloca [100 x i8]
	; CHECK-NOT: alloca			; CHECK-NOT: alloca
	; CHECK: %[[test4_a1:.*]] = alloca [20 x i8]			; CHECK: %[[test4_a1:.*]] = alloca [20 x i8]
	; CHECK-NEXT: %[[test4_a2:.*]] = alloca [7 x i8]			; CHECK-NEXT: %[[test4_a2:.*]] = alloca [7 x i8]
	; CHECK-NEXT: %[[test4_a3:.*]] = alloca [10 x i8]			; CHECK-NEXT: %[[test4_a3:.*]] = alloca [10 x i8]
	; CHECK-NEXT: %[[test4_a4:.*]] = alloca [7 x i8]			; CHECK-NEXT: %[[test4_a4:.*]] = alloca [7 x i8]
	; CHECK-NEXT: %[[test4_a5:.*]] = alloca [7 x i8]			; CHECK-NEXT: %[[test4_a5:.*]] = alloca [7 x i8]
	; CHECK-NEXT: %[[test4_a6:.*]] = alloca [40 x i8]			; CHECK-NEXT: %[[test4_a6:.*]] = alloca [40 x i8]

	%b = getelementptr [100 x i8], [100 x i8]* %a, i64 0, i64 0			%b = getelementptr [100 x i8], [100 x i8]* %a, i64 0, i64 0
	call void @llvm.memcpy.p0i8.p0i8.i32(i8* %b, i8* %src, i32 100, i1 false), !tbaa !0			call void @llvm.memcpy.p0i8.p0i8.i32(i8* %b, i8* %src, i32 100, i1 false), !tbaa !0
	; CHECK-NEXT: %[[gep:.*]] = getelementptr inbounds [20 x i8], [20 x i8]* %[[test4_a1]], i64 0, i64 0			; CHECK-NEXT: %[[gep:.*]] = getelementptr inbounds [20 x i8], [20 x i8]* %[[test4_a1]], i64 0, i64 0
	; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %[[gep]], i8* align 1 %src, i32 20, {{.*}}), !tbaa [[TAG_0]]			; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %[[gep]], i8* align 1 %src, i32 20, {{.*}}), !tbaa [[TAG_0]]
	; CHECK-NEXT: %[[gep:.*]] = getelementptr inbounds i8, i8* %src, i64 20			; CHECK-NEXT: %[[gep:.*]] = getelementptr inbounds i8, i8* %src, i64 20
	; CHECK-NEXT: %[[bitcast:.*]] = bitcast i8* %[[gep]] to i16*			; CHECK-NEXT: %[[bitcast:.*]] = bitcast i8* %[[gep]] to i16*
	; CHECK-NEXT: %[[test4_r1:.*]] = load i16, i16* %[[bitcast]], {{.*}}, !tbaa [[TAG_0]]			; CHECK-NEXT: %[[test4_r1:.*]] = load i16, i16* %[[bitcast]], {{.*}}, !tbaa [[TAG_0_M20:!.*]]
	; CHECK-NEXT: %[[gep:.*]] = getelementptr inbounds i8, i8* %src, i64 22			; CHECK-NEXT: %[[gep:.*]] = getelementptr inbounds i8, i8* %src, i64 22
	; CHECK-NEXT: %[[test4_r2:.*]] = load i8, i8* %[[gep]], {{.*}}, !tbaa [[TAG_0]]			; CHECK-NEXT: %[[test4_r2:.*]] = load i8, i8* %[[gep]], {{.*}}, !tbaa [[TAG_0_M22:!.*]]
	; CHECK-NEXT: %[[gep_src:.*]] = getelementptr inbounds i8, i8* %src, i64 23			; CHECK-NEXT: %[[gep_src:.*]] = getelementptr inbounds i8, i8* %src, i64 23
	; CHECK-NEXT: %[[gep_dst:.*]] = getelementptr inbounds [7 x i8], [7 x i8]* %[[test4_a2]], i64 0, i64 0			; CHECK-NEXT: %[[gep_dst:.*]] = getelementptr inbounds [7 x i8], [7 x i8]* %[[test4_a2]], i64 0, i64 0
	; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %[[gep_dst]], i8* align 1 %[[gep_src]], i32 7, {{.*}}), !tbaa [[TAG_0]]			; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %[[gep_dst]], i8* align 1 %[[gep_src]], i32 7, {{.*}}), !tbaa [[TAG_0_M23:!.*]]
	; CHECK-NEXT: %[[gep_src:.*]] = getelementptr inbounds i8, i8* %src, i64 30			; CHECK-NEXT: %[[gep_src:.*]] = getelementptr inbounds i8, i8* %src, i64 30
	; CHECK-NEXT: %[[gep_dst:.*]] = getelementptr inbounds [10 x i8], [10 x i8]* %[[test4_a3]], i64 0, i64 0			; CHECK-NEXT: %[[gep_dst:.*]] = getelementptr inbounds [10 x i8], [10 x i8]* %[[test4_a3]], i64 0, i64 0
	; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %[[gep_dst]], i8* align 1 %[[gep_src]], i32 10, {{.*}}), !tbaa [[TAG_0]]			; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %[[gep_dst]], i8* align 1 %[[gep_src]], i32 10, {{.*}}), !tbaa [[TAG_0_M30:!.*]]
	; CHECK-NEXT: %[[gep:.*]] = getelementptr inbounds i8, i8* %src, i64 40			; CHECK-NEXT: %[[gep:.*]] = getelementptr inbounds i8, i8* %src, i64 40
	; CHECK-NEXT: %[[bitcast:.*]] = bitcast i8* %[[gep]] to i16*			; CHECK-NEXT: %[[bitcast:.*]] = bitcast i8* %[[gep]] to i16*
	; CHECK-NEXT: %[[test4_r3:.*]] = load i16, i16* %[[bitcast]], {{.*}}, !tbaa [[TAG_0]]			; CHECK-NEXT: %[[test4_r3:.*]] = load i16, i16* %[[bitcast]], {{.*}}, !tbaa [[TAG_0_M40:!.*]]
	; CHECK-NEXT: %[[gep:.*]] = getelementptr inbounds i8, i8* %src, i64 42			; CHECK-NEXT: %[[gep:.*]] = getelementptr inbounds i8, i8* %src, i64 42
	; CHECK-NEXT: %[[test4_r4:.*]] = load i8, i8* %[[gep]], {{.*}}, !tbaa [[TAG_0]]			; CHECK-NEXT: %[[test4_r4:.*]] = load i8, i8* %[[gep]], {{.*}}, !tbaa [[TAG_0_M42]]
	; CHECK-NEXT: %[[gep_src:.*]] = getelementptr inbounds i8, i8* %src, i64 43			; CHECK-NEXT: %[[gep_src:.*]] = getelementptr inbounds i8, i8* %src, i64 43
	; CHECK-NEXT: %[[gep_dst:.*]] = getelementptr inbounds [7 x i8], [7 x i8]* %[[test4_a4]], i64 0, i64 0			; CHECK-NEXT: %[[gep_dst:.*]] = getelementptr inbounds [7 x i8], [7 x i8]* %[[test4_a4]], i64 0, i64 0
	; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %[[gep_dst]], i8* align 1 %[[gep_src]], i32 7, {{.*}}), !tbaa [[TAG_0]]			; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %[[gep_dst]], i8* align 1 %[[gep_src]], i32 7, {{.*}}), !tbaa [[TAG_0_M43]]
	; CHECK-NEXT: %[[gep:.*]] = getelementptr inbounds i8, i8* %src, i64 50			; CHECK-NEXT: %[[gep:.*]] = getelementptr inbounds i8, i8* %src, i64 50
	; CHECK-NEXT: %[[bitcast:.*]] = bitcast i8* %[[gep]] to i16*			; CHECK-NEXT: %[[bitcast:.*]] = bitcast i8* %[[gep]] to i16*
	; CHECK-NEXT: %[[test4_r5:.*]] = load i16, i16* %[[bitcast]], {{.*}}, !tbaa [[TAG_0]]			; CHECK-NEXT: %[[test4_r5:.*]] = load i16, i16* %[[bitcast]], {{.*}}, !tbaa [[TAG_0_M50:!.*]]
	; CHECK-NEXT: %[[gep:.*]] = getelementptr inbounds i8, i8* %src, i64 52			; CHECK-NEXT: %[[gep:.*]] = getelementptr inbounds i8, i8* %src, i64 52
	; CHECK-NEXT: %[[test4_r6:.*]] = load i8, i8* %[[gep]], {{.*}}, !tbaa [[TAG_0]]			; CHECK-NEXT: %[[test4_r6:.*]] = load i8, i8* %[[gep]], {{.*}}, !tbaa [[TAG_0_M52:!.*]]
	; CHECK-NEXT: %[[gep_src:.*]] = getelementptr inbounds i8, i8* %src, i64 53			; CHECK-NEXT: %[[gep_src:.*]] = getelementptr inbounds i8, i8* %src, i64 53
	; CHECK-NEXT: %[[gep_dst:.*]] = getelementptr inbounds [7 x i8], [7 x i8]* %[[test4_a5]], i64 0, i64 0			; CHECK-NEXT: %[[gep_dst:.*]] = getelementptr inbounds [7 x i8], [7 x i8]* %[[test4_a5]], i64 0, i64 0
	; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %[[gep_dst]], i8* align 1 %[[gep_src]], i32 7, {{.*}}), !tbaa [[TAG_0]]			; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %[[gep_dst]], i8* align 1 %[[gep_src]], i32 7, {{.*}}), !tbaa [[TAG_0_M53:!.+]]
	; CHECK-NEXT: %[[gep_src:.*]] = getelementptr inbounds i8, i8* %src, i64 60			; CHECK-NEXT: %[[gep_src:.*]] = getelementptr inbounds i8, i8* %src, i64 60
	; CHECK-NEXT: %[[gep_dst:.*]] = getelementptr inbounds [40 x i8], [40 x i8]* %[[test4_a6]], i64 0, i64 0			; CHECK-NEXT: %[[gep_dst:.*]] = getelementptr inbounds [40 x i8], [40 x i8]* %[[test4_a6]], i64 0, i64 0
	; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %[[gep_dst]], i8* align 1 %[[gep_src]], i32 40, {{.*}}), !tbaa [[TAG_0]]			; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %[[gep_dst]], i8* align 1 %[[gep_src]], i32 40, {{.*}}), !tbaa [[TAG_0_M60:!.+]]

	%a.src.1 = getelementptr [100 x i8], [100 x i8]* %a, i64 0, i64 20			%a.src.1 = getelementptr [100 x i8], [100 x i8]* %a, i64 0, i64 20
	%a.dst.1 = getelementptr [100 x i8], [100 x i8]* %a, i64 0, i64 40			%a.dst.1 = getelementptr [100 x i8], [100 x i8]* %a, i64 0, i64 40
	call void @llvm.memcpy.p0i8.p0i8.i32(i8* %a.dst.1, i8* %a.src.1, i32 10, i1 false), !tbaa !3			call void @llvm.memcpy.p0i8.p0i8.i32(i8* %a.dst.1, i8* %a.src.1, i32 10, i1 false), !tbaa !3
	; CHECK-NEXT: %[[gep_dst:.]] = getelementptr inbounds [7 x i8], [7 x i8] %[[test4_a4]], i64 0, i64 0			; CHECK-NEXT: %[[gep_dst:.]] = getelementptr inbounds [7 x i8], [7 x i8] %[[test4_a4]], i64 0, i64 0
	; CHECK-NEXT: %[[gep_src:.]] = getelementptr inbounds [7 x i8], [7 x i8] %[[test4_a2]], i64 0, i64 0			; CHECK-NEXT: %[[gep_src:.]] = getelementptr inbounds [7 x i8], [7 x i8] %[[test4_a2]], i64 0, i64 0
	; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %[[gep_dst]], i8* align 1 %[[gep_src]], i32 7, {{.*}}), !tbaa [[TAG_3]]			; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %[[gep_dst]], i8* align 1 %[[gep_src]], i32 7, {{.*}})

	; Clobber a single element of the array, this should be promotable, and be deleted.			; Clobber a single element of the array, this should be promotable, and be deleted.
	%c = getelementptr [100 x i8], [100 x i8]* %a, i64 0, i64 42			%c = getelementptr [100 x i8], [100 x i8]* %a, i64 0, i64 42
	store i8 0, i8* %c			store i8 0, i8* %c

	%a.src.2 = getelementptr [100 x i8], [100 x i8]* %a, i64 0, i64 50			%a.src.2 = getelementptr [100 x i8], [100 x i8]* %a, i64 0, i64 50
	call void @llvm.memmove.p0i8.p0i8.i32(i8* %a.dst.1, i8* %a.src.2, i32 10, i1 false), !tbaa !5			call void @llvm.memmove.p0i8.p0i8.i32(i8* %a.dst.1, i8* %a.src.2, i32 10, i1 false), !tbaa !5
	; CHECK-NEXT: %[[gep_dst:.]] = getelementptr inbounds [7 x i8], [7 x i8] %[[test4_a4]], i64 0, i64 0			; CHECK-NEXT: %[[gep_dst:.]] = getelementptr inbounds [7 x i8], [7 x i8] %[[test4_a4]], i64 0, i64 0
	; CHECK-NEXT: %[[gep_src:.]] = getelementptr inbounds [7 x i8], [7 x i8] %[[test4_a5]], i64 0, i64 0			; CHECK-NEXT: %[[gep_src:.]] = getelementptr inbounds [7 x i8], [7 x i8] %[[test4_a5]], i64 0, i64 0
	; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %[[gep_dst]], i8* align 1 %[[gep_src]], i32 7, {{.*}}), !tbaa [[TAG_5]]			; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %[[gep_dst]], i8* align 1 %[[gep_src]], i32 7, {{.*}})

	call void @llvm.memcpy.p0i8.p0i8.i32(i8* %dst, i8* %b, i32 100, i1 false), !tbaa !7			call void @llvm.memcpy.p0i8.p0i8.i32(i8* %dst, i8* %b, i32 100, i1 false), !tbaa !7
	; CHECK-NEXT: %[[gep:.]] = getelementptr inbounds [20 x i8], [20 x i8] %[[test4_a1]], i64 0, i64 0			; CHECK-NEXT: %[[gep:.]] = getelementptr inbounds [20 x i8], [20 x i8] %[[test4_a1]], i64 0, i64 0
	; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %dst, i8* align 1 %[[gep]], i32 20, {{.*}}), !tbaa [[TAG_7]]			; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %dst, i8* align 1 %[[gep]], i32 20, {{.*}}), !tbaa [[TAG_7]]
	; CHECK-NEXT: %[[gep:.]] = getelementptr inbounds i8, i8 %dst, i64 20			; CHECK-NEXT: %[[gep:.]] = getelementptr inbounds i8, i8 %dst, i64 20
	; CHECK-NEXT: %[[bitcast:.]] = bitcast i8 %[[gep]] to i16*			; CHECK-NEXT: %[[bitcast:.]] = bitcast i8 %[[gep]] to i16*
	; CHECK-NEXT: store i16 %[[test4_r1]], i16* %[[bitcast]], {{.*}}, !tbaa [[TAG_7]]			; CHECK-NEXT: store i16 %[[test4_r1]], i16* %[[bitcast]], {{.*}}
	; CHECK-NEXT: %[[gep:.]] = getelementptr inbounds i8, i8 %dst, i64 22			; CHECK-NEXT: %[[gep:.]] = getelementptr inbounds i8, i8 %dst, i64 22
	; CHECK-NEXT: store i8 %[[test4_r2]], i8* %[[gep]], {{.*}}, !tbaa [[TAG_7]]			; CHECK-NEXT: store i8 %[[test4_r2]], i8* %[[gep]], {{.*}}
	; CHECK-NEXT: %[[gep_dst:.]] = getelementptr inbounds i8, i8 %dst, i64 23			; CHECK-NEXT: %[[gep_dst:.]] = getelementptr inbounds i8, i8 %dst, i64 23
	; CHECK-NEXT: %[[gep_src:.]] = getelementptr inbounds [7 x i8], [7 x i8] %[[test4_a2]], i64 0, i64 0			; CHECK-NEXT: %[[gep_src:.]] = getelementptr inbounds [7 x i8], [7 x i8] %[[test4_a2]], i64 0, i64 0
	; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %[[gep_dst]], i8* align 1 %[[gep_src]], i32 7, {{.*}}), !tbaa [[TAG_7]]			; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %[[gep_dst]], i8* align 1 %[[gep_src]], i32 7, {{.*}})
	; CHECK-NEXT: %[[gep_dst:.]] = getelementptr inbounds i8, i8 %dst, i64 30			; CHECK-NEXT: %[[gep_dst:.]] = getelementptr inbounds i8, i8 %dst, i64 30
	; CHECK-NEXT: %[[gep_src:.]] = getelementptr inbounds [10 x i8], [10 x i8] %[[test4_a3]], i64 0, i64 0			; CHECK-NEXT: %[[gep_src:.]] = getelementptr inbounds [10 x i8], [10 x i8] %[[test4_a3]], i64 0, i64 0
	; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %[[gep_dst]], i8* align 1 %[[gep_src]], i32 10, {{.*}}), !tbaa [[TAG_7]]			; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %[[gep_dst]], i8* align 1 %[[gep_src]], i32 10, {{.*}})
	; CHECK-NEXT: %[[gep:.]] = getelementptr inbounds i8, i8 %dst, i64 40			; CHECK-NEXT: %[[gep:.]] = getelementptr inbounds i8, i8 %dst, i64 40
	; CHECK-NEXT: %[[bitcast:.]] = bitcast i8 %[[gep]] to i16*			; CHECK-NEXT: %[[bitcast:.]] = bitcast i8 %[[gep]] to i16*
	; CHECK-NEXT: store i16 %[[test4_r5]], i16* %[[bitcast]], {{.*}}, !tbaa [[TAG_7]]			; CHECK-NEXT: store i16 %[[test4_r5]], i16* %[[bitcast]], {{.*}}
	; CHECK-NEXT: %[[gep:.]] = getelementptr inbounds i8, i8 %dst, i64 42			; CHECK-NEXT: %[[gep:.]] = getelementptr inbounds i8, i8 %dst, i64 42
	; CHECK-NEXT: store i8 %[[test4_r6]], i8* %[[gep]], {{.*}}, !tbaa [[TAG_7]]			; CHECK-NEXT: store i8 %[[test4_r6]], i8* %[[gep]], {{.*}}
	; CHECK-NEXT: %[[gep_dst:.]] = getelementptr inbounds i8, i8 %dst, i64 43			; CHECK-NEXT: %[[gep_dst:.]] = getelementptr inbounds i8, i8 %dst, i64 43
	; CHECK-NEXT: %[[gep_src:.]] = getelementptr inbounds [7 x i8], [7 x i8] %[[test4_a4]], i64 0, i64 0			; CHECK-NEXT: %[[gep_src:.]] = getelementptr inbounds [7 x i8], [7 x i8] %[[test4_a4]], i64 0, i64 0
	; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %[[gep_dst]], i8* align 1 %[[gep_src]], i32 7, {{.*}}), !tbaa [[TAG_7]]			; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %[[gep_dst]], i8* align 1 %[[gep_src]], i32 7, {{.*}})
	; CHECK-NEXT: %[[gep:.]] = getelementptr inbounds i8, i8 %dst, i64 50			; CHECK-NEXT: %[[gep:.]] = getelementptr inbounds i8, i8 %dst, i64 50
	; CHECK-NEXT: %[[bitcast:.]] = bitcast i8 %[[gep]] to i16*			; CHECK-NEXT: %[[bitcast:.]] = bitcast i8 %[[gep]] to i16*
	; CHECK-NEXT: store i16 %[[test4_r5]], i16* %[[bitcast]], {{.*}}, !tbaa [[TAG_7]]			; CHECK-NEXT: store i16 %[[test4_r5]], i16* %[[bitcast]], {{.*}}
	; CHECK-NEXT: %[[gep:.]] = getelementptr inbounds i8, i8 %dst, i64 52			; CHECK-NEXT: %[[gep:.]] = getelementptr inbounds i8, i8 %dst, i64 52
	; CHECK-NEXT: store i8 %[[test4_r6]], i8* %[[gep]], {{.*}}, !tbaa [[TAG_7]]			; CHECK-NEXT: store i8 %[[test4_r6]], i8* %[[gep]], {{.*}}
	; CHECK-NEXT: %[[gep_dst:.]] = getelementptr inbounds i8, i8 %dst, i64 53			; CHECK-NEXT: %[[gep_dst:.]] = getelementptr inbounds i8, i8 %dst, i64 53
	; CHECK-NEXT: %[[gep_src:.]] = getelementptr inbounds [7 x i8], [7 x i8] %[[test4_a5]], i64 0, i64 0			; CHECK-NEXT: %[[gep_src:.]] = getelementptr inbounds [7 x i8], [7 x i8] %[[test4_a5]], i64 0, i64 0
	; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %[[gep_dst]], i8* align 1 %[[gep_src]], i32 7, {{.*}}), !tbaa [[TAG_7]]			; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %[[gep_dst]], i8* align 1 %[[gep_src]], i32 7, {{.*}})
	; CHECK-NEXT: %[[gep_dst:.]] = getelementptr inbounds i8, i8 %dst, i64 60			; CHECK-NEXT: %[[gep_dst:.]] = getelementptr inbounds i8, i8 %dst, i64 60
	; CHECK-NEXT: %[[gep_src:.]] = getelementptr inbounds [40 x i8], [40 x i8] %[[test4_a6]], i64 0, i64 0			; CHECK-NEXT: %[[gep_src:.]] = getelementptr inbounds [40 x i8], [40 x i8] %[[test4_a6]], i64 0, i64 0
	; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %[[gep_dst]], i8* align 1 %[[gep_src]], i32 40, {{.*}}), !tbaa [[TAG_7]]			; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %[[gep_dst]], i8* align 1 %[[gep_src]], i32 40, {{.*}})

	ret void			ret void
	}			}

	declare void @llvm.memcpy.p0i8.p0i8.i32(i8* nocapture, i8* nocapture, i32, i1) nounwind			declare void @llvm.memcpy.p0i8.p0i8.i32(i8* nocapture, i8* nocapture, i32, i1) nounwind
	declare void @llvm.memcpy.p1i8.p0i8.i32(i8 addrspace(1)* nocapture, i8* nocapture, i32, i1) nounwind			declare void @llvm.memcpy.p1i8.p0i8.i32(i8 addrspace(1)* nocapture, i8* nocapture, i32, i1) nounwind
	declare void @llvm.memmove.p0i8.p0i8.i32(i8* nocapture, i8* nocapture, i32, i1) nounwind			declare void @llvm.memmove.p0i8.p0i8.i32(i8* nocapture, i8* nocapture, i32, i1) nounwind
	declare void @llvm.memset.p0i8.i32(i8* nocapture, i8, i32, i1) nounwind			declare void @llvm.memset.p0i8.i32(i8* nocapture, i8, i32, i1) nounwind
	▲ Show 20 Lines • Show All 380 Lines • ▼ Show 20 Lines
	define void @test18(i8* %src, i8* %dst, i32 %size) {			define void @test18(i8* %src, i8* %dst, i32 %size) {
	; Preserve transfer intrinsics with a variable size, even if they overlap with			; Preserve transfer intrinsics with a variable size, even if they overlap with
	; fixed size operations. Further, continue to split and promote allocas preceding			; fixed size operations. Further, continue to split and promote allocas preceding
	; the variable sized intrinsic.			; the variable sized intrinsic.
	; CHECK-LABEL: @test18(			; CHECK-LABEL: @test18(
	; CHECK: %[[a:.*]] = alloca [34 x i8]			; CHECK: %[[a:.*]] = alloca [34 x i8]
	; CHECK: %[[srcgep1:.*]] = getelementptr inbounds i8, i8* %src, i64 4			; CHECK: %[[srcgep1:.*]] = getelementptr inbounds i8, i8* %src, i64 4
	; CHECK-NEXT: %[[srccast1:.*]] = bitcast i8* %[[srcgep1]] to i32*			; CHECK-NEXT: %[[srccast1:.*]] = bitcast i8* %[[srcgep1]] to i32*
	; CHECK-NEXT: %[[srcload:.*]] = load i32, i32* %[[srccast1]], {{.*}}, !tbaa [[TAG_0]]			; CHECK-NEXT: %[[srcload:.*]] = load i32, i32* %[[srccast1]], {{.*}}, !tbaa [[TAG_0_M4:!.*]]
	; CHECK-NEXT: %[[agep1:.*]] = getelementptr inbounds [34 x i8], [34 x i8]* %[[a]], i64 0, i64 0			; CHECK-NEXT: %[[agep1:.*]] = getelementptr inbounds [34 x i8], [34 x i8]* %[[a]], i64 0, i64 0
	; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %[[agep1]], i8* %src, i32 %size, {{.*}}), !tbaa [[TAG_3]]			; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* align 1 %[[agep1]], i8* %src, i32 %size, {{.*}}), !tbaa [[TAG_3]]
	; CHECK-NEXT: %[[agep2:.*]] = getelementptr inbounds [34 x i8], [34 x i8]* %[[a]], i64 0, i64 0			; CHECK-NEXT: %[[agep2:.*]] = getelementptr inbounds [34 x i8], [34 x i8]* %[[a]], i64 0, i64 0
	; CHECK-NEXT: call void @llvm.memset.p0i8.i32(i8* align 1 %[[agep2]], i8 42, i32 %size, {{.*}}), !tbaa [[TAG_5]]			; CHECK-NEXT: call void @llvm.memset.p0i8.i32(i8* align 1 %[[agep2]], i8 42, i32 %size, {{.*}}), !tbaa [[TAG_5]]
	; CHECK-NEXT: %[[dstcast1:.*]] = bitcast i8* %dst to i32*			; CHECK-NEXT: %[[dstcast1:.*]] = bitcast i8* %dst to i32*
	; CHECK-NEXT: store i32 42, i32* %[[dstcast1]], {{.*}}, !tbaa [[TAG_9]]			; CHECK-NEXT: store i32 42, i32* %[[dstcast1]], {{.*}}, !tbaa [[TAG_9]]
	; CHECK-NEXT: %[[dstgep1:.*]] = getelementptr inbounds i8, i8* %dst, i64 4			; CHECK-NEXT: %[[dstgep1:.*]] = getelementptr inbounds i8, i8* %dst, i64 4
	; CHECK-NEXT: %[[dstcast2:.*]] = bitcast i8* %[[dstgep1]] to i32*			; CHECK-NEXT: %[[dstcast2:.*]] = bitcast i8* %[[dstgep1]] to i32*
	; CHECK-NEXT: store i32 %[[srcload]], i32* %[[dstcast2]], {{.*}}, !tbaa [[TAG_9]]			; CHECK-NEXT: store i32 %[[srcload]], i32* %[[dstcast2]], {{.*}}
	; CHECK-NEXT: %[[agep3:.*]] = getelementptr inbounds [34 x i8], [34 x i8]* %[[a]], i64 0, i64 0			; CHECK-NEXT: %[[agep3:.*]] = getelementptr inbounds [34 x i8], [34 x i8]* %[[a]], i64 0, i64 0
	; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* %dst, i8* align 1 %[[agep3]], i32 %size, {{.*}}), !tbaa [[TAG_11]]			; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* %dst, i8* align 1 %[[agep3]], i32 %size, {{.*}}), !tbaa [[TAG_11]]
	; CHECK-NEXT: ret void			; CHECK-NEXT: ret void

	entry:			entry:
	%a = alloca [42 x i8]			%a = alloca [42 x i8]
	%ptr = getelementptr [42 x i8], [42 x i8]* %a, i32 0, i32 0			%ptr = getelementptr [42 x i8], [42 x i8]* %a, i32 0, i32 0
	call void @llvm.memcpy.p0i8.p0i8.i32(i8* %ptr, i8* %src, i32 8, i1 false), !tbaa !0			call void @llvm.memcpy.p0i8.p0i8.i32(i8* %ptr, i8* %src, i32 8, i1 false), !tbaa !0
	▲ Show 20 Lines • Show All 1,014 Lines • ▼ Show 20 Lines
	bb6:			bb6:
	br label %bb7			br label %bb7

	bb7:			bb7:
	call void @llvm.lifetime.end.isVoid.i64.p0i8(i64 40, [10 x float]* nonnull %ra)			call void @llvm.lifetime.end.isVoid.i64.p0i8(i64 40, [10 x float]* nonnull %ra)
	ret void			ret void
	}			}

	!0 = !{!1, !1, i64 0, i64 1}			!0 = !{!1, !1, i64 0, i64 200}
	!1 = !{!2, i64 1, !"type_0"}			!1 = !{!2, i64 1, !"type_0"}
	!2 = !{!"root"}			!2 = !{!"root"}
	!3 = !{!4, !4, i64 0, i64 1}			!3 = !{!4, !4, i64 0, i64 1}
	!4 = !{!2, i64 1, !"type_3"}			!4 = !{!2, i64 1, !"type_3"}
	!5 = !{!6, !6, i64 0, i64 1}			!5 = !{!6, !6, i64 0, i64 1}
	!6 = !{!2, i64 1, !"type_5"}			!6 = !{!2, i64 1, !"type_5"}
	!7 = !{!8, !8, i64 0, i64 1}			!7 = !{!8, !8, i64 0, i64 1}
	!8 = !{!2, i64 1, !"type_7"}			!8 = !{!2, i64 1, !"type_7"}
	▲ Show 20 Lines • Show All 45 Lines • ▼ Show 20 Lines
	!54 = !{!2, i64 1, !"type_53"}			!54 = !{!2, i64 1, !"type_53"}
	!55 = !{!56, !56, i64 0, i64 1}			!55 = !{!56, !56, i64 0, i64 1}
	!56 = !{!2, i64 1, !"type_55"}			!56 = !{!2, i64 1, !"type_55"}
	!57 = !{!58, !58, i64 0, i64 1}			!57 = !{!58, !58, i64 0, i64 1}
	!58 = !{!2, i64 1, !"type_57"}			!58 = !{!2, i64 1, !"type_57"}
	!59 = !{!60, !60, i64 0, i64 1}			!59 = !{!60, !60, i64 0, i64 1}
	!60 = !{!2, i64 1, !"type_59"}			!60 = !{!2, i64 1, !"type_59"}

	; CHECK-DAG: [[TYPE_0:!.*]] = !{{{.*}}, !"type_0"}			; CHECK-DAG: [[TAG_0]] = !{[[TYPE_0:!.*]], [[TYPE_0]], i64 0, i64 200}
	; CHECK-DAG: [[TAG_0]] = !{[[TYPE_0]], [[TYPE_0]], i64 0, i64 1}			; CHECK-DAG: [[TYPE_0]] = !{{{.*}}, !"type_0"}

				; CHECK-DAG: [[TAG_0_M42]] = !{[[TYPE_0]], [[TYPE_0]], i64 0, i64 158}
				; CHECK-DAG: [[TAG_0_M43]] = !{[[TYPE_0]], [[TYPE_0]], i64 0, i64 157}
				; CHECK-DAG: [[TAG_0_M142]] = !{[[TYPE_0]], [[TYPE_0]], i64 0, i64 58}
				; CHECK-DAG: [[TAG_0_M158]] = !{[[TYPE_0]], [[TYPE_0]], i64 0, i64 42}

				; CHECK-DAG: [[TAG_59]] = !{[[TYPE_59:!.*]], [[TYPE_59]], i64 0, i64 1}
				; CHECK-DAG: [[TYPE_59]] = !{{{.*}}, !"type_59"}

				; CHECK-DAG: [[TAG_0_M20]] = !{[[TYPE_0]], [[TYPE_0]], i64 0, i64 180}
				; CHECK-DAG: [[TAG_0_M22]] = !{[[TYPE_0]], [[TYPE_0]], i64 0, i64 178}
				; CHECK-DAG: [[TAG_0_M23]] = !{[[TYPE_0]], [[TYPE_0]], i64 0, i64 177}
				; CHECK-DAG: [[TAG_0_M30]] = !{[[TYPE_0]], [[TYPE_0]], i64 0, i64 170}
				; CHECK-DAG: [[TAG_0_M40]] = !{[[TYPE_0]], [[TYPE_0]], i64 0, i64 160}
				; CHECK-DAG: [[TAG_0_M50]] = !{[[TYPE_0]], [[TYPE_0]], i64 0, i64 150}
				; CHECK-DAG: [[TAG_0_M52]] = !{[[TYPE_0]], [[TYPE_0]], i64 0, i64 148}
				; CHECK-DAG: [[TAG_0_M53]] = !{[[TYPE_0]], [[TYPE_0]], i64 0, i64 147}
				; CHECK-DAG: [[TAG_0_M60]] = !{[[TYPE_0]], [[TYPE_0]], i64 0, i64 140}

				; CHECK-DAG: [[TYPE_7:!.*]] = !{{{.*}}, !"type_7"}
				; CHECK-DAG: [[TAG_7]] = !{[[TYPE_7]], [[TYPE_7]], i64 0, i64 1}

	; CHECK-DAG: [[TYPE_3:!.*]] = !{{{.*}}, !"type_3"}			; CHECK-DAG: [[TYPE_3:!.*]] = !{{{.*}}, !"type_3"}
	; CHECK-DAG: [[TAG_3]] = !{[[TYPE_3]], [[TYPE_3]], i64 0, i64 1}			; CHECK-DAG: [[TAG_3]] = !{[[TYPE_3]], [[TYPE_3]], i64 0, i64 1}

	; CHECK-DAG: [[TYPE_5:!.*]] = !{{{.*}}, !"type_5"}			; CHECK-DAG: [[TYPE_5:!.*]] = !{{{.*}}, !"type_5"}
	; CHECK-DAG: [[TAG_5]] = !{[[TYPE_5]], [[TYPE_5]], i64 0, i64 1}			; CHECK-DAG: [[TAG_5]] = !{[[TYPE_5]], [[TYPE_5]], i64 0, i64 1}
	; CHECK-DAG: [[TYPE_7:!.*]] = !{{{.*}}, !"type_7"}
	; CHECK-DAG: [[TAG_7]] = !{[[TYPE_7]], [[TYPE_7]], i64 0, i64 1}			; CHECK-DAG: [[TAG_0_M4]] = !{[[TYPE_0]], [[TYPE_0]], i64 0, i64 196}


	; CHECK-DAG: [[TYPE_9:!.*]] = !{{{.*}}, !"type_9"}			; CHECK-DAG: [[TYPE_9:!.*]] = !{{{.*}}, !"type_9"}
	; CHECK-DAG: [[TAG_9]] = !{[[TYPE_9]], [[TYPE_9]], i64 0, i64 1}			; CHECK-DAG: [[TAG_9]] = !{[[TYPE_9]], [[TYPE_9]], i64 0, i64 1}
	; CHECK-DAG: [[TYPE_11:!.*]] = !{{{.*}}, !"type_11"}			; CHECK-DAG: [[TYPE_11:!.*]] = !{{{.*}}, !"type_11"}
	; CHECK-DAG: [[TAG_11]] = !{[[TYPE_11]], [[TYPE_11]], i64 0, i64 1}			; CHECK-DAG: [[TAG_11]] = !{[[TYPE_11]], [[TYPE_11]], i64 0, i64 1}
	; CHECK-DAG: [[TYPE_13:!.*]] = !{{{.*}}, !"type_13"}			; CHECK-DAG: [[TYPE_13:!.*]] = !{{{.*}}, !"type_13"}
	; CHECK-DAG: [[TAG_13]] = !{[[TYPE_13]], [[TYPE_13]], i64 0, i64 1}			; CHECK-DAG: [[TAG_13]] = !{[[TYPE_13]], [[TYPE_13]], i64 0, i64 1}
	; CHECK-DAG: [[TYPE_15:!.*]] = !{{{.*}}, !"type_15"}			; CHECK-DAG: [[TYPE_15:!.*]] = !{{{.*}}, !"type_15"}
	; CHECK-DAG: [[TAG_15]] = !{[[TYPE_15]], [[TYPE_15]], i64 0, i64 1}			; CHECK-DAG: [[TAG_15]] = !{[[TYPE_15]], [[TYPE_15]], i64 0, i64 1}
	Show All 34 Lines
	; CHECK-DAG: [[TYPE_51:!.*]] = !{{{.*}}, !"type_51"}			; CHECK-DAG: [[TYPE_51:!.*]] = !{{{.*}}, !"type_51"}
	; CHECK-DAG: [[TAG_51]] = !{[[TYPE_51]], [[TYPE_51]], i64 0, i64 1}			; CHECK-DAG: [[TAG_51]] = !{[[TYPE_51]], [[TYPE_51]], i64 0, i64 1}
	; CHECK-DAG: [[TYPE_53:!.*]] = !{{{.*}}, !"type_53"}			; CHECK-DAG: [[TYPE_53:!.*]] = !{{{.*}}, !"type_53"}
	; CHECK-DAG: [[TAG_53]] = !{[[TYPE_53]], [[TYPE_53]], i64 0, i64 1}			; CHECK-DAG: [[TAG_53]] = !{[[TYPE_53]], [[TYPE_53]], i64 0, i64 1}
	; CHECK-DAG: [[TYPE_55:!.*]] = !{{{.*}}, !"type_55"}			; CHECK-DAG: [[TYPE_55:!.*]] = !{{{.*}}, !"type_55"}
	; CHECK-DAG: [[TAG_55]] = !{[[TYPE_55]], [[TYPE_55]], i64 0, i64 1}			; CHECK-DAG: [[TAG_55]] = !{[[TYPE_55]], [[TYPE_55]], i64 0, i64 1}
	; CHECK-DAG: [[TYPE_57:!.*]] = !{{{.*}}, !"type_57"}			; CHECK-DAG: [[TYPE_57:!.*]] = !{{{.*}}, !"type_57"}
	; CHECK-DAG: [[TAG_57]] = !{[[TYPE_57]], [[TYPE_57]], i64 0, i64 1}			; CHECK-DAG: [[TAG_57]] = !{[[TYPE_57]], [[TYPE_57]], i64 0, i64 1}
	; CHECK-DAG: [[TYPE_59:!.*]] = !{{{.*}}, !"type_59"}
	; CHECK-DAG: [[TAG_59]] = !{[[TYPE_59]], [[TYPE_59]], i64 0, i64 1}

llvm/test/Transforms/SROA/tbaa-struct2.ll

This file was added.

				; RUN: opt -S -sroa %s | FileCheck %s

				; SROA should correctly offset `!tbaa.struct` metadata

				%struct.Wishart = type { double, i32 }
				declare void @llvm.memcpy.p0i8.p0i8.i64(i8* writeonly, i8* readonly, i64, i1 immarg)
				declare double @subcall(double %g, i32 %m)

				; Test input for SROA: copies the %struct.Wishart pointed to by %wishart
				; into a stack temporary with one 16-byte memcpy tagged !tbaa.struct !2,
				; then loads both fields back out of the temporary and passes them to
				; @subcall, whose result is returned.
				define double @bar(%struct.Wishart* %wishart) {
				; Stack temporary for the struct. In the expected output only a 4-byte
				; slice (%tmp.sroa.3) of it remains as an alloca.
				%tmp = alloca %struct.Wishart, align 8
				; i8* views of the destination and source, as required by the memcpy
				; intrinsic signature.
				%tmpaddr = bitcast %struct.Wishart* %tmp to i8*
				%waddr = bitcast %struct.Wishart* %wishart to i8*
				; Whole-struct copy. !2 lists a double at offset 0 (size 8) and an int at
				; offset 8 (size 4); bytes 12..15 are not covered by any entry.
				call void @llvm.memcpy.p0i8.p0i8.i64(i8* align 8 %tmpaddr, i8* align 8 %waddr, i64 16, i1 false), !tbaa.struct !2
				; Field 0 (the double) read from the temporary.
				%gamma = getelementptr inbounds %struct.Wishart, %struct.Wishart* %tmp, i32 0, i32 0
				%lg = load double, double* %gamma, align 8, !tbaa !4
				; Field 1 (the i32) read from the temporary.
				%m = getelementptr inbounds %struct.Wishart, %struct.Wishart* %tmp, i32 0, i32 1
				%lm = load i32, i32* %m, align 8, !tbaa !8
				; Both loaded fields are consumed here, which keeps the loads live.
				%call = call double @subcall(double %lg, i32 %lm)
				ret double %call
				}

				!2 = !{i64 0, i64 8, !3, i64 8, i64 4, !7}
				!3 = !{!4, !4, i64 0}
				!4 = !{!"double", !5, i64 0}
				!5 = !{!"omnipotent char", !6, i64 0}
				!6 = !{!"Simple C++ TBAA"}
				!7 = !{!8, !8, i64 0}
				!8 = !{!"int", !5, i64 0}

				; CHECK: define double @bar(%struct.Wishart* %wishart) {
				; CHECK-NEXT: %tmp.sroa.3 = alloca [4 x i8], align 4
				; CHECK-NEXT: %tmp.sroa.0.0.waddr.sroa_idx = getelementptr inbounds %struct.Wishart, %struct.Wishart* %wishart, i64 0, i32 0
				; CHECK-NEXT: %tmp.sroa.0.0.copyload = load double, double* %tmp.sroa.0.0.waddr.sroa_idx, align 8, !tbaa.struct !0
				; CHECK-NEXT: %tmp.sroa.2.0.waddr.sroa_idx1 = getelementptr inbounds %struct.Wishart, %struct.Wishart* %wishart, i64 0, i32 1
				; CHECK-NEXT: %tmp.sroa.2.0.copyload = load i32, i32* %tmp.sroa.2.0.waddr.sroa_idx1, align 8, !tbaa.struct !7
				; CHECK-NEXT: %tmp.sroa.3.0.waddr.sroa_raw_cast = bitcast %struct.Wishart* %wishart to i8*
				; CHECK-NEXT: %tmp.sroa.3.0.waddr.sroa_raw_idx = getelementptr inbounds i8, i8* %tmp.sroa.3.0.waddr.sroa_raw_cast, i64 12
				; CHECK-NEXT: %tmp.sroa.3.0.tmpaddr.sroa_idx = getelementptr inbounds [4 x i8], [4 x i8]* %tmp.sroa.3, i64 0, i64 0
				; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i64(i8* align 4 %tmp.sroa.3.0.tmpaddr.sroa_idx, i8* align 4 %tmp.sroa.3.0.waddr.sroa_raw_idx, i64 4, i1 false), !tbaa.struct !8
				; CHECK-NEXT: %call = call double @subcall(double %tmp.sroa.0.0.copyload, i32 %tmp.sroa.2.0.copyload)
				; CHECK-NEXT: ret double %call
				; CHECK-NEXT: }

				; CHECK: !0 = !{i64 0, i64 8, !1, i64 8, i64 4, !5}
				; CHECK: !1 = !{!2, !2, i64 0}
				; CHECK: !2 = !{!"double", !{{[0-9]+}}, i64 0}

				; CHECK: !5 = !{!6, !6, i64 0}
				; CHECK: !6 = !{!"int", !{{[0-9]+}}, i64 0}
				; CHECK: !7 = !{i64 0, i64 4, !5}
				; CHECK: !8 = !{}
				No newline at end of file

This is an archive of the discontinued LLVM Phabricator instance.

[SROA] Propagate correct TBAA/TBAA Struct offsets
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 324333

llvm/include/llvm/IR/Metadata.h

llvm/include/llvm/IR/Operator.h

llvm/lib/Analysis/TypeBasedAliasAnalysis.cpp

llvm/lib/IR/Operator.cpp

llvm/lib/Transforms/Scalar/SROA.cpp

llvm/test/Transforms/SROA/basictest.ll

llvm/test/Transforms/SROA/tbaa-struct2.ll

This is an archive of the discontinued LLVM Phabricator instance.

[SROA] Propagate correct TBAA/TBAA Struct offsets (Closed, Public)

Details

Diff Detail

Event Timeline

Revision Contents

Diff 324333

llvm/include/llvm/IR/Metadata.h

llvm/include/llvm/IR/Operator.h

llvm/lib/Analysis/TypeBasedAliasAnalysis.cpp

llvm/lib/IR/Operator.cpp

llvm/lib/Transforms/Scalar/SROA.cpp

llvm/test/Transforms/SROA/basictest.ll

llvm/test/Transforms/SROA/tbaa-struct2.ll

[SROA] Propagate correct TBAA/TBAA Struct offsets
ClosedPublic