Diff 125359

llvm/lib/CodeGen/SelectionDAG/DAGCombiner.cpp

This file is larger than 256 KB, so syntax highlighting is disabled by default.

Show First 20 Lines • Show All 12,601 Lines • ▼ Show 20 Lines	if (IsConstantSrc) {
SDValue Val = St->getValue();		SDValue Val = St->getValue();
// If constant is of the wrong type, convert it now.		// If constant is of the wrong type, convert it now.
if (MemVT != Val.getValueType()) {		if (MemVT != Val.getValueType()) {
Val = peekThroughBitcast(Val);		Val = peekThroughBitcast(Val);
// Deal with constants of wrong size.		// Deal with constants of wrong size.
if (ElementSizeBits != Val.getValueSizeInBits()) {		if (ElementSizeBits != Val.getValueSizeInBits()) {
EVT IntMemVT =		EVT IntMemVT =
EVT::getIntegerVT(*DAG.getContext(), MemVT.getSizeInBits());		EVT::getIntegerVT(*DAG.getContext(), MemVT.getSizeInBits());
if (auto *CFP = dyn_cast<ConstantFPSDNode>(Val))		if (isa<ConstantFPSDNode>(Val)) {
Val = DAG.getConstant(		// Not clear how to truncate FP values.
CFP->getValueAPF().bitcastToAPInt().zextOrTrunc(		return false;
ElementSizeBits),		} else if (auto *C = dyn_cast<ConstantSDNode>(Val))
SDLoc(CFP), IntMemVT);		Val = DAG.getConstant(C->getAPIntValue()
else if (auto *C = dyn_cast<ConstantSDNode>(Val))		.zextOrTrunc(Val.getValueSizeInBits())
Val = DAG.getConstant(		.zextOrTrunc(ElementSizeBits),
C->getAPIntValue().zextOrTrunc(ElementSizeBits),
SDLoc(C), IntMemVT);		SDLoc(C), IntMemVT);
}		}
// Make sure correctly size type is the correct type.		// Make sure correctly size type is the correct type.
Val = DAG.getBitcast(MemVT, Val);		Val = DAG.getBitcast(MemVT, Val);
}		}
BuildVector.push_back(Val);		BuildVector.push_back(Val);
}		}
StoredVal = DAG.getNode(MemVT.isVector() ? ISD::CONCAT_VECTORS		StoredVal = DAG.getNode(MemVT.isVector() ? ISD::CONCAT_VECTORS
: ISD::BUILD_VECTOR,		: ISD::BUILD_VECTOR,
▲ Show 20 Lines • Show All 46 Lines • ▼ Show 20 Lines	if (UseVector) {
bool IsLE = DAG.getDataLayout().isLittleEndian();		bool IsLE = DAG.getDataLayout().isLittleEndian();
for (unsigned i = 0; i < NumStores; ++i) {		for (unsigned i = 0; i < NumStores; ++i) {
unsigned Idx = IsLE ? (NumStores - 1 - i) : i;		unsigned Idx = IsLE ? (NumStores - 1 - i) : i;
StoreSDNode *St = cast<StoreSDNode>(StoreNodes[Idx].MemNode);		StoreSDNode *St = cast<StoreSDNode>(StoreNodes[Idx].MemNode);

SDValue Val = St->getValue();		SDValue Val = St->getValue();
StoreInt <<= ElementSizeBits;		StoreInt <<= ElementSizeBits;
if (ConstantSDNode *C = dyn_cast<ConstantSDNode>(Val)) {		if (ConstantSDNode *C = dyn_cast<ConstantSDNode>(Val)) {
StoreInt \|= C->getAPIntValue().zextOrTrunc(SizeInBits);		StoreInt \|= C->getAPIntValue()
		.zextOrTrunc(ElementSizeBits)
		.zextOrTrunc(SizeInBits);
} else if (ConstantFPSDNode *C = dyn_cast<ConstantFPSDNode>(Val)) {		} else if (ConstantFPSDNode *C = dyn_cast<ConstantFPSDNode>(Val)) {
StoreInt \|= C->getValueAPF().bitcastToAPInt().zextOrTrunc(SizeInBits);		StoreInt \|= C->getValueAPF()
		.bitcastToAPInt()
		.zextOrTrunc(ElementSizeBits)
		.zextOrTrunc(SizeInBits);
		// If fp truncation is necessary give up for now.
		if (MemVT.getSizeInBits() != ElementSizeBits)
		return false;
} else {		} else {
llvm_unreachable("Invalid constant element type");		llvm_unreachable("Invalid constant element type");
}		}
}		}

// Create the new Load and Store operations.		// Create the new Load and Store operations.
StoredVal = DAG.getConstant(StoreInt, DL, StoreTy);		StoredVal = DAG.getConstant(StoreInt, DL, StoreTy);
}		}
▲ Show 20 Lines • Show All 4,822 Lines • Show Last 20 Lines

llvm/lib/Target/AArch64/AArch64ISelLowering.h

Show First 20 Lines • Show All 403 Lines • ▼ Show 20 Lines	public:
unsigned		unsigned
getExceptionSelectorRegister(const Constant *PersonalityFn) const override {		getExceptionSelectorRegister(const Constant *PersonalityFn) const override {
// FIXME: This is a guess. Has this been defined yet?		// FIXME: This is a guess. Has this been defined yet?
return AArch64::X1;		return AArch64::X1;
}		}

bool isIntDivCheap(EVT VT, AttributeList Attr) const override;		bool isIntDivCheap(EVT VT, AttributeList Attr) const override;

// Disable currently because of invalid merge.
bool mergeStoresAfterLegalization() const override { return false; }

bool canMergeStoresTo(unsigned AddressSpace, EVT MemVT,		bool canMergeStoresTo(unsigned AddressSpace, EVT MemVT,
const SelectionDAG &DAG) const override {		const SelectionDAG &DAG) const override {
// Do not merge to float value size (128 bytes) if no implicit		// Do not merge to float value size (128 bytes) if no implicit
// float attribute is set.		// float attribute is set.

bool NoFloat = DAG.getMachineFunction().getFunction()->hasFnAttribute(		bool NoFloat = DAG.getMachineFunction().getFunction()->hasFnAttribute(
Attribute::NoImplicitFloat);		Attribute::NoImplicitFloat);

▲ Show 20 Lines • Show All 239 Lines • Show Last 20 Lines

llvm/lib/Target/ARM/ARMISelLowering.h

Show First 20 Lines • Show All 526 Lines • ▼ Show 20 Lines	public:
shouldExpandAtomicRMWInIR(AtomicRMWInst *AI) const override;		shouldExpandAtomicRMWInIR(AtomicRMWInst *AI) const override;
bool shouldExpandAtomicCmpXchgInIR(AtomicCmpXchgInst *AI) const override;		bool shouldExpandAtomicCmpXchgInIR(AtomicCmpXchgInst *AI) const override;

bool useLoadStackGuardNode() const override;		bool useLoadStackGuardNode() const override;

bool canCombineStoreAndExtract(Type VectorTy, Value Idx,		bool canCombineStoreAndExtract(Type VectorTy, Value Idx,
unsigned &Cost) const override;		unsigned &Cost) const override;

// Disable currently because of invalid merge.
bool mergeStoresAfterLegalization() const override { return false; }

bool canMergeStoresTo(unsigned AddressSpace, EVT MemVT,		bool canMergeStoresTo(unsigned AddressSpace, EVT MemVT,
const SelectionDAG &DAG) const override {		const SelectionDAG &DAG) const override {
// Do not merge to larger than i32.		// Do not merge to larger than i32.
return (MemVT.getSizeInBits() <= 32);		return (MemVT.getSizeInBits() <= 32);
}		}

bool isCheapToSpeculateCttz() const override;		bool isCheapToSpeculateCttz() const override;
bool isCheapToSpeculateCtlz() const override;		bool isCheapToSpeculateCtlz() const override;
▲ Show 20 Lines • Show All 251 Lines • Show Last 20 Lines

llvm/test/CodeGen/AArch64/arm64-complex-ret.ll

	; RUN: llc -mtriple=arm64-eabi -o - %s \| FileCheck %s			; RUN: llc -mtriple=arm64-eabi -o - %s \| FileCheck %s

	define { i192, i192, i21, i192 } @foo(i192) {			define { i192, i192, i21, i192 } @foo(i192) {
	; CHECK-LABEL: foo:			; CHECK-LABEL: foo:
	; CHECK: stp xzr, xzr, [x8]			; CHECK-DAG: str xzr, [x8, #16]
				; CHECK-DAG: str q0, [x8]
	ret { i192, i192, i21, i192 } {i192 0, i192 1, i21 2, i192 3}			ret { i192, i192, i21, i192 } {i192 0, i192 1, i21 2, i192 3}
	}			}

llvm/test/CodeGen/AArch64/arm64-narrow-st-merge.ll

Show All 13 Lines	entry:
%add = add nsw i32 %n, 1		%add = add nsw i32 %n, 1
%idxprom1 = sext i32 %add to i64		%idxprom1 = sext i32 %add to i64
%arrayidx2 = getelementptr inbounds i16, i16* %P, i64 %idxprom1		%arrayidx2 = getelementptr inbounds i16, i16* %P, i64 %idxprom1
store i16 0, i16* %arrayidx2		store i16 0, i16* %arrayidx2
ret void		ret void
}		}

; CHECK-LABEL: Strh_zero_4		; CHECK-LABEL: Strh_zero_4
; CHECK: stp wzr, wzr		; CHECK: str xzr
; CHECK-STRICT-LABEL: Strh_zero_4		; CHECK-STRICT-LABEL: Strh_zero_4
; CHECK-STRICT: strh wzr		; CHECK-STRICT: strh wzr
; CHECK-STRICT: strh wzr		; CHECK-STRICT: strh wzr
; CHECK-STRICT: strh wzr		; CHECK-STRICT: strh wzr
; CHECK-STRICT: strh wzr		; CHECK-STRICT: strh wzr
define void @Strh_zero_4(i16* nocapture %P, i32 %n) {		define void @Strh_zero_4(i16* nocapture %P, i32 %n) {
entry:		entry:
%idxprom = sext i32 %n to i64		%idxprom = sext i32 %n to i64
▲ Show 20 Lines • Show All 101 Lines • ▼ Show 20 Lines	entry:
%sub1 = add nsw i32 %n, -3		%sub1 = add nsw i32 %n, -3
%idxprom2 = sext i32 %sub1 to i64		%idxprom2 = sext i32 %sub1 to i64
%arrayidx3 = getelementptr inbounds i16, i16* %P, i64 %idxprom2		%arrayidx3 = getelementptr inbounds i16, i16* %P, i64 %idxprom2
store i16 0, i16* %arrayidx3		store i16 0, i16* %arrayidx3
ret void		ret void
}		}

; CHECK-LABEL: Sturh_zero_4		; CHECK-LABEL: Sturh_zero_4
; CHECK: stp wzr, wzr		; CHECK: stur xzr
; CHECK-STRICT-LABEL: Sturh_zero_4		; CHECK-STRICT-LABEL: Sturh_zero_4
; CHECK-STRICT: sturh wzr		; CHECK-STRICT: sturh wzr
; CHECK-STRICT: sturh wzr		; CHECK-STRICT: sturh wzr
; CHECK-STRICT: sturh wzr		; CHECK-STRICT: sturh wzr
; CHECK-STRICT: sturh wzr		; CHECK-STRICT: sturh wzr
define void @Sturh_zero_4(i16* nocapture %P, i32 %n) {		define void @Sturh_zero_4(i16* nocapture %P, i32 %n) {
entry:		entry:
%sub = add nsw i32 %n, -3		%sub = add nsw i32 %n, -3
▲ Show 20 Lines • Show All 61 Lines • Show Last 20 Lines

llvm/test/CodeGen/AArch64/arm64-variadic-aapcs.ll

	Show All 26 Lines
	; CHECK: add [[GR_TOPTMP:x[0-9]+]], sp, #[[GR_BASE]]			; CHECK: add [[GR_TOPTMP:x[0-9]+]], sp, #[[GR_BASE]]
	; CHECK: add [[GR_TOP:x[0-9]+]], [[GR_TOPTMP]], #56			; CHECK: add [[GR_TOP:x[0-9]+]], [[GR_TOPTMP]], #56
	; CHECK: str [[GR_TOP]], [x[[VA_LIST]], #8]			; CHECK: str [[GR_TOP]], [x[[VA_LIST]], #8]

	; CHECK: mov [[VR_TOPTMP:x[0-9]+]], sp			; CHECK: mov [[VR_TOPTMP:x[0-9]+]], sp
	; CHECK: add [[VR_TOP:x[0-9]+]], [[VR_TOPTMP]], #128			; CHECK: add [[VR_TOP:x[0-9]+]], [[VR_TOPTMP]], #128
	; CHECK: str [[VR_TOP]], [x[[VA_LIST]], #16]			; CHECK: str [[VR_TOP]], [x[[VA_LIST]], #16]

	; CHECK: mov [[GR_OFFS:w[0-9]+]], #-56			; CHECK: mov [[GRVR:x[0-9]+]], #-545460846720
	; CHECK: str [[GR_OFFS]], [x[[VA_LIST]], #24]			; CHECK: movk [[GRVR]], #65480
				; CHECK: str [[GRVR]], [x[[VA_LIST]], #24]
	; CHECK: orr [[VR_OFFS:w[0-9]+]], wzr, #0xffffff80
	; CHECK: str [[VR_OFFS]], [x[[VA_LIST]], #28]

	%addr = bitcast %va_list* @var to i8*			%addr = bitcast %va_list* @var to i8*
	call void @llvm.va_start(i8* %addr)			call void @llvm.va_start(i8* %addr)

	ret void			ret void
	}			}

	define void @test_fewargs(i32 %n, i32 %n1, i32 %n2, float %m, ...) {			define void @test_fewargs(i32 %n, i32 %n1, i32 %n2, float %m, ...) {
	Show All 17 Lines
	; CHECK: add [[GR_TOPTMP:x[0-9]+]], sp, #[[GR_BASE]]			; CHECK: add [[GR_TOPTMP:x[0-9]+]], sp, #[[GR_BASE]]
	; CHECK: add [[GR_TOP:x[0-9]+]], [[GR_TOPTMP]], #40			; CHECK: add [[GR_TOP:x[0-9]+]], [[GR_TOPTMP]], #40
	; CHECK: str [[GR_TOP]], [x[[VA_LIST]], #8]			; CHECK: str [[GR_TOP]], [x[[VA_LIST]], #8]

	; CHECK: mov [[VR_TOPTMP:x[0-9]+]], sp			; CHECK: mov [[VR_TOPTMP:x[0-9]+]], sp
	; CHECK: add [[VR_TOP:x[0-9]+]], [[VR_TOPTMP]], #112			; CHECK: add [[VR_TOP:x[0-9]+]], [[VR_TOPTMP]], #112
	; CHECK: str [[VR_TOP]], [x[[VA_LIST]], #16]			; CHECK: str [[VR_TOP]], [x[[VA_LIST]], #16]

	; CHECK: mov [[GR_OFFS:w[0-9]+]], #-40			; CHECK: mov [[GRVR_OFFS:x[0-9]+]], #-40
	; CHECK: str [[GR_OFFS]], [x[[VA_LIST]], #24]			; CHECK: movk [[GRVR_OFFS]], #65424, lsl #32
				; CHECK: str [[GRVR_OFFS]], [x[[VA_LIST]], #24]
	; CHECK: mov [[VR_OFFS:w[0-9]+]], #-11
	; CHECK: str [[VR_OFFS]], [x[[VA_LIST]], #28]

	%addr = bitcast %va_list* @var to i8*			%addr = bitcast %va_list* @var to i8*
	call void @llvm.va_start(i8* %addr)			call void @llvm.va_start(i8* %addr)

	ret void			ret void
	}			}

	define void @test_nospare([8 x i64], [8 x float], ...) {			define void @test_nospare([8 x i64], [8 x float], ...) {
	▲ Show 20 Lines • Show All 60 Lines • Show Last 20 Lines

llvm/test/CodeGen/AArch64/tailcall-explicit-sret.ll

Show All 29 Lines
; CHECK: ret		; CHECK: ret
define void @test_tailcall_explicit_sret_alloca_unused() #0 {		define void @test_tailcall_explicit_sret_alloca_unused() #0 {
%l = alloca i1024, align 8		%l = alloca i1024, align 8
tail call void @test_explicit_sret(i1024* %l)		tail call void @test_explicit_sret(i1024* %l)
ret void		ret void
}		}

; CHECK-LABEL: _test_tailcall_explicit_sret_alloca_dummyusers:		; CHECK-LABEL: _test_tailcall_explicit_sret_alloca_dummyusers:
; CHECK: ldr [[PTRLOAD1:x[0-9]+]], [x0]		; CHECK: ldr [[PTRLOAD1:q[0-9]+]], [x0]
; CHECK: str [[PTRLOAD1]], [sp]		; CHECK: str [[PTRLOAD1]], [sp]
; CHECK: mov x8, sp		; CHECK: mov x8, sp
; CHECK-NEXT: bl _test_explicit_sret		; CHECK-NEXT: bl _test_explicit_sret
; CHECK: ret		; CHECK: ret
define void @test_tailcall_explicit_sret_alloca_dummyusers(i1024* %ptr) #0 {		define void @test_tailcall_explicit_sret_alloca_dummyusers(i1024* %ptr) #0 {
%l = alloca i1024, align 8		%l = alloca i1024, align 8
%r = load i1024, i1024* %ptr, align 8		%r = load i1024, i1024* %ptr, align 8
store i1024 %r, i1024* %l, align 8		store i1024 %r, i1024* %l, align 8
Show All 12 Lines	define void @test_tailcall_explicit_sret_gep(i1024* %ptr) #0 {
tail call void @test_explicit_sret(i1024* %ptr2)		tail call void @test_explicit_sret(i1024* %ptr2)
ret void		ret void
}		}

; CHECK-LABEL: _test_tailcall_explicit_sret_alloca_returned:		; CHECK-LABEL: _test_tailcall_explicit_sret_alloca_returned:
; CHECK: mov x[[CALLERX8NUM:[0-9]+]], x8		; CHECK: mov x[[CALLERX8NUM:[0-9]+]], x8
; CHECK: mov x8, sp		; CHECK: mov x8, sp
; CHECK-NEXT: bl _test_explicit_sret		; CHECK-NEXT: bl _test_explicit_sret
; CHECK-NEXT: ldr [[CALLERSRET1:x[0-9]+]], [sp]		; CHECK-NEXT: ldr [[CALLERSRET1:q[0-9]+]], [sp]
; CHECK: str [[CALLERSRET1:x[0-9]+]], [x[[CALLERX8NUM]]]		; CHECK: str [[CALLERSRET1:q[0-9]+]], [x[[CALLERX8NUM]]]
; CHECK: ret		; CHECK: ret
define i1024 @test_tailcall_explicit_sret_alloca_returned() #0 {		define i1024 @test_tailcall_explicit_sret_alloca_returned() #0 {
%l = alloca i1024, align 8		%l = alloca i1024, align 8
tail call void @test_explicit_sret(i1024* %l)		tail call void @test_explicit_sret(i1024* %l)
%r = load i1024, i1024* %l, align 8		%r = load i1024, i1024* %l, align 8
ret i1024 %r		ret i1024 %r
}		}

; CHECK-LABEL: _test_indirect_tailcall_explicit_sret_nosret_arg:		; CHECK-LABEL: _test_indirect_tailcall_explicit_sret_nosret_arg:
; CHECK-DAG: mov x[[CALLERX8NUM:[0-9]+]], x8		; CHECK-DAG: mov x[[CALLERX8NUM:[0-9]+]], x8
; CHECK-DAG: mov [[FPTR:x[0-9]+]], x0		; CHECK-DAG: mov [[FPTR:x[0-9]+]], x0
; CHECK: mov x0, sp		; CHECK: mov x0, sp
; CHECK-NEXT: blr [[FPTR]]		; CHECK-NEXT: blr [[FPTR]]
; CHECK-NEXT: ldr [[CALLERSRET1:x[0-9]+]], [sp]		; CHECK: ldr [[CALLERSRET1:q[0-9]+]], [sp]
; CHECK: str [[CALLERSRET1:x[0-9]+]], [x[[CALLERX8NUM]]]		; CHECK: str [[CALLERSRET1:q[0-9]+]], [x[[CALLERX8NUM]]]
; CHECK: ret		; CHECK: ret
define void @test_indirect_tailcall_explicit_sret_nosret_arg(i1024* sret %arg, void (i1024) %f) #0 {		define void @test_indirect_tailcall_explicit_sret_nosret_arg(i1024* sret %arg, void (i1024) %f) #0 {
%l = alloca i1024, align 8		%l = alloca i1024, align 8
tail call void %f(i1024* %l)		tail call void %f(i1024* %l)
%r = load i1024, i1024* %l, align 8		%r = load i1024, i1024* %l, align 8
store i1024 %r, i1024* %arg, align 8		store i1024 %r, i1024* %arg, align 8
ret void		ret void
}		}

; CHECK-LABEL: _test_indirect_tailcall_explicit_sret_:		; CHECK-LABEL: _test_indirect_tailcall_explicit_sret_:
; CHECK: mov x[[CALLERX8NUM:[0-9]+]], x8		; CHECK: mov x[[CALLERX8NUM:[0-9]+]], x8
; CHECK: mov x8, sp		; CHECK: mov x8, sp
; CHECK-NEXT: blr x0		; CHECK-NEXT: blr x0
; CHECK-NEXT: ldr [[CALLERSRET1:x[0-9]+]], [sp]		; CHECK: ldr [[CALLERSRET1:q[0-9]+]], [sp]
; CHECK: str [[CALLERSRET1:x[0-9]+]], [x[[CALLERX8NUM]]]		; CHECK: str [[CALLERSRET1:q[0-9]+]], [x[[CALLERX8NUM]]]
; CHECK: ret		; CHECK: ret
define void @test_indirect_tailcall_explicit_sret_(i1024* sret %arg, i1024 ()* %f) #0 {		define void @test_indirect_tailcall_explicit_sret_(i1024* sret %arg, i1024 ()* %f) #0 {
%ret = tail call i1024 %f()		%ret = tail call i1024 %f()
store i1024 %ret, i1024* %arg, align 8		store i1024 %ret, i1024* %arg, align 8
ret void		ret void
}		}

attributes #0 = { nounwind }		attributes #0 = { nounwind }

llvm/test/CodeGen/AArch64/tailcall-implicit-sret.ll

	; RUN: llc < %s -mtriple arm64-apple-darwin -aarch64-enable-ldst-opt=false -disable-post-ra -asm-verbose=false \| FileCheck %s			; RUN: llc < %s -mtriple arm64-apple-darwin -aarch64-enable-ldst-opt=false -disable-post-ra -asm-verbose=false \| FileCheck %s
	; Disable the load/store optimizer to avoid having LDP/STPs and simplify checks.			; Disable the load/store optimizer to avoid having LDP/STPs and simplify checks.

	target datalayout = "e-m:o-i64:64-i128:128-n32:64-S128"			target datalayout = "e-m:o-i64:64-i128:128-n32:64-S128"

	; Check that we don't try to tail-call with an sret-demoted return.			; Check that we don't try to tail-call with an sret-demoted return.

	declare i1024 @test_sret() #0			declare i1024 @test_sret() #0

	; CHECK-LABEL: _test_call_sret:			; CHECK-LABEL: _test_call_sret:
	; CHECK: mov x[[CALLERX8NUM:[0-9]+]], x8			; CHECK: mov x[[CALLERX8NUM:[0-9]+]], x8
	; CHECK: mov x8, sp			; CHECK: mov x8, sp
	; CHECK-NEXT: bl _test_sret			; CHECK-NEXT: bl _test_sret
	; CHECK-NEXT: ldr [[CALLERSRET1:x[0-9]+]], [sp]			; CHECK: ldr [[CALLERSRET1:q[0-9]+]], [sp]
	; CHECK: str [[CALLERSRET1:x[0-9]+]], [x[[CALLERX8NUM]]]			; CHECK: str [[CALLERSRET1:q[0-9]+]], [x[[CALLERX8NUM]]]
	; CHECK: ret			; CHECK: ret
	define i1024 @test_call_sret() #0 {			define i1024 @test_call_sret() #0 {
	%a = call i1024 @test_sret()			%a = call i1024 @test_sret()
	ret i1024 %a			ret i1024 %a
	}			}

	; CHECK-LABEL: _test_tailcall_sret:			; CHECK-LABEL: _test_tailcall_sret:
	; CHECK: mov x[[CALLERX8NUM:[0-9]+]], x8			; CHECK: mov x[[CALLERX8NUM:[0-9]+]], x8
	; CHECK: mov x8, sp			; CHECK: mov x8, sp
	; CHECK-NEXT: bl _test_sret			; CHECK-NEXT: bl _test_sret
	; CHECK-NEXT: ldr [[CALLERSRET1:x[0-9]+]], [sp]			; CHECK: ldr [[CALLERSRET1:q[0-9]+]], [sp]
	; CHECK: str [[CALLERSRET1:x[0-9]+]], [x[[CALLERX8NUM]]]			; CHECK: str [[CALLERSRET1:q[0-9]+]], [x[[CALLERX8NUM]]]
	; CHECK: ret			; CHECK: ret
	define i1024 @test_tailcall_sret() #0 {			define i1024 @test_tailcall_sret() #0 {
	%a = tail call i1024 @test_sret()			%a = tail call i1024 @test_sret()
	ret i1024 %a			ret i1024 %a
	}			}

	; CHECK-LABEL: _test_indirect_tailcall_sret:			; CHECK-LABEL: _test_indirect_tailcall_sret:
	; CHECK: mov x[[CALLERX8NUM:[0-9]+]], x8			; CHECK: mov x[[CALLERX8NUM:[0-9]+]], x8
	; CHECK: mov x8, sp			; CHECK: mov x8, sp
	; CHECK-NEXT: blr x0			; CHECK-NEXT: blr x0
	; CHECK-NEXT: ldr [[CALLERSRET1:x[0-9]+]], [sp]			; CHECK: ldr [[CALLERSRET1:q[0-9]+]], [sp]
	; CHECK: str [[CALLERSRET1:x[0-9]+]], [x[[CALLERX8NUM]]]			; CHECK: str [[CALLERSRET1:q[0-9]+]], [x[[CALLERX8NUM]]]
	; CHECK: ret			; CHECK: ret
	define i1024 @test_indirect_tailcall_sret(i1024 ()* %f) #0 {			define i1024 @test_indirect_tailcall_sret(i1024 ()* %f) #0 {
	%a = tail call i1024 %f()			%a = tail call i1024 %f()
	ret i1024 %a			ret i1024 %a
	}			}

	attributes #0 = { nounwind }			attributes #0 = { nounwind }

llvm/test/CodeGen/ARM/arm-storebytesmerge.ll

This file was added.

				; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
				; RUN: llc -mtriple=arm-eabi -mattr=+neon %s -o - \| FileCheck %s

				target datalayout = "e-m:e-p:32:32-i64:64-v128:64:128-a:0:32-n32-S64"
				target triple = "thumbv7em-arm-none-eabi"

				; Function Attrs: nounwind
				define arm_aapcs_vfpcc void @test(i8* %v50) #0 {
				; CHECK-LABEL: test:
				; CHECK: @ BB#0:
				; CHECK-NEXT: movw r1, #35722
				; CHECK-NEXT: movt r1, #36236
				; CHECK-NEXT: str.w r1, [r0, #394]
				; CHECK-NEXT: movw r1, #36750
				; CHECK-NEXT: movt r1, #37264
				; CHECK-NEXT: str.w r1, [r0, #398]
				; CHECK-NEXT: movw r1, #37778
				; CHECK-NEXT: movt r1, #38292
				; CHECK-NEXT: str.w r1, [r0, #402]
				; CHECK-NEXT: movw r1, #38806
				; CHECK-NEXT: movt r1, #39320
				; CHECK-NEXT: str.w r1, [r0, #406]
				; CHECK-NEXT: movw r1, #39834
				; CHECK-NEXT: strh.w r1, [r0, #410]
				; CHECK-NEXT: movw r1, #40348
				; CHECK-NEXT: movt r1, #40862
				; CHECK-NEXT: str.w r1, [r0, #412]
				; CHECK-NEXT: movw r1, #41376
				; CHECK-NEXT: movt r1, #41890
				; CHECK-NEXT: str.w r1, [r0, #416]
				; CHECK-NEXT: movw r1, #42404
				; CHECK-NEXT: movt r1, #42918
				; CHECK-NEXT: str.w r1, [r0, #420]
				; CHECK-NEXT: movw r1, #43432
				; CHECK-NEXT: movt r1, #43946
				; CHECK-NEXT: str.w r1, [r0, #424]
				; CHECK-NEXT: movw r1, #44460
				; CHECK-NEXT: movt r1, #44974
				; CHECK-NEXT: str.w r1, [r0, #428]
				; CHECK-NEXT: movw r1, #45488
				; CHECK-NEXT: strh.w r1, [r0, #432]
				; CHECK-NEXT: movw r1, #46002
				; CHECK-NEXT: movt r1, #46516
				; CHECK-NEXT: str.w r1, [r0, #434]
				; CHECK-NEXT: movw r1, #47030
				; CHECK-NEXT: strh.w r1, [r0, #438]
				; CHECK-NEXT: movw r1, #47544
				; CHECK-NEXT: movt r1, #48058
				; CHECK-NEXT: str.w r1, [r0, #440]
				; CHECK-NEXT: movw r1, #48572
				; CHECK-NEXT: movt r1, #49086
				; CHECK-NEXT: str.w r1, [r0, #444]
				; CHECK-NEXT: movw r1, #49600
				; CHECK-NEXT: strh.w r1, [r0, #448]
				; CHECK-NEXT: movs r1, #194
				; CHECK-NEXT: strb.w r1, [r0, #450]
				; CHECK-NEXT: movw r1, #50371
				; CHECK-NEXT: movt r1, #50885
				; CHECK-NEXT: str.w r1, [r0, #451]
				; CHECK-NEXT: movw r1, #51399
				; CHECK-NEXT: movt r1, #51913
				; CHECK-NEXT: str.w r1, [r0, #455]
				; CHECK-NEXT: movw r1, #52427
				; CHECK-NEXT: movt r1, #52941
				; CHECK-NEXT: str.w r1, [r0, #459]
				; CHECK-NEXT: movw r1, #53455
				; CHECK-NEXT: movt r1, #53969
				; CHECK-NEXT: str.w r1, [r0, #463]
				; CHECK-NEXT: movw r1, #54483
				; CHECK-NEXT: strh.w r1, [r0, #467]
				; CHECK-NEXT: movw r1, #54997
				; CHECK-NEXT: movt r1, #55511
				; CHECK-NEXT: str.w r1, [r0, #469]
				; CHECK-NEXT: movw r1, #56025
				; CHECK-NEXT: movt r1, #56539
				; CHECK-NEXT: str.w r1, [r0, #473]
				; CHECK-NEXT: movw r1, #57053
				; CHECK-NEXT: movt r1, #57567
				; CHECK-NEXT: str.w r1, [r0, #477]
				; CHECK-NEXT: movw r1, #58081
				; CHECK-NEXT: movt r1, #58595
				; CHECK-NEXT: str.w r1, [r0, #481]
				; CHECK-NEXT: movw r1, #59109
				; CHECK-NEXT: movt r1, #59623
				; CHECK-NEXT: str.w r1, [r0, #485]
				; CHECK-NEXT: movw r1, #60137
				; CHECK-NEXT: strh.w r1, [r0, #489]
				; CHECK-NEXT: movw r1, #60651
				; CHECK-NEXT: movt r1, #61165
				; CHECK-NEXT: str.w r1, [r0, #491]
				; CHECK-NEXT: movw r1, #61679
				; CHECK-NEXT: strh.w r1, [r0, #495]
				; CHECK-NEXT: movw r1, #62193
				; CHECK-NEXT: movt r1, #62707
				; CHECK-NEXT: str.w r1, [r0, #497]
				; CHECK-NEXT: movw r1, #63221
				; CHECK-NEXT: movt r1, #63735
				; CHECK-NEXT: str.w r1, [r0, #501]
				; CHECK-NEXT: movw r1, #64249
				; CHECK-NEXT: strh.w r1, [r0, #505]
				; CHECK-NEXT: movs r1, #251
				; CHECK-NEXT: strb.w r1, [r0, #507]
				; CHECK-NEXT: movw r1, #65020
				; CHECK-NEXT: movt r1, #65534
				; CHECK-NEXT: str.w r1, [r0, #508]
				; CHECK-NEXT: bx lr
				%v190 = getelementptr inbounds i8, i8* %v50, i32 394
				store i8 -118, i8* %v190, align 1
				%v191 = getelementptr inbounds i8, i8* %v50, i32 395
				store i8 -117, i8* %v191, align 1
				%v192 = getelementptr inbounds i8, i8* %v50, i32 396
				store i8 -116, i8* %v192, align 1
				%v193 = getelementptr inbounds i8, i8* %v50, i32 397
				store i8 -115, i8* %v193, align 1
				%v194 = getelementptr inbounds i8, i8* %v50, i32 398
				store i8 -114, i8* %v194, align 1
				%v195 = getelementptr inbounds i8, i8* %v50, i32 399
				store i8 -113, i8* %v195, align 1
				%v196 = getelementptr inbounds i8, i8* %v50, i32 400
				store i8 -112, i8* %v196, align 1
				%v197 = getelementptr inbounds i8, i8* %v50, i32 401
				store i8 -111, i8* %v197, align 1
				%v198 = getelementptr inbounds i8, i8* %v50, i32 402
				store i8 -110, i8* %v198, align 1
				%v199 = getelementptr inbounds i8, i8* %v50, i32 403
				store i8 -109, i8* %v199, align 1
				%v200 = getelementptr inbounds i8, i8* %v50, i32 404
				store i8 -108, i8* %v200, align 1
				%v201 = getelementptr inbounds i8, i8* %v50, i32 405
				store i8 -107, i8* %v201, align 1
				%v202 = getelementptr inbounds i8, i8* %v50, i32 406
				store i8 -106, i8* %v202, align 1
				%v203 = getelementptr inbounds i8, i8* %v50, i32 407
				store i8 -105, i8* %v203, align 1
				%v204 = getelementptr inbounds i8, i8* %v50, i32 408
				store i8 -104, i8* %v204, align 1
				%v205 = getelementptr inbounds i8, i8* %v50, i32 409
				store i8 -103, i8* %v205, align 1
				%v206 = getelementptr inbounds i8, i8* %v50, i32 410
				store i8 -102, i8* %v206, align 1
				%v207 = getelementptr inbounds i8, i8* %v50, i32 411
				store i8 -101, i8* %v207, align 1
				%v208 = getelementptr inbounds i8, i8* %v50, i32 412
				store i8 -100, i8* %v208, align 1
				%v209 = getelementptr inbounds i8, i8* %v50, i32 413
				store i8 -99, i8* %v209, align 1
				%v210 = getelementptr inbounds i8, i8* %v50, i32 414
				store i8 -98, i8* %v210, align 1
				%v211 = getelementptr inbounds i8, i8* %v50, i32 415
				store i8 -97, i8* %v211, align 1
				%v212 = getelementptr inbounds i8, i8* %v50, i32 416
				store i8 -96, i8* %v212, align 1
				%v213 = getelementptr inbounds i8, i8* %v50, i32 417
				store i8 -95, i8* %v213, align 1
				%v214 = getelementptr inbounds i8, i8* %v50, i32 418
				store i8 -94, i8* %v214, align 1
				%v215 = getelementptr inbounds i8, i8* %v50, i32 419
				store i8 -93, i8* %v215, align 1
				%v216 = getelementptr inbounds i8, i8* %v50, i32 420
				store i8 -92, i8* %v216, align 1
				%v217 = getelementptr inbounds i8, i8* %v50, i32 421
				store i8 -91, i8* %v217, align 1
				%v218 = getelementptr inbounds i8, i8* %v50, i32 422
				store i8 -90, i8* %v218, align 1
				%v219 = getelementptr inbounds i8, i8* %v50, i32 423
				store i8 -89, i8* %v219, align 1
				%v220 = getelementptr inbounds i8, i8* %v50, i32 424
				store i8 -88, i8* %v220, align 1
				%v221 = getelementptr inbounds i8, i8* %v50, i32 425
				store i8 -87, i8* %v221, align 1
				%v222 = getelementptr inbounds i8, i8* %v50, i32 426
				store i8 -86, i8* %v222, align 1
				%v223 = getelementptr inbounds i8, i8* %v50, i32 427
				store i8 -85, i8* %v223, align 1
				%v224 = getelementptr inbounds i8, i8* %v50, i32 428
				store i8 -84, i8* %v224, align 1
				%v225 = getelementptr inbounds i8, i8* %v50, i32 429
				store i8 -83, i8* %v225, align 1
				%v226 = getelementptr inbounds i8, i8* %v50, i32 430
				store i8 -82, i8* %v226, align 1
				%v227 = getelementptr inbounds i8, i8* %v50, i32 431
				store i8 -81, i8* %v227, align 1
				%v228 = getelementptr inbounds i8, i8* %v50, i32 432
				store i8 -80, i8* %v228, align 1
				%v229 = getelementptr inbounds i8, i8* %v50, i32 433
				store i8 -79, i8* %v229, align 1
				%v230 = getelementptr inbounds i8, i8* %v50, i32 434
				store i8 -78, i8* %v230, align 1
				%v231 = getelementptr inbounds i8, i8* %v50, i32 435
				store i8 -77, i8* %v231, align 1
				%v232 = getelementptr inbounds i8, i8* %v50, i32 436
				store i8 -76, i8* %v232, align 1
				%v233 = getelementptr inbounds i8, i8* %v50, i32 437
				store i8 -75, i8* %v233, align 1
				%v234 = getelementptr inbounds i8, i8* %v50, i32 438
				store i8 -74, i8* %v234, align 1
				%v235 = getelementptr inbounds i8, i8* %v50, i32 439
				store i8 -73, i8* %v235, align 1
				%v236 = getelementptr inbounds i8, i8* %v50, i32 440
				store i8 -72, i8* %v236, align 1
				%v237 = getelementptr inbounds i8, i8* %v50, i32 441
				store i8 -71, i8* %v237, align 1
				%v238 = getelementptr inbounds i8, i8* %v50, i32 442
				store i8 -70, i8* %v238, align 1
				%v239 = getelementptr inbounds i8, i8* %v50, i32 443
				store i8 -69, i8* %v239, align 1
				%v240 = getelementptr inbounds i8, i8* %v50, i32 444
				store i8 -68, i8* %v240, align 1
				%v241 = getelementptr inbounds i8, i8* %v50, i32 445
				store i8 -67, i8* %v241, align 1
				%v242 = getelementptr inbounds i8, i8* %v50, i32 446
				store i8 -66, i8* %v242, align 1
				%v243 = getelementptr inbounds i8, i8* %v50, i32 447
				store i8 -65, i8* %v243, align 1
				%v244 = getelementptr inbounds i8, i8* %v50, i32 448
				store i8 -64, i8* %v244, align 1
				%v245 = getelementptr inbounds i8, i8* %v50, i32 449
				store i8 -63, i8* %v245, align 1
				%v246 = getelementptr inbounds i8, i8* %v50, i32 450
				store i8 -62, i8* %v246, align 1
				%v247 = getelementptr inbounds i8, i8* %v50, i32 451
				store i8 -61, i8* %v247, align 1
				%v248 = getelementptr inbounds i8, i8* %v50, i32 452
				store i8 -60, i8* %v248, align 1
				%v249 = getelementptr inbounds i8, i8* %v50, i32 453
				store i8 -59, i8* %v249, align 1
				%v250 = getelementptr inbounds i8, i8* %v50, i32 454
				store i8 -58, i8* %v250, align 1
				%v251 = getelementptr inbounds i8, i8* %v50, i32 455
				store i8 -57, i8* %v251, align 1
				%v252 = getelementptr inbounds i8, i8* %v50, i32 456
				store i8 -56, i8* %v252, align 1
				%v253 = getelementptr inbounds i8, i8* %v50, i32 457
				store i8 -55, i8* %v253, align 1
				%v254 = getelementptr inbounds i8, i8* %v50, i32 458
				store i8 -54, i8* %v254, align 1
				%v255 = getelementptr inbounds i8, i8* %v50, i32 459
				store i8 -53, i8* %v255, align 1
				%v256 = getelementptr inbounds i8, i8* %v50, i32 460
				store i8 -52, i8* %v256, align 1
				%v257 = getelementptr inbounds i8, i8* %v50, i32 461
				store i8 -51, i8* %v257, align 1
				%v258 = getelementptr inbounds i8, i8* %v50, i32 462
				store i8 -50, i8* %v258, align 1
				%v259 = getelementptr inbounds i8, i8* %v50, i32 463
				store i8 -49, i8* %v259, align 1
				%v260 = getelementptr inbounds i8, i8* %v50, i32 464
				store i8 -48, i8* %v260, align 1
				%v261 = getelementptr inbounds i8, i8* %v50, i32 465
				store i8 -47, i8* %v261, align 1
				%v262 = getelementptr inbounds i8, i8* %v50, i32 466
				store i8 -46, i8* %v262, align 1
				%v263 = getelementptr inbounds i8, i8* %v50, i32 467
				store i8 -45, i8* %v263, align 1
				%v264 = getelementptr inbounds i8, i8* %v50, i32 468
				store i8 -44, i8* %v264, align 1
				%v265 = getelementptr inbounds i8, i8* %v50, i32 469
				store i8 -43, i8* %v265, align 1
				%v266 = getelementptr inbounds i8, i8* %v50, i32 470
				store i8 -42, i8* %v266, align 1
				%v267 = getelementptr inbounds i8, i8* %v50, i32 471
				store i8 -41, i8* %v267, align 1
				%v268 = getelementptr inbounds i8, i8* %v50, i32 472
				store i8 -40, i8* %v268, align 1
				%v269 = getelementptr inbounds i8, i8* %v50, i32 473
				store i8 -39, i8* %v269, align 1
				%v270 = getelementptr inbounds i8, i8* %v50, i32 474
				store i8 -38, i8* %v270, align 1
				%v271 = getelementptr inbounds i8, i8* %v50, i32 475
				store i8 -37, i8* %v271, align 1
				%v272 = getelementptr inbounds i8, i8* %v50, i32 476
				store i8 -36, i8* %v272, align 1
				%v273 = getelementptr inbounds i8, i8* %v50, i32 477
				store i8 -35, i8* %v273, align 1
				%v274 = getelementptr inbounds i8, i8* %v50, i32 478
				store i8 -34, i8* %v274, align 1
				%v275 = getelementptr inbounds i8, i8* %v50, i32 479
				store i8 -33, i8* %v275, align 1
				%v276 = getelementptr inbounds i8, i8* %v50, i32 480
				store i8 -32, i8* %v276, align 1
				%v277 = getelementptr inbounds i8, i8* %v50, i32 481
				store i8 -31, i8* %v277, align 1
				%v278 = getelementptr inbounds i8, i8* %v50, i32 482
				store i8 -30, i8* %v278, align 1
				%v279 = getelementptr inbounds i8, i8* %v50, i32 483
				store i8 -29, i8* %v279, align 1
				%v280 = getelementptr inbounds i8, i8* %v50, i32 484
				store i8 -28, i8* %v280, align 1
				%v281 = getelementptr inbounds i8, i8* %v50, i32 485
				store i8 -27, i8* %v281, align 1
				%v282 = getelementptr inbounds i8, i8* %v50, i32 486
				store i8 -26, i8* %v282, align 1
				%v283 = getelementptr inbounds i8, i8* %v50, i32 487
				store i8 -25, i8* %v283, align 1
				%v284 = getelementptr inbounds i8, i8* %v50, i32 488
				store i8 -24, i8* %v284, align 1
				%v285 = getelementptr inbounds i8, i8* %v50, i32 489
				store i8 -23, i8* %v285, align 1
				%v286 = getelementptr inbounds i8, i8* %v50, i32 490
				store i8 -22, i8* %v286, align 1
				%v287 = getelementptr inbounds i8, i8* %v50, i32 491
				store i8 -21, i8* %v287, align 1
				%v288 = getelementptr inbounds i8, i8* %v50, i32 492
				store i8 -20, i8* %v288, align 1
				%v289 = getelementptr inbounds i8, i8* %v50, i32 493
				store i8 -19, i8* %v289, align 1
				%v290 = getelementptr inbounds i8, i8* %v50, i32 494
				store i8 -18, i8* %v290, align 1
				%v291 = getelementptr inbounds i8, i8* %v50, i32 495
				store i8 -17, i8* %v291, align 1
				%v292 = getelementptr inbounds i8, i8* %v50, i32 496
				store i8 -16, i8* %v292, align 1
				%v293 = getelementptr inbounds i8, i8* %v50, i32 497
				store i8 -15, i8* %v293, align 1
				%v294 = getelementptr inbounds i8, i8* %v50, i32 498
				store i8 -14, i8* %v294, align 1
				%v295 = getelementptr inbounds i8, i8* %v50, i32 499
				store i8 -13, i8* %v295, align 1
				%v296 = getelementptr inbounds i8, i8* %v50, i32 500
				store i8 -12, i8* %v296, align 1
				%v297 = getelementptr inbounds i8, i8* %v50, i32 501
				store i8 -11, i8* %v297, align 1
				%v298 = getelementptr inbounds i8, i8* %v50, i32 502
				store i8 -10, i8* %v298, align 1
				%v299 = getelementptr inbounds i8, i8* %v50, i32 503
				store i8 -9, i8* %v299, align 1
				%v300 = getelementptr inbounds i8, i8* %v50, i32 504
				store i8 -8, i8* %v300, align 1
				%v301 = getelementptr inbounds i8, i8* %v50, i32 505
				store i8 -7, i8* %v301, align 1
				%v302 = getelementptr inbounds i8, i8* %v50, i32 506
				store i8 -6, i8* %v302, align 1
				%v303 = getelementptr inbounds i8, i8* %v50, i32 507
				store i8 -5, i8* %v303, align 1
				%v304 = getelementptr inbounds i8, i8* %v50, i32 508
				store i8 -4, i8* %v304, align 1
				%v305 = getelementptr inbounds i8, i8* %v50, i32 509
				store i8 -3, i8* %v305, align 1
				%v306 = getelementptr inbounds i8, i8* %v50, i32 510
				store i8 -2, i8* %v306, align 1
				%v307 = getelementptr inbounds i8, i8* %v50, i32 511
				store i8 -1, i8* %v307, align 1
				ret void
				}

				attributes #0 = { nounwind "correctly-rounded-divide-sqrt-fp-math"="false" "denormal-fp-math"="preserve-sign" "disable-tail-calls"="false" "less-precise-fpmad"="false" "no-frame-pointer-elim"="false" "no-infs-fp-math"="true" "no-jump-tables"="false" "no-nans-fp-math"="true" "no-signed-zeros-fp-math"="true" "no-trapping-math"="true" "stack-protector-buffer-size"="8" "target-cpu"="cortex-m7" "target-features"="+d16,+dsp,+fp-armv8,+hwdiv,+thumb-mode,-crc,-crypto,-dotprod,-fp-only-sp,-fullfp16,-hwdiv-arm,-neon,-ras" "unsafe-fp-math"="false" "use-soft-float"="false" }

llvm/test/CodeGen/ARM/fp16-promote.ll

	Show First 20 Lines • Show All 811 Lines • ▼ Show 20 Lines
	}			}

	; f16 vectors are not legal in the backend. Vector elements are not assigned			; f16 vectors are not legal in the backend. Vector elements are not assigned
	; to the register, but are stored in the stack instead. Hence insertelement			; to the register, but are stored in the stack instead. Hence insertelement
	; and extractelement have these extra loads and stores.			; and extractelement have these extra loads and stores.

	; CHECK-ALL-LABEL: test_insertelement:			; CHECK-ALL-LABEL: test_insertelement:
	; CHECK-ALL: sub sp, sp, #8			; CHECK-ALL: sub sp, sp, #8
	; CHECK-ALL: ldrh
	; CHECK-ALL: ldrh			; CHECK-VFP: and
	; CHECK-ALL: ldrh			; CHECK-VFP: mov
	; CHECK-ALL: ldrh			; CHECK-VFP: ldrd
	; CHECK-ALL-DAG: strh			; CHECK-VFP: orr
	; CHECK-ALL-DAG: strh			; CHECK-VFP: ldrh
	; CHECK-ALL-DAG: mov			; CHECK-VFP: stm
	; CHECK-ALL-DAG: ldrh			; CHECK-VFP: strh
	; CHECK-ALL-DAG: orr			; CHECK-VFP: ldm
	; CHECK-ALL-DAG: strh			; CHECK-VFP: stm
	; CHECK-ALL-DAG: strh
	; CHECK-ALL-DAG: strh			; CHECK-NOVFP: ldrh
	; CHECK-ALL-DAG: ldrh			; CHECK-NOVFP: ldrh
	; CHECK-ALL-DAG: ldrh			; CHECK-NOVFP: ldrh
	; CHECK-ALL-DAG: ldrh			; CHECK-NOVFP: ldrh
	; CHECK-ALL-DAG: strh			; CHECK-NOVFP-DAG: strh
	; CHECK-ALL-DAG: strh			; CHECK-NOVFP-DAG: strh
	; CHECK-ALL-DAG: strh			; CHECK-NOVFP-DAG: mov
	; CHECK-ALL-DAG: strh			; CHECK-NOVFP-DAG: ldrh
				; CHECK-NOVFP-DAG: orr
				; CHECK-NOVFP-DAG: strh
				; CHECK-NOVFP-DAG: strh
				; CHECK-NOVFP-DAG: strh
				; CHECK-NOVFP-DAG: ldrh
				; CHECK-NOVFP-DAG: ldrh
				; CHECK-NOVFP-DAG: ldrh
				; CHECK-NOVFP-DAG: strh
				; CHECK-NOVFP-DAG: strh
				; CHECK-NOVFP-DAG: strh
				; CHECK-NOVFP-DAG: strh

	; CHECK-ALL: add sp, sp, #8			; CHECK-ALL: add sp, sp, #8
	define void @test_insertelement(half* %p, <4 x half>* %q, i32 %i) #0 {			define void @test_insertelement(half* %p, <4 x half>* %q, i32 %i) #0 {
	%a = load half, half* %p, align 2			%a = load half, half* %p, align 2
	%b = load <4 x half>, <4 x half>* %q, align 8			%b = load <4 x half>, <4 x half>* %q, align 8
	%c = insertelement <4 x half> %b, half %a, i32 %i			%c = insertelement <4 x half> %b, half %a, i32 %i
	store <4 x half> %c, <4 x half>* %q			store <4 x half> %c, <4 x half>* %q
	ret void			ret void
	}			}
	▲ Show 20 Lines • Show All 115 Lines • Show Last 20 Lines

This is an archive of the discontinued LLVM Phabricator instance.

[ARM][AArch64][DAG] Reenable post-legalize store merge
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 125359

llvm/lib/CodeGen/SelectionDAG/DAGCombiner.cpp

llvm/lib/Target/AArch64/AArch64ISelLowering.h

llvm/lib/Target/ARM/ARMISelLowering.h

llvm/test/CodeGen/AArch64/arm64-complex-ret.ll

llvm/test/CodeGen/AArch64/arm64-narrow-st-merge.ll

llvm/test/CodeGen/AArch64/arm64-variadic-aapcs.ll

llvm/test/CodeGen/AArch64/tailcall-explicit-sret.ll

llvm/test/CodeGen/AArch64/tailcall-implicit-sret.ll

llvm/test/CodeGen/ARM/arm-storebytesmerge.ll

llvm/test/CodeGen/ARM/fp16-promote.ll

This is an archive of the discontinued LLVM Phabricator instance.

[ARM][AArch64][DAG] Reenable post-legalize store mergeClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 125359

llvm/lib/CodeGen/SelectionDAG/DAGCombiner.cpp

llvm/lib/Target/AArch64/AArch64ISelLowering.h

llvm/lib/Target/ARM/ARMISelLowering.h

llvm/test/CodeGen/AArch64/arm64-complex-ret.ll

llvm/test/CodeGen/AArch64/arm64-narrow-st-merge.ll

llvm/test/CodeGen/AArch64/arm64-variadic-aapcs.ll

llvm/test/CodeGen/AArch64/tailcall-explicit-sret.ll

llvm/test/CodeGen/AArch64/tailcall-implicit-sret.ll

llvm/test/CodeGen/ARM/arm-storebytesmerge.ll

llvm/test/CodeGen/ARM/fp16-promote.ll

[ARM][AArch64][DAG] Reenable post-legalize store merge
ClosedPublic