Diff 28671

lib/CodeGen/SelectionDAG/TargetLowering.cpp

Show First 20 Lines • Show All 109 Lines • ▼ Show 20 Lines	TargetLowering::makeLibCall(SelectionDAG &DAG,
CLI.setDebugLoc(dl).setChain(DAG.getEntryNode())		CLI.setDebugLoc(dl).setChain(DAG.getEntryNode())
.setCallee(getLibcallCallingConv(LC), RetTy, Callee, std::move(Args), 0)		.setCallee(getLibcallCallingConv(LC), RetTy, Callee, std::move(Args), 0)
.setNoReturn(doesNotReturn).setDiscardResult(!isReturnValueUsed)		.setNoReturn(doesNotReturn).setDiscardResult(!isReturnValueUsed)
.setSExtResult(signExtend).setZExtResult(!signExtend);		.setSExtResult(signExtend).setZExtResult(!signExtend);
return LowerCallTo(CLI);		return LowerCallTo(CLI);
}		}



		abUnsubmitted Not Done Reply Inline Actions There was one newline too many, now there are two. Remove them both? ab: There was one newline too many, now there are two. Remove them both?
/// SoftenSetCCOperands - Soften the operands of a comparison. This code is		/// SoftenSetCCOperands - Soften the operands of a comparison. This code is
/// shared among BR_CC, SELECT_CC, and SETCC handlers.		/// shared among BR_CC, SELECT_CC, and SETCC handlers.
void TargetLowering::softenSetCCOperands(SelectionDAG &DAG, EVT VT,		void TargetLowering::softenSetCCOperands(SelectionDAG &DAG, EVT VT,
SDValue &NewLHS, SDValue &NewRHS,		SDValue &NewLHS, SDValue &NewRHS,
ISD::CondCode &CCCode,		ISD::CondCode &CCCode,
SDLoc dl) const {		SDLoc dl) const {
assert((VT == MVT::f32 || VT == MVT::f64 || VT == MVT::f128)		assert((VT == MVT::f32 || VT == MVT::f64 || VT == MVT::f128)
&& "Unsupported setcc type!");		&& "Unsupported setcc type!");

// Expand into one or more soft-fp libcall(s).		// Expand into one or more soft-fp libcall(s).
RTLIB::Libcall LC1 = RTLIB::UNKNOWN_LIBCALL, LC2 = RTLIB::UNKNOWN_LIBCALL;		RTLIB::Libcall LC1 = RTLIB::UNKNOWN_LIBCALL, LC2 = RTLIB::UNKNOWN_LIBCALL;
		bool getInverseCC = false;
		abUnsubmitted Not Done Reply Inline Actions Capital g, and name sounds like a function. What about something like "ShouldInvertCC" ? ab: Capital g, and name sounds like a function. What about something like "ShouldInvertCC" ?
switch (CCCode) {		switch (CCCode) {
case ISD::SETEQ:		case ISD::SETEQ:
case ISD::SETOEQ:		case ISD::SETOEQ:
LC1 = (VT == MVT::f32) ? RTLIB::OEQ_F32 :		LC1 = (VT == MVT::f32) ? RTLIB::OEQ_F32 :
(VT == MVT::f64) ? RTLIB::OEQ_F64 : RTLIB::OEQ_F128;		(VT == MVT::f64) ? RTLIB::OEQ_F64 : RTLIB::OEQ_F128;
break;		break;
case ISD::SETNE:		case ISD::SETNE:
case ISD::SETUNE:		case ISD::SETUNE:
Show All 23 Lines	void TargetLowering::softenSetCCOperands(SelectionDAG &DAG, EVT VT,
case ISD::SETUO:		case ISD::SETUO:
LC1 = (VT == MVT::f32) ? RTLIB::UO_F32 :		LC1 = (VT == MVT::f32) ? RTLIB::UO_F32 :
(VT == MVT::f64) ? RTLIB::UO_F64 : RTLIB::UO_F128;		(VT == MVT::f64) ? RTLIB::UO_F64 : RTLIB::UO_F128;
break;		break;
case ISD::SETO:		case ISD::SETO:
LC1 = (VT == MVT::f32) ? RTLIB::O_F32 :		LC1 = (VT == MVT::f32) ? RTLIB::O_F32 :
(VT == MVT::f64) ? RTLIB::O_F64 : RTLIB::O_F128;		(VT == MVT::f64) ? RTLIB::O_F64 : RTLIB::O_F128;
break;		break;
default:
LC1 = (VT == MVT::f32) ? RTLIB::UO_F32 :
(VT == MVT::f64) ? RTLIB::UO_F64 : RTLIB::UO_F128;
switch (CCCode) {
case ISD::SETONE:		case ISD::SETONE:
// SETONE = SETOLT | SETOGT		// SETONE = SETOLT | SETOGT
LC1 = (VT == MVT::f32) ? RTLIB::OLT_F32 :		LC1 = (VT == MVT::f32) ? RTLIB::OLT_F32 :
(VT == MVT::f64) ? RTLIB::OLT_F64 : RTLIB::OLT_F128;		(VT == MVT::f64) ? RTLIB::OLT_F64 : RTLIB::OLT_F128;
// Fallthrough
case ISD::SETUGT:
LC2 = (VT == MVT::f32) ? RTLIB::OGT_F32 :		LC2 = (VT == MVT::f32) ? RTLIB::OGT_F32 :
(VT == MVT::f64) ? RTLIB::OGT_F64 : RTLIB::OGT_F128;		(VT == MVT::f64) ? RTLIB::OGT_F64 : RTLIB::OGT_F128;
break;		break;
case ISD::SETUGE:		case ISD::SETUEQ:
LC2 = (VT == MVT::f32) ? RTLIB::OGE_F32 :		LC1 = (VT == MVT::f32) ? RTLIB::UO_F32 :
(VT == MVT::f64) ? RTLIB::OGE_F64 : RTLIB::OGE_F128;		(VT == MVT::f64) ? RTLIB::UO_F64 : RTLIB::UO_F128;
		LC2 = (VT == MVT::f32) ? RTLIB::OEQ_F32 :
		(VT == MVT::f64) ? RTLIB::OEQ_F64 : RTLIB::OEQ_F128;
break;		break;
		default:
		// Inverse CC for unordered comparison
		abUnsubmitted Not Done Reply Inline Actions "Invert CC for unordered comparisons." ? ab: "Invert CC for unordered comparisons." ?
		getInverseCC = true;
		switch (CCCode) {
case ISD::SETULT:		case ISD::SETULT:
LC2 = (VT == MVT::f32) ? RTLIB::OLT_F32 :		LC1 = (VT == MVT::f32) ? RTLIB::OGE_F32 :
		abUnsubmitted Not Done Reply Inline Actions Indentation seems off, clang-format? ab: Indentation seems off, clang-format?
(VT == MVT::f64) ? RTLIB::OLT_F64 : RTLIB::OLT_F128;		(VT == MVT::f64) ? RTLIB::OGE_F64 : RTLIB::OGE_F128;
break;		break;
case ISD::SETULE:		case ISD::SETULE:
LC2 = (VT == MVT::f32) ? RTLIB::OLE_F32 :		LC1 = (VT == MVT::f32) ? RTLIB::OGT_F32 :
		(VT == MVT::f64) ? RTLIB::OGT_F64 : RTLIB::OGT_F128;
		break;
		case ISD::SETUGT:
		LC1 = (VT == MVT::f32) ? RTLIB::OLE_F32 :
(VT == MVT::f64) ? RTLIB::OLE_F64 : RTLIB::OLE_F128;		(VT == MVT::f64) ? RTLIB::OLE_F64 : RTLIB::OLE_F128;
break;		break;
case ISD::SETUEQ:		case ISD::SETUGE:
LC2 = (VT == MVT::f32) ? RTLIB::OEQ_F32 :		LC1 = (VT == MVT::f32) ? RTLIB::OLT_F32 :
(VT == MVT::f64) ? RTLIB::OEQ_F64 : RTLIB::OEQ_F128;		(VT == MVT::f64) ? RTLIB::OLT_F64 : RTLIB::OLT_F128;
break;		break;
default: llvm_unreachable("Do not know how to soften this setcc!");		default: llvm_unreachable("Do not know how to soften this setcc!");
}		}
}		}

// Use the target specific return value for comparions lib calls.		// Use the target specific return value for comparions lib calls.
EVT RetVT = getCmpLibcallReturnType();		EVT RetVT = getCmpLibcallReturnType();
SDValue Ops[2] = { NewLHS, NewRHS };		SDValue Ops[2] = { NewLHS, NewRHS };
NewLHS = makeLibCall(DAG, LC1, RetVT, Ops, 2, false/*sign irrelevant*/,		NewLHS = makeLibCall(DAG, LC1, RetVT, Ops, 2, false/*sign irrelevant*/,
dl).first;		dl).first;
NewRHS = DAG.getConstant(0, dl, RetVT);		NewRHS = DAG.getConstant(0, dl, RetVT);

CCCode = getCmpLibcallCC(LC1);		CCCode = getCmpLibcallCC(LC1);
		if (getInverseCC)
		CCCode = getSetCCInverse(CCCode, true);
		abUnsubmitted Not Done Reply Inline Actions "true" -> "/*isInteger=*/true" ? ab: "true" -> "/*isInteger=*/true" ?

if (LC2 != RTLIB::UNKNOWN_LIBCALL) {		if (LC2 != RTLIB::UNKNOWN_LIBCALL) {
SDValue Tmp = DAG.getNode(ISD::SETCC, dl,		SDValue Tmp = DAG.getNode(ISD::SETCC, dl,
getSetCCResultType(*DAG.getContext(), RetVT),		getSetCCResultType(*DAG.getContext(), RetVT),
NewLHS, NewRHS, DAG.getCondCode(CCCode));		NewLHS, NewRHS, DAG.getCondCode(CCCode));
NewLHS = makeLibCall(DAG, LC2, RetVT, Ops, 2, false/*sign irrelevant*/,		NewLHS = makeLibCall(DAG, LC2, RetVT, Ops, 2, false/*sign irrelevant*/,
dl).first;		dl).first;
NewLHS = DAG.getNode(ISD::SETCC, dl,		NewLHS = DAG.getNode(ISD::SETCC, dl,
getSetCCResultType(*DAG.getContext(), RetVT), NewLHS,		getSetCCResultType(*DAG.getContext(), RetVT), NewLHS,
NewRHS, DAG.getCondCode(getCmpLibcallCC(LC2)));		NewRHS, DAG.getCondCode(getCmpLibcallCC(LC2)));
NewLHS = DAG.getNode(ISD::OR, dl, Tmp.getValueType(), Tmp, NewLHS);		NewLHS = DAG.getNode(ISD::OR, dl, Tmp.getValueType(), Tmp, NewLHS);
NewRHS = SDValue();		NewRHS = SDValue();
}		}
}		}

/// getJumpTableEncoding - Return the entry encoding for a jump table in the		/// getJumpTableEncoding - Return the entry encoding for a jump table in the
/// current function. The returned value is a member of the		/// current function. The returned value is a member of the
/// MachineJumpTableInfo::JTEntryKind enum.		/// MachineJumpTableInfo::JTEntryKind enum.
unsigned TargetLowering::getJumpTableEncoding() const {		unsigned TargetLowering::getJumpTableEncoding() const {
// In non-pic modes, just use the address of a block.		// In non-pic modes, just use the address of a block.
▲ Show 20 Lines • Show All 2,771 Lines • Show Last 20 Lines

test/CodeGen/AArch64/arm64-fp128.ll

	Show First 20 Lines • Show All 142 Lines • ▼ Show 20 Lines
	; CHECK-LABEL: test_setcc2:			; CHECK-LABEL: test_setcc2:

	%lhs = load fp128, fp128* @lhs, align 16			%lhs = load fp128, fp128* @lhs, align 16
	%rhs = load fp128, fp128* @rhs, align 16			%rhs = load fp128, fp128* @rhs, align 16
	; CHECK: ldr q0, [{{x[0-9]+}}, :lo12:lhs]			; CHECK: ldr q0, [{{x[0-9]+}}, :lo12:lhs]
	; CHECK: ldr q1, [{{x[0-9]+}}, :lo12:rhs]			; CHECK: ldr q1, [{{x[0-9]+}}, :lo12:rhs]

	%val = fcmp ugt fp128 %lhs, %rhs			%val = fcmp ugt fp128 %lhs, %rhs
	; CHECK: bl __gttf2			; CHECK: bl __letf2
	; CHECK: cmp w0, #0			; CHECK: cmp w0, #0
	; CHECK: cset [[GT:w[0-9]+]], gt			; CHECK: cset [[GT:w[0-9]+]], gt
				abUnsubmitted Not Done Reply Inline Actions Is this just "cset w0, gt" ? ab: Is this just "cset w0, gt" ?

	; CHECK: bl __unordtf2
	; CHECK: cmp w0, #0
	; CHECK: cset [[UNORDERED:w[0-9]+]], ne
	; CHECK: orr w0, [[UNORDERED]], [[GT]]

	ret i1 %val			ret i1 %val
	; CHECK: ret			; CHECK: ret
	}			}

	define i32 @test_br_cc() {			define i32 @test_br_cc() {
	; CHECK-LABEL: test_br_cc:			; CHECK-LABEL: test_br_cc:

	%lhs = load fp128, fp128* @lhs, align 16			%lhs = load fp128, fp128* @lhs, align 16
	%rhs = load fp128, fp128* @rhs, align 16			%rhs = load fp128, fp128* @rhs, align 16
	; CHECK: ldr q0, [{{x[0-9]+}}, :lo12:lhs]			; CHECK: ldr q0, [{{x[0-9]+}}, :lo12:lhs]
	; CHECK: ldr q1, [{{x[0-9]+}}, :lo12:rhs]			; CHECK: ldr q1, [{{x[0-9]+}}, :lo12:rhs]

	; olt == !uge, which LLVM unfortunately "optimizes" this to.			; olt == !uge, which LLVM unfortunately "optimizes" this to.
				abUnsubmitted Not Done Reply Inline Actions Can this comment be removed now? I guess your change lets us undo some other transform (which you should probably look into by the way) ab: Can this comment be removed now? I guess your change lets us undo some other transform (which…
				anadolskiyAuthorUnsubmitted Not Done Reply Inline Actions This comment explains line 171: why we compare with GE, instead of LT (that should be in case of ordered LT) anadolskiy: This comment explains line 171: why we compare with GE, instead of LT (that should be in case…
				abUnsubmitted Not Done Reply Inline Actions Hmm, that's not how I understood the comment. Checking both uno/__unordtf2 and oge/__getf2 is indeed an 'unfortunate "optimization"'. We used to do something like: IR: %1 = fcmp olt ... br i1 %1, label %iftrue, label %iffalse SelectionDAG: %1 = fcmp olt ... %2 = xor i1 %1, 1 brcond i1 %2, label %iffalse br label %iftrue Optimized SelectionDAG: %1 = fcmp uge ... brcond i1 %2, label %iffalse br label %iftrue It's this optimization that the comment complains about, I think, because a softened uge used to need two libcalls (as opposed to 1 for olt). Whereas I read: bl __lttf2 cmp w0, #0 b.ge <iffalse> iftrue: as a straightforward lowering for: %1 = fcmp olt ... %2 = xor i1 %1, 1 brcond i1 %2, label %iffalse br label %iftrue via (given that __lttf2 returns < 0 / -1 on "olt" only): %1 = call @__lttf2 %2 = icmp lt i32 %1, 0 %3 = xor i1 %2, 1 brcond i1 %3, label %iffalse br label %iftrue itself simplified to: %1 = call @__lttf2 %2 = icmp ge i32 %1, 0 brcond i1 %2, label %iffalse br label %iftrue In any case, not a big deal, but I might have missed something, so: am I making sense? ab: Hmm, that's not how I understood the comment. Checking both uno/__unordtf2 and oge/__getf2 is…
				anadolskiyAuthorUnsubmitted Not Done Reply Inline Actions Yes, exactly. But there's no XOR in given IR, so we must explain why GE. And I agree that <unfortunately "optimizes"> is now just "optimizes" anadolskiy: Yes, exactly. But there's no XOR in given IR, so we must explain why GE. And I agree that…
	%cond = fcmp olt fp128 %lhs, %rhs			%cond = fcmp olt fp128 %lhs, %rhs
	; CHECK: bl __getf2			; CHECK: bl __lttf2
	; CHECK: cmp w0, #0
	; CHECK: cset [[OGE:w[0-9]+]], ge

	; CHECK: bl __unordtf2
	; CHECK: cmp w0, #0			; CHECK: cmp w0, #0
	; CHECK: cset [[UNORDERED:w[0-9]+]], ne			; CHECK-NEXT: b.ge [[IFFALSE:.LBB[0-9]+_[0-9]+]]
				abUnsubmitted Not Done Reply Inline Actions You should check IFFALSE/RET29 somewhere. ab: You should check IFFALSE/RET29 somewhere.
				abUnsubmitted Not Done Reply Inline Actions CHECK-NEXT? ab: CHECK-NEXT?

	; CHECK: orr [[UGE:w[0-9]+]], [[UNORDERED]], [[OGE]]
	; CHECK: cbnz [[UGE]], [[RET29:.LBB[0-9]+_[0-9]+]]
	br i1 %cond, label %iftrue, label %iffalse			br i1 %cond, label %iftrue, label %iffalse

	iftrue:			iftrue:
	ret i32 42			ret i32 42
	; CHECK-NEXT: BB#			; CHECK-NEXT: BB#
	; CHECK-NEXT: movz w0, #0x2a			; CHECK-NEXT: movz w0, #0x2a
	; CHECK-NEXT: b [[REALRET:.LBB[0-9]+_[0-9]+]]			; CHECK: ret
				abUnsubmitted Not Done Reply Inline Actions CHECK-NEXT? ab: CHECK-NEXT?
				anadolskiyAuthorUnsubmitted Not Done Reply Inline Actions No, there is ldp instruction in between anadolskiy: No, there is ldp instruction in between

	iffalse:			iffalse:
	ret i32 29			ret i32 29
	; CHECK: [[RET29]]:			; CHECK: movz w0, #0x1d
	; CHECK-NEXT: movz w0, #0x1d
	; CHECK-NEXT: [[REALRET]]:
	; CHECK: ret			; CHECK: ret
				abUnsubmitted Not Done Reply Inline Actions CHECK-NEXT? ab: CHECK-NEXT?
				anadolskiyAuthorUnsubmitted Not Done Reply Inline Actions same here anadolskiy: same here
	}			}

	define void @test_select(i1 %cond, fp128 %lhs, fp128 %rhs) {			define void @test_select(i1 %cond, fp128 %lhs, fp128 %rhs) {
	; CHECK-LABEL: test_select:			; CHECK-LABEL: test_select:

	%val = select i1 %cond, fp128 %lhs, fp128 %rhs			%val = select i1 %cond, fp128 %lhs, fp128 %rhs
	store fp128 %val, fp128* @lhs, align 16			store fp128 %val, fp128* @lhs, align 16
	; CHECK: tst w0, #0x1			; CHECK: tst w0, #0x1
	▲ Show 20 Lines • Show All 68 Lines • Show Last 20 Lines

test/CodeGen/Mips/mips16fpe.ll

Show First 20 Lines • Show All 291 Lines • ▼ Show 20 Lines	;16hf-LABEL: test_ltsf2:
%0 = load float, float* @x, align 4		%0 = load float, float* @x, align 4
%1 = load float, float* @xx, align 4		%1 = load float, float* @xx, align 4
%lnot = fcmp uge float %0, %1		%lnot = fcmp uge float %0, %1
%2 = load float, float* @y, align 4		%2 = load float, float* @y, align 4
%cmp1 = fcmp olt float %0, %2		%cmp1 = fcmp olt float %0, %2
%and2 = and i1 %lnot, %cmp1		%and2 = and i1 %lnot, %cmp1
%and = zext i1 %and2 to i32		%and = zext i1 %and2 to i32
store i32 %and, i32* @ltsf2_result, align 4		store i32 %and, i32* @ltsf2_result, align 4
;16hf: lw ${{[0-9]+}}, %call16(__mips16_unordsf2)(${{[0-9]+}})		;16hf: lw ${{[0-9]+}}, %call16(__mips16_ltsf2)(${{[0-9]+}})
;16hf: lw ${{[0-9]+}}, %call16(__mips16_ltsf2)(${{[0-9]+}})		;16hf: lw ${{[0-9]+}}, %call16(__mips16_ltsf2)(${{[0-9]+}})
ret void		ret void
}		}

define void @test_ltdf2() nounwind {		define void @test_ltdf2() nounwind {
entry:		entry:
;16hf-LABEL: test_ltdf2:		;16hf-LABEL: test_ltdf2:
%0 = load double, double* @xd, align 8		%0 = load double, double* @xd, align 8
%1 = load double, double* @xxd, align 8		%1 = load double, double* @xxd, align 8
%lnot = fcmp uge double %0, %1		%lnot = fcmp uge double %0, %1
%2 = load double, double* @yd, align 8		%2 = load double, double* @yd, align 8
%cmp1 = fcmp olt double %0, %2		%cmp1 = fcmp olt double %0, %2
%and2 = and i1 %lnot, %cmp1		%and2 = and i1 %lnot, %cmp1
%and = zext i1 %and2 to i32		%and = zext i1 %and2 to i32
store i32 %and, i32* @ltdf2_result, align 4		store i32 %and, i32* @ltdf2_result, align 4
;16hf: lw ${{[0-9]+}}, %call16(__mips16_unorddf2)(${{[0-9]+}})		;16hf: lw ${{[0-9]+}}, %call16(__mips16_ltdf2)(${{[0-9]+}})
;16hf: lw ${{[0-9]+}}, %call16(__mips16_ltdf2)(${{[0-9]+}})		;16hf: lw ${{[0-9]+}}, %call16(__mips16_ltdf2)(${{[0-9]+}})
ret void		ret void
}		}

define void @test_lesf2() nounwind {		define void @test_lesf2() nounwind {
entry:		entry:
;16hf-LABEL: test_lesf2:		;16hf-LABEL: test_lesf2:
%0 = load float, float* @x, align 4		%0 = load float, float* @x, align 4
▲ Show 20 Lines • Show All 57 Lines • Show Last 20 Lines

test/CodeGen/Thumb2/float-cmp.ll

	Show First 20 Lines • Show All 75 Lines • ▼ Show 20 Lines
	; HARD: vcmpe.f32			; HARD: vcmpe.f32
	; HARD: moveq r0, #1			; HARD: moveq r0, #1
	; HARD: movvs r0, #1			; HARD: movvs r0, #1
	%1 = fcmp ueq float %a, %b			%1 = fcmp ueq float %a, %b
	ret i1 %1			ret i1 %1
	}			}
	define i1 @cmp_f_ugt(float %a, float %b) {			define i1 @cmp_f_ugt(float %a, float %b) {
	; CHECK-LABEL: cmp_f_ugt:			; CHECK-LABEL: cmp_f_ugt:
	; NONE: bl __aeabi_fcmpgt			; NONE: bl __aeabi_fcmple
				abUnsubmitted Not Done Reply Inline Actions Hmm, these might benefit from stricter CHECK/NONE, since I guess the result gets inverted? ab: Hmm, these might benefit from stricter CHECK/NONE, since I guess the result gets inverted?
				anadolskiyAuthorUnsubmitted Not Done Reply Inline Actions Sorry, I didn't understand that. Can you please explain? anadolskiy: Sorry, I didn't understand that. Can you please explain?
				abUnsubmitted Not Done Reply Inline Actions The IR does an UGT comparison, but this patch checks for OLE. Since UGT == !OLE, I imagine there's some code right after the call that inverts r0 somehow. I'm saying it might be a good idea to check (in this case, using "NONE:") that code as well. ab: The IR does an UGT comparison, but this patch checks for OLE. Since UGT == !OLE, I imagine…
	; NONE: bl __aeabi_fcmpun
	; HARD: vcmpe.f32			; HARD: vcmpe.f32
	; HARD: movhi r0, #1			; HARD: movhi r0, #1
	%1 = fcmp ugt float %a, %b			%1 = fcmp ugt float %a, %b
	ret i1 %1			ret i1 %1
	}			}
	define i1 @cmp_f_uge(float %a, float %b) {			define i1 @cmp_f_uge(float %a, float %b) {
	; CHECK-LABEL: cmp_f_uge:			; CHECK-LABEL: cmp_f_uge:
	; NONE: bl __aeabi_fcmpge			; NONE: bl __aeabi_fcmplt
	; NONE: bl __aeabi_fcmpun
	; HARD: vcmpe.f32			; HARD: vcmpe.f32
	; HARD: movpl r0, #1			; HARD: movpl r0, #1
	%1 = fcmp uge float %a, %b			%1 = fcmp uge float %a, %b
	ret i1 %1			ret i1 %1
	}			}
	define i1 @cmp_f_ult(float %a, float %b) {			define i1 @cmp_f_ult(float %a, float %b) {
	; CHECK-LABEL: cmp_f_ult:			; CHECK-LABEL: cmp_f_ult:
	; NONE: bl __aeabi_fcmplt			; NONE: bl __aeabi_fcmpge
	; NONE: bl __aeabi_fcmpun
	; HARD: vcmpe.f32			; HARD: vcmpe.f32
	; HARD: movlt r0, #1			; HARD: movlt r0, #1
	%1 = fcmp ult float %a, %b			%1 = fcmp ult float %a, %b
	ret i1 %1			ret i1 %1
	}			}
	define i1 @cmp_f_ule(float %a, float %b) {			define i1 @cmp_f_ule(float %a, float %b) {
	; CHECK-LABEL: cmp_f_ule:			; CHECK-LABEL: cmp_f_ule:
	; NONE: bl __aeabi_fcmple			; NONE: bl __aeabi_fcmpgt
	; NONE: bl __aeabi_fcmpun
	; HARD: vcmpe.f32			; HARD: vcmpe.f32
	; HARD: movle r0, #1			; HARD: movle r0, #1
	%1 = fcmp ule float %a, %b			%1 = fcmp ule float %a, %b
	ret i1 %1			ret i1 %1
	}			}
	define i1 @cmp_f_une(float %a, float %b) {			define i1 @cmp_f_une(float %a, float %b) {
	; CHECK-LABEL: cmp_f_une:			; CHECK-LABEL: cmp_f_une:
	; NONE: bl __aeabi_fcmpeq			; NONE: bl __aeabi_fcmpeq
	▲ Show 20 Lines • Show All 88 Lines • ▼ Show 20 Lines
	; SP: bl __aeabi_dcmpun			; SP: bl __aeabi_dcmpun
	; DP: vcmpe.f64			; DP: vcmpe.f64
	; DP: movvc r0, #1			; DP: movvc r0, #1
	%1 = fcmp ord double %a, %b			%1 = fcmp ord double %a, %b
	ret i1 %1			ret i1 %1
	}			}
	define i1 @cmp_d_ugt(double %a, double %b) {			define i1 @cmp_d_ugt(double %a, double %b) {
	; CHECK-LABEL: cmp_d_ugt:			; CHECK-LABEL: cmp_d_ugt:
	; NONE: bl __aeabi_dcmpgt			; NONE: bl __aeabi_dcmple
	; NONE: bl __aeabi_dcmpun			; SP: bl __aeabi_dcmple
	; SP: bl __aeabi_dcmpgt
	; SP: bl __aeabi_dcmpun
	; DP: vcmpe.f64			; DP: vcmpe.f64
	; DP: movhi r0, #1			; DP: movhi r0, #1
	%1 = fcmp ugt double %a, %b			%1 = fcmp ugt double %a, %b
	ret i1 %1			ret i1 %1
	}			}

	define i1 @cmp_d_ult(double %a, double %b) {			define i1 @cmp_d_ult(double %a, double %b) {
	; CHECK-LABEL: cmp_d_ult:			; CHECK-LABEL: cmp_d_ult:
	; NONE: bl __aeabi_dcmplt			; NONE: bl __aeabi_dcmpge
	; NONE: bl __aeabi_dcmpun			; SP: bl __aeabi_dcmpge
	; SP: bl __aeabi_dcmplt
	; SP: bl __aeabi_dcmpun
	; DP: vcmpe.f64			; DP: vcmpe.f64
	; DP: movlt r0, #1			; DP: movlt r0, #1
	%1 = fcmp ult double %a, %b			%1 = fcmp ult double %a, %b
	ret i1 %1			ret i1 %1
	}			}


	define i1 @cmp_d_uno(double %a, double %b) {			define i1 @cmp_d_uno(double %a, double %b) {
	Show All 22 Lines
	; DP: moveq r0, #1			; DP: moveq r0, #1
	; DP: movvs r0, #1			; DP: movvs r0, #1
	%1 = fcmp ueq double %a, %b			%1 = fcmp ueq double %a, %b
	ret i1 %1			ret i1 %1
	}			}

	define i1 @cmp_d_uge(double %a, double %b) {			define i1 @cmp_d_uge(double %a, double %b) {
	; CHECK-LABEL: cmp_d_uge:			; CHECK-LABEL: cmp_d_uge:
	; NONE: bl __aeabi_dcmpge			; NONE: bl __aeabi_dcmplt
	; NONE: bl __aeabi_dcmpun			; SP: bl __aeabi_dcmplt
	; SP: bl __aeabi_dcmpge
	; SP: bl __aeabi_dcmpun
	; DP: vcmpe.f64			; DP: vcmpe.f64
	; DP: movpl r0, #1			; DP: movpl r0, #1
	%1 = fcmp uge double %a, %b			%1 = fcmp uge double %a, %b
	ret i1 %1			ret i1 %1
	}			}

	define i1 @cmp_d_ule(double %a, double %b) {			define i1 @cmp_d_ule(double %a, double %b) {
	; CHECK-LABEL: cmp_d_ule:			; CHECK-LABEL: cmp_d_ule:
	; NONE: bl __aeabi_dcmple			; NONE: bl __aeabi_dcmpgt
	; NONE: bl __aeabi_dcmpun			; SP: bl __aeabi_dcmpgt
	; SP: bl __aeabi_dcmple
	; SP: bl __aeabi_dcmpun
	; DP: vcmpe.f64			; DP: vcmpe.f64
	; DP: movle r0, #1			; DP: movle r0, #1
	%1 = fcmp ule double %a, %b			%1 = fcmp ule double %a, %b
	ret i1 %1			ret i1 %1
	}			}

	define i1 @cmp_d_une(double %a, double %b) {			define i1 @cmp_d_une(double %a, double %b) {
	; CHECK-LABEL: cmp_d_une:			; CHECK-LABEL: cmp_d_une:
	; NONE: bl __aeabi_dcmpeq			; NONE: bl __aeabi_dcmpeq
	; SP: bl __aeabi_dcmpeq			; SP: bl __aeabi_dcmpeq
	; DP: vcmpe.f64			; DP: vcmpe.f64
	; DP: movne r0, #1			; DP: movne r0, #1
	%1 = fcmp une double %a, %b			%1 = fcmp une double %a, %b
	ret i1 %1			ret i1 %1
	}			}

test/CodeGen/Thumb2/float-intrinsics-double.ll

Show First 20 Lines • Show All 103 Lines • ▼ Show 20 Lines	; HARD: vfma.f64
ret double %1		ret double %1
}		}

; FIXME: the FPv4-SP version is less efficient than the no-FPU version		; FIXME: the FPv4-SP version is less efficient than the no-FPU version
declare double @llvm.fabs.f64(double %Val)		declare double @llvm.fabs.f64(double %Val)
define double @abs_d(double %a) {		define double @abs_d(double %a) {
; CHECK-LABEL: abs_d:		; CHECK-LABEL: abs_d:
; NONE: bic r1, r1, #-2147483648		; NONE: bic r1, r1, #-2147483648
; SP: bl __aeabi_dcmpgt
; SP: bl __aeabi_dcmpun
; SP: bl __aeabi_dsub		; SP: bl __aeabi_dsub
		; SP: bl __aeabi_dcmple
; DP: vabs.f64 d0, d0		; DP: vabs.f64 d0, d0
%1 = call double @llvm.fabs.f64(double %a)		%1 = call double @llvm.fabs.f64(double %a)
ret double %1		ret double %1
}		}

declare double @llvm.copysign.f64(double %Mag, double %Sgn)		declare double @llvm.copysign.f64(double %Mag, double %Sgn)
define double @copysign_d(double %a, double %b) {		define double @copysign_d(double %a, double %b) {
; CHECK-LABEL: copysign_d:		; CHECK-LABEL: copysign_d:
▲ Show 20 Lines • Show All 106 Lines • Show Last 20 Lines

This is an archive of the discontinued LLVM Phabricator instance.

[SDAG] Optimize unordered comparison in soft-float mode
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 28671

lib/CodeGen/SelectionDAG/TargetLowering.cpp

test/CodeGen/AArch64/arm64-fp128.ll

test/CodeGen/Mips/mips16fpe.ll

test/CodeGen/Thumb2/float-cmp.ll

test/CodeGen/Thumb2/float-intrinsics-double.ll

This is an archive of the discontinued LLVM Phabricator instance.

[SDAG] Optimize unordered comparison in soft-float mode
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 28671

lib/CodeGen/SelectionDAG/TargetLowering.cpp

test/CodeGen/AArch64/arm64-fp128.ll

test/CodeGen/Mips/mips16fpe.ll

test/CodeGen/Thumb2/float-cmp.ll

test/CodeGen/Thumb2/float-intrinsics-double.ll

[SDAG] Optimize unordered comparison in soft-float mode
ClosedPublic