Diff 137207

lib/CodeGen/SelectionDAG/DAGCombiner.cpp

This file is larger than 256 KB, so syntax highlighting is disabled by default.

Show First 20 Lines • Show All 16,842 Lines • ▼ Show 20 Lines	if (ConstantSDNode *SCCC = dyn_cast_or_null<ConstantSDNode>(SCC.getNode())) {
// fold select_cc false, x, y -> y		// fold select_cc false, x, y -> y
return !SCCC->isNullValue() ? N2 : N3;		return !SCCC->isNullValue() ? N2 : N3;
}		}

// Check to see if we can simplify the select into an fabs node		// Check to see if we can simplify the select into an fabs node
if (ConstantFPSDNode *CFP = dyn_cast<ConstantFPSDNode>(N1)) {		if (ConstantFPSDNode *CFP = dyn_cast<ConstantFPSDNode>(N1)) {
// Allow either -0.0 or 0.0		// Allow either -0.0 or 0.0
if (CFP->isZero()) {		if (CFP->isZero()) {
		// These patterns should produce -0.0 on one of the zero inputs. Check
		// for nsz before folding.
// select (setg[te] X, +/-0.0), X, fneg(X) -> fabs		// select (setg[te] X, +/-0.0), X, fneg(X) -> fabs
if ((CC == ISD::SETGE \|\| CC == ISD::SETGT) &&		if ((CC == ISD::SETGE \|\| CC == ISD::SETGT) && N0 == N2 &&
N0 == N2 && N3.getOpcode() == ISD::FNEG &&		N3.getOpcode() == ISD::FNEG &&
N2 == N3.getOperand(0))		N3.getNode()->getFlags().hasNoSignedZeros() && N2 == N3.getOperand(0))
return DAG.getNode(ISD::FABS, DL, VT, N0);		return DAG.getNode(ISD::FABS, DL, VT, N0);

// select (setl[te] X, +/-0.0), fneg(X), X -> fabs		// select (setl[te] X, +/-0.0), fneg(X), X -> fabs
if ((CC == ISD::SETLT \|\| CC == ISD::SETLE) &&		if ((CC == ISD::SETLT \|\| CC == ISD::SETLE) && N0 == N3 &&
N0 == N3 && N2.getOpcode() == ISD::FNEG &&		N2.getOpcode() == ISD::FNEG &&
N2.getOperand(0) == N3)		N2.getNode()->getFlags().hasNoSignedZeros() && N2.getOperand(0) == N3)
return DAG.getNode(ISD::FABS, DL, VT, N3);		return DAG.getNode(ISD::FABS, DL, VT, N3);

		// These patterns are sign-of-zero compliant, but the zero values must be
		// routed to the (0.0 - X) option, so only 2 out of 4 conditions are
		// supported.
		// select (setgt X, +/-0.0), X, (fsub 0.0, X) -> fabs
		if (CC == ISD::SETGT && N0 == N2 && N3.getOpcode() == ISD::FSUB &&
		N0 == N3.getOperand(1)) {
		if (auto CZ = dyn_cast<ConstantFPSDNode>(N3.getOperand(0))) {
		if (CZ->isZero() && !CZ->isNegative())
		return DAG.getNode(ISD::FABS, DL, VT, N0);
		}
		}

		// select (setle X, +/-0.0), (fsub 0.0, X), X -> fabs
		if (CC == ISD::SETLE && N0 == N3 && N2.getOpcode() == ISD::FSUB &&
		N0 == N2.getOperand(1)) {
		if (auto CZ = dyn_cast<ConstantFPSDNode>(N2.getOperand(0))) {
		if (CZ->isZero() && !CZ->isNegative())
		return DAG.getNode(ISD::FABS, DL, VT, N3);
		}
		}
}		}
}		}

// Turn "(a cond b) ? 1.0f : 2.0f" into "load (tmp + ((a cond b) ? 0 : 4)"		// Turn "(a cond b) ? 1.0f : 2.0f" into "load (tmp + ((a cond b) ? 0 : 4)"
// where "tmp" is a constant pool entry containing an array with 1.0 and 2.0		// where "tmp" is a constant pool entry containing an array with 1.0 and 2.0
// in it. This is a win when the constant is not otherwise available because		// in it. This is a win when the constant is not otherwise available because
// it replaces two constant pool loads with one. We only do this if the FP		// it replaces two constant pool loads with one. We only do this if the FP
// type is known to be legal, because if it isn't, then we are before legalize		// type is known to be legal, because if it isn't, then we are before legalize
▲ Show 20 Lines • Show All 63 Lines • ▼ Show 20 Lines	if (CC == ISD::SETEQ && N0->getOpcode() == ISD::AND &&
if (ConstAndRHS && ConstAndRHS->getAPIntValue().countPopulation() == 1) {		if (ConstAndRHS && ConstAndRHS->getAPIntValue().countPopulation() == 1) {
// Shift the tested bit over the sign bit.		// Shift the tested bit over the sign bit.
const APInt &AndMask = ConstAndRHS->getAPIntValue();		const APInt &AndMask = ConstAndRHS->getAPIntValue();
SDValue ShlAmt =		SDValue ShlAmt =
DAG.getConstant(AndMask.countLeadingZeros(), SDLoc(AndLHS),		DAG.getConstant(AndMask.countLeadingZeros(), SDLoc(AndLHS),
getShiftAmountTy(AndLHS.getValueType()));		getShiftAmountTy(AndLHS.getValueType()));
SDValue Shl = DAG.getNode(ISD::SHL, SDLoc(N0), VT, AndLHS, ShlAmt);		SDValue Shl = DAG.getNode(ISD::SHL, SDLoc(N0), VT, AndLHS, ShlAmt);

// Now arithmetic right shift it all the way over, so the result is either		// Now arithmetic right shift it all the way over, so the result is either
		[Inline review comment — spatel (unsubmitted, marked done)]: We're checking the flags on a node, but there is no regression test with 'nsz' FMF on the IR?
// all-ones, or zero.		// all-ones, or zero.
SDValue ShrAmt =		SDValue ShrAmt =
DAG.getConstant(AndMask.getBitWidth() - 1, SDLoc(Shl),		DAG.getConstant(AndMask.getBitWidth() - 1, SDLoc(Shl),
getShiftAmountTy(Shl.getValueType()));		getShiftAmountTy(Shl.getValueType()));
SDValue Shr = DAG.getNode(ISD::SRA, SDLoc(N0), VT, Shl, ShrAmt);		SDValue Shr = DAG.getNode(ISD::SRA, SDLoc(N0), VT, Shl, ShrAmt);

return DAG.getNode(ISD::AND, DL, VT, Shr, N3);		return DAG.getNode(ISD::AND, DL, VT, Shr, N3);
}		}
}		}

// fold select C, 16, 0 -> shl C, 4		// fold select C, 16, 0 -> shl C, 4
if (N2C && isNullConstant(N3) && N2C->getAPIntValue().isPowerOf2() &&		if (N2C && isNullConstant(N3) && N2C->getAPIntValue().isPowerOf2() &&
TLI.getBooleanContents(N0.getValueType()) ==		TLI.getBooleanContents(N0.getValueType()) ==
TargetLowering::ZeroOrOneBooleanContent) {		TargetLowering::ZeroOrOneBooleanContent) {

// If the caller doesn't want us to simplify this into a zext of a compare,		// If the caller doesn't want us to simplify this into a zext of a compare,
// don't do it.		// don't do it.
if (NotExtCompare && N2C->isOne())		if (NotExtCompare && N2C->isOne())
return SDValue();		return SDValue();
		[Inline review comment — spatel (unsubmitted, marked done)]: Use 'auto' with 'dyn_cast': http://llvm.org/docs/CodingStandards.html#use-auto-type-deduction-to-make-code-more-readable ...although what happens with vector types? Are they handled on a different path?

// Get a SetCC of the condition		// Get a SetCC of the condition
// NOTE: Don't create a SETCC if it's not legal on this target.		// NOTE: Don't create a SETCC if it's not legal on this target.
if (!LegalOperations \|\|		if (!LegalOperations \|\|
TLI.isOperationLegal(ISD::SETCC, N0.getValueType())) {		TLI.isOperationLegal(ISD::SETCC, N0.getValueType())) {
SDValue Temp, SCC;		SDValue Temp, SCC;
// cast from setcc result type to select result type		// cast from setcc result type to select result type
if (LegalTypes) {		if (LegalTypes) {
▲ Show 20 Lines • Show All 739 Lines • Show Last 20 Lines

lib/CodeGen/SelectionDAG/LegalizeVectorTypes.cpp

Show First 20 Lines • Show All 251 Lines • ▼ Show 20 Lines	SDValue DAGTypeLegalizer::ScalarizeVecRes_UnaryOp(SDNode *N) {
if (getTypeAction(OpVT) == TargetLowering::TypeScalarizeVector) {		if (getTypeAction(OpVT) == TargetLowering::TypeScalarizeVector) {
Op = GetScalarizedVector(Op);		Op = GetScalarizedVector(Op);
} else {		} else {
EVT VT = OpVT.getVectorElementType();		EVT VT = OpVT.getVectorElementType();
Op = DAG.getNode(		Op = DAG.getNode(
ISD::EXTRACT_VECTOR_ELT, DL, VT, Op,		ISD::EXTRACT_VECTOR_ELT, DL, VT, Op,
DAG.getConstant(0, DL, TLI.getVectorIdxTy(DAG.getDataLayout())));		DAG.getConstant(0, DL, TLI.getVectorIdxTy(DAG.getDataLayout())));
}		}
return DAG.getNode(N->getOpcode(), SDLoc(N), DestVT, Op);		return DAG.getNode(N->getOpcode(), SDLoc(N), DestVT, Op, N->getFlags());
}		}

SDValue DAGTypeLegalizer::ScalarizeVecRes_InregOp(SDNode *N) {		SDValue DAGTypeLegalizer::ScalarizeVecRes_InregOp(SDNode *N) {
EVT EltVT = N->getValueType(0).getVectorElementType();		EVT EltVT = N->getValueType(0).getVectorElementType();
EVT ExtVT = cast<VTSDNode>(N->getOperand(1))->getVT().getVectorElementType();		EVT ExtVT = cast<VTSDNode>(N->getOperand(1))->getVT().getVectorElementType();
SDValue LHS = GetScalarizedVector(N->getOperand(0));		SDValue LHS = GetScalarizedVector(N->getOperand(0));
return DAG.getNode(N->getOpcode(), SDLoc(N), EltVT,		return DAG.getNode(N->getOpcode(), SDLoc(N), EltVT,
LHS, DAG.getValueType(ExtVT));		LHS, DAG.getValueType(ExtVT));
▲ Show 20 Lines • Show All 1,065 Lines • ▼ Show 20 Lines	if (getTypeAction(InVT) == TargetLowering::TypeSplitVector)
GetSplitVector(N->getOperand(0), Lo, Hi);		GetSplitVector(N->getOperand(0), Lo, Hi);
else		else
std::tie(Lo, Hi) = DAG.SplitVectorOperand(N, 0);		std::tie(Lo, Hi) = DAG.SplitVectorOperand(N, 0);

if (N->getOpcode() == ISD::FP_ROUND) {		if (N->getOpcode() == ISD::FP_ROUND) {
Lo = DAG.getNode(N->getOpcode(), dl, LoVT, Lo, N->getOperand(1));		Lo = DAG.getNode(N->getOpcode(), dl, LoVT, Lo, N->getOperand(1));
Hi = DAG.getNode(N->getOpcode(), dl, HiVT, Hi, N->getOperand(1));		Hi = DAG.getNode(N->getOpcode(), dl, HiVT, Hi, N->getOperand(1));
} else {		} else {
Lo = DAG.getNode(N->getOpcode(), dl, LoVT, Lo);		Lo = DAG.getNode(N->getOpcode(), dl, LoVT, Lo, N->getFlags());
Hi = DAG.getNode(N->getOpcode(), dl, HiVT, Hi);		Hi = DAG.getNode(N->getOpcode(), dl, HiVT, Hi, N->getFlags());
}		}
}		}

void DAGTypeLegalizer::SplitVecRes_ExtendOp(SDNode *N, SDValue &Lo,		void DAGTypeLegalizer::SplitVecRes_ExtendOp(SDNode *N, SDValue &Lo,
SDValue &Hi) {		SDValue &Hi) {
SDLoc dl(N);		SDLoc dl(N);
EVT SrcVT = N->getOperand(0).getValueType();		EVT SrcVT = N->getOperand(0).getValueType();
EVT DestVT = N->getValueType(0);		EVT DestVT = N->getValueType(0);
▲ Show 20 Lines • Show All 1,312 Lines • ▼ Show 20 Lines	SDValue DAGTypeLegalizer::WidenVecRes_Shift(SDNode *N) {

return DAG.getNode(N->getOpcode(), SDLoc(N), WidenVT, InOp, ShOp);		return DAG.getNode(N->getOpcode(), SDLoc(N), WidenVT, InOp, ShOp);
}		}

SDValue DAGTypeLegalizer::WidenVecRes_Unary(SDNode *N) {		SDValue DAGTypeLegalizer::WidenVecRes_Unary(SDNode *N) {
// Unary op widening.		// Unary op widening.
EVT WidenVT = TLI.getTypeToTransformTo(*DAG.getContext(), N->getValueType(0));		EVT WidenVT = TLI.getTypeToTransformTo(*DAG.getContext(), N->getValueType(0));
SDValue InOp = GetWidenedVector(N->getOperand(0));		SDValue InOp = GetWidenedVector(N->getOperand(0));
return DAG.getNode(N->getOpcode(), SDLoc(N), WidenVT, InOp);		return DAG.getNode(N->getOpcode(), SDLoc(N), WidenVT, InOp, N->getFlags());
}		}

SDValue DAGTypeLegalizer::WidenVecRes_InregOp(SDNode *N) {		SDValue DAGTypeLegalizer::WidenVecRes_InregOp(SDNode *N) {
EVT WidenVT = TLI.getTypeToTransformTo(*DAG.getContext(), N->getValueType(0));		EVT WidenVT = TLI.getTypeToTransformTo(*DAG.getContext(), N->getValueType(0));
EVT ExtVT = EVT::getVectorVT(*DAG.getContext(),		EVT ExtVT = EVT::getVectorVT(*DAG.getContext(),
cast<VTSDNode>(N->getOperand(1))->getVT()		cast<VTSDNode>(N->getOperand(1))->getVT()
.getVectorElementType(),		.getVectorElementType(),
WidenVT.getVectorNumElements());		WidenVT.getVectorNumElements());
▲ Show 20 Lines • Show All 1,453 Lines • Show Last 20 Lines

lib/CodeGen/SelectionDAG/SelectionDAGBuilder.cpp

This file is larger than 256 KB, so syntax highlighting is disabled by default.

	Show First 20 Lines • Show All 2,556 Lines • ▼ Show 20 Lines
	}			}

	void SelectionDAGBuilder::visitFSub(const User &I) {			void SelectionDAGBuilder::visitFSub(const User &I) {
	// -0.0 - X --> fneg			// -0.0 - X --> fneg
	Type *Ty = I.getType();			Type *Ty = I.getType();
	if (isa<Constant>(I.getOperand(0)) &&			if (isa<Constant>(I.getOperand(0)) &&
	I.getOperand(0) == ConstantFP::getZeroValueForNegation(Ty)) {			I.getOperand(0) == ConstantFP::getZeroValueForNegation(Ty)) {
	SDValue Op2 = getValue(I.getOperand(1));			SDValue Op2 = getValue(I.getOperand(1));
				SDNodeFlags FMF = SDNodeFlags();
				if (cast<FPMathOperator>(&I)->hasNoSignedZeros())
				FMF.setNoSignedZeros(true);
	setValue(&I, DAG.getNode(ISD::FNEG, getCurSDLoc(),			setValue(&I, DAG.getNode(ISD::FNEG, getCurSDLoc(),
	Op2.getValueType(), Op2));			Op2.getValueType(), Op2, FMF));
	return;			return;
	}			}

	visitBinary(I, ISD::FSUB);			visitBinary(I, ISD::FSUB);
	}			}

	/// Checks if the given instruction performs a vector reduction, in which case			/// Checks if the given instruction performs a vector reduction, in which case
	/// we have the freedom to alter the elements in the result as long as the			/// we have the freedom to alter the elements in the result as long as the
	▲ Show 20 Lines • Show All 7,477 Lines • Show Last 20 Lines

test/CodeGen/X86/fabs.ll

	Show First 20 Lines • Show All 46 Lines • ▼ Show 20 Lines
	; X87-NEXT: fldz			; X87-NEXT: fldz
	; X87-NEXT: .LBB1_2:			; X87-NEXT: .LBB1_2:
	; X87-NEXT: fstp %st(0)			; X87-NEXT: fstp %st(0)
	; X87-NEXT: retl			; X87-NEXT: retl
	;			;
	; X87UNSAFE-LABEL: test2:			; X87UNSAFE-LABEL: test2:
	; X87UNSAFE: # %bb.0:			; X87UNSAFE: # %bb.0:
	; X87UNSAFE-NEXT: fldl {{[0-9]+}}(%esp)			; X87UNSAFE-NEXT: fldl {{[0-9]+}}(%esp)
	; X87UNSAFE-NEXT: fabs			; X87UNSAFE-NEXT: fldz
				; X87UNSAFE-NEXT: fchs
				; X87UNSAFE-NEXT: fucomp %st(1)
				; X87UNSAFE-NEXT: fnstsw %ax
				; X87UNSAFE-NEXT: # kill: def $ah killed $ah killed $ax
				; X87UNSAFE-NEXT: sahf
				; X87UNSAFE-NEXT: fld %st(0)
				; X87UNSAFE-NEXT: fchs
				; X87UNSAFE-NEXT: jbe .LBB1_2
				; X87UNSAFE-NEXT: # %bb.1:
				; X87UNSAFE-NEXT: fstp %st(1)
				; X87UNSAFE-NEXT: fldz
				; X87UNSAFE-NEXT: .LBB1_2:
				; X87UNSAFE-NEXT: fstp %st(0)
	; X87UNSAFE-NEXT: retl			; X87UNSAFE-NEXT: retl
	;			;
	; X64-LABEL: test2:			; X64-LABEL: test2:
	; X64: # %bb.0:			; X64: # %bb.0:
	; X64-NEXT: movsd {{.*#+}} xmm1 = mem[0],zero			; X64-NEXT: movsd {{.*#+}} xmm1 = mem[0],zero
	; X64-NEXT: movapd %xmm1, %xmm2			; X64-NEXT: movapd %xmm1, %xmm2
	; X64-NEXT: unpcklpd {{.*#+}} xmm2 = xmm2[0],xmm1[0]			; X64-NEXT: unpcklpd {{.*#+}} xmm2 = xmm2[0],xmm1[0]
	; X64-NEXT: xorpd %xmm0, %xmm2			; X64-NEXT: xorpd %xmm0, %xmm2
	Show All 27 Lines
	; X64: # %bb.0:			; X64: # %bb.0:
	; X64-NEXT: fldt {{[0-9]+}}(%rsp)			; X64-NEXT: fldt {{[0-9]+}}(%rsp)
	; X64-NEXT: fabs			; X64-NEXT: fabs
	; X64-NEXT: retq			; X64-NEXT: retq
	%Y = call x86_fp80 @fabsl(x86_fp80 %X) readnone			%Y = call x86_fp80 @fabsl(x86_fp80 %X) readnone
	ret x86_fp80 %Y			ret x86_fp80 %Y
	}			}

				define double @test4(double %X) {
				; CHECK-LABEL: test4:
				; CHECK: ## %bb.0:
				; CHECK-NEXT: fldl {{[0-9]+}}(%esp)
				; CHECK-NEXT: fldz
				; CHECK-NEXT: fxch %st(1)
				; CHECK-NEXT: fucom %st(1)
				; CHECK-NEXT: fnstsw %ax
				; CHECK-NEXT: ## kill: def %ah killed %ah killed %ax
				; CHECK-NEXT: sahf
				; CHECK-NEXT: fsubr %st(0), %st(1)
				; CHECK-NEXT: ja LBB3_2
				; CHECK-NEXT: ## %bb.1:
				; CHECK-NEXT: fstp %st(0)
				; CHECK-NEXT: fldz
				; CHECK-NEXT: fxch %st(1)
				; CHECK-NEXT: LBB3_2:
				; CHECK-NEXT: fstp %st(1)
				; CHECK-NEXT: retl
				;
				; UNSAFE-LABEL: test4:
				; UNSAFE: ## %bb.0:
				; UNSAFE-NEXT: fldl {{[0-9]+}}(%esp)
				; UNSAFE-NEXT: fabs
				; UNSAFE-NEXT: retl
				;
				; NOOPT-LABEL: test4:
				; NOOPT: ## %bb.0:
				; NOOPT-NEXT: xorps %xmm1, %xmm1
				; NOOPT-NEXT: movaps %xmm1, %xmm2
				; NOOPT-NEXT: subsd %xmm0, %xmm2
				; NOOPT-NEXT: cmpltsd %xmm0, %xmm1
				; NOOPT-NEXT: movaps %xmm1, %xmm3
				; NOOPT-NEXT: andpd %xmm0, %xmm3
				; NOOPT-NEXT: andnpd %xmm2, %xmm1
				; NOOPT-NEXT: orpd %xmm3, %xmm1
				; NOOPT-NEXT: movaps %xmm1, %xmm0
				; NOOPT-NEXT: retq
				; X87-LABEL: test4:
				; X87: # %bb.0:
				; X87-NEXT: fldl {{[0-9]+}}(%esp)
				; X87-NEXT: fldz
				; X87-NEXT: fxch %st(1)
				; X87-NEXT: fucom %st(1)
				; X87-NEXT: fnstsw %ax
				; X87-NEXT: # kill: def $ah killed $ah killed $ax
				; X87-NEXT: sahf
				; X87-NEXT: fsubr %st(0), %st(1)
				; X87-NEXT: ja .LBB3_2
				; X87-NEXT: # %bb.1:
				; X87-NEXT: fstp %st(0)
				; X87-NEXT: fldz
				; X87-NEXT: fxch %st(1)
				; X87-NEXT: .LBB3_2:
				; X87-NEXT: fstp %st(1)
				; X87-NEXT: retl
				;
				; X87UNSAFE-LABEL: test4:
				; X87UNSAFE: # %bb.0:
				; X87UNSAFE-NEXT: fldl {{[0-9]+}}(%esp)
				; X87UNSAFE-NEXT: fabs
				; X87UNSAFE-NEXT: retl
				;
				; X64-LABEL: test4:
				; X64: # %bb.0:
				; X64-NEXT: xorpd %xmm1, %xmm1
				; X64-NEXT: xorpd %xmm2, %xmm2
				; X64-NEXT: subsd %xmm0, %xmm2
				; X64-NEXT: cmpltsd %xmm0, %xmm1
				; X64-NEXT: movapd %xmm1, %xmm3
				; X64-NEXT: andnpd %xmm2, %xmm3
				; X64-NEXT: andpd %xmm0, %xmm1
				; X64-NEXT: orpd %xmm3, %xmm1
				; X64-NEXT: movapd %xmm1, %xmm0
				; X64-NEXT: retq
				%Y = fcmp ogt double %X, zeroinitializer
				%Z = fsub double zeroinitializer, %X
				%Q = select i1 %Y, double %X, double %Z
				ret double %Q
				}

				define double @test5(double %X) {
				; CHECK-LABEL: test5:
				; CHECK: ## %bb.0:
				; CHECK-NEXT: fldl {{[0-9]+}}(%esp)
				; CHECK-NEXT: fldz
				; CHECK-NEXT: fchs
				; CHECK-NEXT: fxch %st(1)
				; CHECK-NEXT: fucom %st(1)
				; CHECK-NEXT: fstp %st(1)
				; CHECK-NEXT: fnstsw %ax
				; CHECK-NEXT: ## kill: def %ah killed %ah killed %ax
				; CHECK-NEXT: sahf
				; CHECK-NEXT: fld %st(0)
				; CHECK-NEXT: fchs
				; CHECK-NEXT: jae LBB4_2
				; CHECK-NEXT: ## %bb.1:
				; CHECK-NEXT: fstp %st(1)
				; CHECK-NEXT: fldz
				; CHECK-NEXT: LBB4_2:
				; CHECK-NEXT: fstp %st(0)
				; CHECK-NEXT: retl
				;
				; UNSAFE-LABEL: test5:
				; UNSAFE: ## %bb.0:
				; UNSAFE-NEXT: fldl {{[0-9]+}}(%esp)
				; UNSAFE-NEXT: fabs
				; UNSAFE-NEXT: retl
				;
				; NOOPT-LABEL: test5:
				; NOOPT: ## %bb.0:
				; NOOPT-NEXT: movsd {{.*#+}} xmm1 = mem[0],zero
				; NOOPT-NEXT: movabsq $-9223372036854775808, %rax ## imm = 0x8000000000000000
				; NOOPT-NEXT: movq %xmm0, %rcx
				; NOOPT-NEXT: xorq %rax, %rcx
				; NOOPT-NEXT: movq %rcx, %xmm2
				; NOOPT-NEXT: cmplesd %xmm0, %xmm1
				; NOOPT-NEXT: movaps %xmm1, %xmm3
				; NOOPT-NEXT: andpd %xmm0, %xmm3
				; NOOPT-NEXT: andnpd %xmm2, %xmm1
				; NOOPT-NEXT: orpd %xmm3, %xmm1
				; NOOPT-NEXT: movaps %xmm1, %xmm0
				; NOOPT-NEXT: retq
				; X87-LABEL: test5:
				; X87: # %bb.0:
				; X87-NEXT: fldl {{[0-9]+}}(%esp)
				; X87-NEXT: fldz
				; X87-NEXT: fchs
				; X87-NEXT: fxch %st(1)
				; X87-NEXT: fucom %st(1)
				; X87-NEXT: fstp %st(1)
				; X87-NEXT: fnstsw %ax
				; X87-NEXT: # kill: def $ah killed $ah killed $ax
				; X87-NEXT: sahf
				; X87-NEXT: fld %st(0)
				; X87-NEXT: fchs
				; X87-NEXT: jae .LBB4_2
				; X87-NEXT: # %bb.1:
				; X87-NEXT: fstp %st(1)
				; X87-NEXT: fldz
				; X87-NEXT: .LBB4_2:
				; X87-NEXT: fstp %st(0)
				; X87-NEXT: retl
				;
				; X87UNSAFE-LABEL: test5:
				; X87UNSAFE: # %bb.0:
				; X87UNSAFE-NEXT: fldl {{[0-9]+}}(%esp)
				; X87UNSAFE-NEXT: fabs
				; X87UNSAFE-NEXT: retl
				;
				; X64-LABEL: test5:
				; X64: # %bb.0:
				; X64-NEXT: movsd {{.*#+}} xmm1 = mem[0],zero
				; X64-NEXT: movapd %xmm1, %xmm2
				; X64-NEXT: unpcklpd {{.*#+}} xmm2 = xmm2[0],xmm1[0]
				; X64-NEXT: xorpd %xmm0, %xmm2
				; X64-NEXT: cmplesd %xmm0, %xmm1
				; X64-NEXT: movapd %xmm1, %xmm3
				; X64-NEXT: andnpd %xmm2, %xmm3
				; X64-NEXT: andpd %xmm0, %xmm1
				; X64-NEXT: orpd %xmm3, %xmm1
				; X64-NEXT: movapd %xmm1, %xmm0
				; X64-NEXT: retq
				%Y = fcmp oge double %X, -0.0
				%Z = fsub nsz double -0.0, %X
				%Q = select i1 %Y, double %X, double %Z
				ret double %Q
				}

				define <4 x double> @test6(<4 x double> %X) {
				; X87-LABEL: test6:
				; X87: # %bb.0:
				; X87-NEXT: pushl %ebx
				; X87-NEXT: .cfi_def_cfa_offset 8
				; X87-NEXT: pushl %esi
				; X87-NEXT: .cfi_def_cfa_offset 12
				; X87-NEXT: .cfi_offset %esi, -12
				; X87-NEXT: .cfi_offset %ebx, -8
				; X87-NEXT: fldl {{[0-9]+}}(%esp)
				; X87-NEXT: fldl {{[0-9]+}}(%esp)
				; X87-NEXT: fldl {{[0-9]+}}(%esp)
				; X87-NEXT: fldl {{[0-9]+}}(%esp)
				; X87-NEXT: fldz
				; X87-NEXT: fchs
				; X87-NEXT: fxch %st(1)
				; X87-NEXT: fucom %st(1)
				; X87-NEXT: fnstsw %ax
				; X87-NEXT: movl %eax, %ecx
				; X87-NEXT: fxch %st(2)
				; X87-NEXT: fucom %st(1)
				; X87-NEXT: fnstsw %ax
				; X87-NEXT: movl %eax, %edx
				; X87-NEXT: fxch %st(3)
				; X87-NEXT: fucom %st(1)
				; X87-NEXT: fnstsw %ax
				; X87-NEXT: movl %eax, %ebx
				; X87-NEXT: fxch %st(4)
				; X87-NEXT: fucom %st(1)
				; X87-NEXT: fstp %st(1)
				; X87-NEXT: fnstsw %ax
				; X87-NEXT: # kill: def $ah killed $ah killed $ax
				; X87-NEXT: sahf
				; X87-NEXT: fld %st(0)
				; X87-NEXT: fchs
				; X87-NEXT: jae .LBB5_2
				; X87-NEXT: # %bb.1:
				; X87-NEXT: fstp %st(1)
				; X87-NEXT: fldz
				; X87-NEXT: .LBB5_2:
				; X87-NEXT: fstp %st(0)
				; X87-NEXT: movb %bh, %ah
				; X87-NEXT: sahf
				; X87-NEXT: fld %st(3)
				; X87-NEXT: fchs
				; X87-NEXT: jae .LBB5_4
				; X87-NEXT: # %bb.3:
				; X87-NEXT: fstp %st(4)
				; X87-NEXT: fldz
				; X87-NEXT: .LBB5_4:
				; X87-NEXT: fstp %st(0)
				; X87-NEXT: movl {{[0-9]+}}(%esp), %esi
				; X87-NEXT: movb %dh, %ah
				; X87-NEXT: sahf
				; X87-NEXT: fld %st(2)
				; X87-NEXT: fchs
				; X87-NEXT: jae .LBB5_6
				; X87-NEXT: # %bb.5:
				; X87-NEXT: fstp %st(3)
				; X87-NEXT: fldz
				; X87-NEXT: .LBB5_6:
				; X87-NEXT: fstp %st(0)
				; X87-NEXT: movb %ch, %ah
				; X87-NEXT: sahf
				; X87-NEXT: fld %st(1)
				; X87-NEXT: fchs
				; X87-NEXT: jae .LBB5_8
				; X87-NEXT: # %bb.7:
				; X87-NEXT: fstp %st(2)
				; X87-NEXT: fldz
				; X87-NEXT: .LBB5_8:
				; X87-NEXT: fstp %st(0)
				; X87-NEXT: fxch %st(1)
				; X87-NEXT: fstpl 24(%esi)
				; X87-NEXT: fxch %st(1)
				; X87-NEXT: fstpl 16(%esi)
				; X87-NEXT: fxch %st(1)
				; X87-NEXT: fstpl 8(%esi)
				; X87-NEXT: fstpl (%esi)
				; X87-NEXT: movl %esi, %eax
				; X87-NEXT: popl %esi
				; X87-NEXT: popl %ebx
				; X87-NEXT: retl $4
				;
				; X87UNSAFE-LABEL: test6:
				; X87UNSAFE: # %bb.0:
				; X87UNSAFE-NEXT: movl {{[0-9]+}}(%esp), %eax
				; X87UNSAFE-NEXT: fldl {{[0-9]+}}(%esp)
				; X87UNSAFE-NEXT: fldl {{[0-9]+}}(%esp)
				; X87UNSAFE-NEXT: fldl {{[0-9]+}}(%esp)
				; X87UNSAFE-NEXT: fldl {{[0-9]+}}(%esp)
				; X87UNSAFE-NEXT: fabs
				; X87UNSAFE-NEXT: fxch %st(1)
				; X87UNSAFE-NEXT: fabs
				; X87UNSAFE-NEXT: fxch %st(2)
				; X87UNSAFE-NEXT: fabs
				; X87UNSAFE-NEXT: fxch %st(3)
				; X87UNSAFE-NEXT: fabs
				; X87UNSAFE-NEXT: fstpl 24(%eax)
				; X87UNSAFE-NEXT: fxch %st(2)
				; X87UNSAFE-NEXT: fstpl 16(%eax)
				; X87UNSAFE-NEXT: fstpl 8(%eax)
				; X87UNSAFE-NEXT: fstpl (%eax)
				; X87UNSAFE-NEXT: retl $4
				;
				; X64-LABEL: test6:
				; X64: # %bb.0:
				; X64-NEXT: movapd {{.*#+}} xmm2 = [-0.000000e+00,-0.000000e+00]
				; X64-NEXT: movapd %xmm2, %xmm3
				; X64-NEXT: cmplepd %xmm1, %xmm3
				; X64-NEXT: movapd %xmm2, %xmm4
				; X64-NEXT: cmplepd %xmm0, %xmm4
				; X64-NEXT: movapd %xmm1, %xmm5
				; X64-NEXT: xorpd %xmm2, %xmm5
				; X64-NEXT: xorpd %xmm0, %xmm2
				; X64-NEXT: andpd %xmm4, %xmm0
				; X64-NEXT: andnpd %xmm2, %xmm4
				; X64-NEXT: orpd %xmm4, %xmm0
				; X64-NEXT: andpd %xmm3, %xmm1
				; X64-NEXT: andnpd %xmm5, %xmm3
				; X64-NEXT: orpd %xmm3, %xmm1
				; X64-NEXT: retq
				%Y = fcmp oge <4 x double> %X, <double -0.0, double -0.0, double -0.0, double -0.0>
				%Z = fsub nsz <4 x double> <double -0.0, double -0.0, double -0.0, double -0.0>, %X
				%Q = select <4 x i1> %Y, <4 x double> %X, <4 x double> %Z
				ret <4 x double> %Q
				}

				define <4 x double> @test7(<4 x double> %X) {
				; X87-LABEL: test7:
				; X87: # %bb.0:
				; X87-NEXT: pushl %ebx
				; X87-NEXT: .cfi_def_cfa_offset 8
				; X87-NEXT: pushl %esi
				; X87-NEXT: .cfi_def_cfa_offset 12
				; X87-NEXT: .cfi_offset %esi, -12
				; X87-NEXT: .cfi_offset %ebx, -8
				; X87-NEXT: fldl {{[0-9]+}}(%esp)
				; X87-NEXT: fldl {{[0-9]+}}(%esp)
				; X87-NEXT: fldl {{[0-9]+}}(%esp)
				; X87-NEXT: fldl {{[0-9]+}}(%esp)
				; X87-NEXT: fldz
				; X87-NEXT: fxch %st(1)
				; X87-NEXT: fucom %st(1)
				; X87-NEXT: fnstsw %ax
				; X87-NEXT: movl %eax, %ecx
				; X87-NEXT: fxch %st(2)
				; X87-NEXT: fucom %st(1)
				; X87-NEXT: fnstsw %ax
				; X87-NEXT: movl %eax, %edx
				; X87-NEXT: fxch %st(3)
				; X87-NEXT: fucom %st(1)
				; X87-NEXT: fnstsw %ax
				; X87-NEXT: movl %eax, %ebx
				; X87-NEXT: fxch %st(4)
				; X87-NEXT: fucom %st(1)
				; X87-NEXT: fstp %st(1)
				; X87-NEXT: fnstsw %ax
				; X87-NEXT: # kill: def $ah killed $ah killed $ax
				; X87-NEXT: sahf
				; X87-NEXT: fld %st(0)
				; X87-NEXT: fchs
				; X87-NEXT: jae .LBB6_2
				; X87-NEXT: # %bb.1:
				; X87-NEXT: fstp %st(1)
				; X87-NEXT: fldz
				; X87-NEXT: .LBB6_2:
				; X87-NEXT: fstp %st(0)
				; X87-NEXT: movb %bh, %ah
				; X87-NEXT: sahf
				; X87-NEXT: fld %st(3)
				; X87-NEXT: fchs
				; X87-NEXT: jae .LBB6_4
				; X87-NEXT: # %bb.3:
				; X87-NEXT: fstp %st(4)
				; X87-NEXT: fldz
				; X87-NEXT: .LBB6_4:
				; X87-NEXT: fstp %st(0)
				; X87-NEXT: movl {{[0-9]+}}(%esp), %esi
				; X87-NEXT: movb %dh, %ah
				; X87-NEXT: sahf
				; X87-NEXT: fld %st(2)
				; X87-NEXT: fchs
				; X87-NEXT: jae .LBB6_6
				; X87-NEXT: # %bb.5:
				; X87-NEXT: fstp %st(3)
				; X87-NEXT: fldz
				; X87-NEXT: .LBB6_6:
				; X87-NEXT: fstp %st(0)
				; X87-NEXT: movb %ch, %ah
				; X87-NEXT: sahf
				; X87-NEXT: fld %st(1)
				; X87-NEXT: fchs
				; X87-NEXT: jae .LBB6_8
				; X87-NEXT: # %bb.7:
				; X87-NEXT: fstp %st(2)
				; X87-NEXT: fldz
				; X87-NEXT: .LBB6_8:
				; X87-NEXT: fstp %st(0)
				; X87-NEXT: fxch %st(1)
				; X87-NEXT: fstpl 24(%esi)
				; X87-NEXT: fxch %st(1)
				; X87-NEXT: fstpl 16(%esi)
				; X87-NEXT: fxch %st(1)
				; X87-NEXT: fstpl 8(%esi)
				; X87-NEXT: fstpl (%esi)
				; X87-NEXT: movl %esi, %eax
				; X87-NEXT: popl %esi
				; X87-NEXT: popl %ebx
				; X87-NEXT: retl $4
				;
				; X87UNSAFE-LABEL: test7:
				; X87UNSAFE: # %bb.0:
				; X87UNSAFE-NEXT: movl {{[0-9]+}}(%esp), %eax
				; X87UNSAFE-NEXT: fldl {{[0-9]+}}(%esp)
				; X87UNSAFE-NEXT: fldl {{[0-9]+}}(%esp)
				; X87UNSAFE-NEXT: fldl {{[0-9]+}}(%esp)
				; X87UNSAFE-NEXT: fldl {{[0-9]+}}(%esp)
				; X87UNSAFE-NEXT: fabs
				; X87UNSAFE-NEXT: fxch %st(1)
				; X87UNSAFE-NEXT: fabs
				; X87UNSAFE-NEXT: fxch %st(2)
				; X87UNSAFE-NEXT: fabs
				; X87UNSAFE-NEXT: fxch %st(3)
				; X87UNSAFE-NEXT: fabs
				; X87UNSAFE-NEXT: fstpl 24(%eax)
				; X87UNSAFE-NEXT: fxch %st(2)
				; X87UNSAFE-NEXT: fstpl 16(%eax)
				; X87UNSAFE-NEXT: fstpl 8(%eax)
				; X87UNSAFE-NEXT: fstpl (%eax)
				; X87UNSAFE-NEXT: retl $4
				;
				; X64-LABEL: test7:
				; X64: # %bb.0:
				; X64-NEXT: xorpd %xmm2, %xmm2
				; X64-NEXT: xorpd %xmm3, %xmm3
				; X64-NEXT: cmplepd %xmm1, %xmm3
				; X64-NEXT: cmplepd %xmm0, %xmm2
				; X64-NEXT: movapd {{.*#+}} xmm4 = [-0.000000e+00,-0.000000e+00]
				; X64-NEXT: movapd %xmm1, %xmm5
				; X64-NEXT: xorpd %xmm4, %xmm5
				; X64-NEXT: xorpd %xmm0, %xmm4
				; X64-NEXT: andpd %xmm2, %xmm0
				; X64-NEXT: andnpd %xmm4, %xmm2
				; X64-NEXT: orpd %xmm2, %xmm0
				; X64-NEXT: andpd %xmm3, %xmm1
				; X64-NEXT: andnpd %xmm5, %xmm3
				; X64-NEXT: orpd %xmm3, %xmm1
				; X64-NEXT: retq
				%Y = fcmp oge <4 x double> %X, zeroinitializer
				%Z = fsub nsz <4 x double> zeroinitializer, %X
				%Q = select <4 x i1> %Y, <4 x double> %X, <4 x double> %Z
				ret <4 x double> %Q
				}

This is an archive of the discontinued LLVM Phabricator instance.

[SelectionDAG] New sign-of-zero compliant patterns for fabs folding
Abandoned · Public

Details

Diff Detail

Event Timeline

Revision Contents

Diff 137207

lib/CodeGen/SelectionDAG/DAGCombiner.cpp

lib/CodeGen/SelectionDAG/LegalizeVectorTypes.cpp

lib/CodeGen/SelectionDAG/SelectionDAGBuilder.cpp

test/CodeGen/X86/fabs.ll

This is an archive of the discontinued LLVM Phabricator instance.

[SelectionDAG] New sign-of-zero compliant patterns for fabs folding — Abandoned · Public

Details

Diff Detail

Event Timeline

Revision Contents

Diff 137207

lib/CodeGen/SelectionDAG/DAGCombiner.cpp

lib/CodeGen/SelectionDAG/LegalizeVectorTypes.cpp

lib/CodeGen/SelectionDAG/SelectionDAGBuilder.cpp

test/CodeGen/X86/fabs.ll

[SelectionDAG] New sign-of-zero compliant patterns for fabs folding
Abandoned · Public