Diff 172579

include/llvm/CodeGen/TargetLowering.h

Show First 20 Lines • Show All 1,726 Lines • ▼ Show 20 Lines	public:
/// multiplication-by-constant into simpler operations like shifts and adds.		/// multiplication-by-constant into simpler operations like shifts and adds.
/// This may be true if the target does not directly support the		/// This may be true if the target does not directly support the
/// multiplication operation for the specified type or the sequence of simpler		/// multiplication operation for the specified type or the sequence of simpler
/// ops is faster than the multiply.		/// ops is faster than the multiply.
virtual bool decomposeMulByConstant(EVT VT, SDValue C) const {		virtual bool decomposeMulByConstant(EVT VT, SDValue C) const {
return false;		return false;
}		}

		/// Return true if it is more correct/profitable to use strict FP_TO_INT
		/// conversion operations - canonicalizing the FP source value instead of
		/// converting all cases and then selecting based on value.
		/// This may be true if the target throws exceptions for out of bounds
		/// conversions or has fast FP CMOV.
		///
		/// The default implementation returns false.
		///
		/// \param FpVT   floating-point type being converted from (the visible
		///               caller, expandFP_TO_UINT, passes its source type).
		/// \param IntVT  integer type being converted to (the visible caller
		///               passes its destination type).
		/// \param IsSigned  presumably selects the signed vs. unsigned conversion;
		///               NOTE(review): confirm against callers.
		virtual bool shouldUseStrictFP_TO_INT(EVT FpVT, EVT IntVT,
		bool IsSigned) const {
		return false;
		}

//===--------------------------------------------------------------------===//		//===--------------------------------------------------------------------===//
// TargetLowering Configuration Methods - These methods should be invoked by		// TargetLowering Configuration Methods - These methods should be invoked by
// the derived class constructor to configure this object for the target.		// the derived class constructor to configure this object for the target.
//		//
protected:		protected:
/// Specify how the target extends the result of integer and floating point		/// Specify how the target extends the result of integer and floating point
/// boolean values from i1 to a wider type. See getBooleanContents.		/// boolean values from i1 to a wider type. See getBooleanContents.
void setBooleanContents(BooleanContent Ty) {		void setBooleanContents(BooleanContent Ty) {
▲ Show 20 Lines • Show All 2,074 Lines • Show Last 20 Lines

lib/CodeGen/SelectionDAG/TargetLowering.cpp

Show First 20 Lines • Show All 4,147 Lines • ▼ Show 20 Lines	bool TargetLowering::expandFP_TO_UINT(SDNode *Node, SDValue &Result,
EVT SetCCVT =		EVT SetCCVT =
getSetCCResultType(DAG.getDataLayout(), *DAG.getContext(), SrcVT);		getSetCCResultType(DAG.getDataLayout(), *DAG.getContext(), SrcVT);

// Only expand vector types if we have the appropriate vector bit operations.		// Only expand vector types if we have the appropriate vector bit operations.
if (DstVT.isVector() && (!isOperationLegalOrCustom(ISD::FP_TO_SINT, DstVT) \|\|		if (DstVT.isVector() && (!isOperationLegalOrCustom(ISD::FP_TO_SINT, DstVT) \|\|
!isOperationLegalOrCustomOrPromote(ISD::XOR, SrcVT)))		!isOperationLegalOrCustomOrPromote(ISD::XOR, SrcVT)))
return false;		return false;

// Expand based on maximum range of FP_TO_SINT:
// True = fp_to_sint(Src)
// False = 0x8000000000000000 + fp_to_sint(Src - 0x8000000000000000)
// Result = select (Src < 0x8000000000000000), True, False
APFloat apf(DAG.EVTToAPFloatSemantics(SrcVT),		APFloat apf(DAG.EVTToAPFloatSemantics(SrcVT),
APInt::getNullValue(SrcVT.getScalarSizeInBits()));		APInt::getNullValue(SrcVT.getScalarSizeInBits()));
APInt x = APInt::getSignMask(DstVT.getScalarSizeInBits());		APInt x = APInt::getSignMask(DstVT.getScalarSizeInBits());
(void)apf.convertFromAPInt(x, false, APFloat::rmNearestTiesToEven);		(void)apf.convertFromAPInt(x, false, APFloat::rmNearestTiesToEven);
		SDValue Cst = DAG.getConstantFP(apf, dl, SrcVT);
		efriedmaUnsubmitted Not Done Reply Inline Actions Do we need to check that Cst is finite? For example, 0x80000000 doesn't fit into a half-precision float. I guess it doesn't matter for x86, but it might matter in the future. efriedma: Do we need to check that Cst is finite? For example, 0x80000000 doesn't fit into a half…
		SDValue Sel = DAG.getSetCC(dl, SetCCVT, Src, Cst, ISD::SETLT);

		bool Strict = shouldUseStrictFP_TO_INT(SrcVT, DstVT, true);
		if (Strict) {
		// Expand based on maximum range of FP_TO_SINT:
		efriedma (Unsubmitted, Not Done) Reply Inline Actions > f32/f64 results should then be whole integers — I'm not sure what this means; are you saying the result of the subtraction is a whole integer? efriedma: > f32/f64 results should then be whole integers I'm not sure what this means; are you saying…
		// Sel = Src < 0x8000000000000000
		// Val = select Sel, Src, Src - 0x8000000000000000
		efriedmaUnsubmitted Not Done Reply Inline Actions Maybe worth explaining why the extra rounding step here doesn't matter. efriedma: Maybe worth explaining why the extra rounding step here doesn't matter.
		// Ofs = select Sel, 0, 0x8000000000000000
		// Result = fp_to_sint(Val) ^ Ofs

		// TODO: Should any fast-math-flags be set for the FSUB?
		SDValue Val = DAG.getSelect(dl, SrcVT, Sel, Src,
		DAG.getNode(ISD::FSUB, dl, SrcVT, Src, Cst));
		SDValue Ofs = DAG.getSelect(dl, DstVT, Sel, DAG.getConstant(0, dl, DstVT),
		DAG.getConstant(x, dl, DstVT));
		Result = DAG.getNode(ISD::XOR, dl, DstVT,
		DAG.getNode(ISD::FP_TO_SINT, dl, DstVT, Val), Ofs);
		} else {
		// Expand based on maximum range of FP_TO_SINT:
		// True = fp_to_sint(Src)
		// False = 0x8000000000000000 + fp_to_sint(Src - 0x8000000000000000)
		// Result = select (Src < 0x8000000000000000), True, False

SDValue Tmp1 = DAG.getConstantFP(apf, dl, SrcVT);
SDValue Tmp2 = DAG.getSetCC(dl, SetCCVT, Src, Tmp1, ISD::SETLT);
SDValue True = DAG.getNode(ISD::FP_TO_SINT, dl, DstVT, Src);		SDValue True = DAG.getNode(ISD::FP_TO_SINT, dl, DstVT, Src);
// TODO: Should any fast-math-flags be set for the FSUB?		// TODO: Should any fast-math-flags be set for the FSUB?
SDValue False = DAG.getNode(ISD::FP_TO_SINT, dl, DstVT,		SDValue False = DAG.getNode(ISD::FP_TO_SINT, dl, DstVT,
DAG.getNode(ISD::FSUB, dl, SrcVT, Src, Tmp1));		DAG.getNode(ISD::FSUB, dl, SrcVT, Src, Cst));
False =		False =
DAG.getNode(ISD::XOR, dl, DstVT, False, DAG.getConstant(x, dl, DstVT));		DAG.getNode(ISD::XOR, dl, DstVT, False, DAG.getConstant(x, dl, DstVT));
Result = DAG.getSelect(dl, DstVT, Tmp2, True, False);		Result = DAG.getSelect(dl, DstVT, Sel, True, False);
		}
return true;		return true;
}		}

bool TargetLowering::expandUINT_TO_FP(SDNode *Node, SDValue &Result,		bool TargetLowering::expandUINT_TO_FP(SDNode *Node, SDValue &Result,
SelectionDAG &DAG) const {		SelectionDAG &DAG) const {
SDValue Src = Node->getOperand(0);		SDValue Src = Node->getOperand(0);
EVT SrcVT = Src.getValueType();		EVT SrcVT = Src.getValueType();
EVT DstVT = Node->getValueType(0);		EVT DstVT = Node->getValueType(0);
▲ Show 20 Lines • Show All 883 Lines • Show Last 20 Lines

lib/Target/X86/X86ISelLowering.h

Show First 20 Lines • Show All 1,044 Lines • ▼ Show 20 Lines	public:
/// to just the constant itself.		/// to just the constant itself.
bool shouldConvertConstantLoadToIntImm(const APInt &Imm,		bool shouldConvertConstantLoadToIntImm(const APInt &Imm,
Type *Ty) const override;		Type *Ty) const override;

bool convertSelectOfConstantsToMath(EVT VT) const override;		bool convertSelectOfConstantsToMath(EVT VT) const override;

bool decomposeMulByConstant(EVT VT, SDValue C) const override;		bool decomposeMulByConstant(EVT VT, SDValue C) const override;

		/// Return true if the strict FP_TO_INT expansion should be used for this
		/// FP/integer type pair (X86 override of the TargetLowering hook).
		bool shouldUseStrictFP_TO_INT(EVT FpVT, EVT IntVT,
		bool IsSigned) const override;

/// Return true if EXTRACT_SUBVECTOR is cheap for this result type		/// Return true if EXTRACT_SUBVECTOR is cheap for this result type
/// with this index.		/// with this index.
bool isExtractSubvectorCheap(EVT ResVT, EVT SrcVT,		bool isExtractSubvectorCheap(EVT ResVT, EVT SrcVT,
unsigned Index) const override;		unsigned Index) const override;

bool storeOfVectorConstantIsCheap(EVT MemVT, unsigned NumElem,		bool storeOfVectorConstantIsCheap(EVT MemVT, unsigned NumElem,
unsigned AddrSpace) const override {		unsigned AddrSpace) const override {
// If we can replace more than 2 scalar stores, there will be a reduction		// If we can replace more than 2 scalar stores, there will be a reduction
▲ Show 20 Lines • Show All 521 Lines • Show Last 20 Lines

lib/Target/X86/X86ISelLowering.cpp

This file is larger than 256 KB, so syntax highlighting is disabled by default.

Show First 20 Lines • Show All 4,726 Lines • ▼ Show 20 Lines	bool X86TargetLowering::decomposeMulByConstant(EVT VT, SDValue C) const {
if (isOperationLegal(ISD::MUL, VT))		if (isOperationLegal(ISD::MUL, VT))
return false;		return false;

// shl+add, shl+sub, shl+add+neg		// shl+add, shl+sub, shl+add+neg
return (MulC + 1).isPowerOf2() \|\| (MulC - 1).isPowerOf2() \|\|		return (MulC + 1).isPowerOf2() \|\| (MulC - 1).isPowerOf2() \|\|
(1 - MulC).isPowerOf2() \|\| (-(MulC + 1)).isPowerOf2();		(1 - MulC).isPowerOf2() \|\| (-(MulC + 1)).isPowerOf2();
}		}

		/// X86 policy for the strict FP_TO_INT expansion: returns true only when
		/// IsSigned is set, the FP type is f80, and the subtarget reports CMOV
		/// support. IntVT is not consulted.
		bool X86TargetLowering::shouldUseStrictFP_TO_INT(EVT FpVT, EVT IntVT,
		bool IsSigned) const {
		// f80 FP_TO_UINT is more efficient using the strict expansion if FCMOV is
		// available.
		// NOTE(review): the only caller visible in this diff, expandFP_TO_UINT,
		// passes IsSigned = true even though it expands an unsigned conversion;
		// confirm the intended polarity of the IsSigned test here and at the
		// call site together.
		return IsSigned && FpVT == MVT::f80 && Subtarget.hasCMov();
		}

bool X86TargetLowering::isExtractSubvectorCheap(EVT ResVT, EVT SrcVT,		bool X86TargetLowering::isExtractSubvectorCheap(EVT ResVT, EVT SrcVT,
unsigned Index) const {		unsigned Index) const {
if (!isOperationLegalOrCustom(ISD::EXTRACT_SUBVECTOR, ResVT))		if (!isOperationLegalOrCustom(ISD::EXTRACT_SUBVECTOR, ResVT))
return false;		return false;

// Mask vectors support all subregister combinations and operations that		// Mask vectors support all subregister combinations and operations that
// extract half of vector.		// extract half of vector.
if (ResVT.getVectorElementType() == MVT::i1)		if (ResVT.getVectorElementType() == MVT::i1)
▲ Show 20 Lines • Show All 36,891 Lines • Show Last 20 Lines

test/CodeGen/X86/fp-cvt.ll

	Show First 20 Lines • Show All 477 Lines • ▼ Show 20 Lines
	; X86-NEXT: retl			; X86-NEXT: retl
	;			;
	; X64-X87-LABEL: fptoui_i64_fp80:			; X64-X87-LABEL: fptoui_i64_fp80:
	; X64-X87: # %bb.0:			; X64-X87: # %bb.0:
	; X64-X87-NEXT: fldt {{[0-9]+}}(%rsp)			; X64-X87-NEXT: fldt {{[0-9]+}}(%rsp)
	; X64-X87-NEXT: flds {{.*}}(%rip)			; X64-X87-NEXT: flds {{.*}}(%rip)
	; X64-X87-NEXT: fld %st(1)			; X64-X87-NEXT: fld %st(1)
	; X64-X87-NEXT: fsub %st(1)			; X64-X87-NEXT: fsub %st(1)
				; X64-X87-NEXT: xorl %eax, %eax
				; X64-X87-NEXT: fxch %st(1)
				; X64-X87-NEXT: fucompi %st(2)
				; X64-X87-NEXT: fcmovnbe %st(1), %st(0)
				; X64-X87-NEXT: fstp %st(1)
	; X64-X87-NEXT: fnstcw -{{[0-9]+}}(%rsp)			; X64-X87-NEXT: fnstcw -{{[0-9]+}}(%rsp)
	; X64-X87-NEXT: movzwl -{{[0-9]+}}(%rsp), %eax			; X64-X87-NEXT: movzwl -{{[0-9]+}}(%rsp), %ecx
	; X64-X87-NEXT: movw $3199, -{{[0-9]+}}(%rsp) # imm = 0xC7F
	; X64-X87-NEXT: fldcw -{{[0-9]+}}(%rsp)
	; X64-X87-NEXT: movw %ax, -{{[0-9]+}}(%rsp)
	; X64-X87-NEXT: fistpll -{{[0-9]+}}(%rsp)
	; X64-X87-NEXT: fldcw -{{[0-9]+}}(%rsp)
	; X64-X87-NEXT: fnstcw -{{[0-9]+}}(%rsp)
	; X64-X87-NEXT: movzwl -{{[0-9]+}}(%rsp), %eax
	; X64-X87-NEXT: movw $3199, -{{[0-9]+}}(%rsp) # imm = 0xC7F			; X64-X87-NEXT: movw $3199, -{{[0-9]+}}(%rsp) # imm = 0xC7F
	; X64-X87-NEXT: fldcw -{{[0-9]+}}(%rsp)			; X64-X87-NEXT: fldcw -{{[0-9]+}}(%rsp)
	; X64-X87-NEXT: movw %ax, -{{[0-9]+}}(%rsp)			; X64-X87-NEXT: movw %cx, -{{[0-9]+}}(%rsp)
	; X64-X87-NEXT: fld %st(1)
	; X64-X87-NEXT: fistpll -{{[0-9]+}}(%rsp)			; X64-X87-NEXT: fistpll -{{[0-9]+}}(%rsp)
	; X64-X87-NEXT: fldcw -{{[0-9]+}}(%rsp)			; X64-X87-NEXT: fldcw -{{[0-9]+}}(%rsp)
	; X64-X87-NEXT: fucompi %st(1)			; X64-X87-NEXT: setbe %al
	; X64-X87-NEXT: fstp %st(0)			; X64-X87-NEXT: shlq $63, %rax
	; X64-X87-NEXT: jbe .LBB10_1
	; X64-X87-NEXT: # %bb.2:
	; X64-X87-NEXT: movq -{{[0-9]+}}(%rsp), %rax
	; X64-X87-NEXT: retq
	; X64-X87-NEXT: .LBB10_1:
	; X64-X87-NEXT: movabsq $-9223372036854775808, %rax # imm = 0x8000000000000000
	; X64-X87-NEXT: xorq -{{[0-9]+}}(%rsp), %rax			; X64-X87-NEXT: xorq -{{[0-9]+}}(%rsp), %rax
	; X64-X87-NEXT: retq			; X64-X87-NEXT: retq
	;			;
	; X64-SSSE3-LABEL: fptoui_i64_fp80:			; X64-SSSE3-LABEL: fptoui_i64_fp80:
	; X64-SSSE3: # %bb.0:			; X64-SSSE3: # %bb.0:
	; X64-SSSE3-NEXT: fldt {{[0-9]+}}(%rsp)			; X64-SSSE3-NEXT: fldt {{[0-9]+}}(%rsp)
	; X64-SSSE3-NEXT: flds {{.*}}(%rip)			; X64-SSSE3-NEXT: flds {{.*}}(%rip)
	; X64-SSSE3-NEXT: fld %st(1)			; X64-SSSE3-NEXT: fld %st(1)
	; X64-SSSE3-NEXT: fsub %st(1)			; X64-SSSE3-NEXT: fsub %st(1)
				; X64-SSSE3-NEXT: xorl %eax, %eax
				; X64-SSSE3-NEXT: fxch %st(1)
				; X64-SSSE3-NEXT: fucompi %st(2)
				; X64-SSSE3-NEXT: fcmovnbe %st(1), %st(0)
				; X64-SSSE3-NEXT: fstp %st(1)
	; X64-SSSE3-NEXT: fisttpll -{{[0-9]+}}(%rsp)			; X64-SSSE3-NEXT: fisttpll -{{[0-9]+}}(%rsp)
	; X64-SSSE3-NEXT: fld %st(1)			; X64-SSSE3-NEXT: setbe %al
	; X64-SSSE3-NEXT: fisttpll -{{[0-9]+}}(%rsp)			; X64-SSSE3-NEXT: shlq $63, %rax
	; X64-SSSE3-NEXT: fucompi %st(1)
	; X64-SSSE3-NEXT: fstp %st(0)
	; X64-SSSE3-NEXT: jbe .LBB10_1
	; X64-SSSE3-NEXT: # %bb.2:
	; X64-SSSE3-NEXT: movq -{{[0-9]+}}(%rsp), %rax
	; X64-SSSE3-NEXT: retq
	; X64-SSSE3-NEXT: .LBB10_1:
	; X64-SSSE3-NEXT: movabsq $-9223372036854775808, %rax # imm = 0x8000000000000000
	; X64-SSSE3-NEXT: xorq -{{[0-9]+}}(%rsp), %rax			; X64-SSSE3-NEXT: xorq -{{[0-9]+}}(%rsp), %rax
	; X64-SSSE3-NEXT: retq			; X64-SSSE3-NEXT: retq
	%1 = fptoui x86_fp80 %a0 to i64			%1 = fptoui x86_fp80 %a0 to i64
	ret i64 %1			ret i64 %1
	}			}

	define i64 @fptoui_i64_fp80_ld(x86_fp80 *%a0) nounwind {			define i64 @fptoui_i64_fp80_ld(x86_fp80 *%a0) nounwind {
	; X86-LABEL: fptoui_i64_fp80_ld:			; X86-LABEL: fptoui_i64_fp80_ld:
	Show All 35 Lines
	; X86-NEXT: retl			; X86-NEXT: retl
	;			;
	; X64-X87-LABEL: fptoui_i64_fp80_ld:			; X64-X87-LABEL: fptoui_i64_fp80_ld:
	; X64-X87: # %bb.0:			; X64-X87: # %bb.0:
	; X64-X87-NEXT: fldt (%rdi)			; X64-X87-NEXT: fldt (%rdi)
	; X64-X87-NEXT: flds {{.*}}(%rip)			; X64-X87-NEXT: flds {{.*}}(%rip)
	; X64-X87-NEXT: fld %st(1)			; X64-X87-NEXT: fld %st(1)
	; X64-X87-NEXT: fsub %st(1)			; X64-X87-NEXT: fsub %st(1)
				; X64-X87-NEXT: xorl %eax, %eax
				; X64-X87-NEXT: fxch %st(1)
				; X64-X87-NEXT: fucompi %st(2)
				; X64-X87-NEXT: fcmovnbe %st(1), %st(0)
				; X64-X87-NEXT: fstp %st(1)
	; X64-X87-NEXT: fnstcw -{{[0-9]+}}(%rsp)			; X64-X87-NEXT: fnstcw -{{[0-9]+}}(%rsp)
	; X64-X87-NEXT: movzwl -{{[0-9]+}}(%rsp), %eax			; X64-X87-NEXT: movzwl -{{[0-9]+}}(%rsp), %ecx
	; X64-X87-NEXT: movw $3199, -{{[0-9]+}}(%rsp) # imm = 0xC7F
	; X64-X87-NEXT: fldcw -{{[0-9]+}}(%rsp)
	; X64-X87-NEXT: movw %ax, -{{[0-9]+}}(%rsp)
	; X64-X87-NEXT: fistpll -{{[0-9]+}}(%rsp)
	; X64-X87-NEXT: fldcw -{{[0-9]+}}(%rsp)
	; X64-X87-NEXT: fnstcw -{{[0-9]+}}(%rsp)
	; X64-X87-NEXT: movzwl -{{[0-9]+}}(%rsp), %eax
	; X64-X87-NEXT: movw $3199, -{{[0-9]+}}(%rsp) # imm = 0xC7F			; X64-X87-NEXT: movw $3199, -{{[0-9]+}}(%rsp) # imm = 0xC7F
	; X64-X87-NEXT: fldcw -{{[0-9]+}}(%rsp)			; X64-X87-NEXT: fldcw -{{[0-9]+}}(%rsp)
	; X64-X87-NEXT: movw %ax, -{{[0-9]+}}(%rsp)			; X64-X87-NEXT: movw %cx, -{{[0-9]+}}(%rsp)
	; X64-X87-NEXT: fld %st(1)
	; X64-X87-NEXT: fistpll -{{[0-9]+}}(%rsp)			; X64-X87-NEXT: fistpll -{{[0-9]+}}(%rsp)
	; X64-X87-NEXT: fldcw -{{[0-9]+}}(%rsp)			; X64-X87-NEXT: fldcw -{{[0-9]+}}(%rsp)
	; X64-X87-NEXT: fucompi %st(1)			; X64-X87-NEXT: setbe %al
	; X64-X87-NEXT: fstp %st(0)			; X64-X87-NEXT: shlq $63, %rax
	; X64-X87-NEXT: jbe .LBB11_1
	; X64-X87-NEXT: # %bb.2:
	; X64-X87-NEXT: movq -{{[0-9]+}}(%rsp), %rax
	; X64-X87-NEXT: retq
	; X64-X87-NEXT: .LBB11_1:
	; X64-X87-NEXT: movabsq $-9223372036854775808, %rax # imm = 0x8000000000000000
	; X64-X87-NEXT: xorq -{{[0-9]+}}(%rsp), %rax			; X64-X87-NEXT: xorq -{{[0-9]+}}(%rsp), %rax
	; X64-X87-NEXT: retq			; X64-X87-NEXT: retq
	;			;
	; X64-SSSE3-LABEL: fptoui_i64_fp80_ld:			; X64-SSSE3-LABEL: fptoui_i64_fp80_ld:
	; X64-SSSE3: # %bb.0:			; X64-SSSE3: # %bb.0:
	; X64-SSSE3-NEXT: fldt (%rdi)			; X64-SSSE3-NEXT: fldt (%rdi)
	; X64-SSSE3-NEXT: flds {{.*}}(%rip)			; X64-SSSE3-NEXT: flds {{.*}}(%rip)
	; X64-SSSE3-NEXT: fld %st(1)			; X64-SSSE3-NEXT: fld %st(1)
	; X64-SSSE3-NEXT: fsub %st(1)			; X64-SSSE3-NEXT: fsub %st(1)
				; X64-SSSE3-NEXT: xorl %eax, %eax
				; X64-SSSE3-NEXT: fxch %st(1)
				; X64-SSSE3-NEXT: fucompi %st(2)
				; X64-SSSE3-NEXT: fcmovnbe %st(1), %st(0)
				; X64-SSSE3-NEXT: fstp %st(1)
	; X64-SSSE3-NEXT: fisttpll -{{[0-9]+}}(%rsp)			; X64-SSSE3-NEXT: fisttpll -{{[0-9]+}}(%rsp)
	; X64-SSSE3-NEXT: fld %st(1)			; X64-SSSE3-NEXT: setbe %al
	; X64-SSSE3-NEXT: fisttpll -{{[0-9]+}}(%rsp)			; X64-SSSE3-NEXT: shlq $63, %rax
	; X64-SSSE3-NEXT: fucompi %st(1)
	; X64-SSSE3-NEXT: fstp %st(0)
	; X64-SSSE3-NEXT: jbe .LBB11_1
	; X64-SSSE3-NEXT: # %bb.2:
	; X64-SSSE3-NEXT: movq -{{[0-9]+}}(%rsp), %rax
	; X64-SSSE3-NEXT: retq
	; X64-SSSE3-NEXT: .LBB11_1:
	; X64-SSSE3-NEXT: movabsq $-9223372036854775808, %rax # imm = 0x8000000000000000
	; X64-SSSE3-NEXT: xorq -{{[0-9]+}}(%rsp), %rax			; X64-SSSE3-NEXT: xorq -{{[0-9]+}}(%rsp), %rax
	; X64-SSSE3-NEXT: retq			; X64-SSSE3-NEXT: retq
	%1 = load x86_fp80, x86_fp80 *%a0			%1 = load x86_fp80, x86_fp80 *%a0
	%2 = fptoui x86_fp80 %1 to i64			%2 = fptoui x86_fp80 %1 to i64
	ret i64 %2			ret i64 %2
	}			}

	;			;
	▲ Show 20 Lines • Show All 493 Lines • Show Last 20 Lines

test/CodeGen/X86/scalar-fp-to-i64.ll

	Show First 20 Lines • Show All 1,141 Lines • ▼ Show 20 Lines
	; SSE3_32_LIN-NEXT: shll $31, %edx			; SSE3_32_LIN-NEXT: shll $31, %edx
	; SSE3_32_LIN-NEXT: xorl {{[0-9]+}}(%esp), %edx			; SSE3_32_LIN-NEXT: xorl {{[0-9]+}}(%esp), %edx
	; SSE3_32_LIN-NEXT: movl (%esp), %eax			; SSE3_32_LIN-NEXT: movl (%esp), %eax
	; SSE3_32_LIN-NEXT: addl $12, %esp			; SSE3_32_LIN-NEXT: addl $12, %esp
	; SSE3_32_LIN-NEXT: retl			; SSE3_32_LIN-NEXT: retl
	;			;
	; SSE3_64_WIN-LABEL: x_to_u64:			; SSE3_64_WIN-LABEL: x_to_u64:
	; SSE3_64_WIN: # %bb.0:			; SSE3_64_WIN: # %bb.0:
	; SSE3_64_WIN-NEXT: subq $16, %rsp			; SSE3_64_WIN-NEXT: pushq %rax
	; SSE3_64_WIN-NEXT: fldt (%rcx)			; SSE3_64_WIN-NEXT: fldt (%rcx)
	; SSE3_64_WIN-NEXT: flds __real@{{.*}}(%rip)			; SSE3_64_WIN-NEXT: flds __real@{{.*}}(%rip)
	; SSE3_64_WIN-NEXT: fld %st(1)			; SSE3_64_WIN-NEXT: fld %st(1)
	; SSE3_64_WIN-NEXT: fsub %st(1)			; SSE3_64_WIN-NEXT: fsub %st(1)
	; SSE3_64_WIN-NEXT: fisttpll {{[0-9]+}}(%rsp)			; SSE3_64_WIN-NEXT: xorl %eax, %eax
	; SSE3_64_WIN-NEXT: fld %st(1)			; SSE3_64_WIN-NEXT: fxch %st(1)
				; SSE3_64_WIN-NEXT: fucompi %st(2)
				; SSE3_64_WIN-NEXT: fcmovnbe %st(1), %st(0)
				; SSE3_64_WIN-NEXT: fstp %st(1)
	; SSE3_64_WIN-NEXT: fisttpll (%rsp)			; SSE3_64_WIN-NEXT: fisttpll (%rsp)
	; SSE3_64_WIN-NEXT: fucompi %st(1)			; SSE3_64_WIN-NEXT: setbe %al
	; SSE3_64_WIN-NEXT: fstp %st(0)			; SSE3_64_WIN-NEXT: shlq $63, %rax
	; SSE3_64_WIN-NEXT: jbe .LBB4_1			; SSE3_64_WIN-NEXT: xorq (%rsp), %rax
	; SSE3_64_WIN-NEXT: # %bb.2:			; SSE3_64_WIN-NEXT: popq %rcx
	; SSE3_64_WIN-NEXT: movq (%rsp), %rax
	; SSE3_64_WIN-NEXT: addq $16, %rsp
	; SSE3_64_WIN-NEXT: retq
	; SSE3_64_WIN-NEXT: .LBB4_1:
	; SSE3_64_WIN-NEXT: movabsq $-9223372036854775808, %rax # imm = 0x8000000000000000
	; SSE3_64_WIN-NEXT: xorq {{[0-9]+}}(%rsp), %rax
	; SSE3_64_WIN-NEXT: addq $16, %rsp
	; SSE3_64_WIN-NEXT: retq			; SSE3_64_WIN-NEXT: retq
	;			;
	; SSE3_64_LIN-LABEL: x_to_u64:			; SSE3_64_LIN-LABEL: x_to_u64:
	; SSE3_64_LIN: # %bb.0:			; SSE3_64_LIN: # %bb.0:
	; SSE3_64_LIN-NEXT: fldt {{[0-9]+}}(%rsp)			; SSE3_64_LIN-NEXT: fldt {{[0-9]+}}(%rsp)
	; SSE3_64_LIN-NEXT: flds {{.*}}(%rip)			; SSE3_64_LIN-NEXT: flds {{.*}}(%rip)
	; SSE3_64_LIN-NEXT: fld %st(1)			; SSE3_64_LIN-NEXT: fld %st(1)
	; SSE3_64_LIN-NEXT: fsub %st(1)			; SSE3_64_LIN-NEXT: fsub %st(1)
				; SSE3_64_LIN-NEXT: xorl %eax, %eax
				; SSE3_64_LIN-NEXT: fxch %st(1)
				; SSE3_64_LIN-NEXT: fucompi %st(2)
				; SSE3_64_LIN-NEXT: fcmovnbe %st(1), %st(0)
				; SSE3_64_LIN-NEXT: fstp %st(1)
	; SSE3_64_LIN-NEXT: fisttpll -{{[0-9]+}}(%rsp)			; SSE3_64_LIN-NEXT: fisttpll -{{[0-9]+}}(%rsp)
	; SSE3_64_LIN-NEXT: fld %st(1)			; SSE3_64_LIN-NEXT: setbe %al
	; SSE3_64_LIN-NEXT: fisttpll -{{[0-9]+}}(%rsp)			; SSE3_64_LIN-NEXT: shlq $63, %rax
	; SSE3_64_LIN-NEXT: fucompi %st(1)
	; SSE3_64_LIN-NEXT: fstp %st(0)
	; SSE3_64_LIN-NEXT: jbe .LBB4_1
	; SSE3_64_LIN-NEXT: # %bb.2:
	; SSE3_64_LIN-NEXT: movq -{{[0-9]+}}(%rsp), %rax
	; SSE3_64_LIN-NEXT: retq
	; SSE3_64_LIN-NEXT: .LBB4_1:
	; SSE3_64_LIN-NEXT: movabsq $-9223372036854775808, %rax # imm = 0x8000000000000000
	; SSE3_64_LIN-NEXT: xorq -{{[0-9]+}}(%rsp), %rax			; SSE3_64_LIN-NEXT: xorq -{{[0-9]+}}(%rsp), %rax
	; SSE3_64_LIN-NEXT: retq			; SSE3_64_LIN-NEXT: retq
	;			;
	; SSE2_32_WIN-LABEL: x_to_u64:			; SSE2_32_WIN-LABEL: x_to_u64:
	; SSE2_32_WIN: # %bb.0:			; SSE2_32_WIN: # %bb.0:
	; SSE2_32_WIN-NEXT: pushl %ebp			; SSE2_32_WIN-NEXT: pushl %ebp
	; SSE2_32_WIN-NEXT: movl %esp, %ebp			; SSE2_32_WIN-NEXT: movl %esp, %ebp
	; SSE2_32_WIN-NEXT: andl $-8, %esp			; SSE2_32_WIN-NEXT: andl $-8, %esp
	▲ Show 20 Lines • Show All 45 Lines • ▼ Show 20 Lines
	; SSE2_32_LIN-NEXT: shll $31, %edx			; SSE2_32_LIN-NEXT: shll $31, %edx
	; SSE2_32_LIN-NEXT: xorl {{[0-9]+}}(%esp), %edx			; SSE2_32_LIN-NEXT: xorl {{[0-9]+}}(%esp), %edx
	; SSE2_32_LIN-NEXT: movl {{[0-9]+}}(%esp), %eax			; SSE2_32_LIN-NEXT: movl {{[0-9]+}}(%esp), %eax
	; SSE2_32_LIN-NEXT: addl $20, %esp			; SSE2_32_LIN-NEXT: addl $20, %esp
	; SSE2_32_LIN-NEXT: retl			; SSE2_32_LIN-NEXT: retl
	;			;
	; SSE2_64_WIN-LABEL: x_to_u64:			; SSE2_64_WIN-LABEL: x_to_u64:
	; SSE2_64_WIN: # %bb.0:			; SSE2_64_WIN: # %bb.0:
	; SSE2_64_WIN-NEXT: subq $24, %rsp			; SSE2_64_WIN-NEXT: subq $16, %rsp
	; SSE2_64_WIN-NEXT: fldt (%rcx)			; SSE2_64_WIN-NEXT: fldt (%rcx)
	; SSE2_64_WIN-NEXT: flds __real@{{.*}}(%rip)			; SSE2_64_WIN-NEXT: flds __real@{{.*}}(%rip)
	; SSE2_64_WIN-NEXT: fld %st(1)			; SSE2_64_WIN-NEXT: fld %st(1)
	; SSE2_64_WIN-NEXT: fsub %st(1)			; SSE2_64_WIN-NEXT: fsub %st(1)
				; SSE2_64_WIN-NEXT: xorl %eax, %eax
				; SSE2_64_WIN-NEXT: fxch %st(1)
				; SSE2_64_WIN-NEXT: fucompi %st(2)
				; SSE2_64_WIN-NEXT: fcmovnbe %st(1), %st(0)
				; SSE2_64_WIN-NEXT: fstp %st(1)
	; SSE2_64_WIN-NEXT: fnstcw {{[0-9]+}}(%rsp)			; SSE2_64_WIN-NEXT: fnstcw {{[0-9]+}}(%rsp)
	; SSE2_64_WIN-NEXT: movzwl {{[0-9]+}}(%rsp), %eax			; SSE2_64_WIN-NEXT: movzwl {{[0-9]+}}(%rsp), %ecx
	; SSE2_64_WIN-NEXT: movw $3199, {{[0-9]+}}(%rsp) # imm = 0xC7F			; SSE2_64_WIN-NEXT: movw $3199, {{[0-9]+}}(%rsp) # imm = 0xC7F
	; SSE2_64_WIN-NEXT: fldcw {{[0-9]+}}(%rsp)			; SSE2_64_WIN-NEXT: fldcw {{[0-9]+}}(%rsp)
	; SSE2_64_WIN-NEXT: movw %ax, {{[0-9]+}}(%rsp)			; SSE2_64_WIN-NEXT: movw %cx, {{[0-9]+}}(%rsp)
	; SSE2_64_WIN-NEXT: fistpll {{[0-9]+}}(%rsp)			; SSE2_64_WIN-NEXT: fistpll {{[0-9]+}}(%rsp)
	; SSE2_64_WIN-NEXT: fldcw {{[0-9]+}}(%rsp)			; SSE2_64_WIN-NEXT: fldcw {{[0-9]+}}(%rsp)
	; SSE2_64_WIN-NEXT: fnstcw {{[0-9]+}}(%rsp)			; SSE2_64_WIN-NEXT: setbe %al
	; SSE2_64_WIN-NEXT: movzwl {{[0-9]+}}(%rsp), %eax			; SSE2_64_WIN-NEXT: shlq $63, %rax
	; SSE2_64_WIN-NEXT: movw $3199, {{[0-9]+}}(%rsp) # imm = 0xC7F
	; SSE2_64_WIN-NEXT: fldcw {{[0-9]+}}(%rsp)
	; SSE2_64_WIN-NEXT: movw %ax, {{[0-9]+}}(%rsp)
	; SSE2_64_WIN-NEXT: fld %st(1)
	; SSE2_64_WIN-NEXT: fistpll {{[0-9]+}}(%rsp)
	; SSE2_64_WIN-NEXT: fldcw {{[0-9]+}}(%rsp)
	; SSE2_64_WIN-NEXT: fucompi %st(1)
	; SSE2_64_WIN-NEXT: fstp %st(0)
	; SSE2_64_WIN-NEXT: jbe .LBB4_1
	; SSE2_64_WIN-NEXT: # %bb.2:
	; SSE2_64_WIN-NEXT: movq {{[0-9]+}}(%rsp), %rax
	; SSE2_64_WIN-NEXT: addq $24, %rsp
	; SSE2_64_WIN-NEXT: retq
	; SSE2_64_WIN-NEXT: .LBB4_1:
	; SSE2_64_WIN-NEXT: movabsq $-9223372036854775808, %rax # imm = 0x8000000000000000
	; SSE2_64_WIN-NEXT: xorq {{[0-9]+}}(%rsp), %rax			; SSE2_64_WIN-NEXT: xorq {{[0-9]+}}(%rsp), %rax
	; SSE2_64_WIN-NEXT: addq $24, %rsp			; SSE2_64_WIN-NEXT: addq $16, %rsp
	; SSE2_64_WIN-NEXT: retq			; SSE2_64_WIN-NEXT: retq
	;			;
	; SSE2_64_LIN-LABEL: x_to_u64:			; SSE2_64_LIN-LABEL: x_to_u64:
	; SSE2_64_LIN: # %bb.0:			; SSE2_64_LIN: # %bb.0:
	; SSE2_64_LIN-NEXT: fldt {{[0-9]+}}(%rsp)			; SSE2_64_LIN-NEXT: fldt {{[0-9]+}}(%rsp)
	; SSE2_64_LIN-NEXT: flds {{.*}}(%rip)			; SSE2_64_LIN-NEXT: flds {{.*}}(%rip)
	; SSE2_64_LIN-NEXT: fld %st(1)			; SSE2_64_LIN-NEXT: fld %st(1)
	; SSE2_64_LIN-NEXT: fsub %st(1)			; SSE2_64_LIN-NEXT: fsub %st(1)
				; SSE2_64_LIN-NEXT: xorl %eax, %eax
				; SSE2_64_LIN-NEXT: fxch %st(1)
				; SSE2_64_LIN-NEXT: fucompi %st(2)
				; SSE2_64_LIN-NEXT: fcmovnbe %st(1), %st(0)
				; SSE2_64_LIN-NEXT: fstp %st(1)
	; SSE2_64_LIN-NEXT: fnstcw -{{[0-9]+}}(%rsp)			; SSE2_64_LIN-NEXT: fnstcw -{{[0-9]+}}(%rsp)
	; SSE2_64_LIN-NEXT: movzwl -{{[0-9]+}}(%rsp), %eax			; SSE2_64_LIN-NEXT: movzwl -{{[0-9]+}}(%rsp), %ecx
	; SSE2_64_LIN-NEXT: movw $3199, -{{[0-9]+}}(%rsp) # imm = 0xC7F			; SSE2_64_LIN-NEXT: movw $3199, -{{[0-9]+}}(%rsp) # imm = 0xC7F
	; SSE2_64_LIN-NEXT: fldcw -{{[0-9]+}}(%rsp)			; SSE2_64_LIN-NEXT: fldcw -{{[0-9]+}}(%rsp)
	; SSE2_64_LIN-NEXT: movw %ax, -{{[0-9]+}}(%rsp)			; SSE2_64_LIN-NEXT: movw %cx, -{{[0-9]+}}(%rsp)
	; SSE2_64_LIN-NEXT: fistpll -{{[0-9]+}}(%rsp)			; SSE2_64_LIN-NEXT: fistpll -{{[0-9]+}}(%rsp)
	; SSE2_64_LIN-NEXT: fldcw -{{[0-9]+}}(%rsp)			; SSE2_64_LIN-NEXT: fldcw -{{[0-9]+}}(%rsp)
	; SSE2_64_LIN-NEXT: fnstcw -{{[0-9]+}}(%rsp)			; SSE2_64_LIN-NEXT: setbe %al
	; SSE2_64_LIN-NEXT: movzwl -{{[0-9]+}}(%rsp), %eax			; SSE2_64_LIN-NEXT: shlq $63, %rax
	; SSE2_64_LIN-NEXT: movw $3199, -{{[0-9]+}}(%rsp) # imm = 0xC7F
	; SSE2_64_LIN-NEXT: fldcw -{{[0-9]+}}(%rsp)
	; SSE2_64_LIN-NEXT: movw %ax, -{{[0-9]+}}(%rsp)
	; SSE2_64_LIN-NEXT: fld %st(1)
	; SSE2_64_LIN-NEXT: fistpll -{{[0-9]+}}(%rsp)
	; SSE2_64_LIN-NEXT: fldcw -{{[0-9]+}}(%rsp)
	; SSE2_64_LIN-NEXT: fucompi %st(1)
	; SSE2_64_LIN-NEXT: fstp %st(0)
	; SSE2_64_LIN-NEXT: jbe .LBB4_1
	; SSE2_64_LIN-NEXT: # %bb.2:
	; SSE2_64_LIN-NEXT: movq -{{[0-9]+}}(%rsp), %rax
	; SSE2_64_LIN-NEXT: retq
	; SSE2_64_LIN-NEXT: .LBB4_1:
	; SSE2_64_LIN-NEXT: movabsq $-9223372036854775808, %rax # imm = 0x8000000000000000
	; SSE2_64_LIN-NEXT: xorq -{{[0-9]+}}(%rsp), %rax			; SSE2_64_LIN-NEXT: xorq -{{[0-9]+}}(%rsp), %rax
	; SSE2_64_LIN-NEXT: retq			; SSE2_64_LIN-NEXT: retq
	;			;
	; X87_WIN-LABEL: x_to_u64:			; X87_WIN-LABEL: x_to_u64:
	; X87_WIN: # %bb.0:			; X87_WIN: # %bb.0:
	; X87_WIN-NEXT: pushl %ebp			; X87_WIN-NEXT: pushl %ebp
	; X87_WIN-NEXT: movl %esp, %ebp			; X87_WIN-NEXT: movl %esp, %ebp
	; X87_WIN-NEXT: andl $-8, %esp			; X87_WIN-NEXT: andl $-8, %esp
	▲ Show 20 Lines • Show All 505 Lines • Show Last 20 Lines

This is an archive of the discontinued LLVM Phabricator instance.

[TargetLowering] expandFP_TO_UINT - avoid FPE due to out of range conversion (PR17686)
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 172579

include/llvm/CodeGen/TargetLowering.h

lib/CodeGen/SelectionDAG/TargetLowering.cpp

lib/Target/X86/X86ISelLowering.h

lib/Target/X86/X86ISelLowering.cpp

test/CodeGen/X86/fp-cvt.ll

test/CodeGen/X86/scalar-fp-to-i64.ll

This is an archive of the discontinued LLVM Phabricator instance.

[TargetLowering] expandFP_TO_UINT - avoid FPE due to out of range conversion (PR17686)
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 172579

include/llvm/CodeGen/TargetLowering.h

lib/CodeGen/SelectionDAG/TargetLowering.cpp

lib/Target/X86/X86ISelLowering.h

lib/Target/X86/X86ISelLowering.cpp

test/CodeGen/X86/fp-cvt.ll

test/CodeGen/X86/scalar-fp-to-i64.ll

[TargetLowering] expandFP_TO_UINT - avoid FPE due to out of range conversion (PR17686)
ClosedPublic