Diff 140773

lib/Target/ARM/ARMISelLowering.cpp

This file is larger than 256 KB, so syntax highlighting is disabled by default.

Show First 20 Lines • Show All 1,041 Lines • ▼ Show 20 Lines	ARMTargetLowering::ARMTargetLowering(const TargetMachine &TM,
setOperationAction(ISD::INTRINSIC_WO_CHAIN, MVT::Other, Custom);		setOperationAction(ISD::INTRINSIC_WO_CHAIN, MVT::Other, Custom);
setOperationAction(ISD::EH_SJLJ_SETJMP, MVT::i32, Custom);		setOperationAction(ISD::EH_SJLJ_SETJMP, MVT::i32, Custom);
setOperationAction(ISD::EH_SJLJ_LONGJMP, MVT::Other, Custom);		setOperationAction(ISD::EH_SJLJ_LONGJMP, MVT::Other, Custom);
setOperationAction(ISD::EH_SJLJ_SETUP_DISPATCH, MVT::Other, Custom);		setOperationAction(ISD::EH_SJLJ_SETUP_DISPATCH, MVT::Other, Custom);
if (Subtarget->useSjLjEH())		if (Subtarget->useSjLjEH())
setLibcallName(RTLIB::UNWIND_RESUME, "_Unwind_SjLj_Resume");		setLibcallName(RTLIB::UNWIND_RESUME, "_Unwind_SjLj_Resume");

setOperationAction(ISD::SETCC, MVT::i32, Expand);		setOperationAction(ISD::SETCC, MVT::i32, Expand);
setOperationAction(ISD::SETCC, MVT::f16, Expand);
setOperationAction(ISD::SETCC, MVT::f32, Expand);		setOperationAction(ISD::SETCC, MVT::f32, Expand);
setOperationAction(ISD::SETCC, MVT::f64, Expand);		setOperationAction(ISD::SETCC, MVT::f64, Expand);
setOperationAction(ISD::SELECT, MVT::i32, Custom);		setOperationAction(ISD::SELECT, MVT::i32, Custom);
setOperationAction(ISD::SELECT, MVT::f32, Custom);		setOperationAction(ISD::SELECT, MVT::f32, Custom);
setOperationAction(ISD::SELECT, MVT::f64, Custom);		setOperationAction(ISD::SELECT, MVT::f64, Custom);
setOperationAction(ISD::SELECT_CC, MVT::f16, Custom);
setOperationAction(ISD::SELECT_CC, MVT::i32, Custom);		setOperationAction(ISD::SELECT_CC, MVT::i32, Custom);
setOperationAction(ISD::SELECT_CC, MVT::f32, Custom);		setOperationAction(ISD::SELECT_CC, MVT::f32, Custom);
setOperationAction(ISD::SELECT_CC, MVT::f64, Custom);		setOperationAction(ISD::SELECT_CC, MVT::f64, Custom);
		if (Subtarget->hasFullFP16()) {
		setOperationAction(ISD::SETCC, MVT::f16, Expand);
		setOperationAction(ISD::SELECT, MVT::f16, Custom);
		setOperationAction(ISD::SELECT_CC, MVT::f16, Custom);
		}

// Thumb-1 cannot currently select ARMISD::SUBE.		// Thumb-1 cannot currently select ARMISD::SUBE.
if (!Subtarget->isThumb1Only())		if (!Subtarget->isThumb1Only())
setOperationAction(ISD::SETCCE, MVT::i32, Custom);		setOperationAction(ISD::SETCCE, MVT::i32, Custom);

setOperationAction(ISD::BRCOND, MVT::Other, Custom);		setOperationAction(ISD::BRCOND, MVT::Other, Custom);
setOperationAction(ISD::BR_CC, MVT::i32, Custom);		setOperationAction(ISD::BR_CC, MVT::i32, Custom);
		if (Subtarget->hasFullFP16())
setOperationAction(ISD::BR_CC, MVT::f16, Custom);		setOperationAction(ISD::BR_CC, MVT::f16, Custom);
setOperationAction(ISD::BR_CC, MVT::f32, Custom);		setOperationAction(ISD::BR_CC, MVT::f32, Custom);
setOperationAction(ISD::BR_CC, MVT::f64, Custom);		setOperationAction(ISD::BR_CC, MVT::f64, Custom);
setOperationAction(ISD::BR_JT, MVT::Other, Custom);		setOperationAction(ISD::BR_JT, MVT::Other, Custom);

// We don't support sin/cos/fmod/copysign/pow		// We don't support sin/cos/fmod/copysign/pow
setOperationAction(ISD::FSIN, MVT::f64, Expand);		setOperationAction(ISD::FSIN, MVT::f64, Expand);
setOperationAction(ISD::FSIN, MVT::f32, Expand);		setOperationAction(ISD::FSIN, MVT::f32, Expand);
setOperationAction(ISD::FCOS, MVT::f32, Expand);		setOperationAction(ISD::FCOS, MVT::f32, Expand);
▲ Show 20 Lines • Show All 3,441 Lines • ▼ Show 20 Lines	SDValue ARMTargetLowering::LowerSELECT_CC(SDValue Op, SelectionDAG &DAG) const {

ARMCC::CondCodes CondCode, CondCode2;		ARMCC::CondCodes CondCode, CondCode2;
bool InvalidOnQNaN;		bool InvalidOnQNaN;
FPCCToARMCC(CC, CondCode, CondCode2, InvalidOnQNaN);		FPCCToARMCC(CC, CondCode, CondCode2, InvalidOnQNaN);

// Normalize the fp compare. If RHS is zero we keep it there so we match		// Normalize the fp compare. If RHS is zero we keep it there so we match
// CMPFPw0 instead of CMPFP.		// CMPFPw0 instead of CMPFP.
if (Subtarget->hasFPARMv8() && !isFloatingPointZero(RHS) &&		if (Subtarget->hasFPARMv8() && !isFloatingPointZero(RHS) &&
(TrueVal.getValueType() == MVT::f32 \|\| TrueVal.getValueType() == MVT::f64)) {		(TrueVal.getValueType() == MVT::f16 \|\|
		TrueVal.getValueType() == MVT::f32 \|\|
		TrueVal.getValueType() == MVT::f64)) {
		olista01Unsubmitted Not Done Reply Inline Actions Does this need to check Subtarget->hasFullFP16()? olista01: Does this need to check Subtarget->hasFullFP16()?
bool swpCmpOps = false;		bool swpCmpOps = false;
bool swpVselOps = false;		bool swpVselOps = false;
checkVSELConstraints(CC, CondCode, swpCmpOps, swpVselOps);		checkVSELConstraints(CC, CondCode, swpCmpOps, swpVselOps);

if (CondCode == ARMCC::GT \|\| CondCode == ARMCC::GE \|\|		if (CondCode == ARMCC::GT \|\| CondCode == ARMCC::GE \|\|
CondCode == ARMCC::VS \|\| CondCode == ARMCC::EQ) {		CondCode == ARMCC::VS \|\| CondCode == ARMCC::EQ) {
if (swpCmpOps)		if (swpCmpOps)
std::swap(LHS, RHS);		std::swap(LHS, RHS);
▲ Show 20 Lines • Show All 10,324 Lines • Show Last 20 Lines

test/CodeGen/ARM/fp16-instructions.ll

Show First 20 Lines • Show All 700 Lines • ▼ Show 20 Lines	define half @select_cc1() {
%1 = fcmp nsz oeq half undef, 0xH0001		%1 = fcmp nsz oeq half undef, 0xH0001
%2 = select i1 %1, half 0xHC000, half 0xH0002		%2 = select i1 %1, half 0xHC000, half 0xH0002
ret half %2		ret half %2

; CHECK-LABEL: select_cc1:		; CHECK-LABEL: select_cc1:
; CHECK-HARDFP-FULLFP16: vseleq.f16 s0, s{{.}}, s{{.}}		; CHECK-HARDFP-FULLFP16: vseleq.f16 s0, s{{.}}, s{{.}}
}		}

		; FIXME: more tests need to be added for VSELGE and VSELGT.
		; That is, more combinations of immediate operands that can or can't
		; be encoded as an FP16 immediate need to be added here.
		;
; 36. VSELGE		; 36. VSELGE
define half @select_cc2() {		define half @select_cc_ge1() {
%1 = fcmp nsz oge half undef, 0xH0001		%1 = fcmp nsz oge half undef, 0xH0001
%2 = select i1 %1, half 0xHC000, half 0xH0002		%2 = select i1 %1, half 0xHC000, half 0xH0002
ret half %2		ret half %2

; CHECK-LABEL: select_cc2:		; CHECK-LABEL: select_cc_ge1:
		; CHECK-HARDFP-FULLFP16: vselge.f16 s0, s{{.}}, s{{.}}
		}

		; FIXME: add fcmp ole, ult here.

		define half @select_cc_ge3() {
		%1 = fcmp nsz ugt half undef, 0xH0001
		%2 = select i1 %1, half 0xHC000, half 0xH0002
		ret half %2

		; CHECK-LABEL: select_cc_ge3:
; CHECK-HARDFP-FULLFP16: vselge.f16 s0, s{{.}}, s{{.}}		; CHECK-HARDFP-FULLFP16: vselge.f16 s0, s{{.}}, s{{.}}
}		}

; 37. VSELGT		; 37. VSELGT
define half @select_cc3() {		define half @select_cc_gt1() {
%1 = fcmp nsz ogt half undef, 0xH0001		%1 = fcmp nsz ogt half undef, 0xH0001
%2 = select i1 %1, half 0xHC000, half 0xH0002		%2 = select i1 %1, half 0xHC000, half 0xH0002
ret half %2		ret half %2

; CHECK-LABEL: select_cc3:		; CHECK-LABEL: select_cc_gt1:
		olista01Unsubmitted Not Done Reply Inline Actions What code actually gets emitted here? If it is correct but sub-optimal we should be testing it, otherwise this patch shouldn't be committed until the generated code is correct. olista01: What code actually gets emitted here? If it is correct but sub-optimal we should be testing it…
; CHECK-HARDFP-FULLFP16: vselgt.f16 s0, s{{.}}, s{{.}}		; CHECK-HARDFP-FULLFP16: vselgt.f16 s0, s{{.}}, s{{.}}
}		}

		define half @select_cc_gt2() {
		%1 = fcmp nsz uge half undef, 0xH0001
		%2 = select i1 %1, half 0xHC000, half 0xH0002
		ret half %2

		; CHECK-LABEL: select_cc_gt2:
		olista01Unsubmitted Not Done Reply Inline Actions This only checks the HARDFP-FULLFP16 case, should it also be checking the others? Also, should we check the VCMP instruction, as well as the VSEL? olista01: This only checks the HARDFP-FULLFP16 case, should it also be checking the others? Also, should…
		; CHECK-HARDFP-FULLFP16: vselgt.f16 s0, s{{.}}, s{{.}}
		}

		; FIXME: add fcmp ule, olt here.

; 38. VSELVS		; 38. VSELVS
define half @select_cc4() {		define half @select_cc4() {
%1 = fcmp nsz ueq half undef, 0xH0001		%1 = fcmp nsz ueq half undef, 0xH0001
%2 = select i1 %1, half 0xHC000, half 0xH0002		%2 = select i1 %1, half 0xHC000, half 0xH0002
ret half %2		ret half %2

; CHECK-LABEL: select_cc4:		; CHECK-LABEL: select_cc4:
; CHECK-HARDFP-FULLFP16: vselvs.f16 s0, s{{.}}, s{{.}}		; CHECK-HARDFP-FULLFP16: vselvs.f16 s0, s{{.}}, s{{.}}
}		}
		olista01Unsubmitted Not Done Reply Inline Actions Why are we generating more code for this case than the others? olista01: Why are we generating more code for this case than the others?

; 39. VSQRT - TODO		; 39. VSQRT - TODO

; 40. VSUB		; 40. VSUB
define float @Sub(float %a.coerce, float %b.coerce) {		define float @Sub(float %a.coerce, float %b.coerce) {
entry:		entry:
%0 = bitcast float %a.coerce to i32		%0 = bitcast float %a.coerce to i32
%tmp.0.extract.trunc = trunc i32 %0 to i16		%tmp.0.extract.trunc = trunc i32 %0 to i16
▲ Show 20 Lines • Show All 96 Lines • Show Last 20 Lines

This is an archive of the discontinued LLVM Phabricator instance.

[ARM] FP16 VSEL codegen follow up
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 140773

lib/Target/ARM/ARMISelLowering.cpp

test/CodeGen/ARM/fp16-instructions.ll

This is an archive of the discontinued LLVM Phabricator instance.

[ARM] FP16 VSEL codegen follow up
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 140773

lib/Target/ARM/ARMISelLowering.cpp

test/CodeGen/ARM/fp16-instructions.ll

[ARM] FP16 VSEL codegen follow up
ClosedPublic