Diff 267183

llvm/include/llvm/CodeGen/ValueTypes.h

Show First 20 Lines • Show All 98 Lines • ▼ Show 20 Lines	EVT changeVectorElementTypeToInteger() const {
MVT IntTy = MVT::getIntegerVT(BitWidth);		MVT IntTy = MVT::getIntegerVT(BitWidth);
MVT VecTy = MVT::getVectorVT(IntTy, getVectorNumElements(),		MVT VecTy = MVT::getVectorVT(IntTy, getVectorNumElements(),
isScalableVector());		isScalableVector());
assert(VecTy.SimpleTy != MVT::INVALID_SIMPLE_VALUE_TYPE &&		assert(VecTy.SimpleTy != MVT::INVALID_SIMPLE_VALUE_TYPE &&
"Simple vector VT not representable by simple integer vector VT!");		"Simple vector VT not representable by simple integer vector VT!");
return VecTy;		return VecTy;
}		}

		/// Return a VT for a vector type whose attributes match ourselves
		/// with the exception of the element type that is chosen by the caller.
		///
		/// Extended vector types are handled out of line by
		/// changeExtendedVectorElementType. When this type is simple, \p EltVT
		/// must be simple too and the resulting vector must itself be a simple
		/// type; both conditions are asserted.
		EVT changeVectorElementType(EVT EltVT) const {
		  if (!isSimple())
		    return changeExtendedVectorElementType(EltVT);

		  // The simple path reads EltVT.V directly, so reject an extended
		  // element type up front rather than failing later with an unrelated
		  // "not representable" message.
		  assert(EltVT.isSimple() &&
		         "Can't change simple vector VT to have extended element VT");

		  MVT VecTy = MVT::getVectorVT(EltVT.V, getVectorElementCount());
		  assert(VecTy.SimpleTy != MVT::INVALID_SIMPLE_VALUE_TYPE &&
		         "Simple vector VT not representable by a simple vector VT with "
		         "the requested element type!");
		  return VecTy;
		}

/// Return the type converted to an equivalently sized integer or vector		/// Return the type converted to an equivalently sized integer or vector
/// with integer element type. Similar to changeVectorElementTypeToInteger,		/// with integer element type. Similar to changeVectorElementTypeToInteger,
/// but also handles scalars.		/// but also handles scalars.
EVT changeTypeToInteger() {		EVT changeTypeToInteger() {
if (isVector())		if (isVector())
return changeVectorElementTypeToInteger();		return changeVectorElementTypeToInteger();

if (isSimple())		if (isSimple())
▲ Show 20 Lines • Show All 308 Lines • ▼ Show 20 Lines	struct compareRawBits {
}		}
};		};

private:		private:
// Methods for handling the Extended-type case in functions above.		// Methods for handling the Extended-type case in functions above.
// These are all out-of-line to prevent users of this header file		// These are all out-of-line to prevent users of this header file
// from having a dependency on Type.h.		// from having a dependency on Type.h.
EVT changeExtendedTypeToInteger() const;		EVT changeExtendedTypeToInteger() const;
		EVT changeExtendedVectorElementType(EVT EltVT) const;
EVT changeExtendedVectorElementTypeToInteger() const;		EVT changeExtendedVectorElementTypeToInteger() const;
static EVT getExtendedIntegerVT(LLVMContext &C, unsigned BitWidth);		static EVT getExtendedIntegerVT(LLVMContext &C, unsigned BitWidth);
static EVT getExtendedVectorVT(LLVMContext &C, EVT VT, unsigned NumElements,		static EVT getExtendedVectorVT(LLVMContext &C, EVT VT, unsigned NumElements,
bool IsScalable);		bool IsScalable);
static EVT getExtendedVectorVT(LLVMContext &Context, EVT VT,		static EVT getExtendedVectorVT(LLVMContext &Context, EVT VT,
ElementCount EC);		ElementCount EC);
bool isExtendedFloatingPoint() const LLVM_READONLY;		bool isExtendedFloatingPoint() const LLVM_READONLY;
bool isExtendedInteger() const LLVM_READONLY;		bool isExtendedInteger() const LLVM_READONLY;
Show All 21 Lines

llvm/lib/CodeGen/SelectionDAG/LegalizeIntegerTypes.cpp

Show First 20 Lines • Show All 4,318 Lines • ▼ Show 20 Lines	SDValue DAGTypeLegalizer::PromoteIntRes_EXTRACT_SUBVECTOR(SDNode *N) {
EVT NOutVT = TLI.getTypeToTransformTo(*DAG.getContext(), OutVT);		EVT NOutVT = TLI.getTypeToTransformTo(*DAG.getContext(), OutVT);
assert(NOutVT.isVector() && "This type must be promoted to a vector type");		assert(NOutVT.isVector() && "This type must be promoted to a vector type");
unsigned OutNumElems = OutVT.getVectorNumElements();		unsigned OutNumElems = OutVT.getVectorNumElements();
EVT NOutVTElem = NOutVT.getVectorElementType();		EVT NOutVTElem = NOutVT.getVectorElementType();

SDLoc dl(N);		SDLoc dl(N);
SDValue BaseIdx = N->getOperand(1);		SDValue BaseIdx = N->getOperand(1);

		// TODO: We may be able to use this for types other than scalable
		// vectors and fix those tests that expect BUILD_VECTOR to be used
		if (OutVT.isScalableVector()) {
		SDValue InOp0 = N->getOperand(0);
		EVT InVT = InOp0.getValueType();

		// Promote operands and see if this is handled by target lowering,
		// Otherwise, use the BUILD_VECTOR approach below
		if (getTypeAction(InVT) == TargetLowering::TypePromoteInteger) {
		// Collect the (promoted) operands
		SDValue Ops[] = { GetPromotedInteger(InOp0), BaseIdx };
		efriedmaUnsubmitted Done Reply Inline Actions In general, there are four possibilities for legalization of the operand vector: 1. Legal. In this case, I guess the operation you want is essentially ANY_EXTEND_VECTOR_INREG. You're currently handling this in target-specific code; I guess that's okay for now. 2. Promote. In this case, you can promote both the operand and the result, which is what you're doing here. 3. Widen. In this case, you just widen the operand. 4. Split. In this case, you pick the correct half (or construct it with a shuffle), and extract from that. Currently, you're assuming the result of GetPromotedInteger() has an element type narrower than or equal to the element type of NOutVT. I'm not sure that's true on all targets, but I guess it's true for SVE. Better to explicitly check, I think. efriedma: In general, there are four possibilities for legalization of the operand vector: 1. Legal. In…

		EVT PromEltVT = Ops[0].getValueType().getVectorElementType();
		EVT ExtVT = NOutVT.changeVectorElementType(PromEltVT);
		SDValue Ext = DAG.getNode(ISD::EXTRACT_SUBVECTOR, SDLoc(N), ExtVT, Ops);
		return DAG.getNode(ISD::ANY_EXTEND, dl, NOutVT, Ext);
		}
		}
		efriedmaUnsubmitted Done Reply Inline Actions Please put a report_fatal_error here for scalable vectors, so we don't end up with some obscure invalid BUILD_VECTOR error. Alternatively, I guess you could call ExpandExtractFromVectorThroughStack(). efriedma: Please put a report_fatal_error here for scalable vectors, so we don't end up with some obscure…

SDValue InOp0 = N->getOperand(0);		SDValue InOp0 = N->getOperand(0);
if (getTypeAction(InOp0.getValueType()) == TargetLowering::TypePromoteInteger)		if (getTypeAction(InOp0.getValueType()) == TargetLowering::TypePromoteInteger)
InOp0 = GetPromotedInteger(N->getOperand(0));		InOp0 = GetPromotedInteger(N->getOperand(0));

EVT InVT = InOp0.getValueType();		EVT InVT = InOp0.getValueType();

SmallVector<SDValue, 8> Ops;		SmallVector<SDValue, 8> Ops;
Ops.reserve(OutNumElems);		Ops.reserve(OutNumElems);
▲ Show 20 Lines • Show All 237 Lines • Show Last 20 Lines

llvm/lib/CodeGen/ValueTypes.cpp

	Show All 20 Lines

	EVT EVT::changeExtendedVectorElementTypeToInteger() const {			EVT EVT::changeExtendedVectorElementTypeToInteger() const {
	LLVMContext &Context = LLVMTy->getContext();			LLVMContext &Context = LLVMTy->getContext();
	EVT IntTy = getIntegerVT(Context, getScalarSizeInBits());			EVT IntTy = getIntegerVT(Context, getScalarSizeInBits());
	return getVectorVT(Context, IntTy, getVectorNumElements(),			return getVectorVT(Context, IntTy, getVectorNumElements(),
	isScalableVector());			isScalableVector());
	}			}

				/// Extended-type counterpart of changeVectorElementType: build a vector
				/// of \p EltVT that keeps this type's element count, using the
				/// LLVMContext that owns the underlying IR type.
				EVT EVT::changeExtendedVectorElementType(EVT EltVT) const {
				  const ElementCount EC = getVectorElementCount();
				  return getVectorVT(LLVMTy->getContext(), EltVT, EC);
				}

	EVT EVT::getExtendedIntegerVT(LLVMContext &Context, unsigned BitWidth) {			EVT EVT::getExtendedIntegerVT(LLVMContext &Context, unsigned BitWidth) {
	EVT VT;			EVT VT;
	VT.LLVMTy = IntegerType::get(Context, BitWidth);			VT.LLVMTy = IntegerType::get(Context, BitWidth);
	assert(VT.isExtended() && "Type is not extended!");			assert(VT.isExtended() && "Type is not extended!");
	return VT;			return VT;
	}			}

	EVT EVT::getExtendedVectorVT(LLVMContext &Context, EVT VT, unsigned NumElements,			EVT EVT::getExtendedVectorVT(LLVMContext &Context, EVT VT, unsigned NumElements,
	▲ Show 20 Lines • Show All 372 Lines • Show Last 20 Lines

llvm/lib/Target/AArch64/AArch64ISelLowering.h

Show First 20 Lines • Show All 882 Lines • ▼ Show 20 Lines	bool getPreIndexedAddressParts(SDNode *N, SDValue &Base, SDValue &Offset,
ISD::MemIndexedMode &AM,		ISD::MemIndexedMode &AM,
SelectionDAG &DAG) const override;		SelectionDAG &DAG) const override;
bool getPostIndexedAddressParts(SDNode N, SDNode Op, SDValue &Base,		bool getPostIndexedAddressParts(SDNode N, SDNode Op, SDValue &Base,
SDValue &Offset, ISD::MemIndexedMode &AM,		SDValue &Offset, ISD::MemIndexedMode &AM,
SelectionDAG &DAG) const override;		SelectionDAG &DAG) const override;

void ReplaceNodeResults(SDNode *N, SmallVectorImpl<SDValue> &Results,		void ReplaceNodeResults(SDNode *N, SmallVectorImpl<SDValue> &Results,
SelectionDAG &DAG) const override;		SelectionDAG &DAG) const override;
		void ReplaceExtractSubVectorResults(SDNode *N,
		SmallVectorImpl<SDValue> &Results,
		SelectionDAG &DAG) const;

bool shouldNormalizeToSelectSequence(LLVMContext &, EVT) const override;		bool shouldNormalizeToSelectSequence(LLVMContext &, EVT) const override;

void finalizeLowering(MachineFunction &MF) const override;		void finalizeLowering(MachineFunction &MF) const override;

bool shouldLocalize(const MachineInstr &MI,		bool shouldLocalize(const MachineInstr &MI,
const TargetTransformInfo *TTI) const override;		const TargetTransformInfo *TTI) const override;
};		};
Show All 9 Lines

llvm/lib/Target/AArch64/AArch64ISelLowering.cpp

This file is larger than 256 KB, so syntax highlighting is disabled by default.

Show First 20 Lines • Show All 895 Lines • ▼ Show 20 Lines	for (MVT VT : MVT::integer_scalable_vector_valuetypes()) {
setOperationAction(ISD::UMIN, VT, Custom);		setOperationAction(ISD::UMIN, VT, Custom);
setOperationAction(ISD::SMAX, VT, Custom);		setOperationAction(ISD::SMAX, VT, Custom);
setOperationAction(ISD::UMAX, VT, Custom);		setOperationAction(ISD::UMAX, VT, Custom);
setOperationAction(ISD::SHL, VT, Custom);		setOperationAction(ISD::SHL, VT, Custom);
setOperationAction(ISD::SRL, VT, Custom);		setOperationAction(ISD::SRL, VT, Custom);
setOperationAction(ISD::SRA, VT, Custom);		setOperationAction(ISD::SRA, VT, Custom);
if (VT.getScalarType() == MVT::i1)		if (VT.getScalarType() == MVT::i1)
setOperationAction(ISD::SETCC, VT, Custom);		setOperationAction(ISD::SETCC, VT, Custom);
		} else {
		if (VT.getVectorElementType() != MVT::i1)
		setOperationAction(ISD::EXTRACT_SUBVECTOR, VT, Custom);
		efriedmaUnsubmitted Done Reply Inline Actions Can you restrict this to specifically the types you're interested in handling? It looks like you only implemented handling for the following types: nxv8i8, nxv4i16, nxv2i32. efriedma: Can you restrict this to specifically the types you're interested in handling? It looks like…
}		}
}		}
setOperationAction(ISD::INTRINSIC_WO_CHAIN, MVT::i8, Custom);		setOperationAction(ISD::INTRINSIC_WO_CHAIN, MVT::i8, Custom);
setOperationAction(ISD::INTRINSIC_WO_CHAIN, MVT::i16, Custom);		setOperationAction(ISD::INTRINSIC_WO_CHAIN, MVT::i16, Custom);

for (MVT VT : MVT::fp_scalable_vector_valuetypes()) {		for (MVT VT : MVT::fp_scalable_vector_valuetypes()) {
if (isTypeLegal(VT)) {		if (isTypeLegal(VT)) {
setOperationAction(ISD::SPLAT_VECTOR, VT, Custom);		setOperationAction(ISD::SPLAT_VECTOR, VT, Custom);
▲ Show 20 Lines • Show All 7,634 Lines • ▼ Show 20 Lines	AArch64TargetLowering::LowerEXTRACT_VECTOR_ELT(SDValue Op,

// For extractions, we just return the result directly.		// For extractions, we just return the result directly.
return DAG.getNode(ISD::EXTRACT_VECTOR_ELT, DL, ExtrTy, WideVec,		return DAG.getNode(ISD::EXTRACT_VECTOR_ELT, DL, ExtrTy, WideVec,
Op.getOperand(1));		Op.getOperand(1));
}		}

SDValue AArch64TargetLowering::LowerEXTRACT_SUBVECTOR(SDValue Op,		SDValue AArch64TargetLowering::LowerEXTRACT_SUBVECTOR(SDValue Op,
SelectionDAG &DAG) const {		SelectionDAG &DAG) const {
		// If there is anything to do it will be handled by ReplaceNodeResult.
		if (Op.getValueType().isScalableVector())
		return SDValue();
		efriedmaUnsubmitted Done Reply Inline Actions I think you can just assert the type isn't scalable? It shouldn't be possible to get here. You're only marking EXTRACT_SUBVECTOR Custom for illegal types. efriedma: I think you can just assert the type isn't scalable? It shouldn't be possible to get here.

EVT VT = Op.getOperand(0).getValueType();		EVT VT = Op.getOperand(0).getValueType();
SDLoc dl(Op);		SDLoc dl(Op);
// Just in case...		// Just in case...
if (!VT.isVector())		if (!VT.isVector())
return SDValue();		return SDValue();

ConstantSDNode *Cst = dyn_cast<ConstantSDNode>(Op.getOperand(1));		ConstantSDNode *Cst = dyn_cast<ConstantSDNode>(Op.getOperand(1));
if (!Cst)		if (!Cst)
▲ Show 20 Lines • Show All 2,085 Lines • ▼ Show 20 Lines	static bool isConstantSplatVectorMaskForType(SDNode *N, EVT MemVT) {
return false;		return false;
}		}

static SDValue performSVEAndCombine(SDNode *N,		static SDValue performSVEAndCombine(SDNode *N,
TargetLowering::DAGCombinerInfo &DCI) {		TargetLowering::DAGCombinerInfo &DCI) {
if (DCI.isBeforeLegalizeOps())		if (DCI.isBeforeLegalizeOps())
return SDValue();		return SDValue();

		SelectionDAG &DAG = DCI.DAG;
SDValue Src = N->getOperand(0);		SDValue Src = N->getOperand(0);
		unsigned Opc = Src->getOpcode();

		// Zero/any extend of an unsigned unpack
		if (Opc == AArch64ISD::UUNPKHI \|\| Opc == AArch64ISD::UUNPKLO) {
		SDValue UnpkOp = Src->getOperand(0);
		SDValue Dup = N->getOperand(1);

		if (Dup.getOpcode() != AArch64ISD::DUP)
		return SDValue();

		SDLoc DL(N);
		ConstantSDNode *C = dyn_cast<ConstantSDNode>(Dup->getOperand(0));
		uint64_t ExtVal = C->getZExtValue();
		efriedmaUnsubmitted Not Done Reply Inline Actions Do you need to truncate ExtVal somewhere, so you don't end up with a DUP with an over-wide constant? efriedma: Do you need to truncate ExtVal somewhere, so you don't end up with a DUP with an over-wide…
		kmclaughlinAuthorUnsubmitted Done Reply Inline Actions I've changed the call to `getNode` below that creates the DUP to use `DAG.getAnyExtOrTrunc` (similar to what we do in LowerSPLAT_VECTOR) kmclaughlin: I've changed the call to `getNode` below that creates the DUP to use `DAG.getAnyExtOrTrunc`…
		efriedmaUnsubmitted Not Done Reply Inline Actions I'm specifically concerned that you could end up with something like `(nxv16i8 (dup (i32 0x12345678)))`. efriedma: I'm specifically concerned that you could end up with something like `(nxv16i8 (dup (i32…
		kmclaughlinAuthorUnsubmitted Not Done Reply Inline Actions I see what you mean - I've added a truncate of `Dup->getOperand(0)` for this, which will truncate the constant to the type of `UnpkOp` kmclaughlin: I see what you mean - I've added a truncate of `Dup->getOperand(0)` for this, which will…

		// If the mask is fully covered by the unpack, we don't need to push
		// a new AND onto the operand
		EVT EltTy = UnpkOp->getValueType(0).getVectorElementType();
		if ((ExtVal == 0xFF && EltTy == MVT::i8) \|\|
		(ExtVal == 0xFFFF && EltTy == MVT::i16) \|\|
		(ExtVal == 0xFFFFFFFF && EltTy == MVT::i32))
		return Src;

		// Otherwise, make sure we propagate the AND to the operand
		// of the unpack
		efriedmaUnsubmitted Not Done Reply Inline Actions It's not legal to generate operations with type EltTy after legalization. You get away with it here because it's guaranteed to constant-fold... but probably less confusing to use APInt::trunc instead. efriedma: It's not legal to generate operations with type EltTy after legalization. You get away with it…
		Dup = DAG.getNode(AArch64ISD::DUP, DL,
		UnpkOp->getValueType(0),
		DAG.getConstant(ExtVal, DL, MVT::i32));

		SDValue And = DAG.getNode(ISD::AND, DL,
		UnpkOp->getValueType(0), UnpkOp, Dup);

		return DAG.getNode(Opc, DL, N->getValueType(0), And);
		}

SDValue Mask = N->getOperand(1);		SDValue Mask = N->getOperand(1);

if (!Src.hasOneUse())		if (!Src.hasOneUse())
return SDValue();		return SDValue();

EVT MemVT;		EVT MemVT;

// SVE load instructions perform an implicit zero-extend, which makes them		// SVE load instructions perform an implicit zero-extend, which makes them
// perfect candidates for combining.		// perfect candidates for combining.
switch (Src->getOpcode()) {		switch (Opc) {
case AArch64ISD::LD1:		case AArch64ISD::LD1:
case AArch64ISD::LDNF1:		case AArch64ISD::LDNF1:
case AArch64ISD::LDFF1:		case AArch64ISD::LDFF1:
MemVT = cast<VTSDNode>(Src->getOperand(3))->getVT();		MemVT = cast<VTSDNode>(Src->getOperand(3))->getVT();
break;		break;
case AArch64ISD::GLD1:		case AArch64ISD::GLD1:
case AArch64ISD::GLD1_SCALED:		case AArch64ISD::GLD1_SCALED:
case AArch64ISD::GLD1_SXTW:		case AArch64ISD::GLD1_SXTW:
▲ Show 20 Lines • Show All 2,564 Lines • ▼ Show 20 Lines
}		}

static SDValue		static SDValue
performSignExtendInRegCombine(SDNode *N, TargetLowering::DAGCombinerInfo &DCI,		performSignExtendInRegCombine(SDNode *N, TargetLowering::DAGCombinerInfo &DCI,
SelectionDAG &DAG) {		SelectionDAG &DAG) {
if (DCI.isBeforeLegalizeOps())		if (DCI.isBeforeLegalizeOps())
return SDValue();		return SDValue();

		SDLoc DL(N);
SDValue Src = N->getOperand(0);		SDValue Src = N->getOperand(0);
unsigned Opc = Src->getOpcode();		unsigned Opc = Src->getOpcode();

		// Sign extend of an unsigned unpack -> signed unpack
		if (Opc == AArch64ISD::UUNPKHI \|\| Opc == AArch64ISD::UUNPKLO) {
		unsigned SOpc = Opc == AArch64ISD::UUNPKHI ? AArch64ISD::SUNPKHI
		: AArch64ISD::SUNPKLO;

		// Push the sign extend to the operand of the unpack
		// This is necessary where, for example, the operand of the unpack
		// is another unpack:
		// 4i32 sign_extend_inreg (4i32 uunpklo(8i16 uunpklo (16i8 opnd)), from 4i8)
		efriedmaUnsubmitted Not Done Reply Inline Actions It seems a little fragile to assume the inner VT of the SIGN_EXTEND_INREG is exactly the type you're expecting here. Probably worth at least adding an assertion to encode the assumptions you're making. efriedma: It seems a little fragile to assume the inner VT of the SIGN_EXTEND_INREG is exactly the type…
		kmclaughlinAuthorUnsubmitted Done Reply Inline Actions I've added an assert above here to make sure the sign_extend_inreg and unpack types match, is this the assumption you were referring to? kmclaughlin: I've added an assert above here to make sure the sign_extend_inreg and unpack types match, is…
		efriedmaUnsubmitted Not Done Reply Inline Actions We assert that SIGN_EXTEND_INREG has valid operand/result types elsewhere. I was more concerned about the inner VT (`cast<VTSDNode>(N->getOperand(1))->getVT();`). You could end up creating an invalid SIGN_EXTEND_INREG if the type is something weird, like a non-byte-size integer type. efriedma: We assert that SIGN_EXTEND_INREG has valid operand/result types elsewhere. I was more…
		kmclaughlinAuthorUnsubmitted Not Done Reply Inline Actions Removed my previous check on the operand & result types and added an assert for the type of VT. kmclaughlin: Removed my previous check on the operand & result types and added an assert for the type of VT.
		// ->
		// 4i32 sunpklo (8i16 sign_extend_inreg(8i16 uunpklo (16i8 opnd), from 8i8)
		// ->
		// 4i32 sunpklo(8i16 sunpklo(16i8 opnd))
		SDValue ExtOp = Src->getOperand(0);
		auto VT = cast<VTSDNode>(N->getOperand(1))->getVT();
		EVT ExtVT = EVT::getVectorVT(*DAG.getContext(),
		VT.getVectorElementType(),
		VT.getVectorElementCount() * 2);

		SDValue Ext = DAG.getNode(ISD::SIGN_EXTEND_INREG, DL, ExtOp.getValueType(),
		ExtOp, DAG.getValueType(ExtVT));

		return DAG.getNode(SOpc, DL, N->getValueType(0), Ext);
		}

// SVE load nodes (e.g. AArch64ISD::GLD1) are straightforward candidates		// SVE load nodes (e.g. AArch64ISD::GLD1) are straightforward candidates
// for DAG Combine with SIGN_EXTEND_INREG. Bail out for all other nodes.		// for DAG Combine with SIGN_EXTEND_INREG. Bail out for all other nodes.
unsigned NewOpc;		unsigned NewOpc;
unsigned MemVTOpNum = 4;		unsigned MemVTOpNum = 4;
switch (Opc) {		switch (Opc) {
case AArch64ISD::LD1:		case AArch64ISD::LD1:
NewOpc = AArch64ISD::LD1S;		NewOpc = AArch64ISD::LD1S;
MemVTOpNum = 3;		MemVTOpNum = 3;
▲ Show 20 Lines • Show All 470 Lines • ▼ Show 20 Lines	static std::pair<SDValue, SDValue> splitInt128(SDValue N, SelectionDAG &DAG) {
SDLoc DL(N);		SDLoc DL(N);
SDValue Lo = DAG.getNode(ISD::TRUNCATE, DL, MVT::i64, N);		SDValue Lo = DAG.getNode(ISD::TRUNCATE, DL, MVT::i64, N);
SDValue Hi = DAG.getNode(ISD::TRUNCATE, DL, MVT::i64,		SDValue Hi = DAG.getNode(ISD::TRUNCATE, DL, MVT::i64,
DAG.getNode(ISD::SRL, DL, MVT::i128, N,		DAG.getNode(ISD::SRL, DL, MVT::i128, N,
DAG.getConstant(64, DL, MVT::i64)));		DAG.getConstant(64, DL, MVT::i64)));
return std::make_pair(Lo, Hi);		return std::make_pair(Lo, Hi);
}		}

		// Custom result replacement for an EXTRACT_SUBVECTOR node N.
		//
		// On success exactly one replacement value is appended to Results; every
		// early return leaves Results untouched. Two shapes are handled, both only
		// for scalable integer input vectors:
		//  * the input type is not legal and the input is a TRUNCATE of a
		//    legal-typed vector: extract from the pre-truncate vector, then
		//    truncate the extracted subvector to the result type;
		//  * the input type is legal and the extract takes exactly the low or the
		//    high half with a constant index: emit UUNPKLO/UUNPKHI and truncate
		//    the unpacked value to the result type.
		void AArch64TargetLowering::ReplaceExtractSubVectorResults(
		SDNode *N, SmallVectorImpl<SDValue> &Results, SelectionDAG &DAG) const {
		SDValue In = N->getOperand(0);
		EVT InVT = In.getValueType();

		// Common code will handle these just fine.
		if (!InVT.isScalableVector() \|\| !InVT.isInteger())
		return;

		SDLoc DL(N);
		EVT VT = N->getValueType(0);

		if (!isTypeLegal(InVT)) {
		// Bubble truncates to illegal types to the surface.
		efriedmaUnsubmitted Done Reply Inline Actions "Bubble truncates to illegal types to the surface" is an optimization? efriedma: "Bubble truncates to illegal types to the surface" is an optimization?
		kmclaughlinAuthorUnsubmitted Done Reply Inline Actions Removed - this was not required for this patch. kmclaughlin: Removed - this was not required for this patch.
		if (In->getOpcode() == ISD::TRUNCATE) {
		EVT TruncOpVT = In->getOperand(0)->getValueType(0);
		// Only rewrite when the vector feeding the truncate is itself legal.
		if (!isTypeLegal(TruncOpVT))
		return;

		// Result-shaped vector that keeps the pre-truncate element type.
		EVT EltVT = TruncOpVT.getVectorElementType();
		EVT SubVecVT = VT.changeVectorElementType(EltVT);

		// Extract at the same index from the pre-truncate vector...
		SDValue SubVec = DAG.getNode(ISD::EXTRACT_SUBVECTOR, DL, SubVecVT,
		In->getOperand(0), N->getOperand(1));

		// ...and truncate afterwards to recover the requested result type.
		Results.push_back(DAG.getNode(ISD::TRUNCATE, DL, VT, SubVec));
		return;
		}

		// Any other illegal input is left without a custom replacement.
		return;
		}

		// The following checks bail if this is not a halving operation.

		if (InVT.getVectorNumElements() != (VT.getVectorNumElements()*2))
		david-armUnsubmitted Done Reply Inline Actions I think we want to move away from calling getVectorNumElements(), so might need to change this to something like ElementCount ResEC = VT.getVectorElementCount(); if (InVT.getVectorElementCount() != (ResEC * 2)) david-arm: I think we want to move away from calling getVectorNumElements(), so might need to change this…
		return;

		// The start index must be a compile-time constant.
		auto *CIndex = dyn_cast<ConstantSDNode>(N->getOperand(1));
		if (!CIndex)
		return;

		// Accept only index 0 (low half) or index == result element count (high half).
		unsigned Index = CIndex->getZExtValue();
		if ((Index != 0) && (Index != VT.getVectorNumElements()))
		david-armUnsubmitted Done Reply Inline Actions And here you could then change this to: if ((Index != 0) && (Index != ResEC.Min))
		return;

		// Low half -> UUNPKLO, high half -> UUNPKHI. The unpack result uses the
		// type returned by widenIntegerVectorElementType for VT.
		unsigned Opcode = (Index == 0) ? AArch64ISD::UUNPKLO : AArch64ISD::UUNPKHI;
		EVT ExtendedHalfVT = VT.widenIntegerVectorElementType(*DAG.getContext());

		// Unpack the selected half of the input, then truncate back to VT.
		SDValue Half = DAG.getNode(Opcode, DL, ExtendedHalfVT, N->getOperand(0));
		Results.push_back(DAG.getNode(ISD::TRUNCATE, DL, VT, Half));
		}

// Create an even/odd pair of X registers holding integer value V.		// Create an even/odd pair of X registers holding integer value V.
static SDValue createGPRPairNode(SelectionDAG &DAG, SDValue V) {		static SDValue createGPRPairNode(SelectionDAG &DAG, SDValue V) {
SDLoc dl(V.getNode());		SDLoc dl(V.getNode());
SDValue VLo = DAG.getAnyExtOrTrunc(V, dl, MVT::i64);		SDValue VLo = DAG.getAnyExtOrTrunc(V, dl, MVT::i64);
SDValue VHi = DAG.getAnyExtOrTrunc(		SDValue VHi = DAG.getAnyExtOrTrunc(
DAG.getNode(ISD::SRL, dl, MVT::i128, V, DAG.getConstant(64, dl, MVT::i64)),		DAG.getNode(ISD::SRL, dl, MVT::i128, V, DAG.getConstant(64, dl, MVT::i64)),
dl, MVT::i64);		dl, MVT::i64);
if (DAG.getDataLayout().isBigEndian())		if (DAG.getDataLayout().isBigEndian())
▲ Show 20 Lines • Show All 136 Lines • ▼ Show 20 Lines	SDValue Result = DAG.getMemIntrinsicNode(
{LoadNode->getChain(), LoadNode->getBasePtr()}, LoadNode->getMemoryVT(),		{LoadNode->getChain(), LoadNode->getBasePtr()}, LoadNode->getMemoryVT(),
LoadNode->getMemOperand());		LoadNode->getMemOperand());

SDValue Pair = DAG.getNode(ISD::BUILD_PAIR, SDLoc(N), MVT::i128,		SDValue Pair = DAG.getNode(ISD::BUILD_PAIR, SDLoc(N), MVT::i128,
Result.getValue(0), Result.getValue(1));		Result.getValue(0), Result.getValue(1));
Results.append({Pair, Result.getValue(2) /* Chain */});		Results.append({Pair, Result.getValue(2) /* Chain */});
return;		return;
}		}
		case ISD::EXTRACT_SUBVECTOR:
		ReplaceExtractSubVectorResults(N, Results, DAG);
		return;
case ISD::INTRINSIC_WO_CHAIN: {		case ISD::INTRINSIC_WO_CHAIN: {
EVT VT = N->getValueType(0);		EVT VT = N->getValueType(0);
assert((VT == MVT::i8 \|\| VT == MVT::i16) &&		assert((VT == MVT::i8 \|\| VT == MVT::i16) &&
"custom lowering for unexpected type");		"custom lowering for unexpected type");

ConstantSDNode *CN = cast<ConstantSDNode>(N->getOperand(0));		ConstantSDNode *CN = cast<ConstantSDNode>(N->getOperand(0));
Intrinsic::ID IntID = static_cast<Intrinsic::ID>(CN->getZExtValue());		Intrinsic::ID IntID = static_cast<Intrinsic::ID>(CN->getZExtValue());
switch (IntID) {		switch (IntID) {
▲ Show 20 Lines • Show All 405 Lines • Show Last 20 Lines

llvm/test/CodeGen/AArch64/sve-ext.ll

This file was added.

				; RUN: llc -mtriple=aarch64-linux-gnu -mattr=+sve < %s \| FileCheck %s

				;
				; SEXT
				;

				; sext nxv16i8 -> nxv16i16: expected to lower to one sunpklo/sunpkhi pair
				; operating on the input register.
				define <vscale x 16 x i16> @sext_b_to_h(<vscale x 16 x i8> %src) {
				; CHECK-LABEL: sext_b_to_h:
				; CHECK-DAG: sunpklo z2.h, z0.b
				; CHECK-DAG: sunpkhi z1.h, z0.b
				; CHECK-DAG: mov z0.d, z2.d
				; CHECK-NEXT: ret
				  %wide = sext <vscale x 16 x i8> %src to <vscale x 16 x i16>
				  ret <vscale x 16 x i16> %wide
				}

				; sext nxv8i16 -> nxv8i32: expected to lower to one sunpklo/sunpkhi pair
				; operating on the input register.
				define <vscale x 8 x i32> @sext_h_to_s(<vscale x 8 x i16> %src) {
				; CHECK-LABEL: sext_h_to_s:
				; CHECK-DAG: sunpklo z2.s, z0.h
				; CHECK-DAG: sunpkhi z1.s, z0.h
				; CHECK-DAG: mov z0.d, z2.d
				; CHECK-NEXT: ret
				  %wide = sext <vscale x 8 x i16> %src to <vscale x 8 x i32>
				  ret <vscale x 8 x i32> %wide
				}

				; sext nxv4i32 -> nxv4i64: expected to lower to one sunpklo/sunpkhi pair
				; operating on the input register.
				define <vscale x 4 x i64> @sext_s_to_d(<vscale x 4 x i32> %src) {
				; CHECK-LABEL: sext_s_to_d:
				; CHECK-DAG: sunpklo z2.d, z0.s
				; CHECK-DAG: sunpkhi z1.d, z0.s
				; CHECK-DAG: mov z0.d, z2.d
				; CHECK-NEXT: ret
				  %wide = sext <vscale x 4 x i32> %src to <vscale x 4 x i64>
				  ret <vscale x 4 x i64> %wide
				}

				; sext nxv16i8 -> nxv16i32: two levels of signed unpacks (.b -> .h -> .s)
				; are expected, with no separate sxt* instruction left behind.
				define <vscale x 16 x i32> @sext_b_to_s(<vscale x 16 x i8> %src) {
				; CHECK-LABEL: sext_b_to_s:
				; CHECK-DAG: sunpklo [[LO:z[0-9]+]].h, z0.b
				; CHECK-DAG: sunpkhi [[HI:z[0-9]+]].h, z0.b
				; CHECK-DAG: sunpklo [[LOLO:z[0-9]+]].s, [[LO]].h
				; CHECK-DAG: sunpkhi {{z[0-9]+}}.s, [[LO]].h
				; CHECK-DAG: sunpklo {{z[0-9]+}}.s, [[HI]].h
				; CHECK-DAG: sunpkhi {{z[0-9]+}}.s, [[HI]].h
				; CHECK-NOT: sxt
				; CHECK: ret
				  %wide = sext <vscale x 16 x i8> %src to <vscale x 16 x i32>
				  ret <vscale x 16 x i32> %wide
				}

				; sext nxv16i8 -> nxv16i64: three levels of signed unpacks
				; (.b -> .h -> .s -> .d) are expected, with no separate sxt* instruction.
				; The label directive below anchors these checks to this function so they
				; cannot match output belonging to a neighbouring test.
				define <vscale x 16 x i64> @sext_b_to_d(<vscale x 16 x i8> %a) {
				; CHECK-LABEL: sext_b_to_d:
				; CHECK-DAG: sunpklo [[LO1:z[0-9]+]].h, z0.b
				; CHECK-DAG: sunpkhi [[HI1:z[0-9]+]].h, z0.b
				; CHECK-DAG: sunpklo [[LO2:z[0-9]+]].s, z1.h
				; CHECK-DAG: sunpkhi [[HI2:z[0-9]+]].s, z1.h
				; CHECK-DAG: sunpklo [[LO3:z[0-9]+]].s, z0.h
				; CHECK-DAG: sunpkhi [[HI3:z[0-9]+]].s, z0.h
				; CHECK-DAG: sunpklo z0.d, [[LO2]].s
				; CHECK-DAG: sunpkhi z1.d, [[LO2]].s
				; CHECK-DAG: sunpklo z2.d, [[HI2]].s
				; CHECK-DAG: sunpkhi z3.d, [[HI2]].s
				; CHECK-DAG: sunpklo z4.d, [[LO3]].s
				; CHECK-DAG: sunpkhi z5.d, [[LO3]].s
				; CHECK-DAG: sunpklo z6.d, [[HI3]].s
				; CHECK-DAG: sunpkhi z7.d, [[HI3]].s
				; CHECK-NOT: sxt
				; CHECK-NEXT: ret
				  %ext = sext <vscale x 16 x i8> %a to <vscale x 16 x i64>
				  ret <vscale x 16 x i64> %ext
				}

				; sext nxv4i8 -> nxv4i16: the checks expect a predicated sxtb on .s lanes
				; (presumably because both types are promoted to nxv4i32 - confirm).
				; The label names the full function; the bare prefix "@sext_promote" would
				; also match sext_promote_h_to_d.
				define <vscale x 4 x i16> @sext_promote_b_to_s(<vscale x 4 x i8> %in) {
				; CHECK-LABEL: sext_promote_b_to_s:
				; CHECK-DAG: ptrue p0.s
				; CHECK-DAG: sxtb z0.s, p0/m, z0.s
				; CHECK-NEXT: ret
				  %out = sext <vscale x 4 x i8> %in to <vscale x 4 x i16>
				  ret <vscale x 4 x i16> %out
				}

				; sext nxv2i16 -> nxv2i32: the checks expect a predicated sxth on .d lanes
				; (presumably because both types are promoted to nxv2i64 - confirm).
				; The label uses the "name:" form shared by the other tests in this file.
				define <vscale x 2 x i32> @sext_promote_h_to_d(<vscale x 2 x i16> %in) {
				; CHECK-LABEL: sext_promote_h_to_d:
				; CHECK-DAG: ptrue p0.d
				; CHECK-DAG: sxth z0.d, p0/m, z0.d
				; CHECK-NEXT: ret
				  %out = sext <vscale x 2 x i16> %in to <vscale x 2 x i32>
				  ret <vscale x 2 x i32> %out
				}

				; ZEXT

				; zext nxv16i8 -> nxv16i16: expected to lower to one uunpklo/uunpkhi pair
				; operating on the input register.
				define <vscale x 16 x i16> @zext_b_to_h(<vscale x 16 x i8> %src) {
				; CHECK-LABEL: zext_b_to_h:
				; CHECK-DAG: uunpklo z2.h, z0.b
				; CHECK-DAG: uunpkhi z1.h, z0.b
				; CHECK-DAG: mov z0.d, z2.d
				; CHECK-NEXT: ret
				  %wide = zext <vscale x 16 x i8> %src to <vscale x 16 x i16>
				  ret <vscale x 16 x i16> %wide
				}

				; zext nxv8i16 -> nxv8i32: expected to lower to one uunpklo/uunpkhi pair
				; operating on the input register.
				define <vscale x 8 x i32> @zext_h_to_s(<vscale x 8 x i16> %src) {
				; CHECK-LABEL: zext_h_to_s:
				; CHECK-DAG: uunpklo z2.s, z0.h
				; CHECK-DAG: uunpkhi z1.s, z0.h
				; CHECK-DAG: mov z0.d, z2.d
				; CHECK-NEXT: ret
				  %wide = zext <vscale x 8 x i16> %src to <vscale x 8 x i32>
				  ret <vscale x 8 x i32> %wide
				}

				; zext nxv4i32 -> nxv4i64: expected to lower to one uunpklo/uunpkhi pair
				; operating on the input register.
				define <vscale x 4 x i64> @zext_s_to_d(<vscale x 4 x i32> %src) {
				; CHECK-LABEL: zext_s_to_d:
				; CHECK-DAG: uunpklo z2.d, z0.s
				; CHECK-DAG: uunpkhi z1.d, z0.s
				; CHECK-DAG: mov z0.d, z2.d
				; CHECK-NEXT: ret
				  %wide = zext <vscale x 4 x i32> %src to <vscale x 4 x i64>
				  ret <vscale x 4 x i64> %wide
				}

				; zext nxv16i8 -> nxv16i32: two levels of unsigned unpacks (.b -> .h -> .s)
				; are expected, with no masking "and" left behind.
				define <vscale x 16 x i32> @zext_b_to_s(<vscale x 16 x i8> %src) {
				; CHECK-LABEL: zext_b_to_s:
				; CHECK-DAG: uunpklo [[LO:z[0-9]+]].h, z0.b
				; CHECK-DAG: uunpkhi [[HI:z[0-9]+]].h, z0.b
				; CHECK-DAG: uunpklo z0.s, [[LO]].h
				; CHECK-DAG: uunpkhi z1.s, [[LO]].h
				; CHECK-DAG: uunpklo z2.s, [[HI]].h
				; CHECK-DAG: uunpkhi z3.s, [[HI]].h
				; CHECK-NOT: and
				; CHECK: ret
				  %wide = zext <vscale x 16 x i8> %src to <vscale x 16 x i32>
				  ret <vscale x 16 x i32> %wide
				}

				; zext nxv16i8 -> nxv16i64: three levels of unsigned unpacks
				; (.b -> .h -> .s -> .d) are expected, with no masking "and" left behind.
				; The label directive below anchors these checks to this function so they
				; cannot match output belonging to a neighbouring test.
				define <vscale x 16 x i64> @zext_b_to_d(<vscale x 16 x i8> %a) {
				; CHECK-LABEL: zext_b_to_d:
				; CHECK-DAG: uunpklo [[LO1:z[0-9]+]].h, z0.b
				; CHECK-DAG: uunpkhi [[HI1:z[0-9]+]].h, z0.b
				; CHECK-DAG: uunpklo [[LO2:z[0-9]+]].s, z1.h
				; CHECK-DAG: uunpkhi [[HI2:z[0-9]+]].s, z1.h
				; CHECK-DAG: uunpklo [[LO3:z[0-9]+]].s, z0.h
				; CHECK-DAG: uunpkhi [[HI3:z[0-9]+]].s, z0.h
				; CHECK-DAG: uunpklo z0.d, [[LO2]].s
				; CHECK-DAG: uunpkhi z1.d, [[LO2]].s
				; CHECK-DAG: uunpklo z2.d, [[HI2]].s
				; CHECK-DAG: uunpkhi z3.d, [[HI2]].s
				; CHECK-DAG: uunpklo z4.d, [[LO3]].s
				; CHECK-DAG: uunpkhi z5.d, [[LO3]].s
				; CHECK-DAG: uunpklo z6.d, [[HI3]].s
				; CHECK-DAG: uunpkhi z7.d, [[HI3]].s
				; CHECK-NOT: and
				; CHECK-NEXT: ret
				  %ext = zext <vscale x 16 x i8> %a to <vscale x 16 x i64>
				  ret <vscale x 16 x i64> %ext
				}

				; zext nxv4i8 -> nxv4i16: the checks expect a single "and" with #0xff on
				; .s lanes (presumably because both types are promoted to nxv4i32 - confirm).
				; The label names the full function; the bare prefix "@zext_promote" would
				; also match zext_promote_h_to_d.
				define <vscale x 4 x i16> @zext_promote_b_to_s(<vscale x 4 x i8> %in) {
				; CHECK-LABEL: zext_promote_b_to_s:
				; CHECK-DAG: and z0.s, z0.s, #0xff
				; CHECK-NEXT: ret
				  %out = zext <vscale x 4 x i8> %in to <vscale x 4 x i16>
				  ret <vscale x 4 x i16> %out
				}

				; zext nxv2i16 -> nxv2i32: the checks expect a single "and" with #0xffff on
				; .d lanes (presumably because both types are promoted to nxv2i64 - confirm).
				; The label uses the "name:" form shared by the other tests in this file.
				define <vscale x 2 x i32> @zext_promote_h_to_d(<vscale x 2 x i16> %in) {
				; CHECK-LABEL: zext_promote_h_to_d:
				; CHECK-DAG: and z0.d, z0.d, #0xffff
				; CHECK-NEXT: ret
				  %out = zext <vscale x 2 x i16> %in to <vscale x 2 x i32>
				  ret <vscale x 2 x i32> %out
				}

This is an archive of the discontinued LLVM Phabricator instance.

[CodeGen][SVE] Legalisation of extends with scalable types
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 267183

llvm/include/llvm/CodeGen/ValueTypes.h

llvm/lib/CodeGen/SelectionDAG/LegalizeIntegerTypes.cpp

llvm/lib/CodeGen/ValueTypes.cpp

llvm/lib/Target/AArch64/AArch64ISelLowering.h

llvm/lib/Target/AArch64/AArch64ISelLowering.cpp

llvm/test/CodeGen/AArch64/sve-ext.ll

This is an archive of the discontinued LLVM Phabricator instance.

[CodeGen][SVE] Legalisation of extends with scalable typesClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 267183

llvm/include/llvm/CodeGen/ValueTypes.h

llvm/lib/CodeGen/SelectionDAG/LegalizeIntegerTypes.cpp

llvm/lib/CodeGen/ValueTypes.cpp

llvm/lib/Target/AArch64/AArch64ISelLowering.h

llvm/lib/Target/AArch64/AArch64ISelLowering.cpp

llvm/test/CodeGen/AArch64/sve-ext.ll

[CodeGen][SVE] Legalisation of extends with scalable types
ClosedPublic