Diff 529839

llvm/lib/CodeGen/SelectionDAG/DAGCombiner.cpp

This file is larger than 256 KB, so syntax highlighting is disabled by default.

Show First 20 Lines • Show All 426 Lines • ▼ Show 20 Lines	private:
SDValue visitADDE(SDNode *N);		SDValue visitADDE(SDNode *N);
SDValue visitUADDO_CARRY(SDNode *N);		SDValue visitUADDO_CARRY(SDNode *N);
SDValue visitSADDO_CARRY(SDNode *N);		SDValue visitSADDO_CARRY(SDNode *N);
SDValue visitUADDO_CARRYLike(SDValue N0, SDValue N1, SDValue CarryIn,		SDValue visitUADDO_CARRYLike(SDValue N0, SDValue N1, SDValue CarryIn,
SDNode *N);		SDNode *N);
SDValue visitSUBE(SDNode *N);		SDValue visitSUBE(SDNode *N);
SDValue visitUSUBO_CARRY(SDNode *N);		SDValue visitUSUBO_CARRY(SDNode *N);
SDValue visitSSUBO_CARRY(SDNode *N);		SDValue visitSSUBO_CARRY(SDNode *N);
SDValue visitMUL(SDNode *N);		template <class MatchContextClass> SDValue visitMUL(SDNode *N);
SDValue visitMULFIX(SDNode *N);		SDValue visitMULFIX(SDNode *N);
SDValue useDivRem(SDNode *N);		SDValue useDivRem(SDNode *N);
SDValue visitSDIV(SDNode *N);		SDValue visitSDIV(SDNode *N);
SDValue visitSDIVLike(SDValue N0, SDValue N1, SDNode *N);		SDValue visitSDIVLike(SDValue N0, SDValue N1, SDNode *N);
SDValue visitUDIV(SDNode *N);		SDValue visitUDIV(SDNode *N);
SDValue visitUDIVLike(SDValue N0, SDValue N1, SDNode *N);		SDValue visitUDIVLike(SDValue N0, SDValue N1, SDNode *N);
SDValue visitREM(SDNode *N);		SDValue visitREM(SDNode *N);
SDValue visitMULHU(SDNode *N);		SDValue visitMULHU(SDNode *N);
▲ Show 20 Lines • Show All 1,449 Lines • ▼ Show 20 Lines	SDValue DAGCombiner::visit(SDNode *N) {
case ISD::SADDO_CARRY: return visitSADDO_CARRY(N);		case ISD::SADDO_CARRY: return visitSADDO_CARRY(N);
case ISD::SUBE: return visitSUBE(N);		case ISD::SUBE: return visitSUBE(N);
case ISD::USUBO_CARRY: return visitUSUBO_CARRY(N);		case ISD::USUBO_CARRY: return visitUSUBO_CARRY(N);
case ISD::SSUBO_CARRY: return visitSSUBO_CARRY(N);		case ISD::SSUBO_CARRY: return visitSSUBO_CARRY(N);
case ISD::SMULFIX:		case ISD::SMULFIX:
case ISD::SMULFIXSAT:		case ISD::SMULFIXSAT:
case ISD::UMULFIX:		case ISD::UMULFIX:
case ISD::UMULFIXSAT: return visitMULFIX(N);		case ISD::UMULFIXSAT: return visitMULFIX(N);
case ISD::MUL: return visitMUL(N);		case ISD::MUL:
		return visitMUL<EmptyMatchContext>(N);
case ISD::SDIV: return visitSDIV(N);		case ISD::SDIV: return visitSDIV(N);
case ISD::UDIV: return visitUDIV(N);		case ISD::UDIV: return visitUDIV(N);
case ISD::SREM:		case ISD::SREM:
case ISD::UREM: return visitREM(N);		case ISD::UREM: return visitREM(N);
case ISD::MULHU: return visitMULHU(N);		case ISD::MULHU: return visitMULHU(N);
case ISD::MULHS: return visitMULHS(N);		case ISD::MULHS: return visitMULHS(N);
case ISD::AVGFLOORS:		case ISD::AVGFLOORS:
case ISD::AVGFLOORU:		case ISD::AVGFLOORU:
▲ Show 20 Lines • Show All 2,350 Lines • ▼ Show 20 Lines	SDValue DAGCombiner::visitMULFIX(SDNode *N) {

// fold (mulfix x, 0, scale) -> 0		// fold (mulfix x, 0, scale) -> 0
if (isNullConstant(N1))		if (isNullConstant(N1))
return DAG.getConstant(0, SDLoc(N), VT);		return DAG.getConstant(0, SDLoc(N), VT);

return SDValue();		return SDValue();
}		}

SDValue DAGCombiner::visitMUL(SDNode *N) {		template <class MatchContextClass> SDValue DAGCombiner::visitMUL(SDNode *N) {
SDValue N0 = N->getOperand(0);		SDValue N0 = N->getOperand(0);
SDValue N1 = N->getOperand(1);		SDValue N1 = N->getOperand(1);
EVT VT = N0.getValueType();		EVT VT = N0.getValueType();
SDLoc DL(N);		SDLoc DL(N);
		bool IsVP = ISD::isVPOpcode(N->getOpcode());
		craig.topperUnsubmitted Done Reply Inline Actions IS -> Is craig.topper: IS -> Is
		MatchContextClass matcher(DAG, TLI, N);

// fold (mul x, undef) -> 0		// fold (mul x, undef) -> 0
if (N0.isUndef() || N1.isUndef())		if (N0.isUndef() || N1.isUndef())
return DAG.getConstant(0, DL, VT);		return DAG.getConstant(0, DL, VT);

// fold (mul c1, c2) -> c1*c2		// fold (mul c1, c2) -> c1*c2
if (SDValue C = DAG.FoldConstantArithmetic(ISD::MUL, DL, VT, {N0, N1}))		if (SDValue C = DAG.FoldConstantArithmetic(ISD::MUL, DL, VT, {N0, N1}))
		craig.topperUnsubmitted Done Reply Inline Actions What does it mean to support a VP op in FoldConstantArithmetic? craig.topper: What does it mean to support a VP op in FoldConstantArithmetic?
		jacquesguanAuthorUnsubmitted Done Reply Inline Actions I was thinking wrong. This TODO is removed now. jacquesguan: I was thinking wrong. This TODO is removed now.
return C;		return C;

// canonicalize constant to RHS (vector doesn't have to splat)		// canonicalize constant to RHS (vector doesn't have to splat)
if (DAG.isConstantIntBuildVectorOrConstantInt(N0) &&		if (DAG.isConstantIntBuildVectorOrConstantInt(N0) &&
!DAG.isConstantIntBuildVectorOrConstantInt(N1))		!DAG.isConstantIntBuildVectorOrConstantInt(N1))
return DAG.getNode(ISD::MUL, DL, VT, N1, N0);		return matcher.getNode(ISD::MUL, DL, VT, N1, N0);

bool N1IsConst = false;		bool N1IsConst = false;
bool N1IsOpaqueConst = false;		bool N1IsOpaqueConst = false;
APInt ConstValue1;		APInt ConstValue1;

// fold vector ops		// fold vector ops
if (VT.isVector()) {		// TODO: Change this to use SimplifyVBinOp when it supports VP op.
		if (VT.isVector() && !IsVP) {
if (SDValue FoldedVOp = SimplifyVBinOp(N, DL))		if (SDValue FoldedVOp = SimplifyVBinOp(N, DL))
return FoldedVOp;		return FoldedVOp;

N1IsConst = ISD::isConstantSplatVector(N1.getNode(), ConstValue1);		N1IsConst = ISD::isConstantSplatVector(N1.getNode(), ConstValue1);
assert((!N1IsConst ||		assert((!N1IsConst ||
ConstValue1.getBitWidth() == VT.getScalarSizeInBits()) &&		ConstValue1.getBitWidth() == VT.getScalarSizeInBits()) &&
"Splat APInt should be element width");		"Splat APInt should be element width");
} else {		} else {
N1IsConst = isa<ConstantSDNode>(N1);		N1IsConst = isa<ConstantSDNode>(N1);
if (N1IsConst) {		if (N1IsConst) {
ConstValue1 = cast<ConstantSDNode>(N1)->getAPIntValue();		ConstValue1 = cast<ConstantSDNode>(N1)->getAPIntValue();
N1IsOpaqueConst = cast<ConstantSDNode>(N1)->isOpaque();		N1IsOpaqueConst = cast<ConstantSDNode>(N1)->isOpaque();
}		}
}		}

// fold (mul x, 0) -> 0		// fold (mul x, 0) -> 0
if (N1IsConst && ConstValue1.isZero())		if (N1IsConst && ConstValue1.isZero())
return N1;		return N1;

// fold (mul x, 1) -> x		// fold (mul x, 1) -> x
if (N1IsConst && ConstValue1.isOne())		if (N1IsConst && ConstValue1.isOne())
return N0;		return N0;

		if (!IsVP)
if (SDValue NewSel = foldBinOpIntoSelect(N))		if (SDValue NewSel = foldBinOpIntoSelect(N))
return NewSel;		return NewSel;

// fold (mul x, -1) -> 0-x		// fold (mul x, -1) -> 0-x
if (N1IsConst && ConstValue1.isAllOnes())		if (N1IsConst && ConstValue1.isAllOnes())
return DAG.getNegative(N0, DL, VT);		return matcher.getNode(ISD::SUB, DL, VT, DAG.getConstant(0, DL, VT), N0);

// fold (mul x, (1 << c)) -> x << c		// fold (mul x, (1 << c)) -> x << c
if (isConstantOrConstantVector(N1, /*NoOpaques*/ true) &&		if (isConstantOrConstantVector(N1, /*NoOpaques*/ true) &&
DAG.isKnownToBeAPowerOfTwo(N1) &&		DAG.isKnownToBeAPowerOfTwo(N1) &&
(!VT.isVector() || Level <= AfterLegalizeVectorOps)) {		(!VT.isVector() || Level <= AfterLegalizeVectorOps)) {
SDValue LogBase2 = BuildLogBase2(N1, DL);		SDValue LogBase2 = BuildLogBase2(N1, DL);
EVT ShiftVT = getShiftAmountTy(N0.getValueType());		EVT ShiftVT = getShiftAmountTy(N0.getValueType());
SDValue Trunc = DAG.getZExtOrTrunc(LogBase2, DL, ShiftVT);		SDValue Trunc = DAG.getZExtOrTrunc(LogBase2, DL, ShiftVT);
return DAG.getNode(ISD::SHL, DL, VT, N0, Trunc);		return matcher.getNode(ISD::SHL, DL, VT, N0, Trunc);
}		}

// fold (mul x, -(1 << c)) -> -(x << c) or (-x) << c		// fold (mul x, -(1 << c)) -> -(x << c) or (-x) << c
if (N1IsConst && !N1IsOpaqueConst && ConstValue1.isNegatedPowerOf2()) {		if (N1IsConst && !N1IsOpaqueConst && ConstValue1.isNegatedPowerOf2()) {
unsigned Log2Val = (-ConstValue1).logBase2();		unsigned Log2Val = (-ConstValue1).logBase2();
EVT ShiftVT = getShiftAmountTy(N0.getValueType());		EVT ShiftVT = getShiftAmountTy(N0.getValueType());

// FIXME: If the input is something that is easily negated (e.g. a		// FIXME: If the input is something that is easily negated (e.g. a
// single-use add), we should put the negate there.		// single-use add), we should put the negate there.
return DAG.getNode(ISD::SUB, DL, VT,		return matcher.getNode(
DAG.getConstant(0, DL, VT),		ISD::SUB, DL, VT, DAG.getConstant(0, DL, VT),
DAG.getNode(ISD::SHL, DL, VT, N0,		matcher.getNode(ISD::SHL, DL, VT, N0,
DAG.getConstant(Log2Val, DL, ShiftVT)));		DAG.getConstant(Log2Val, DL, ShiftVT)));
}		}

// Attempt to reuse an existing umul_lohi/smul_lohi node, but only if the		// Attempt to reuse an existing umul_lohi/smul_lohi node, but only if the
// hi result is in use in case we hit this mid-legalization.		// hi result is in use in case we hit this mid-legalization.
		if (!IsVP)
for (unsigned LoHiOpc : {ISD::UMUL_LOHI, ISD::SMUL_LOHI}) {		for (unsigned LoHiOpc : {ISD::UMUL_LOHI, ISD::SMUL_LOHI}) {
if (!LegalOperations || TLI.isOperationLegalOrCustom(LoHiOpc, VT)) {		if (!LegalOperations || TLI.isOperationLegalOrCustom(LoHiOpc, VT)) {
SDVTList LoHiVT = DAG.getVTList(VT, VT);		SDVTList LoHiVT = DAG.getVTList(VT, VT);
// TODO: Can we match commutable operands with getNodeIfExists?		// TODO: Can we match commutable operands with getNodeIfExists?
if (SDNode *LoHi = DAG.getNodeIfExists(LoHiOpc, LoHiVT, {N0, N1}))		if (SDNode *LoHi = DAG.getNodeIfExists(LoHiOpc, LoHiVT, {N0, N1}))
if (LoHi->hasAnyUseOfValue(1))		if (LoHi->hasAnyUseOfValue(1))
return SDValue(LoHi, 0);		return SDValue(LoHi, 0);
if (SDNode *LoHi = DAG.getNodeIfExists(LoHiOpc, LoHiVT, {N1, N0}))		if (SDNode *LoHi = DAG.getNodeIfExists(LoHiOpc, LoHiVT, {N1, N0}))
if (LoHi->hasAnyUseOfValue(1))		if (LoHi->hasAnyUseOfValue(1))
return SDValue(LoHi, 0);		return SDValue(LoHi, 0);
}		}
}		}

// Try to transform:		// Try to transform:
// (1) multiply-by-(power-of-2 +/- 1) into shift and add/sub.		// (1) multiply-by-(power-of-2 +/- 1) into shift and add/sub.
// mul x, (2^N + 1) --> add (shl x, N), x		// mul x, (2^N + 1) --> add (shl x, N), x
// mul x, (2^N - 1) --> sub (shl x, N), x		// mul x, (2^N - 1) --> sub (shl x, N), x
// Examples: x * 33 --> (x << 5) + x		// Examples: x * 33 --> (x << 5) + x
// x * 15 --> (x << 4) - x		// x * 15 --> (x << 4) - x
// x * -33 --> -((x << 5) + x)		// x * -33 --> -((x << 5) + x)
// x * -15 --> -((x << 4) - x) ; this reduces --> x - (x << 4)		// x * -15 --> -((x << 4) - x) ; this reduces --> x - (x << 4)
// (2) multiply-by-(power-of-2 +/- power-of-2) into shifts and add/sub.		// (2) multiply-by-(power-of-2 +/- power-of-2) into shifts and add/sub.
// mul x, (2^N + 2^M) --> (add (shl x, N), (shl x, M))		// mul x, (2^N + 2^M) --> (add (shl x, N), (shl x, M))
// mul x, (2^N - 2^M) --> (sub (shl x, N), (shl x, M))		// mul x, (2^N - 2^M) --> (sub (shl x, N), (shl x, M))
// Examples: x * 0x8800 --> (x << 15) + (x << 11)		// Examples: x * 0x8800 --> (x << 15) + (x << 11)
// x * 0xf800 --> (x << 16) - (x << 11)		// x * 0xf800 --> (x << 16) - (x << 11)
// x * -0x8800 --> -((x << 15) + (x << 11))		// x * -0x8800 --> -((x << 15) + (x << 11))
// x * -0xf800 --> -((x << 16) - (x << 11)) ; (x << 11) - (x << 16)		// x * -0xf800 --> -((x << 16) - (x << 11)) ; (x << 11) - (x << 16)
if (N1IsConst && TLI.decomposeMulByConstant(*DAG.getContext(), VT, N1)) {		if (!IsVP && N1IsConst &&
		TLI.decomposeMulByConstant(*DAG.getContext(), VT, N1)) {
// TODO: We could handle more general decomposition of any constant by		// TODO: We could handle more general decomposition of any constant by
// having the target set a limit on number of ops and making a		// having the target set a limit on number of ops and making a
// callback to determine that sequence (similar to sqrt expansion).		// callback to determine that sequence (similar to sqrt expansion).
unsigned MathOp = ISD::DELETED_NODE;		unsigned MathOp = ISD::DELETED_NODE;
APInt MulC = ConstValue1.abs();		APInt MulC = ConstValue1.abs();
// The constant `2` should be treated as (2^0 + 1).		// The constant `2` should be treated as (2^0 + 1).
unsigned TZeros = MulC == 2 ? 0 : MulC.countr_zero();		unsigned TZeros = MulC == 2 ? 0 : MulC.countr_zero();
MulC.lshrInPlace(TZeros);		MulC.lshrInPlace(TZeros);
Show All 17 Lines	if (MathOp != ISD::DELETED_NODE) {
: DAG.getNode(MathOp, DL, VT, Shl, N0);		: DAG.getNode(MathOp, DL, VT, Shl, N0);
if (ConstValue1.isNegative())		if (ConstValue1.isNegative())
R = DAG.getNegative(R, DL, VT);		R = DAG.getNegative(R, DL, VT);
return R;		return R;
}		}
}		}

// (mul (shl X, c1), c2) -> (mul X, c2 << c1)		// (mul (shl X, c1), c2) -> (mul X, c2 << c1)
if (N0.getOpcode() == ISD::SHL) {		if (matcher.match(N0, ISD::SHL)) {
SDValue N01 = N0.getOperand(1);		SDValue N01 = N0.getOperand(1);
if (SDValue C3 = DAG.FoldConstantArithmetic(ISD::SHL, DL, VT, {N1, N01}))		if (SDValue C3 = DAG.FoldConstantArithmetic(ISD::SHL, DL, VT, {N1, N01}))
return DAG.getNode(ISD::MUL, DL, VT, N0.getOperand(0), C3);		return DAG.getNode(ISD::MUL, DL, VT, N0.getOperand(0), C3);
}		}

// Change (mul (shl X, C), Y) -> (shl (mul X, Y), C) when the shift has one		// Change (mul (shl X, C), Y) -> (shl (mul X, Y), C) when the shift has one
// use.		// use.
{		{
SDValue Sh, Y;		SDValue Sh, Y;

// Check for both (mul (shl X, C), Y) and (mul Y, (shl X, C)).		// Check for both (mul (shl X, C), Y) and (mul Y, (shl X, C)).
if (N0.getOpcode() == ISD::SHL &&		if (matcher.match(N0, ISD::SHL) &&
isConstantOrConstantVector(N0.getOperand(1)) && N0->hasOneUse()) {		isConstantOrConstantVector(N0.getOperand(1)) && N0->hasOneUse()) {
Sh = N0; Y = N1;		Sh = N0; Y = N1;
} else if (N1.getOpcode() == ISD::SHL &&		} else if (matcher.match(N1, ISD::SHL) &&
isConstantOrConstantVector(N1.getOperand(1)) &&		isConstantOrConstantVector(N1.getOperand(1)) &&
N1->hasOneUse()) {		N1->hasOneUse()) {
Sh = N1; Y = N0;		Sh = N1; Y = N0;
}		}

if (Sh.getNode()) {		if (Sh.getNode()) {
SDValue Mul = DAG.getNode(ISD::MUL, DL, VT, Sh.getOperand(0), Y);		SDValue Mul = matcher.getNode(ISD::MUL, DL, VT, Sh.getOperand(0), Y);
return DAG.getNode(ISD::SHL, DL, VT, Mul, Sh.getOperand(1));		return matcher.getNode(ISD::SHL, DL, VT, Mul, Sh.getOperand(1));
}		}
}		}

// fold (mul (add x, c1), c2) -> (add (mul x, c2), c1*c2)		// fold (mul (add x, c1), c2) -> (add (mul x, c2), c1*c2)
if (N0.getOpcode() == ISD::ADD &&		if (matcher.match(N0, ISD::ADD) &&
DAG.isConstantIntBuildVectorOrConstantInt(N1) &&		DAG.isConstantIntBuildVectorOrConstantInt(N1) &&
DAG.isConstantIntBuildVectorOrConstantInt(N0.getOperand(1)) &&		DAG.isConstantIntBuildVectorOrConstantInt(N0.getOperand(1)) &&
isMulAddWithConstProfitable(N, N0, N1))		isMulAddWithConstProfitable(N, N0, N1))
return DAG.getNode(		return matcher.getNode(
ISD::ADD, DL, VT,		ISD::ADD, DL, VT,
DAG.getNode(ISD::MUL, SDLoc(N0), VT, N0.getOperand(0), N1),		matcher.getNode(ISD::MUL, SDLoc(N0), VT, N0.getOperand(0), N1),
DAG.getNode(ISD::MUL, SDLoc(N1), VT, N0.getOperand(1), N1));		matcher.getNode(ISD::MUL, SDLoc(N1), VT, N0.getOperand(1), N1));

// Fold (mul (vscale * C0), C1) to (vscale * (C0 * C1)).		// Fold (mul (vscale * C0), C1) to (vscale * (C0 * C1)).
ConstantSDNode *NC1 = isConstOrConstSplat(N1);		ConstantSDNode *NC1 = isConstOrConstSplat(N1);
if (N0.getOpcode() == ISD::VSCALE && NC1) {		if (!IsVP && N0.getOpcode() == ISD::VSCALE && NC1) {
const APInt &C0 = N0.getConstantOperandAPInt(0);		const APInt &C0 = N0.getConstantOperandAPInt(0);
const APInt &C1 = NC1->getAPIntValue();		const APInt &C1 = NC1->getAPIntValue();
return DAG.getVScale(DL, VT, C0 * C1);		return DAG.getVScale(DL, VT, C0 * C1);
}		}

// Fold (mul step_vector(C0), C1) to (step_vector(C0 * C1)).		// Fold (mul step_vector(C0), C1) to (step_vector(C0 * C1)).
APInt MulVal;		APInt MulVal;
if (N0.getOpcode() == ISD::STEP_VECTOR &&		if (!IsVP && N0.getOpcode() == ISD::STEP_VECTOR &&
ISD::isConstantSplatVector(N1.getNode(), MulVal)) {		ISD::isConstantSplatVector(N1.getNode(), MulVal)) {
const APInt &C0 = N0.getConstantOperandAPInt(0);		const APInt &C0 = N0.getConstantOperandAPInt(0);
APInt NewStep = C0 * MulVal;		APInt NewStep = C0 * MulVal;
return DAG.getStepVector(DL, VT, NewStep);		return DAG.getStepVector(DL, VT, NewStep);
}		}

// Fold ((mul x, 0/undef) -> 0,		// Fold ((mul x, 0/undef) -> 0,
// (mul x, 1) -> x) -> x)		// (mul x, 1) -> x) -> x)
Show All 21 Lines	if ((!LegalOperations \|\| TLI.isOperationLegalOrCustom(ISD::AND, VT)) &&
for (unsigned I = 0; I != NumElts; ++I)		for (unsigned I = 0; I != NumElts; ++I)
if (ClearMask[I])		if (ClearMask[I])
Mask[I] = Zero;		Mask[I] = Zero;
return DAG.getNode(ISD::AND, DL, VT, N0, DAG.getBuildVector(VT, DL, Mask));		return DAG.getNode(ISD::AND, DL, VT, N0, DAG.getBuildVector(VT, DL, Mask));
}		}
}		}

// reassociate mul		// reassociate mul
		// TODO: Change reassociateOps to support vp ops.
		if (!IsVP)
if (SDValue RMUL = reassociateOps(ISD::MUL, DL, N0, N1, N->getFlags()))		if (SDValue RMUL = reassociateOps(ISD::MUL, DL, N0, N1, N->getFlags()))
return RMUL;		return RMUL;

// Fold mul(vecreduce(x), vecreduce(y)) -> vecreduce(mul(x, y))		// Fold mul(vecreduce(x), vecreduce(y)) -> vecreduce(mul(x, y))
		// TODO: Change reassociateReduction to support vp ops.
		if (!IsVP)
if (SDValue SD =		if (SDValue SD =
reassociateReduction(ISD::VECREDUCE_MUL, ISD::MUL, DL, VT, N0, N1))		reassociateReduction(ISD::VECREDUCE_MUL, ISD::MUL, DL, VT, N0, N1))
return SD;		return SD;

// Simplify the operands using demanded-bits information.		// Simplify the operands using demanded-bits information.
if (SimplifyDemandedBits(SDValue(N, 0)))		if (SimplifyDemandedBits(SDValue(N, 0)))
return SDValue(N, 0);		return SDValue(N, 0);

return SDValue();		return SDValue();
}		}

▲ Show 20 Lines • Show All 21,158 Lines • ▼ Show 20 Lines	SDValue DAGCombiner::visitVP_FSUB(SDNode *N) {
// FSUB -> FMA combines:		// FSUB -> FMA combines:
if (SDValue Fused = visitFSUBForFMACombine<VPMatchContext>(N)) {		if (SDValue Fused = visitFSUBForFMACombine<VPMatchContext>(N)) {
AddToWorklist(Fused.getNode());		AddToWorklist(Fused.getNode());
return Fused;		return Fused;
}		}
return SDValue();		return SDValue();
}		}

SDValue DAGCombiner::visitVPOp(SDNode *N) {		SDValue DAGCombiner::visitVPOp(SDNode *N) {
		RKSimonUnsubmitted Not Done Reply Inline Actions (style) Don't use auto unless the type is obvious (i.e. a cast<>) RKSimon: (style) Don't use auto unless the type is obvious (i.e. a cast<>)
		craig.topperUnsubmitted Not Done Reply Inline Actions Don't call isConstOrConstSplat(N1) twice craig.topper: Don't call isConstOrConstSplat(N1) twice
		jacquesguanAuthorUnsubmitted Done Reply Inline Actions Done. jacquesguan: Done.

if (N->getOpcode() == ISD::VP_GATHER)		if (N->getOpcode() == ISD::VP_GATHER)
		craig.topperUnsubmitted Not Done Reply Inline Actions What about mul by positive 1 or 0? craig.topper: What about mul by positive 1 or 0?
		jacquesguanAuthorUnsubmitted Done Reply Inline Actions Done. jacquesguan: Done.
if (SDValue SD = visitVPGATHER(N))		if (SDValue SD = visitVPGATHER(N))
		craig.topperUnsubmitted Not Done Reply Inline Actions If one of the true/false values of the VP_SELECT is undef can we ignore the mask and EVL and return the other operand? @simoll @frasercrmck craig.topper: If one of the true/false values of the VP_SELECT is undef can we ignore the mask and EVL and…
		simollUnsubmitted Not Done Reply Inline Actions I believe so. Also for vp ops other than select or merge, if the mask is undef, we can scratch the operation entirely. If evl is undef, we can cut short to `unreachable`. simoll: I believe so. Also for vp ops other than select or merge, if the mask is undef, we can scratch…
		jacquesguanAuthorUnsubmitted Done Reply Inline Actions Done, thanks. jacquesguan: Done, thanks.
return SD;		return SD;

		craig.topperUnsubmitted Not Done Reply Inline Actions I think we should only use getSplatVector for scalable vectors. Fixed vectors should use getSplatBuildVector. craig.topper: I think we should only use getSplatVector for scalable vectors. Fixed vectors should use…
		craig.topperUnsubmitted Not Done Reply Inline Actions You can just call `DAG.getConstant(0, SDLoc(N), VT);` It will do the right thing. craig.topper: You can just call `DAG.getConstant(0, SDLoc(N), VT);` It will do the right thing.
		jacquesguanAuthorUnsubmitted Done Reply Inline Actions Done. jacquesguan: Done.
if (N->getOpcode() == ISD::VP_SCATTER)		if (N->getOpcode() == ISD::VP_SCATTER)
if (SDValue SD = visitVPSCATTER(N))		if (SDValue SD = visitVPSCATTER(N))
return SD;		return SD;

// VP operations in which all vector elements are disabled - either by		// VP operations in which all vector elements are disabled - either by
// determining that the mask is all false or that the EVL is 0 - can be		// determining that the mask is all false or that the EVL is 0 - can be
// eliminated.		// eliminated.
bool AreAllEltsDisabled = false;		bool AreAllEltsDisabled = false;
if (auto EVLIdx = ISD::getVPExplicitVectorLengthIdx(N->getOpcode()))		if (auto EVLIdx = ISD::getVPExplicitVectorLengthIdx(N->getOpcode()))
AreAllEltsDisabled |= isNullConstant(N->getOperand(*EVLIdx));		AreAllEltsDisabled |= isNullConstant(N->getOperand(*EVLIdx));
if (auto MaskIdx = ISD::getVPMaskIdx(N->getOpcode()))		if (auto MaskIdx = ISD::getVPMaskIdx(N->getOpcode()))
		craig.topperUnsubmitted Not Done Reply Inline Actions DAG.getConstant(0, SDLoc(N), VT) craig.topper: DAG.getConstant(0, SDLoc(N), VT)
		jacquesguanAuthorUnsubmitted Done Reply Inline Actions Done. jacquesguan: Done.
AreAllEltsDisabled |=		AreAllEltsDisabled |=
ISD::isConstantSplatVectorAllZeros(N->getOperand(*MaskIdx).getNode());		ISD::isConstantSplatVectorAllZeros(N->getOperand(*MaskIdx).getNode());

// This is the only generic VP combine we support for now.		// This is the only generic VP combine we support for now.
if (!AreAllEltsDisabled) {		if (!AreAllEltsDisabled) {
switch (N->getOpcode()) {		switch (N->getOpcode()) {
case ISD::VP_FADD:		case ISD::VP_FADD:
return visitVP_FADD(N);		return visitVP_FADD(N);
		craig.topperUnsubmitted Not Done Reply Inline Actions Same comment as above. craig.topper: Same comment as above.
		jacquesguanAuthorUnsubmitted Done Reply Inline Actions Done. jacquesguan: Done.
case ISD::VP_FSUB:		case ISD::VP_FSUB:
return visitVP_FSUB(N);		return visitVP_FSUB(N);
case ISD::VP_FMA:		case ISD::VP_FMA:
return visitFMA<VPMatchContext>(N);		return visitFMA<VPMatchContext>(N);
		case ISD::VP_MUL:
		return visitMUL<VPMatchContext>(N);
		default:
		break;
}		}
return SDValue();		return SDValue();
}		}

// Binary operations can be replaced by UNDEF.		// Binary operations can be replaced by UNDEF.
if (ISD::isVPBinaryOp(N->getOpcode()))		if (ISD::isVPBinaryOp(N->getOpcode()))
return DAG.getUNDEF(N->getValueType(0));		return DAG.getUNDEF(N->getValueType(0));

▲ Show 20 Lines • Show All 1,750 Lines • Show Last 20 Lines

llvm/test/CodeGen/RISCV/rvv/fixed-vectors-vmul-vp.ll

	Show First 20 Lines • Show All 983 Lines • ▼ Show 20 Lines
	; RV64-NEXT: ret			; RV64-NEXT: ret
	%elt.head = insertelement <16 x i64> poison, i64 %b, i32 0			%elt.head = insertelement <16 x i64> poison, i64 %b, i32 0
	%vb = shufflevector <16 x i64> %elt.head, <16 x i64> poison, <16 x i32> zeroinitializer			%vb = shufflevector <16 x i64> %elt.head, <16 x i64> poison, <16 x i32> zeroinitializer
	%head = insertelement <16 x i1> poison, i1 true, i32 0			%head = insertelement <16 x i1> poison, i1 true, i32 0
	%m = shufflevector <16 x i1> %head, <16 x i1> poison, <16 x i32> zeroinitializer			%m = shufflevector <16 x i1> %head, <16 x i1> poison, <16 x i32> zeroinitializer
	%v = call <16 x i64> @llvm.vp.mul.v16i64(<16 x i64> %va, <16 x i64> %vb, <16 x i1> %m, i32 %evl)			%v = call <16 x i64> @llvm.vp.mul.v16i64(<16 x i64> %va, <16 x i64> %vb, <16 x i1> %m, i32 %evl)
	ret <16 x i64> %v			ret <16 x i64> %v
	}			}


				; Masked vp.mul of %va by an undef vector operand.
				; The expected code contains no multiply: it only splats 0 into v8
				; (vmv.v.i v8, 0) and returns, on both RV32 and RV64.
				define <8 x i64> @vmul_vv_undef_v8i64(<8 x i64> %va, <8 x i1> %m, i32 zeroext %evl) {
				; RV32-LABEL: vmul_vv_undef_v8i64:
				; RV32: # %bb.0:
				; RV32-NEXT: vsetvli a0, zero, e64, m4, ta, ma
				; RV32-NEXT: vmv.v.i v8, 0
				; RV32-NEXT: ret
				;
				; RV64-LABEL: vmul_vv_undef_v8i64:
				; RV64: # %bb.0:
				; RV64-NEXT: vsetivli zero, 8, e64, m4, ta, ma
				; RV64-NEXT: vmv.v.i v8, 0
				; RV64-NEXT: ret
				%v = call <8 x i64> @llvm.vp.mul.v8i64(<8 x i64> %va, <8 x i64> undef, <8 x i1> %m, i32 %evl)
				ret <8 x i64> %v
				}

				; Same as the masked undef case, but the mask %m is an all-true splat
				; built with insertelement + shufflevector. The expected code is again
				; just a splat of 0 into v8 with no multiply.
				define <8 x i64> @vmul_vx_undef_v8i64_unmasked(<8 x i64> %va, i32 zeroext %evl) {
				; RV32-LABEL: vmul_vx_undef_v8i64_unmasked:
				; RV32: # %bb.0:
				; RV32-NEXT: vsetvli a0, zero, e64, m4, ta, ma
				; RV32-NEXT: vmv.v.i v8, 0
				; RV32-NEXT: ret
				;
				; RV64-LABEL: vmul_vx_undef_v8i64_unmasked:
				; RV64: # %bb.0:
				; RV64-NEXT: vsetivli zero, 8, e64, m4, ta, ma
				; RV64-NEXT: vmv.v.i v8, 0
				; RV64-NEXT: ret
				%head = insertelement <8 x i1> poison, i1 true, i32 0
				%m = shufflevector <8 x i1> %head, <8 x i1> poison, <8 x i32> zeroinitializer
				%v = call <8 x i64> @llvm.vp.mul.v8i64(<8 x i64> %va, <8 x i64> undef, <8 x i1> %m, i32 %evl)
				ret <8 x i64> %v
				}

				; Masked vp.mul of %va by a splat of the constant 0.
				; The expected code contains no multiply: it only splats 0 into v8
				; (vmv.v.i v8, 0) and returns.
				define <8 x i64> @vmul_vx_zero_v8i64(<8 x i64> %va, <8 x i1> %m, i32 zeroext %evl) {
				; RV32-LABEL: vmul_vx_zero_v8i64:
				; RV32: # %bb.0:
				; RV32-NEXT: vsetvli a0, zero, e64, m4, ta, ma
				; RV32-NEXT: vmv.v.i v8, 0
				; RV32-NEXT: ret
				;
				; RV64-LABEL: vmul_vx_zero_v8i64:
				; RV64: # %bb.0:
				; RV64-NEXT: vsetivli zero, 8, e64, m4, ta, ma
				; RV64-NEXT: vmv.v.i v8, 0
				; RV64-NEXT: ret
				%elt.head = insertelement <8 x i64> poison, i64 0, i32 0
				%vb = shufflevector <8 x i64> %elt.head, <8 x i64> poison, <8 x i32> zeroinitializer
				%v = call <8 x i64> @llvm.vp.mul.v8i64(<8 x i64> %va, <8 x i64> %vb, <8 x i1> %m, i32 %evl)
				ret <8 x i64> %v
				}

				; vp.mul of %va by a splat of 0 with an all-true splat mask.
				; As in the masked variant, the expected code only splats 0 into v8.
				define <8 x i64> @vmul_vx_zero_v8i64_unmasked(<8 x i64> %va, i32 zeroext %evl) {
				; RV32-LABEL: vmul_vx_zero_v8i64_unmasked:
				; RV32: # %bb.0:
				; RV32-NEXT: vsetvli a0, zero, e64, m4, ta, ma
				; RV32-NEXT: vmv.v.i v8, 0
				; RV32-NEXT: ret
				;
				; RV64-LABEL: vmul_vx_zero_v8i64_unmasked:
				; RV64: # %bb.0:
				; RV64-NEXT: vsetivli zero, 8, e64, m4, ta, ma
				; RV64-NEXT: vmv.v.i v8, 0
				; RV64-NEXT: ret
				%elt.head = insertelement <8 x i64> poison, i64 0, i32 0
				%vb = shufflevector <8 x i64> %elt.head, <8 x i64> poison, <8 x i32> zeroinitializer
				%head = insertelement <8 x i1> poison, i1 true, i32 0
				%m = shufflevector <8 x i1> %head, <8 x i1> poison, <8 x i32> zeroinitializer
				%v = call <8 x i64> @llvm.vp.mul.v8i64(<8 x i64> %va, <8 x i64> %vb, <8 x i1> %m, i32 %evl)
				ret <8 x i64> %v
				}

				; Masked vp.mul of %va by a splat of the constant 1.
				; The expected code replaces the multiply with a masked shift-left by 0
				; (vsll.vi v8, v8, 0, v0.t) under the EVL passed in a0.
				; NOTE(review): an instruction is still emitted for x * 1; presumably the
				; "mul x, 1 -> x" fold is not reached for the VP form - confirm whether
				; this is the intended result.
				define <8 x i64> @vmul_vx_one_v8i64(<8 x i64> %va, <8 x i1> %m, i32 zeroext %evl) {
				; CHECK-LABEL: vmul_vx_one_v8i64:
				; CHECK: # %bb.0:
				; CHECK-NEXT: vsetvli zero, a0, e64, m4, ta, ma
				; CHECK-NEXT: vsll.vi v8, v8, 0, v0.t
				; CHECK-NEXT: ret
				%elt.head = insertelement <8 x i64> poison, i64 1, i32 0
				%vb = shufflevector <8 x i64> %elt.head, <8 x i64> poison, <8 x i32> zeroinitializer
				%v = call <8 x i64> @llvm.vp.mul.v8i64(<8 x i64> %va, <8 x i64> %vb, <8 x i1> %m, i32 %evl)
				ret <8 x i64> %v
				}

				; vp.mul of %va by a splat of 1 with an all-true splat mask.
				; The expected code is an unmasked shift-left by 0 (vsll.vi v8, v8, 0)
				; under the EVL passed in a0.
				; NOTE(review): an instruction is still emitted for x * 1 - confirm
				; whether this is the intended result.
				define <8 x i64> @vmul_vx_one_v8i64_unmasked(<8 x i64> %va, i32 zeroext %evl) {
				; CHECK-LABEL: vmul_vx_one_v8i64_unmasked:
				; CHECK: # %bb.0:
				; CHECK-NEXT: vsetvli zero, a0, e64, m4, ta, ma
				; CHECK-NEXT: vsll.vi v8, v8, 0
				; CHECK-NEXT: ret
				%elt.head = insertelement <8 x i64> poison, i64 1, i32 0
				%vb = shufflevector <8 x i64> %elt.head, <8 x i64> poison, <8 x i32> zeroinitializer
				%head = insertelement <8 x i1> poison, i1 true, i32 0
				%m = shufflevector <8 x i1> %head, <8 x i1> poison, <8 x i32> zeroinitializer
				%v = call <8 x i64> @llvm.vp.mul.v8i64(<8 x i64> %va, <8 x i64> %vb, <8 x i1> %m, i32 %evl)
				ret <8 x i64> %v
				}

				; Masked vp.mul of %va by a splat of the constant -1.
				; The expected code keeps the multiply: -1 is loaded into a1 and a masked
				; vmul.vx is emitted under the EVL passed in a0.
				; NOTE(review): the multiply is not rewritten as a negation here -
				; confirm whether that is intended for the VP form.
				define <8 x i64> @vmul_vx_negone_v8i64(<8 x i64> %va, <8 x i1> %m, i32 zeroext %evl) {
				; CHECK-LABEL: vmul_vx_negone_v8i64:
				; CHECK: # %bb.0:
				; CHECK-NEXT: li a1, -1
				; CHECK-NEXT: vsetvli zero, a0, e64, m4, ta, ma
				; CHECK-NEXT: vmul.vx v8, v8, a1, v0.t
				; CHECK-NEXT: ret
				%elt.head = insertelement <8 x i64> poison, i64 -1, i32 0
				%vb = shufflevector <8 x i64> %elt.head, <8 x i64> poison, <8 x i32> zeroinitializer
				%v = call <8 x i64> @llvm.vp.mul.v8i64(<8 x i64> %va, <8 x i64> %vb, <8 x i1> %m, i32 %evl)
				ret <8 x i64> %v
				}

				; vp.mul of %va by a splat of -1 with an all-true splat mask.
				; The expected code keeps an unmasked vmul.vx with -1 in a1, under the
				; EVL passed in a0.
				; NOTE(review): the multiply is not rewritten as a negation here -
				; confirm whether that is intended for the VP form.
				define <8 x i64> @vmul_vx_negone_v8i64_unmasked(<8 x i64> %va, i32 zeroext %evl) {
				; CHECK-LABEL: vmul_vx_negone_v8i64_unmasked:
				; CHECK: # %bb.0:
				; CHECK-NEXT: li a1, -1
				; CHECK-NEXT: vsetvli zero, a0, e64, m4, ta, ma
				; CHECK-NEXT: vmul.vx v8, v8, a1
				; CHECK-NEXT: ret
				%elt.head = insertelement <8 x i64> poison, i64 -1, i32 0
				%vb = shufflevector <8 x i64> %elt.head, <8 x i64> poison, <8 x i32> zeroinitializer
				%head = insertelement <8 x i1> poison, i1 true, i32 0
				%m = shufflevector <8 x i1> %head, <8 x i1> poison, <8 x i32> zeroinitializer
				%v = call <8 x i64> @llvm.vp.mul.v8i64(<8 x i64> %va, <8 x i64> %vb, <8 x i1> %m, i32 %evl)
				ret <8 x i64> %v
				}

				; Masked vp.mul of %va by a splat of 64 (a power of two).
				; The expected code replaces the multiply with a masked shift-left by 6
				; (vsll.vi v8, v8, 6, v0.t) under the EVL passed in a0.
				define <8 x i64> @vmul_vx_pow2_v8i64(<8 x i64> %va, <8 x i1> %m, i32 zeroext %evl) {
				; CHECK-LABEL: vmul_vx_pow2_v8i64:
				; CHECK: # %bb.0:
				; CHECK-NEXT: vsetvli zero, a0, e64, m4, ta, ma
				; CHECK-NEXT: vsll.vi v8, v8, 6, v0.t
				; CHECK-NEXT: ret
				%elt.head = insertelement <8 x i64> poison, i64 64, i32 0
				%vb = shufflevector <8 x i64> %elt.head, <8 x i64> poison, <8 x i32> zeroinitializer
				%v = call <8 x i64> @llvm.vp.mul.v8i64(<8 x i64> %va, <8 x i64> %vb, <8 x i1> %m, i32 %evl)
				ret <8 x i64> %v
				}

				; vp.mul of %va by a splat of 64 with an all-true splat mask.
				; The expected code is an unmasked shift-left by 6 (vsll.vi v8, v8, 6)
				; under the EVL passed in a0.
				define <8 x i64> @vmul_vx_pow2_v8i64_unmasked(<8 x i64> %va, i32 zeroext %evl) {
				; CHECK-LABEL: vmul_vx_pow2_v8i64_unmasked:
				; CHECK: # %bb.0:
				; CHECK-NEXT: vsetvli zero, a0, e64, m4, ta, ma
				; CHECK-NEXT: vsll.vi v8, v8, 6
				; CHECK-NEXT: ret
				%elt.head = insertelement <8 x i64> poison, i64 64, i32 0
				%vb = shufflevector <8 x i64> %elt.head, <8 x i64> poison, <8 x i32> zeroinitializer
				%head = insertelement <8 x i1> poison, i1 true, i32 0
				%m = shufflevector <8 x i1> %head, <8 x i1> poison, <8 x i32> zeroinitializer
				%v = call <8 x i64> @llvm.vp.mul.v8i64(<8 x i64> %va, <8 x i64> %vb, <8 x i1> %m, i32 %evl)
				ret <8 x i64> %v
				}

				; Masked vp.mul of %va by a splat of -64 (a negated power of two).
				; The expected code keeps the multiply: -64 is loaded into a1 and a
				; masked vmul.vx is emitted under the EVL passed in a0.
				; NOTE(review): no shift + negate sequence is produced here - confirm
				; whether that is intended for the VP form.
				define <8 x i64> @vmul_vx_negpow2_v8i64(<8 x i64> %va, <8 x i1> %m, i32 zeroext %evl) {
				; CHECK-LABEL: vmul_vx_negpow2_v8i64:
				; CHECK: # %bb.0:
				; CHECK-NEXT: li a1, -64
				; CHECK-NEXT: vsetvli zero, a0, e64, m4, ta, ma
				; CHECK-NEXT: vmul.vx v8, v8, a1, v0.t
				; CHECK-NEXT: ret
				%elt.head = insertelement <8 x i64> poison, i64 -64, i32 0
				%vb = shufflevector <8 x i64> %elt.head, <8 x i64> poison, <8 x i32> zeroinitializer
				%v = call <8 x i64> @llvm.vp.mul.v8i64(<8 x i64> %va, <8 x i64> %vb, <8 x i1> %m, i32 %evl)
				ret <8 x i64> %v
				}

				; vp.mul of %va by a splat of -64 with an all-true splat mask.
				; The expected code keeps an unmasked vmul.vx with -64 in a1, under the
				; EVL passed in a0.
				; NOTE(review): no shift + negate sequence is produced here - confirm
				; whether that is intended for the VP form.
				define <8 x i64> @vmul_vx_negpow2_v8i64_unmasked(<8 x i64> %va, i32 zeroext %evl) {
				; CHECK-LABEL: vmul_vx_negpow2_v8i64_unmasked:
				; CHECK: # %bb.0:
				; CHECK-NEXT: li a1, -64
				; CHECK-NEXT: vsetvli zero, a0, e64, m4, ta, ma
				; CHECK-NEXT: vmul.vx v8, v8, a1
				; CHECK-NEXT: ret
				%elt.head = insertelement <8 x i64> poison, i64 -64, i32 0
				%vb = shufflevector <8 x i64> %elt.head, <8 x i64> poison, <8 x i32> zeroinitializer
				%head = insertelement <8 x i1> poison, i1 true, i32 0
				%m = shufflevector <8 x i1> %head, <8 x i1> poison, <8 x i32> zeroinitializer
				%v = call <8 x i64> @llvm.vp.mul.v8i64(<8 x i64> %va, <8 x i64> %vb, <8 x i1> %m, i32 %evl)
				ret <8 x i64> %v
				}

				declare <8 x i64> @llvm.vp.shl.v8i64(<8 x i64>, <8 x i64>, <8 x i1>, i32)

				; Masked vp.shl of %va by a splat of 3, followed by a masked vp.mul of
				; the result by a splat of 7, both using the same %m and %evl.
				; The expected code keeps the two operations separate: a masked
				; vsll.vi by 3 followed by a masked vmul.vx by 7.
				define <8 x i64> @vmul_vshl_vx_v8i64(<8 x i64> %va, <8 x i1> %m, i32 zeroext %evl) {
				; CHECK-LABEL: vmul_vshl_vx_v8i64:
				; CHECK: # %bb.0:
				; CHECK-NEXT: vsetvli zero, a0, e64, m4, ta, ma
				; CHECK-NEXT: vsll.vi v8, v8, 3, v0.t
				; CHECK-NEXT: li a0, 7
				; CHECK-NEXT: vmul.vx v8, v8, a0, v0.t
				; CHECK-NEXT: ret
				%elt.head1 = insertelement <8 x i64> poison, i64 3, i32 0
				%vb = shufflevector <8 x i64> %elt.head1, <8 x i64> poison, <8 x i32> zeroinitializer
				%elt.head2 = insertelement <8 x i64> poison, i64 7, i32 0
				%vc = shufflevector <8 x i64> %elt.head2, <8 x i64> poison, <8 x i32> zeroinitializer
				%vshl = call <8 x i64> @llvm.vp.shl.v8i64(<8 x i64> %va, <8 x i64> %vb, <8 x i1> %m, i32 %evl)
				%v = call <8 x i64> @llvm.vp.mul.v8i64(<8 x i64> %vshl, <8 x i64> %vc, <8 x i1> %m, i32 %evl)
				ret <8 x i64> %v
				}

				; All-true-mask form of (%va << 3) * 7. The expected output is a single
				; vmul.vx by 56 (7 << 3) with no separate shift.
				; NOTE(review): the expected vsetivli uses the immediate 8 instead of
				; %evl (a0) -- confirm that dropping the EVL here is intended.
				define <8 x i64> @vmul_vshl_vx_v8i64_unmasked(<8 x i64> %va, i32 zeroext %evl) {
				; CHECK-LABEL: vmul_vshl_vx_v8i64_unmasked:
				; CHECK: # %bb.0:
				; CHECK-NEXT: li a0, 56
				; CHECK-NEXT: vsetivli zero, 8, e64, m4, ta, ma
				; CHECK-NEXT: vmul.vx v8, v8, a0
				; CHECK-NEXT: ret
				%head = insertelement <8 x i1> poison, i1 true, i32 0
				%m = shufflevector <8 x i1> %head, <8 x i1> poison, <8 x i32> zeroinitializer
				%elt.head1 = insertelement <8 x i64> poison, i64 3, i32 0
				%vb = shufflevector <8 x i64> %elt.head1, <8 x i64> poison, <8 x i32> zeroinitializer
				%elt.head2 = insertelement <8 x i64> poison, i64 7, i32 0
				%vc = shufflevector <8 x i64> %elt.head2, <8 x i64> poison, <8 x i32> zeroinitializer
				%vshl = call <8 x i64> @llvm.vp.shl.v8i64(<8 x i64> %va, <8 x i64> %vb, <8 x i1> %m, i32 %evl)
				%v = call <8 x i64> @llvm.vp.mul.v8i64(<8 x i64> %vshl, <8 x i64> %vc, <8 x i1> %m, i32 %evl)
				ret <8 x i64> %v
				}

				; Masked vp.shl of %va by a splat of 7, then a masked vp.mul by the
				; non-constant vector %vb. The expected output keeps source order:
				; masked vsll.vi by 7 followed by masked vmul.vv.
				define <8 x i64> @vmul_vshl_vv_v8i64(<8 x i64> %va, <8 x i64> %vb, <8 x i1> %m, i32 zeroext %evl) {
				; CHECK-LABEL: vmul_vshl_vv_v8i64:
				; CHECK: # %bb.0:
				; CHECK-NEXT: vsetvli zero, a0, e64, m4, ta, ma
				; CHECK-NEXT: vsll.vi v8, v8, 7, v0.t
				; CHECK-NEXT: vmul.vv v8, v8, v12, v0.t
				; CHECK-NEXT: ret
				%elt.head = insertelement <8 x i64> poison, i64 7, i32 0
				%vc = shufflevector <8 x i64> %elt.head, <8 x i64> poison, <8 x i32> zeroinitializer
				%vshl = call <8 x i64> @llvm.vp.shl.v8i64(<8 x i64> %va, <8 x i64> %vc, <8 x i1> %m, i32 %evl)
				%v = call <8 x i64> @llvm.vp.mul.v8i64(<8 x i64> %vshl, <8 x i64> %vb, <8 x i1> %m, i32 %evl)
				ret <8 x i64> %v
				}

				; All-true-mask form of (%va << 7) * %vb. In the expected output the
				; order is swapped relative to the IR: vmul.vv comes first and the
				; vsll.vi by 7 is applied to the product.
				define <8 x i64> @vmul_vshl_vv_v8i64_unmasked(<8 x i64> %va, <8 x i64> %vb, i32 zeroext %evl) {
				; CHECK-LABEL: vmul_vshl_vv_v8i64_unmasked:
				; CHECK: # %bb.0:
				; CHECK-NEXT: vsetvli zero, a0, e64, m4, ta, ma
				; CHECK-NEXT: vmul.vv v8, v8, v12
				; CHECK-NEXT: vsll.vi v8, v8, 7
				; CHECK-NEXT: ret
				%head = insertelement <8 x i1> poison, i1 true, i32 0
				%m = shufflevector <8 x i1> %head, <8 x i1> poison, <8 x i32> zeroinitializer
				%elt.head = insertelement <8 x i64> poison, i64 7, i32 0
				%vc = shufflevector <8 x i64> %elt.head, <8 x i64> poison, <8 x i32> zeroinitializer
				%vshl = call <8 x i64> @llvm.vp.shl.v8i64(<8 x i64> %va, <8 x i64> %vc, <8 x i1> %m, i32 %evl)
				%v = call <8 x i64> @llvm.vp.mul.v8i64(<8 x i64> %vshl, <8 x i64> %vb, <8 x i1> %m, i32 %evl)
				ret <8 x i64> %v
				}

				; Predicated add intrinsic called by the vmul_vadd_* tests that follow.
				declare <8 x i64> @llvm.vp.add.v8i64(<8 x i64>, <8 x i64>, <8 x i1>, i32)

				; Masked vp.add of a splat of 3 feeding a masked vp.mul by a splat of 7,
				; both using the same %m and %evl. The expected output keeps source
				; order: masked vadd.vi by 3, then masked vmul.vx by 7.
				define <8 x i64> @vmul_vadd_vx_v8i64(<8 x i64> %va, <8 x i1> %m, i32 zeroext %evl) {
				; CHECK-LABEL: vmul_vadd_vx_v8i64:
				; CHECK: # %bb.0:
				; CHECK-NEXT: vsetvli zero, a0, e64, m4, ta, ma
				; CHECK-NEXT: vadd.vi v8, v8, 3, v0.t
				; CHECK-NEXT: li a0, 7
				; CHECK-NEXT: vmul.vx v8, v8, a0, v0.t
				; CHECK-NEXT: ret
				%elt.head1 = insertelement <8 x i64> poison, i64 3, i32 0
				%vb = shufflevector <8 x i64> %elt.head1, <8 x i64> poison, <8 x i32> zeroinitializer
				%elt.head2 = insertelement <8 x i64> poison, i64 7, i32 0
				%vc = shufflevector <8 x i64> %elt.head2, <8 x i64> poison, <8 x i32> zeroinitializer
				%vadd = call <8 x i64> @llvm.vp.add.v8i64(<8 x i64> %va, <8 x i64> %vb, <8 x i1> %m, i32 %evl)
				%v = call <8 x i64> @llvm.vp.mul.v8i64(<8 x i64> %vadd, <8 x i64> %vc, <8 x i1> %m, i32 %evl)
				ret <8 x i64> %v
				}

				; All-true-mask form of (%va + 3) * 7. The expected output uses the
				; constants 7 and 21 (3 * 7): a splat of 21 is built in v12 under a
				; vsetivli with immediate 8, then a vmadd.vx with scalar 7 runs under
				; a vsetvli that takes %evl (a0).
				define <8 x i64> @vmul_vadd_vx_v8i64_unmasked(<8 x i64> %va, i32 zeroext %evl) {
				; CHECK-LABEL: vmul_vadd_vx_v8i64_unmasked:
				; CHECK: # %bb.0:
				; CHECK-NEXT: li a1, 21
				; CHECK-NEXT: vsetivli zero, 8, e64, m4, ta, ma
				; CHECK-NEXT: vmv.v.x v12, a1
				; CHECK-NEXT: li a1, 7
				; CHECK-NEXT: vsetvli zero, a0, e64, m4, ta, ma
				; CHECK-NEXT: vmadd.vx v8, a1, v12
				; CHECK-NEXT: ret
				%head = insertelement <8 x i1> poison, i1 true, i32 0
				%m = shufflevector <8 x i1> %head, <8 x i1> poison, <8 x i32> zeroinitializer
				%elt.head1 = insertelement <8 x i64> poison, i64 3, i32 0
				%vb = shufflevector <8 x i64> %elt.head1, <8 x i64> poison, <8 x i32> zeroinitializer
				%elt.head2 = insertelement <8 x i64> poison, i64 7, i32 0
				%vc = shufflevector <8 x i64> %elt.head2, <8 x i64> poison, <8 x i32> zeroinitializer
				%vadd = call <8 x i64> @llvm.vp.add.v8i64(<8 x i64> %va, <8 x i64> %vb, <8 x i1> %m, i32 %evl)
				%v = call <8 x i64> @llvm.vp.mul.v8i64(<8 x i64> %vadd, <8 x i64> %vc, <8 x i1> %m, i32 %evl)
				ret <8 x i64> %v
				}

llvm/test/CodeGen/RISCV/rvv/vmul-vp.ll

	Show First 20 Lines • Show All 1,285 Lines • ▼ Show 20 Lines
	; RV64-NEXT: ret			; RV64-NEXT: ret
	%elt.head = insertelement <vscale x 8 x i64> poison, i64 %b, i32 0			%elt.head = insertelement <vscale x 8 x i64> poison, i64 %b, i32 0
	%vb = shufflevector <vscale x 8 x i64> %elt.head, <vscale x 8 x i64> poison, <vscale x 8 x i32> zeroinitializer			%vb = shufflevector <vscale x 8 x i64> %elt.head, <vscale x 8 x i64> poison, <vscale x 8 x i32> zeroinitializer
	%head = insertelement <vscale x 8 x i1> poison, i1 true, i32 0			%head = insertelement <vscale x 8 x i1> poison, i1 true, i32 0
	%m = shufflevector <vscale x 8 x i1> %head, <vscale x 8 x i1> poison, <vscale x 8 x i32> zeroinitializer			%m = shufflevector <vscale x 8 x i1> %head, <vscale x 8 x i1> poison, <vscale x 8 x i32> zeroinitializer
	%v = call <vscale x 8 x i64> @llvm.vp.mul.nxv8i64(<vscale x 8 x i64> %va, <vscale x 8 x i64> %vb, <vscale x 8 x i1> %m, i32 %evl)			%v = call <vscale x 8 x i64> @llvm.vp.mul.nxv8i64(<vscale x 8 x i64> %va, <vscale x 8 x i64> %vb, <vscale x 8 x i1> %m, i32 %evl)
	ret <vscale x 8 x i64> %v			ret <vscale x 8 x i64> %v
	}			}

				; Masked vp.mul of %va by an undef vector. The expected output writes
				; a zero splat (vmv.v.i 0) to the result; the vsetvli takes zero, not
				; %evl (a0), as its length operand and no mask operand appears.
				define <vscale x 8 x i64> @vmul_vv_undef_nxv8i64(<vscale x 8 x i64> %va, <vscale x 8 x i1> %m, i32 zeroext %evl) {
				; CHECK-LABEL: vmul_vv_undef_nxv8i64:
				; CHECK: # %bb.0:
				; CHECK-NEXT: vsetvli a0, zero, e64, m8, ta, ma
				; CHECK-NEXT: vmv.v.i v8, 0
				; CHECK-NEXT: ret
				%v = call <vscale x 8 x i64> @llvm.vp.mul.nxv8i64(<vscale x 8 x i64> %va, <vscale x 8 x i64> undef, <vscale x 8 x i1> %m, i32 %evl)
				ret <vscale x 8 x i64> %v
				}

				; All-true-mask vp.mul of %va by an undef vector. The expected output
				; is the same zero splat as the masked variant above.
				; NOTE(review): this function is named "vx" while the masked sibling
				; with the same undef vector operand is named "vv" -- presumably this
				; should be vmul_vv_undef_nxv8i64_unmasked; confirm and rename.
				define <vscale x 8 x i64> @vmul_vx_undef_nxv8i64_unmasked(<vscale x 8 x i64> %va, i32 zeroext %evl) {
				; CHECK-LABEL: vmul_vx_undef_nxv8i64_unmasked:
				; CHECK: # %bb.0:
				; CHECK-NEXT: vsetvli a0, zero, e64, m8, ta, ma
				; CHECK-NEXT: vmv.v.i v8, 0
				; CHECK-NEXT: ret
				%head = insertelement <vscale x 8 x i1> poison, i1 true, i32 0
				%m = shufflevector <vscale x 8 x i1> %head, <vscale x 8 x i1> poison, <vscale x 8 x i32> zeroinitializer
				%v = call <vscale x 8 x i64> @llvm.vp.mul.nxv8i64(<vscale x 8 x i64> %va, <vscale x 8 x i64> undef, <vscale x 8 x i1> %m, i32 %evl)
				ret <vscale x 8 x i64> %v
				}

				; Masked vp.mul of %va by a splat of 0. The expected output still
				; performs the multiply: a masked vmul.vx with the zero register as
				; the scalar operand, not a constant-zero result.
				define <vscale x 8 x i64> @vmul_vx_zero_nxv8i64(<vscale x 8 x i64> %va, <vscale x 8 x i1> %m, i32 zeroext %evl) {
				; CHECK-LABEL: vmul_vx_zero_nxv8i64:
				; CHECK: # %bb.0:
				; CHECK-NEXT: vsetvli zero, a0, e64, m8, ta, ma
				; CHECK-NEXT: vmul.vx v8, v8, zero, v0.t
				; CHECK-NEXT: ret
				%elt.head = insertelement <vscale x 8 x i64> poison, i64 0, i32 0
				%vb = shufflevector <vscale x 8 x i64> %elt.head, <vscale x 8 x i64> poison, <vscale x 8 x i32> zeroinitializer
				%v = call <vscale x 8 x i64> @llvm.vp.mul.nxv8i64(<vscale x 8 x i64> %va, <vscale x 8 x i64> %vb, <vscale x 8 x i1> %m, i32 %evl)
				ret <vscale x 8 x i64> %v
				}

				; All-true-mask vp.mul of %va by a splat of 0. The expected output is
				; an unmasked vmul.vx with the zero register as the scalar operand.
				define <vscale x 8 x i64> @vmul_vx_zero_nxv8i64_unmasked(<vscale x 8 x i64> %va, i32 zeroext %evl) {
				; CHECK-LABEL: vmul_vx_zero_nxv8i64_unmasked:
				; CHECK: # %bb.0:
				; CHECK-NEXT: vsetvli zero, a0, e64, m8, ta, ma
				; CHECK-NEXT: vmul.vx v8, v8, zero
				; CHECK-NEXT: ret
				%elt.head = insertelement <vscale x 8 x i64> poison, i64 0, i32 0
				%vb = shufflevector <vscale x 8 x i64> %elt.head, <vscale x 8 x i64> poison, <vscale x 8 x i32> zeroinitializer
				%head = insertelement <vscale x 8 x i1> poison, i1 true, i32 0
				%m = shufflevector <vscale x 8 x i1> %head, <vscale x 8 x i1> poison, <vscale x 8 x i32> zeroinitializer
				%v = call <vscale x 8 x i64> @llvm.vp.mul.nxv8i64(<vscale x 8 x i64> %va, <vscale x 8 x i64> %vb, <vscale x 8 x i1> %m, i32 %evl)
				ret <vscale x 8 x i64> %v
				}

				; Masked vp.mul of %va by a splat of 1. The expected output is a
				; masked vsll.vi with shift amount 0.
				; NOTE(review): a shift by 0 leaves the active lanes equal to %va --
				; presumably the multiply-by-one could be removed outright; confirm.
				define <vscale x 8 x i64> @vmul_vx_one_nxv8i64(<vscale x 8 x i64> %va, <vscale x 8 x i1> %m, i32 zeroext %evl) {
				; CHECK-LABEL: vmul_vx_one_nxv8i64:
				; CHECK: # %bb.0:
				; CHECK-NEXT: vsetvli zero, a0, e64, m8, ta, ma
				; CHECK-NEXT: vsll.vi v8, v8, 0, v0.t
				; CHECK-NEXT: ret
				%elt.head = insertelement <vscale x 8 x i64> poison, i64 1, i32 0
				%vb = shufflevector <vscale x 8 x i64> %elt.head, <vscale x 8 x i64> poison, <vscale x 8 x i32> zeroinitializer
				%v = call <vscale x 8 x i64> @llvm.vp.mul.nxv8i64(<vscale x 8 x i64> %va, <vscale x 8 x i64> %vb, <vscale x 8 x i1> %m, i32 %evl)
				ret <vscale x 8 x i64> %v
				}

				; All-true-mask vp.mul of %va by a splat of 1. The expected output is
				; an unmasked vsll.vi with shift amount 0.
				; NOTE(review): presumably this shift by 0 is redundant and the result
				; could simply be %va; confirm.
				define <vscale x 8 x i64> @vmul_vx_one_nxv8i64_unmasked(<vscale x 8 x i64> %va, i32 zeroext %evl) {
				; CHECK-LABEL: vmul_vx_one_nxv8i64_unmasked:
				; CHECK: # %bb.0:
				; CHECK-NEXT: vsetvli zero, a0, e64, m8, ta, ma
				; CHECK-NEXT: vsll.vi v8, v8, 0
				; CHECK-NEXT: ret
				%elt.head = insertelement <vscale x 8 x i64> poison, i64 1, i32 0
				%vb = shufflevector <vscale x 8 x i64> %elt.head, <vscale x 8 x i64> poison, <vscale x 8 x i32> zeroinitializer
				%head = insertelement <vscale x 8 x i1> poison, i1 true, i32 0
				%m = shufflevector <vscale x 8 x i1> %head, <vscale x 8 x i1> poison, <vscale x 8 x i32> zeroinitializer
				%v = call <vscale x 8 x i64> @llvm.vp.mul.nxv8i64(<vscale x 8 x i64> %va, <vscale x 8 x i64> %vb, <vscale x 8 x i1> %m, i32 %evl)
				ret <vscale x 8 x i64> %v
				}

				; Masked vp.mul of %va by a splat of -1. The expected output loads -1
				; with li and issues a masked vmul.vx; no negate or subtract appears.
				define <vscale x 8 x i64> @vmul_vx_negone_nxv8i64(<vscale x 8 x i64> %va, <vscale x 8 x i1> %m, i32 zeroext %evl) {
				; CHECK-LABEL: vmul_vx_negone_nxv8i64:
				; CHECK: # %bb.0:
				; CHECK-NEXT: li a1, -1
				; CHECK-NEXT: vsetvli zero, a0, e64, m8, ta, ma
				; CHECK-NEXT: vmul.vx v8, v8, a1, v0.t
				; CHECK-NEXT: ret
				%elt.head = insertelement <vscale x 8 x i64> poison, i64 -1, i32 0
				%vb = shufflevector <vscale x 8 x i64> %elt.head, <vscale x 8 x i64> poison, <vscale x 8 x i32> zeroinitializer
				%v = call <vscale x 8 x i64> @llvm.vp.mul.nxv8i64(<vscale x 8 x i64> %va, <vscale x 8 x i64> %vb, <vscale x 8 x i1> %m, i32 %evl)
				ret <vscale x 8 x i64> %v
				}

				; All-true-mask vp.mul of %va by a splat of -1. The expected output is
				; li -1 followed by an unmasked vmul.vx.
				define <vscale x 8 x i64> @vmul_vx_negone_nxv8i64_unmasked(<vscale x 8 x i64> %va, i32 zeroext %evl) {
				; CHECK-LABEL: vmul_vx_negone_nxv8i64_unmasked:
				; CHECK: # %bb.0:
				; CHECK-NEXT: li a1, -1
				; CHECK-NEXT: vsetvli zero, a0, e64, m8, ta, ma
				; CHECK-NEXT: vmul.vx v8, v8, a1
				; CHECK-NEXT: ret
				%elt.head = insertelement <vscale x 8 x i64> poison, i64 -1, i32 0
				%vb = shufflevector <vscale x 8 x i64> %elt.head, <vscale x 8 x i64> poison, <vscale x 8 x i32> zeroinitializer
				%head = insertelement <vscale x 8 x i1> poison, i1 true, i32 0
				%m = shufflevector <vscale x 8 x i1> %head, <vscale x 8 x i1> poison, <vscale x 8 x i32> zeroinitializer
				%v = call <vscale x 8 x i64> @llvm.vp.mul.nxv8i64(<vscale x 8 x i64> %va, <vscale x 8 x i64> %vb, <vscale x 8 x i1> %m, i32 %evl)
				ret <vscale x 8 x i64> %v
				}

				; Masked vp.mul of %va by a splat of 64 (2^6). The expected output
				; replaces the multiply with a masked vsll.vi by 6.
				define <vscale x 8 x i64> @vmul_vx_pow2_nxv8i64(<vscale x 8 x i64> %va, <vscale x 8 x i1> %m, i32 zeroext %evl) {
				; CHECK-LABEL: vmul_vx_pow2_nxv8i64:
				; CHECK: # %bb.0:
				; CHECK-NEXT: vsetvli zero, a0, e64, m8, ta, ma
				; CHECK-NEXT: vsll.vi v8, v8, 6, v0.t
				; CHECK-NEXT: ret
				%elt.head = insertelement <vscale x 8 x i64> poison, i64 64, i32 0
				%vb = shufflevector <vscale x 8 x i64> %elt.head, <vscale x 8 x i64> poison, <vscale x 8 x i32> zeroinitializer
				%v = call <vscale x 8 x i64> @llvm.vp.mul.nxv8i64(<vscale x 8 x i64> %va, <vscale x 8 x i64> %vb, <vscale x 8 x i1> %m, i32 %evl)
				ret <vscale x 8 x i64> %v
				}

				; All-true-mask vp.mul of %va by a splat of 64 (2^6). The expected
				; output is an unmasked vsll.vi by 6 under the %evl-based vsetvli.
				define <vscale x 8 x i64> @vmul_vx_pow2_nxv8i64_unmasked(<vscale x 8 x i64> %va, i32 zeroext %evl) {
				; CHECK-LABEL: vmul_vx_pow2_nxv8i64_unmasked:
				; CHECK: # %bb.0:
				; CHECK-NEXT: vsetvli zero, a0, e64, m8, ta, ma
				; CHECK-NEXT: vsll.vi v8, v8, 6
				; CHECK-NEXT: ret
				%elt.head = insertelement <vscale x 8 x i64> poison, i64 64, i32 0
				%vb = shufflevector <vscale x 8 x i64> %elt.head, <vscale x 8 x i64> poison, <vscale x 8 x i32> zeroinitializer
				%head = insertelement <vscale x 8 x i1> poison, i1 true, i32 0
				%m = shufflevector <vscale x 8 x i1> %head, <vscale x 8 x i1> poison, <vscale x 8 x i32> zeroinitializer
				%v = call <vscale x 8 x i64> @llvm.vp.mul.nxv8i64(<vscale x 8 x i64> %va, <vscale x 8 x i64> %vb, <vscale x 8 x i1> %m, i32 %evl)
				ret <vscale x 8 x i64> %v
				}

				; Masked vp.mul of %va by a splat of -64 (a negated power of two).
				; The expected output is li -64 plus a masked vmul.vx; unlike the
				; positive power-of-two case, no shift appears.
				define <vscale x 8 x i64> @vmul_vx_negpow2_nxv8i64(<vscale x 8 x i64> %va, <vscale x 8 x i1> %m, i32 zeroext %evl) {
				; CHECK-LABEL: vmul_vx_negpow2_nxv8i64:
				; CHECK: # %bb.0:
				; CHECK-NEXT: li a1, -64
				; CHECK-NEXT: vsetvli zero, a0, e64, m8, ta, ma
				; CHECK-NEXT: vmul.vx v8, v8, a1, v0.t
				; CHECK-NEXT: ret
				%elt.head = insertelement <vscale x 8 x i64> poison, i64 -64, i32 0
				%vb = shufflevector <vscale x 8 x i64> %elt.head, <vscale x 8 x i64> poison, <vscale x 8 x i32> zeroinitializer
				%v = call <vscale x 8 x i64> @llvm.vp.mul.nxv8i64(<vscale x 8 x i64> %va, <vscale x 8 x i64> %vb, <vscale x 8 x i1> %m, i32 %evl)
				ret <vscale x 8 x i64> %v
				}

				; All-true-mask vp.mul of %va by a splat of -64. The expected output
				; is li -64 followed by an unmasked vmul.vx.
				define <vscale x 8 x i64> @vmul_vx_negpow2_nxv8i64_unmasked(<vscale x 8 x i64> %va, i32 zeroext %evl) {
				; CHECK-LABEL: vmul_vx_negpow2_nxv8i64_unmasked:
				; CHECK: # %bb.0:
				; CHECK-NEXT: li a1, -64
				; CHECK-NEXT: vsetvli zero, a0, e64, m8, ta, ma
				; CHECK-NEXT: vmul.vx v8, v8, a1
				; CHECK-NEXT: ret
				%elt.head = insertelement <vscale x 8 x i64> poison, i64 -64, i32 0
				%vb = shufflevector <vscale x 8 x i64> %elt.head, <vscale x 8 x i64> poison, <vscale x 8 x i32> zeroinitializer
				%head = insertelement <vscale x 8 x i1> poison, i1 true, i32 0
				%m = shufflevector <vscale x 8 x i1> %head, <vscale x 8 x i1> poison, <vscale x 8 x i32> zeroinitializer
				%v = call <vscale x 8 x i64> @llvm.vp.mul.nxv8i64(<vscale x 8 x i64> %va, <vscale x 8 x i64> %vb, <vscale x 8 x i1> %m, i32 %evl)
				ret <vscale x 8 x i64> %v
				}

				; Predicated shift-left intrinsic called by the vmul_vshl_* tests that follow.
				declare <vscale x 8 x i64> @llvm.vp.shl.nxv8i64(<vscale x 8 x i64>, <vscale x 8 x i64>, <vscale x 8 x i1>, i32)

				; Masked vp.shl by a splat of 3 feeding a masked vp.mul by a splat of 7,
				; both using the same %m and %evl. The expected output is a single
				; vmul.vx by 56 (7 << 3).
				; NOTE(review): the expected output has no v0.t operand and its vsetvli
				; takes zero rather than %evl (a0), so neither the mask nor the EVL is
				; used -- confirm this is intended for the masked form.
				define <vscale x 8 x i64> @vmul_vshl_vx_nxv8i64(<vscale x 8 x i64> %va, <vscale x 8 x i1> %m, i32 zeroext %evl) {
				; CHECK-LABEL: vmul_vshl_vx_nxv8i64:
				; CHECK: # %bb.0:
				; CHECK-NEXT: li a0, 56
				; CHECK-NEXT: vsetvli a1, zero, e64, m8, ta, ma
				; CHECK-NEXT: vmul.vx v8, v8, a0
				; CHECK-NEXT: ret
				%elt.head1 = insertelement <vscale x 8 x i64> poison, i64 3, i32 0
				%vb = shufflevector <vscale x 8 x i64> %elt.head1, <vscale x 8 x i64> poison, <vscale x 8 x i32> zeroinitializer
				%elt.head2 = insertelement <vscale x 8 x i64> poison, i64 7, i32 0
				%vc = shufflevector <vscale x 8 x i64> %elt.head2, <vscale x 8 x i64> poison, <vscale x 8 x i32> zeroinitializer
				%vshl = call <vscale x 8 x i64> @llvm.vp.shl.nxv8i64(<vscale x 8 x i64> %va, <vscale x 8 x i64> %vb, <vscale x 8 x i1> %m, i32 %evl)
				%v = call <vscale x 8 x i64> @llvm.vp.mul.nxv8i64(<vscale x 8 x i64> %vshl, <vscale x 8 x i64> %vc, <vscale x 8 x i1> %m, i32 %evl)
				ret <vscale x 8 x i64> %v
				}

				; All-true-mask form of (%va << 3) * 7. The expected output is a single
				; vmul.vx by 56 (7 << 3); the vsetvli takes zero rather than %evl (a0)
				; as its length operand.
				define <vscale x 8 x i64> @vmul_vshl_vx_nxv8i64_unmasked(<vscale x 8 x i64> %va, i32 zeroext %evl) {
				; CHECK-LABEL: vmul_vshl_vx_nxv8i64_unmasked:
				; CHECK: # %bb.0:
				; CHECK-NEXT: li a0, 56
				; CHECK-NEXT: vsetvli a1, zero, e64, m8, ta, ma
				; CHECK-NEXT: vmul.vx v8, v8, a0
				; CHECK-NEXT: ret
				%head = insertelement <vscale x 8 x i1> poison, i1 true, i32 0
				%m = shufflevector <vscale x 8 x i1> %head, <vscale x 8 x i1> poison, <vscale x 8 x i32> zeroinitializer
				%elt.head1 = insertelement <vscale x 8 x i64> poison, i64 3, i32 0
				%vb = shufflevector <vscale x 8 x i64> %elt.head1, <vscale x 8 x i64> poison, <vscale x 8 x i32> zeroinitializer
				%elt.head2 = insertelement <vscale x 8 x i64> poison, i64 7, i32 0
				%vc = shufflevector <vscale x 8 x i64> %elt.head2, <vscale x 8 x i64> poison, <vscale x 8 x i32> zeroinitializer
				%vshl = call <vscale x 8 x i64> @llvm.vp.shl.nxv8i64(<vscale x 8 x i64> %va, <vscale x 8 x i64> %vb, <vscale x 8 x i1> %m, i32 %evl)
				%v = call <vscale x 8 x i64> @llvm.vp.mul.nxv8i64(<vscale x 8 x i64> %vshl, <vscale x 8 x i64> %vc, <vscale x 8 x i1> %m, i32 %evl)
				ret <vscale x 8 x i64> %v
				}

				; Masked vp.shl of %va by a splat of 7, then a masked vp.mul by the
				; non-constant vector %vb. In the expected output the order is swapped
				; relative to the IR: masked vmul.vv first, then masked vsll.vi by 7.
				define <vscale x 8 x i64> @vmul_vshl_vv_nxv8i64(<vscale x 8 x i64> %va, <vscale x 8 x i64> %vb, <vscale x 8 x i1> %m, i32 zeroext %evl) {
				; CHECK-LABEL: vmul_vshl_vv_nxv8i64:
				; CHECK: # %bb.0:
				; CHECK-NEXT: vsetvli zero, a0, e64, m8, ta, ma
				; CHECK-NEXT: vmul.vv v8, v8, v16, v0.t
				; CHECK-NEXT: vsll.vi v8, v8, 7, v0.t
				; CHECK-NEXT: ret
				%elt.head = insertelement <vscale x 8 x i64> poison, i64 7, i32 0
				%vc = shufflevector <vscale x 8 x i64> %elt.head, <vscale x 8 x i64> poison, <vscale x 8 x i32> zeroinitializer
				%vshl = call <vscale x 8 x i64> @llvm.vp.shl.nxv8i64(<vscale x 8 x i64> %va, <vscale x 8 x i64> %vc, <vscale x 8 x i1> %m, i32 %evl)
				%v = call <vscale x 8 x i64> @llvm.vp.mul.nxv8i64(<vscale x 8 x i64> %vshl, <vscale x 8 x i64> %vb, <vscale x 8 x i1> %m, i32 %evl)
				ret <vscale x 8 x i64> %v
				}

				; All-true-mask form of (%va << 7) * %vb. The expected output is an
				; unmasked vmul.vv followed by an unmasked vsll.vi by 7, i.e. the
				; shift is applied to the product.
				define <vscale x 8 x i64> @vmul_vshl_vv_nxv8i64_unmasked(<vscale x 8 x i64> %va, <vscale x 8 x i64> %vb, i32 zeroext %evl) {
				; CHECK-LABEL: vmul_vshl_vv_nxv8i64_unmasked:
				; CHECK: # %bb.0:
				; CHECK-NEXT: vsetvli zero, a0, e64, m8, ta, ma
				; CHECK-NEXT: vmul.vv v8, v8, v16
				; CHECK-NEXT: vsll.vi v8, v8, 7
				; CHECK-NEXT: ret
				%head = insertelement <vscale x 8 x i1> poison, i1 true, i32 0
				%m = shufflevector <vscale x 8 x i1> %head, <vscale x 8 x i1> poison, <vscale x 8 x i32> zeroinitializer
				%elt.head = insertelement <vscale x 8 x i64> poison, i64 7, i32 0
				%vc = shufflevector <vscale x 8 x i64> %elt.head, <vscale x 8 x i64> poison, <vscale x 8 x i32> zeroinitializer
				%vshl = call <vscale x 8 x i64> @llvm.vp.shl.nxv8i64(<vscale x 8 x i64> %va, <vscale x 8 x i64> %vc, <vscale x 8 x i1> %m, i32 %evl)
				%v = call <vscale x 8 x i64> @llvm.vp.mul.nxv8i64(<vscale x 8 x i64> %vshl, <vscale x 8 x i64> %vb, <vscale x 8 x i1> %m, i32 %evl)
				ret <vscale x 8 x i64> %v
				}

				; Predicated add intrinsic called by the vmul_vadd_* tests that follow.
				declare <vscale x 8 x i64> @llvm.vp.add.nxv8i64(<vscale x 8 x i64>, <vscale x 8 x i64>, <vscale x 8 x i1>, i32)

				; Masked vp.add of a splat of 3 feeding a masked vp.mul by a splat of 7,
				; both using the same %m and %evl. The expected output distributes the
				; multiply: masked vmul.vx by 7, then masked vadd.vx of 21 (3 * 7).
				define <vscale x 8 x i64> @vmul_vadd_vx_nxv8i64(<vscale x 8 x i64> %va, <vscale x 8 x i1> %m, i32 zeroext %evl) {
				; CHECK-LABEL: vmul_vadd_vx_nxv8i64:
				; CHECK: # %bb.0:
				; CHECK-NEXT: li a1, 7
				; CHECK-NEXT: vsetvli zero, a0, e64, m8, ta, ma
				; CHECK-NEXT: vmul.vx v8, v8, a1, v0.t
				; CHECK-NEXT: li a0, 21
				; CHECK-NEXT: vadd.vx v8, v8, a0, v0.t
				; CHECK-NEXT: ret
				%elt.head1 = insertelement <vscale x 8 x i64> poison, i64 3, i32 0
				%vb = shufflevector <vscale x 8 x i64> %elt.head1, <vscale x 8 x i64> poison, <vscale x 8 x i32> zeroinitializer
				%elt.head2 = insertelement <vscale x 8 x i64> poison, i64 7, i32 0
				%vc = shufflevector <vscale x 8 x i64> %elt.head2, <vscale x 8 x i64> poison, <vscale x 8 x i32> zeroinitializer
				%vadd = call <vscale x 8 x i64> @llvm.vp.add.nxv8i64(<vscale x 8 x i64> %va, <vscale x 8 x i64> %vb, <vscale x 8 x i1> %m, i32 %evl)
				%v = call <vscale x 8 x i64> @llvm.vp.mul.nxv8i64(<vscale x 8 x i64> %vadd, <vscale x 8 x i64> %vc, <vscale x 8 x i1> %m, i32 %evl)
				ret <vscale x 8 x i64> %v
				}

				; All-true-mask form of (%va + 3) * 7. The expected output uses the
				; constants 7 and 21 (3 * 7): a splat of 21 is built in v16 under a
				; vsetvli that takes zero as its length operand, then a vmadd.vx with
				; scalar 7 runs under a vsetvli that takes %evl (a0).
				define <vscale x 8 x i64> @vmul_vadd_vx_nxv8i64_unmasked(<vscale x 8 x i64> %va, i32 zeroext %evl) {
				; CHECK-LABEL: vmul_vadd_vx_nxv8i64_unmasked:
				; CHECK: # %bb.0:
				; CHECK-NEXT: li a1, 21
				; CHECK-NEXT: vsetvli a2, zero, e64, m8, ta, ma
				; CHECK-NEXT: vmv.v.x v16, a1
				; CHECK-NEXT: li a1, 7
				; CHECK-NEXT: vsetvli zero, a0, e64, m8, ta, ma
				; CHECK-NEXT: vmadd.vx v8, a1, v16
				; CHECK-NEXT: ret
				%head = insertelement <vscale x 8 x i1> poison, i1 true, i32 0
				%m = shufflevector <vscale x 8 x i1> %head, <vscale x 8 x i1> poison, <vscale x 8 x i32> zeroinitializer
				%elt.head1 = insertelement <vscale x 8 x i64> poison, i64 3, i32 0
				%vb = shufflevector <vscale x 8 x i64> %elt.head1, <vscale x 8 x i64> poison, <vscale x 8 x i32> zeroinitializer
				%elt.head2 = insertelement <vscale x 8 x i64> poison, i64 7, i32 0
				%vc = shufflevector <vscale x 8 x i64> %elt.head2, <vscale x 8 x i64> poison, <vscale x 8 x i32> zeroinitializer
				%vadd = call <vscale x 8 x i64> @llvm.vp.add.nxv8i64(<vscale x 8 x i64> %va, <vscale x 8 x i64> %vb, <vscale x 8 x i1> %m, i32 %evl)
				%v = call <vscale x 8 x i64> @llvm.vp.mul.nxv8i64(<vscale x 8 x i64> %vadd, <vscale x 8 x i64> %vc, <vscale x 8 x i1> %m, i32 %evl)
				ret <vscale x 8 x i64> %v
				}

This is an archive of the discontinued LLVM Phabricator instance.

[DAGCombiner][VP] Add DAGCombine for VP_MUL.
Needs Review | Public

Details

Diff Detail

Event Timeline

Revision Contents

Diff 529839

llvm/lib/CodeGen/SelectionDAG/DAGCombiner.cpp

llvm/test/CodeGen/RISCV/rvv/fixed-vectors-vmul-vp.ll

llvm/test/CodeGen/RISCV/rvv/vmul-vp.ll

This is an archive of the discontinued LLVM Phabricator instance.

[DAGCombiner][VP] Add DAGCombine for VP_MUL. Needs Review | Public

Details

Diff Detail

Event Timeline

Revision Contents

Diff 529839

llvm/lib/CodeGen/SelectionDAG/DAGCombiner.cpp

llvm/test/CodeGen/RISCV/rvv/fixed-vectors-vmul-vp.ll

llvm/test/CodeGen/RISCV/rvv/vmul-vp.ll

[DAGCombiner][VP] Add DAGCombine for VP_MUL.
Needs Review | Public