Diff 98548

llvm/include/llvm/Target/TargetLowering.h

Show First 20 Lines • Show All 2,057 Lines • ▼ Show 20 Lines	public:
}		}

// Return true if it is profitable to use a scalar input to a BUILD_VECTOR		// Return true if it is profitable to use a scalar input to a BUILD_VECTOR
// even if the vector itself has multiple uses.		// even if the vector itself has multiple uses.
virtual bool aggressivelyPreferBuildVectorSources(EVT VecVT) const {		virtual bool aggressivelyPreferBuildVectorSources(EVT VecVT) const {
return false;		return false;
}		}

// Return true if the target instruction that performs a << b actually
// performs a << (b % (sizeof(a) * 8)), i.e. the shift amount is implicitly
// reduced modulo the bit width of the shifted value.
//
// Inst must be ISD::SHL, ISD::SRA or ISD::SRL (enforced by the assert below);
// ReturnType is the value type of the shift being queried.
// This default implementation reports no modulo-shift support.
virtual bool supportsModuloShift(ISD::NodeType Inst, EVT ReturnType) const {
  assert((Inst == ISD::SHL || Inst == ISD::SRA || Inst == ISD::SRL) &&
         "Expect a shift instruction");
  return false;
}

//===--------------------------------------------------------------------===//		//===--------------------------------------------------------------------===//
// Runtime Library hooks		// Runtime Library hooks
//		//

/// Rename the default libcall routine name for the specified libcall.		/// Rename the default libcall routine name for the specified libcall.
void setLibcallName(RTLIB::Libcall Call, const char *Name) {		void setLibcallName(RTLIB::Libcall Call, const char *Name) {
LibcallRoutineNames[Call] = Name;		LibcallRoutineNames[Call] = Name;
}		}
▲ Show 20 Lines • Show All 1,270 Lines • Show Last 20 Lines

llvm/lib/CodeGen/SelectionDAG/DAGCombiner.cpp

This file is larger than 256 KB, so syntax highlighting is disabled by default.

Show First 20 Lines • Show All 5,307 Lines • ▼ Show 20 Lines	if (N1CV && N1CV->isConstant()) {
if (SDValue C = DAG.FoldConstantArithmetic(ISD::SHL, SDLoc(N), VT,		if (SDValue C = DAG.FoldConstantArithmetic(ISD::SHL, SDLoc(N), VT,
N01CV, N1CV))		N01CV, N1CV))
return DAG.getNode(ISD::AND, SDLoc(N), VT, N00, C);		return DAG.getNode(ISD::AND, SDLoc(N), VT, N00, C);
}		}
}		}
}		}
}		}

// If the target supports masking y in (shl, y),
// fold (shl x, (and y, (numbits(x) - 1))) -> (shl x, y)
if (TLI.isOperationLegal(ISD::SHL, VT) &&
TLI.supportsModuloShift(ISD::SHL, VT) && N1->getOpcode() == ISD::AND) {
if (ConstantSDNode *Mask = isConstOrConstSplat(N1->getOperand(1))) {
if (Mask->getZExtValue() == OpSizeInBits - 1) {
return DAG.getNode(ISD::SHL, SDLoc(N), VT, N0, N1->getOperand(0));
}
}
}

ConstantSDNode *N1C = isConstOrConstSplat(N1);		ConstantSDNode *N1C = isConstOrConstSplat(N1);

// fold (shl c1, c2) -> c1<<c2		// fold (shl c1, c2) -> c1<<c2
ConstantSDNode *N0C = getAsNonOpaqueConstant(N0);		ConstantSDNode *N0C = getAsNonOpaqueConstant(N0);
if (N0C && N1C && !N1C->isOpaque())		if (N0C && N1C && !N1C->isOpaque())
return DAG.FoldConstantArithmetic(ISD::SHL, SDLoc(N), VT, N0C, N1C);		return DAG.FoldConstantArithmetic(ISD::SHL, SDLoc(N), VT, N0C, N1C);
// fold (shl 0, x) -> 0		// fold (shl 0, x) -> 0
if (isNullConstantOrNullSplatConstant(N0))		if (isNullConstantOrNullSplatConstant(N0))
▲ Show 20 Lines • Show All 182 Lines • ▼ Show 20 Lines
}		}

SDValue DAGCombiner::visitSRA(SDNode *N) {		SDValue DAGCombiner::visitSRA(SDNode *N) {
SDValue N0 = N->getOperand(0);		SDValue N0 = N->getOperand(0);
SDValue N1 = N->getOperand(1);		SDValue N1 = N->getOperand(1);
EVT VT = N0.getValueType();		EVT VT = N0.getValueType();
unsigned OpSizeInBits = VT.getScalarSizeInBits();		unsigned OpSizeInBits = VT.getScalarSizeInBits();

// If the target supports masking y in (sra, y),
// fold (sra x, (and y, (numbits(x) - 1))) -> (sra x, y)
if (TLI.isOperationLegal(ISD::SRA, VT) &&
TLI.supportsModuloShift(ISD::SRA, VT) && N1->getOpcode() == ISD::AND) {
if (ConstantSDNode *Mask = isConstOrConstSplat(N1->getOperand(1))) {
if (Mask->getZExtValue() == OpSizeInBits - 1) {
return DAG.getNode(ISD::SRA, SDLoc(N), VT, N0, N1->getOperand(0));
}
}
}

// Arithmetic shifting an all-sign-bit value is a no-op.		// Arithmetic shifting an all-sign-bit value is a no-op.
// fold (sra 0, x) -> 0		// fold (sra 0, x) -> 0
// fold (sra -1, x) -> -1		// fold (sra -1, x) -> -1
if (DAG.ComputeNumSignBits(N0) == OpSizeInBits)		if (DAG.ComputeNumSignBits(N0) == OpSizeInBits)
return N0;		return N0;

// fold vector ops		// fold vector ops
if (VT.isVector())		if (VT.isVector())
▲ Show 20 Lines • Show All 138 Lines • ▼ Show 20 Lines
}		}

SDValue DAGCombiner::visitSRL(SDNode *N) {		SDValue DAGCombiner::visitSRL(SDNode *N) {
SDValue N0 = N->getOperand(0);		SDValue N0 = N->getOperand(0);
SDValue N1 = N->getOperand(1);		SDValue N1 = N->getOperand(1);
EVT VT = N0.getValueType();		EVT VT = N0.getValueType();
unsigned OpSizeInBits = VT.getScalarSizeInBits();		unsigned OpSizeInBits = VT.getScalarSizeInBits();

// If the target supports masking y in (srl, y),
// fold (srl x, (and y, (numbits(x) - 1))) -> (srl x, y)
if (TLI.isOperationLegal(ISD::SRL, VT) &&
TLI.supportsModuloShift(ISD::SRL, VT) && N1->getOpcode() == ISD::AND) {
if (ConstantSDNode *Mask = isConstOrConstSplat(N1->getOperand(1))) {
if (Mask->getZExtValue() == OpSizeInBits - 1) {
return DAG.getNode(ISD::SRL, SDLoc(N), VT, N0, N1->getOperand(0));
}
}
}

// fold vector ops		// fold vector ops
if (VT.isVector())		if (VT.isVector())
if (SDValue FoldedVOp = SimplifyVBinOp(N))		if (SDValue FoldedVOp = SimplifyVBinOp(N))
return FoldedVOp;		return FoldedVOp;

ConstantSDNode *N1C = isConstOrConstSplat(N1);		ConstantSDNode *N1C = isConstOrConstSplat(N1);

// fold (srl c1, c2) -> c1 >>u c2		// fold (srl c1, c2) -> c1 >>u c2
▲ Show 20 Lines • Show All 10,966 Lines • Show Last 20 Lines

llvm/lib/Target/PowerPC/PPCISelLowering.h

Show First 20 Lines • Show All 111 Lines • ▼ Show 20 Lines	enum NodeType : unsigned {
/// compute an offset from native SP to the address of the most recent		/// compute an offset from native SP to the address of the most recent
/// dynamic alloca.		/// dynamic alloca.
DYNAREAOFFSET,		DYNAREAOFFSET,

/// GlobalBaseReg - On Darwin, this node represents the result of the mflr		/// GlobalBaseReg - On Darwin, this node represents the result of the mflr
/// at function entry, used for PIC code.		/// at function entry, used for PIC code.
GlobalBaseReg,		GlobalBaseReg,

/// These nodes represent the 32-bit PPC shifts that operate on 6-bit		/// These nodes represent PPC shifts. For vector types, arbitrary shift
/// shift amounts. These nodes are generated by the multi-precision shift		/// amounts are supported - the number of bits actually shifted is the
/// code.		/// shift amount modulo the element width.
		efriedmaUnsubmitted Not Done Reply Inline Actions Maybe leave the comment noting that 32-bit shifts are modulo 64? efriedma: Maybe leave the comment noting that 32-bit shifts are modulo 64?
		timshenAuthorUnsubmitted Not Done Reply Inline Actions Documented. It's actually more subtle than "modulo 64". FWIW: For (shl (i32 a), b): if ((b % 64) >= 32) return 0; return a << (b % 32) timshen: Documented. It's actually more subtle than "modulo 64". FWIW: For (shl (i32 a), b): if…
SRL, SRA, SHL,		SRL, SRA, SHL,

/// The combination of sra[wd]i and addze used to implement signed		/// The combination of sra[wd]i and addze used to implement signed
/// integer division by a power of 2. The first operand is the dividend,		/// integer division by a power of 2. The first operand is the dividend,
		iterateeUnsubmitted Not Done Reply Inline Actions "For vector types, only the last n bits are used." iteratee: "For vector types, only the last n bits are used."
/// and the second is the constant shift amount (representing the		/// and the second is the constant shift amount (representing the
/// divisor).		/// divisor).
SRA_ADDZE,		SRA_ADDZE,

/// CALL - A direct function call.		/// CALL - A direct function call.
/// CALL_NOP is a call with the special NOP which follows 64-bit		/// CALL_NOP is a call with the special NOP which follows 64-bit
/// SVR4 calls.		/// SVR4 calls.
CALL, CALL_NOP,		CALL, CALL_NOP,
▲ Show 20 Lines • Show All 859 Lines • ▼ Show 20 Lines	private:

SDValue lowerEH_SJLJ_SETJMP(SDValue Op, SelectionDAG &DAG) const;		SDValue lowerEH_SJLJ_SETJMP(SDValue Op, SelectionDAG &DAG) const;
SDValue lowerEH_SJLJ_LONGJMP(SDValue Op, SelectionDAG &DAG) const;		SDValue lowerEH_SJLJ_LONGJMP(SDValue Op, SelectionDAG &DAG) const;

SDValue DAGCombineExtBoolTrunc(SDNode *N, DAGCombinerInfo &DCI) const;		SDValue DAGCombineExtBoolTrunc(SDNode *N, DAGCombinerInfo &DCI) const;
SDValue DAGCombineBuildVector(SDNode *N, DAGCombinerInfo &DCI) const;		SDValue DAGCombineBuildVector(SDNode *N, DAGCombinerInfo &DCI) const;
SDValue DAGCombineTruncBoolExt(SDNode *N, DAGCombinerInfo &DCI) const;		SDValue DAGCombineTruncBoolExt(SDNode *N, DAGCombinerInfo &DCI) const;
SDValue combineFPToIntToFP(SDNode *N, DAGCombinerInfo &DCI) const;		SDValue combineFPToIntToFP(SDNode *N, DAGCombinerInfo &DCI) const;
		SDValue combineSHL(SDNode *N, DAGCombinerInfo &DCI) const;
		SDValue combineSRA(SDNode *N, DAGCombinerInfo &DCI) const;
		SDValue combineSRL(SDNode *N, DAGCombinerInfo &DCI) const;

/// ConvertSETCCToSubtract - looks at SETCC that compares ints. It replaces		/// ConvertSETCCToSubtract - looks at SETCC that compares ints. It replaces
/// SETCC with integer subtraction when (1) there is a legal way of doing it		/// SETCC with integer subtraction when (1) there is a legal way of doing it
/// (2) keeping the result of comparison in GPR has performance benefit.		/// (2) keeping the result of comparison in GPR has performance benefit.
SDValue ConvertSETCCToSubtract(SDNode *N, DAGCombinerInfo &DCI) const;		SDValue ConvertSETCCToSubtract(SDNode *N, DAGCombinerInfo &DCI) const;

SDValue getSqrtEstimate(SDValue Operand, SelectionDAG &DAG, int Enabled,		SDValue getSqrtEstimate(SDValue Operand, SelectionDAG &DAG, int Enabled,
int &RefinementSteps, bool &UseOneConstNR,		int &RefinementSteps, bool &UseOneConstNR,
bool Reciprocal) const override;		bool Reciprocal) const override;
SDValue getRecipEstimate(SDValue Operand, SelectionDAG &DAG, int Enabled,		SDValue getRecipEstimate(SDValue Operand, SelectionDAG &DAG, int Enabled,
int &RefinementSteps) const override;		int &RefinementSteps) const override;
unsigned combineRepeatedFPDivisors() const override;		unsigned combineRepeatedFPDivisors() const override;

CCAssignFn *useFastISelCCs(unsigned Flag) const;		CCAssignFn *useFastISelCCs(unsigned Flag) const;

SDValue		SDValue
combineElementTruncationToVectorTruncation(SDNode *N,		combineElementTruncationToVectorTruncation(SDNode *N,
DAGCombinerInfo &DCI) const;		DAGCombinerInfo &DCI) const;

// PowerPC override of the modulo-shift query: only vector result types are
// reported as having modulo-shift behaviour.
//
// Inst must be ISD::SHL, ISD::SRA or ISD::SRL, and the operation must be
// legal for ReturnType; both preconditions are checked by asserts.
bool supportsModuloShift(ISD::NodeType Inst,
                         EVT ReturnType) const override {
  assert((Inst == ISD::SHL || Inst == ISD::SRA || Inst == ISD::SRL) &&
         "Expect a shift instruction");
  assert(isOperationLegal(Inst, ReturnType) &&
         "Expect a legal shift operation");
  return ReturnType.isVector();
}
};		};

namespace PPC {		namespace PPC {

FastISel *createFastISel(FunctionLoweringInfo &FuncInfo,		FastISel *createFastISel(FunctionLoweringInfo &FuncInfo,
const TargetLibraryInfo *LibInfo);		const TargetLibraryInfo *LibInfo);

} // end namespace PPC		} // end namespace PPC
Show All 28 Lines

llvm/lib/Target/PowerPC/PPCISelLowering.cpp

This file is larger than 256 KB, so syntax highlighting is disabled by default.

Show First 20 Lines • Show All 917 Lines • ▼ Show 20 Lines	if (!isPPC64) {
setLibcallName(RTLIB::SHL_I128, nullptr);		setLibcallName(RTLIB::SHL_I128, nullptr);
setLibcallName(RTLIB::SRL_I128, nullptr);		setLibcallName(RTLIB::SRL_I128, nullptr);
setLibcallName(RTLIB::SRA_I128, nullptr);		setLibcallName(RTLIB::SRA_I128, nullptr);
}		}

setStackPointerRegisterToSaveRestore(isPPC64 ? PPC::X1 : PPC::R1);		setStackPointerRegisterToSaveRestore(isPPC64 ? PPC::X1 : PPC::R1);

// We have target-specific dag combine patterns for the following nodes:		// We have target-specific dag combine patterns for the following nodes:
		setTargetDAGCombine(ISD::SHL);
		setTargetDAGCombine(ISD::SRA);
		setTargetDAGCombine(ISD::SRL);
setTargetDAGCombine(ISD::SINT_TO_FP);		setTargetDAGCombine(ISD::SINT_TO_FP);
setTargetDAGCombine(ISD::BUILD_VECTOR);		setTargetDAGCombine(ISD::BUILD_VECTOR);
if (Subtarget.hasFPCVT())		if (Subtarget.hasFPCVT())
setTargetDAGCombine(ISD::UINT_TO_FP);		setTargetDAGCombine(ISD::UINT_TO_FP);
setTargetDAGCombine(ISD::LOAD);		setTargetDAGCombine(ISD::LOAD);
setTargetDAGCombine(ISD::STORE);		setTargetDAGCombine(ISD::STORE);
setTargetDAGCombine(ISD::BR_CC);		setTargetDAGCombine(ISD::BR_CC);
if (Subtarget.useCRBits())		if (Subtarget.useCRBits())
▲ Show 20 Lines • Show All 10,373 Lines • ▼ Show 20 Lines
}		}

SDValue PPCTargetLowering::PerformDAGCombine(SDNode *N,		SDValue PPCTargetLowering::PerformDAGCombine(SDNode *N,
DAGCombinerInfo &DCI) const {		DAGCombinerInfo &DCI) const {
SelectionDAG &DAG = DCI.DAG;		SelectionDAG &DAG = DCI.DAG;
SDLoc dl(N);		SDLoc dl(N);
switch (N->getOpcode()) {		switch (N->getOpcode()) {
default: break;		default: break;
		case ISD::SHL:
		return combineSHL(N, DCI);
		case ISD::SRA:
		return combineSRA(N, DCI);
		case ISD::SRL:
		return combineSRL(N, DCI);
case PPCISD::SHL:		case PPCISD::SHL:
if (isNullConstant(N->getOperand(0))) // 0 << V -> 0.		if (isNullConstant(N->getOperand(0))) // 0 << V -> 0.
return N->getOperand(0);		return N->getOperand(0);
break;		break;
case PPCISD::SRL:		case PPCISD::SRL:
if (isNullConstant(N->getOperand(0))) // 0 >>u V -> 0.		if (isNullConstant(N->getOperand(0))) // 0 >>u V -> 0.
return N->getOperand(0);		return N->getOperand(0);
break;		break;
▲ Show 20 Lines • Show All 1,616 Lines • ▼ Show 20 Lines	default:
// false. Examples: f16, f80.		// false. Examples: f16, f80.
return false;		return false;
case MVT::f32:		case MVT::f32:
case MVT::f64:		case MVT::f64:
case MVT::ppcf128:		case MVT::ppcf128:
return Imm.isPosZero();		return Imm.isPosZero();
}		}
}		}

		// For shift operation op, if it's a vector operation,
		iterateeUnsubmitted Not Done Reply Inline Actions That's a typo. iteratee: That's a typo.
		// fold (op x, (and y, (numbits(x) - 1))) -> (target op x, y)
		static SDValue stripModuloOnShift(const TargetLowering &TLI, SDNode *N,
		                                  SelectionDAG &DAG) {
		  // Translate the generic shift opcode into its PPCISD counterpart; any
		  // other opcode reaching this helper is a caller bug.
		  const unsigned GenericOpc = N->getOpcode();
		  unsigned PPCOpc;
		  switch (GenericOpc) {
		  case ISD::SHL:
		    PPCOpc = PPCISD::SHL;
		    break;
		  case ISD::SRL:
		    PPCOpc = PPCISD::SRL;
		    break;
		  case ISD::SRA:
		    PPCOpc = PPCISD::SRA;
		    break;
		  default:
		    llvm_unreachable("Unexpected shift operation");
		  }

		  SDValue ShiftedVal = N->getOperand(0);
		  SDValue ShiftAmt = N->getOperand(1);
		  EVT ValTy = ShiftedVal.getValueType();
		  const unsigned EltBits = ValTy.getScalarSizeInBits();

		  // Only legal vector shifts whose amount is produced by an AND qualify.
		  if (!ValTy.isVector() || !TLI.isOperationLegal(GenericOpc, ValTy) ||
		      ShiftAmt->getOpcode() != ISD::AND)
		    return SDValue();

		  // The AND's second operand must be a constant (or constant splat) ...
		  ConstantSDNode *SplatMask = isConstOrConstSplat(ShiftAmt->getOperand(1));
		  if (!SplatMask)
		    return SDValue();

		  // ... equal to the element width minus one.
		  if (SplatMask->getZExtValue() != EltBits - 1)
		    return SDValue();

		  // Drop the AND and shift by its first operand using the target node.
		  return DAG.getNode(PPCOpc, SDLoc(N), ValTy, ShiftedVal,
		                     ShiftAmt->getOperand(0));
		}

		// Target DAG combine for ISD::SHL. The only rewrite attempted is
		// stripModuloOnShift; its result (an empty SDValue when nothing matched)
		// is handed back unchanged.
		SDValue PPCTargetLowering::combineSHL(SDNode *N, DAGCombinerInfo &DCI) const {
		  return stripModuloOnShift(*this, N, DCI.DAG);
		}

		// Target DAG combine for ISD::SRA. The only rewrite attempted is
		// stripModuloOnShift; its result (an empty SDValue when nothing matched)
		// is handed back unchanged.
		SDValue PPCTargetLowering::combineSRA(SDNode *N, DAGCombinerInfo &DCI) const {
		  return stripModuloOnShift(*this, N, DCI.DAG);
		}

		// Target DAG combine for ISD::SRL: try stripModuloOnShift and return its
		// replacement node if it produced one.
		SDValue PPCTargetLowering::combineSRL(SDNode *N, DAGCombinerInfo &DCI) const {
		if (auto Value = stripModuloOnShift(*this, N, DCI.DAG))
		efriedmaUnsubmitted Done Reply Inline Actions Duplicated code; can you refactor these? efriedma: Duplicated code; can you refactor these?
		return Value;

		// No combine applied; an empty SDValue signals "no change".
		return SDValue();
		}

llvm/lib/Target/PowerPC/PPCInstrAltivec.td

Show First 20 Lines • Show All 981 Lines • ▼ Show 20 Lines

// Vector shifts		// Vector shifts
def : Pat<(v16i8 (shl v16i8:$vA, v16i8:$vB)),		def : Pat<(v16i8 (shl v16i8:$vA, v16i8:$vB)),
(v16i8 (VSLB $vA, $vB))>;		(v16i8 (VSLB $vA, $vB))>;
def : Pat<(v8i16 (shl v8i16:$vA, v8i16:$vB)),		def : Pat<(v8i16 (shl v8i16:$vA, v8i16:$vB)),
(v8i16 (VSLH $vA, $vB))>;		(v8i16 (VSLH $vA, $vB))>;
def : Pat<(v4i32 (shl v4i32:$vA, v4i32:$vB)),		def : Pat<(v4i32 (shl v4i32:$vA, v4i32:$vB)),
(v4i32 (VSLW $vA, $vB))>;		(v4i32 (VSLW $vA, $vB))>;
		def : Pat<(v16i8 (PPCshl v16i8:$vA, v16i8:$vB)),
		iterateeUnsubmitted Not Done Reply Inline Actions Can these patterns go in a separate patch? They only seem partially related. iteratee: Can these patterns go in a separate patch? They only seem partially related.
		timshenAuthorUnsubmitted Not Done Reply Inline Actions They can, the problem is that there is no way to test that patch, since no one generates PPCshl on vector until this patch. Do you think it'd be ok to have a separate patch being unable to test? timshen: They can, the problem is that there is no way to test that patch, since no one generates PPCshl…
		iterateeUnsubmitted Not Done Reply Inline Actions If you add the patterns, they should be generated. That was what happened when I added the vector shift patterns for v1i128 iteratee: If you add the patterns, they should be generated. That was what happened when I added the…
		timshenAuthorUnsubmitted Not Done Reply Inline Actions The patterns will be generated, but they will match nothing at the time (therefore not easy to test). This is because no one generate the SDNodes "PPCshl", aka PPCISD::SHL, for vector operations, without the changes in stripModuloOnShift(). timshen: The patterns will be generated, but they will match nothing at the time (therefore not easy to…
		iterateeUnsubmitted Not Done Reply Inline Actions OK, why do you need a separate node for shift? iteratee: OK, why do you need a separate node for shift?
		timshenAuthorUnsubmitted Not Done Reply Inline Actions It already exists for scalar types. I simply extend it for vector types as well. They are different because shl (ISD::SHL) has UB, but PPCshl (PPCISD::SHL) doesn't. For example, (shl (i32 a), b) is UB when b >= 32. (PPCshl (i32 a), b), however, performs a << (b % 32) on vector types, as the instructions do too. See discussion here: http://lists.llvm.org/pipermail/llvm-commits/Week-of-Mon-20170508/452111.html timshen: 1) It already exists for scalar types. I simply extend it for vector types as well. 2) They are…
		iterateeUnsubmitted Not Done Reply Inline Actions OK, I get why you're doing it in dagcombiner, but why can't you just produce the instructions directly? Why do you need the intermediate nodes? iteratee: OK, I get why you're doing it in dagcombiner, but why can't you just produce the instructions…
		timshenAuthorUnsubmitted Not Done Reply Inline Actions Because I don't want to manually lower it to 8 * 2 = 16 instructions in C++ code. I prefer to write .td patterns for that. Without PPCISD::SHL I either write C++, or write pattern to match ISD::SHL. But ISD::SHL doesn't have the semantic we want. timshen: Because I don't want to manually lower it to 8 * 2 = 16 instructions in C++ code. I prefer to…
		iterateeUnsubmitted Not Done Reply Inline Actions OK. I get the reasoning behind delaying the output. iteratee: OK. I get the reasoning behind delaying the output.
		(v16i8 (VSLB $vA, $vB))>;
		def : Pat<(v8i16 (PPCshl v8i16:$vA, v8i16:$vB)),
		(v8i16 (VSLH $vA, $vB))>;
		def : Pat<(v4i32 (PPCshl v4i32:$vA, v4i32:$vB)),
		(v4i32 (VSLW $vA, $vB))>;

def : Pat<(v16i8 (srl v16i8:$vA, v16i8:$vB)),		def : Pat<(v16i8 (srl v16i8:$vA, v16i8:$vB)),
(v16i8 (VSRB $vA, $vB))>;		(v16i8 (VSRB $vA, $vB))>;
def : Pat<(v8i16 (srl v8i16:$vA, v8i16:$vB)),		def : Pat<(v8i16 (srl v8i16:$vA, v8i16:$vB)),
(v8i16 (VSRH $vA, $vB))>;		(v8i16 (VSRH $vA, $vB))>;
def : Pat<(v4i32 (srl v4i32:$vA, v4i32:$vB)),		def : Pat<(v4i32 (srl v4i32:$vA, v4i32:$vB)),
(v4i32 (VSRW $vA, $vB))>;		(v4i32 (VSRW $vA, $vB))>;
		// PPCsrl forms of the v16i8/v8i16/v4i32 logical right shifts. They select
		// the same VSRB/VSRH/VSRW instructions as the generic srl patterns.
		def : Pat<(v16i8 (PPCsrl v16i8:$vA, v16i8:$vB)),
		(v16i8 (VSRB $vA, $vB))>;
		def : Pat<(v8i16 (PPCsrl v8i16:$vA, v8i16:$vB)),
		(v8i16 (VSRH $vA, $vB))>;
		def : Pat<(v4i32 (PPCsrl v4i32:$vA, v4i32:$vB)),
		(v4i32 (VSRW $vA, $vB))>;

def : Pat<(v16i8 (sra v16i8:$vA, v16i8:$vB)),		def : Pat<(v16i8 (sra v16i8:$vA, v16i8:$vB)),
(v16i8 (VSRAB $vA, $vB))>;		(v16i8 (VSRAB $vA, $vB))>;
def : Pat<(v8i16 (sra v8i16:$vA, v8i16:$vB)),		def : Pat<(v8i16 (sra v8i16:$vA, v8i16:$vB)),
(v8i16 (VSRAH $vA, $vB))>;		(v8i16 (VSRAH $vA, $vB))>;
def : Pat<(v4i32 (sra v4i32:$vA, v4i32:$vB)),		def : Pat<(v4i32 (sra v4i32:$vA, v4i32:$vB)),
(v4i32 (VSRAW $vA, $vB))>;		(v4i32 (VSRAW $vA, $vB))>;
		// PPCsra forms of the v16i8/v8i16/v4i32 arithmetic right shifts. They
		// select the same VSRAB/VSRAH/VSRAW instructions as the generic sra
		// patterns.
		def : Pat<(v16i8 (PPCsra v16i8:$vA, v16i8:$vB)),
		(v16i8 (VSRAB $vA, $vB))>;
		def : Pat<(v8i16 (PPCsra v8i16:$vA, v8i16:$vB)),
		(v8i16 (VSRAH $vA, $vB))>;
		def : Pat<(v4i32 (PPCsra v4i32:$vA, v4i32:$vB)),
		(v4i32 (VSRAW $vA, $vB))>;

// Float to integer and integer to float conversions		// Float to integer and integer to float conversions
def : Pat<(v4i32 (fp_to_sint v4f32:$vA)),		def : Pat<(v4i32 (fp_to_sint v4f32:$vA)),
(VCTSXS_0 $vA)>;		(VCTSXS_0 $vA)>;
def : Pat<(v4i32 (fp_to_uint v4f32:$vA)),		def : Pat<(v4i32 (fp_to_uint v4f32:$vA)),
(VCTUXS_0 $vA)>;		(VCTUXS_0 $vA)>;
def : Pat<(v4f32 (sint_to_fp v4i32:$vA)),		def : Pat<(v4f32 (sint_to_fp v4i32:$vA)),
(VCFSX_0 $vA)>;		(VCFSX_0 $vA)>;
▲ Show 20 Lines • Show All 55 Lines • ▼ Show 20 Lines	def:Pat<(vmrgew_swapped_shuffle v16i8:$vA, v16i8:$vB),
(VMRGEW $vB, $vA)>;		(VMRGEW $vB, $vA)>;
def:Pat<(vmrgow_swapped_shuffle v16i8:$vA, v16i8:$vB),		def:Pat<(vmrgow_swapped_shuffle v16i8:$vA, v16i8:$vB),
(VMRGOW $vB, $vA)>;		(VMRGOW $vB, $vA)>;


// Vector shifts		// Vector shifts
def VRLD : VX1_Int_Ty<196, "vrld", int_ppc_altivec_vrld, v2i64>;		def VRLD : VX1_Int_Ty<196, "vrld", int_ppc_altivec_vrld, v2i64>;
def VSLD : VXForm_1<1476, (outs vrrc:$vD), (ins vrrc:$vA, vrrc:$vB),		def VSLD : VXForm_1<1476, (outs vrrc:$vD), (ins vrrc:$vA, vrrc:$vB),
"vsld $vD, $vA, $vB", IIC_VecGeneral,		"vsld $vD, $vA, $vB", IIC_VecGeneral, []>;
[(set v2i64:$vD, (shl v2i64:$vA, v2i64:$vB))]>;
def VSRD : VXForm_1<1732, (outs vrrc:$vD), (ins vrrc:$vA, vrrc:$vB),		def VSRD : VXForm_1<1732, (outs vrrc:$vD), (ins vrrc:$vA, vrrc:$vB),
"vsrd $vD, $vA, $vB", IIC_VecGeneral,		"vsrd $vD, $vA, $vB", IIC_VecGeneral, []>;
[(set v2i64:$vD, (srl v2i64:$vA, v2i64:$vB))]>;
def VSRAD : VXForm_1<964, (outs vrrc:$vD), (ins vrrc:$vA, vrrc:$vB),		def VSRAD : VXForm_1<964, (outs vrrc:$vD), (ins vrrc:$vA, vrrc:$vB),
"vsrad $vD, $vA, $vB", IIC_VecGeneral,		"vsrad $vD, $vA, $vB", IIC_VecGeneral, []>;
[(set v2i64:$vD, (sra v2i64:$vA, v2i64:$vB))]>;
		def : Pat<(v2i64 (shl v2i64:$vA, v2i64:$vB)),
		iterateeUnsubmitted Not Done Reply Inline Actions Minor point, the patterns above are grouped by type and then by PPCxxx vs xxx Can you group these the same? iteratee: Minor point, the patterns above are grouped by type and then by PPCxxx vs xxx Can you group…
		timshenAuthorUnsubmitted Not Done Reply Inline Actions Actually this is consistent - the ordering is (operation, PPC or not, types). timshen: Actually this is consistent - the ordering is (operation, PPC or not, types).
		(v2i64 (VSLD $vA, $vB))>;
		def : Pat<(v2i64 (PPCshl v2i64:$vA, v2i64:$vB)),
		(v2i64 (VSLD $vA, $vB))>;
		def : Pat<(v2i64 (srl v2i64:$vA, v2i64:$vB)),
		(v2i64 (VSRD $vA, $vB))>;
		def : Pat<(v2i64 (PPCsrl v2i64:$vA, v2i64:$vB)),
		(v2i64 (VSRD $vA, $vB))>;
		def : Pat<(v2i64 (sra v2i64:$vA, v2i64:$vB)),
		(v2i64 (VSRAD $vA, $vB))>;
		def : Pat<(v2i64 (PPCsra v2i64:$vA, v2i64:$vB)),
		(v2i64 (VSRAD $vA, $vB))>;

// Vector Integer Arithmetic Instructions		// Vector Integer Arithmetic Instructions
let isCommutable = 1 in {		let isCommutable = 1 in {
def VADDUDM : VXForm_1<192, (outs vrrc:$vD), (ins vrrc:$vA, vrrc:$vB),		def VADDUDM : VXForm_1<192, (outs vrrc:$vD), (ins vrrc:$vA, vrrc:$vB),
"vaddudm $vD, $vA, $vB", IIC_VecGeneral,		"vaddudm $vD, $vA, $vB", IIC_VecGeneral,
[(set v2i64:$vD, (add v2i64:$vA, v2i64:$vB))]>;		[(set v2i64:$vD, (add v2i64:$vA, v2i64:$vB))]>;
def VADDUQM : VXForm_1<256, (outs vrrc:$vD), (ins vrrc:$vA, vrrc:$vB),		def VADDUQM : VXForm_1<256, (outs vrrc:$vD), (ins vrrc:$vA, vrrc:$vB),
"vadduqm $vD, $vA, $vB", IIC_VecGeneral,		"vadduqm $vD, $vA, $vB", IIC_VecGeneral,
▲ Show 20 Lines • Show All 365 Lines • Show Last 20 Lines

This is an archive of the discontinued LLVM Phabricator instance.

[PPC] Move the combine "a << (b % (sizeof(a) * 8)) -> (PPCshl a, b)" to the backend. NFC.
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 98548

llvm/include/llvm/Target/TargetLowering.h

llvm/lib/CodeGen/SelectionDAG/DAGCombiner.cpp

llvm/lib/Target/PowerPC/PPCISelLowering.h

llvm/lib/Target/PowerPC/PPCISelLowering.cpp

llvm/lib/Target/PowerPC/PPCInstrAltivec.td

This is an archive of the discontinued LLVM Phabricator instance.

[PPC] Move the combine "a << (b % (sizeof(a) * 8)) -> (PPCshl a, b)" to the backend. NFC.ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 98548

llvm/include/llvm/Target/TargetLowering.h

llvm/lib/CodeGen/SelectionDAG/DAGCombiner.cpp

llvm/lib/Target/PowerPC/PPCISelLowering.h

llvm/lib/Target/PowerPC/PPCISelLowering.cpp

llvm/lib/Target/PowerPC/PPCInstrAltivec.td

[PPC] Move the combine "a << (b % (sizeof(a) * 8)) -> (PPCshl a, b)" to the backend. NFC.
ClosedPublic