Diff 549950

llvm/lib/Transforms/InstCombine/InstructionCombining.cpp

Show First 20 Lines • Show All 745 Lines • ▼ Show 20 Lines
// -> (logic_shift (Binop1 (Binop2 X, inv_logic_shift(C1, C)), Y), C)		// -> (logic_shift (Binop1 (Binop2 X, inv_logic_shift(C1, C)), Y), C)
//		//
// (Binop1 (Binop2 (logic_shift X, Amt), Mask), (logic_shift Y, Amt))		// (Binop1 (Binop2 (logic_shift X, Amt), Mask), (logic_shift Y, Amt))
// IFF		// IFF
// 1) the logic_shifts match		// 1) the logic_shifts match
// 2) BinOp1 == BinOp2 (if BinOp == `add`, then also requires `shl`).		// 2) BinOp1 == BinOp2 (if BinOp == `add`, then also requires `shl`).
//		//
// -> (BinOp (logic_shift (BinOp X, Y)), Mask)		// -> (BinOp (logic_shift (BinOp X, Y)), Mask)
		//
		// (Binop1 (Binop2 (arithmetic_shift X, Amt), Mask), (arithmetic_shift Y, Amt))
		// IFF
		// 1) Binop1 is bitwise logical operator `and`, `or` or `xor`
		nikicUnsubmitted Done Reply Inline Actions There's just one kind of arithmetic shift, so it can't not match. nikic: There's just one kind of arithmetic shift, so it can't not match.
		// 2) Binop2 is `not`
		//
		// -> (arithmetic_shift Binop1((not X), Y), Amt)

Instruction *InstCombinerImpl::foldBinOpShiftWithShift(BinaryOperator &I) {		Instruction *InstCombinerImpl::foldBinOpShiftWithShift(BinaryOperator &I) {
auto IsValidBinOpc = [](unsigned Opc) {		auto IsValidBinOpc = [](unsigned Opc) {
switch (Opc) {		switch (Opc) {
default:		default:
return false;		return false;
case Instruction::And:		case Instruction::And:
case Instruction::Or:		case Instruction::Or:
case Instruction::Xor:		case Instruction::Xor:
case Instruction::Add:		case Instruction::Add:
// Skip Sub as we only match constant masks which will canonicalize to use		// Skip Sub as we only match constant masks which will canonicalize to use
// add.		// add.
return true;		return true;
}		}
};		};

// Check if we can distribute binop arbitrarily. `add` + `lshr` has extra		// Check if we can distribute binop arbitrarily. `add` + `lshr` has extra
// constraints.		// constraints.
auto IsCompletelyDistributable = [](unsigned BinOpc1, unsigned BinOpc2,		auto IsCompletelyDistributable = [](unsigned BinOpc1, unsigned BinOpc2,
unsigned ShOpc) {		unsigned ShOpc) {
		assert(ShOpc != Instruction::AShr);
return (BinOpc1 != Instruction::Add && BinOpc2 != Instruction::Add) \|\|		return (BinOpc1 != Instruction::Add && BinOpc2 != Instruction::Add) \|\|
ShOpc == Instruction::Shl;		ShOpc == Instruction::Shl;
		goldstein.w.nUnsubmitted Done Reply Inline Actions Also assert in here. goldstein.w.n: Also assert in here.
};		};

auto GetInvShift = [](unsigned ShOpc) {		auto GetInvShift = [](unsigned ShOpc) {
		assert(ShOpc != Instruction::AShr);
return ShOpc == Instruction::LShr ? Instruction::Shl : Instruction::LShr;		return ShOpc == Instruction::LShr ? Instruction::Shl : Instruction::LShr;
		goldstein.w.nUnsubmitted Done Reply Inline Actions Can you add assert `ShOpc != Instruction::AShr` here. Your code is fine in that regard, but now that the match logic supports `AShr` while much of the existing logic doesn't, I think we should have a fail-loudly check in case someone updates this in the future. goldstein.w.n: Can you add assert `ShOpc != Instruction::AShr` here. Your code is fine in that regard, but now…
};		};

auto CanDistributeBinops = [&](unsigned BinOpc1, unsigned BinOpc2,		auto CanDistributeBinops = [&](unsigned BinOpc1, unsigned BinOpc2,
unsigned ShOpc, Constant *CMask,		unsigned ShOpc, Constant *CMask,
Constant *CShift) {		Constant *CShift) {
// If the BinOp1 is `and` we don't need to check the mask.		// If the BinOp1 is `and` we don't need to check the mask.
if (BinOpc1 == Instruction::And)		if (BinOpc1 == Instruction::And)
return true;		return true;
Show All 15 Lines	return ConstantExpr::get(
ShOpc, ConstantExpr::get(GetInvShift(ShOpc), CMask, CShift),		ShOpc, ConstantExpr::get(GetInvShift(ShOpc), CMask, CShift),
CShift) == CMask;		CShift) == CMask;
};		};

auto MatchBinOp = [&](unsigned ShOpnum) -> Instruction * {		auto MatchBinOp = [&](unsigned ShOpnum) -> Instruction * {
Constant CMask, CShift;		Constant CMask, CShift;
Value X, Y, ShiftedX, Mask, *Shift;		Value X, Y, ShiftedX, Mask, *Shift;
if (!match(I.getOperand(ShOpnum),		if (!match(I.getOperand(ShOpnum),
m_OneUse(m_LogicalShift(m_Value(Y), m_Value(Shift)))))		m_OneUse(m_Shift(m_Value(Y), m_Value(Shift)))))
return nullptr;		return nullptr;
if (!match(I.getOperand(1 - ShOpnum),		if (!match(I.getOperand(1 - ShOpnum),
m_BinOp(m_Value(ShiftedX), m_Value(Mask))))		m_BinOp(m_Value(ShiftedX), m_Value(Mask))))
return nullptr;		return nullptr;

if (!match(ShiftedX,		if (!match(ShiftedX, m_OneUse(m_Shift(m_Value(X), m_Specific(Shift)))))
m_OneUse(m_LogicalShift(m_Value(X), m_Specific(Shift)))))
return nullptr;		return nullptr;

// Make sure we are matching instruction shifts and not ConstantExpr		// Make sure we are matching instruction shifts and not ConstantExpr
auto *IY = dyn_cast<Instruction>(I.getOperand(ShOpnum));		auto *IY = dyn_cast<Instruction>(I.getOperand(ShOpnum));
auto *IX = dyn_cast<Instruction>(ShiftedX);		auto *IX = dyn_cast<Instruction>(ShiftedX);
if (!IY \|\| !IX)		if (!IY \|\| !IX)
return nullptr;		return nullptr;

// LHS and RHS need same shift opcode		// LHS and RHS need same shift opcode
unsigned ShOpc = IY->getOpcode();		unsigned ShOpc = IY->getOpcode();
if (ShOpc != IX->getOpcode())		if (ShOpc != IX->getOpcode())
return nullptr;		return nullptr;

// Make sure binop is real instruction and not ConstantExpr		// Make sure binop is real instruction and not ConstantExpr
auto *BO2 = dyn_cast<Instruction>(I.getOperand(1 - ShOpnum));		auto *BO2 = dyn_cast<Instruction>(I.getOperand(1 - ShOpnum));
if (!BO2)		if (!BO2)
return nullptr;		return nullptr;

unsigned BinOpc = BO2->getOpcode();		unsigned BinOpc = BO2->getOpcode();
// Make sure we have valid binops.		// Make sure we have valid binops.
if (!IsValidBinOpc(I.getOpcode()) \|\| !IsValidBinOpc(BinOpc))		if (!IsValidBinOpc(I.getOpcode()) \|\| !IsValidBinOpc(BinOpc))
return nullptr;		return nullptr;

		if (ShOpc == Instruction::AShr) {
		if (Instruction::isBitwiseLogicOp(I.getOpcode()) &&
		BinOpc == Instruction::Xor && match(Mask, m_AllOnes())) {
		Value *NotX = Builder.CreateNot(X);
		Value *NewBinOp = Builder.CreateBinOp(I.getOpcode(), Y, NotX);
		nikicUnsubmitted Done Reply Inline Actions Maybe `match(Mask, m_AllOnes())` and leave CMask alone? This will also match splat vectors with undef values, so we'd need a test for that. nikic: Maybe `match(Mask, m_AllOnes())` and leave CMask alone? This will also match splat vectors with…
		return BinaryOperator::Create(
		static_cast<Instruction::BinaryOps>(ShOpc), NewBinOp, Shift);
		nikicUnsubmitted Done Reply Inline Actions Might as well `CreateNot`? nikic: Might as well `CreateNot`?
		}

		nikicUnsubmitted Done Reply Inline Actions Cast shouldn't be needed. nikic: Cast shouldn't be needed.
		return nullptr;
		}

// If BinOp1 == BinOp2 and it's bitwise or shl with add, then just		// If BinOp1 == BinOp2 and it's bitwise or shl with add, then just
// distribute to drop the shift irrelevant of constants.		// distribute to drop the shift irrelevant of constants.
if (BinOpc == I.getOpcode() &&		if (BinOpc == I.getOpcode() &&
IsCompletelyDistributable(I.getOpcode(), BinOpc, ShOpc)) {		IsCompletelyDistributable(I.getOpcode(), BinOpc, ShOpc)) {
Value *NewBinOp2 = Builder.CreateBinOp(I.getOpcode(), X, Y);		Value *NewBinOp2 = Builder.CreateBinOp(I.getOpcode(), X, Y);
Value *NewBinOp1 = Builder.CreateBinOp(		Value *NewBinOp1 = Builder.CreateBinOp(
static_cast<Instruction::BinaryOps>(ShOpc), NewBinOp2, Shift);		static_cast<Instruction::BinaryOps>(ShOpc), NewBinOp2, Shift);
return BinaryOperator::Create(I.getOpcode(), NewBinOp1, Mask);		return BinaryOperator::Create(I.getOpcode(), NewBinOp1, Mask);
▲ Show 20 Lines • Show All 130 Lines • ▼ Show 20 Lines
/// distributes over either by factorizing out common terms		/// distributes over either by factorizing out common terms
/// (eg "(AB)+(AC)" -> "A*(B+C)") or expanding out if this results in		/// (eg "(AB)+(AC)" -> "A*(B+C)") or expanding out if this results in
/// simplifications (eg: "A & (B \| C) -> (A&B) \| (A&C)" if this is a win).		/// simplifications (eg: "A & (B \| C) -> (A&B) \| (A&C)" if this is a win).
/// Returns the simplified value, or null if it didn't simplify.		/// Returns the simplified value, or null if it didn't simplify.
Value *InstCombinerImpl::foldUsingDistributiveLaws(BinaryOperator &I) {		Value *InstCombinerImpl::foldUsingDistributiveLaws(BinaryOperator &I) {
Value LHS = I.getOperand(0), RHS = I.getOperand(1);		Value LHS = I.getOperand(0), RHS = I.getOperand(1);
BinaryOperator *Op0 = dyn_cast<BinaryOperator>(LHS);		BinaryOperator *Op0 = dyn_cast<BinaryOperator>(LHS);
BinaryOperator *Op1 = dyn_cast<BinaryOperator>(RHS);		BinaryOperator *Op1 = dyn_cast<BinaryOperator>(RHS);
Instruction::BinaryOps TopLevelOpcode = I.getOpcode();		Instruction::BinaryOps TopLevelOpcode = I.getOpcode();
		goldstein.w.nUnsubmitted Done Reply Inline Actions IMO the LHS/RHS logic is similar enough that it should be a lambda. Will make the code a lot cleaner. goldstein.w.n: IMO the LHS/RHS logic is similar enough that it should be a lambda. Will make the code a lot…

// Factorization.		// Factorization.
if (Value *R = tryFactorizationFolds(I))		if (Value *R = tryFactorizationFolds(I))
return R;		return R;

// Expansion.		// Expansion.
if (Op0 && rightDistributesOverLeft(Op0->getOpcode(), TopLevelOpcode)) {		if (Op0 && rightDistributesOverLeft(Op0->getOpcode(), TopLevelOpcode)) {
// The instruction has the form "(A op' B) op C". See if expanding it out		// The instruction has the form "(A op' B) op C". See if expanding it out
// to "(A op C) op' (B op C)" results in simplifications.		// to "(A op C) op' (B op C)" results in simplifications.
Value A = Op0->getOperand(0), B = Op0->getOperand(1), *C = RHS;		Value A = Op0->getOperand(0), B = Op0->getOperand(1), *C = RHS;
Instruction::BinaryOps InnerOpcode = Op0->getOpcode(); // op'		Instruction::BinaryOps InnerOpcode = Op0->getOpcode(); // op'

// Disable the use of undef because it's not safe to distribute undef.		// Disable the use of undef because it's not safe to distribute undef.
auto SQDistributive = SQ.getWithInstruction(&I).getWithoutUndef();		auto SQDistributive = SQ.getWithInstruction(&I).getWithoutUndef();
		goldstein.w.nUnsubmitted Done Reply Inline Actions This codeblock needs some comments. goldstein.w.n: This codeblock needs some comments.
Value *L = simplifyBinOp(TopLevelOpcode, A, C, SQDistributive);		Value *L = simplifyBinOp(TopLevelOpcode, A, C, SQDistributive);
Value *R = simplifyBinOp(TopLevelOpcode, B, C, SQDistributive);		Value *R = simplifyBinOp(TopLevelOpcode, B, C, SQDistributive);

// Do "A op C" and "B op C" both simplify?		// Do "A op C" and "B op C" both simplify?
if (L && R) {		if (L && R) {
// They do! Return "L op' R".		// They do! Return "L op' R".
++NumExpand;		++NumExpand;
C = Builder.CreateBinOp(InnerOpcode, L, R);		C = Builder.CreateBinOp(InnerOpcode, L, R);
▲ Show 20 Lines • Show All 3,468 Lines • Show Last 20 Lines

llvm/test/Transforms/InstCombine/binop-and-shifts.ll

Show First 20 Lines • Show All 548 Lines • ▼ Show 20 Lines	;
%bw1 = and i8 %shift1, %bw2		%bw1 = and i8 %shift1, %bw2
ret i8 %bw1		ret i8 %bw1
}		}

; Fold (-x >> y) & ((x >> y) ^ -1) -> (-x & ~x) >> y		; Fold (-x >> y) & ((x >> y) ^ -1) -> (-x & ~x) >> y

define i8 @and_ashr_not(i8 %x, i8 %y, i8 %shamt) {		define i8 @and_ashr_not(i8 %x, i8 %y, i8 %shamt) {
; CHECK-LABEL: @and_ashr_not(		; CHECK-LABEL: @and_ashr_not(
; CHECK-NEXT: [[X_SHIFT:%.]] = ashr i8 [[X:%.]], [[SHAMT:%.*]]		; CHECK-NEXT: [[TMP1:%.]] = xor i8 [[Y:%.]], -1
; CHECK-NEXT: [[Y_SHIFT:%.]] = ashr i8 [[Y:%.]], [[SHAMT]]		; CHECK-NEXT: [[TMP2:%.]] = and i8 [[TMP1]], [[X:%.]]
; CHECK-NEXT: [[Y_SHIFT_NOT:%.*]] = xor i8 [[Y_SHIFT]], -1		; CHECK-NEXT: [[AND:%.]] = ashr i8 [[TMP2]], [[SHAMT:%.]]
; CHECK-NEXT: [[AND:%.*]] = and i8 [[X_SHIFT]], [[Y_SHIFT_NOT]]
; CHECK-NEXT: ret i8 [[AND]]		; CHECK-NEXT: ret i8 [[AND]]
;		;
%x.shift = ashr i8 %x, %shamt		%x.shift = ashr i8 %x, %shamt
%y.shift = ashr i8 %y, %shamt		%y.shift = ashr i8 %y, %shamt
%y.shift.not = xor i8 %y.shift, -1		%y.shift.not = xor i8 %y.shift, -1
%and = and i8 %x.shift, %y.shift.not		%and = and i8 %x.shift, %y.shift.not
ret i8 %and		ret i8 %and
}		}

define i8 @and_ashr_not_commuted(i8 %x, i8 %y, i8 %shamt) {		define i8 @and_ashr_not_commuted(i8 %x, i8 %y, i8 %shamt) {
; CHECK-LABEL: @and_ashr_not_commuted(		; CHECK-LABEL: @and_ashr_not_commuted(
; CHECK-NEXT: [[X_SHIFT:%.]] = ashr i8 [[X:%.]], [[SHAMT:%.*]]		; CHECK-NEXT: [[TMP1:%.]] = xor i8 [[Y:%.]], -1
; CHECK-NEXT: [[Y_SHIFT:%.]] = ashr i8 [[Y:%.]], [[SHAMT]]		; CHECK-NEXT: [[TMP2:%.]] = and i8 [[TMP1]], [[X:%.]]
; CHECK-NEXT: [[Y_SHIFT_NOT:%.*]] = xor i8 [[Y_SHIFT]], -1		; CHECK-NEXT: [[AND:%.]] = ashr i8 [[TMP2]], [[SHAMT:%.]]
; CHECK-NEXT: [[AND:%.*]] = and i8 [[X_SHIFT]], [[Y_SHIFT_NOT]]
; CHECK-NEXT: ret i8 [[AND]]		; CHECK-NEXT: ret i8 [[AND]]
;		;
%x.shift = ashr i8 %x, %shamt		%x.shift = ashr i8 %x, %shamt
%y.shift = ashr i8 %y, %shamt		%y.shift = ashr i8 %y, %shamt
%y.shift.not = xor i8 %y.shift, -1		%y.shift.not = xor i8 %y.shift, -1
%and = and i8 %y.shift.not, %x.shift		%and = and i8 %y.shift.not, %x.shift
ret i8 %and		ret i8 %and
}		}
▲ Show 20 Lines • Show All 46 Lines • ▼ Show 20 Lines	;
%y.shift = ashr i8 %y, %shamt		%y.shift = ashr i8 %y, %shamt
%y.shift.not = xor i8 %y.shift, -2		%y.shift.not = xor i8 %y.shift, -2
%and = and i8 %x.shift, %y.shift.not		%and = and i8 %x.shift, %y.shift.not
ret i8 %and		ret i8 %and
}		}

define <4 x i8> @and_ashr_not_vec(<4 x i8> %x, <4 x i8> %y, <4 x i8> %shamt) {		define <4 x i8> @and_ashr_not_vec(<4 x i8> %x, <4 x i8> %y, <4 x i8> %shamt) {
; CHECK-LABEL: @and_ashr_not_vec(		; CHECK-LABEL: @and_ashr_not_vec(
; CHECK-NEXT: [[X_SHIFT:%.]] = ashr <4 x i8> [[X:%.]], [[SHAMT:%.*]]		; CHECK-NEXT: [[TMP1:%.]] = xor <4 x i8> [[Y:%.]], <i8 -1, i8 -1, i8 -1, i8 -1>
; CHECK-NEXT: [[Y_SHIFT:%.]] = ashr <4 x i8> [[Y:%.]], [[SHAMT]]		; CHECK-NEXT: [[TMP2:%.]] = and <4 x i8> [[TMP1]], [[X:%.]]
; CHECK-NEXT: [[Y_SHIFT_NOT:%.*]] = xor <4 x i8> [[Y_SHIFT]], <i8 -1, i8 -1, i8 -1, i8 -1>		; CHECK-NEXT: [[AND:%.]] = ashr <4 x i8> [[TMP2]], [[SHAMT:%.]]
; CHECK-NEXT: [[AND:%.*]] = and <4 x i8> [[X_SHIFT]], [[Y_SHIFT_NOT]]
; CHECK-NEXT: ret <4 x i8> [[AND]]		; CHECK-NEXT: ret <4 x i8> [[AND]]
;		;
%x.shift = ashr <4 x i8> %x, %shamt		%x.shift = ashr <4 x i8> %x, %shamt
%y.shift = ashr <4 x i8> %y, %shamt		%y.shift = ashr <4 x i8> %y, %shamt
%y.shift.not = xor <4 x i8> %y.shift, <i8 -1, i8 -1, i8 -1, i8 -1>		%y.shift.not = xor <4 x i8> %y.shift, <i8 -1, i8 -1, i8 -1, i8 -1>
%and = and <4 x i8> %x.shift, %y.shift.not		%and = and <4 x i8> %x.shift, %y.shift.not
ret <4 x i8> %and		ret <4 x i8> %and
}		}

define <4 x i8> @and_ashr_not_vec_commuted(<4 x i8> %x, <4 x i8> %y, <4 x i8> %shamt) {		define <4 x i8> @and_ashr_not_vec_commuted(<4 x i8> %x, <4 x i8> %y, <4 x i8> %shamt) {
; CHECK-LABEL: @and_ashr_not_vec_commuted(		; CHECK-LABEL: @and_ashr_not_vec_commuted(
; CHECK-NEXT: [[X_SHIFT:%.]] = ashr <4 x i8> [[X:%.]], [[SHAMT:%.*]]		; CHECK-NEXT: [[TMP1:%.]] = xor <4 x i8> [[Y:%.]], <i8 -1, i8 -1, i8 -1, i8 -1>
; CHECK-NEXT: [[Y_SHIFT:%.]] = ashr <4 x i8> [[Y:%.]], [[SHAMT]]		; CHECK-NEXT: [[TMP2:%.]] = and <4 x i8> [[TMP1]], [[X:%.]]
; CHECK-NEXT: [[Y_SHIFT_NOT:%.*]] = xor <4 x i8> [[Y_SHIFT]], <i8 -1, i8 -1, i8 -1, i8 -1>		; CHECK-NEXT: [[AND:%.]] = ashr <4 x i8> [[TMP2]], [[SHAMT:%.]]
; CHECK-NEXT: [[AND:%.*]] = and <4 x i8> [[X_SHIFT]], [[Y_SHIFT_NOT]]
; CHECK-NEXT: ret <4 x i8> [[AND]]		; CHECK-NEXT: ret <4 x i8> [[AND]]
;		;
%x.shift = ashr <4 x i8> %x, %shamt		%x.shift = ashr <4 x i8> %x, %shamt
%y.shift = ashr <4 x i8> %y, %shamt		%y.shift = ashr <4 x i8> %y, %shamt
%y.shift.not = xor <4 x i8> %y.shift, <i8 -1, i8 -1, i8 -1, i8 -1>		%y.shift.not = xor <4 x i8> %y.shift, <i8 -1, i8 -1, i8 -1, i8 -1>
%and = and <4 x i8> %y.shift.not, %x.shift		%and = and <4 x i8> %y.shift.not, %x.shift
ret <4 x i8> %and		ret <4 x i8> %and
}		}

define <4 x i8> @and_ashr_not_vec_undef_1(<4 x i8> %x, <4 x i8> %y, <4 x i8> %shamt) {		define <4 x i8> @and_ashr_not_vec_undef_1(<4 x i8> %x, <4 x i8> %y, <4 x i8> %shamt) {
; CHECK-LABEL: @and_ashr_not_vec_undef_1(		; CHECK-LABEL: @and_ashr_not_vec_undef_1(
; CHECK-NEXT: [[X_SHIFT:%.]] = ashr <4 x i8> [[X:%.]], [[SHAMT:%.*]]		; CHECK-NEXT: [[TMP1:%.]] = xor <4 x i8> [[Y:%.]], <i8 -1, i8 -1, i8 -1, i8 -1>
; CHECK-NEXT: [[Y_SHIFT:%.]] = ashr <4 x i8> [[Y:%.]], [[SHAMT]]		; CHECK-NEXT: [[TMP2:%.]] = and <4 x i8> [[TMP1]], [[X:%.]]
; CHECK-NEXT: [[Y_SHIFT_NOT:%.*]] = xor <4 x i8> [[Y_SHIFT]], <i8 -1, i8 undef, i8 undef, i8 undef>		; CHECK-NEXT: [[AND:%.]] = ashr <4 x i8> [[TMP2]], [[SHAMT:%.]]
; CHECK-NEXT: [[AND:%.*]] = and <4 x i8> [[X_SHIFT]], [[Y_SHIFT_NOT]]
; CHECK-NEXT: ret <4 x i8> [[AND]]		; CHECK-NEXT: ret <4 x i8> [[AND]]
;		;
%x.shift = ashr <4 x i8> %x, %shamt		%x.shift = ashr <4 x i8> %x, %shamt
%y.shift = ashr <4 x i8> %y, %shamt		%y.shift = ashr <4 x i8> %y, %shamt
%y.shift.not = xor <4 x i8> %y.shift, <i8 -1, i8 undef, i8 undef, i8 undef>		%y.shift.not = xor <4 x i8> %y.shift, <i8 -1, i8 undef, i8 undef, i8 undef>
%and = and <4 x i8> %x.shift, %y.shift.not		%and = and <4 x i8> %x.shift, %y.shift.not
ret <4 x i8> %and		ret <4 x i8> %and
}		}

define <4 x i8> @and_ashr_not_vec_undef_2(<4 x i8> %x, <4 x i8> %y, <4 x i8> %shamt) {		define <4 x i8> @and_ashr_not_vec_undef_2(<4 x i8> %x, <4 x i8> %y, <4 x i8> %shamt) {
; CHECK-LABEL: @and_ashr_not_vec_undef_2(		; CHECK-LABEL: @and_ashr_not_vec_undef_2(
; CHECK-NEXT: ret <4 x i8> zeroinitializer		; CHECK-NEXT: ret <4 x i8> zeroinitializer
;		;
%x.shift = ashr <4 x i8> %x, %shamt		%x.shift = ashr <4 x i8> %x, %shamt
%y.shift = ashr <4 x i8> %y, %shamt		%y.shift = ashr <4 x i8> %y, %shamt
%y.shift.not = xor <4 x i8> %y.shift, <i8 undef, i8 undef, i8 undef, i8 undef>		%y.shift.not = xor <4 x i8> %y.shift, <i8 undef, i8 undef, i8 undef, i8 undef>
%and = and <4 x i8> %x.shift, %y.shift.not		%and = and <4 x i8> %x.shift, %y.shift.not
ret <4 x i8> %and		ret <4 x i8> %and
}		}

; Fold (-x >> y) \| ((x >> y) ^ -1) -> (-x \| ~x) >> y		; Fold (-x >> y) \| ((x >> y) ^ -1) -> (-x \| ~x) >> y

define i8 @or_ashr_not(i8 %x, i8 %y, i8 %shamt) {		define i8 @or_ashr_not(i8 %x, i8 %y, i8 %shamt) {
; CHECK-LABEL: @or_ashr_not(		; CHECK-LABEL: @or_ashr_not(
; CHECK-NEXT: [[X_SHIFT:%.]] = ashr i8 [[X:%.]], [[SHAMT:%.*]]		; CHECK-NEXT: [[TMP1:%.]] = xor i8 [[Y:%.]], -1
; CHECK-NEXT: [[Y_SHIFT:%.]] = ashr i8 [[Y:%.]], [[SHAMT]]		; CHECK-NEXT: [[TMP2:%.]] = or i8 [[TMP1]], [[X:%.]]
; CHECK-NEXT: [[Y_SHIFT_NOT:%.*]] = xor i8 [[Y_SHIFT]], -1		; CHECK-NEXT: [[OR:%.]] = ashr i8 [[TMP2]], [[SHAMT:%.]]
; CHECK-NEXT: [[OR:%.*]] = or i8 [[X_SHIFT]], [[Y_SHIFT_NOT]]
; CHECK-NEXT: ret i8 [[OR]]		; CHECK-NEXT: ret i8 [[OR]]
;		;
%x.shift = ashr i8 %x, %shamt		%x.shift = ashr i8 %x, %shamt
%y.shift = ashr i8 %y, %shamt		%y.shift = ashr i8 %y, %shamt
%y.shift.not = xor i8 %y.shift, -1		%y.shift.not = xor i8 %y.shift, -1
%or = or i8 %x.shift, %y.shift.not		%or = or i8 %x.shift, %y.shift.not
ret i8 %or		ret i8 %or
}		}

define i8 @or_ashr_not_commuted(i8 %x, i8 %y, i8 %shamt) {		define i8 @or_ashr_not_commuted(i8 %x, i8 %y, i8 %shamt) {
; CHECK-LABEL: @or_ashr_not_commuted(		; CHECK-LABEL: @or_ashr_not_commuted(
; CHECK-NEXT: [[X_SHIFT:%.]] = ashr i8 [[X:%.]], [[SHAMT:%.*]]		; CHECK-NEXT: [[TMP1:%.]] = xor i8 [[Y:%.]], -1
; CHECK-NEXT: [[Y_SHIFT:%.]] = ashr i8 [[Y:%.]], [[SHAMT]]		; CHECK-NEXT: [[TMP2:%.]] = or i8 [[TMP1]], [[X:%.]]
; CHECK-NEXT: [[Y_SHIFT_NOT:%.*]] = xor i8 [[Y_SHIFT]], -1		; CHECK-NEXT: [[OR:%.]] = ashr i8 [[TMP2]], [[SHAMT:%.]]
; CHECK-NEXT: [[OR:%.*]] = or i8 [[X_SHIFT]], [[Y_SHIFT_NOT]]
; CHECK-NEXT: ret i8 [[OR]]		; CHECK-NEXT: ret i8 [[OR]]
;		;
%x.shift = ashr i8 %x, %shamt		%x.shift = ashr i8 %x, %shamt
%y.shift = ashr i8 %y, %shamt		%y.shift = ashr i8 %y, %shamt
%y.shift.not = xor i8 %y.shift, -1		%y.shift.not = xor i8 %y.shift, -1
%or = or i8 %y.shift.not, %x.shift		%or = or i8 %y.shift.not, %x.shift
ret i8 %or		ret i8 %or
}		}
▲ Show 20 Lines • Show All 46 Lines • ▼ Show 20 Lines	;
%y.shift = ashr i8 %y, %shamt		%y.shift = ashr i8 %y, %shamt
%y.shift.not = xor i8 %y.shift, -2		%y.shift.not = xor i8 %y.shift, -2
%or = or i8 %x.shift, %y.shift.not		%or = or i8 %x.shift, %y.shift.not
ret i8 %or		ret i8 %or
}		}

define <4 x i8> @or_ashr_not_vec(<4 x i8> %x, <4 x i8> %y, <4 x i8> %shamt) {		define <4 x i8> @or_ashr_not_vec(<4 x i8> %x, <4 x i8> %y, <4 x i8> %shamt) {
; CHECK-LABEL: @or_ashr_not_vec(		; CHECK-LABEL: @or_ashr_not_vec(
; CHECK-NEXT: [[X_SHIFT:%.]] = ashr <4 x i8> [[X:%.]], [[SHAMT:%.*]]		; CHECK-NEXT: [[TMP1:%.]] = xor <4 x i8> [[Y:%.]], <i8 -1, i8 -1, i8 -1, i8 -1>
; CHECK-NEXT: [[Y_SHIFT:%.]] = ashr <4 x i8> [[Y:%.]], [[SHAMT]]		; CHECK-NEXT: [[TMP2:%.]] = or <4 x i8> [[TMP1]], [[X:%.]]
; CHECK-NEXT: [[Y_SHIFT_NOT:%.*]] = xor <4 x i8> [[Y_SHIFT]], <i8 -1, i8 -1, i8 -1, i8 -1>		; CHECK-NEXT: [[OR:%.]] = ashr <4 x i8> [[TMP2]], [[SHAMT:%.]]
; CHECK-NEXT: [[OR:%.*]] = or <4 x i8> [[X_SHIFT]], [[Y_SHIFT_NOT]]
; CHECK-NEXT: ret <4 x i8> [[OR]]		; CHECK-NEXT: ret <4 x i8> [[OR]]
;		;
%x.shift = ashr <4 x i8> %x, %shamt		%x.shift = ashr <4 x i8> %x, %shamt
%y.shift = ashr <4 x i8> %y, %shamt		%y.shift = ashr <4 x i8> %y, %shamt
%y.shift.not = xor <4 x i8> %y.shift, <i8 -1, i8 -1, i8 -1, i8 -1>		%y.shift.not = xor <4 x i8> %y.shift, <i8 -1, i8 -1, i8 -1, i8 -1>
%or = or <4 x i8> %x.shift, %y.shift.not		%or = or <4 x i8> %x.shift, %y.shift.not
ret <4 x i8> %or		ret <4 x i8> %or
}		}

define <4 x i8> @or_ashr_not_vec_commuted(<4 x i8> %x, <4 x i8> %y, <4 x i8> %shamt) {		define <4 x i8> @or_ashr_not_vec_commuted(<4 x i8> %x, <4 x i8> %y, <4 x i8> %shamt) {
; CHECK-LABEL: @or_ashr_not_vec_commuted(		; CHECK-LABEL: @or_ashr_not_vec_commuted(
; CHECK-NEXT: [[X_SHIFT:%.]] = ashr <4 x i8> [[X:%.]], [[SHAMT:%.*]]		; CHECK-NEXT: [[TMP1:%.]] = xor <4 x i8> [[Y:%.]], <i8 -1, i8 -1, i8 -1, i8 -1>
; CHECK-NEXT: [[Y_SHIFT:%.]] = ashr <4 x i8> [[Y:%.]], [[SHAMT]]		; CHECK-NEXT: [[TMP2:%.]] = or <4 x i8> [[TMP1]], [[X:%.]]
; CHECK-NEXT: [[Y_SHIFT_NOT:%.*]] = xor <4 x i8> [[Y_SHIFT]], <i8 -1, i8 -1, i8 -1, i8 -1>		; CHECK-NEXT: [[OR:%.]] = ashr <4 x i8> [[TMP2]], [[SHAMT:%.]]
; CHECK-NEXT: [[OR:%.*]] = or <4 x i8> [[X_SHIFT]], [[Y_SHIFT_NOT]]
; CHECK-NEXT: ret <4 x i8> [[OR]]		; CHECK-NEXT: ret <4 x i8> [[OR]]
;		;
%x.shift = ashr <4 x i8> %x, %shamt		%x.shift = ashr <4 x i8> %x, %shamt
%y.shift = ashr <4 x i8> %y, %shamt		%y.shift = ashr <4 x i8> %y, %shamt
%y.shift.not = xor <4 x i8> %y.shift, <i8 -1, i8 -1, i8 -1, i8 -1>		%y.shift.not = xor <4 x i8> %y.shift, <i8 -1, i8 -1, i8 -1, i8 -1>
%or = or <4 x i8> %y.shift.not, %x.shift		%or = or <4 x i8> %y.shift.not, %x.shift
ret <4 x i8> %or		ret <4 x i8> %or
}		}

define <4 x i8> @or_ashr_not_vec_undef_1(<4 x i8> %x, <4 x i8> %y, <4 x i8> %shamt) {		define <4 x i8> @or_ashr_not_vec_undef_1(<4 x i8> %x, <4 x i8> %y, <4 x i8> %shamt) {
; CHECK-LABEL: @or_ashr_not_vec_undef_1(		; CHECK-LABEL: @or_ashr_not_vec_undef_1(
; CHECK-NEXT: [[X_SHIFT:%.]] = ashr <4 x i8> [[X:%.]], [[SHAMT:%.*]]		; CHECK-NEXT: [[TMP1:%.]] = xor <4 x i8> [[Y:%.]], <i8 -1, i8 -1, i8 -1, i8 -1>
; CHECK-NEXT: [[Y_SHIFT:%.]] = ashr <4 x i8> [[Y:%.]], [[SHAMT]]		; CHECK-NEXT: [[TMP2:%.]] = or <4 x i8> [[TMP1]], [[X:%.]]
; CHECK-NEXT: [[Y_SHIFT_NOT:%.*]] = xor <4 x i8> [[Y_SHIFT]], <i8 -1, i8 undef, i8 undef, i8 undef>		; CHECK-NEXT: [[OR:%.]] = ashr <4 x i8> [[TMP2]], [[SHAMT:%.]]
; CHECK-NEXT: [[OR:%.*]] = or <4 x i8> [[X_SHIFT]], [[Y_SHIFT_NOT]]
; CHECK-NEXT: ret <4 x i8> [[OR]]		; CHECK-NEXT: ret <4 x i8> [[OR]]
;		;
%x.shift = ashr <4 x i8> %x, %shamt		%x.shift = ashr <4 x i8> %x, %shamt
%y.shift = ashr <4 x i8> %y, %shamt		%y.shift = ashr <4 x i8> %y, %shamt
%y.shift.not = xor <4 x i8> %y.shift, <i8 -1, i8 undef, i8 undef, i8 undef>		%y.shift.not = xor <4 x i8> %y.shift, <i8 -1, i8 undef, i8 undef, i8 undef>
%or = or <4 x i8> %x.shift, %y.shift.not		%or = or <4 x i8> %x.shift, %y.shift.not
ret <4 x i8> %or		ret <4 x i8> %or
}		}

define <4 x i8> @or_ashr_not_vec_undef_2(<4 x i8> %x, <4 x i8> %y, <4 x i8> %shamt) {		define <4 x i8> @or_ashr_not_vec_undef_2(<4 x i8> %x, <4 x i8> %y, <4 x i8> %shamt) {
; CHECK-LABEL: @or_ashr_not_vec_undef_2(		; CHECK-LABEL: @or_ashr_not_vec_undef_2(
; CHECK-NEXT: ret <4 x i8> <i8 -1, i8 -1, i8 -1, i8 -1>		; CHECK-NEXT: ret <4 x i8> <i8 -1, i8 -1, i8 -1, i8 -1>
;		;
%x.shift = ashr <4 x i8> %x, %shamt		%x.shift = ashr <4 x i8> %x, %shamt
%y.shift = ashr <4 x i8> %y, %shamt		%y.shift = ashr <4 x i8> %y, %shamt
%y.shift.not = xor <4 x i8> %y.shift, <i8 undef, i8 undef, i8 undef, i8 undef>		%y.shift.not = xor <4 x i8> %y.shift, <i8 undef, i8 undef, i8 undef, i8 undef>
%or = or <4 x i8> %x.shift, %y.shift.not		%or = or <4 x i8> %x.shift, %y.shift.not
ret <4 x i8> %or		ret <4 x i8> %or
}		}

; Fold (-x >> y) ^ ((x >> y) ^ -1) -> (-x ^ ~x) >> y		; Fold (-x >> y) ^ ((x >> y) ^ -1) -> (-x ^ ~x) >> y

define i8 @xor_ashr_not(i8 %x, i8 %y, i8 %shamt) {		define i8 @xor_ashr_not(i8 %x, i8 %y, i8 %shamt) {
; CHECK-LABEL: @xor_ashr_not(		; CHECK-LABEL: @xor_ashr_not(
; CHECK-NEXT: [[Y_SHIFT1:%.]] = xor i8 [[Y:%.]], [[X:%.*]]		; CHECK-NEXT: [[TMP1:%.]] = xor i8 [[Y:%.]], [[X:%.*]]
; CHECK-NEXT: [[TMP1:%.]] = ashr i8 [[Y_SHIFT1]], [[SHAMT:%.]]		; CHECK-NEXT: [[DOTNOT:%.]] = ashr i8 [[TMP1]], [[SHAMT:%.]]
; CHECK-NEXT: [[XOR:%.*]] = xor i8 [[TMP1]], -1		; CHECK-NEXT: [[XOR:%.*]] = xor i8 [[DOTNOT]], -1
; CHECK-NEXT: ret i8 [[XOR]]		; CHECK-NEXT: ret i8 [[XOR]]
;		;
%x.shift = ashr i8 %x, %shamt		%x.shift = ashr i8 %x, %shamt
%y.shift = ashr i8 %y, %shamt		%y.shift = ashr i8 %y, %shamt
%y.shift.not = xor i8 %y.shift, -1		%y.shift.not = xor i8 %y.shift, -1
%xor = xor i8 %x.shift, %y.shift.not		%xor = xor i8 %x.shift, %y.shift.not
ret i8 %xor		ret i8 %xor
}		}

define i8 @xor_ashr_not_commuted(i8 %x, i8 %y, i8 %shamt) {		define i8 @xor_ashr_not_commuted(i8 %x, i8 %y, i8 %shamt) {
; CHECK-LABEL: @xor_ashr_not_commuted(		; CHECK-LABEL: @xor_ashr_not_commuted(
; CHECK-NEXT: [[Y_SHIFT1:%.]] = xor i8 [[Y:%.]], [[X:%.*]]		; CHECK-NEXT: [[TMP1:%.]] = xor i8 [[Y:%.]], [[X:%.*]]
; CHECK-NEXT: [[TMP1:%.]] = ashr i8 [[Y_SHIFT1]], [[SHAMT:%.]]		; CHECK-NEXT: [[DOTNOT:%.]] = ashr i8 [[TMP1]], [[SHAMT:%.]]
; CHECK-NEXT: [[XOR:%.*]] = xor i8 [[TMP1]], -1		; CHECK-NEXT: [[XOR:%.*]] = xor i8 [[DOTNOT]], -1
; CHECK-NEXT: ret i8 [[XOR]]		; CHECK-NEXT: ret i8 [[XOR]]
;		;
%x.shift = ashr i8 %x, %shamt		%x.shift = ashr i8 %x, %shamt
%y.shift = ashr i8 %y, %shamt		%y.shift = ashr i8 %y, %shamt
%y.shift.not = xor i8 %y.shift, -1		%y.shift.not = xor i8 %y.shift, -1
%xor = xor i8 %y.shift.not, %x.shift		%xor = xor i8 %y.shift.not, %x.shift
ret i8 %xor		ret i8 %xor
}		}
▲ Show 20 Lines • Show All 45 Lines • ▼ Show 20 Lines	;
%y.shift = ashr i8 %y, %shamt		%y.shift = ashr i8 %y, %shamt
%y.shift.not = xor i8 %y.shift, -2		%y.shift.not = xor i8 %y.shift, -2
%xor = xor i8 %x.shift, %y.shift.not		%xor = xor i8 %x.shift, %y.shift.not
ret i8 %xor		ret i8 %xor
}		}

define <4 x i8> @xor_ashr_not_vec(<4 x i8> %x, <4 x i8> %y, <4 x i8> %shamt) {		define <4 x i8> @xor_ashr_not_vec(<4 x i8> %x, <4 x i8> %y, <4 x i8> %shamt) {
; CHECK-LABEL: @xor_ashr_not_vec(		; CHECK-LABEL: @xor_ashr_not_vec(
; CHECK-NEXT: [[Y_SHIFT1:%.]] = xor <4 x i8> [[Y:%.]], [[X:%.*]]		; CHECK-NEXT: [[TMP1:%.]] = xor <4 x i8> [[Y:%.]], [[X:%.*]]
; CHECK-NEXT: [[TMP1:%.]] = ashr <4 x i8> [[Y_SHIFT1]], [[SHAMT:%.]]		; CHECK-NEXT: [[DOTNOT:%.]] = ashr <4 x i8> [[TMP1]], [[SHAMT:%.]]
; CHECK-NEXT: [[XOR:%.*]] = xor <4 x i8> [[TMP1]], <i8 -1, i8 -1, i8 -1, i8 -1>		; CHECK-NEXT: [[XOR:%.*]] = xor <4 x i8> [[DOTNOT]], <i8 -1, i8 -1, i8 -1, i8 -1>
; CHECK-NEXT: ret <4 x i8> [[XOR]]		; CHECK-NEXT: ret <4 x i8> [[XOR]]
;		;
%x.shift = ashr <4 x i8> %x, %shamt		%x.shift = ashr <4 x i8> %x, %shamt
%y.shift = ashr <4 x i8> %y, %shamt		%y.shift = ashr <4 x i8> %y, %shamt
%y.shift.not = xor <4 x i8> %y.shift, <i8 -1, i8 -1, i8 -1, i8 -1>		%y.shift.not = xor <4 x i8> %y.shift, <i8 -1, i8 -1, i8 -1, i8 -1>
%xor = xor <4 x i8> %x.shift, %y.shift.not		%xor = xor <4 x i8> %x.shift, %y.shift.not
ret <4 x i8> %xor		ret <4 x i8> %xor
}		}

define <4 x i8> @xor_ashr_not_vec_commuted(<4 x i8> %x, <4 x i8> %y, <4 x i8> %shamt) {		define <4 x i8> @xor_ashr_not_vec_commuted(<4 x i8> %x, <4 x i8> %y, <4 x i8> %shamt) {
; CHECK-LABEL: @xor_ashr_not_vec_commuted(		; CHECK-LABEL: @xor_ashr_not_vec_commuted(
; CHECK-NEXT: [[Y_SHIFT1:%.]] = xor <4 x i8> [[Y:%.]], [[X:%.*]]		; CHECK-NEXT: [[TMP1:%.]] = xor <4 x i8> [[Y:%.]], [[X:%.*]]
; CHECK-NEXT: [[TMP1:%.]] = ashr <4 x i8> [[Y_SHIFT1]], [[SHAMT:%.]]		; CHECK-NEXT: [[DOTNOT:%.]] = ashr <4 x i8> [[TMP1]], [[SHAMT:%.]]
; CHECK-NEXT: [[XOR:%.*]] = xor <4 x i8> [[TMP1]], <i8 -1, i8 -1, i8 -1, i8 -1>		; CHECK-NEXT: [[XOR:%.*]] = xor <4 x i8> [[DOTNOT]], <i8 -1, i8 -1, i8 -1, i8 -1>
; CHECK-NEXT: ret <4 x i8> [[XOR]]		; CHECK-NEXT: ret <4 x i8> [[XOR]]
;		;
%x.shift = ashr <4 x i8> %x, %shamt		%x.shift = ashr <4 x i8> %x, %shamt
%y.shift = ashr <4 x i8> %y, %shamt		%y.shift = ashr <4 x i8> %y, %shamt
%y.shift.not = xor <4 x i8> %y.shift, <i8 -1, i8 -1, i8 -1, i8 -1>		%y.shift.not = xor <4 x i8> %y.shift, <i8 -1, i8 -1, i8 -1, i8 -1>
%xor = xor <4 x i8> %y.shift.not, %x.shift		%xor = xor <4 x i8> %y.shift.not, %x.shift
ret <4 x i8> %xor		ret <4 x i8> %xor
}		}

define <4 x i8> @xor_ashr_not_vec_undef_1(<4 x i8> %x, <4 x i8> %y, <4 x i8> %shamt) {		define <4 x i8> @xor_ashr_not_vec_undef_1(<4 x i8> %x, <4 x i8> %y, <4 x i8> %shamt) {
; CHECK-LABEL: @xor_ashr_not_vec_undef_1(		; CHECK-LABEL: @xor_ashr_not_vec_undef_1(
; CHECK-NEXT: [[Y_SHIFT1:%.]] = xor <4 x i8> [[Y:%.]], [[X:%.*]]		; CHECK-NEXT: [[TMP1:%.]] = xor <4 x i8> [[Y:%.]], [[X:%.*]]
; CHECK-NEXT: [[TMP1:%.]] = ashr <4 x i8> [[Y_SHIFT1]], [[SHAMT:%.]]		; CHECK-NEXT: [[DOTNOT:%.]] = ashr <4 x i8> [[TMP1]], [[SHAMT:%.]]
; CHECK-NEXT: [[XOR:%.*]] = xor <4 x i8> [[TMP1]], <i8 -1, i8 undef, i8 undef, i8 undef>		; CHECK-NEXT: [[XOR:%.*]] = xor <4 x i8> [[DOTNOT]], <i8 -1, i8 -1, i8 -1, i8 -1>
; CHECK-NEXT: ret <4 x i8> [[XOR]]		; CHECK-NEXT: ret <4 x i8> [[XOR]]
;		;
%x.shift = ashr <4 x i8> %x, %shamt		%x.shift = ashr <4 x i8> %x, %shamt
%y.shift = ashr <4 x i8> %y, %shamt		%y.shift = ashr <4 x i8> %y, %shamt
%y.shift.not = xor <4 x i8> %y.shift, <i8 -1, i8 undef, i8 undef, i8 undef>		%y.shift.not = xor <4 x i8> %y.shift, <i8 -1, i8 undef, i8 undef, i8 undef>
%xor = xor <4 x i8> %x.shift, %y.shift.not		%xor = xor <4 x i8> %x.shift, %y.shift.not
ret <4 x i8> %xor		ret <4 x i8> %xor
}		}
Show All 28 Lines

This is an archive of the discontinued LLVM Phabricator instance.

[InstCombine] Fold (-a >> b) and/or/xor (~a >> b) into (-a and/or/xor ~a) >> b
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 549950

llvm/lib/Transforms/InstCombine/InstructionCombining.cpp

llvm/test/Transforms/InstCombine/binop-and-shifts.ll

This is an archive of the discontinued LLVM Phabricator instance.

[InstCombine] Fold (-a >> b) and/or/xor (~a >> b) into (-a and/or/xor ~a) >> b
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 549950

llvm/lib/Transforms/InstCombine/InstructionCombining.cpp

llvm/test/Transforms/InstCombine/binop-and-shifts.ll

[InstCombine] Fold (-a >> b) and/or/xor (~a >> b) into (-a and/or/xor ~a) >> b
ClosedPublic