Diff 162025

lib/Target/X86/X86ISelDAGToDAG.cpp

Show First 20 Lines • Show All 450 Lines • ▼ Show 20 Lines	bool useNonTemporalLoad(LoadSDNode *N) const {
return Subtarget->hasAVX512();		return Subtarget->hasAVX512();
}		}
}		}

bool foldLoadStoreIntoMemOperand(SDNode *Node);		bool foldLoadStoreIntoMemOperand(SDNode *Node);
bool matchBEXTRFromAnd(SDNode *Node);		bool matchBEXTRFromAnd(SDNode *Node);
bool shrinkAndImmediate(SDNode *N);		bool shrinkAndImmediate(SDNode *N);
bool isMaskZeroExtended(SDNode *N) const;		bool isMaskZeroExtended(SDNode *N) const;
		bool tryShiftAmountMod(SDNode *N);

MachineSDNode *emitPCMPISTR(unsigned ROpc, unsigned MOpc, bool MayFoldLoad,		MachineSDNode *emitPCMPISTR(unsigned ROpc, unsigned MOpc, bool MayFoldLoad,
const SDLoc &dl, MVT VT, SDNode *Node);		const SDLoc &dl, MVT VT, SDNode *Node);
MachineSDNode *emitPCMPESTR(unsigned ROpc, unsigned MOpc, bool MayFoldLoad,		MachineSDNode *emitPCMPESTR(unsigned ROpc, unsigned MOpc, bool MayFoldLoad,
const SDLoc &dl, MVT VT, SDNode *Node,		const SDLoc &dl, MVT VT, SDNode *Node,
SDValue &InFlag);		SDValue &InFlag);
};		};
}		}
▲ Show 20 Lines • Show All 2,218 Lines • ▼ Show 20 Lines	MachineSDNode *X86DAGToDAGISel::emitPCMPESTR(unsigned ROpc, unsigned MOpc,

SDValue Ops[] = { N0, N2, Imm, InFlag };		SDValue Ops[] = { N0, N2, Imm, InFlag };
SDVTList VTs = CurDAG->getVTList(VT, MVT::i32, MVT::Glue);		SDVTList VTs = CurDAG->getVTList(VT, MVT::i32, MVT::Glue);
MachineSDNode *CNode = CurDAG->getMachineNode(ROpc, dl, VTs, Ops);		MachineSDNode *CNode = CurDAG->getMachineNode(ROpc, dl, VTs, Ops);
InFlag = SDValue(CNode, 2);		InFlag = SDValue(CNode, 2);
return CNode;		return CNode;
}		}

		bool X86DAGToDAGISel::tryShiftAmountMod(SDNode *N) {
		EVT VT = N->getValueType(0);

		// Only handle scalar shifts.
		if (VT.isVector())
		return false;

		// Narrower shifts only mask to 5 bits in hardware.
		unsigned Size = VT == MVT::i64 ? 64 : 32;

		SDValue OrigShiftAmt = N->getOperand(1);
		SDValue ShiftAmt = OrigShiftAmt;
		SDLoc DL(N);

		// Skip over a truncate of the shift amount.
		if (ShiftAmt->getOpcode() == ISD::TRUNCATE)
		ShiftAmt = ShiftAmt->getOperand(0);

		// Special case to avoid messing up a BZHI pattern.
		lebedev.riUnsubmitted Not Done Reply Inline Actions Why? I would think we can simply add one more pattern to the `BZHI`? I think this is bad because it blocks not only the case of "messing up a BZHI pattern", but anything else too, since it does not check that the user is `and %val, %mask`. lebedev.ri: Why? I would think we can simply add one more pattern to the `BZHI`? I think this is bad…
		craig.topperAuthorUnsubmitted Not Done Reply Inline Actions This code runs when the root node considered for isel is a srl/sra/shl. And it runs before any tablegen patterns on that node. Any patterns that used a shift, but where the shift was not the root node have already been matched. So I'm specifically blocking out this one bzhi pattern that has a shift as a root node. // x << (bitwidth - y) >> (bitwidth - y) defm : _bmi_bzhi_pattern<(srl (shl RC:$src, (sub bitwidth, GR8:$lz)), (sub bitwidth, GR8:$lz)), (srl (shl (x86memop addr:$src), (sub bitwidth, GR8:$lz)), (sub bitwidth, GR8:$lz)), RC, VT, DstInst, DstMemInst>; craig.topper: This code runs when the root node considered for isel is a srl/sra/shl. And it runs before any…
		lebedev.riUnsubmitted Not Done Reply Inline Actions I see, thank you for the explanation. lebedev.ri: I see, thank you for the explanation.
		// Look for (srl (shl X, (size - y)), (size - y))
		if (Subtarget->hasBMI2() && (VT == MVT::i32 \|\| VT == MVT::i64) &&
		N->getOpcode() == ISD::SRL && N->getOperand(0).getOpcode() == ISD::SHL &&
		// Shift amounts the same?
		N->getOperand(1) == N->getOperand(0).getOperand(1) &&
		// Shift amounts size - y?
		ShiftAmt.getOpcode() == ISD::SUB &&
		isa<ConstantSDNode>(ShiftAmt.getOperand(0)) &&
		cast<ConstantSDNode>(ShiftAmt.getOperand(0))->getZExtValue() == Size)
		return false;

		SDValue NewShiftAmt;
		if (ShiftAmt->getOpcode() == ISD::ADD \|\| ShiftAmt->getOpcode() == ISD::SUB) {
		SDValue Add0 = ShiftAmt->getOperand(0);
		SDValue Add1 = ShiftAmt->getOperand(1);
		// If we are shifting by X+/-N where N == 0 mod Size, then just shift by X
		lebedev.riUnsubmitted Not Done Reply Inline Actions Are you sure this shouldn't be `N mod Size == 0`? At least I think that is what the code does. lebedev.ri: Are you sure this shouldn't be `N mod Size == 0`? At least I think that is what the code does.
		// to avoid the ADD/SUB.
		if (isa<ConstantSDNode>(Add1) &&
		cast<ConstantSDNode>(Add1)->getZExtValue() % Size == 0) {
		NewShiftAmt = Add0;
		// If we are shifting by N-X where N == 0 mod Size, then just shift by -X to
		lebedev.riUnsubmitted Not Done Reply Inline Actions Same lebedev.ri: Same
		// generate a NEG instead of a SUB of a constant.
		} else if (ShiftAmt->getOpcode() == ISD::SUB &&
		isa<ConstantSDNode>(Add0) &&
		cast<ConstantSDNode>(Add0)->getZExtValue() != 0 &&
		cast<ConstantSDNode>(Add0)->getZExtValue() % Size == 0) {
		// Insert a negate op.
		// TODO: This isn't guaranteed to replace the sub if there is a logic cone
		// that uses it that's not a shift.
		EVT SubVT = ShiftAmt.getValueType();
		SDValue Zero = CurDAG->getConstant(0, DL, SubVT);
		SDValue Neg = CurDAG->getNode(ISD::SUB, DL, SubVT, Zero, Add1);
		NewShiftAmt = Neg;

		// Insert these operands into a valid topological order so they can
		// get selected independently.
		insertDAGNode(*CurDAG, OrigShiftAmt, Zero);
		insertDAGNode(*CurDAG, OrigShiftAmt, Neg);
		niravdUnsubmitted Not Done Reply Inline Actions There's definitely an issue with insertDAGNode where collisions due to CSE could require a nontrivial reordering in AllNodes to maintain the 'users before operands' property and we reposition at most one node. At some point we should probably replace insertDAGNode with a backend-generic way to correctly reposition that node and its operands recursively to guarantee correct behavior. That said, hitting the issue in a way that will mess with correctness is pretty hard. We should probably change the position given to insertDAGNode to be the immediate operand to minimize the probability of reordering size. niravd: There's definitely an issue with insertDAGNode where collisions due to CSE could require a…
		} else
		return false;
		} else
		return false;

		if (NewShiftAmt.getValueType() != MVT::i8) {
		// Need to truncate the shift amount.
		NewShiftAmt = CurDAG->getNode(ISD::TRUNCATE, DL, MVT::i8, NewShiftAmt);
		// Add to a correct topological ordering.
		insertDAGNode(*CurDAG, OrigShiftAmt, NewShiftAmt);
		}

		// Insert a new mask to keep the shift amount legal. This should be removed
		// by isel patterns.
		NewShiftAmt = CurDAG->getNode(ISD::AND, DL, MVT::i8, NewShiftAmt,
		CurDAG->getConstant(Size - 1, DL, MVT::i8));
		// Place in a correct topological ordering.
		insertDAGNode(*CurDAG, OrigShiftAmt, NewShiftAmt);

		SDNode *UpdatedNode = CurDAG->UpdateNodeOperands(N, N->getOperand(0),
		NewShiftAmt);
		niravdUnsubmitted Not Done Reply Inline Actions You should overwrite N with the return value of the update in case the update is CSEd with another node, e.g., we are selecting in a block that has both the pre-optimized and post-optimized versions. Actually, we should probably add a test case for this. N = CurDAG->UpdateNodeOperands(N, N->getOperand(0), NewShiftAmt); niravd: You should overwrite N with the return value of the update in case the update is CSEd with…
		craig.topperAuthorUnsubmitted Not Done Reply Inline Actions I'm having a hard time getting the topological sort to give me an order that can cause this to happen. We're always doing isel on the post-optimized version I explicitly put in the IR first. There are more nodes in that path and that seems to be making it so that the pre-optimized path gets fully sorted into the topological order before the post-optimized side does. craig.topper: I'm having a hard time getting the topological sort to give me an order that can cause this to…
		niravdUnsubmitted Not Done Reply Inline Actions I don't have the details of the topological sort worked out, but it definitely seems reasonable that it precludes any problematic orderings. Given that, let's skip on adding a test case for this. niravd: I don't have the details of the topological sort worked out, but it definitely seems reasonable…
		if (UpdatedNode != N) {
		// If we found an existing node, we should replace ourselves with that node
		// and wait for it to be selected after its other users.
		ReplaceNode(N, UpdatedNode);
		return true;
		}

		// If the original shift amount is now dead, delete it so that we don't run
		// it through isel.
		if (OrigShiftAmt.getNode()->use_empty())
		CurDAG->RemoveDeadNode(OrigShiftAmt.getNode());

		// Now that we've optimized the shift amount, defer to normal isel to get
		// load folding and legacy vs BMI2 selection without repeating it here.
		SelectCode(N);
		return true;
		}

/// If the high bits of an 'and' operand are known zero, try setting the		/// If the high bits of an 'and' operand are known zero, try setting the
/// high bits of an 'and' constant operand to produce a smaller encoding by		/// high bits of an 'and' constant operand to produce a smaller encoding by
/// creating a small, sign-extended negative immediate rather than a large		/// creating a small, sign-extended negative immediate rather than a large
/// positive one. This reverses a transform in SimplifyDemandedBits that		/// positive one. This reverses a transform in SimplifyDemandedBits that
/// shrinks mask constants by clearing bits. There is also a possibility that		/// shrinks mask constants by clearing bits. There is also a possibility that
/// the 'and' mask can be made -1, so the 'and' itself is unnecessary. In that		/// the 'and' mask can be made -1, so the 'and' itself is unnecessary. In that
/// case, just replace the 'and'. Return 'true' if the node is replaced.		/// case, just replace the 'and'. Return 'true' if the node is replaced.
bool X86DAGToDAGISel::shrinkAndImmediate(SDNode *And) {		bool X86DAGToDAGISel::shrinkAndImmediate(SDNode *And) {
▲ Show 20 Lines • Show All 114 Lines • ▼ Show 20 Lines	SDValue VSelect = CurDAG->getNode(
ISD::VSELECT, SDLoc(Node), Node->getValueType(0), Node->getOperand(0),		ISD::VSELECT, SDLoc(Node), Node->getValueType(0), Node->getOperand(0),
Node->getOperand(1), Node->getOperand(2));		Node->getOperand(1), Node->getOperand(2));
ReplaceNode(Node, VSelect.getNode());		ReplaceNode(Node, VSelect.getNode());
SelectCode(VSelect.getNode());		SelectCode(VSelect.getNode());
// We already called ReplaceUses.		// We already called ReplaceUses.
return;		return;
}		}

		case ISD::SRL:
		case ISD::SRA:
		case ISD::SHL:
		if (tryShiftAmountMod(Node))
		return;
		break;

case ISD::AND:		case ISD::AND:
if (matchBEXTRFromAnd(Node))		if (matchBEXTRFromAnd(Node))
return;		return;
if (shrinkAndImmediate(Node))		if (shrinkAndImmediate(Node))
return;		return;

LLVM_FALLTHROUGH;		LLVM_FALLTHROUGH;
case ISD::OR:		case ISD::OR:
▲ Show 20 Lines • Show All 602 Lines • Show Last 20 Lines

test/CodeGen/X86/clear-lowbits.ll

	Show First 20 Lines • Show All 1,102 Lines • ▼ Show 20 Lines
	}			}

	; 32-bit			; 32-bit

	define i32 @clear_lowbits32_ic0(i32 %val, i32 %numlowbits) nounwind {			define i32 @clear_lowbits32_ic0(i32 %val, i32 %numlowbits) nounwind {
	; X86-NOBMI2-LABEL: clear_lowbits32_ic0:			; X86-NOBMI2-LABEL: clear_lowbits32_ic0:
	; X86-NOBMI2: # %bb.0:			; X86-NOBMI2: # %bb.0:
	; X86-NOBMI2-NEXT: movl {{[0-9]+}}(%esp), %eax			; X86-NOBMI2-NEXT: movl {{[0-9]+}}(%esp), %eax
	; X86-NOBMI2-NEXT: movl $32, %ecx			; X86-NOBMI2-NEXT: xorl %ecx, %ecx
	; X86-NOBMI2-NEXT: subl {{[0-9]+}}(%esp), %ecx			; X86-NOBMI2-NEXT: subl {{[0-9]+}}(%esp), %ecx
	; X86-NOBMI2-NEXT: shrl %cl, %eax			; X86-NOBMI2-NEXT: shrl %cl, %eax
	; X86-NOBMI2-NEXT: # kill: def $cl killed $cl killed $ecx			; X86-NOBMI2-NEXT: # kill: def $cl killed $cl killed $ecx
	; X86-NOBMI2-NEXT: shll %cl, %eax			; X86-NOBMI2-NEXT: shll %cl, %eax
	; X86-NOBMI2-NEXT: retl			; X86-NOBMI2-NEXT: retl
	;			;
	; X86-BMI2-LABEL: clear_lowbits32_ic0:			; X86-BMI2-LABEL: clear_lowbits32_ic0:
	; X86-BMI2: # %bb.0:			; X86-BMI2: # %bb.0:
	; X86-BMI2-NEXT: movl $32, %eax			; X86-BMI2-NEXT: xorl %eax, %eax
	; X86-BMI2-NEXT: subl {{[0-9]+}}(%esp), %eax			; X86-BMI2-NEXT: subl {{[0-9]+}}(%esp), %eax
	; X86-BMI2-NEXT: shrxl %eax, {{[0-9]+}}(%esp), %ecx			; X86-BMI2-NEXT: shrxl %eax, {{[0-9]+}}(%esp), %ecx
	; X86-BMI2-NEXT: shlxl %eax, %ecx, %eax			; X86-BMI2-NEXT: shlxl %eax, %ecx, %eax
	; X86-BMI2-NEXT: retl			; X86-BMI2-NEXT: retl
	;			;
	; X64-NOBMI2-LABEL: clear_lowbits32_ic0:			; X64-NOBMI2-LABEL: clear_lowbits32_ic0:
	; X64-NOBMI2: # %bb.0:			; X64-NOBMI2: # %bb.0:
	; X64-NOBMI2-NEXT: movl $32, %ecx			; X64-NOBMI2-NEXT: movl %esi, %ecx
	; X64-NOBMI2-NEXT: subl %esi, %ecx			; X64-NOBMI2-NEXT: negl %ecx
	; X64-NOBMI2-NEXT: shrl %cl, %edi			; X64-NOBMI2-NEXT: shrl %cl, %edi
	; X64-NOBMI2-NEXT: # kill: def $cl killed $cl killed $ecx			; X64-NOBMI2-NEXT: # kill: def $cl killed $cl killed $ecx
	; X64-NOBMI2-NEXT: shll %cl, %edi			; X64-NOBMI2-NEXT: shll %cl, %edi
	; X64-NOBMI2-NEXT: movl %edi, %eax			; X64-NOBMI2-NEXT: movl %edi, %eax
	; X64-NOBMI2-NEXT: retq			; X64-NOBMI2-NEXT: retq
	;			;
	; X64-BMI2-LABEL: clear_lowbits32_ic0:			; X64-BMI2-LABEL: clear_lowbits32_ic0:
	; X64-BMI2: # %bb.0:			; X64-BMI2: # %bb.0:
	; X64-BMI2-NEXT: movl $32, %eax			; X64-BMI2-NEXT: negl %esi
	; X64-BMI2-NEXT: subl %esi, %eax			; X64-BMI2-NEXT: shrxl %esi, %edi, %eax
	; X64-BMI2-NEXT: shrxl %eax, %edi, %ecx			; X64-BMI2-NEXT: shlxl %esi, %eax, %eax
	; X64-BMI2-NEXT: shlxl %eax, %ecx, %eax
	; X64-BMI2-NEXT: retq			; X64-BMI2-NEXT: retq
	%numhighbits = sub i32 32, %numlowbits			%numhighbits = sub i32 32, %numlowbits
	%mask = shl i32 -1, %numhighbits			%mask = shl i32 -1, %numhighbits
	%masked = and i32 %mask, %val			%masked = and i32 %mask, %val
	ret i32 %masked			ret i32 %masked
	}			}

	define i32 @clear_lowbits32_ic1_indexzext(i32 %val, i8 %numlowbits) nounwind {			define i32 @clear_lowbits32_ic1_indexzext(i32 %val, i8 %numlowbits) nounwind {
	; X86-NOBMI2-LABEL: clear_lowbits32_ic1_indexzext:			; X86-NOBMI2-LABEL: clear_lowbits32_ic1_indexzext:
	; X86-NOBMI2: # %bb.0:			; X86-NOBMI2: # %bb.0:
	; X86-NOBMI2-NEXT: movl {{[0-9]+}}(%esp), %eax			; X86-NOBMI2-NEXT: movl {{[0-9]+}}(%esp), %eax
	; X86-NOBMI2-NEXT: movb $32, %cl			; X86-NOBMI2-NEXT: xorl %ecx, %ecx
	; X86-NOBMI2-NEXT: subb {{[0-9]+}}(%esp), %cl			; X86-NOBMI2-NEXT: subb {{[0-9]+}}(%esp), %cl
	; X86-NOBMI2-NEXT: shrl %cl, %eax			; X86-NOBMI2-NEXT: shrl %cl, %eax
				; X86-NOBMI2-NEXT: # kill: def $cl killed $cl killed $ecx
	; X86-NOBMI2-NEXT: shll %cl, %eax			; X86-NOBMI2-NEXT: shll %cl, %eax
	; X86-NOBMI2-NEXT: retl			; X86-NOBMI2-NEXT: retl
	;			;
	; X86-BMI2-LABEL: clear_lowbits32_ic1_indexzext:			; X86-BMI2-LABEL: clear_lowbits32_ic1_indexzext:
	; X86-BMI2: # %bb.0:			; X86-BMI2: # %bb.0:
	; X86-BMI2-NEXT: movb $32, %al			; X86-BMI2-NEXT: xorl %eax, %eax
	; X86-BMI2-NEXT: subb {{[0-9]+}}(%esp), %al			; X86-BMI2-NEXT: subb {{[0-9]+}}(%esp), %al
	; X86-BMI2-NEXT: shrxl %eax, {{[0-9]+}}(%esp), %ecx			; X86-BMI2-NEXT: shrxl %eax, {{[0-9]+}}(%esp), %ecx
	; X86-BMI2-NEXT: shlxl %eax, %ecx, %eax			; X86-BMI2-NEXT: shlxl %eax, %ecx, %eax
	; X86-BMI2-NEXT: retl			; X86-BMI2-NEXT: retl
	;			;
	; X64-NOBMI2-LABEL: clear_lowbits32_ic1_indexzext:			; X64-NOBMI2-LABEL: clear_lowbits32_ic1_indexzext:
	; X64-NOBMI2: # %bb.0:			; X64-NOBMI2: # %bb.0:
	; X64-NOBMI2-NEXT: movb $32, %cl			; X64-NOBMI2-NEXT: movl %esi, %ecx
	; X64-NOBMI2-NEXT: subb %sil, %cl			; X64-NOBMI2-NEXT: negb %cl
	; X64-NOBMI2-NEXT: shrl %cl, %edi			; X64-NOBMI2-NEXT: shrl %cl, %edi
				; X64-NOBMI2-NEXT: # kill: def $cl killed $cl killed $ecx
	; X64-NOBMI2-NEXT: shll %cl, %edi			; X64-NOBMI2-NEXT: shll %cl, %edi
	; X64-NOBMI2-NEXT: movl %edi, %eax			; X64-NOBMI2-NEXT: movl %edi, %eax
	; X64-NOBMI2-NEXT: retq			; X64-NOBMI2-NEXT: retq
	;			;
	; X64-BMI2-LABEL: clear_lowbits32_ic1_indexzext:			; X64-BMI2-LABEL: clear_lowbits32_ic1_indexzext:
	; X64-BMI2: # %bb.0:			; X64-BMI2: # %bb.0:
	; X64-BMI2-NEXT: movb $32, %al			; X64-BMI2-NEXT: negb %sil
	; X64-BMI2-NEXT: subb %sil, %al			; X64-BMI2-NEXT: shrxl %esi, %edi, %eax
	; X64-BMI2-NEXT: shrxl %eax, %edi, %ecx			; X64-BMI2-NEXT: shlxl %esi, %eax, %eax
	; X64-BMI2-NEXT: shlxl %eax, %ecx, %eax
	; X64-BMI2-NEXT: retq			; X64-BMI2-NEXT: retq
	%numhighbits = sub i8 32, %numlowbits			%numhighbits = sub i8 32, %numlowbits
	%sh_prom = zext i8 %numhighbits to i32			%sh_prom = zext i8 %numhighbits to i32
	%mask = shl i32 -1, %sh_prom			%mask = shl i32 -1, %sh_prom
	%masked = and i32 %mask, %val			%masked = and i32 %mask, %val
	ret i32 %masked			ret i32 %masked
	}			}

	define i32 @clear_lowbits32_ic2_load(i32* %w, i32 %numlowbits) nounwind {			define i32 @clear_lowbits32_ic2_load(i32* %w, i32 %numlowbits) nounwind {
	; X86-NOBMI2-LABEL: clear_lowbits32_ic2_load:			; X86-NOBMI2-LABEL: clear_lowbits32_ic2_load:
	; X86-NOBMI2: # %bb.0:			; X86-NOBMI2: # %bb.0:
	; X86-NOBMI2-NEXT: movl {{[0-9]+}}(%esp), %eax			; X86-NOBMI2-NEXT: movl {{[0-9]+}}(%esp), %eax
	; X86-NOBMI2-NEXT: movl (%eax), %eax			; X86-NOBMI2-NEXT: movl (%eax), %eax
	; X86-NOBMI2-NEXT: movl $32, %ecx			; X86-NOBMI2-NEXT: xorl %ecx, %ecx
	; X86-NOBMI2-NEXT: subl {{[0-9]+}}(%esp), %ecx			; X86-NOBMI2-NEXT: subl {{[0-9]+}}(%esp), %ecx
	; X86-NOBMI2-NEXT: shrl %cl, %eax			; X86-NOBMI2-NEXT: shrl %cl, %eax
	; X86-NOBMI2-NEXT: # kill: def $cl killed $cl killed $ecx			; X86-NOBMI2-NEXT: # kill: def $cl killed $cl killed $ecx
	; X86-NOBMI2-NEXT: shll %cl, %eax			; X86-NOBMI2-NEXT: shll %cl, %eax
	; X86-NOBMI2-NEXT: retl			; X86-NOBMI2-NEXT: retl
	;			;
	; X86-BMI2-LABEL: clear_lowbits32_ic2_load:			; X86-BMI2-LABEL: clear_lowbits32_ic2_load:
	; X86-BMI2: # %bb.0:			; X86-BMI2: # %bb.0:
	; X86-BMI2-NEXT: movl {{[0-9]+}}(%esp), %eax			; X86-BMI2-NEXT: movl {{[0-9]+}}(%esp), %eax
	; X86-BMI2-NEXT: movl $32, %ecx			; X86-BMI2-NEXT: xorl %ecx, %ecx
	; X86-BMI2-NEXT: subl {{[0-9]+}}(%esp), %ecx			; X86-BMI2-NEXT: subl {{[0-9]+}}(%esp), %ecx
	; X86-BMI2-NEXT: shrxl %ecx, (%eax), %eax			; X86-BMI2-NEXT: shrxl %ecx, (%eax), %eax
	; X86-BMI2-NEXT: shlxl %ecx, %eax, %eax			; X86-BMI2-NEXT: shlxl %ecx, %eax, %eax
	; X86-BMI2-NEXT: retl			; X86-BMI2-NEXT: retl
	;			;
	; X64-NOBMI2-LABEL: clear_lowbits32_ic2_load:			; X64-NOBMI2-LABEL: clear_lowbits32_ic2_load:
	; X64-NOBMI2: # %bb.0:			; X64-NOBMI2: # %bb.0:
				; X64-NOBMI2-NEXT: movl %esi, %ecx
	; X64-NOBMI2-NEXT: movl (%rdi), %eax			; X64-NOBMI2-NEXT: movl (%rdi), %eax
	; X64-NOBMI2-NEXT: movl $32, %ecx			; X64-NOBMI2-NEXT: negl %ecx
	; X64-NOBMI2-NEXT: subl %esi, %ecx
	; X64-NOBMI2-NEXT: shrl %cl, %eax			; X64-NOBMI2-NEXT: shrl %cl, %eax
	; X64-NOBMI2-NEXT: # kill: def $cl killed $cl killed $ecx			; X64-NOBMI2-NEXT: # kill: def $cl killed $cl killed $ecx
	; X64-NOBMI2-NEXT: shll %cl, %eax			; X64-NOBMI2-NEXT: shll %cl, %eax
	; X64-NOBMI2-NEXT: retq			; X64-NOBMI2-NEXT: retq
	;			;
	; X64-BMI2-LABEL: clear_lowbits32_ic2_load:			; X64-BMI2-LABEL: clear_lowbits32_ic2_load:
	; X64-BMI2: # %bb.0:			; X64-BMI2: # %bb.0:
	; X64-BMI2-NEXT: movl $32, %eax			; X64-BMI2-NEXT: negl %esi
	; X64-BMI2-NEXT: subl %esi, %eax			; X64-BMI2-NEXT: shrxl %esi, (%rdi), %eax
	; X64-BMI2-NEXT: shrxl %eax, (%rdi), %ecx			; X64-BMI2-NEXT: shlxl %esi, %eax, %eax
	; X64-BMI2-NEXT: shlxl %eax, %ecx, %eax
	; X64-BMI2-NEXT: retq			; X64-BMI2-NEXT: retq
	%val = load i32, i32* %w			%val = load i32, i32* %w
	%numhighbits = sub i32 32, %numlowbits			%numhighbits = sub i32 32, %numlowbits
	%mask = shl i32 -1, %numhighbits			%mask = shl i32 -1, %numhighbits
	%masked = and i32 %mask, %val			%masked = and i32 %mask, %val
	ret i32 %masked			ret i32 %masked
	}			}

	define i32 @clear_lowbits32_ic3_load_indexzext(i32* %w, i8 %numlowbits) nounwind {			define i32 @clear_lowbits32_ic3_load_indexzext(i32* %w, i8 %numlowbits) nounwind {
	; X86-NOBMI2-LABEL: clear_lowbits32_ic3_load_indexzext:			; X86-NOBMI2-LABEL: clear_lowbits32_ic3_load_indexzext:
	; X86-NOBMI2: # %bb.0:			; X86-NOBMI2: # %bb.0:
	; X86-NOBMI2-NEXT: movl {{[0-9]+}}(%esp), %eax			; X86-NOBMI2-NEXT: movl {{[0-9]+}}(%esp), %eax
	; X86-NOBMI2-NEXT: movl (%eax), %eax			; X86-NOBMI2-NEXT: movl (%eax), %eax
	; X86-NOBMI2-NEXT: movb $32, %cl			; X86-NOBMI2-NEXT: xorl %ecx, %ecx
	; X86-NOBMI2-NEXT: subb {{[0-9]+}}(%esp), %cl			; X86-NOBMI2-NEXT: subb {{[0-9]+}}(%esp), %cl
	; X86-NOBMI2-NEXT: shrl %cl, %eax			; X86-NOBMI2-NEXT: shrl %cl, %eax
				; X86-NOBMI2-NEXT: # kill: def $cl killed $cl killed $ecx
	; X86-NOBMI2-NEXT: shll %cl, %eax			; X86-NOBMI2-NEXT: shll %cl, %eax
	; X86-NOBMI2-NEXT: retl			; X86-NOBMI2-NEXT: retl
	;			;
	; X86-BMI2-LABEL: clear_lowbits32_ic3_load_indexzext:			; X86-BMI2-LABEL: clear_lowbits32_ic3_load_indexzext:
	; X86-BMI2: # %bb.0:			; X86-BMI2: # %bb.0:
	; X86-BMI2-NEXT: movl {{[0-9]+}}(%esp), %eax			; X86-BMI2-NEXT: movl {{[0-9]+}}(%esp), %eax
	; X86-BMI2-NEXT: movb $32, %cl			; X86-BMI2-NEXT: xorl %ecx, %ecx
	; X86-BMI2-NEXT: subb {{[0-9]+}}(%esp), %cl			; X86-BMI2-NEXT: subb {{[0-9]+}}(%esp), %cl
	; X86-BMI2-NEXT: shrxl %ecx, (%eax), %eax			; X86-BMI2-NEXT: shrxl %ecx, (%eax), %eax
	; X86-BMI2-NEXT: shlxl %ecx, %eax, %eax			; X86-BMI2-NEXT: shlxl %ecx, %eax, %eax
	; X86-BMI2-NEXT: retl			; X86-BMI2-NEXT: retl
	;			;
	; X64-NOBMI2-LABEL: clear_lowbits32_ic3_load_indexzext:			; X64-NOBMI2-LABEL: clear_lowbits32_ic3_load_indexzext:
	; X64-NOBMI2: # %bb.0:			; X64-NOBMI2: # %bb.0:
				; X64-NOBMI2-NEXT: movl %esi, %ecx
	; X64-NOBMI2-NEXT: movl (%rdi), %eax			; X64-NOBMI2-NEXT: movl (%rdi), %eax
	; X64-NOBMI2-NEXT: movb $32, %cl			; X64-NOBMI2-NEXT: negb %cl
	; X64-NOBMI2-NEXT: subb %sil, %cl
	; X64-NOBMI2-NEXT: shrl %cl, %eax			; X64-NOBMI2-NEXT: shrl %cl, %eax
				; X64-NOBMI2-NEXT: # kill: def $cl killed $cl killed $ecx
	; X64-NOBMI2-NEXT: shll %cl, %eax			; X64-NOBMI2-NEXT: shll %cl, %eax
	; X64-NOBMI2-NEXT: retq			; X64-NOBMI2-NEXT: retq
	;			;
	; X64-BMI2-LABEL: clear_lowbits32_ic3_load_indexzext:			; X64-BMI2-LABEL: clear_lowbits32_ic3_load_indexzext:
	; X64-BMI2: # %bb.0:			; X64-BMI2: # %bb.0:
	; X64-BMI2-NEXT: movb $32, %al			; X64-BMI2-NEXT: negb %sil
	; X64-BMI2-NEXT: subb %sil, %al			; X64-BMI2-NEXT: shrxl %esi, (%rdi), %eax
	; X64-BMI2-NEXT: shrxl %eax, (%rdi), %ecx			; X64-BMI2-NEXT: shlxl %esi, %eax, %eax
	; X64-BMI2-NEXT: shlxl %eax, %ecx, %eax
	; X64-BMI2-NEXT: retq			; X64-BMI2-NEXT: retq
	%val = load i32, i32* %w			%val = load i32, i32* %w
	%numhighbits = sub i8 32, %numlowbits			%numhighbits = sub i8 32, %numlowbits
	%sh_prom = zext i8 %numhighbits to i32			%sh_prom = zext i8 %numhighbits to i32
	%mask = shl i32 -1, %sh_prom			%mask = shl i32 -1, %sh_prom
	%masked = and i32 %mask, %val			%masked = and i32 %mask, %val
	ret i32 %masked			ret i32 %masked
	}			}

	define i32 @clear_lowbits32_ic4_commutative(i32 %val, i32 %numlowbits) nounwind {			define i32 @clear_lowbits32_ic4_commutative(i32 %val, i32 %numlowbits) nounwind {
	; X86-NOBMI2-LABEL: clear_lowbits32_ic4_commutative:			; X86-NOBMI2-LABEL: clear_lowbits32_ic4_commutative:
	; X86-NOBMI2: # %bb.0:			; X86-NOBMI2: # %bb.0:
	; X86-NOBMI2-NEXT: movl {{[0-9]+}}(%esp), %eax			; X86-NOBMI2-NEXT: movl {{[0-9]+}}(%esp), %eax
	; X86-NOBMI2-NEXT: movl $32, %ecx			; X86-NOBMI2-NEXT: xorl %ecx, %ecx
	; X86-NOBMI2-NEXT: subl {{[0-9]+}}(%esp), %ecx			; X86-NOBMI2-NEXT: subl {{[0-9]+}}(%esp), %ecx
	; X86-NOBMI2-NEXT: shrl %cl, %eax			; X86-NOBMI2-NEXT: shrl %cl, %eax
	; X86-NOBMI2-NEXT: # kill: def $cl killed $cl killed $ecx			; X86-NOBMI2-NEXT: # kill: def $cl killed $cl killed $ecx
	; X86-NOBMI2-NEXT: shll %cl, %eax			; X86-NOBMI2-NEXT: shll %cl, %eax
	; X86-NOBMI2-NEXT: retl			; X86-NOBMI2-NEXT: retl
	;			;
	; X86-BMI2-LABEL: clear_lowbits32_ic4_commutative:			; X86-BMI2-LABEL: clear_lowbits32_ic4_commutative:
	; X86-BMI2: # %bb.0:			; X86-BMI2: # %bb.0:
	; X86-BMI2-NEXT: movl $32, %eax			; X86-BMI2-NEXT: xorl %eax, %eax
	; X86-BMI2-NEXT: subl {{[0-9]+}}(%esp), %eax			; X86-BMI2-NEXT: subl {{[0-9]+}}(%esp), %eax
	; X86-BMI2-NEXT: shrxl %eax, {{[0-9]+}}(%esp), %ecx			; X86-BMI2-NEXT: shrxl %eax, {{[0-9]+}}(%esp), %ecx
	; X86-BMI2-NEXT: shlxl %eax, %ecx, %eax			; X86-BMI2-NEXT: shlxl %eax, %ecx, %eax
	; X86-BMI2-NEXT: retl			; X86-BMI2-NEXT: retl
	;			;
	; X64-NOBMI2-LABEL: clear_lowbits32_ic4_commutative:			; X64-NOBMI2-LABEL: clear_lowbits32_ic4_commutative:
	; X64-NOBMI2: # %bb.0:			; X64-NOBMI2: # %bb.0:
	; X64-NOBMI2-NEXT: movl $32, %ecx			; X64-NOBMI2-NEXT: movl %esi, %ecx
	; X64-NOBMI2-NEXT: subl %esi, %ecx			; X64-NOBMI2-NEXT: negl %ecx
	; X64-NOBMI2-NEXT: shrl %cl, %edi			; X64-NOBMI2-NEXT: shrl %cl, %edi
	; X64-NOBMI2-NEXT: # kill: def $cl killed $cl killed $ecx			; X64-NOBMI2-NEXT: # kill: def $cl killed $cl killed $ecx
	; X64-NOBMI2-NEXT: shll %cl, %edi			; X64-NOBMI2-NEXT: shll %cl, %edi
	; X64-NOBMI2-NEXT: movl %edi, %eax			; X64-NOBMI2-NEXT: movl %edi, %eax
	; X64-NOBMI2-NEXT: retq			; X64-NOBMI2-NEXT: retq
	;			;
	; X64-BMI2-LABEL: clear_lowbits32_ic4_commutative:			; X64-BMI2-LABEL: clear_lowbits32_ic4_commutative:
	; X64-BMI2: # %bb.0:			; X64-BMI2: # %bb.0:
	; X64-BMI2-NEXT: movl $32, %eax			; X64-BMI2-NEXT: negl %esi
	; X64-BMI2-NEXT: subl %esi, %eax			; X64-BMI2-NEXT: shrxl %esi, %edi, %eax
	; X64-BMI2-NEXT: shrxl %eax, %edi, %ecx			; X64-BMI2-NEXT: shlxl %esi, %eax, %eax
	; X64-BMI2-NEXT: shlxl %eax, %ecx, %eax
	; X64-BMI2-NEXT: retq			; X64-BMI2-NEXT: retq
	%numhighbits = sub i32 32, %numlowbits			%numhighbits = sub i32 32, %numlowbits
	%mask = shl i32 -1, %numhighbits			%mask = shl i32 -1, %numhighbits
	%masked = and i32 %val, %mask ; swapped order			%masked = and i32 %val, %mask ; swapped order
	ret i32 %masked			ret i32 %masked
	}			}

	; 64-bit			; 64-bit
	Show All 31 Lines
	; X86-BMI2-NEXT: xorl %eax, %eax			; X86-BMI2-NEXT: xorl %eax, %eax
	; X86-BMI2-NEXT: .LBB31_2:			; X86-BMI2-NEXT: .LBB31_2:
	; X86-BMI2-NEXT: andl {{[0-9]+}}(%esp), %edx			; X86-BMI2-NEXT: andl {{[0-9]+}}(%esp), %edx
	; X86-BMI2-NEXT: andl {{[0-9]+}}(%esp), %eax			; X86-BMI2-NEXT: andl {{[0-9]+}}(%esp), %eax
	; X86-BMI2-NEXT: retl			; X86-BMI2-NEXT: retl
	;			;
	; X64-NOBMI2-LABEL: clear_lowbits64_ic0:			; X64-NOBMI2-LABEL: clear_lowbits64_ic0:
	; X64-NOBMI2: # %bb.0:			; X64-NOBMI2: # %bb.0:
	; X64-NOBMI2-NEXT: movl $64, %ecx			; X64-NOBMI2-NEXT: movq %rsi, %rcx
	; X64-NOBMI2-NEXT: subl %esi, %ecx			; X64-NOBMI2-NEXT: negl %ecx
	; X64-NOBMI2-NEXT: shrq %cl, %rdi			; X64-NOBMI2-NEXT: shrq %cl, %rdi
	; X64-NOBMI2-NEXT: # kill: def $cl killed $cl killed $ecx			; X64-NOBMI2-NEXT: # kill: def $cl killed $cl killed $rcx
	; X64-NOBMI2-NEXT: shlq %cl, %rdi			; X64-NOBMI2-NEXT: shlq %cl, %rdi
	; X64-NOBMI2-NEXT: movq %rdi, %rax			; X64-NOBMI2-NEXT: movq %rdi, %rax
	; X64-NOBMI2-NEXT: retq			; X64-NOBMI2-NEXT: retq
	;			;
	; X64-BMI2-LABEL: clear_lowbits64_ic0:			; X64-BMI2-LABEL: clear_lowbits64_ic0:
	; X64-BMI2: # %bb.0:			; X64-BMI2: # %bb.0:
	; X64-BMI2-NEXT: movl $64, %eax			; X64-BMI2-NEXT: negl %esi
	; X64-BMI2-NEXT: subl %esi, %eax			; X64-BMI2-NEXT: shrxq %rsi, %rdi, %rax
	; X64-BMI2-NEXT: shrxq %rax, %rdi, %rcx			; X64-BMI2-NEXT: shlxq %rsi, %rax, %rax
	; X64-BMI2-NEXT: shlxq %rax, %rcx, %rax
	; X64-BMI2-NEXT: retq			; X64-BMI2-NEXT: retq
	%numhighbits = sub i64 64, %numlowbits			%numhighbits = sub i64 64, %numlowbits
	%mask = shl i64 -1, %numhighbits			%mask = shl i64 -1, %numhighbits
	%masked = and i64 %mask, %val			%masked = and i64 %mask, %val
	ret i64 %masked			ret i64 %masked
	}			}

	define i64 @clear_lowbits64_ic1_indexzext(i64 %val, i8 %numlowbits) nounwind {			define i64 @clear_lowbits64_ic1_indexzext(i64 %val, i8 %numlowbits) nounwind {
	Show All 29 Lines
	; X86-BMI2-NEXT: xorl %eax, %eax			; X86-BMI2-NEXT: xorl %eax, %eax
	; X86-BMI2-NEXT: .LBB32_2:			; X86-BMI2-NEXT: .LBB32_2:
	; X86-BMI2-NEXT: andl {{[0-9]+}}(%esp), %edx			; X86-BMI2-NEXT: andl {{[0-9]+}}(%esp), %edx
	; X86-BMI2-NEXT: andl {{[0-9]+}}(%esp), %eax			; X86-BMI2-NEXT: andl {{[0-9]+}}(%esp), %eax
	; X86-BMI2-NEXT: retl			; X86-BMI2-NEXT: retl
	;			;
	; X64-NOBMI2-LABEL: clear_lowbits64_ic1_indexzext:			; X64-NOBMI2-LABEL: clear_lowbits64_ic1_indexzext:
	; X64-NOBMI2: # %bb.0:			; X64-NOBMI2: # %bb.0:
	; X64-NOBMI2-NEXT: movb $64, %cl			; X64-NOBMI2-NEXT: movl %esi, %ecx
	; X64-NOBMI2-NEXT: subb %sil, %cl			; X64-NOBMI2-NEXT: negb %cl
	; X64-NOBMI2-NEXT: shrq %cl, %rdi			; X64-NOBMI2-NEXT: shrq %cl, %rdi
				; X64-NOBMI2-NEXT: # kill: def $cl killed $cl killed $ecx
	; X64-NOBMI2-NEXT: shlq %cl, %rdi			; X64-NOBMI2-NEXT: shlq %cl, %rdi
	; X64-NOBMI2-NEXT: movq %rdi, %rax			; X64-NOBMI2-NEXT: movq %rdi, %rax
	; X64-NOBMI2-NEXT: retq			; X64-NOBMI2-NEXT: retq
	;			;
	; X64-BMI2-LABEL: clear_lowbits64_ic1_indexzext:			; X64-BMI2-LABEL: clear_lowbits64_ic1_indexzext:
	; X64-BMI2: # %bb.0:			; X64-BMI2: # %bb.0:
	; X64-BMI2-NEXT: movb $64, %al			; X64-BMI2-NEXT: # kill: def $esi killed $esi def $rsi
	; X64-BMI2-NEXT: subb %sil, %al			; X64-BMI2-NEXT: negb %sil
	; X64-BMI2-NEXT: shrxq %rax, %rdi, %rcx			; X64-BMI2-NEXT: shrxq %rsi, %rdi, %rax
	; X64-BMI2-NEXT: shlxq %rax, %rcx, %rax			; X64-BMI2-NEXT: shlxq %rsi, %rax, %rax
	; X64-BMI2-NEXT: retq			; X64-BMI2-NEXT: retq
	%numhighbits = sub i8 64, %numlowbits			%numhighbits = sub i8 64, %numlowbits
	%sh_prom = zext i8 %numhighbits to i64			%sh_prom = zext i8 %numhighbits to i64
	%mask = shl i64 -1, %sh_prom			%mask = shl i64 -1, %sh_prom
	%masked = and i64 %mask, %val			%masked = and i64 %mask, %val
	ret i64 %masked			ret i64 %masked
	}			}

	Show All 36 Lines
	; X86-BMI2-NEXT: .LBB33_2:			; X86-BMI2-NEXT: .LBB33_2:
	; X86-BMI2-NEXT: andl 4(%esi), %edx			; X86-BMI2-NEXT: andl 4(%esi), %edx
	; X86-BMI2-NEXT: andl (%esi), %eax			; X86-BMI2-NEXT: andl (%esi), %eax
	; X86-BMI2-NEXT: popl %esi			; X86-BMI2-NEXT: popl %esi
	; X86-BMI2-NEXT: retl			; X86-BMI2-NEXT: retl
	;			;
	; X64-NOBMI2-LABEL: clear_lowbits64_ic2_load:			; X64-NOBMI2-LABEL: clear_lowbits64_ic2_load:
	; X64-NOBMI2: # %bb.0:			; X64-NOBMI2: # %bb.0:
				; X64-NOBMI2-NEXT: movq %rsi, %rcx
	; X64-NOBMI2-NEXT: movq (%rdi), %rax			; X64-NOBMI2-NEXT: movq (%rdi), %rax
	; X64-NOBMI2-NEXT: movl $64, %ecx			; X64-NOBMI2-NEXT: negl %ecx
	; X64-NOBMI2-NEXT: subl %esi, %ecx
	; X64-NOBMI2-NEXT: shrq %cl, %rax			; X64-NOBMI2-NEXT: shrq %cl, %rax
	; X64-NOBMI2-NEXT: # kill: def $cl killed $cl killed $ecx			; X64-NOBMI2-NEXT: # kill: def $cl killed $cl killed $rcx
	; X64-NOBMI2-NEXT: shlq %cl, %rax			; X64-NOBMI2-NEXT: shlq %cl, %rax
	; X64-NOBMI2-NEXT: retq			; X64-NOBMI2-NEXT: retq
	;			;
	; X64-BMI2-LABEL: clear_lowbits64_ic2_load:			; X64-BMI2-LABEL: clear_lowbits64_ic2_load:
	; X64-BMI2: # %bb.0:			; X64-BMI2: # %bb.0:
	; X64-BMI2-NEXT: movl $64, %eax			; X64-BMI2-NEXT: negl %esi
	; X64-BMI2-NEXT: subl %esi, %eax			; X64-BMI2-NEXT: shrxq %rsi, (%rdi), %rax
	; X64-BMI2-NEXT: shrxq %rax, (%rdi), %rcx			; X64-BMI2-NEXT: shlxq %rsi, %rax, %rax
	; X64-BMI2-NEXT: shlxq %rax, %rcx, %rax
	; X64-BMI2-NEXT: retq			; X64-BMI2-NEXT: retq
	%val = load i64, i64* %w			%val = load i64, i64* %w
	%numhighbits = sub i64 64, %numlowbits			%numhighbits = sub i64 64, %numlowbits
	%mask = shl i64 -1, %numhighbits			%mask = shl i64 -1, %numhighbits
	%masked = and i64 %mask, %val			%masked = and i64 %mask, %val
	ret i64 %masked			ret i64 %masked
	}			}

	Show All 36 Lines
	; X86-BMI2-NEXT: .LBB34_2:			; X86-BMI2-NEXT: .LBB34_2:
	; X86-BMI2-NEXT: andl 4(%esi), %edx			; X86-BMI2-NEXT: andl 4(%esi), %edx
	; X86-BMI2-NEXT: andl (%esi), %eax			; X86-BMI2-NEXT: andl (%esi), %eax
	; X86-BMI2-NEXT: popl %esi			; X86-BMI2-NEXT: popl %esi
	; X86-BMI2-NEXT: retl			; X86-BMI2-NEXT: retl
	;			;
	; X64-NOBMI2-LABEL: clear_lowbits64_ic3_load_indexzext:			; X64-NOBMI2-LABEL: clear_lowbits64_ic3_load_indexzext:
	; X64-NOBMI2: # %bb.0:			; X64-NOBMI2: # %bb.0:
				; X64-NOBMI2-NEXT: movl %esi, %ecx
	; X64-NOBMI2-NEXT: movq (%rdi), %rax			; X64-NOBMI2-NEXT: movq (%rdi), %rax
	; X64-NOBMI2-NEXT: movb $64, %cl			; X64-NOBMI2-NEXT: negb %cl
	; X64-NOBMI2-NEXT: subb %sil, %cl
	; X64-NOBMI2-NEXT: shrq %cl, %rax			; X64-NOBMI2-NEXT: shrq %cl, %rax
				; X64-NOBMI2-NEXT: # kill: def $cl killed $cl killed $ecx
	; X64-NOBMI2-NEXT: shlq %cl, %rax			; X64-NOBMI2-NEXT: shlq %cl, %rax
	; X64-NOBMI2-NEXT: retq			; X64-NOBMI2-NEXT: retq
	;			;
	; X64-BMI2-LABEL: clear_lowbits64_ic3_load_indexzext:			; X64-BMI2-LABEL: clear_lowbits64_ic3_load_indexzext:
	; X64-BMI2: # %bb.0:			; X64-BMI2: # %bb.0:
	; X64-BMI2-NEXT: movb $64, %al			; X64-BMI2-NEXT: # kill: def $esi killed $esi def $rsi
	; X64-BMI2-NEXT: subb %sil, %al			; X64-BMI2-NEXT: negb %sil
	; X64-BMI2-NEXT: shrxq %rax, (%rdi), %rcx			; X64-BMI2-NEXT: shrxq %rsi, (%rdi), %rax
	; X64-BMI2-NEXT: shlxq %rax, %rcx, %rax			; X64-BMI2-NEXT: shlxq %rsi, %rax, %rax
	; X64-BMI2-NEXT: retq			; X64-BMI2-NEXT: retq
	%val = load i64, i64* %w			%val = load i64, i64* %w
	%numhighbits = sub i8 64, %numlowbits			%numhighbits = sub i8 64, %numlowbits
	%sh_prom = zext i8 %numhighbits to i64			%sh_prom = zext i8 %numhighbits to i64
	%mask = shl i64 -1, %sh_prom			%mask = shl i64 -1, %sh_prom
	%masked = and i64 %mask, %val			%masked = and i64 %mask, %val
	ret i64 %masked			ret i64 %masked
	}			}
	Show All 31 Lines
	; X86-BMI2-NEXT: xorl %eax, %eax			; X86-BMI2-NEXT: xorl %eax, %eax
	; X86-BMI2-NEXT: .LBB35_2:			; X86-BMI2-NEXT: .LBB35_2:
	; X86-BMI2-NEXT: andl {{[0-9]+}}(%esp), %edx			; X86-BMI2-NEXT: andl {{[0-9]+}}(%esp), %edx
	; X86-BMI2-NEXT: andl {{[0-9]+}}(%esp), %eax			; X86-BMI2-NEXT: andl {{[0-9]+}}(%esp), %eax
	; X86-BMI2-NEXT: retl			; X86-BMI2-NEXT: retl
	;			;
	; X64-NOBMI2-LABEL: clear_lowbits64_ic4_commutative:			; X64-NOBMI2-LABEL: clear_lowbits64_ic4_commutative:
	; X64-NOBMI2: # %bb.0:			; X64-NOBMI2: # %bb.0:
	; X64-NOBMI2-NEXT: movl $64, %ecx			; X64-NOBMI2-NEXT: movq %rsi, %rcx
	; X64-NOBMI2-NEXT: subl %esi, %ecx			; X64-NOBMI2-NEXT: negl %ecx
	; X64-NOBMI2-NEXT: shrq %cl, %rdi			; X64-NOBMI2-NEXT: shrq %cl, %rdi
	; X64-NOBMI2-NEXT: # kill: def $cl killed $cl killed $ecx			; X64-NOBMI2-NEXT: # kill: def $cl killed $cl killed $rcx
	; X64-NOBMI2-NEXT: shlq %cl, %rdi			; X64-NOBMI2-NEXT: shlq %cl, %rdi
	; X64-NOBMI2-NEXT: movq %rdi, %rax			; X64-NOBMI2-NEXT: movq %rdi, %rax
	; X64-NOBMI2-NEXT: retq			; X64-NOBMI2-NEXT: retq
	;			;
	; X64-BMI2-LABEL: clear_lowbits64_ic4_commutative:			; X64-BMI2-LABEL: clear_lowbits64_ic4_commutative:
	; X64-BMI2: # %bb.0:			; X64-BMI2: # %bb.0:
	; X64-BMI2-NEXT: movl $64, %eax			; X64-BMI2-NEXT: negl %esi
	; X64-BMI2-NEXT: subl %esi, %eax			; X64-BMI2-NEXT: shrxq %rsi, %rdi, %rax
	; X64-BMI2-NEXT: shrxq %rax, %rdi, %rcx			; X64-BMI2-NEXT: shlxq %rsi, %rax, %rax
	; X64-BMI2-NEXT: shlxq %rax, %rcx, %rax
	; X64-BMI2-NEXT: retq			; X64-BMI2-NEXT: retq
	%numhighbits = sub i64 64, %numlowbits			%numhighbits = sub i64 64, %numlowbits
	%mask = shl i64 -1, %numhighbits			%mask = shl i64 -1, %numhighbits
	%masked = and i64 %val, %mask ; swapped order			%masked = and i64 %val, %mask ; swapped order
	ret i64 %masked			ret i64 %masked
	}			}

	; ---------------------------------------------------------------------------- ;			; ---------------------------------------------------------------------------- ;
	▲ Show 20 Lines • Show All 176 Lines • Show Last 20 Lines

test/CodeGen/X86/extract-lowbits.ll

	; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py			; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
	; RUN: llc -mtriple=i686-unknown-linux-gnu -mattr=-bmi,-tbm,-bmi2 < %s \| FileCheck %s --check-prefixes=CHECK,X86,NOBMI,X86-NOBMI			; RUN: llc -mtriple=i686-unknown-linux-gnu -mattr=-bmi,-tbm,-bmi2 < %s \| FileCheck %s --check-prefixes=CHECK,X86,NOBMI,X86-NOBMI
	; RUN: llc -mtriple=i686-unknown-linux-gnu -mattr=+bmi,-tbm,-bmi2 < %s \| FileCheck %s --check-prefixes=CHECK,X86,BMI1,X86-BMI1			; RUN: llc -mtriple=i686-unknown-linux-gnu -mattr=+bmi,-tbm,-bmi2 < %s \| FileCheck %s --check-prefixes=CHECK,X86,BMI1,X86-BMI1
	; RUN: llc -mtriple=i686-unknown-linux-gnu -mattr=+bmi,+tbm,-bmi2 < %s \| FileCheck %s --check-prefixes=CHECK,X86,BMI1,X86-BMI1,BMI1TBM,X86-BMI1TBM			; RUN: llc -mtriple=i686-unknown-linux-gnu -mattr=+bmi,+tbm,-bmi2 < %s \| FileCheck %s --check-prefixes=CHECK,X86,BMI1,X86-BMI1,BMI1TBM,X86-BMI1TBM
	; RUN: llc -mtriple=i686-unknown-linux-gnu -mattr=+bmi,+tbm,+bmi2 < %s \| FileCheck %s --check-prefixes=CHECK,X86,BMI1,X86-BMI1,BMI1BMI2,X86-BMI1BMI2,BMI1TBM,X86-BMI1TBM,BMI1TBMBMI2,X86-BMI1TBMBMI2			; RUN: llc -mtriple=i686-unknown-linux-gnu -mattr=+bmi,+tbm,+bmi2 < %s \| FileCheck %s --check-prefixes=CHECK,X86,BMI1,X86-BMI1,BMI1BMI2,X86-BMI1BMI2,BMI1TBM,X86-BMI1TBM,BMI1TBMBMI2,X86-BMI1TBMBMI2
	; RUN: llc -mtriple=i686-unknown-linux-gnu -mattr=+bmi,-tbm,+bmi2 < %s \| FileCheck %s --check-prefixes=CHECK,X86,BMI1,X86-BMI1,BMI1BMI2,X86-BMI1BMI2,BMI1NOTBMBMI2,X86-BMI1NOTBMBMI2			; RUN: llc -mtriple=i686-unknown-linux-gnu -mattr=+bmi,-tbm,+bmi2 < %s \| FileCheck %s --check-prefixes=CHECK,X86,BMI1,X86-BMI1,BMI1BMI2,X86-BMI1BMI2,BMI1NOTBMBMI2,X86-BMI1NOTBMBMI2
	; RUN: llc -mtriple=x86_64-unknown-linux-gnu -mattr=-bmi,-tbm,-bmi2 < %s \| FileCheck %s --check-prefixes=CHECK,X64,NOBMI,X64-NOBMI			; RUN: llc -mtriple=x86_64-unknown-linux-gnu -mattr=-bmi,-tbm,-bmi2 < %s \| FileCheck %s --check-prefixes=CHECK,X64,NOBMI,X64-NOBMI
	; RUN: llc -mtriple=x86_64-unknown-linux-gnu -mattr=+bmi,-tbm,-bmi2 < %s \| FileCheck %s --check-prefixes=CHECK,X64,BMI1,X64-BMI1			; RUN: llc -mtriple=x86_64-unknown-linux-gnu -mattr=+bmi,-tbm,-bmi2 < %s \| FileCheck %s --check-prefixes=CHECK,X64,BMI1,X64-BMI1
	; RUN: llc -mtriple=x86_64-unknown-linux-gnu -mattr=+bmi,+tbm,-bmi2 < %s \| FileCheck %s --check-prefixes=CHECK,X64,BMI1,X64-BMI1,BMI1TBM,X64-BMI1TBM			; RUN: llc -mtriple=x86_64-unknown-linux-gnu -mattr=+bmi,+tbm,-bmi2 < %s \| FileCheck %s --check-prefixes=CHECK,X64,BMI1,X64-BMI1,BMI1TBM,X64-BMI1TBM
	; RUN: llc -mtriple=x86_64-unknown-linux-gnu -mattr=+bmi,+tbm,+bmi2 < %s \| FileCheck %s --check-prefixes=CHECK,X64,BMI1,X64-BMI1,BMI1BMI2,X64-BMI1BMI2,BMI1TBM,X64-BMI1TBM,BMI1TBMBMI2,X64-BMI1TBMBMI2			; RUN: llc -mtriple=x86_64-unknown-linux-gnu -mattr=+bmi,+tbm,+bmi2 < %s \| FileCheck %s --check-prefixes=CHECK,X64,BMI1,X64-BMI1,BMI1BMI2,X64-BMI1BMI2,BMI1TBM,X64-BMI1TBM,BMI1TBMBMI2,X64-BMI1TBMBMI2
	; RUN: llc -mtriple=x86_64-unknown-linux-gnu -mattr=+bmi,-tbm,+bmi2 < %s \| FileCheck %s --check-prefixes=CHECK,X64,BMI1,X64-BMI1,BMI1BMI2,X64-BMI1BMI2,BMI1NOTBMBMI2,X64-BMI1NOTBMBMI2			; RUN: llc -mtriple=x86_64-unknown-linux-gnu -mattr=+bmi,-tbm,+bmi2 < %s \| FileCheck %s --check-prefixes=CHECK,X64,BMI1,X64-BMI1,BMI1BMI2,X64-BMI1BMI2,BMI1NOTBMBMI2,X64-BMI1NOTBMBMI2
				lebedev.ri (inline comment; unsubmitted, not done): I'll commit the change to this file from D48490 tomorrow. That will expose more fold possibilities here.

	; Please keep in sync with test/CodeGen/AArch64/extract-lowbits.ll			; Please keep in sync with test/CodeGen/AArch64/extract-lowbits.ll

	; https://bugs.llvm.org/show_bug.cgi?id=36419			; https://bugs.llvm.org/show_bug.cgi?id=36419
	; https://bugs.llvm.org/show_bug.cgi?id=37603			; https://bugs.llvm.org/show_bug.cgi?id=37603
	; https://bugs.llvm.org/show_bug.cgi?id=37610			; https://bugs.llvm.org/show_bug.cgi?id=37610

	; Patterns:			; Patterns:
	▲ Show 20 Lines • Show All 991 Lines • ▼ Show 20 Lines
	; ---------------------------------------------------------------------------- ;			; ---------------------------------------------------------------------------- ;
	; Pattern c. 32-bit			; Pattern c. 32-bit
	; ---------------------------------------------------------------------------- ;			; ---------------------------------------------------------------------------- ;

	define i32 @bzhi32_c0(i32 %val, i32 %numlowbits) nounwind {			define i32 @bzhi32_c0(i32 %val, i32 %numlowbits) nounwind {
	; X86-NOBMI-LABEL: bzhi32_c0:			; X86-NOBMI-LABEL: bzhi32_c0:
	; X86-NOBMI: # %bb.0:			; X86-NOBMI: # %bb.0:
	; X86-NOBMI-NEXT: movl {{[0-9]+}}(%esp), %eax			; X86-NOBMI-NEXT: movl {{[0-9]+}}(%esp), %eax
	; X86-NOBMI-NEXT: movl $32, %ecx			; X86-NOBMI-NEXT: xorl %ecx, %ecx
	; X86-NOBMI-NEXT: subl {{[0-9]+}}(%esp), %ecx			; X86-NOBMI-NEXT: subl {{[0-9]+}}(%esp), %ecx
	; X86-NOBMI-NEXT: shll %cl, %eax			; X86-NOBMI-NEXT: shll %cl, %eax
	; X86-NOBMI-NEXT: # kill: def $cl killed $cl killed $ecx			; X86-NOBMI-NEXT: # kill: def $cl killed $cl killed $ecx
	; X86-NOBMI-NEXT: shrl %cl, %eax			; X86-NOBMI-NEXT: shrl %cl, %eax
	; X86-NOBMI-NEXT: retl			; X86-NOBMI-NEXT: retl
	;			;
	; X86-BMI1BMI2-LABEL: bzhi32_c0:			; X86-BMI1BMI2-LABEL: bzhi32_c0:
	; X86-BMI1BMI2: # %bb.0:			; X86-BMI1BMI2: # %bb.0:
	; X86-BMI1BMI2-NEXT: movl {{[0-9]+}}(%esp), %eax			; X86-BMI1BMI2-NEXT: movl {{[0-9]+}}(%esp), %eax
	; X86-BMI1BMI2-NEXT: bzhil %eax, {{[0-9]+}}(%esp), %eax			; X86-BMI1BMI2-NEXT: bzhil %eax, {{[0-9]+}}(%esp), %eax
	; X86-BMI1BMI2-NEXT: retl			; X86-BMI1BMI2-NEXT: retl
	;			;
	; X64-NOBMI-LABEL: bzhi32_c0:			; X64-NOBMI-LABEL: bzhi32_c0:
	; X64-NOBMI: # %bb.0:			; X64-NOBMI: # %bb.0:
	; X64-NOBMI-NEXT: movl $32, %ecx			; X64-NOBMI-NEXT: movl %esi, %ecx
	; X64-NOBMI-NEXT: subl %esi, %ecx			; X64-NOBMI-NEXT: negl %ecx
	; X64-NOBMI-NEXT: shll %cl, %edi			; X64-NOBMI-NEXT: shll %cl, %edi
	; X64-NOBMI-NEXT: # kill: def $cl killed $cl killed $ecx			; X64-NOBMI-NEXT: # kill: def $cl killed $cl killed $ecx
	; X64-NOBMI-NEXT: shrl %cl, %edi			; X64-NOBMI-NEXT: shrl %cl, %edi
	; X64-NOBMI-NEXT: movl %edi, %eax			; X64-NOBMI-NEXT: movl %edi, %eax
	; X64-NOBMI-NEXT: retq			; X64-NOBMI-NEXT: retq
	;			;
	; X64-BMI1BMI2-LABEL: bzhi32_c0:			; X64-BMI1BMI2-LABEL: bzhi32_c0:
	; X64-BMI1BMI2: # %bb.0:			; X64-BMI1BMI2: # %bb.0:
	; X64-BMI1BMI2-NEXT: bzhil %esi, %edi, %eax			; X64-BMI1BMI2-NEXT: bzhil %esi, %edi, %eax
	; X64-BMI1BMI2-NEXT: retq			; X64-BMI1BMI2-NEXT: retq
	%numhighbits = sub i32 32, %numlowbits			%numhighbits = sub i32 32, %numlowbits
	%mask = lshr i32 -1, %numhighbits			%mask = lshr i32 -1, %numhighbits
	%masked = and i32 %mask, %val			%masked = and i32 %mask, %val
	ret i32 %masked			ret i32 %masked
	}			}

	define i32 @bzhi32_c1_indexzext(i32 %val, i8 %numlowbits) nounwind {			define i32 @bzhi32_c1_indexzext(i32 %val, i8 %numlowbits) nounwind {
	; X86-NOBMI-LABEL: bzhi32_c1_indexzext:			; X86-NOBMI-LABEL: bzhi32_c1_indexzext:
	; X86-NOBMI: # %bb.0:			; X86-NOBMI: # %bb.0:
	; X86-NOBMI-NEXT: movl {{[0-9]+}}(%esp), %eax			; X86-NOBMI-NEXT: movl {{[0-9]+}}(%esp), %eax
	; X86-NOBMI-NEXT: movb $32, %cl			; X86-NOBMI-NEXT: xorl %ecx, %ecx
	; X86-NOBMI-NEXT: subb {{[0-9]+}}(%esp), %cl			; X86-NOBMI-NEXT: subb {{[0-9]+}}(%esp), %cl
	; X86-NOBMI-NEXT: shll %cl, %eax			; X86-NOBMI-NEXT: shll %cl, %eax
				; X86-NOBMI-NEXT: # kill: def $cl killed $cl killed $ecx
	; X86-NOBMI-NEXT: shrl %cl, %eax			; X86-NOBMI-NEXT: shrl %cl, %eax
	; X86-NOBMI-NEXT: retl			; X86-NOBMI-NEXT: retl
	;			;
	; X86-BMI1BMI2-LABEL: bzhi32_c1_indexzext:			; X86-BMI1BMI2-LABEL: bzhi32_c1_indexzext:
	; X86-BMI1BMI2: # %bb.0:			; X86-BMI1BMI2: # %bb.0:
	; X86-BMI1BMI2-NEXT: movb {{[0-9]+}}(%esp), %al			; X86-BMI1BMI2-NEXT: movb {{[0-9]+}}(%esp), %al
	; X86-BMI1BMI2-NEXT: bzhil %eax, {{[0-9]+}}(%esp), %eax			; X86-BMI1BMI2-NEXT: bzhil %eax, {{[0-9]+}}(%esp), %eax
	; X86-BMI1BMI2-NEXT: retl			; X86-BMI1BMI2-NEXT: retl
	;			;
	; X64-NOBMI-LABEL: bzhi32_c1_indexzext:			; X64-NOBMI-LABEL: bzhi32_c1_indexzext:
	; X64-NOBMI: # %bb.0:			; X64-NOBMI: # %bb.0:
	; X64-NOBMI-NEXT: movb $32, %cl			; X64-NOBMI-NEXT: movl %esi, %ecx
	; X64-NOBMI-NEXT: subb %sil, %cl			; X64-NOBMI-NEXT: negb %cl
	; X64-NOBMI-NEXT: shll %cl, %edi			; X64-NOBMI-NEXT: shll %cl, %edi
				; X64-NOBMI-NEXT: # kill: def $cl killed $cl killed $ecx
	; X64-NOBMI-NEXT: shrl %cl, %edi			; X64-NOBMI-NEXT: shrl %cl, %edi
	; X64-NOBMI-NEXT: movl %edi, %eax			; X64-NOBMI-NEXT: movl %edi, %eax
	; X64-NOBMI-NEXT: retq			; X64-NOBMI-NEXT: retq
	;			;
	; X64-BMI1BMI2-LABEL: bzhi32_c1_indexzext:			; X64-BMI1BMI2-LABEL: bzhi32_c1_indexzext:
	; X64-BMI1BMI2: # %bb.0:			; X64-BMI1BMI2: # %bb.0:
	; X64-BMI1BMI2-NEXT: bzhil %esi, %edi, %eax			; X64-BMI1BMI2-NEXT: bzhil %esi, %edi, %eax
	; X64-BMI1BMI2-NEXT: retq			; X64-BMI1BMI2-NEXT: retq
	%numhighbits = sub i8 32, %numlowbits			%numhighbits = sub i8 32, %numlowbits
	%sh_prom = zext i8 %numhighbits to i32			%sh_prom = zext i8 %numhighbits to i32
	%mask = lshr i32 -1, %sh_prom			%mask = lshr i32 -1, %sh_prom
	%masked = and i32 %mask, %val			%masked = and i32 %mask, %val
	ret i32 %masked			ret i32 %masked
	}			}

	define i32 @bzhi32_c2_load(i32* %w, i32 %numlowbits) nounwind {			define i32 @bzhi32_c2_load(i32* %w, i32 %numlowbits) nounwind {
	; X86-NOBMI-LABEL: bzhi32_c2_load:			; X86-NOBMI-LABEL: bzhi32_c2_load:
	; X86-NOBMI: # %bb.0:			; X86-NOBMI: # %bb.0:
	; X86-NOBMI-NEXT: movl {{[0-9]+}}(%esp), %eax			; X86-NOBMI-NEXT: movl {{[0-9]+}}(%esp), %eax
	; X86-NOBMI-NEXT: movl (%eax), %eax			; X86-NOBMI-NEXT: movl (%eax), %eax
	; X86-NOBMI-NEXT: movl $32, %ecx			; X86-NOBMI-NEXT: xorl %ecx, %ecx
	; X86-NOBMI-NEXT: subl {{[0-9]+}}(%esp), %ecx			; X86-NOBMI-NEXT: subl {{[0-9]+}}(%esp), %ecx
	; X86-NOBMI-NEXT: shll %cl, %eax			; X86-NOBMI-NEXT: shll %cl, %eax
	; X86-NOBMI-NEXT: # kill: def $cl killed $cl killed $ecx			; X86-NOBMI-NEXT: # kill: def $cl killed $cl killed $ecx
	; X86-NOBMI-NEXT: shrl %cl, %eax			; X86-NOBMI-NEXT: shrl %cl, %eax
	; X86-NOBMI-NEXT: retl			; X86-NOBMI-NEXT: retl
	;			;
	; X86-BMI1BMI2-LABEL: bzhi32_c2_load:			; X86-BMI1BMI2-LABEL: bzhi32_c2_load:
	; X86-BMI1BMI2: # %bb.0:			; X86-BMI1BMI2: # %bb.0:
	; X86-BMI1BMI2-NEXT: movl {{[0-9]+}}(%esp), %eax			; X86-BMI1BMI2-NEXT: movl {{[0-9]+}}(%esp), %eax
	; X86-BMI1BMI2-NEXT: movl {{[0-9]+}}(%esp), %ecx			; X86-BMI1BMI2-NEXT: movl {{[0-9]+}}(%esp), %ecx
	; X86-BMI1BMI2-NEXT: bzhil %eax, (%ecx), %eax			; X86-BMI1BMI2-NEXT: bzhil %eax, (%ecx), %eax
	; X86-BMI1BMI2-NEXT: retl			; X86-BMI1BMI2-NEXT: retl
	;			;
	; X64-NOBMI-LABEL: bzhi32_c2_load:			; X64-NOBMI-LABEL: bzhi32_c2_load:
	; X64-NOBMI: # %bb.0:			; X64-NOBMI: # %bb.0:
				; X64-NOBMI-NEXT: movl %esi, %ecx
	; X64-NOBMI-NEXT: movl (%rdi), %eax			; X64-NOBMI-NEXT: movl (%rdi), %eax
	; X64-NOBMI-NEXT: movl $32, %ecx			; X64-NOBMI-NEXT: negl %ecx
	; X64-NOBMI-NEXT: subl %esi, %ecx
	; X64-NOBMI-NEXT: shll %cl, %eax			; X64-NOBMI-NEXT: shll %cl, %eax
	; X64-NOBMI-NEXT: # kill: def $cl killed $cl killed $ecx			; X64-NOBMI-NEXT: # kill: def $cl killed $cl killed $ecx
	; X64-NOBMI-NEXT: shrl %cl, %eax			; X64-NOBMI-NEXT: shrl %cl, %eax
	; X64-NOBMI-NEXT: retq			; X64-NOBMI-NEXT: retq
	;			;
	; X64-BMI1BMI2-LABEL: bzhi32_c2_load:			; X64-BMI1BMI2-LABEL: bzhi32_c2_load:
	; X64-BMI1BMI2: # %bb.0:			; X64-BMI1BMI2: # %bb.0:
	; X64-BMI1BMI2-NEXT: bzhil %esi, (%rdi), %eax			; X64-BMI1BMI2-NEXT: bzhil %esi, (%rdi), %eax
	; X64-BMI1BMI2-NEXT: retq			; X64-BMI1BMI2-NEXT: retq
	%val = load i32, i32* %w			%val = load i32, i32* %w
	%numhighbits = sub i32 32, %numlowbits			%numhighbits = sub i32 32, %numlowbits
	%mask = lshr i32 -1, %numhighbits			%mask = lshr i32 -1, %numhighbits
	%masked = and i32 %mask, %val			%masked = and i32 %mask, %val
	ret i32 %masked			ret i32 %masked
	}			}

	define i32 @bzhi32_c3_load_indexzext(i32* %w, i8 %numlowbits) nounwind {			define i32 @bzhi32_c3_load_indexzext(i32* %w, i8 %numlowbits) nounwind {
	; X86-NOBMI-LABEL: bzhi32_c3_load_indexzext:			; X86-NOBMI-LABEL: bzhi32_c3_load_indexzext:
	; X86-NOBMI: # %bb.0:			; X86-NOBMI: # %bb.0:
	; X86-NOBMI-NEXT: movl {{[0-9]+}}(%esp), %eax			; X86-NOBMI-NEXT: movl {{[0-9]+}}(%esp), %eax
	; X86-NOBMI-NEXT: movl (%eax), %eax			; X86-NOBMI-NEXT: movl (%eax), %eax
	; X86-NOBMI-NEXT: movb $32, %cl			; X86-NOBMI-NEXT: xorl %ecx, %ecx
	; X86-NOBMI-NEXT: subb {{[0-9]+}}(%esp), %cl			; X86-NOBMI-NEXT: subb {{[0-9]+}}(%esp), %cl
	; X86-NOBMI-NEXT: shll %cl, %eax			; X86-NOBMI-NEXT: shll %cl, %eax
				; X86-NOBMI-NEXT: # kill: def $cl killed $cl killed $ecx
	; X86-NOBMI-NEXT: shrl %cl, %eax			; X86-NOBMI-NEXT: shrl %cl, %eax
	; X86-NOBMI-NEXT: retl			; X86-NOBMI-NEXT: retl
	;			;
	; X86-BMI1BMI2-LABEL: bzhi32_c3_load_indexzext:			; X86-BMI1BMI2-LABEL: bzhi32_c3_load_indexzext:
	; X86-BMI1BMI2: # %bb.0:			; X86-BMI1BMI2: # %bb.0:
	; X86-BMI1BMI2-NEXT: movl {{[0-9]+}}(%esp), %eax			; X86-BMI1BMI2-NEXT: movl {{[0-9]+}}(%esp), %eax
	; X86-BMI1BMI2-NEXT: movb {{[0-9]+}}(%esp), %cl			; X86-BMI1BMI2-NEXT: movb {{[0-9]+}}(%esp), %cl
	; X86-BMI1BMI2-NEXT: bzhil %ecx, (%eax), %eax			; X86-BMI1BMI2-NEXT: bzhil %ecx, (%eax), %eax
	; X86-BMI1BMI2-NEXT: retl			; X86-BMI1BMI2-NEXT: retl
	;			;
	; X64-NOBMI-LABEL: bzhi32_c3_load_indexzext:			; X64-NOBMI-LABEL: bzhi32_c3_load_indexzext:
	; X64-NOBMI: # %bb.0:			; X64-NOBMI: # %bb.0:
				; X64-NOBMI-NEXT: movl %esi, %ecx
	; X64-NOBMI-NEXT: movl (%rdi), %eax			; X64-NOBMI-NEXT: movl (%rdi), %eax
	; X64-NOBMI-NEXT: movb $32, %cl			; X64-NOBMI-NEXT: negb %cl
	; X64-NOBMI-NEXT: subb %sil, %cl
	; X64-NOBMI-NEXT: shll %cl, %eax			; X64-NOBMI-NEXT: shll %cl, %eax
				; X64-NOBMI-NEXT: # kill: def $cl killed $cl killed $ecx
	; X64-NOBMI-NEXT: shrl %cl, %eax			; X64-NOBMI-NEXT: shrl %cl, %eax
	; X64-NOBMI-NEXT: retq			; X64-NOBMI-NEXT: retq
	;			;
	; X64-BMI1BMI2-LABEL: bzhi32_c3_load_indexzext:			; X64-BMI1BMI2-LABEL: bzhi32_c3_load_indexzext:
	; X64-BMI1BMI2: # %bb.0:			; X64-BMI1BMI2: # %bb.0:
	; X64-BMI1BMI2-NEXT: bzhil %esi, (%rdi), %eax			; X64-BMI1BMI2-NEXT: bzhil %esi, (%rdi), %eax
	; X64-BMI1BMI2-NEXT: retq			; X64-BMI1BMI2-NEXT: retq
	%val = load i32, i32* %w			%val = load i32, i32* %w
	%numhighbits = sub i8 32, %numlowbits			%numhighbits = sub i8 32, %numlowbits
	%sh_prom = zext i8 %numhighbits to i32			%sh_prom = zext i8 %numhighbits to i32
	%mask = lshr i32 -1, %sh_prom			%mask = lshr i32 -1, %sh_prom
	%masked = and i32 %mask, %val			%masked = and i32 %mask, %val
	ret i32 %masked			ret i32 %masked
	}			}

	define i32 @bzhi32_c4_commutative(i32 %val, i32 %numlowbits) nounwind {			define i32 @bzhi32_c4_commutative(i32 %val, i32 %numlowbits) nounwind {
	; X86-NOBMI-LABEL: bzhi32_c4_commutative:			; X86-NOBMI-LABEL: bzhi32_c4_commutative:
	; X86-NOBMI: # %bb.0:			; X86-NOBMI: # %bb.0:
	; X86-NOBMI-NEXT: movl {{[0-9]+}}(%esp), %eax			; X86-NOBMI-NEXT: movl {{[0-9]+}}(%esp), %eax
	; X86-NOBMI-NEXT: movl $32, %ecx			; X86-NOBMI-NEXT: xorl %ecx, %ecx
	; X86-NOBMI-NEXT: subl {{[0-9]+}}(%esp), %ecx			; X86-NOBMI-NEXT: subl {{[0-9]+}}(%esp), %ecx
	; X86-NOBMI-NEXT: shll %cl, %eax			; X86-NOBMI-NEXT: shll %cl, %eax
	; X86-NOBMI-NEXT: # kill: def $cl killed $cl killed $ecx			; X86-NOBMI-NEXT: # kill: def $cl killed $cl killed $ecx
	; X86-NOBMI-NEXT: shrl %cl, %eax			; X86-NOBMI-NEXT: shrl %cl, %eax
	; X86-NOBMI-NEXT: retl			; X86-NOBMI-NEXT: retl
	;			;
	; X86-BMI1BMI2-LABEL: bzhi32_c4_commutative:			; X86-BMI1BMI2-LABEL: bzhi32_c4_commutative:
	; X86-BMI1BMI2: # %bb.0:			; X86-BMI1BMI2: # %bb.0:
	; X86-BMI1BMI2-NEXT: movl {{[0-9]+}}(%esp), %eax			; X86-BMI1BMI2-NEXT: movl {{[0-9]+}}(%esp), %eax
	; X86-BMI1BMI2-NEXT: bzhil %eax, {{[0-9]+}}(%esp), %eax			; X86-BMI1BMI2-NEXT: bzhil %eax, {{[0-9]+}}(%esp), %eax
	; X86-BMI1BMI2-NEXT: retl			; X86-BMI1BMI2-NEXT: retl
	;			;
	; X64-NOBMI-LABEL: bzhi32_c4_commutative:			; X64-NOBMI-LABEL: bzhi32_c4_commutative:
	; X64-NOBMI: # %bb.0:			; X64-NOBMI: # %bb.0:
	; X64-NOBMI-NEXT: movl $32, %ecx			; X64-NOBMI-NEXT: movl %esi, %ecx
	; X64-NOBMI-NEXT: subl %esi, %ecx			; X64-NOBMI-NEXT: negl %ecx
	; X64-NOBMI-NEXT: shll %cl, %edi			; X64-NOBMI-NEXT: shll %cl, %edi
	; X64-NOBMI-NEXT: # kill: def $cl killed $cl killed $ecx			; X64-NOBMI-NEXT: # kill: def $cl killed $cl killed $ecx
	; X64-NOBMI-NEXT: shrl %cl, %edi			; X64-NOBMI-NEXT: shrl %cl, %edi
	; X64-NOBMI-NEXT: movl %edi, %eax			; X64-NOBMI-NEXT: movl %edi, %eax
	; X64-NOBMI-NEXT: retq			; X64-NOBMI-NEXT: retq
	;			;
	; X64-BMI1BMI2-LABEL: bzhi32_c4_commutative:			; X64-BMI1BMI2-LABEL: bzhi32_c4_commutative:
	; X64-BMI1BMI2: # %bb.0:			; X64-BMI1BMI2: # %bb.0:
	Show All 40 Lines
	; X86-BMI1BMI2-NEXT: xorl %edx, %edx			; X86-BMI1BMI2-NEXT: xorl %edx, %edx
	; X86-BMI1BMI2-NEXT: .LBB25_2:			; X86-BMI1BMI2-NEXT: .LBB25_2:
	; X86-BMI1BMI2-NEXT: andl {{[0-9]+}}(%esp), %eax			; X86-BMI1BMI2-NEXT: andl {{[0-9]+}}(%esp), %eax
	; X86-BMI1BMI2-NEXT: andl {{[0-9]+}}(%esp), %edx			; X86-BMI1BMI2-NEXT: andl {{[0-9]+}}(%esp), %edx
	; X86-BMI1BMI2-NEXT: retl			; X86-BMI1BMI2-NEXT: retl
	;			;
	; X64-NOBMI-LABEL: bzhi64_c0:			; X64-NOBMI-LABEL: bzhi64_c0:
	; X64-NOBMI: # %bb.0:			; X64-NOBMI: # %bb.0:
	; X64-NOBMI-NEXT: movl $64, %ecx			; X64-NOBMI-NEXT: movq %rsi, %rcx
	; X64-NOBMI-NEXT: subl %esi, %ecx			; X64-NOBMI-NEXT: negl %ecx
	; X64-NOBMI-NEXT: shlq %cl, %rdi			; X64-NOBMI-NEXT: shlq %cl, %rdi
	; X64-NOBMI-NEXT: # kill: def $cl killed $cl killed $ecx			; X64-NOBMI-NEXT: # kill: def $cl killed $cl killed $rcx
	; X64-NOBMI-NEXT: shrq %cl, %rdi			; X64-NOBMI-NEXT: shrq %cl, %rdi
	; X64-NOBMI-NEXT: movq %rdi, %rax			; X64-NOBMI-NEXT: movq %rdi, %rax
	; X64-NOBMI-NEXT: retq			; X64-NOBMI-NEXT: retq
	;			;
	; X64-BMI1BMI2-LABEL: bzhi64_c0:			; X64-BMI1BMI2-LABEL: bzhi64_c0:
	; X64-BMI1BMI2: # %bb.0:			; X64-BMI1BMI2: # %bb.0:
	; X64-BMI1BMI2-NEXT: bzhiq %rsi, %rdi, %rax			; X64-BMI1BMI2-NEXT: bzhiq %rsi, %rdi, %rax
	; X64-BMI1BMI2-NEXT: retq			; X64-BMI1BMI2-NEXT: retq
	Show All 36 Lines
	; X86-BMI1BMI2-NEXT: xorl %edx, %edx			; X86-BMI1BMI2-NEXT: xorl %edx, %edx
	; X86-BMI1BMI2-NEXT: .LBB26_2:			; X86-BMI1BMI2-NEXT: .LBB26_2:
	; X86-BMI1BMI2-NEXT: andl {{[0-9]+}}(%esp), %eax			; X86-BMI1BMI2-NEXT: andl {{[0-9]+}}(%esp), %eax
	; X86-BMI1BMI2-NEXT: andl {{[0-9]+}}(%esp), %edx			; X86-BMI1BMI2-NEXT: andl {{[0-9]+}}(%esp), %edx
	; X86-BMI1BMI2-NEXT: retl			; X86-BMI1BMI2-NEXT: retl
	;			;
	; X64-NOBMI-LABEL: bzhi64_c1_indexzext:			; X64-NOBMI-LABEL: bzhi64_c1_indexzext:
	; X64-NOBMI: # %bb.0:			; X64-NOBMI: # %bb.0:
	; X64-NOBMI-NEXT: movb $64, %cl			; X64-NOBMI-NEXT: movl %esi, %ecx
	; X64-NOBMI-NEXT: subb %sil, %cl			; X64-NOBMI-NEXT: negb %cl
	; X64-NOBMI-NEXT: shlq %cl, %rdi			; X64-NOBMI-NEXT: shlq %cl, %rdi
				; X64-NOBMI-NEXT: # kill: def $cl killed $cl killed $ecx
	; X64-NOBMI-NEXT: shrq %cl, %rdi			; X64-NOBMI-NEXT: shrq %cl, %rdi
	; X64-NOBMI-NEXT: movq %rdi, %rax			; X64-NOBMI-NEXT: movq %rdi, %rax
	; X64-NOBMI-NEXT: retq			; X64-NOBMI-NEXT: retq
	;			;
	; X64-BMI1BMI2-LABEL: bzhi64_c1_indexzext:			; X64-BMI1BMI2-LABEL: bzhi64_c1_indexzext:
	; X64-BMI1BMI2: # %bb.0:			; X64-BMI1BMI2: # %bb.0:
	; X64-BMI1BMI2-NEXT: # kill: def $esi killed $esi def $rsi			; X64-BMI1BMI2-NEXT: # kill: def $esi killed $esi def $rsi
	; X64-BMI1BMI2-NEXT: bzhiq %rsi, %rdi, %rax			; X64-BMI1BMI2-NEXT: bzhiq %rsi, %rdi, %rax
	▲ Show 20 Lines • Show All 44 Lines • ▼ Show 20 Lines
	; X86-BMI1BMI2-NEXT: .LBB27_2:			; X86-BMI1BMI2-NEXT: .LBB27_2:
	; X86-BMI1BMI2-NEXT: andl (%esi), %eax			; X86-BMI1BMI2-NEXT: andl (%esi), %eax
	; X86-BMI1BMI2-NEXT: andl 4(%esi), %edx			; X86-BMI1BMI2-NEXT: andl 4(%esi), %edx
	; X86-BMI1BMI2-NEXT: popl %esi			; X86-BMI1BMI2-NEXT: popl %esi
	; X86-BMI1BMI2-NEXT: retl			; X86-BMI1BMI2-NEXT: retl
	;			;
	; X64-NOBMI-LABEL: bzhi64_c2_load:			; X64-NOBMI-LABEL: bzhi64_c2_load:
	; X64-NOBMI: # %bb.0:			; X64-NOBMI: # %bb.0:
				; X64-NOBMI-NEXT: movq %rsi, %rcx
	; X64-NOBMI-NEXT: movq (%rdi), %rax			; X64-NOBMI-NEXT: movq (%rdi), %rax
	; X64-NOBMI-NEXT: movl $64, %ecx			; X64-NOBMI-NEXT: negl %ecx
	; X64-NOBMI-NEXT: subl %esi, %ecx
	; X64-NOBMI-NEXT: shlq %cl, %rax			; X64-NOBMI-NEXT: shlq %cl, %rax
	; X64-NOBMI-NEXT: # kill: def $cl killed $cl killed $ecx			; X64-NOBMI-NEXT: # kill: def $cl killed $cl killed $rcx
	; X64-NOBMI-NEXT: shrq %cl, %rax			; X64-NOBMI-NEXT: shrq %cl, %rax
	; X64-NOBMI-NEXT: retq			; X64-NOBMI-NEXT: retq
	;			;
	; X64-BMI1BMI2-LABEL: bzhi64_c2_load:			; X64-BMI1BMI2-LABEL: bzhi64_c2_load:
	; X64-BMI1BMI2: # %bb.0:			; X64-BMI1BMI2: # %bb.0:
	; X64-BMI1BMI2-NEXT: bzhiq %rsi, (%rdi), %rax			; X64-BMI1BMI2-NEXT: bzhiq %rsi, (%rdi), %rax
	; X64-BMI1BMI2-NEXT: retq			; X64-BMI1BMI2-NEXT: retq
	%val = load i64, i64* %w			%val = load i64, i64* %w
	▲ Show 20 Lines • Show All 42 Lines • ▼ Show 20 Lines
	; X86-BMI1BMI2-NEXT: .LBB28_2:			; X86-BMI1BMI2-NEXT: .LBB28_2:
	; X86-BMI1BMI2-NEXT: andl (%esi), %eax			; X86-BMI1BMI2-NEXT: andl (%esi), %eax
	; X86-BMI1BMI2-NEXT: andl 4(%esi), %edx			; X86-BMI1BMI2-NEXT: andl 4(%esi), %edx
	; X86-BMI1BMI2-NEXT: popl %esi			; X86-BMI1BMI2-NEXT: popl %esi
	; X86-BMI1BMI2-NEXT: retl			; X86-BMI1BMI2-NEXT: retl
	;			;
	; X64-NOBMI-LABEL: bzhi64_c3_load_indexzext:			; X64-NOBMI-LABEL: bzhi64_c3_load_indexzext:
	; X64-NOBMI: # %bb.0:			; X64-NOBMI: # %bb.0:
				; X64-NOBMI-NEXT: movl %esi, %ecx
	; X64-NOBMI-NEXT: movq (%rdi), %rax			; X64-NOBMI-NEXT: movq (%rdi), %rax
	; X64-NOBMI-NEXT: movb $64, %cl			; X64-NOBMI-NEXT: negb %cl
	; X64-NOBMI-NEXT: subb %sil, %cl
	; X64-NOBMI-NEXT: shlq %cl, %rax			; X64-NOBMI-NEXT: shlq %cl, %rax
				; X64-NOBMI-NEXT: # kill: def $cl killed $cl killed $ecx
	; X64-NOBMI-NEXT: shrq %cl, %rax			; X64-NOBMI-NEXT: shrq %cl, %rax
	; X64-NOBMI-NEXT: retq			; X64-NOBMI-NEXT: retq
	;			;
	; X64-BMI1BMI2-LABEL: bzhi64_c3_load_indexzext:			; X64-BMI1BMI2-LABEL: bzhi64_c3_load_indexzext:
	; X64-BMI1BMI2: # %bb.0:			; X64-BMI1BMI2: # %bb.0:
	; X64-BMI1BMI2-NEXT: # kill: def $esi killed $esi def $rsi			; X64-BMI1BMI2-NEXT: # kill: def $esi killed $esi def $rsi
	; X64-BMI1BMI2-NEXT: bzhiq %rsi, (%rdi), %rax			; X64-BMI1BMI2-NEXT: bzhiq %rsi, (%rdi), %rax
	; X64-BMI1BMI2-NEXT: retq			; X64-BMI1BMI2-NEXT: retq
	Show All 38 Lines
	; X86-BMI1BMI2-NEXT: xorl %edx, %edx			; X86-BMI1BMI2-NEXT: xorl %edx, %edx
	; X86-BMI1BMI2-NEXT: .LBB29_2:			; X86-BMI1BMI2-NEXT: .LBB29_2:
	; X86-BMI1BMI2-NEXT: andl {{[0-9]+}}(%esp), %eax			; X86-BMI1BMI2-NEXT: andl {{[0-9]+}}(%esp), %eax
	; X86-BMI1BMI2-NEXT: andl {{[0-9]+}}(%esp), %edx			; X86-BMI1BMI2-NEXT: andl {{[0-9]+}}(%esp), %edx
	; X86-BMI1BMI2-NEXT: retl			; X86-BMI1BMI2-NEXT: retl
	;			;
	; X64-NOBMI-LABEL: bzhi64_c4_commutative:			; X64-NOBMI-LABEL: bzhi64_c4_commutative:
	; X64-NOBMI: # %bb.0:			; X64-NOBMI: # %bb.0:
	; X64-NOBMI-NEXT: movl $64, %ecx			; X64-NOBMI-NEXT: movq %rsi, %rcx
	; X64-NOBMI-NEXT: subl %esi, %ecx			; X64-NOBMI-NEXT: negl %ecx
	; X64-NOBMI-NEXT: shlq %cl, %rdi			; X64-NOBMI-NEXT: shlq %cl, %rdi
	; X64-NOBMI-NEXT: # kill: def $cl killed $cl killed $ecx			; X64-NOBMI-NEXT: # kill: def $cl killed $cl killed $rcx
	; X64-NOBMI-NEXT: shrq %cl, %rdi			; X64-NOBMI-NEXT: shrq %cl, %rdi
	; X64-NOBMI-NEXT: movq %rdi, %rax			; X64-NOBMI-NEXT: movq %rdi, %rax
	; X64-NOBMI-NEXT: retq			; X64-NOBMI-NEXT: retq
	;			;
	; X64-BMI1BMI2-LABEL: bzhi64_c4_commutative:			; X64-BMI1BMI2-LABEL: bzhi64_c4_commutative:
	; X64-BMI1BMI2: # %bb.0:			; X64-BMI1BMI2: # %bb.0:
	; X64-BMI1BMI2-NEXT: bzhiq %rsi, %rdi, %rax			; X64-BMI1BMI2-NEXT: bzhiq %rsi, %rdi, %rax
	; X64-BMI1BMI2-NEXT: retq			; X64-BMI1BMI2-NEXT: retq
	%numhighbits = sub i64 64, %numlowbits			%numhighbits = sub i64 64, %numlowbits
	%mask = lshr i64 -1, %numhighbits			%mask = lshr i64 -1, %numhighbits
	%masked = and i64 %val, %mask ; swapped order			%masked = and i64 %val, %mask ; swapped order
	ret i64 %masked			ret i64 %masked
	}			}

	; ---------------------------------------------------------------------------- ;			; ---------------------------------------------------------------------------- ;
	; Pattern d. 32-bit.			; Pattern d. 32-bit.
	; ---------------------------------------------------------------------------- ;			; ---------------------------------------------------------------------------- ;

	define i32 @bzhi32_d0(i32 %val, i32 %numlowbits) nounwind {			define i32 @bzhi32_d0(i32 %val, i32 %numlowbits) nounwind {
	; X86-NOBMI-LABEL: bzhi32_d0:			; X86-NOBMI-LABEL: bzhi32_d0:
	; X86-NOBMI: # %bb.0:			; X86-NOBMI: # %bb.0:
	; X86-NOBMI-NEXT: movl {{[0-9]+}}(%esp), %eax			; X86-NOBMI-NEXT: movl {{[0-9]+}}(%esp), %eax
	; X86-NOBMI-NEXT: movl $32, %ecx			; X86-NOBMI-NEXT: xorl %ecx, %ecx
	; X86-NOBMI-NEXT: subl {{[0-9]+}}(%esp), %ecx			; X86-NOBMI-NEXT: subl {{[0-9]+}}(%esp), %ecx
	; X86-NOBMI-NEXT: shll %cl, %eax			; X86-NOBMI-NEXT: shll %cl, %eax
	; X86-NOBMI-NEXT: # kill: def $cl killed $cl killed $ecx			; X86-NOBMI-NEXT: # kill: def $cl killed $cl killed $ecx
	; X86-NOBMI-NEXT: shrl %cl, %eax			; X86-NOBMI-NEXT: shrl %cl, %eax
	; X86-NOBMI-NEXT: retl			; X86-NOBMI-NEXT: retl
	;			;
	; X86-BMI1BMI2-LABEL: bzhi32_d0:			; X86-BMI1BMI2-LABEL: bzhi32_d0:
	; X86-BMI1BMI2: # %bb.0:			; X86-BMI1BMI2: # %bb.0:
	; X86-BMI1BMI2-NEXT: movl {{[0-9]+}}(%esp), %eax			; X86-BMI1BMI2-NEXT: movl {{[0-9]+}}(%esp), %eax
	; X86-BMI1BMI2-NEXT: bzhil %eax, {{[0-9]+}}(%esp), %eax			; X86-BMI1BMI2-NEXT: bzhil %eax, {{[0-9]+}}(%esp), %eax
	; X86-BMI1BMI2-NEXT: retl			; X86-BMI1BMI2-NEXT: retl
	;			;
	; X64-NOBMI-LABEL: bzhi32_d0:			; X64-NOBMI-LABEL: bzhi32_d0:
	; X64-NOBMI: # %bb.0:			; X64-NOBMI: # %bb.0:
	; X64-NOBMI-NEXT: movl $32, %ecx			; X64-NOBMI-NEXT: movl %esi, %ecx
	; X64-NOBMI-NEXT: subl %esi, %ecx			; X64-NOBMI-NEXT: negl %ecx
	; X64-NOBMI-NEXT: shll %cl, %edi			; X64-NOBMI-NEXT: shll %cl, %edi
	; X64-NOBMI-NEXT: # kill: def $cl killed $cl killed $ecx			; X64-NOBMI-NEXT: # kill: def $cl killed $cl killed $ecx
	; X64-NOBMI-NEXT: shrl %cl, %edi			; X64-NOBMI-NEXT: shrl %cl, %edi
	; X64-NOBMI-NEXT: movl %edi, %eax			; X64-NOBMI-NEXT: movl %edi, %eax
	; X64-NOBMI-NEXT: retq			; X64-NOBMI-NEXT: retq
	;			;
	; X64-BMI1BMI2-LABEL: bzhi32_d0:			; X64-BMI1BMI2-LABEL: bzhi32_d0:
	; X64-BMI1BMI2: # %bb.0:			; X64-BMI1BMI2: # %bb.0:
	; X64-BMI1BMI2-NEXT: bzhil %esi, %edi, %eax			; X64-BMI1BMI2-NEXT: bzhil %esi, %edi, %eax
	; X64-BMI1BMI2-NEXT: retq			; X64-BMI1BMI2-NEXT: retq
	%numhighbits = sub i32 32, %numlowbits			%numhighbits = sub i32 32, %numlowbits
	%highbitscleared = shl i32 %val, %numhighbits			%highbitscleared = shl i32 %val, %numhighbits
	%masked = lshr i32 %highbitscleared, %numhighbits			%masked = lshr i32 %highbitscleared, %numhighbits
	ret i32 %masked			ret i32 %masked
	}			}

	define i32 @bzhi32_d1_indexzext(i32 %val, i8 %numlowbits) nounwind {			define i32 @bzhi32_d1_indexzext(i32 %val, i8 %numlowbits) nounwind {
	; X86-NOBMI-LABEL: bzhi32_d1_indexzext:			; X86-NOBMI-LABEL: bzhi32_d1_indexzext:
	; X86-NOBMI: # %bb.0:			; X86-NOBMI: # %bb.0:
	; X86-NOBMI-NEXT: movl {{[0-9]+}}(%esp), %eax			; X86-NOBMI-NEXT: movl {{[0-9]+}}(%esp), %eax
	; X86-NOBMI-NEXT: movb $32, %cl			; X86-NOBMI-NEXT: xorl %ecx, %ecx
	; X86-NOBMI-NEXT: subb {{[0-9]+}}(%esp), %cl			; X86-NOBMI-NEXT: subb {{[0-9]+}}(%esp), %cl
	; X86-NOBMI-NEXT: shll %cl, %eax			; X86-NOBMI-NEXT: shll %cl, %eax
				; X86-NOBMI-NEXT: # kill: def $cl killed $cl killed $ecx
	; X86-NOBMI-NEXT: shrl %cl, %eax			; X86-NOBMI-NEXT: shrl %cl, %eax
	; X86-NOBMI-NEXT: retl			; X86-NOBMI-NEXT: retl
	;			;
	; X86-BMI1BMI2-LABEL: bzhi32_d1_indexzext:			; X86-BMI1BMI2-LABEL: bzhi32_d1_indexzext:
	; X86-BMI1BMI2: # %bb.0:			; X86-BMI1BMI2: # %bb.0:
	; X86-BMI1BMI2-NEXT: movb {{[0-9]+}}(%esp), %al			; X86-BMI1BMI2-NEXT: movb {{[0-9]+}}(%esp), %al
	; X86-BMI1BMI2-NEXT: bzhil %eax, {{[0-9]+}}(%esp), %eax			; X86-BMI1BMI2-NEXT: bzhil %eax, {{[0-9]+}}(%esp), %eax
	; X86-BMI1BMI2-NEXT: retl			; X86-BMI1BMI2-NEXT: retl
	;			;
	; X64-NOBMI-LABEL: bzhi32_d1_indexzext:			; X64-NOBMI-LABEL: bzhi32_d1_indexzext:
	; X64-NOBMI: # %bb.0:			; X64-NOBMI: # %bb.0:
	; X64-NOBMI-NEXT: movb $32, %cl			; X64-NOBMI-NEXT: movl %esi, %ecx
	; X64-NOBMI-NEXT: subb %sil, %cl			; X64-NOBMI-NEXT: negb %cl
	; X64-NOBMI-NEXT: shll %cl, %edi			; X64-NOBMI-NEXT: shll %cl, %edi
				; X64-NOBMI-NEXT: # kill: def $cl killed $cl killed $ecx
	; X64-NOBMI-NEXT: shrl %cl, %edi			; X64-NOBMI-NEXT: shrl %cl, %edi
	; X64-NOBMI-NEXT: movl %edi, %eax			; X64-NOBMI-NEXT: movl %edi, %eax
	; X64-NOBMI-NEXT: retq			; X64-NOBMI-NEXT: retq
	;			;
	; X64-BMI1BMI2-LABEL: bzhi32_d1_indexzext:			; X64-BMI1BMI2-LABEL: bzhi32_d1_indexzext:
	; X64-BMI1BMI2: # %bb.0:			; X64-BMI1BMI2: # %bb.0:
	; X64-BMI1BMI2-NEXT: bzhil %esi, %edi, %eax			; X64-BMI1BMI2-NEXT: bzhil %esi, %edi, %eax
	; X64-BMI1BMI2-NEXT: retq			; X64-BMI1BMI2-NEXT: retq
	%numhighbits = sub i8 32, %numlowbits			%numhighbits = sub i8 32, %numlowbits
	%sh_prom = zext i8 %numhighbits to i32			%sh_prom = zext i8 %numhighbits to i32
	%highbitscleared = shl i32 %val, %sh_prom			%highbitscleared = shl i32 %val, %sh_prom
	%masked = lshr i32 %highbitscleared, %sh_prom			%masked = lshr i32 %highbitscleared, %sh_prom
	ret i32 %masked			ret i32 %masked
	}			}

	define i32 @bzhi32_d2_load(i32* %w, i32 %numlowbits) nounwind {			define i32 @bzhi32_d2_load(i32* %w, i32 %numlowbits) nounwind {
	; X86-NOBMI-LABEL: bzhi32_d2_load:			; X86-NOBMI-LABEL: bzhi32_d2_load:
	; X86-NOBMI: # %bb.0:			; X86-NOBMI: # %bb.0:
	; X86-NOBMI-NEXT: movl {{[0-9]+}}(%esp), %eax			; X86-NOBMI-NEXT: movl {{[0-9]+}}(%esp), %eax
	; X86-NOBMI-NEXT: movl (%eax), %eax			; X86-NOBMI-NEXT: movl (%eax), %eax
	; X86-NOBMI-NEXT: movl $32, %ecx			; X86-NOBMI-NEXT: xorl %ecx, %ecx
	; X86-NOBMI-NEXT: subl {{[0-9]+}}(%esp), %ecx			; X86-NOBMI-NEXT: subl {{[0-9]+}}(%esp), %ecx
	; X86-NOBMI-NEXT: shll %cl, %eax			; X86-NOBMI-NEXT: shll %cl, %eax
	; X86-NOBMI-NEXT: # kill: def $cl killed $cl killed $ecx			; X86-NOBMI-NEXT: # kill: def $cl killed $cl killed $ecx
	; X86-NOBMI-NEXT: shrl %cl, %eax			; X86-NOBMI-NEXT: shrl %cl, %eax
	; X86-NOBMI-NEXT: retl			; X86-NOBMI-NEXT: retl
	;			;
	; X86-BMI1BMI2-LABEL: bzhi32_d2_load:			; X86-BMI1BMI2-LABEL: bzhi32_d2_load:
	; X86-BMI1BMI2: # %bb.0:			; X86-BMI1BMI2: # %bb.0:
	; X86-BMI1BMI2-NEXT: movl {{[0-9]+}}(%esp), %eax			; X86-BMI1BMI2-NEXT: movl {{[0-9]+}}(%esp), %eax
	; X86-BMI1BMI2-NEXT: movl {{[0-9]+}}(%esp), %ecx			; X86-BMI1BMI2-NEXT: movl {{[0-9]+}}(%esp), %ecx
	; X86-BMI1BMI2-NEXT: bzhil %eax, (%ecx), %eax			; X86-BMI1BMI2-NEXT: bzhil %eax, (%ecx), %eax
	; X86-BMI1BMI2-NEXT: retl			; X86-BMI1BMI2-NEXT: retl
	;			;
	; X64-NOBMI-LABEL: bzhi32_d2_load:			; X64-NOBMI-LABEL: bzhi32_d2_load:
	; X64-NOBMI: # %bb.0:			; X64-NOBMI: # %bb.0:
				; X64-NOBMI-NEXT: movl %esi, %ecx
	; X64-NOBMI-NEXT: movl (%rdi), %eax			; X64-NOBMI-NEXT: movl (%rdi), %eax
	; X64-NOBMI-NEXT: movl $32, %ecx			; X64-NOBMI-NEXT: negl %ecx
	; X64-NOBMI-NEXT: subl %esi, %ecx
	; X64-NOBMI-NEXT: shll %cl, %eax			; X64-NOBMI-NEXT: shll %cl, %eax
	; X64-NOBMI-NEXT: # kill: def $cl killed $cl killed $ecx			; X64-NOBMI-NEXT: # kill: def $cl killed $cl killed $ecx
	; X64-NOBMI-NEXT: shrl %cl, %eax			; X64-NOBMI-NEXT: shrl %cl, %eax
	; X64-NOBMI-NEXT: retq			; X64-NOBMI-NEXT: retq
	;			;
	; X64-BMI1BMI2-LABEL: bzhi32_d2_load:			; X64-BMI1BMI2-LABEL: bzhi32_d2_load:
	; X64-BMI1BMI2: # %bb.0:			; X64-BMI1BMI2: # %bb.0:
	; X64-BMI1BMI2-NEXT: bzhil %esi, (%rdi), %eax			; X64-BMI1BMI2-NEXT: bzhil %esi, (%rdi), %eax
	; X64-BMI1BMI2-NEXT: retq			; X64-BMI1BMI2-NEXT: retq
	%val = load i32, i32* %w			%val = load i32, i32* %w
	%numhighbits = sub i32 32, %numlowbits			%numhighbits = sub i32 32, %numlowbits
	%highbitscleared = shl i32 %val, %numhighbits			%highbitscleared = shl i32 %val, %numhighbits
	%masked = lshr i32 %highbitscleared, %numhighbits			%masked = lshr i32 %highbitscleared, %numhighbits
	ret i32 %masked			ret i32 %masked
	}			}

	define i32 @bzhi32_d3_load_indexzext(i32* %w, i8 %numlowbits) nounwind {			define i32 @bzhi32_d3_load_indexzext(i32* %w, i8 %numlowbits) nounwind {
	; X86-NOBMI-LABEL: bzhi32_d3_load_indexzext:			; X86-NOBMI-LABEL: bzhi32_d3_load_indexzext:
	; X86-NOBMI: # %bb.0:			; X86-NOBMI: # %bb.0:
	; X86-NOBMI-NEXT: movl {{[0-9]+}}(%esp), %eax			; X86-NOBMI-NEXT: movl {{[0-9]+}}(%esp), %eax
	; X86-NOBMI-NEXT: movl (%eax), %eax			; X86-NOBMI-NEXT: movl (%eax), %eax
	; X86-NOBMI-NEXT: movb $32, %cl			; X86-NOBMI-NEXT: xorl %ecx, %ecx
	; X86-NOBMI-NEXT: subb {{[0-9]+}}(%esp), %cl			; X86-NOBMI-NEXT: subb {{[0-9]+}}(%esp), %cl
	; X86-NOBMI-NEXT: shll %cl, %eax			; X86-NOBMI-NEXT: shll %cl, %eax
				; X86-NOBMI-NEXT: # kill: def $cl killed $cl killed $ecx
	; X86-NOBMI-NEXT: shrl %cl, %eax			; X86-NOBMI-NEXT: shrl %cl, %eax
	; X86-NOBMI-NEXT: retl			; X86-NOBMI-NEXT: retl
	;			;
	; X86-BMI1BMI2-LABEL: bzhi32_d3_load_indexzext:			; X86-BMI1BMI2-LABEL: bzhi32_d3_load_indexzext:
	; X86-BMI1BMI2: # %bb.0:			; X86-BMI1BMI2: # %bb.0:
	; X86-BMI1BMI2-NEXT: movl {{[0-9]+}}(%esp), %eax			; X86-BMI1BMI2-NEXT: movl {{[0-9]+}}(%esp), %eax
	; X86-BMI1BMI2-NEXT: movb {{[0-9]+}}(%esp), %cl			; X86-BMI1BMI2-NEXT: movb {{[0-9]+}}(%esp), %cl
	; X86-BMI1BMI2-NEXT: bzhil %ecx, (%eax), %eax			; X86-BMI1BMI2-NEXT: bzhil %ecx, (%eax), %eax
	; X86-BMI1BMI2-NEXT: retl			; X86-BMI1BMI2-NEXT: retl
	;			;
	; X64-NOBMI-LABEL: bzhi32_d3_load_indexzext:			; X64-NOBMI-LABEL: bzhi32_d3_load_indexzext:
	; X64-NOBMI: # %bb.0:			; X64-NOBMI: # %bb.0:
				; X64-NOBMI-NEXT: movl %esi, %ecx
	; X64-NOBMI-NEXT: movl (%rdi), %eax			; X64-NOBMI-NEXT: movl (%rdi), %eax
	; X64-NOBMI-NEXT: movb $32, %cl			; X64-NOBMI-NEXT: negb %cl
	; X64-NOBMI-NEXT: subb %sil, %cl
	; X64-NOBMI-NEXT: shll %cl, %eax			; X64-NOBMI-NEXT: shll %cl, %eax
				; X64-NOBMI-NEXT: # kill: def $cl killed $cl killed $ecx
	; X64-NOBMI-NEXT: shrl %cl, %eax			; X64-NOBMI-NEXT: shrl %cl, %eax
	; X64-NOBMI-NEXT: retq			; X64-NOBMI-NEXT: retq
	;			;
	; X64-BMI1BMI2-LABEL: bzhi32_d3_load_indexzext:			; X64-BMI1BMI2-LABEL: bzhi32_d3_load_indexzext:
	; X64-BMI1BMI2: # %bb.0:			; X64-BMI1BMI2: # %bb.0:
	; X64-BMI1BMI2-NEXT: bzhil %esi, (%rdi), %eax			; X64-BMI1BMI2-NEXT: bzhil %esi, (%rdi), %eax
	; X64-BMI1BMI2-NEXT: retq			; X64-BMI1BMI2-NEXT: retq
	%val = load i32, i32* %w			%val = load i32, i32* %w
	▲ Show 20 Lines • Show All 75 Lines • ▼ Show 20 Lines
	; X86-BMI1BMI2-NEXT: movl %edi, %eax			; X86-BMI1BMI2-NEXT: movl %edi, %eax
	; X86-BMI1BMI2-NEXT: .LBB34_6:			; X86-BMI1BMI2-NEXT: .LBB34_6:
	; X86-BMI1BMI2-NEXT: popl %esi			; X86-BMI1BMI2-NEXT: popl %esi
	; X86-BMI1BMI2-NEXT: popl %edi			; X86-BMI1BMI2-NEXT: popl %edi
	; X86-BMI1BMI2-NEXT: retl			; X86-BMI1BMI2-NEXT: retl
	;			;
	; X64-NOBMI-LABEL: bzhi64_d0:			; X64-NOBMI-LABEL: bzhi64_d0:
	; X64-NOBMI: # %bb.0:			; X64-NOBMI: # %bb.0:
	; X64-NOBMI-NEXT: movl $64, %ecx			; X64-NOBMI-NEXT: movq %rsi, %rcx
	; X64-NOBMI-NEXT: subl %esi, %ecx			; X64-NOBMI-NEXT: negl %ecx
	; X64-NOBMI-NEXT: shlq %cl, %rdi			; X64-NOBMI-NEXT: shlq %cl, %rdi
	; X64-NOBMI-NEXT: # kill: def $cl killed $cl killed $ecx			; X64-NOBMI-NEXT: # kill: def $cl killed $cl killed $rcx
	; X64-NOBMI-NEXT: shrq %cl, %rdi			; X64-NOBMI-NEXT: shrq %cl, %rdi
	; X64-NOBMI-NEXT: movq %rdi, %rax			; X64-NOBMI-NEXT: movq %rdi, %rax
	; X64-NOBMI-NEXT: retq			; X64-NOBMI-NEXT: retq
	;			;
	; X64-BMI1BMI2-LABEL: bzhi64_d0:			; X64-BMI1BMI2-LABEL: bzhi64_d0:
	; X64-BMI1BMI2: # %bb.0:			; X64-BMI1BMI2: # %bb.0:
	; X64-BMI1BMI2-NEXT: bzhiq %rsi, %rdi, %rax			; X64-BMI1BMI2-NEXT: bzhiq %rsi, %rdi, %rax
	; X64-BMI1BMI2-NEXT: retq			; X64-BMI1BMI2-NEXT: retq
	▲ Show 20 Lines • Show All 72 Lines • ▼ Show 20 Lines
	; X86-BMI1BMI2-NEXT: movl %edi, %eax			; X86-BMI1BMI2-NEXT: movl %edi, %eax
	; X86-BMI1BMI2-NEXT: .LBB35_6:			; X86-BMI1BMI2-NEXT: .LBB35_6:
	; X86-BMI1BMI2-NEXT: popl %esi			; X86-BMI1BMI2-NEXT: popl %esi
	; X86-BMI1BMI2-NEXT: popl %edi			; X86-BMI1BMI2-NEXT: popl %edi
	; X86-BMI1BMI2-NEXT: retl			; X86-BMI1BMI2-NEXT: retl
	;			;
	; X64-NOBMI-LABEL: bzhi64_d1_indexzext:			; X64-NOBMI-LABEL: bzhi64_d1_indexzext:
	; X64-NOBMI: # %bb.0:			; X64-NOBMI: # %bb.0:
	; X64-NOBMI-NEXT: movb $64, %cl			; X64-NOBMI-NEXT: movl %esi, %ecx
	; X64-NOBMI-NEXT: subb %sil, %cl			; X64-NOBMI-NEXT: negb %cl
	; X64-NOBMI-NEXT: shlq %cl, %rdi			; X64-NOBMI-NEXT: shlq %cl, %rdi
				; X64-NOBMI-NEXT: # kill: def $cl killed $cl killed $ecx
	; X64-NOBMI-NEXT: shrq %cl, %rdi			; X64-NOBMI-NEXT: shrq %cl, %rdi
	; X64-NOBMI-NEXT: movq %rdi, %rax			; X64-NOBMI-NEXT: movq %rdi, %rax
	; X64-NOBMI-NEXT: retq			; X64-NOBMI-NEXT: retq
	;			;
	; X64-BMI1BMI2-LABEL: bzhi64_d1_indexzext:			; X64-BMI1BMI2-LABEL: bzhi64_d1_indexzext:
	; X64-BMI1BMI2: # %bb.0:			; X64-BMI1BMI2: # %bb.0:
	; X64-BMI1BMI2-NEXT: # kill: def $esi killed $esi def $rsi			; X64-BMI1BMI2-NEXT: # kill: def $esi killed $esi def $rsi
	; X64-BMI1BMI2-NEXT: bzhiq %rsi, %rdi, %rax			; X64-BMI1BMI2-NEXT: bzhiq %rsi, %rdi, %rax
	▲ Show 20 Lines • Show All 76 Lines • ▼ Show 20 Lines
	; X86-BMI1BMI2-NEXT: movl %edi, %eax			; X86-BMI1BMI2-NEXT: movl %edi, %eax
	; X86-BMI1BMI2-NEXT: .LBB36_6:			; X86-BMI1BMI2-NEXT: .LBB36_6:
	; X86-BMI1BMI2-NEXT: popl %esi			; X86-BMI1BMI2-NEXT: popl %esi
	; X86-BMI1BMI2-NEXT: popl %edi			; X86-BMI1BMI2-NEXT: popl %edi
	; X86-BMI1BMI2-NEXT: retl			; X86-BMI1BMI2-NEXT: retl
	;			;
	; X64-NOBMI-LABEL: bzhi64_d2_load:			; X64-NOBMI-LABEL: bzhi64_d2_load:
	; X64-NOBMI: # %bb.0:			; X64-NOBMI: # %bb.0:
				; X64-NOBMI-NEXT: movq %rsi, %rcx
	; X64-NOBMI-NEXT: movq (%rdi), %rax			; X64-NOBMI-NEXT: movq (%rdi), %rax
	; X64-NOBMI-NEXT: movl $64, %ecx			; X64-NOBMI-NEXT: negl %ecx
	; X64-NOBMI-NEXT: subl %esi, %ecx
	; X64-NOBMI-NEXT: shlq %cl, %rax			; X64-NOBMI-NEXT: shlq %cl, %rax
	; X64-NOBMI-NEXT: # kill: def $cl killed $cl killed $ecx			; X64-NOBMI-NEXT: # kill: def $cl killed $cl killed $rcx
	; X64-NOBMI-NEXT: shrq %cl, %rax			; X64-NOBMI-NEXT: shrq %cl, %rax
	; X64-NOBMI-NEXT: retq			; X64-NOBMI-NEXT: retq
	;			;
	; X64-BMI1BMI2-LABEL: bzhi64_d2_load:			; X64-BMI1BMI2-LABEL: bzhi64_d2_load:
	; X64-BMI1BMI2: # %bb.0:			; X64-BMI1BMI2: # %bb.0:
	; X64-BMI1BMI2-NEXT: bzhiq %rsi, (%rdi), %rax			; X64-BMI1BMI2-NEXT: bzhiq %rsi, (%rdi), %rax
	; X64-BMI1BMI2-NEXT: retq			; X64-BMI1BMI2-NEXT: retq
	%val = load i64, i64* %w			%val = load i64, i64* %w
	▲ Show 20 Lines • Show All 74 Lines • ▼ Show 20 Lines
	; X86-BMI1BMI2-NEXT: movl %edi, %eax			; X86-BMI1BMI2-NEXT: movl %edi, %eax
	; X86-BMI1BMI2-NEXT: .LBB37_6:			; X86-BMI1BMI2-NEXT: .LBB37_6:
	; X86-BMI1BMI2-NEXT: popl %esi			; X86-BMI1BMI2-NEXT: popl %esi
	; X86-BMI1BMI2-NEXT: popl %edi			; X86-BMI1BMI2-NEXT: popl %edi
	; X86-BMI1BMI2-NEXT: retl			; X86-BMI1BMI2-NEXT: retl
	;			;
	; X64-NOBMI-LABEL: bzhi64_d3_load_indexzext:			; X64-NOBMI-LABEL: bzhi64_d3_load_indexzext:
	; X64-NOBMI: # %bb.0:			; X64-NOBMI: # %bb.0:
				; X64-NOBMI-NEXT: movl %esi, %ecx
	; X64-NOBMI-NEXT: movq (%rdi), %rax			; X64-NOBMI-NEXT: movq (%rdi), %rax
	; X64-NOBMI-NEXT: movb $64, %cl			; X64-NOBMI-NEXT: negb %cl
	; X64-NOBMI-NEXT: subb %sil, %cl
	; X64-NOBMI-NEXT: shlq %cl, %rax			; X64-NOBMI-NEXT: shlq %cl, %rax
				; X64-NOBMI-NEXT: # kill: def $cl killed $cl killed $ecx
	; X64-NOBMI-NEXT: shrq %cl, %rax			; X64-NOBMI-NEXT: shrq %cl, %rax
	; X64-NOBMI-NEXT: retq			; X64-NOBMI-NEXT: retq
	;			;
	; X64-BMI1BMI2-LABEL: bzhi64_d3_load_indexzext:			; X64-BMI1BMI2-LABEL: bzhi64_d3_load_indexzext:
	; X64-BMI1BMI2: # %bb.0:			; X64-BMI1BMI2: # %bb.0:
	; X64-BMI1BMI2-NEXT: # kill: def $esi killed $esi def $rsi			; X64-BMI1BMI2-NEXT: # kill: def $esi killed $esi def $rsi
	; X64-BMI1BMI2-NEXT: bzhiq %rsi, (%rdi), %rax			; X64-BMI1BMI2-NEXT: bzhiq %rsi, (%rdi), %rax
	; X64-BMI1BMI2-NEXT: retq			; X64-BMI1BMI2-NEXT: retq
	▲ Show 20 Lines • Show All 283 Lines • Show Last 20 Lines

test/CodeGen/X86/schedule-x86-64-shld.ll

	Show First 20 Lines • Show All 156 Lines • ▼ Show 20 Lines
	; GENERIC: # %bb.0: # %entry			; GENERIC: # %bb.0: # %entry
	; GENERIC-NEXT: movl %edx, %ecx # sched: [1:0.33]			; GENERIC-NEXT: movl %edx, %ecx # sched: [1:0.33]
	; GENERIC-NEXT: shldq %cl, %rsi, %rdi # sched: [4:1.50]			; GENERIC-NEXT: shldq %cl, %rsi, %rdi # sched: [4:1.50]
	; GENERIC-NEXT: movq %rdi, %rax # sched: [1:0.33]			; GENERIC-NEXT: movq %rdi, %rax # sched: [1:0.33]
	; GENERIC-NEXT: retq # sched: [1:1.00]			; GENERIC-NEXT: retq # sched: [1:1.00]
	;			;
	; BTVER2-LABEL: lshift_cl:			; BTVER2-LABEL: lshift_cl:
	; BTVER2: # %bb.0: # %entry			; BTVER2: # %bb.0: # %entry
	; BTVER2-NEXT: movl %edx, %ecx # sched: [1:0.50]			; BTVER2-NEXT: movq %rdx, %rcx # sched: [1:0.50]
	; BTVER2-NEXT: shlq %cl, %rdi # sched: [1:0.50]			; BTVER2-NEXT: shlq %cl, %rdi # sched: [1:0.50]
	; BTVER2-NEXT: movl $64, %ecx # sched: [1:0.50]			; BTVER2-NEXT: negl %ecx # sched: [1:0.50]
	; BTVER2-NEXT: subl %edx, %ecx # sched: [1:0.50]			; BTVER2-NEXT: # kill: def $cl killed $cl killed $rcx
	; BTVER2-NEXT: # kill: def $cl killed $cl killed $ecx
	; BTVER2-NEXT: shrq %cl, %rsi # sched: [1:0.50]			; BTVER2-NEXT: shrq %cl, %rsi # sched: [1:0.50]
	; BTVER2-NEXT: orq %rdi, %rsi # sched: [1:0.50]			; BTVER2-NEXT: orq %rdi, %rsi # sched: [1:0.50]
	; BTVER2-NEXT: movq %rsi, %rax # sched: [1:0.50]			; BTVER2-NEXT: movq %rsi, %rax # sched: [1:0.50]
	; BTVER2-NEXT: retq # sched: [4:1.00]			; BTVER2-NEXT: retq # sched: [4:1.00]
	;			;
	; BDVER1-LABEL: lshift_cl:			; BDVER1-LABEL: lshift_cl:
	; BDVER1: # %bb.0: # %entry			; BDVER1: # %bb.0: # %entry
	; BDVER1-NEXT: movl %edx, %ecx			; BDVER1-NEXT: movq %rdx, %rcx
	; BDVER1-NEXT: shlq %cl, %rdi			; BDVER1-NEXT: shlq %cl, %rdi
	; BDVER1-NEXT: movl $64, %ecx			; BDVER1-NEXT: negl %ecx
	; BDVER1-NEXT: subl %edx, %ecx			; BDVER1-NEXT: # kill: def $cl killed $cl killed $rcx
	; BDVER1-NEXT: # kill: def $cl killed $cl killed $ecx
	; BDVER1-NEXT: shrq %cl, %rsi			; BDVER1-NEXT: shrq %cl, %rsi
	; BDVER1-NEXT: orq %rdi, %rsi			; BDVER1-NEXT: orq %rdi, %rsi
	; BDVER1-NEXT: movq %rsi, %rax			; BDVER1-NEXT: movq %rsi, %rax
	; BDVER1-NEXT: retq			; BDVER1-NEXT: retq
	entry:			entry:
	%shl = shl i64 %a, %c			%shl = shl i64 %a, %c
	%sub = sub nsw i64 64, %c			%sub = sub nsw i64 64, %c
	%shr = lshr i64 %b, %sub			%shr = lshr i64 %b, %sub
	▲ Show 20 Lines • Show All 41 Lines • ▼ Show 20 Lines
	; GENERIC: # %bb.0: # %entry			; GENERIC: # %bb.0: # %entry
	; GENERIC-NEXT: movl %edx, %ecx # sched: [1:0.33]			; GENERIC-NEXT: movl %edx, %ecx # sched: [1:0.33]
	; GENERIC-NEXT: shrdq %cl, %rsi, %rdi # sched: [4:1.50]			; GENERIC-NEXT: shrdq %cl, %rsi, %rdi # sched: [4:1.50]
	; GENERIC-NEXT: movq %rdi, %rax # sched: [1:0.33]			; GENERIC-NEXT: movq %rdi, %rax # sched: [1:0.33]
	; GENERIC-NEXT: retq # sched: [1:1.00]			; GENERIC-NEXT: retq # sched: [1:1.00]
	;			;
	; BTVER2-LABEL: rshift_cl:			; BTVER2-LABEL: rshift_cl:
	; BTVER2: # %bb.0: # %entry			; BTVER2: # %bb.0: # %entry
	; BTVER2-NEXT: movl %edx, %ecx # sched: [1:0.50]			; BTVER2-NEXT: movq %rdx, %rcx # sched: [1:0.50]
	; BTVER2-NEXT: shrq %cl, %rdi # sched: [1:0.50]			; BTVER2-NEXT: shrq %cl, %rdi # sched: [1:0.50]
	; BTVER2-NEXT: movl $64, %ecx # sched: [1:0.50]			; BTVER2-NEXT: negl %ecx # sched: [1:0.50]
	; BTVER2-NEXT: subl %edx, %ecx # sched: [1:0.50]			; BTVER2-NEXT: # kill: def $cl killed $cl killed $rcx
	; BTVER2-NEXT: # kill: def $cl killed $cl killed $ecx
	; BTVER2-NEXT: shlq %cl, %rsi # sched: [1:0.50]			; BTVER2-NEXT: shlq %cl, %rsi # sched: [1:0.50]
	; BTVER2-NEXT: orq %rdi, %rsi # sched: [1:0.50]			; BTVER2-NEXT: orq %rdi, %rsi # sched: [1:0.50]
	; BTVER2-NEXT: movq %rsi, %rax # sched: [1:0.50]			; BTVER2-NEXT: movq %rsi, %rax # sched: [1:0.50]
	; BTVER2-NEXT: retq # sched: [4:1.00]			; BTVER2-NEXT: retq # sched: [4:1.00]
	;			;
	; BDVER1-LABEL: rshift_cl:			; BDVER1-LABEL: rshift_cl:
	; BDVER1: # %bb.0: # %entry			; BDVER1: # %bb.0: # %entry
	; BDVER1-NEXT: movl %edx, %ecx			; BDVER1-NEXT: movq %rdx, %rcx
	; BDVER1-NEXT: shrq %cl, %rdi			; BDVER1-NEXT: shrq %cl, %rdi
	; BDVER1-NEXT: movl $64, %ecx			; BDVER1-NEXT: negl %ecx
	; BDVER1-NEXT: subl %edx, %ecx			; BDVER1-NEXT: # kill: def $cl killed $cl killed $rcx
	; BDVER1-NEXT: # kill: def $cl killed $cl killed $ecx
	; BDVER1-NEXT: shlq %cl, %rsi			; BDVER1-NEXT: shlq %cl, %rsi
	; BDVER1-NEXT: orq %rdi, %rsi			; BDVER1-NEXT: orq %rdi, %rsi
	; BDVER1-NEXT: movq %rsi, %rax			; BDVER1-NEXT: movq %rsi, %rax
	; BDVER1-NEXT: retq			; BDVER1-NEXT: retq
	entry:			entry:
	%shr = lshr i64 %a, %c			%shr = lshr i64 %a, %c
	%sub = sub nsw i64 64, %c			%sub = sub nsw i64 64, %c
	%shl = shl i64 %b, %sub			%shl = shl i64 %b, %sub
	▲ Show 20 Lines • Show All 41 Lines • ▼ Show 20 Lines
	; GENERIC: # %bb.0: # %entry			; GENERIC: # %bb.0: # %entry
	; GENERIC-NEXT: movl %esi, %ecx # sched: [1:0.33]			; GENERIC-NEXT: movl %esi, %ecx # sched: [1:0.33]
	; GENERIC-NEXT: shldq %cl, %rdi, {{.*}}(%rip) # sched: [10:1.50]			; GENERIC-NEXT: shldq %cl, %rdi, {{.*}}(%rip) # sched: [10:1.50]
	; GENERIC-NEXT: retq # sched: [1:1.00]			; GENERIC-NEXT: retq # sched: [1:1.00]
	;			;
	; BTVER2-LABEL: lshift_mem_cl:			; BTVER2-LABEL: lshift_mem_cl:
	; BTVER2: # %bb.0: # %entry			; BTVER2: # %bb.0: # %entry
	; BTVER2-NEXT: movq {{.*}}(%rip), %rax # sched: [5:1.00]			; BTVER2-NEXT: movq {{.*}}(%rip), %rax # sched: [5:1.00]
	; BTVER2-NEXT: movl %esi, %ecx # sched: [1:0.50]			; BTVER2-NEXT: movq %rsi, %rcx # sched: [1:0.50]
	; BTVER2-NEXT: shlq %cl, %rax # sched: [1:0.50]			; BTVER2-NEXT: shlq %cl, %rax # sched: [1:0.50]
	; BTVER2-NEXT: movl $64, %ecx # sched: [1:0.50]			; BTVER2-NEXT: negl %ecx # sched: [1:0.50]
	; BTVER2-NEXT: subl %esi, %ecx # sched: [1:0.50]			; BTVER2-NEXT: # kill: def $cl killed $cl killed $rcx
	; BTVER2-NEXT: # kill: def $cl killed $cl killed $ecx
	; BTVER2-NEXT: shrq %cl, %rdi # sched: [1:0.50]			; BTVER2-NEXT: shrq %cl, %rdi # sched: [1:0.50]
	; BTVER2-NEXT: orq %rax, %rdi # sched: [1:0.50]			; BTVER2-NEXT: orq %rax, %rdi # sched: [1:0.50]
	; BTVER2-NEXT: movq %rdi, {{.*}}(%rip) # sched: [1:1.00]			; BTVER2-NEXT: movq %rdi, {{.*}}(%rip) # sched: [1:1.00]
	; BTVER2-NEXT: retq # sched: [4:1.00]			; BTVER2-NEXT: retq # sched: [4:1.00]
	;			;
	; BDVER1-LABEL: lshift_mem_cl:			; BDVER1-LABEL: lshift_mem_cl:
	; BDVER1: # %bb.0: # %entry			; BDVER1: # %bb.0: # %entry
				; BDVER1-NEXT: movq %rsi, %rcx
	; BDVER1-NEXT: movq {{.*}}(%rip), %rax			; BDVER1-NEXT: movq {{.*}}(%rip), %rax
	; BDVER1-NEXT: movl %esi, %ecx
	; BDVER1-NEXT: shlq %cl, %rax			; BDVER1-NEXT: shlq %cl, %rax
	; BDVER1-NEXT: movl $64, %ecx			; BDVER1-NEXT: negl %ecx
	; BDVER1-NEXT: subl %esi, %ecx			; BDVER1-NEXT: # kill: def $cl killed $cl killed $rcx
	; BDVER1-NEXT: # kill: def $cl killed $cl killed $ecx
	; BDVER1-NEXT: shrq %cl, %rdi			; BDVER1-NEXT: shrq %cl, %rdi
	; BDVER1-NEXT: orq %rax, %rdi			; BDVER1-NEXT: orq %rax, %rdi
	; BDVER1-NEXT: movq %rdi, {{.*}}(%rip)			; BDVER1-NEXT: movq %rdi, {{.*}}(%rip)
	; BDVER1-NEXT: retq			; BDVER1-NEXT: retq
	entry:			entry:
	%b = load i64, i64* @x			%b = load i64, i64* @x
	%shl = shl i64 %b, %c			%shl = shl i64 %b, %c
	%sub = sub nsw i64 64, %c			%sub = sub nsw i64 64, %c
	▲ Show 20 Lines • Show All 126 Lines • Show Last 20 Lines

This is an archive of the discontinued LLVM Phabricator instance.

[X86] Replace (32/64 - n) shift amounts with (neg n) since the shift amount is masked in hardware
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 162025

lib/Target/X86/X86ISelDAGToDAG.cpp

test/CodeGen/X86/clear-lowbits.ll

test/CodeGen/X86/extract-lowbits.ll

test/CodeGen/X86/schedule-x86-64-shld.ll

This is an archive of the discontinued LLVM Phabricator instance.

[X86] Replace (32/64 - n) shift amounts with (neg n) since the shift amount is masked in hardware
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 162025

lib/Target/X86/X86ISelDAGToDAG.cpp

test/CodeGen/X86/clear-lowbits.ll

test/CodeGen/X86/extract-lowbits.ll

test/CodeGen/X86/schedule-x86-64-shld.ll

[X86] Replace (32/64 - n) shift amounts with (neg n) since the shift amount is masked in hardware
ClosedPublic