Diff 150184

llvm/trunk/lib/Target/X86/X86InstrInfo.td

Show First 20 Lines • Show All 2,442 Lines • ▼ Show 20 Lines	def : Pat<(and GR64:$src, AndMask64:$mask),
(MOV8ri (CountTrailingOnes imm:$mask)), sub_8bit))>;		(MOV8ri (CountTrailingOnes imm:$mask)), sub_8bit))>;
def : Pat<(and (loadi64 addr:$src), AndMask64:$mask),		def : Pat<(and (loadi64 addr:$src), AndMask64:$mask),
(BZHI64rm addr:$src,		(BZHI64rm addr:$src,
(INSERT_SUBREG (i64 (IMPLICIT_DEF)),		(INSERT_SUBREG (i64 (IMPLICIT_DEF)),
(MOV8ri (CountTrailingOnes imm:$mask)), sub_8bit))>;		(MOV8ri (CountTrailingOnes imm:$mask)), sub_8bit))>;
}		}

let Predicates = [HasBMI2] in {		let Predicates = [HasBMI2] in {
def : Pat<(and GR32:$src, (add (shl 1, GR8:$lz), -1)),		multiclass _bmi_bzhi_pattern<dag regpattern, dag mempattern, RegisterClass RC,
(BZHI32rr GR32:$src,		ValueType VT, Instruction DstInst,
(INSERT_SUBREG (i32 (IMPLICIT_DEF)), GR8:$lz, sub_8bit))>;		Instruction DstMemInst> {
		def : Pat<regpattern,
def : Pat<(and (loadi32 addr:$src), (add (shl 1, GR8:$lz), -1)),		(DstInst RC:$src,
(BZHI32rm addr:$src,		(INSERT_SUBREG (VT (IMPLICIT_DEF)), GR8:$lz, sub_8bit))>;
(INSERT_SUBREG (i32 (IMPLICIT_DEF)), GR8:$lz, sub_8bit))>;		def : Pat<mempattern,
		(DstMemInst addr:$src,
def : Pat<(and GR64:$src, (add (shl 1, GR8:$lz), -1)),		(INSERT_SUBREG (VT (IMPLICIT_DEF)), GR8:$lz, sub_8bit))>;
(BZHI64rr GR64:$src,		}
(INSERT_SUBREG (i64 (IMPLICIT_DEF)), GR8:$lz, sub_8bit))>;
		multiclass bmi_bzhi_patterns<RegisterClass RC, int bitwidth, ValueType VT,
		Instruction DstInst, X86MemOperand x86memop,
		Instruction DstMemInst> {
		// x & ((1 << y) - 1)
		defm : _bmi_bzhi_pattern<(and RC:$src, (add (shl 1, GR8:$lz), -1)),
		(and (x86memop addr:$src),
		(add (shl 1, GR8:$lz), -1)),
		RC, VT, DstInst, DstMemInst>;

		// x & ~(-1 << y)
		defm : _bmi_bzhi_pattern<(and RC:$src, (xor (shl -1, GR8:$lz), -1)),
		(and (x86memop addr:$src),
		(xor (shl -1, GR8:$lz), -1)),
		RC, VT, DstInst, DstMemInst>;

		// x & (-1 >> (bitwidth - y))
		defm : _bmi_bzhi_pattern<(and RC:$src, (srl -1, (sub bitwidth, GR8:$lz))),
		(and (x86memop addr:$src),
		(srl -1, (sub bitwidth, GR8:$lz))),
		RC, VT, DstInst, DstMemInst>;

		// x << (bitwidth - y) >> (bitwidth - y)
		defm : _bmi_bzhi_pattern<(srl (shl RC:$src, (sub bitwidth, GR8:$lz)),
		(sub bitwidth, GR8:$lz)),
		(srl (shl (x86memop addr:$src),
		(sub bitwidth, GR8:$lz)),
		(sub bitwidth, GR8:$lz)),
		RC, VT, DstInst, DstMemInst>;
		}

def : Pat<(and (loadi64 addr:$src), (add (shl 1, GR8:$lz), -1)),		defm : bmi_bzhi_patterns<GR32, 32, i32, BZHI32rr, loadi32, BZHI32rm>;
(BZHI64rm addr:$src,		defm : bmi_bzhi_patterns<GR64, 64, i64, BZHI64rr, loadi64, BZHI64rm>;
(INSERT_SUBREG (i64 (IMPLICIT_DEF)), GR8:$lz, sub_8bit))>;

// x & (-1 >> (32 - y))		// x & (-1 >> (32 - y))
def : Pat<(and GR32:$src, (srl -1, (i8 (trunc (sub 32, GR32:$lz))))),		def : Pat<(and GR32:$src, (srl -1, (i8 (trunc (sub 32, GR32:$lz))))),
(BZHI32rr GR32:$src, GR32:$lz)>;		(BZHI32rr GR32:$src, GR32:$lz)>;
def : Pat<(and (loadi32 addr:$src), (srl -1, (i8 (trunc (sub 32, GR32:$lz))))),		def : Pat<(and (loadi32 addr:$src), (srl -1, (i8 (trunc (sub 32, GR32:$lz))))),
(BZHI32rm addr:$src, GR32:$lz)>;		(BZHI32rm addr:$src, GR32:$lz)>;

// x & (-1 >> (64 - y))		// x & (-1 >> (64 - y))
▲ Show 20 Lines • Show All 951 Lines • Show Last 20 Lines

llvm/trunk/test/CodeGen/X86/extract-lowbits.ll

	Show First 20 Lines • Show All 531 Lines • ▼ Show 20 Lines
	; X86-NOBMI-NEXT: shll %cl, %eax			; X86-NOBMI-NEXT: shll %cl, %eax
	; X86-NOBMI-NEXT: notl %eax			; X86-NOBMI-NEXT: notl %eax
	; X86-NOBMI-NEXT: andl {{[0-9]+}}(%esp), %eax			; X86-NOBMI-NEXT: andl {{[0-9]+}}(%esp), %eax
	; X86-NOBMI-NEXT: retl			; X86-NOBMI-NEXT: retl
	;			;
	; X86-BMI1BMI2-LABEL: bzhi32_b0:			; X86-BMI1BMI2-LABEL: bzhi32_b0:
	; X86-BMI1BMI2: # %bb.0:			; X86-BMI1BMI2: # %bb.0:
	; X86-BMI1BMI2-NEXT: movb {{[0-9]+}}(%esp), %al			; X86-BMI1BMI2-NEXT: movb {{[0-9]+}}(%esp), %al
	; X86-BMI1BMI2-NEXT: movl $-1, %ecx			; X86-BMI1BMI2-NEXT: bzhil %eax, {{[0-9]+}}(%esp), %eax
	; X86-BMI1BMI2-NEXT: shlxl %eax, %ecx, %eax
	; X86-BMI1BMI2-NEXT: andnl {{[0-9]+}}(%esp), %eax, %eax
	; X86-BMI1BMI2-NEXT: retl			; X86-BMI1BMI2-NEXT: retl
	;			;
	; X64-NOBMI-LABEL: bzhi32_b0:			; X64-NOBMI-LABEL: bzhi32_b0:
	; X64-NOBMI: # %bb.0:			; X64-NOBMI: # %bb.0:
	; X64-NOBMI-NEXT: movl $-1, %eax			; X64-NOBMI-NEXT: movl $-1, %eax
	; X64-NOBMI-NEXT: movl %esi, %ecx			; X64-NOBMI-NEXT: movl %esi, %ecx
	; X64-NOBMI-NEXT: shll %cl, %eax			; X64-NOBMI-NEXT: shll %cl, %eax
	; X64-NOBMI-NEXT: notl %eax			; X64-NOBMI-NEXT: notl %eax
	; X64-NOBMI-NEXT: andl %edi, %eax			; X64-NOBMI-NEXT: andl %edi, %eax
	; X64-NOBMI-NEXT: retq			; X64-NOBMI-NEXT: retq
	;			;
	; X64-BMI1BMI2-LABEL: bzhi32_b0:			; X64-BMI1BMI2-LABEL: bzhi32_b0:
	; X64-BMI1BMI2: # %bb.0:			; X64-BMI1BMI2: # %bb.0:
	; X64-BMI1BMI2-NEXT: movl $-1, %eax			; X64-BMI1BMI2-NEXT: bzhil %esi, %edi, %eax
	; X64-BMI1BMI2-NEXT: shlxl %esi, %eax, %eax
	; X64-BMI1BMI2-NEXT: andnl %edi, %eax, %eax
	; X64-BMI1BMI2-NEXT: retq			; X64-BMI1BMI2-NEXT: retq
	%notmask = shl i32 -1, %numlowbits			%notmask = shl i32 -1, %numlowbits
	%mask = xor i32 %notmask, -1			%mask = xor i32 %notmask, -1
	%masked = and i32 %mask, %val			%masked = and i32 %mask, %val
	ret i32 %masked			ret i32 %masked
	}			}

	define i32 @bzhi32_b1_indexzext(i32 %val, i8 zeroext %numlowbits) nounwind {			define i32 @bzhi32_b1_indexzext(i32 %val, i8 zeroext %numlowbits) nounwind {
	; X86-NOBMI-LABEL: bzhi32_b1_indexzext:			; X86-NOBMI-LABEL: bzhi32_b1_indexzext:
	; X86-NOBMI: # %bb.0:			; X86-NOBMI: # %bb.0:
	; X86-NOBMI-NEXT: movb {{[0-9]+}}(%esp), %cl			; X86-NOBMI-NEXT: movb {{[0-9]+}}(%esp), %cl
	; X86-NOBMI-NEXT: movl $-1, %eax			; X86-NOBMI-NEXT: movl $-1, %eax
	; X86-NOBMI-NEXT: shll %cl, %eax			; X86-NOBMI-NEXT: shll %cl, %eax
	; X86-NOBMI-NEXT: notl %eax			; X86-NOBMI-NEXT: notl %eax
	; X86-NOBMI-NEXT: andl {{[0-9]+}}(%esp), %eax			; X86-NOBMI-NEXT: andl {{[0-9]+}}(%esp), %eax
	; X86-NOBMI-NEXT: retl			; X86-NOBMI-NEXT: retl
	;			;
	; X86-BMI1BMI2-LABEL: bzhi32_b1_indexzext:			; X86-BMI1BMI2-LABEL: bzhi32_b1_indexzext:
	; X86-BMI1BMI2: # %bb.0:			; X86-BMI1BMI2: # %bb.0:
	; X86-BMI1BMI2-NEXT: movb {{[0-9]+}}(%esp), %al			; X86-BMI1BMI2-NEXT: movb {{[0-9]+}}(%esp), %al
	; X86-BMI1BMI2-NEXT: movl $-1, %ecx			; X86-BMI1BMI2-NEXT: bzhil %eax, {{[0-9]+}}(%esp), %eax
	; X86-BMI1BMI2-NEXT: shlxl %eax, %ecx, %eax
	; X86-BMI1BMI2-NEXT: andnl {{[0-9]+}}(%esp), %eax, %eax
	; X86-BMI1BMI2-NEXT: retl			; X86-BMI1BMI2-NEXT: retl
	;			;
	; X64-NOBMI-LABEL: bzhi32_b1_indexzext:			; X64-NOBMI-LABEL: bzhi32_b1_indexzext:
	; X64-NOBMI: # %bb.0:			; X64-NOBMI: # %bb.0:
	; X64-NOBMI-NEXT: movl $-1, %eax			; X64-NOBMI-NEXT: movl $-1, %eax
	; X64-NOBMI-NEXT: movl %esi, %ecx			; X64-NOBMI-NEXT: movl %esi, %ecx
	; X64-NOBMI-NEXT: shll %cl, %eax			; X64-NOBMI-NEXT: shll %cl, %eax
	; X64-NOBMI-NEXT: notl %eax			; X64-NOBMI-NEXT: notl %eax
	; X64-NOBMI-NEXT: andl %edi, %eax			; X64-NOBMI-NEXT: andl %edi, %eax
	; X64-NOBMI-NEXT: retq			; X64-NOBMI-NEXT: retq
	;			;
	; X64-BMI1BMI2-LABEL: bzhi32_b1_indexzext:			; X64-BMI1BMI2-LABEL: bzhi32_b1_indexzext:
	; X64-BMI1BMI2: # %bb.0:			; X64-BMI1BMI2: # %bb.0:
	; X64-BMI1BMI2-NEXT: movl $-1, %eax			; X64-BMI1BMI2-NEXT: bzhil %esi, %edi, %eax
	; X64-BMI1BMI2-NEXT: shlxl %esi, %eax, %eax
	; X64-BMI1BMI2-NEXT: andnl %edi, %eax, %eax
	; X64-BMI1BMI2-NEXT: retq			; X64-BMI1BMI2-NEXT: retq
	%conv = zext i8 %numlowbits to i32			%conv = zext i8 %numlowbits to i32
	%notmask = shl i32 -1, %conv			%notmask = shl i32 -1, %conv
	%mask = xor i32 %notmask, -1			%mask = xor i32 %notmask, -1
	%masked = and i32 %mask, %val			%masked = and i32 %mask, %val
	ret i32 %masked			ret i32 %masked
	}			}

	define i32 @bzhi32_b2_load(i32* %w, i32 %numlowbits) nounwind {			define i32 @bzhi32_b2_load(i32* %w, i32 %numlowbits) nounwind {
	; X86-NOBMI-LABEL: bzhi32_b2_load:			; X86-NOBMI-LABEL: bzhi32_b2_load:
	; X86-NOBMI: # %bb.0:			; X86-NOBMI: # %bb.0:
	; X86-NOBMI-NEXT: movl {{[0-9]+}}(%esp), %edx			; X86-NOBMI-NEXT: movl {{[0-9]+}}(%esp), %edx
	; X86-NOBMI-NEXT: movb {{[0-9]+}}(%esp), %cl			; X86-NOBMI-NEXT: movb {{[0-9]+}}(%esp), %cl
	; X86-NOBMI-NEXT: movl $-1, %eax			; X86-NOBMI-NEXT: movl $-1, %eax
	; X86-NOBMI-NEXT: shll %cl, %eax			; X86-NOBMI-NEXT: shll %cl, %eax
	; X86-NOBMI-NEXT: notl %eax			; X86-NOBMI-NEXT: notl %eax
	; X86-NOBMI-NEXT: andl (%edx), %eax			; X86-NOBMI-NEXT: andl (%edx), %eax
	; X86-NOBMI-NEXT: retl			; X86-NOBMI-NEXT: retl
	;			;
	; X86-BMI1BMI2-LABEL: bzhi32_b2_load:			; X86-BMI1BMI2-LABEL: bzhi32_b2_load:
	; X86-BMI1BMI2: # %bb.0:			; X86-BMI1BMI2: # %bb.0:
	; X86-BMI1BMI2-NEXT: movl {{[0-9]+}}(%esp), %eax			; X86-BMI1BMI2-NEXT: movl {{[0-9]+}}(%esp), %eax
	; X86-BMI1BMI2-NEXT: movb {{[0-9]+}}(%esp), %cl			; X86-BMI1BMI2-NEXT: movb {{[0-9]+}}(%esp), %cl
	; X86-BMI1BMI2-NEXT: movl $-1, %edx			; X86-BMI1BMI2-NEXT: bzhil %ecx, (%eax), %eax
	; X86-BMI1BMI2-NEXT: shlxl %ecx, %edx, %ecx
	; X86-BMI1BMI2-NEXT: andnl (%eax), %ecx, %eax
	; X86-BMI1BMI2-NEXT: retl			; X86-BMI1BMI2-NEXT: retl
	;			;
	; X64-NOBMI-LABEL: bzhi32_b2_load:			; X64-NOBMI-LABEL: bzhi32_b2_load:
	; X64-NOBMI: # %bb.0:			; X64-NOBMI: # %bb.0:
	; X64-NOBMI-NEXT: movl $-1, %eax			; X64-NOBMI-NEXT: movl $-1, %eax
	; X64-NOBMI-NEXT: movl %esi, %ecx			; X64-NOBMI-NEXT: movl %esi, %ecx
	; X64-NOBMI-NEXT: shll %cl, %eax			; X64-NOBMI-NEXT: shll %cl, %eax
	; X64-NOBMI-NEXT: notl %eax			; X64-NOBMI-NEXT: notl %eax
	; X64-NOBMI-NEXT: andl (%rdi), %eax			; X64-NOBMI-NEXT: andl (%rdi), %eax
	; X64-NOBMI-NEXT: retq			; X64-NOBMI-NEXT: retq
	;			;
	; X64-BMI1BMI2-LABEL: bzhi32_b2_load:			; X64-BMI1BMI2-LABEL: bzhi32_b2_load:
	; X64-BMI1BMI2: # %bb.0:			; X64-BMI1BMI2: # %bb.0:
	; X64-BMI1BMI2-NEXT: movl $-1, %eax			; X64-BMI1BMI2-NEXT: bzhil %esi, (%rdi), %eax
	; X64-BMI1BMI2-NEXT: shlxl %esi, %eax, %eax
	; X64-BMI1BMI2-NEXT: andnl (%rdi), %eax, %eax
	; X64-BMI1BMI2-NEXT: retq			; X64-BMI1BMI2-NEXT: retq
	%val = load i32, i32* %w			%val = load i32, i32* %w
	%notmask = shl i32 -1, %numlowbits			%notmask = shl i32 -1, %numlowbits
	%mask = xor i32 %notmask, -1			%mask = xor i32 %notmask, -1
	%masked = and i32 %mask, %val			%masked = and i32 %mask, %val
	ret i32 %masked			ret i32 %masked
	}			}

	define i32 @bzhi32_b3_load_indexzext(i32* %w, i8 zeroext %numlowbits) nounwind {			define i32 @bzhi32_b3_load_indexzext(i32* %w, i8 zeroext %numlowbits) nounwind {
	; X86-NOBMI-LABEL: bzhi32_b3_load_indexzext:			; X86-NOBMI-LABEL: bzhi32_b3_load_indexzext:
	; X86-NOBMI: # %bb.0:			; X86-NOBMI: # %bb.0:
	; X86-NOBMI-NEXT: movl {{[0-9]+}}(%esp), %edx			; X86-NOBMI-NEXT: movl {{[0-9]+}}(%esp), %edx
	; X86-NOBMI-NEXT: movb {{[0-9]+}}(%esp), %cl			; X86-NOBMI-NEXT: movb {{[0-9]+}}(%esp), %cl
	; X86-NOBMI-NEXT: movl $-1, %eax			; X86-NOBMI-NEXT: movl $-1, %eax
	; X86-NOBMI-NEXT: shll %cl, %eax			; X86-NOBMI-NEXT: shll %cl, %eax
	; X86-NOBMI-NEXT: notl %eax			; X86-NOBMI-NEXT: notl %eax
	; X86-NOBMI-NEXT: andl (%edx), %eax			; X86-NOBMI-NEXT: andl (%edx), %eax
	; X86-NOBMI-NEXT: retl			; X86-NOBMI-NEXT: retl
	;			;
	; X86-BMI1BMI2-LABEL: bzhi32_b3_load_indexzext:			; X86-BMI1BMI2-LABEL: bzhi32_b3_load_indexzext:
	; X86-BMI1BMI2: # %bb.0:			; X86-BMI1BMI2: # %bb.0:
	; X86-BMI1BMI2-NEXT: movl {{[0-9]+}}(%esp), %eax			; X86-BMI1BMI2-NEXT: movl {{[0-9]+}}(%esp), %eax
	; X86-BMI1BMI2-NEXT: movb {{[0-9]+}}(%esp), %cl			; X86-BMI1BMI2-NEXT: movb {{[0-9]+}}(%esp), %cl
	; X86-BMI1BMI2-NEXT: movl $-1, %edx			; X86-BMI1BMI2-NEXT: bzhil %ecx, (%eax), %eax
	; X86-BMI1BMI2-NEXT: shlxl %ecx, %edx, %ecx
	; X86-BMI1BMI2-NEXT: andnl (%eax), %ecx, %eax
	; X86-BMI1BMI2-NEXT: retl			; X86-BMI1BMI2-NEXT: retl
	;			;
	; X64-NOBMI-LABEL: bzhi32_b3_load_indexzext:			; X64-NOBMI-LABEL: bzhi32_b3_load_indexzext:
	; X64-NOBMI: # %bb.0:			; X64-NOBMI: # %bb.0:
	; X64-NOBMI-NEXT: movl $-1, %eax			; X64-NOBMI-NEXT: movl $-1, %eax
	; X64-NOBMI-NEXT: movl %esi, %ecx			; X64-NOBMI-NEXT: movl %esi, %ecx
	; X64-NOBMI-NEXT: shll %cl, %eax			; X64-NOBMI-NEXT: shll %cl, %eax
	; X64-NOBMI-NEXT: notl %eax			; X64-NOBMI-NEXT: notl %eax
	; X64-NOBMI-NEXT: andl (%rdi), %eax			; X64-NOBMI-NEXT: andl (%rdi), %eax
	; X64-NOBMI-NEXT: retq			; X64-NOBMI-NEXT: retq
	;			;
	; X64-BMI1BMI2-LABEL: bzhi32_b3_load_indexzext:			; X64-BMI1BMI2-LABEL: bzhi32_b3_load_indexzext:
	; X64-BMI1BMI2: # %bb.0:			; X64-BMI1BMI2: # %bb.0:
	; X64-BMI1BMI2-NEXT: movl $-1, %eax			; X64-BMI1BMI2-NEXT: bzhil %esi, (%rdi), %eax
	; X64-BMI1BMI2-NEXT: shlxl %esi, %eax, %eax
	; X64-BMI1BMI2-NEXT: andnl (%rdi), %eax, %eax
	; X64-BMI1BMI2-NEXT: retq			; X64-BMI1BMI2-NEXT: retq
	%val = load i32, i32* %w			%val = load i32, i32* %w
	%conv = zext i8 %numlowbits to i32			%conv = zext i8 %numlowbits to i32
	%notmask = shl i32 -1, %conv			%notmask = shl i32 -1, %conv
	%mask = xor i32 %notmask, -1			%mask = xor i32 %notmask, -1
	%masked = and i32 %mask, %val			%masked = and i32 %mask, %val
	ret i32 %masked			ret i32 %masked
	}			}

	define i32 @bzhi32_b4_commutative(i32 %val, i32 %numlowbits) nounwind {			define i32 @bzhi32_b4_commutative(i32 %val, i32 %numlowbits) nounwind {
	; X86-NOBMI-LABEL: bzhi32_b4_commutative:			; X86-NOBMI-LABEL: bzhi32_b4_commutative:
	; X86-NOBMI: # %bb.0:			; X86-NOBMI: # %bb.0:
	; X86-NOBMI-NEXT: movb {{[0-9]+}}(%esp), %cl			; X86-NOBMI-NEXT: movb {{[0-9]+}}(%esp), %cl
	; X86-NOBMI-NEXT: movl $-1, %eax			; X86-NOBMI-NEXT: movl $-1, %eax
	; X86-NOBMI-NEXT: shll %cl, %eax			; X86-NOBMI-NEXT: shll %cl, %eax
	; X86-NOBMI-NEXT: notl %eax			; X86-NOBMI-NEXT: notl %eax
	; X86-NOBMI-NEXT: andl {{[0-9]+}}(%esp), %eax			; X86-NOBMI-NEXT: andl {{[0-9]+}}(%esp), %eax
	; X86-NOBMI-NEXT: retl			; X86-NOBMI-NEXT: retl
	;			;
	; X86-BMI1BMI2-LABEL: bzhi32_b4_commutative:			; X86-BMI1BMI2-LABEL: bzhi32_b4_commutative:
	; X86-BMI1BMI2: # %bb.0:			; X86-BMI1BMI2: # %bb.0:
	; X86-BMI1BMI2-NEXT: movb {{[0-9]+}}(%esp), %al			; X86-BMI1BMI2-NEXT: movb {{[0-9]+}}(%esp), %al
	; X86-BMI1BMI2-NEXT: movl $-1, %ecx			; X86-BMI1BMI2-NEXT: bzhil %eax, {{[0-9]+}}(%esp), %eax
	; X86-BMI1BMI2-NEXT: shlxl %eax, %ecx, %eax
	; X86-BMI1BMI2-NEXT: andnl {{[0-9]+}}(%esp), %eax, %eax
	; X86-BMI1BMI2-NEXT: retl			; X86-BMI1BMI2-NEXT: retl
	;			;
	; X64-NOBMI-LABEL: bzhi32_b4_commutative:			; X64-NOBMI-LABEL: bzhi32_b4_commutative:
	; X64-NOBMI: # %bb.0:			; X64-NOBMI: # %bb.0:
	; X64-NOBMI-NEXT: movl $-1, %eax			; X64-NOBMI-NEXT: movl $-1, %eax
	; X64-NOBMI-NEXT: movl %esi, %ecx			; X64-NOBMI-NEXT: movl %esi, %ecx
	; X64-NOBMI-NEXT: shll %cl, %eax			; X64-NOBMI-NEXT: shll %cl, %eax
	; X64-NOBMI-NEXT: notl %eax			; X64-NOBMI-NEXT: notl %eax
	; X64-NOBMI-NEXT: andl %edi, %eax			; X64-NOBMI-NEXT: andl %edi, %eax
	; X64-NOBMI-NEXT: retq			; X64-NOBMI-NEXT: retq
	;			;
	; X64-BMI1BMI2-LABEL: bzhi32_b4_commutative:			; X64-BMI1BMI2-LABEL: bzhi32_b4_commutative:
	; X64-BMI1BMI2: # %bb.0:			; X64-BMI1BMI2: # %bb.0:
	; X64-BMI1BMI2-NEXT: movl $-1, %eax			; X64-BMI1BMI2-NEXT: bzhil %esi, %edi, %eax
	; X64-BMI1BMI2-NEXT: shlxl %esi, %eax, %eax
	; X64-BMI1BMI2-NEXT: andnl %edi, %eax, %eax
	; X64-BMI1BMI2-NEXT: retq			; X64-BMI1BMI2-NEXT: retq
	%notmask = shl i32 -1, %numlowbits			%notmask = shl i32 -1, %numlowbits
	%mask = xor i32 %notmask, -1			%mask = xor i32 %notmask, -1
	%masked = and i32 %val, %mask ; swapped order			%masked = and i32 %val, %mask ; swapped order
	ret i32 %masked			ret i32 %masked
	}			}

	; 64-bit			; 64-bit
	▲ Show 20 Lines • Show All 42 Lines • ▼ Show 20 Lines
	; X64-NOBMI-NEXT: movl %esi, %ecx			; X64-NOBMI-NEXT: movl %esi, %ecx
	; X64-NOBMI-NEXT: shlq %cl, %rax			; X64-NOBMI-NEXT: shlq %cl, %rax
	; X64-NOBMI-NEXT: notq %rax			; X64-NOBMI-NEXT: notq %rax
	; X64-NOBMI-NEXT: andq %rdi, %rax			; X64-NOBMI-NEXT: andq %rdi, %rax
	; X64-NOBMI-NEXT: retq			; X64-NOBMI-NEXT: retq
	;			;
	; X64-BMI1BMI2-LABEL: bzhi64_b0:			; X64-BMI1BMI2-LABEL: bzhi64_b0:
	; X64-BMI1BMI2: # %bb.0:			; X64-BMI1BMI2: # %bb.0:
	; X64-BMI1BMI2-NEXT: movq $-1, %rax			; X64-BMI1BMI2-NEXT: bzhiq %rsi, %rdi, %rax
	; X64-BMI1BMI2-NEXT: shlxq %rsi, %rax, %rax
	; X64-BMI1BMI2-NEXT: andnq %rdi, %rax, %rax
	; X64-BMI1BMI2-NEXT: retq			; X64-BMI1BMI2-NEXT: retq
	%notmask = shl i64 -1, %numlowbits			%notmask = shl i64 -1, %numlowbits
	%mask = xor i64 %notmask, -1			%mask = xor i64 %notmask, -1
	%masked = and i64 %mask, %val			%masked = and i64 %mask, %val
	ret i64 %masked			ret i64 %masked
	}			}

	define i64 @bzhi64_b1_indexzext(i64 %val, i8 zeroext %numlowbits) nounwind {			define i64 @bzhi64_b1_indexzext(i64 %val, i8 zeroext %numlowbits) nounwind {
	▲ Show 20 Lines • Show All 41 Lines • ▼ Show 20 Lines
	; X64-NOBMI-NEXT: shlq %cl, %rax			; X64-NOBMI-NEXT: shlq %cl, %rax
	; X64-NOBMI-NEXT: notq %rax			; X64-NOBMI-NEXT: notq %rax
	; X64-NOBMI-NEXT: andq %rdi, %rax			; X64-NOBMI-NEXT: andq %rdi, %rax
	; X64-NOBMI-NEXT: retq			; X64-NOBMI-NEXT: retq
	;			;
	; X64-BMI1BMI2-LABEL: bzhi64_b1_indexzext:			; X64-BMI1BMI2-LABEL: bzhi64_b1_indexzext:
	; X64-BMI1BMI2: # %bb.0:			; X64-BMI1BMI2: # %bb.0:
	; X64-BMI1BMI2-NEXT: # kill: def $esi killed $esi def $rsi			; X64-BMI1BMI2-NEXT: # kill: def $esi killed $esi def $rsi
	; X64-BMI1BMI2-NEXT: movq $-1, %rax			; X64-BMI1BMI2-NEXT: bzhiq %rsi, %rdi, %rax
	; X64-BMI1BMI2-NEXT: shlxq %rsi, %rax, %rax
	; X64-BMI1BMI2-NEXT: andnq %rdi, %rax, %rax
	; X64-BMI1BMI2-NEXT: retq			; X64-BMI1BMI2-NEXT: retq
	%conv = zext i8 %numlowbits to i64			%conv = zext i8 %numlowbits to i64
	%notmask = shl i64 -1, %conv			%notmask = shl i64 -1, %conv
	%mask = xor i64 %notmask, -1			%mask = xor i64 %notmask, -1
	%masked = and i64 %mask, %val			%masked = and i64 %mask, %val
	ret i64 %masked			ret i64 %masked
	}			}

	▲ Show 20 Lines • Show All 45 Lines • ▼ Show 20 Lines
	; X64-NOBMI-NEXT: movl %esi, %ecx			; X64-NOBMI-NEXT: movl %esi, %ecx
	; X64-NOBMI-NEXT: shlq %cl, %rax			; X64-NOBMI-NEXT: shlq %cl, %rax
	; X64-NOBMI-NEXT: notq %rax			; X64-NOBMI-NEXT: notq %rax
	; X64-NOBMI-NEXT: andq (%rdi), %rax			; X64-NOBMI-NEXT: andq (%rdi), %rax
	; X64-NOBMI-NEXT: retq			; X64-NOBMI-NEXT: retq
	;			;
	; X64-BMI1BMI2-LABEL: bzhi64_b2_load:			; X64-BMI1BMI2-LABEL: bzhi64_b2_load:
	; X64-BMI1BMI2: # %bb.0:			; X64-BMI1BMI2: # %bb.0:
	; X64-BMI1BMI2-NEXT: movq $-1, %rax			; X64-BMI1BMI2-NEXT: bzhiq %rsi, (%rdi), %rax
	; X64-BMI1BMI2-NEXT: shlxq %rsi, %rax, %rax
	; X64-BMI1BMI2-NEXT: andnq (%rdi), %rax, %rax
	; X64-BMI1BMI2-NEXT: retq			; X64-BMI1BMI2-NEXT: retq
	%val = load i64, i64* %w			%val = load i64, i64* %w
	%notmask = shl i64 -1, %numlowbits			%notmask = shl i64 -1, %numlowbits
	%mask = xor i64 %notmask, -1			%mask = xor i64 %notmask, -1
	%masked = and i64 %mask, %val			%masked = and i64 %mask, %val
	ret i64 %masked			ret i64 %masked
	}			}

	▲ Show 20 Lines • Show All 46 Lines • ▼ Show 20 Lines
	; X64-NOBMI-NEXT: shlq %cl, %rax			; X64-NOBMI-NEXT: shlq %cl, %rax
	; X64-NOBMI-NEXT: notq %rax			; X64-NOBMI-NEXT: notq %rax
	; X64-NOBMI-NEXT: andq (%rdi), %rax			; X64-NOBMI-NEXT: andq (%rdi), %rax
	; X64-NOBMI-NEXT: retq			; X64-NOBMI-NEXT: retq
	;			;
	; X64-BMI1BMI2-LABEL: bzhi64_b3_load_indexzext:			; X64-BMI1BMI2-LABEL: bzhi64_b3_load_indexzext:
	; X64-BMI1BMI2: # %bb.0:			; X64-BMI1BMI2: # %bb.0:
	; X64-BMI1BMI2-NEXT: # kill: def $esi killed $esi def $rsi			; X64-BMI1BMI2-NEXT: # kill: def $esi killed $esi def $rsi
	; X64-BMI1BMI2-NEXT: movq $-1, %rax			; X64-BMI1BMI2-NEXT: bzhiq %rsi, (%rdi), %rax
	; X64-BMI1BMI2-NEXT: shlxq %rsi, %rax, %rax
	; X64-BMI1BMI2-NEXT: andnq (%rdi), %rax, %rax
	; X64-BMI1BMI2-NEXT: retq			; X64-BMI1BMI2-NEXT: retq
	%val = load i64, i64* %w			%val = load i64, i64* %w
	%conv = zext i8 %numlowbits to i64			%conv = zext i8 %numlowbits to i64
	%notmask = shl i64 -1, %conv			%notmask = shl i64 -1, %conv
	%mask = xor i64 %notmask, -1			%mask = xor i64 %notmask, -1
	%masked = and i64 %mask, %val			%masked = and i64 %mask, %val
	ret i64 %masked			ret i64 %masked
	}			}
	▲ Show 20 Lines • Show All 42 Lines • ▼ Show 20 Lines
	; X64-NOBMI-NEXT: movl %esi, %ecx			; X64-NOBMI-NEXT: movl %esi, %ecx
	; X64-NOBMI-NEXT: shlq %cl, %rax			; X64-NOBMI-NEXT: shlq %cl, %rax
	; X64-NOBMI-NEXT: notq %rax			; X64-NOBMI-NEXT: notq %rax
	; X64-NOBMI-NEXT: andq %rdi, %rax			; X64-NOBMI-NEXT: andq %rdi, %rax
	; X64-NOBMI-NEXT: retq			; X64-NOBMI-NEXT: retq
	;			;
	; X64-BMI1BMI2-LABEL: bzhi64_b4_commutative:			; X64-BMI1BMI2-LABEL: bzhi64_b4_commutative:
	; X64-BMI1BMI2: # %bb.0:			; X64-BMI1BMI2: # %bb.0:
	; X64-BMI1BMI2-NEXT: movq $-1, %rax			; X64-BMI1BMI2-NEXT: bzhiq %rsi, %rdi, %rax
	; X64-BMI1BMI2-NEXT: shlxq %rsi, %rax, %rax
	; X64-BMI1BMI2-NEXT: andnq %rdi, %rax, %rax
	; X64-BMI1BMI2-NEXT: retq			; X64-BMI1BMI2-NEXT: retq
	%notmask = shl i64 -1, %numlowbits			%notmask = shl i64 -1, %numlowbits
	%mask = xor i64 %notmask, -1			%mask = xor i64 %notmask, -1
	%masked = and i64 %val, %mask ; swapped order			%masked = and i64 %val, %mask ; swapped order
	ret i64 %masked			ret i64 %masked
	}			}

	; ---------------------------------------------------------------------------- ;			; ---------------------------------------------------------------------------- ;
	▲ Show 20 Lines • Show All 44 Lines • ▼ Show 20 Lines
	; X86-NOBMI-NEXT: subb {{[0-9]+}}(%esp), %cl			; X86-NOBMI-NEXT: subb {{[0-9]+}}(%esp), %cl
	; X86-NOBMI-NEXT: movl $-1, %eax			; X86-NOBMI-NEXT: movl $-1, %eax
	; X86-NOBMI-NEXT: shrl %cl, %eax			; X86-NOBMI-NEXT: shrl %cl, %eax
	; X86-NOBMI-NEXT: andl {{[0-9]+}}(%esp), %eax			; X86-NOBMI-NEXT: andl {{[0-9]+}}(%esp), %eax
	; X86-NOBMI-NEXT: retl			; X86-NOBMI-NEXT: retl
	;			;
	; X86-BMI1BMI2-LABEL: bzhi32_c1_indexzext:			; X86-BMI1BMI2-LABEL: bzhi32_c1_indexzext:
	; X86-BMI1BMI2: # %bb.0:			; X86-BMI1BMI2: # %bb.0:
	; X86-BMI1BMI2-NEXT: movb $32, %al			; X86-BMI1BMI2-NEXT: movb {{[0-9]+}}(%esp), %al
	; X86-BMI1BMI2-NEXT: subb {{[0-9]+}}(%esp), %al			; X86-BMI1BMI2-NEXT: bzhil %eax, {{[0-9]+}}(%esp), %eax
	; X86-BMI1BMI2-NEXT: movl $-1, %ecx
	; X86-BMI1BMI2-NEXT: shrxl %eax, %ecx, %eax
	; X86-BMI1BMI2-NEXT: andl {{[0-9]+}}(%esp), %eax
	; X86-BMI1BMI2-NEXT: retl			; X86-BMI1BMI2-NEXT: retl
	;			;
	; X64-NOBMI-LABEL: bzhi32_c1_indexzext:			; X64-NOBMI-LABEL: bzhi32_c1_indexzext:
	; X64-NOBMI: # %bb.0:			; X64-NOBMI: # %bb.0:
	; X64-NOBMI-NEXT: movb $32, %cl			; X64-NOBMI-NEXT: movb $32, %cl
	; X64-NOBMI-NEXT: subb %sil, %cl			; X64-NOBMI-NEXT: subb %sil, %cl
	; X64-NOBMI-NEXT: movl $-1, %eax			; X64-NOBMI-NEXT: movl $-1, %eax
	; X64-NOBMI-NEXT: shrl %cl, %eax			; X64-NOBMI-NEXT: shrl %cl, %eax
	; X64-NOBMI-NEXT: andl %edi, %eax			; X64-NOBMI-NEXT: andl %edi, %eax
	; X64-NOBMI-NEXT: retq			; X64-NOBMI-NEXT: retq
	;			;
	; X64-BMI1BMI2-LABEL: bzhi32_c1_indexzext:			; X64-BMI1BMI2-LABEL: bzhi32_c1_indexzext:
	; X64-BMI1BMI2: # %bb.0:			; X64-BMI1BMI2: # %bb.0:
	; X64-BMI1BMI2-NEXT: movb $32, %al			; X64-BMI1BMI2-NEXT: bzhil %esi, %edi, %eax
	; X64-BMI1BMI2-NEXT: subb %sil, %al
	; X64-BMI1BMI2-NEXT: movl $-1, %ecx
	; X64-BMI1BMI2-NEXT: shrxl %eax, %ecx, %eax
	; X64-BMI1BMI2-NEXT: andl %edi, %eax
	; X64-BMI1BMI2-NEXT: retq			; X64-BMI1BMI2-NEXT: retq
	%numhighbits = sub i8 32, %numlowbits			%numhighbits = sub i8 32, %numlowbits
	%sh_prom = zext i8 %numhighbits to i32			%sh_prom = zext i8 %numhighbits to i32
	%mask = lshr i32 -1, %sh_prom			%mask = lshr i32 -1, %sh_prom
	%masked = and i32 %mask, %val			%masked = and i32 %mask, %val
	ret i32 %masked			ret i32 %masked
	}			}

	▲ Show 20 Lines • Show All 45 Lines • ▼ Show 20 Lines
	; X86-NOBMI-NEXT: subb {{[0-9]+}}(%esp), %cl			; X86-NOBMI-NEXT: subb {{[0-9]+}}(%esp), %cl
	; X86-NOBMI-NEXT: movl $-1, %eax			; X86-NOBMI-NEXT: movl $-1, %eax
	; X86-NOBMI-NEXT: shrl %cl, %eax			; X86-NOBMI-NEXT: shrl %cl, %eax
	; X86-NOBMI-NEXT: andl (%edx), %eax			; X86-NOBMI-NEXT: andl (%edx), %eax
	; X86-NOBMI-NEXT: retl			; X86-NOBMI-NEXT: retl
	;			;
	; X86-BMI1BMI2-LABEL: bzhi32_c3_load_indexzext:			; X86-BMI1BMI2-LABEL: bzhi32_c3_load_indexzext:
	; X86-BMI1BMI2: # %bb.0:			; X86-BMI1BMI2: # %bb.0:
	; X86-BMI1BMI2-NEXT: movl {{[0-9]+}}(%esp), %ecx			; X86-BMI1BMI2-NEXT: movl {{[0-9]+}}(%esp), %eax
	; X86-BMI1BMI2-NEXT: movb $32, %al			; X86-BMI1BMI2-NEXT: movb {{[0-9]+}}(%esp), %cl
	; X86-BMI1BMI2-NEXT: subb {{[0-9]+}}(%esp), %al			; X86-BMI1BMI2-NEXT: bzhil %ecx, (%eax), %eax
	; X86-BMI1BMI2-NEXT: movl $-1, %edx
	; X86-BMI1BMI2-NEXT: shrxl %eax, %edx, %eax
	; X86-BMI1BMI2-NEXT: andl (%ecx), %eax
	; X86-BMI1BMI2-NEXT: retl			; X86-BMI1BMI2-NEXT: retl
	;			;
	; X64-NOBMI-LABEL: bzhi32_c3_load_indexzext:			; X64-NOBMI-LABEL: bzhi32_c3_load_indexzext:
	; X64-NOBMI: # %bb.0:			; X64-NOBMI: # %bb.0:
	; X64-NOBMI-NEXT: movb $32, %cl			; X64-NOBMI-NEXT: movb $32, %cl
	; X64-NOBMI-NEXT: subb %sil, %cl			; X64-NOBMI-NEXT: subb %sil, %cl
	; X64-NOBMI-NEXT: movl $-1, %eax			; X64-NOBMI-NEXT: movl $-1, %eax
	; X64-NOBMI-NEXT: shrl %cl, %eax			; X64-NOBMI-NEXT: shrl %cl, %eax
	; X64-NOBMI-NEXT: andl (%rdi), %eax			; X64-NOBMI-NEXT: andl (%rdi), %eax
	; X64-NOBMI-NEXT: retq			; X64-NOBMI-NEXT: retq
	;			;
	; X64-BMI1BMI2-LABEL: bzhi32_c3_load_indexzext:			; X64-BMI1BMI2-LABEL: bzhi32_c3_load_indexzext:
	; X64-BMI1BMI2: # %bb.0:			; X64-BMI1BMI2: # %bb.0:
	; X64-BMI1BMI2-NEXT: movb $32, %al			; X64-BMI1BMI2-NEXT: bzhil %esi, (%rdi), %eax
	; X64-BMI1BMI2-NEXT: subb %sil, %al
	; X64-BMI1BMI2-NEXT: movl $-1, %ecx
	; X64-BMI1BMI2-NEXT: shrxl %eax, %ecx, %eax
	; X64-BMI1BMI2-NEXT: andl (%rdi), %eax
	; X64-BMI1BMI2-NEXT: retq			; X64-BMI1BMI2-NEXT: retq
	%val = load i32, i32* %w			%val = load i32, i32* %w
	%numhighbits = sub i8 32, %numlowbits			%numhighbits = sub i8 32, %numlowbits
	%sh_prom = zext i8 %numhighbits to i32			%sh_prom = zext i8 %numhighbits to i32
	%mask = lshr i32 -1, %sh_prom			%mask = lshr i32 -1, %sh_prom
	%masked = and i32 %mask, %val			%masked = and i32 %mask, %val
	ret i32 %masked			ret i32 %masked
	}			}
	▲ Show 20 Lines • Show All 135 Lines • ▼ Show 20 Lines
	; X64-NOBMI-NEXT: subb %sil, %cl			; X64-NOBMI-NEXT: subb %sil, %cl
	; X64-NOBMI-NEXT: movq $-1, %rax			; X64-NOBMI-NEXT: movq $-1, %rax
	; X64-NOBMI-NEXT: shrq %cl, %rax			; X64-NOBMI-NEXT: shrq %cl, %rax
	; X64-NOBMI-NEXT: andq %rdi, %rax			; X64-NOBMI-NEXT: andq %rdi, %rax
	; X64-NOBMI-NEXT: retq			; X64-NOBMI-NEXT: retq
	;			;
	; X64-BMI1BMI2-LABEL: bzhi64_c1_indexzext:			; X64-BMI1BMI2-LABEL: bzhi64_c1_indexzext:
	; X64-BMI1BMI2: # %bb.0:			; X64-BMI1BMI2: # %bb.0:
	; X64-BMI1BMI2-NEXT: movb $64, %al			; X64-BMI1BMI2-NEXT: # kill: def $esi killed $esi def $rsi
	; X64-BMI1BMI2-NEXT: subb %sil, %al			; X64-BMI1BMI2-NEXT: bzhiq %rsi, %rdi, %rax
	; X64-BMI1BMI2-NEXT: movq $-1, %rcx
	; X64-BMI1BMI2-NEXT: shrxq %rax, %rcx, %rax
	; X64-BMI1BMI2-NEXT: andq %rdi, %rax
	; X64-BMI1BMI2-NEXT: retq			; X64-BMI1BMI2-NEXT: retq
	%numhighbits = sub i8 64, %numlowbits			%numhighbits = sub i8 64, %numlowbits
	%sh_prom = zext i8 %numhighbits to i64			%sh_prom = zext i8 %numhighbits to i64
	%mask = lshr i64 -1, %sh_prom			%mask = lshr i64 -1, %sh_prom
	%masked = and i64 %mask, %val			%masked = and i64 %mask, %val
	ret i64 %masked			ret i64 %masked
	}			}

	▲ Show 20 Lines • Show All 108 Lines • ▼ Show 20 Lines
	; X64-NOBMI-NEXT: subb %sil, %cl			; X64-NOBMI-NEXT: subb %sil, %cl
	; X64-NOBMI-NEXT: movq $-1, %rax			; X64-NOBMI-NEXT: movq $-1, %rax
	; X64-NOBMI-NEXT: shrq %cl, %rax			; X64-NOBMI-NEXT: shrq %cl, %rax
	; X64-NOBMI-NEXT: andq (%rdi), %rax			; X64-NOBMI-NEXT: andq (%rdi), %rax
	; X64-NOBMI-NEXT: retq			; X64-NOBMI-NEXT: retq
	;			;
	; X64-BMI1BMI2-LABEL: bzhi64_c3_load_indexzext:			; X64-BMI1BMI2-LABEL: bzhi64_c3_load_indexzext:
	; X64-BMI1BMI2: # %bb.0:			; X64-BMI1BMI2: # %bb.0:
	; X64-BMI1BMI2-NEXT: movb $64, %al			; X64-BMI1BMI2-NEXT: # kill: def $esi killed $esi def $rsi
	; X64-BMI1BMI2-NEXT: subb %sil, %al			; X64-BMI1BMI2-NEXT: bzhiq %rsi, (%rdi), %rax
	; X64-BMI1BMI2-NEXT: movq $-1, %rcx
	; X64-BMI1BMI2-NEXT: shrxq %rax, %rcx, %rax
	; X64-BMI1BMI2-NEXT: andq (%rdi), %rax
	; X64-BMI1BMI2-NEXT: retq			; X64-BMI1BMI2-NEXT: retq
	%val = load i64, i64* %w			%val = load i64, i64* %w
	%numhighbits = sub i8 64, %numlowbits			%numhighbits = sub i8 64, %numlowbits
	%sh_prom = zext i8 %numhighbits to i64			%sh_prom = zext i8 %numhighbits to i64
	%mask = lshr i64 -1, %sh_prom			%mask = lshr i64 -1, %sh_prom
	%masked = and i64 %mask, %val			%masked = and i64 %mask, %val
	ret i64 %masked			ret i64 %masked
	}			}
	▲ Show 20 Lines • Show All 102 Lines • ▼ Show 20 Lines
	; X86-NOBMI-NEXT: movb $32, %cl			; X86-NOBMI-NEXT: movb $32, %cl
	; X86-NOBMI-NEXT: subb {{[0-9]+}}(%esp), %cl			; X86-NOBMI-NEXT: subb {{[0-9]+}}(%esp), %cl
	; X86-NOBMI-NEXT: shll %cl, %eax			; X86-NOBMI-NEXT: shll %cl, %eax
	; X86-NOBMI-NEXT: shrl %cl, %eax			; X86-NOBMI-NEXT: shrl %cl, %eax
	; X86-NOBMI-NEXT: retl			; X86-NOBMI-NEXT: retl
	;			;
	; X86-BMI1BMI2-LABEL: bzhi32_d1_indexzext:			; X86-BMI1BMI2-LABEL: bzhi32_d1_indexzext:
	; X86-BMI1BMI2: # %bb.0:			; X86-BMI1BMI2: # %bb.0:
	; X86-BMI1BMI2-NEXT: movb $32, %al			; X86-BMI1BMI2-NEXT: movb {{[0-9]+}}(%esp), %al
	; X86-BMI1BMI2-NEXT: subb {{[0-9]+}}(%esp), %al			; X86-BMI1BMI2-NEXT: bzhil %eax, {{[0-9]+}}(%esp), %eax
	; X86-BMI1BMI2-NEXT: shlxl %eax, {{[0-9]+}}(%esp), %ecx
	; X86-BMI1BMI2-NEXT: shrxl %eax, %ecx, %eax
	; X86-BMI1BMI2-NEXT: retl			; X86-BMI1BMI2-NEXT: retl
	;			;
	; X64-NOBMI-LABEL: bzhi32_d1_indexzext:			; X64-NOBMI-LABEL: bzhi32_d1_indexzext:
	; X64-NOBMI: # %bb.0:			; X64-NOBMI: # %bb.0:
	; X64-NOBMI-NEXT: movb $32, %cl			; X64-NOBMI-NEXT: movb $32, %cl
	; X64-NOBMI-NEXT: subb %sil, %cl			; X64-NOBMI-NEXT: subb %sil, %cl
	; X64-NOBMI-NEXT: shll %cl, %edi			; X64-NOBMI-NEXT: shll %cl, %edi
	; X64-NOBMI-NEXT: shrl %cl, %edi			; X64-NOBMI-NEXT: shrl %cl, %edi
	; X64-NOBMI-NEXT: movl %edi, %eax			; X64-NOBMI-NEXT: movl %edi, %eax
	; X64-NOBMI-NEXT: retq			; X64-NOBMI-NEXT: retq
	;			;
	; X64-BMI1BMI2-LABEL: bzhi32_d1_indexzext:			; X64-BMI1BMI2-LABEL: bzhi32_d1_indexzext:
	; X64-BMI1BMI2: # %bb.0:			; X64-BMI1BMI2: # %bb.0:
	; X64-BMI1BMI2-NEXT: movb $32, %al			; X64-BMI1BMI2-NEXT: bzhil %esi, %edi, %eax
	; X64-BMI1BMI2-NEXT: subb %sil, %al
	; X64-BMI1BMI2-NEXT: shlxl %eax, %edi, %ecx
	; X64-BMI1BMI2-NEXT: shrxl %eax, %ecx, %eax
	; X64-BMI1BMI2-NEXT: retq			; X64-BMI1BMI2-NEXT: retq
	%numhighbits = sub i8 32, %numlowbits			%numhighbits = sub i8 32, %numlowbits
	%sh_prom = zext i8 %numhighbits to i32			%sh_prom = zext i8 %numhighbits to i32
	%highbitscleared = shl i32 %val, %sh_prom			%highbitscleared = shl i32 %val, %sh_prom
	%masked = lshr i32 %highbitscleared, %sh_prom			%masked = lshr i32 %highbitscleared, %sh_prom
	ret i32 %masked			ret i32 %masked
	}			}

	▲ Show 20 Lines • Show All 46 Lines • ▼ Show 20 Lines
	; X86-NOBMI-NEXT: subb {{[0-9]+}}(%esp), %cl			; X86-NOBMI-NEXT: subb {{[0-9]+}}(%esp), %cl
	; X86-NOBMI-NEXT: shll %cl, %eax			; X86-NOBMI-NEXT: shll %cl, %eax
	; X86-NOBMI-NEXT: shrl %cl, %eax			; X86-NOBMI-NEXT: shrl %cl, %eax
	; X86-NOBMI-NEXT: retl			; X86-NOBMI-NEXT: retl
	;			;
	; X86-BMI1BMI2-LABEL: bzhi32_d3_load_indexzext:			; X86-BMI1BMI2-LABEL: bzhi32_d3_load_indexzext:
	; X86-BMI1BMI2: # %bb.0:			; X86-BMI1BMI2: # %bb.0:
	; X86-BMI1BMI2-NEXT: movl {{[0-9]+}}(%esp), %eax			; X86-BMI1BMI2-NEXT: movl {{[0-9]+}}(%esp), %eax
	; X86-BMI1BMI2-NEXT: movb $32, %cl			; X86-BMI1BMI2-NEXT: movb {{[0-9]+}}(%esp), %cl
	; X86-BMI1BMI2-NEXT: subb {{[0-9]+}}(%esp), %cl			; X86-BMI1BMI2-NEXT: bzhil %ecx, (%eax), %eax
	; X86-BMI1BMI2-NEXT: shlxl %ecx, (%eax), %eax
	; X86-BMI1BMI2-NEXT: shrxl %ecx, %eax, %eax
	; X86-BMI1BMI2-NEXT: retl			; X86-BMI1BMI2-NEXT: retl
	;			;
	; X64-NOBMI-LABEL: bzhi32_d3_load_indexzext:			; X64-NOBMI-LABEL: bzhi32_d3_load_indexzext:
	; X64-NOBMI: # %bb.0:			; X64-NOBMI: # %bb.0:
	; X64-NOBMI-NEXT: movl (%rdi), %eax			; X64-NOBMI-NEXT: movl (%rdi), %eax
	; X64-NOBMI-NEXT: movb $32, %cl			; X64-NOBMI-NEXT: movb $32, %cl
	; X64-NOBMI-NEXT: subb %sil, %cl			; X64-NOBMI-NEXT: subb %sil, %cl
	; X64-NOBMI-NEXT: shll %cl, %eax			; X64-NOBMI-NEXT: shll %cl, %eax
	; X64-NOBMI-NEXT: shrl %cl, %eax			; X64-NOBMI-NEXT: shrl %cl, %eax
	; X64-NOBMI-NEXT: retq			; X64-NOBMI-NEXT: retq
	;			;
	; X64-BMI1BMI2-LABEL: bzhi32_d3_load_indexzext:			; X64-BMI1BMI2-LABEL: bzhi32_d3_load_indexzext:
	; X64-BMI1BMI2: # %bb.0:			; X64-BMI1BMI2: # %bb.0:
	; X64-BMI1BMI2-NEXT: movb $32, %al			; X64-BMI1BMI2-NEXT: bzhil %esi, (%rdi), %eax
	; X64-BMI1BMI2-NEXT: subb %sil, %al
	; X64-BMI1BMI2-NEXT: shlxl %eax, (%rdi), %ecx
	; X64-BMI1BMI2-NEXT: shrxl %eax, %ecx, %eax
	; X64-BMI1BMI2-NEXT: retq			; X64-BMI1BMI2-NEXT: retq
	%val = load i32, i32* %w			%val = load i32, i32* %w
	%numhighbits = sub i8 32, %numlowbits			%numhighbits = sub i8 32, %numlowbits
	%sh_prom = zext i8 %numhighbits to i32			%sh_prom = zext i8 %numhighbits to i32
	%highbitscleared = shl i32 %val, %sh_prom			%highbitscleared = shl i32 %val, %sh_prom
	%masked = lshr i32 %highbitscleared, %sh_prom			%masked = lshr i32 %highbitscleared, %sh_prom
	ret i32 %masked			ret i32 %masked
	}			}
	▲ Show 20 Lines • Show All 170 Lines • ▼ Show 20 Lines
	; X64-NOBMI-NEXT: subb %sil, %cl			; X64-NOBMI-NEXT: subb %sil, %cl
	; X64-NOBMI-NEXT: shlq %cl, %rdi			; X64-NOBMI-NEXT: shlq %cl, %rdi
	; X64-NOBMI-NEXT: shrq %cl, %rdi			; X64-NOBMI-NEXT: shrq %cl, %rdi
	; X64-NOBMI-NEXT: movq %rdi, %rax			; X64-NOBMI-NEXT: movq %rdi, %rax
	; X64-NOBMI-NEXT: retq			; X64-NOBMI-NEXT: retq
	;			;
	; X64-BMI1BMI2-LABEL: bzhi64_d1_indexzext:			; X64-BMI1BMI2-LABEL: bzhi64_d1_indexzext:
	; X64-BMI1BMI2: # %bb.0:			; X64-BMI1BMI2: # %bb.0:
	; X64-BMI1BMI2-NEXT: movb $64, %al			; X64-BMI1BMI2-NEXT: # kill: def $esi killed $esi def $rsi
	; X64-BMI1BMI2-NEXT: subb %sil, %al			; X64-BMI1BMI2-NEXT: bzhiq %rsi, %rdi, %rax
	; X64-BMI1BMI2-NEXT: shlxq %rax, %rdi, %rcx
	; X64-BMI1BMI2-NEXT: shrxq %rax, %rcx, %rax
	; X64-BMI1BMI2-NEXT: retq			; X64-BMI1BMI2-NEXT: retq
	%numhighbits = sub i8 64, %numlowbits			%numhighbits = sub i8 64, %numlowbits
	%sh_prom = zext i8 %numhighbits to i64			%sh_prom = zext i8 %numhighbits to i64
	%highbitscleared = shl i64 %val, %sh_prom			%highbitscleared = shl i64 %val, %sh_prom
	%masked = lshr i64 %highbitscleared, %sh_prom			%masked = lshr i64 %highbitscleared, %sh_prom
	ret i64 %masked			ret i64 %masked
	}			}

	▲ Show 20 Lines • Show All 172 Lines • ▼ Show 20 Lines
	; X64-NOBMI-NEXT: movb $64, %cl			; X64-NOBMI-NEXT: movb $64, %cl
	; X64-NOBMI-NEXT: subb %sil, %cl			; X64-NOBMI-NEXT: subb %sil, %cl
	; X64-NOBMI-NEXT: shlq %cl, %rax			; X64-NOBMI-NEXT: shlq %cl, %rax
	; X64-NOBMI-NEXT: shrq %cl, %rax			; X64-NOBMI-NEXT: shrq %cl, %rax
	; X64-NOBMI-NEXT: retq			; X64-NOBMI-NEXT: retq
	;			;
	; X64-BMI1BMI2-LABEL: bzhi64_d3_load_indexzext:			; X64-BMI1BMI2-LABEL: bzhi64_d3_load_indexzext:
	; X64-BMI1BMI2: # %bb.0:			; X64-BMI1BMI2: # %bb.0:
	; X64-BMI1BMI2-NEXT: movb $64, %al			; X64-BMI1BMI2-NEXT: # kill: def $esi killed $esi def $rsi
	; X64-BMI1BMI2-NEXT: subb %sil, %al			; X64-BMI1BMI2-NEXT: bzhiq %rsi, (%rdi), %rax
	; X64-BMI1BMI2-NEXT: shlxq %rax, (%rdi), %rcx
	; X64-BMI1BMI2-NEXT: shrxq %rax, %rcx, %rax
	; X64-BMI1BMI2-NEXT: retq			; X64-BMI1BMI2-NEXT: retq
	%val = load i64, i64* %w			%val = load i64, i64* %w
	%numhighbits = sub i8 64, %numlowbits			%numhighbits = sub i8 64, %numlowbits
	%sh_prom = zext i8 %numhighbits to i64			%sh_prom = zext i8 %numhighbits to i64
	%highbitscleared = shl i64 %val, %sh_prom			%highbitscleared = shl i64 %val, %sh_prom
	%masked = lshr i64 %highbitscleared, %sh_prom			%masked = lshr i64 %highbitscleared, %sh_prom
	ret i64 %masked			ret i64 %masked
	}			}
	▲ Show 20 Lines • Show All 276 Lines • Show Last 20 Lines

This is an archive of the discontinued LLVM Phabricator instance.

[X86] Emit BZHI when mask is ~(-1 << nbits)
Closed, Public

Details

Diff Detail

Event Timeline

Revision Contents

Diff 150184

llvm/trunk/lib/Target/X86/X86InstrInfo.td

llvm/trunk/test/CodeGen/X86/extract-lowbits.ll

This is an archive of the discontinued LLVM Phabricator instance.

[X86] Emit BZHI when mask is ~(-1 << nbits)
Closed, Public

Details

Diff Detail

Event Timeline

Revision Contents

Diff 150184

llvm/trunk/lib/Target/X86/X86InstrInfo.td

llvm/trunk/test/CodeGen/X86/extract-lowbits.ll

[X86] Emit BZHI when mask is ~(-1 << nbits)
Closed, Public