Diff 122620

llvm/trunk/include/llvm/IR/IntrinsicsX86.td

This file is larger than 256 KB, so syntax highlighting is disabled by default.

Show First 20 Lines • Show All 1,294 Lines • ▼ Show 20 Lines	def int_x86_avx512_vpermilvar_ps_512 :
Intrinsic<[llvm_v16f32_ty], [llvm_v16f32_ty, llvm_v16i32_ty],		Intrinsic<[llvm_v16f32_ty], [llvm_v16f32_ty, llvm_v16i32_ty],
[IntrNoMem]>;		[IntrNoMem]>;

def int_x86_avx512_pshuf_b_512 :		def int_x86_avx512_pshuf_b_512 :
GCCBuiltin<"__builtin_ia32_pshufb512">,		GCCBuiltin<"__builtin_ia32_pshufb512">,
Intrinsic<[llvm_v64i8_ty], [llvm_v64i8_ty, llvm_v64i8_ty],		Intrinsic<[llvm_v64i8_ty], [llvm_v64i8_ty, llvm_v64i8_ty],
[IntrNoMem]>;		[IntrNoMem]>;

// Masked 128-bit-lane shuffle producing a v8f32 result; exposed to front ends
// as __builtin_ia32_shuf_f32x4_256_mask.
// Operands, in order: two v8f32 sources, an i32 lane-selection immediate, a
// v8f32 pass-through vector and an i8 write mask.
// NOTE(review): operand roles are taken from how the avx512.mask.shuf.*
// auto-upgrade code consumes operands 2, 3 and 4 -- confirm before relying on it.
// IntrNoMem: the intrinsic is declared as not accessing memory.
def int_x86_avx512_mask_shuf_f32x4_256 :
GCCBuiltin<"__builtin_ia32_shuf_f32x4_256_mask">,
Intrinsic<[llvm_v8f32_ty],
[llvm_v8f32_ty, llvm_v8f32_ty, llvm_i32_ty, llvm_v8f32_ty, llvm_i8_ty],
[IntrNoMem]>;

// Masked 128-bit-lane shuffle producing a v16f32 result; exposed to front ends
// as __builtin_ia32_shuf_f32x4_mask.
// Operands, in order: two v16f32 sources, an i32 lane-selection immediate, a
// v16f32 pass-through vector and an i16 write mask (one bit per element).
// IntrNoMem: the intrinsic is declared as not accessing memory.
def int_x86_avx512_mask_shuf_f32x4 :
GCCBuiltin<"__builtin_ia32_shuf_f32x4_mask">,
Intrinsic<[llvm_v16f32_ty],
[llvm_v16f32_ty, llvm_v16f32_ty, llvm_i32_ty, llvm_v16f32_ty, llvm_i16_ty],
[IntrNoMem]>;

// Masked 128-bit-lane shuffle producing a v4f64 result; exposed to front ends
// as __builtin_ia32_shuf_f64x2_256_mask.
// Operands, in order: two v4f64 sources, an i32 lane-selection immediate, a
// v4f64 pass-through vector and an i8 write mask.
// NOTE(review): only four result elements exist, so presumably just the low
// four mask bits are meaningful -- confirm against the lowering.
// IntrNoMem: the intrinsic is declared as not accessing memory.
def int_x86_avx512_mask_shuf_f64x2_256 :
GCCBuiltin<"__builtin_ia32_shuf_f64x2_256_mask">,
Intrinsic<[llvm_v4f64_ty],
[llvm_v4f64_ty, llvm_v4f64_ty, llvm_i32_ty, llvm_v4f64_ty, llvm_i8_ty],
[IntrNoMem]>;

// Masked 128-bit-lane shuffle producing a v8f64 result; exposed to front ends
// as __builtin_ia32_shuf_f64x2_mask.
// Operands, in order: two v8f64 sources, an i32 lane-selection immediate, a
// v8f64 pass-through vector and an i8 write mask (one bit per element).
// IntrNoMem: the intrinsic is declared as not accessing memory.
def int_x86_avx512_mask_shuf_f64x2 :
GCCBuiltin<"__builtin_ia32_shuf_f64x2_mask">,
Intrinsic<[llvm_v8f64_ty],
[llvm_v8f64_ty, llvm_v8f64_ty, llvm_i32_ty, llvm_v8f64_ty, llvm_i8_ty],
[IntrNoMem]>;

// Masked 128-bit-lane shuffle producing a v8i32 result; exposed to front ends
// as __builtin_ia32_shuf_i32x4_256_mask.
// Operands, in order: two v8i32 sources, an i32 lane-selection immediate, a
// v8i32 pass-through vector and an i8 write mask (one bit per element).
// IntrNoMem: the intrinsic is declared as not accessing memory.
def int_x86_avx512_mask_shuf_i32x4_256 :
GCCBuiltin<"__builtin_ia32_shuf_i32x4_256_mask">,
Intrinsic<[llvm_v8i32_ty],
[llvm_v8i32_ty, llvm_v8i32_ty, llvm_i32_ty, llvm_v8i32_ty, llvm_i8_ty],
[IntrNoMem]>;

// Masked 128-bit-lane shuffle producing a v16i32 result; exposed to front ends
// as __builtin_ia32_shuf_i32x4_mask.
// Operands, in order: two v16i32 sources, an i32 lane-selection immediate, a
// v16i32 pass-through vector and an i16 write mask (one bit per element).
// IntrNoMem: the intrinsic is declared as not accessing memory.
def int_x86_avx512_mask_shuf_i32x4 :
GCCBuiltin<"__builtin_ia32_shuf_i32x4_mask">,
Intrinsic<[llvm_v16i32_ty],
[llvm_v16i32_ty, llvm_v16i32_ty, llvm_i32_ty, llvm_v16i32_ty, llvm_i16_ty],
[IntrNoMem]>;

// Masked 128-bit-lane shuffle producing a v4i64 result; exposed to front ends
// as __builtin_ia32_shuf_i64x2_256_mask.
// Operands, in order: two v4i64 sources, an i32 lane-selection immediate, a
// v4i64 pass-through vector and an i8 write mask.
// NOTE(review): only four result elements exist, so presumably just the low
// four mask bits are meaningful -- confirm against the lowering.
// IntrNoMem: the intrinsic is declared as not accessing memory.
def int_x86_avx512_mask_shuf_i64x2_256 :
GCCBuiltin<"__builtin_ia32_shuf_i64x2_256_mask">,
Intrinsic<[llvm_v4i64_ty],
[llvm_v4i64_ty, llvm_v4i64_ty, llvm_i32_ty, llvm_v4i64_ty, llvm_i8_ty],
[IntrNoMem]>;

// Masked 128-bit-lane shuffle producing a v8i64 result; exposed to front ends
// as __builtin_ia32_shuf_i64x2_mask.
// Operands, in order: two v8i64 sources, an i32 lane-selection immediate, a
// v8i64 pass-through vector and an i8 write mask (one bit per element).
// IntrNoMem: the intrinsic is declared as not accessing memory.
def int_x86_avx512_mask_shuf_i64x2 :
GCCBuiltin<"__builtin_ia32_shuf_i64x2_mask">,
Intrinsic<[llvm_v8i64_ty],
[llvm_v8i64_ty, llvm_v8i64_ty, llvm_i32_ty, llvm_v8i64_ty, llvm_i8_ty],
[IntrNoMem]>;
}		}

// Vector blend		// Vector blend
let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".		let TargetPrefix = "x86" in { // All intrinsics start with "llvm.x86.".
def int_x86_avx_blendv_pd_256 : GCCBuiltin<"__builtin_ia32_blendvpd256">,		def int_x86_avx_blendv_pd_256 : GCCBuiltin<"__builtin_ia32_blendvpd256">,
Intrinsic<[llvm_v4f64_ty], [llvm_v4f64_ty,		Intrinsic<[llvm_v4f64_ty], [llvm_v4f64_ty,
llvm_v4f64_ty, llvm_v4f64_ty], [IntrNoMem]>;		llvm_v4f64_ty, llvm_v4f64_ty], [IntrNoMem]>;
def int_x86_avx_blendv_ps_256 : GCCBuiltin<"__builtin_ia32_blendvps256">,		def int_x86_avx_blendv_ps_256 : GCCBuiltin<"__builtin_ia32_blendvps256">,
▲ Show 20 Lines • Show All 4,687 Lines • Show Last 20 Lines

llvm/trunk/lib/IR/AutoUpgrade.cpp

Show First 20 Lines • Show All 70 Lines • ▼ Show 20 Lines	static bool ShouldUpgradeX86Intrinsic(Function *F, StringRef Name) {
// All of the intrinsics matches below should be marked with which llvm		// All of the intrinsics matches below should be marked with which llvm
// version started autoupgrading them. At some point in the future we would		// version started autoupgrading them. At some point in the future we would
// like to use this information to remove upgrade code for some older		// like to use this information to remove upgrade code for some older
// intrinsics. It is currently undecided how we will determine that future		// intrinsics. It is currently undecided how we will determine that future
// point.		// point.
if (Name=="ssse3.pabs.b.128" \|\| // Added in 6.0		if (Name=="ssse3.pabs.b.128" \|\| // Added in 6.0
Name=="ssse3.pabs.w.128" \|\| // Added in 6.0		Name=="ssse3.pabs.w.128" \|\| // Added in 6.0
Name=="ssse3.pabs.d.128" \|\| // Added in 6.0		Name=="ssse3.pabs.d.128" \|\| // Added in 6.0
		Name.startswith("avx512.mask.shuf.i") \|\| // Added in 6.0
		Name.startswith("avx512.mask.shuf.f") \|\| // Added in 6.0
Name.startswith("avx2.pabs.") \|\| // Added in 6.0		Name.startswith("avx2.pabs.") \|\| // Added in 6.0
Name.startswith("avx512.mask.pabs.") \|\| // Added in 6.0		Name.startswith("avx512.mask.pabs.") \|\| // Added in 6.0
Name.startswith("avx512.broadcastm") \|\| // Added in 6.0		Name.startswith("avx512.broadcastm") \|\| // Added in 6.0
Name.startswith("avx512.mask.pbroadcast") \|\| // Added in 6.0		Name.startswith("avx512.mask.pbroadcast") \|\| // Added in 6.0
Name.startswith("sse2.pcmpeq.") \|\| // Added in 3.1		Name.startswith("sse2.pcmpeq.") \|\| // Added in 3.1
Name.startswith("sse2.pcmpgt.") \|\| // Added in 3.1		Name.startswith("sse2.pcmpgt.") \|\| // Added in 3.1
Name.startswith("avx2.pcmpeq.") \|\| // Added in 3.1		Name.startswith("avx2.pcmpeq.") \|\| // Added in 3.1
Name.startswith("avx2.pcmpgt.") \|\| // Added in 3.1		Name.startswith("avx2.pcmpgt.") \|\| // Added in 3.1
▲ Show 20 Lines • Show All 1,178 Lines • ▼ Show 20 Lines	if (IsX86 && (Name.startswith("sse2.pcmp") \|\|
PointerType::getUnqual(VT));		PointerType::getUnqual(VT));
Value *Load = Builder.CreateAlignedLoad(Op, 1);		Value *Load = Builder.CreateAlignedLoad(Op, 1);
if (NumSrcElts == 2)		if (NumSrcElts == 2)
Rep = Builder.CreateShuffleVector(Load, UndefValue::get(Load->getType()),		Rep = Builder.CreateShuffleVector(Load, UndefValue::get(Load->getType()),
{ 0, 1, 0, 1 });		{ 0, 1, 0, 1 });
else		else
Rep = Builder.CreateShuffleVector(Load, UndefValue::get(Load->getType()),		Rep = Builder.CreateShuffleVector(Load, UndefValue::get(Load->getType()),
{ 0, 1, 2, 3, 0, 1, 2, 3 });		{ 0, 1, 2, 3, 0, 1, 2, 3 });
		} else if (IsX86 && (Name.startswith("avx512.mask.shuf.i") \|\|
		Name.startswith("avx512.mask.shuf.f"))) {
		unsigned Imm = cast<ConstantInt>(CI->getArgOperand(2))->getZExtValue();
		Type *VT = CI->getType();
		unsigned NumLanes = VT->getPrimitiveSizeInBits() / 128;
		unsigned NumElementsInLane = 128 / VT->getScalarSizeInBits();
		unsigned ControlBitsMask = NumLanes - 1;
		unsigned NumControlBits = NumLanes / 2;
		SmallVector<uint32_t, 8> ShuffleMask(0);

		for (unsigned l = 0; l != NumLanes; ++l) {
		unsigned LaneMask = (Imm >> (l * NumControlBits)) & ControlBitsMask;
		// We actually need the other source.
		if (l >= NumLanes / 2)
		LaneMask += NumLanes;
		for (unsigned i = 0; i != NumElementsInLane; ++i)
		ShuffleMask.push_back(LaneMask * NumElementsInLane + i);
		}
		Rep = Builder.CreateShuffleVector(CI->getArgOperand(0),
		CI->getArgOperand(1), ShuffleMask);
		Rep = EmitX86Select(Builder, CI->getArgOperand(4), Rep,
		CI->getArgOperand(3));
} else if (IsX86 && (Name.startswith("avx512.mask.broadcastf") \|\|		}else if (IsX86 && (Name.startswith("avx512.mask.broadcastf") \|\|
Name.startswith("avx512.mask.broadcasti"))) {		Name.startswith("avx512.mask.broadcasti"))) {
unsigned NumSrcElts =		unsigned NumSrcElts =
CI->getArgOperand(0)->getType()->getVectorNumElements();		CI->getArgOperand(0)->getType()->getVectorNumElements();
unsigned NumDstElts = CI->getType()->getVectorNumElements();		unsigned NumDstElts = CI->getType()->getVectorNumElements();

SmallVector<uint32_t, 8> ShuffleMask(NumDstElts);		SmallVector<uint32_t, 8> ShuffleMask(NumDstElts);
for (unsigned i = 0; i != NumDstElts; ++i)		for (unsigned i = 0; i != NumDstElts; ++i)
ShuffleMask[i] = i % NumSrcElts;		ShuffleMask[i] = i % NumSrcElts;
▲ Show 20 Lines • Show All 1,268 Lines • Show Last 20 Lines

llvm/trunk/lib/Target/X86/X86IntrinsicsInfo.h

Show First 20 Lines • Show All 1,032 Lines • ▼ Show 20 Lines	static const IntrinsicData IntrinsicsWithoutChain[] = {
X86_INTRINSIC_DATA(avx512_mask_scalef_ps_256, INTR_TYPE_2OP_MASK_RM,		X86_INTRINSIC_DATA(avx512_mask_scalef_ps_256, INTR_TYPE_2OP_MASK_RM,
X86ISD::SCALEF, 0),		X86ISD::SCALEF, 0),
X86_INTRINSIC_DATA(avx512_mask_scalef_ps_512, INTR_TYPE_2OP_MASK_RM,		X86_INTRINSIC_DATA(avx512_mask_scalef_ps_512, INTR_TYPE_2OP_MASK_RM,
X86ISD::SCALEF, 0),		X86ISD::SCALEF, 0),
X86_INTRINSIC_DATA(avx512_mask_scalef_sd, INTR_TYPE_SCALAR_MASK_RM,		X86_INTRINSIC_DATA(avx512_mask_scalef_sd, INTR_TYPE_SCALAR_MASK_RM,
X86ISD::SCALEFS, 0),		X86ISD::SCALEFS, 0),
X86_INTRINSIC_DATA(avx512_mask_scalef_ss, INTR_TYPE_SCALAR_MASK_RM,		X86_INTRINSIC_DATA(avx512_mask_scalef_ss, INTR_TYPE_SCALAR_MASK_RM,
X86ISD::SCALEFS, 0),		X86ISD::SCALEFS, 0),
X86_INTRINSIC_DATA(avx512_mask_shuf_f32x4, INTR_TYPE_3OP_IMM8_MASK,
X86ISD::SHUF128, 0),
X86_INTRINSIC_DATA(avx512_mask_shuf_f32x4_256, INTR_TYPE_3OP_IMM8_MASK,
X86ISD::SHUF128, 0),
X86_INTRINSIC_DATA(avx512_mask_shuf_f64x2, INTR_TYPE_3OP_IMM8_MASK,
X86ISD::SHUF128, 0),
X86_INTRINSIC_DATA(avx512_mask_shuf_f64x2_256, INTR_TYPE_3OP_IMM8_MASK,
X86ISD::SHUF128, 0),
X86_INTRINSIC_DATA(avx512_mask_shuf_i32x4, INTR_TYPE_3OP_IMM8_MASK,
X86ISD::SHUF128, 0),
X86_INTRINSIC_DATA(avx512_mask_shuf_i32x4_256, INTR_TYPE_3OP_IMM8_MASK,
X86ISD::SHUF128, 0),
X86_INTRINSIC_DATA(avx512_mask_shuf_i64x2, INTR_TYPE_3OP_IMM8_MASK,
X86ISD::SHUF128, 0),
X86_INTRINSIC_DATA(avx512_mask_shuf_i64x2_256, INTR_TYPE_3OP_IMM8_MASK,
X86ISD::SHUF128, 0),
X86_INTRINSIC_DATA(avx512_mask_sqrt_pd_128, INTR_TYPE_1OP_MASK, ISD::FSQRT, 0),		X86_INTRINSIC_DATA(avx512_mask_sqrt_pd_128, INTR_TYPE_1OP_MASK, ISD::FSQRT, 0),
X86_INTRINSIC_DATA(avx512_mask_sqrt_pd_256, INTR_TYPE_1OP_MASK, ISD::FSQRT, 0),		X86_INTRINSIC_DATA(avx512_mask_sqrt_pd_256, INTR_TYPE_1OP_MASK, ISD::FSQRT, 0),
X86_INTRINSIC_DATA(avx512_mask_sqrt_pd_512, INTR_TYPE_1OP_MASK, ISD::FSQRT,		X86_INTRINSIC_DATA(avx512_mask_sqrt_pd_512, INTR_TYPE_1OP_MASK, ISD::FSQRT,
X86ISD::FSQRT_RND),		X86ISD::FSQRT_RND),
X86_INTRINSIC_DATA(avx512_mask_sqrt_ps_128, INTR_TYPE_1OP_MASK, ISD::FSQRT, 0),		X86_INTRINSIC_DATA(avx512_mask_sqrt_ps_128, INTR_TYPE_1OP_MASK, ISD::FSQRT, 0),
X86_INTRINSIC_DATA(avx512_mask_sqrt_ps_256, INTR_TYPE_1OP_MASK, ISD::FSQRT, 0),		X86_INTRINSIC_DATA(avx512_mask_sqrt_ps_256, INTR_TYPE_1OP_MASK, ISD::FSQRT, 0),
X86_INTRINSIC_DATA(avx512_mask_sqrt_ps_512, INTR_TYPE_1OP_MASK, ISD::FSQRT,		X86_INTRINSIC_DATA(avx512_mask_sqrt_ps_512, INTR_TYPE_1OP_MASK, ISD::FSQRT,
X86ISD::FSQRT_RND),		X86ISD::FSQRT_RND),
▲ Show 20 Lines • Show All 597 Lines • Show Last 20 Lines

llvm/trunk/test/CodeGen/X86/avx512-intrinsics-fast-isel.ll

	; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py			; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
	; RUN: llc < %s -fast-isel -mtriple=i386-unknown-unknown -mattr=+avx512f \| FileCheck %s --check-prefix=ALL --check-prefix=X32			; RUN: llc < %s -fast-isel -mtriple=i386-unknown-unknown -mattr=+avx512f \| FileCheck %s --check-prefix=ALL --check-prefix=X32
	; RUN: llc < %s -fast-isel -mtriple=x86_64-unknown-unknown -mattr=+avx512f \| FileCheck %s --check-prefix=ALL --check-prefix=X64			; RUN: llc < %s -fast-isel -mtriple=x86_64-unknown-unknown -mattr=+avx512f \| FileCheck %s --check-prefix=ALL --check-prefix=X64

	; NOTE: This should use IR equivalent to what is generated by clang/test/CodeGen/avx512f-builtins.c			; NOTE: This should use IR equivalent to what is generated by clang/test/CodeGen/avx512f-builtins.c


				; Unmasked 128-bit-lane shuffle of two <16 x float> vectors written as a plain
				; shufflevector. The index list picks elements 0-7 of %__A (its first two
				; lanes) and then elements 0-3 of %__B twice. With no write mask involved the
				; expected instruction below is the 64x2 form even though the data is f32.
				define <16 x float> @test_mm512_shuffle_f32x4(<16 x float> %__A, <16 x float> %__B) {
				; X32-LABEL: test_mm512_shuffle_f32x4:
				; X32: # BB#0: # %entry
				; X32-NEXT: vshuff64x2 {{.*#+}} zmm0 = zmm0[0,1,2,3],zmm1[0,1,0,1]
				; X32-NEXT: retl
				;
				; X64-LABEL: test_mm512_shuffle_f32x4:
				; X64: # BB#0: # %entry
				; X64-NEXT: vshuff64x2 {{.*#+}} zmm0 = zmm0[0,1,2,3],zmm1[0,1,0,1]
				; X64-NEXT: retq
				entry:
				%shuffle = shufflevector <16 x float> %__A, <16 x float> %__B, <16 x i32> <i32 0, i32 1, i32 2, i32 3, i32 4, i32 5, i32 6, i32 7, i32 16, i32 17, i32 18, i32 19, i32 16, i32 17, i32 18, i32 19>
				ret <16 x float> %shuffle
				}


				; Merge-masked variant of the f32x4 lane shuffle: the shufflevector result is
				; combined with %__W through a per-element select driven by the 16 bits of
				; %__U (set bit -> shuffled element, clear bit -> element of %__W).
				; The expected output is a single vshuff32x4 predicated on k1.
				define <16 x float> @test_mm512_mask_shuffle_f32x4(<16 x float> %__W, i16 zeroext %__U, <16 x float> %__A, <16 x float> %__B) {
				; X32-LABEL: test_mm512_mask_shuffle_f32x4:
				; X32: # BB#0: # %entry
				; X32-NEXT: kmovw {{[0-9]+}}(%esp), %k1
				; X32-NEXT: vshuff32x4 {{.*#+}} zmm0 {%k1} = zmm1[0,1,2,3,4,5,6,7],zmm2[0,1,2,3,0,1,2,3]
				; X32-NEXT: retl
				;
				; X64-LABEL: test_mm512_mask_shuffle_f32x4:
				; X64: # BB#0: # %entry
				; X64-NEXT: kmovw %edi, %k1
				; X64-NEXT: vshuff32x4 {{.*#+}} zmm0 {%k1} = zmm1[0,1,2,3,4,5,6,7],zmm2[0,1,2,3,0,1,2,3]
				; X64-NEXT: retq
				entry:
				%shuffle = shufflevector <16 x float> %__A, <16 x float> %__B, <16 x i32> <i32 0, i32 1, i32 2, i32 3, i32 4, i32 5, i32 6, i32 7, i32 16, i32 17, i32 18, i32 19, i32 16, i32 17, i32 18, i32 19>
				%0 = bitcast i16 %__U to <16 x i1>
				%1 = select <16 x i1> %0, <16 x float> %shuffle, <16 x float> %__W
				ret <16 x float> %1
				}

				; Zero-masked variant of the f32x4 lane shuffle: elements whose bit in %__U is
				; clear are taken from zeroinitializer instead of a pass-through vector.
				; The expected output is a single vshuff32x4 with the {z} modifier.
				define <16 x float> @test_mm512_maskz_shuffle_f32x4(i16 zeroext %__U, <16 x float> %__A, <16 x float> %__B) {
				; X32-LABEL: test_mm512_maskz_shuffle_f32x4:
				; X32: # BB#0: # %entry
				; X32-NEXT: kmovw {{[0-9]+}}(%esp), %k1
				; X32-NEXT: vshuff32x4 {{.*#+}} zmm0 {%k1} {z} = zmm0[0,1,2,3,4,5,6,7],zmm1[0,1,2,3,0,1,2,3]
				; X32-NEXT: retl
				;
				; X64-LABEL: test_mm512_maskz_shuffle_f32x4:
				; X64: # BB#0: # %entry
				; X64-NEXT: kmovw %edi, %k1
				; X64-NEXT: vshuff32x4 {{.*#+}} zmm0 {%k1} {z} = zmm0[0,1,2,3,4,5,6,7],zmm1[0,1,2,3,0,1,2,3]
				; X64-NEXT: retq
				entry:
				%shuffle = shufflevector <16 x float> %__A, <16 x float> %__B, <16 x i32> <i32 0, i32 1, i32 2, i32 3, i32 4, i32 5, i32 6, i32 7, i32 16, i32 17, i32 18, i32 19, i32 16, i32 17, i32 18, i32 19>
				%0 = bitcast i16 %__U to <16 x i1>
				%1 = select <16 x i1> %0, <16 x float> %shuffle, <16 x float> zeroinitializer
				ret <16 x float> %1
				}

				; Unmasked 128-bit-lane shuffle of two <8 x double> vectors written as a plain
				; shufflevector: elements 0-3 of %__A (its first two lanes) followed by
				; elements 0-1 of %__B twice. Expected to lower to one vshuff64x2.
				define <8 x double> @test_mm512_shuffle_f64x2(<8 x double> %__A, <8 x double> %__B) {
				; X32-LABEL: test_mm512_shuffle_f64x2:
				; X32: # BB#0: # %entry
				; X32-NEXT: vshuff64x2 {{.*#+}} zmm0 = zmm0[0,1,2,3],zmm1[0,1,0,1]
				; X32-NEXT: retl
				;
				; X64-LABEL: test_mm512_shuffle_f64x2:
				; X64: # BB#0: # %entry
				; X64-NEXT: vshuff64x2 {{.*#+}} zmm0 = zmm0[0,1,2,3],zmm1[0,1,0,1]
				; X64-NEXT: retq
				entry:
				%shuffle = shufflevector <8 x double> %__A, <8 x double> %__B, <8 x i32> <i32 0, i32 1, i32 2, i32 3, i32 8, i32 9, i32 8, i32 9>
				ret <8 x double> %shuffle
				}

				; Merge-masked variant of the f64x2 lane shuffle: the 8 bits of %__U choose,
				; per element, between the shuffled value and the corresponding element of
				; %__W. The 32-bit expectations load the mask byte from the stack first.
				define <8 x double> @test_mm512_mask_shuffle_f64x2(<8 x double> %__W, i8 zeroext %__U, <8 x double> %__A, <8 x double> %__B) {
				; X32-LABEL: test_mm512_mask_shuffle_f64x2:
				; X32: # BB#0: # %entry
				; X32-NEXT: movb {{[0-9]+}}(%esp), %al
				; X32-NEXT: kmovw %eax, %k1
				; X32-NEXT: vshuff64x2 {{.*#+}} zmm0 {%k1} = zmm1[0,1,2,3],zmm2[0,1,0,1]
				; X32-NEXT: retl
				;
				; X64-LABEL: test_mm512_mask_shuffle_f64x2:
				; X64: # BB#0: # %entry
				; X64-NEXT: kmovw %edi, %k1
				; X64-NEXT: vshuff64x2 {{.*#+}} zmm0 {%k1} = zmm1[0,1,2,3],zmm2[0,1,0,1]
				; X64-NEXT: retq
				entry:
				%shuffle = shufflevector <8 x double> %__A, <8 x double> %__B, <8 x i32> <i32 0, i32 1, i32 2, i32 3, i32 8, i32 9, i32 8, i32 9>
				%0 = bitcast i8 %__U to <8 x i1>
				%1 = select <8 x i1> %0, <8 x double> %shuffle, <8 x double> %__W
				ret <8 x double> %1
				}

				; Zero-masked variant of the f64x2 lane shuffle: elements whose bit in %__U is
				; clear come from zeroinitializer. Expected to lower to one vshuff64x2 with
				; the {z} modifier.
				define <8 x double> @test_mm512_maskz_shuffle_f64x2(i8 zeroext %__U, <8 x double> %__A, <8 x double> %__B) {
				; X32-LABEL: test_mm512_maskz_shuffle_f64x2:
				; X32: # BB#0: # %entry
				; X32-NEXT: movb {{[0-9]+}}(%esp), %al
				; X32-NEXT: kmovw %eax, %k1
				; X32-NEXT: vshuff64x2 {{.*#+}} zmm0 {%k1} {z} = zmm0[0,1,2,3],zmm1[0,1,0,1]
				; X32-NEXT: retl
				;
				; X64-LABEL: test_mm512_maskz_shuffle_f64x2:
				; X64: # BB#0: # %entry
				; X64-NEXT: kmovw %edi, %k1
				; X64-NEXT: vshuff64x2 {{.*#+}} zmm0 {%k1} {z} = zmm0[0,1,2,3],zmm1[0,1,0,1]
				; X64-NEXT: retq
				entry:
				%shuffle = shufflevector <8 x double> %__A, <8 x double> %__B, <8 x i32> <i32 0, i32 1, i32 2, i32 3, i32 8, i32 9, i32 8, i32 9>
				%0 = bitcast i8 %__U to <8 x i1>
				%1 = select <8 x i1> %0, <8 x double> %shuffle, <8 x double> zeroinitializer
				ret <8 x double> %1
				}

				; Unmasked integer 128-bit-lane shuffle. The operands are typed <8 x i64>, so
				; the shufflevector is expressed on i64 elements: elements 0-3 of %__A then
				; elements 0-1 of %__B twice. Without a mask the expected instruction is the
				; 64x2 integer form.
				define <8 x i64> @test_mm512_shuffle_i32x4(<8 x i64> %__A, <8 x i64> %__B) local_unnamed_addr #0 {
				; X32-LABEL: test_mm512_shuffle_i32x4:
				; X32: # BB#0: # %entry
				; X32-NEXT: vshufi64x2 {{.*#+}} zmm0 = zmm0[0,1,2,3],zmm1[0,1,0,1]
				; X32-NEXT: retl
				;
				; X64-LABEL: test_mm512_shuffle_i32x4:
				; X64: # BB#0: # %entry
				; X64-NEXT: vshufi64x2 {{.*#+}} zmm0 = zmm0[0,1,2,3],zmm1[0,1,0,1]
				; X64-NEXT: retq
				entry:
				%shuffle = shufflevector <8 x i64> %__A, <8 x i64> %__B, <8 x i32> <i32 0, i32 1, i32 2, i32 3, i32 8, i32 9, i32 8, i32 9>
				ret <8 x i64> %shuffle
				}

				; Merge-masked i32x4 lane shuffle. The shuffle itself is done on <8 x i64>;
				; both the shuffled value and %__W are then bitcast to <16 x i32> so the
				; 16-bit mask %__U can select per 32-bit element, and the result is bitcast
				; back to <8 x i64>. Expected to lower to one k1-predicated vshufi32x4.
				define <8 x i64> @test_mm512_mask_shuffle_i32x4(<8 x i64> %__W, i16 zeroext %__U, <8 x i64> %__A, <8 x i64> %__B) local_unnamed_addr #0 {
				; X32-LABEL: test_mm512_mask_shuffle_i32x4:
				; X32: # BB#0: # %entry
				; X32-NEXT: kmovw {{[0-9]+}}(%esp), %k1
				; X32-NEXT: vshufi32x4 {{.*#+}} zmm0 {%k1} = zmm1[0,1,2,3,4,5,6,7],zmm2[0,1,2,3,0,1,2,3]
				; X32-NEXT: retl
				;
				; X64-LABEL: test_mm512_mask_shuffle_i32x4:
				; X64: # BB#0: # %entry
				; X64-NEXT: kmovw %edi, %k1
				; X64-NEXT: vshufi32x4 {{.*#+}} zmm0 {%k1} = zmm1[0,1,2,3,4,5,6,7],zmm2[0,1,2,3,0,1,2,3]
				; X64-NEXT: retq
				entry:
				%shuffle = shufflevector <8 x i64> %__A, <8 x i64> %__B, <8 x i32> <i32 0, i32 1, i32 2, i32 3, i32 8, i32 9, i32 8, i32 9>
				%0 = bitcast <8 x i64> %shuffle to <16 x i32>
				%1 = bitcast <8 x i64> %__W to <16 x i32>
				%2 = bitcast i16 %__U to <16 x i1>
				%3 = select <16 x i1> %2, <16 x i32> %0, <16 x i32> %1
				%4 = bitcast <16 x i32> %3 to <8 x i64>
				ret <8 x i64> %4
				}

				; Zero-masked i32x4 lane shuffle. The <8 x i64> shuffle result is bitcast to
				; <16 x i32> so the 16-bit mask %__U can select per 32-bit element against
				; zeroinitializer, then bitcast back. Expected to lower to one vshufi32x4
				; with the {z} modifier.
				define <8 x i64> @test_mm512_maskz_shuffle_i32x4(i16 zeroext %__U, <8 x i64> %__A, <8 x i64> %__B) local_unnamed_addr #0 {
				; X32-LABEL: test_mm512_maskz_shuffle_i32x4:
				; X32: # BB#0: # %entry
				; X32-NEXT: kmovw {{[0-9]+}}(%esp), %k1
				; X32-NEXT: vshufi32x4 {{.*#+}} zmm0 {%k1} {z} = zmm0[0,1,2,3,4,5,6,7],zmm1[0,1,2,3,0,1,2,3]
				; X32-NEXT: retl
				;
				; X64-LABEL: test_mm512_maskz_shuffle_i32x4:
				; X64: # BB#0: # %entry
				; X64-NEXT: kmovw %edi, %k1
				; X64-NEXT: vshufi32x4 {{.*#+}} zmm0 {%k1} {z} = zmm0[0,1,2,3,4,5,6,7],zmm1[0,1,2,3,0,1,2,3]
				; X64-NEXT: retq
				entry:
				%shuffle = shufflevector <8 x i64> %__A, <8 x i64> %__B, <8 x i32> <i32 0, i32 1, i32 2, i32 3, i32 8, i32 9, i32 8, i32 9>
				%0 = bitcast <8 x i64> %shuffle to <16 x i32>
				%1 = bitcast i16 %__U to <16 x i1>
				%2 = select <16 x i1> %1, <16 x i32> %0, <16 x i32> zeroinitializer
				%3 = bitcast <16 x i32> %2 to <8 x i64>
				ret <8 x i64> %3
				}

				; Unmasked 128-bit-lane shuffle of two <8 x i64> vectors written as a plain
				; shufflevector: elements 0-3 of %__A followed by elements 0-1 of %__B twice.
				; Expected to lower to one vshufi64x2.
				define <8 x i64> @test_mm512_shuffle_i64x2(<8 x i64> %__A, <8 x i64> %__B) local_unnamed_addr #0 {
				; X32-LABEL: test_mm512_shuffle_i64x2:
				; X32: # BB#0: # %entry
				; X32-NEXT: vshufi64x2 {{.*#+}} zmm0 = zmm0[0,1,2,3],zmm1[0,1,0,1]
				; X32-NEXT: retl
				;
				; X64-LABEL: test_mm512_shuffle_i64x2:
				; X64: # BB#0: # %entry
				; X64-NEXT: vshufi64x2 {{.*#+}} zmm0 = zmm0[0,1,2,3],zmm1[0,1,0,1]
				; X64-NEXT: retq
				entry:
				%shuffle = shufflevector <8 x i64> %__A, <8 x i64> %__B, <8 x i32> <i32 0, i32 1, i32 2, i32 3, i32 8, i32 9, i32 8, i32 9>
				ret <8 x i64> %shuffle
				}

				; Merge-masked i64x2 lane shuffle: the 8 bits of %__U choose, per element,
				; between the shuffled value and the corresponding element of %__W.
				; Expected to lower to one k1-predicated vshufi64x2.
				define <8 x i64> @test_mm512_mask_shuffle_i64x2(<8 x i64> %__W, i8 zeroext %__U, <8 x i64> %__A, <8 x i64> %__B) local_unnamed_addr #0 {
				; X32-LABEL: test_mm512_mask_shuffle_i64x2:
				; X32: # BB#0: # %entry
				; X32-NEXT: movb {{[0-9]+}}(%esp), %al
				; X32-NEXT: kmovw %eax, %k1
				; X32-NEXT: vshufi64x2 {{.*#+}} zmm0 {%k1} = zmm1[0,1,2,3],zmm2[0,1,0,1]
				; X32-NEXT: retl
				;
				; X64-LABEL: test_mm512_mask_shuffle_i64x2:
				; X64: # BB#0: # %entry
				; X64-NEXT: kmovw %edi, %k1
				; X64-NEXT: vshufi64x2 {{.*#+}} zmm0 {%k1} = zmm1[0,1,2,3],zmm2[0,1,0,1]
				; X64-NEXT: retq
				entry:
				%shuffle = shufflevector <8 x i64> %__A, <8 x i64> %__B, <8 x i32> <i32 0, i32 1, i32 2, i32 3, i32 8, i32 9, i32 8, i32 9>
				%0 = bitcast i8 %__U to <8 x i1>
				%1 = select <8 x i1> %0, <8 x i64> %shuffle, <8 x i64> %__W
				ret <8 x i64> %1
				}

				; Zero-masked i64x2 lane shuffle: elements whose bit in %__U is clear come
				; from zeroinitializer. Expected to lower to one vshufi64x2 with the {z}
				; modifier.
				define <8 x i64> @test_mm512_maskz_shuffle_i64x2(i8 zeroext %__U, <8 x i64> %__A, <8 x i64> %__B) local_unnamed_addr #0 {
				; X32-LABEL: test_mm512_maskz_shuffle_i64x2:
				; X32: # BB#0: # %entry
				; X32-NEXT: movb {{[0-9]+}}(%esp), %al
				; X32-NEXT: kmovw %eax, %k1
				; X32-NEXT: vshufi64x2 {{.*#+}} zmm0 {%k1} {z} = zmm0[0,1,2,3],zmm1[0,1,0,1]
				; X32-NEXT: retl
				;
				; X64-LABEL: test_mm512_maskz_shuffle_i64x2:
				; X64: # BB#0: # %entry
				; X64-NEXT: kmovw %edi, %k1
				; X64-NEXT: vshufi64x2 {{.*#+}} zmm0 {%k1} {z} = zmm0[0,1,2,3],zmm1[0,1,0,1]
				; X64-NEXT: retq
				entry:
				%shuffle = shufflevector <8 x i64> %__A, <8 x i64> %__B, <8 x i32> <i32 0, i32 1, i32 2, i32 3, i32 8, i32 9, i32 8, i32 9>
				%0 = bitcast i8 %__U to <8 x i1>
				%1 = select <8 x i1> %0, <8 x i64> %shuffle, <8 x i64> zeroinitializer
				ret <8 x i64> %1
				}



	define <8 x i64> @test_mm512_mask_set1_epi32(<8 x i64> %__O, i16 zeroext %__M, i32 %__A) {			define <8 x i64> @test_mm512_mask_set1_epi32(<8 x i64> %__O, i16 zeroext %__M, i32 %__A) {
	; X32-LABEL: test_mm512_mask_set1_epi32:			; X32-LABEL: test_mm512_mask_set1_epi32:
	; X32: # BB#0: # %entry			; X32: # BB#0: # %entry
	; X32-NEXT: movl {{[0-9]+}}(%esp), %eax			; X32-NEXT: movl {{[0-9]+}}(%esp), %eax
	; X32-NEXT: kmovw {{[0-9]+}}(%esp), %k1			; X32-NEXT: kmovw {{[0-9]+}}(%esp), %k1
	; X32-NEXT: vpbroadcastd %eax, %zmm0 {%k1}			; X32-NEXT: vpbroadcastd %eax, %zmm0 {%k1}
	; X32-NEXT: retl			; X32-NEXT: retl
	;			;
	▲ Show 20 Lines • Show All 1,290 Lines • Show Last 20 Lines

llvm/trunk/test/CodeGen/X86/avx512-intrinsics-upgrade.ll

Show First 20 Lines • Show All 1,642 Lines • ▼ Show 20 Lines	; CHECK-NEXT: retq
%vecinit.i = insertelement <16 x i32> undef, i32 %q, i32 0		%vecinit.i = insertelement <16 x i32> undef, i32 %q, i32 0
%b = shufflevector <16 x i32> %vecinit.i, <16 x i32> undef, <16 x i32> zeroinitializer		%b = shufflevector <16 x i32> %vecinit.i, <16 x i32> undef, <16 x i32> zeroinitializer
%res = call <16 x i32> @llvm.x86.avx512.mask.pmull.d.512(<16 x i32> %a, <16 x i32> %b, <16 x i32> zeroinitializer, i16 %mask)		%res = call <16 x i32> @llvm.x86.avx512.mask.pmull.d.512(<16 x i32> %a, <16 x i32> %b, <16 x i32> zeroinitializer, i16 %mask)
ret < 16 x i32> %res		ret < 16 x i32> %res
}		}

declare <16 x i32> @llvm.x86.avx512.mask.pmull.d.512(<16 x i32>, <16 x i32>, <16 x i32>, i16)		declare <16 x i32> @llvm.x86.avx512.mask.pmull.d.512(<16 x i32>, <16 x i32>, <16 x i32>, i16)


		declare <16 x float> @llvm.x86.avx512.mask.shuf.f32x4(<16 x float>, <16 x float>, i32, <16 x float>, i16)

		; Exercises the legacy llvm.x86.avx512.mask.shuf.f32x4 call with immediate 22,
		; once with the caller-supplied mask %x4 and once with an all-ones mask
		; (i16 -1), and adds the two results. Per the expectations below, immediate 22
		; picks 128-bit lanes 2 and 1 of %x0 followed by lanes 1 and 0 of %x1.
		define <16 x float>@test_int_x86_avx512_mask_shuf_f32x4(<16 x float> %x0, <16 x float> %x1, <16 x float> %x3, i16 %x4) {
		; CHECK-LABEL: test_int_x86_avx512_mask_shuf_f32x4:
		; CHECK: ## BB#0:
		; CHECK-NEXT: vshuff32x4 {{.*#+}} zmm3 = zmm0[8,9,10,11,4,5,6,7],zmm1[4,5,6,7,0,1,2,3]
		; CHECK-NEXT: kmovw %edi, %k1
		; CHECK-NEXT: vshuff32x4 {{.*#+}} zmm2 {%k1} = zmm0[8,9,10,11,4,5,6,7],zmm1[4,5,6,7,0,1,2,3]
		; CHECK-NEXT: vaddps %zmm3, %zmm2, %zmm0
		; CHECK-NEXT: retq
		%res = call <16 x float> @llvm.x86.avx512.mask.shuf.f32x4(<16 x float> %x0, <16 x float> %x1, i32 22, <16 x float> %x3, i16 %x4)
		%res1 = call <16 x float> @llvm.x86.avx512.mask.shuf.f32x4(<16 x float> %x0, <16 x float> %x1, i32 22, <16 x float> %x3, i16 -1)
		%res2 = fadd <16 x float> %res, %res1
		ret <16 x float> %res2
		}

		declare <8 x double> @llvm.x86.avx512.mask.shuf.f64x2(<8 x double>, <8 x double>, i32, <8 x double>, i8)

		; Exercises the legacy llvm.x86.avx512.mask.shuf.f64x2 call with immediate 22
		; in three forms and sums the results: merge-masked with %x4 over %x3,
		; all-ones mask (i8 -1), and %x4 with a zeroinitializer pass-through (which
		; the expectations show as a {z} instruction). Immediate 22 picks 128-bit
		; lanes 2 and 1 of %x0 followed by lanes 1 and 0 of %x1.
		define <8 x double>@test_int_x86_avx512_mask_shuf_f64x2(<8 x double> %x0, <8 x double> %x1, <8 x double> %x3, i8 %x4) {
		; CHECK-LABEL: test_int_x86_avx512_mask_shuf_f64x2:
		; CHECK: ## BB#0:
		; CHECK-NEXT: vshuff64x2 {{.*#+}} zmm3 = zmm0[4,5,2,3],zmm1[2,3,0,1]
		; CHECK-NEXT: kmovw %edi, %k1
		; CHECK-NEXT: vshuff64x2 {{.*#+}} zmm2 {%k1} = zmm0[4,5,2,3],zmm1[2,3,0,1]
		; CHECK-NEXT: vaddpd %zmm3, %zmm2, %zmm2
		; CHECK-NEXT: vshuff64x2 {{.*#+}} zmm0 {%k1} {z} = zmm0[4,5,2,3],zmm1[2,3,0,1]
		; CHECK-NEXT: vaddpd %zmm0, %zmm2, %zmm0
		; CHECK-NEXT: retq
		%res = call <8 x double> @llvm.x86.avx512.mask.shuf.f64x2(<8 x double> %x0, <8 x double> %x1, i32 22, <8 x double> %x3, i8 %x4)
		%res1 = call <8 x double> @llvm.x86.avx512.mask.shuf.f64x2(<8 x double> %x0, <8 x double> %x1, i32 22, <8 x double> %x3, i8 -1)
		%res2 = call <8 x double> @llvm.x86.avx512.mask.shuf.f64x2(<8 x double> %x0, <8 x double> %x1, i32 22, <8 x double> zeroinitializer, i8 %x4)

		%res3 = fadd <8 x double> %res, %res1
		%res4 = fadd <8 x double> %res3, %res2
		ret <8 x double> %res4
		}

		declare <16 x i32> @llvm.x86.avx512.mask.shuf.i32x4(<16 x i32>, <16 x i32>, i32, <16 x i32>, i16)

		; Exercises the legacy llvm.x86.avx512.mask.shuf.i32x4 call with immediate 22,
		; once with the caller-supplied mask %x4 and once with an all-ones mask
		; (i16 -1), and adds the two results. Immediate 22 picks 128-bit lanes 2 and 1
		; of %x0 followed by lanes 1 and 0 of %x1.
		define <16 x i32>@test_int_x86_avx512_mask_shuf_i32x4(<16 x i32> %x0, <16 x i32> %x1, <16 x i32> %x3, i16 %x4) {
		; CHECK-LABEL: test_int_x86_avx512_mask_shuf_i32x4:
		; CHECK: ## BB#0:
		; CHECK-NEXT: vshufi32x4 {{.*#+}} zmm3 = zmm0[8,9,10,11,4,5,6,7],zmm1[4,5,6,7,0,1,2,3]
		; CHECK-NEXT: kmovw %edi, %k1
		; CHECK-NEXT: vshufi32x4 {{.*#+}} zmm2 {%k1} = zmm0[8,9,10,11,4,5,6,7],zmm1[4,5,6,7,0,1,2,3]
		; CHECK-NEXT: vpaddd %zmm3, %zmm2, %zmm0
		; CHECK-NEXT: retq
		%res = call <16 x i32> @llvm.x86.avx512.mask.shuf.i32x4(<16 x i32> %x0, <16 x i32> %x1, i32 22, <16 x i32> %x3, i16 %x4)
		%res1 = call <16 x i32> @llvm.x86.avx512.mask.shuf.i32x4(<16 x i32> %x0, <16 x i32> %x1, i32 22, <16 x i32> %x3, i16 -1)
		%res2 = add <16 x i32> %res, %res1
		ret <16 x i32> %res2
		}

		declare <8 x i64> @llvm.x86.avx512.mask.shuf.i64x2(<8 x i64>, <8 x i64>, i32, <8 x i64>, i8)

		; Exercises the legacy llvm.x86.avx512.mask.shuf.i64x2 call with immediate 22,
		; once with the caller-supplied mask %x4 and once with an all-ones mask
		; (i8 -1), and adds the two results. Immediate 22 picks 128-bit lanes 2 and 1
		; of %x0 followed by lanes 1 and 0 of %x1.
		define <8 x i64>@test_int_x86_avx512_mask_shuf_i64x2(<8 x i64> %x0, <8 x i64> %x1, <8 x i64> %x3, i8 %x4) {
		; CHECK-LABEL: test_int_x86_avx512_mask_shuf_i64x2:
		; CHECK: ## BB#0:
		; CHECK-NEXT: vshufi64x2 {{.*#+}} zmm3 = zmm0[4,5,2,3],zmm1[2,3,0,1]
		; CHECK-NEXT: kmovw %edi, %k1
		; CHECK-NEXT: vshufi64x2 {{.*#+}} zmm2 {%k1} = zmm0[4,5,2,3],zmm1[2,3,0,1]
		; CHECK-NEXT: vpaddq %zmm3, %zmm2, %zmm0
		; CHECK-NEXT: retq
		%res = call <8 x i64> @llvm.x86.avx512.mask.shuf.i64x2(<8 x i64> %x0, <8 x i64> %x1, i32 22, <8 x i64> %x3, i8 %x4)
		%res1 = call <8 x i64> @llvm.x86.avx512.mask.shuf.i64x2(<8 x i64> %x0, <8 x i64> %x1, i32 22, <8 x i64> %x3, i8 -1)
		%res2 = add <8 x i64> %res, %res1
		ret <8 x i64> %res2
		}

declare <8 x double> @llvm.x86.avx512.mask.shuf.pd.512(<8 x double>, <8 x double>, i32, <8 x double>, i8)		declare <8 x double> @llvm.x86.avx512.mask.shuf.pd.512(<8 x double>, <8 x double>, i32, <8 x double>, i8)

define <8 x double>@test_int_x86_avx512_mask_shuf_pd_512(<8 x double> %x0, <8 x double> %x1, <8 x double> %x3, i8 %x4) {		define <8 x double>@test_int_x86_avx512_mask_shuf_pd_512(<8 x double> %x0, <8 x double> %x1, <8 x double> %x3, i8 %x4) {
; CHECK-LABEL: test_int_x86_avx512_mask_shuf_pd_512:		; CHECK-LABEL: test_int_x86_avx512_mask_shuf_pd_512:
; CHECK: ## BB#0:		; CHECK: ## BB#0:
; CHECK-NEXT: vshufpd {{.*#+}} zmm3 = zmm0[0],zmm1[1],zmm0[3],zmm1[2],zmm0[5],zmm1[4],zmm0[6],zmm1[6]		; CHECK-NEXT: vshufpd {{.*#+}} zmm3 = zmm0[0],zmm1[1],zmm0[3],zmm1[2],zmm0[5],zmm1[4],zmm0[6],zmm1[6]
; CHECK-NEXT: kmovw %edi, %k1		; CHECK-NEXT: kmovw %edi, %k1
; CHECK-NEXT: vshufpd {{.*#+}} zmm2 {%k1} = zmm0[0],zmm1[1],zmm0[3],zmm1[2],zmm0[5],zmm1[4],zmm0[6],zmm1[6]		; CHECK-NEXT: vshufpd {{.*#+}} zmm2 {%k1} = zmm0[0],zmm1[1],zmm0[3],zmm1[2],zmm0[5],zmm1[4],zmm0[6],zmm1[6]
▲ Show 20 Lines • Show All 1,998 Lines • Show Last 20 Lines

llvm/trunk/test/CodeGen/X86/avx512-intrinsics.ll

Show First 20 Lines • Show All 3,333 Lines • ▼ Show 20 Lines	; CHECK-NEXT: retq
%res4 = call i8 @llvm.x86.avx512.mask.cmp.ss(<4 x float> %x0, <4 x float> %x1, i32 5, i8 %x3, i32 8)		%res4 = call i8 @llvm.x86.avx512.mask.cmp.ss(<4 x float> %x0, <4 x float> %x1, i32 5, i8 %x3, i32 8)

%res11 = and i8 %res1, %res2		%res11 = and i8 %res1, %res2
%res12 = and i8 %res3, %res4		%res12 = and i8 %res3, %res4
%res13 = and i8 %res11, %res12		%res13 = and i8 %res11, %res12
ret i8 %res13		ret i8 %res13
}		}

declare <16 x float> @llvm.x86.avx512.mask.shuf.f32x4(<16 x float>, <16 x float>, i32, <16 x float>, i16)

; Calls llvm.x86.avx512.mask.shuf.f32x4 with immediate 22 twice -- with the
; caller-supplied mask %x4 and with an all-ones mask (i16 -1) -- and adds the
; results. Per the expectations below, immediate 22 picks 128-bit lanes 2 and 1
; of %x0 followed by lanes 1 and 0 of %x1.
define <16 x float>@test_int_x86_avx512_mask_shuf_f32x4(<16 x float> %x0, <16 x float> %x1, <16 x float> %x3, i16 %x4) {
; CHECK-LABEL: test_int_x86_avx512_mask_shuf_f32x4:
; CHECK: ## BB#0:
; CHECK-NEXT: kmovw %edi, %k1
; CHECK-NEXT: vshuff32x4 {{.*#+}} zmm2 {%k1} = zmm0[8,9,10,11,4,5,6,7],zmm1[4,5,6,7,0,1,2,3]
; CHECK-NEXT: vshuff32x4 {{.*#+}} zmm0 = zmm0[8,9,10,11,4,5,6,7],zmm1[4,5,6,7,0,1,2,3]
; CHECK-NEXT: vaddps %zmm0, %zmm2, %zmm0
; CHECK-NEXT: retq
%res = call <16 x float> @llvm.x86.avx512.mask.shuf.f32x4(<16 x float> %x0, <16 x float> %x1, i32 22, <16 x float> %x3, i16 %x4)
%res1 = call <16 x float> @llvm.x86.avx512.mask.shuf.f32x4(<16 x float> %x0, <16 x float> %x1, i32 22, <16 x float> %x3, i16 -1)
%res2 = fadd <16 x float> %res, %res1
ret <16 x float> %res2
}

declare <8 x double> @llvm.x86.avx512.mask.shuf.f64x2(<8 x double>, <8 x double>, i32, <8 x double>, i8)

; Calls llvm.x86.avx512.mask.shuf.f64x2 with immediate 22 in three forms and
; sums the results: merge-masked with %x4 over %x3, all-ones mask (i8 -1), and
; %x4 with a zeroinitializer pass-through (shown below as a {z} instruction).
; Immediate 22 picks 128-bit lanes 2 and 1 of %x0 followed by lanes 1 and 0 of
; %x1.
define <8 x double>@test_int_x86_avx512_mask_shuf_f64x2(<8 x double> %x0, <8 x double> %x1, <8 x double> %x3, i8 %x4) {
; CHECK-LABEL: test_int_x86_avx512_mask_shuf_f64x2:
; CHECK: ## BB#0:
; CHECK-NEXT: kmovw %edi, %k1
; CHECK-NEXT: vshuff64x2 {{.*#+}} zmm3 {%k1} {z} = zmm0[4,5,2,3],zmm1[2,3,0,1]
; CHECK-NEXT: vshuff64x2 {{.*#+}} zmm2 {%k1} = zmm0[4,5,2,3],zmm1[2,3,0,1]
; CHECK-NEXT: vshuff64x2 {{.*#+}} zmm0 = zmm0[4,5,2,3],zmm1[2,3,0,1]
; CHECK-NEXT: vaddpd %zmm0, %zmm2, %zmm0
; CHECK-NEXT: vaddpd %zmm3, %zmm0, %zmm0
; CHECK-NEXT: retq
%res = call <8 x double> @llvm.x86.avx512.mask.shuf.f64x2(<8 x double> %x0, <8 x double> %x1, i32 22, <8 x double> %x3, i8 %x4)
%res1 = call <8 x double> @llvm.x86.avx512.mask.shuf.f64x2(<8 x double> %x0, <8 x double> %x1, i32 22, <8 x double> %x3, i8 -1)
%res2 = call <8 x double> @llvm.x86.avx512.mask.shuf.f64x2(<8 x double> %x0, <8 x double> %x1, i32 22, <8 x double> zeroinitializer, i8 %x4)

%res3 = fadd <8 x double> %res, %res1
%res4 = fadd <8 x double> %res3, %res2
ret <8 x double> %res4
}

declare <16 x i32> @llvm.x86.avx512.mask.shuf.i32x4(<16 x i32>, <16 x i32>, i32, <16 x i32>, i16)

; Calls llvm.x86.avx512.mask.shuf.i32x4 with immediate 22 twice -- with the
; caller-supplied mask %x4 and with an all-ones mask (i16 -1) -- and adds the
; results. Immediate 22 picks 128-bit lanes 2 and 1 of %x0 followed by lanes 1
; and 0 of %x1.
define <16 x i32>@test_int_x86_avx512_mask_shuf_i32x4(<16 x i32> %x0, <16 x i32> %x1, <16 x i32> %x3, i16 %x4) {
; CHECK-LABEL: test_int_x86_avx512_mask_shuf_i32x4:
; CHECK: ## BB#0:
; CHECK-NEXT: kmovw %edi, %k1
; CHECK-NEXT: vshufi32x4 {{.*#+}} zmm2 {%k1} = zmm0[8,9,10,11,4,5,6,7],zmm1[4,5,6,7,0,1,2,3]
; CHECK-NEXT: vshufi32x4 {{.*#+}} zmm0 = zmm0[8,9,10,11,4,5,6,7],zmm1[4,5,6,7,0,1,2,3]
; CHECK-NEXT: vpaddd %zmm0, %zmm2, %zmm0
; CHECK-NEXT: retq
%res = call <16 x i32> @llvm.x86.avx512.mask.shuf.i32x4(<16 x i32> %x0, <16 x i32> %x1, i32 22, <16 x i32> %x3, i16 %x4)
%res1 = call <16 x i32> @llvm.x86.avx512.mask.shuf.i32x4(<16 x i32> %x0, <16 x i32> %x1, i32 22, <16 x i32> %x3, i16 -1)
%res2 = add <16 x i32> %res, %res1
ret <16 x i32> %res2
}

declare <8 x i64> @llvm.x86.avx512.mask.shuf.i64x2(<8 x i64>, <8 x i64>, i32, <8 x i64>, i8)

; Calls llvm.x86.avx512.mask.shuf.i64x2 with immediate 22 twice -- with the
; caller-supplied mask %x4 and with an all-ones mask (i8 -1) -- and adds the
; results. Immediate 22 picks 128-bit lanes 2 and 1 of %x0 followed by lanes 1
; and 0 of %x1.
define <8 x i64>@test_int_x86_avx512_mask_shuf_i64x2(<8 x i64> %x0, <8 x i64> %x1, <8 x i64> %x3, i8 %x4) {
; CHECK-LABEL: test_int_x86_avx512_mask_shuf_i64x2:
; CHECK: ## BB#0:
; CHECK-NEXT: kmovw %edi, %k1
; CHECK-NEXT: vshufi64x2 {{.*#+}} zmm2 {%k1} = zmm0[4,5,2,3],zmm1[2,3,0,1]
; CHECK-NEXT: vshufi64x2 {{.*#+}} zmm0 = zmm0[4,5,2,3],zmm1[2,3,0,1]
; CHECK-NEXT: vpaddq %zmm0, %zmm2, %zmm0
; CHECK-NEXT: retq
%res = call <8 x i64> @llvm.x86.avx512.mask.shuf.i64x2(<8 x i64> %x0, <8 x i64> %x1, i32 22, <8 x i64> %x3, i8 %x4)
%res1 = call <8 x i64> @llvm.x86.avx512.mask.shuf.i64x2(<8 x i64> %x0, <8 x i64> %x1, i32 22, <8 x i64> %x3, i8 -1)
%res2 = add <8 x i64> %res, %res1
ret <8 x i64> %res2
}

declare <8 x double> @llvm.x86.avx512.mask.getmant.pd.512(<8 x double>, i32, <8 x double>, i8, i32)		declare <8 x double> @llvm.x86.avx512.mask.getmant.pd.512(<8 x double>, i32, <8 x double>, i8, i32)

define <8 x double>@test_int_x86_avx512_mask_getmant_pd_512(<8 x double> %x0, <8 x double> %x2, i8 %x3) {		define <8 x double>@test_int_x86_avx512_mask_getmant_pd_512(<8 x double> %x0, <8 x double> %x2, i8 %x3) {
; CHECK-LABEL: test_int_x86_avx512_mask_getmant_pd_512:		; CHECK-LABEL: test_int_x86_avx512_mask_getmant_pd_512:
; CHECK: ## BB#0:		; CHECK: ## BB#0:
; CHECK-NEXT: kmovw %edi, %k1		; CHECK-NEXT: kmovw %edi, %k1
; CHECK-NEXT: vgetmantpd $11, %zmm0, %zmm1 {%k1}		; CHECK-NEXT: vgetmantpd $11, %zmm0, %zmm1 {%k1}
; CHECK-NEXT: vgetmantpd $11, {sae}, %zmm0, %zmm0		; CHECK-NEXT: vgetmantpd $11, {sae}, %zmm0, %zmm0
▲ Show 20 Lines • Show All 1,768 Lines • Show Last 20 Lines

llvm/trunk/test/CodeGen/X86/avx512vl-intrinsics-fast-isel.ll

	; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py			; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
	; RUN: llc < %s -fast-isel -mtriple=i386-unknown-unknown -mattr=+avx512f,+avx512vl \| FileCheck %s --check-prefix=ALL --check-prefix=X32			; RUN: llc < %s -fast-isel -mtriple=i386-unknown-unknown -mattr=+avx512f,+avx512vl \| FileCheck %s --check-prefix=ALL --check-prefix=X32
	; RUN: llc < %s -fast-isel -mtriple=x86_64-unknown-unknown -mattr=+avx512f,+avx512vl \| FileCheck %s --check-prefix=ALL --check-prefix=X64			; RUN: llc < %s -fast-isel -mtriple=x86_64-unknown-unknown -mattr=+avx512f,+avx512vl \| FileCheck %s --check-prefix=ALL --check-prefix=X64

	; NOTE: This should use IR equivalent to what is generated by clang/test/CodeGen/avx512vl-builtins.c			; NOTE: This should use IR equivalent to what is generated by clang/test/CodeGen/avx512vl-builtins.c

				; Unmasked 256-bit shuffle expressed as a plain shufflevector: the result
				; takes elements 4-7 of %__A followed by elements 4-7 of %__B (indices
				; 12-15 address the second operand). Both the X32 and X64 CHECK lines
				; expect a single vperm2f128.
				define <8 x float> @test_mm256_shuffle_f32x4(<8 x float> %__A, <8 x float> %__B) {
				; X32-LABEL: test_mm256_shuffle_f32x4:
				; X32: # BB#0: # %entry
				; X32-NEXT: vperm2f128 {{.*#+}} ymm0 = ymm0[2,3],ymm1[2,3]
				; X32-NEXT: retl
				;
				; X64-LABEL: test_mm256_shuffle_f32x4:
				; X64: # BB#0: # %entry
				; X64-NEXT: vperm2f128 {{.*#+}} ymm0 = ymm0[2,3],ymm1[2,3]
				; X64-NEXT: retq
				entry:
				%shuffle = shufflevector <8 x float> %__A, <8 x float> %__B, <8 x i32> <i32 4, i32 5, i32 6, i32 7, i32 12, i32 13, i32 14, i32 15>
				ret <8 x float> %shuffle
				}

				; Merge-masked form: the same shufflevector as the unmasked f32x4 test,
				; then a per-element select between the shuffle result and %__W, using
				; the 8 bits of %__U reinterpreted as an <8 x i1> mask. The CHECK lines
				; expect the mask moved into %k1 and a single masked vshuff32x4.
				define <8 x float> @test_mm256_mask_shuffle_f32x4(<8 x float> %__W, i8 zeroext %__U, <8 x float> %__A, <8 x float> %__B) {
				; X32-LABEL: test_mm256_mask_shuffle_f32x4:
				; X32: # BB#0: # %entry
				; X32-NEXT: movb {{[0-9]+}}(%esp), %al
				; X32-NEXT: kmovw %eax, %k1
				; X32-NEXT: vshuff32x4 {{.*#+}} ymm0 {%k1} = ymm1[4,5,6,7],ymm2[4,5,6,7]
				; X32-NEXT: retl
				;
				; X64-LABEL: test_mm256_mask_shuffle_f32x4:
				; X64: # BB#0: # %entry
				; X64-NEXT: kmovw %edi, %k1
				; X64-NEXT: vshuff32x4 {{.*#+}} ymm0 {%k1} = ymm1[4,5,6,7],ymm2[4,5,6,7]
				; X64-NEXT: retq
				entry:
				%shuffle = shufflevector <8 x float> %__A, <8 x float> %__B, <8 x i32> <i32 4, i32 5, i32 6, i32 7, i32 12, i32 13, i32 14, i32 15>
				%0 = bitcast i8 %__U to <8 x i1>
				%1 = select <8 x i1> %0, <8 x float> %shuffle, <8 x float> %__W
				ret <8 x float> %1
				}

				; Zero-masked form: the shuffle result is selected per element against
				; zeroinitializer, using %__U reinterpreted as an <8 x i1> mask. The
				; CHECK lines expect a single vshuff32x4 with {%k1} {z}.
				define <8 x float> @test_mm256_maskz_shuffle_f32x4(i8 zeroext %__U, <8 x float> %__A, <8 x float> %__B) {
				; X32-LABEL: test_mm256_maskz_shuffle_f32x4:
				; X32: # BB#0: # %entry
				; X32-NEXT: movb {{[0-9]+}}(%esp), %al
				; X32-NEXT: kmovw %eax, %k1
				; X32-NEXT: vshuff32x4 {{.*#+}} ymm0 {%k1} {z} = ymm0[4,5,6,7],ymm1[4,5,6,7]
				; X32-NEXT: retl
				;
				; X64-LABEL: test_mm256_maskz_shuffle_f32x4:
				; X64: # BB#0: # %entry
				; X64-NEXT: kmovw %edi, %k1
				; X64-NEXT: vshuff32x4 {{.*#+}} ymm0 {%k1} {z} = ymm0[4,5,6,7],ymm1[4,5,6,7]
				; X64-NEXT: retq
				entry:
				%shuffle = shufflevector <8 x float> %__A, <8 x float> %__B, <8 x i32> <i32 4, i32 5, i32 6, i32 7, i32 12, i32 13, i32 14, i32 15>
				%0 = bitcast i8 %__U to <8 x i1>
				%1 = select <8 x i1> %0, <8 x float> %shuffle, <8 x float> zeroinitializer
				ret <8 x float> %1
				}

				; Unmasked 256-bit shuffle on doubles: the result takes elements 2-3 of
				; %__A followed by elements 2-3 of %__B (indices 6-7 address the second
				; operand). Both the X32 and X64 CHECK lines expect a single vperm2f128.
				define <4 x double> @test_mm256_shuffle_f64x2(<4 x double> %__A, <4 x double> %__B) {
				; X32-LABEL: test_mm256_shuffle_f64x2:
				; X32: # BB#0: # %entry
				; X32-NEXT: vperm2f128 {{.*#+}} ymm0 = ymm0[2,3],ymm1[2,3]
				; X32-NEXT: retl
				;
				; X64-LABEL: test_mm256_shuffle_f64x2:
				; X64: # BB#0: # %entry
				; X64-NEXT: vperm2f128 {{.*#+}} ymm0 = ymm0[2,3],ymm1[2,3]
				; X64-NEXT: retq
				entry:
				%shuffle = shufflevector <4 x double> %__A, <4 x double> %__B, <4 x i32> <i32 2, i32 3, i32 6, i32 7>
				ret <4 x double> %shuffle
				}

				; Merge-masked form on doubles. Only four elements exist, so the i8 mask
				; is bitcast to <8 x i1> and its low four lanes are extracted before the
				; select between the shuffle result and %__W. The CHECK lines expect a
				; single masked vshuff64x2.
				define <4 x double> @test_mm256_mask_shuffle_f64x2(<4 x double> %__W, i8 zeroext %__U, <4 x double> %__A, <4 x double> %__B) {
				; X32-LABEL: test_mm256_mask_shuffle_f64x2:
				; X32: # BB#0: # %entry
				; X32-NEXT: movb {{[0-9]+}}(%esp), %al
				; X32-NEXT: kmovw %eax, %k1
				; X32-NEXT: vshuff64x2 {{.*#+}} ymm0 {%k1} = ymm1[2,3],ymm2[2,3]
				; X32-NEXT: retl
				;
				; X64-LABEL: test_mm256_mask_shuffle_f64x2:
				; X64: # BB#0: # %entry
				; X64-NEXT: kmovw %edi, %k1
				; X64-NEXT: vshuff64x2 {{.*#+}} ymm0 {%k1} = ymm1[2,3],ymm2[2,3]
				; X64-NEXT: retq
				entry:
				%shuffle = shufflevector <4 x double> %__A, <4 x double> %__B, <4 x i32> <i32 2, i32 3, i32 6, i32 7>
				%0 = bitcast i8 %__U to <8 x i1>
				%extract = shufflevector <8 x i1> %0, <8 x i1> undef, <4 x i32> <i32 0, i32 1, i32 2, i32 3>
				%1 = select <4 x i1> %extract, <4 x double> %shuffle, <4 x double> %__W
				ret <4 x double> %1
				}

				; Zero-masked form on doubles: the low four lanes of the bitcast i8 mask
				; select between the shuffle result and zeroinitializer. The CHECK lines
				; expect a single vshuff64x2 with {%k1} {z}.
				define <4 x double> @test_mm256_maskz_shuffle_f64x2(i8 zeroext %__U, <4 x double> %__A, <4 x double> %__B) {
				; X32-LABEL: test_mm256_maskz_shuffle_f64x2:
				; X32: # BB#0: # %entry
				; X32-NEXT: movb {{[0-9]+}}(%esp), %al
				; X32-NEXT: kmovw %eax, %k1
				; X32-NEXT: vshuff64x2 {{.*#+}} ymm0 {%k1} {z} = ymm0[2,3],ymm1[2,3]
				; X32-NEXT: retl
				;
				; X64-LABEL: test_mm256_maskz_shuffle_f64x2:
				; X64: # BB#0: # %entry
				; X64-NEXT: kmovw %edi, %k1
				; X64-NEXT: vshuff64x2 {{.*#+}} ymm0 {%k1} {z} = ymm0[2,3],ymm1[2,3]
				; X64-NEXT: retq
				entry:
				%shuffle = shufflevector <4 x double> %__A, <4 x double> %__B, <4 x i32> <i32 2, i32 3, i32 6, i32 7>
				%0 = bitcast i8 %__U to <8 x i1>
				%extract = shufflevector <8 x i1> %0, <8 x i1> undef, <4 x i32> <i32 0, i32 1, i32 2, i32 3>
				%1 = select <4 x i1> %extract, <4 x double> %shuffle, <4 x double> zeroinitializer
				ret <4 x double> %1
				}

				; Unmasked 256-bit integer shuffle. The operands are typed <4 x i64> and
				; the shufflevector takes elements 2-3 of %__A followed by elements 2-3
				; of %__B. Both the X32 and X64 CHECK lines expect a single vperm2i128.
				define <4 x i64> @test_mm256_shuffle_i32x4(<4 x i64> %__A, <4 x i64> %__B) {
				; X32-LABEL: test_mm256_shuffle_i32x4:
				; X32: # BB#0: # %entry
				; X32-NEXT: vperm2i128 {{.*#+}} ymm0 = ymm0[2,3],ymm1[2,3]
				; X32-NEXT: retl
				;
				; X64-LABEL: test_mm256_shuffle_i32x4:
				; X64: # BB#0: # %entry
				; X64-NEXT: vperm2i128 {{.*#+}} ymm0 = ymm0[2,3],ymm1[2,3]
				; X64-NEXT: retq
				entry:
				%shuffle = shufflevector <4 x i64> %__A, <4 x i64> %__B, <4 x i32> <i32 2, i32 3, i32 6, i32 7>
				ret <4 x i64> %shuffle
				}

				; Merge-masked 32-bit-element form. The shuffle is done on <4 x i64>;
				; both the shuffle result and %__W are then bitcast to <8 x i32> so the
				; 8-bit mask %__U selects individual 32-bit elements, and the selected
				; vector is bitcast back to <4 x i64>. The CHECK lines expect a single
				; masked vshufi32x4.
				define <4 x i64> @test_mm256_mask_shuffle_i32x4(<4 x i64> %__W, i8 zeroext %__U, <4 x i64> %__A, <4 x i64> %__B) {
				; X32-LABEL: test_mm256_mask_shuffle_i32x4:
				; X32: # BB#0: # %entry
				; X32-NEXT: movb {{[0-9]+}}(%esp), %al
				; X32-NEXT: kmovw %eax, %k1
				; X32-NEXT: vshufi32x4 {{.*#+}} ymm0 {%k1} = ymm1[4,5,6,7],ymm2[4,5,6,7]
				; X32-NEXT: retl
				;
				; X64-LABEL: test_mm256_mask_shuffle_i32x4:
				; X64: # BB#0: # %entry
				; X64-NEXT: kmovw %edi, %k1
				; X64-NEXT: vshufi32x4 {{.*#+}} ymm0 {%k1} = ymm1[4,5,6,7],ymm2[4,5,6,7]
				; X64-NEXT: retq
				entry:
				%shuffle = shufflevector <4 x i64> %__A, <4 x i64> %__B, <4 x i32> <i32 2, i32 3, i32 6, i32 7>
				%0 = bitcast <4 x i64> %shuffle to <8 x i32>
				%1 = bitcast <4 x i64> %__W to <8 x i32>
				%2 = bitcast i8 %__U to <8 x i1>
				%3 = select <8 x i1> %2, <8 x i32> %0, <8 x i32> %1
				%4 = bitcast <8 x i32> %3 to <4 x i64>
				ret <4 x i64> %4
				}

				; Zero-masked 32-bit-element form. The <4 x i64> shuffle result is
				; bitcast to <8 x i32>, selected per element against zeroinitializer
				; under the 8-bit mask %__U, and bitcast back to <4 x i64>. The CHECK
				; lines expect a single vshufi32x4 with {%k1} {z}.
				define <4 x i64> @test_mm256_maskz_shuffle_i32x4(i8 zeroext %__U, <4 x i64> %__A, <4 x i64> %__B) {
				; X32-LABEL: test_mm256_maskz_shuffle_i32x4:
				; X32: # BB#0: # %entry
				; X32-NEXT: movb {{[0-9]+}}(%esp), %al
				; X32-NEXT: kmovw %eax, %k1
				; X32-NEXT: vshufi32x4 {{.*#+}} ymm0 {%k1} {z} = ymm0[4,5,6,7],ymm1[4,5,6,7]
				; X32-NEXT: retl
				;
				; X64-LABEL: test_mm256_maskz_shuffle_i32x4:
				; X64: # BB#0: # %entry
				; X64-NEXT: kmovw %edi, %k1
				; X64-NEXT: vshufi32x4 {{.*#+}} ymm0 {%k1} {z} = ymm0[4,5,6,7],ymm1[4,5,6,7]
				; X64-NEXT: retq
				entry:
				%shuffle = shufflevector <4 x i64> %__A, <4 x i64> %__B, <4 x i32> <i32 2, i32 3, i32 6, i32 7>
				%0 = bitcast <4 x i64> %shuffle to <8 x i32>
				%1 = bitcast i8 %__U to <8 x i1>
				%2 = select <8 x i1> %1, <8 x i32> %0, <8 x i32> zeroinitializer
				%3 = bitcast <8 x i32> %2 to <4 x i64>
				ret <4 x i64> %3
				}

				; Unmasked 256-bit shuffle on 64-bit integers: the result takes elements
				; 2-3 of %__A followed by elements 2-3 of %__B. Both the X32 and X64
				; CHECK lines expect a single vperm2i128.
				define <4 x i64> @test_mm256_shuffle_i64x2(<4 x i64> %__A, <4 x i64> %__B) {
				; X32-LABEL: test_mm256_shuffle_i64x2:
				; X32: # BB#0: # %entry
				; X32-NEXT: vperm2i128 {{.*#+}} ymm0 = ymm0[2,3],ymm1[2,3]
				; X32-NEXT: retl
				;
				; X64-LABEL: test_mm256_shuffle_i64x2:
				; X64: # BB#0: # %entry
				; X64-NEXT: vperm2i128 {{.*#+}} ymm0 = ymm0[2,3],ymm1[2,3]
				; X64-NEXT: retq
				entry:
				%shuffle = shufflevector <4 x i64> %__A, <4 x i64> %__B, <4 x i32> <i32 2, i32 3, i32 6, i32 7>
				ret <4 x i64> %shuffle
				}

				; Merge-masked form on 64-bit integers. The i8 mask is bitcast to
				; <8 x i1> and its low four lanes are extracted before the select
				; between the shuffle result and %__W. The CHECK lines expect a single
				; masked vshufi64x2.
				define <4 x i64> @test_mm256_mask_shuffle_i64x2(<4 x i64> %__W, i8 zeroext %__U, <4 x i64> %__A, <4 x i64> %__B) {
				; X32-LABEL: test_mm256_mask_shuffle_i64x2:
				; X32: # BB#0: # %entry
				; X32-NEXT: movb {{[0-9]+}}(%esp), %al
				; X32-NEXT: kmovw %eax, %k1
				; X32-NEXT: vshufi64x2 {{.*#+}} ymm0 {%k1} = ymm1[2,3],ymm2[2,3]
				; X32-NEXT: retl
				;
				; X64-LABEL: test_mm256_mask_shuffle_i64x2:
				; X64: # BB#0: # %entry
				; X64-NEXT: kmovw %edi, %k1
				; X64-NEXT: vshufi64x2 {{.*#+}} ymm0 {%k1} = ymm1[2,3],ymm2[2,3]
				; X64-NEXT: retq
				entry:
				%shuffle = shufflevector <4 x i64> %__A, <4 x i64> %__B, <4 x i32> <i32 2, i32 3, i32 6, i32 7>
				%0 = bitcast i8 %__U to <8 x i1>
				%extract = shufflevector <8 x i1> %0, <8 x i1> undef, <4 x i32> <i32 0, i32 1, i32 2, i32 3>
				%1 = select <4 x i1> %extract, <4 x i64> %shuffle, <4 x i64> %__W
				ret <4 x i64> %1
				}

				; Zero-masked form on 64-bit integers: the low four lanes of the bitcast
				; i8 mask select between the shuffle result and zeroinitializer. The
				; CHECK lines expect a single vshufi64x2 with {%k1} {z}.
				define <4 x i64> @test_mm256_maskz_shuffle_i64x2(i8 zeroext %__U, <4 x i64> %__A, <4 x i64> %__B) {
				; X32-LABEL: test_mm256_maskz_shuffle_i64x2:
				; X32: # BB#0: # %entry
				; X32-NEXT: movb {{[0-9]+}}(%esp), %al
				; X32-NEXT: kmovw %eax, %k1
				; X32-NEXT: vshufi64x2 {{.*#+}} ymm0 {%k1} {z} = ymm0[2,3],ymm1[2,3]
				; X32-NEXT: retl
				;
				; X64-LABEL: test_mm256_maskz_shuffle_i64x2:
				; X64: # BB#0: # %entry
				; X64-NEXT: kmovw %edi, %k1
				; X64-NEXT: vshufi64x2 {{.*#+}} ymm0 {%k1} {z} = ymm0[2,3],ymm1[2,3]
				; X64-NEXT: retq
				entry:
				%shuffle = shufflevector <4 x i64> %__A, <4 x i64> %__B, <4 x i32> <i32 2, i32 3, i32 6, i32 7>
				%0 = bitcast i8 %__U to <8 x i1>
				%extract = shufflevector <8 x i1> %0, <8 x i1> undef, <4 x i32> <i32 0, i32 1, i32 2, i32 3>
				%1 = select <4 x i1> %extract, <4 x i64> %shuffle, <4 x i64> zeroinitializer
				ret <4 x i64> %1
				}

	define <2 x i64> @test_mm_mask_set1_epi32(<2 x i64> %__O, i8 zeroext %__M) {			define <2 x i64> @test_mm_mask_set1_epi32(<2 x i64> %__O, i8 zeroext %__M) {
	; X32-LABEL: test_mm_mask_set1_epi32:			; X32-LABEL: test_mm_mask_set1_epi32:
	; X32: # BB#0: # %entry			; X32: # BB#0: # %entry
	; X32-NEXT: movb {{[0-9]+}}(%esp), %al			; X32-NEXT: movb {{[0-9]+}}(%esp), %al
	; X32-NEXT: kmovw %eax, %k1			; X32-NEXT: kmovw %eax, %k1
	; X32-NEXT: vpbroadcastd {{\.LCPI.*}}, %xmm0 {%k1}			; X32-NEXT: vpbroadcastd {{\.LCPI.*}}, %xmm0 {%k1}
	; X32-NEXT: retl			; X32-NEXT: retl
	;			;
	▲ Show 20 Lines • Show All 1,548 Lines • Show Last 20 Lines

llvm/trunk/test/CodeGen/X86/avx512vl-intrinsics-upgrade.ll

This file is larger than 256 KB, so syntax highlighting is disabled by default.

Show First 20 Lines • Show All 3,245 Lines • ▼ Show 20 Lines
; CHECK: ## BB#0:		; CHECK: ## BB#0:
; CHECK-NEXT: vdivps %xmm1, %xmm0, %xmm0 ## EVEX TO VEX Compression encoding: [0xc5,0xf8,0x5e,0xc1]		; CHECK-NEXT: vdivps %xmm1, %xmm0, %xmm0 ## EVEX TO VEX Compression encoding: [0xc5,0xf8,0x5e,0xc1]
; CHECK-NEXT: retq ## encoding: [0xc3]		; CHECK-NEXT: retq ## encoding: [0xc3]
%res = call <4 x float> @llvm.x86.avx512.mask.div.ps.128(<4 x float> %a0, <4 x float> %a1, <4 x float>zeroinitializer, i8 -1)		%res = call <4 x float> @llvm.x86.avx512.mask.div.ps.128(<4 x float> %a0, <4 x float> %a1, <4 x float>zeroinitializer, i8 -1)
ret <4 x float> %res		ret <4 x float> %res
}		}
declare <4 x float> @llvm.x86.avx512.mask.div.ps.128(<4 x float>, <4 x float>, <4 x float>, i8)		declare <4 x float> @llvm.x86.avx512.mask.div.ps.128(<4 x float>, <4 x float>, <4 x float>, i8)

		; Declaration of the 256-bit masked shuffle intrinsic exercised below:
		; two <8 x float> sources, an i32 immediate, a further <8 x float>
		; vector and an i8 mask.
		declare <8 x float> @llvm.x86.avx512.mask.shuf.f32x4.256(<8 x float>, <8 x float>, i32, <8 x float>, i8)

		; Calls the intrinsic three times with immediate 22: with %x3 under mask
		; %x4, with %x3 under an all-ones mask (i8 -1), and with zeroinitializer
		; under mask %x4. The three results are summed with fadd. In this file
		; the CHECK lines expect a vblendpd followed by merge- and zero-masked
		; vmovaps, not a vshuff32x4 instruction.
		define <8 x float>@test_int_x86_avx512_mask_shuf_f32x4_256(<8 x float> %x0, <8 x float> %x1, <8 x float> %x3, i8 %x4) {
		; CHECK-LABEL: test_int_x86_avx512_mask_shuf_f32x4_256:
		; CHECK: ## BB#0:
		; CHECK-NEXT: vblendpd $12, %ymm1, %ymm0, %ymm0 ## encoding: [0xc4,0xe3,0x7d,0x0d,0xc1,0x0c]
		; CHECK-NEXT: ## ymm0 = ymm0[0,1],ymm1[2,3]
		; CHECK-NEXT: kmovw %edi, %k1 ## encoding: [0xc5,0xf8,0x92,0xcf]
		; CHECK-NEXT: vmovaps %ymm0, %ymm2 {%k1} ## encoding: [0x62,0xf1,0x7c,0x29,0x28,0xd0]
		; CHECK-NEXT: vmovaps %ymm0, %ymm1 {%k1} {z} ## encoding: [0x62,0xf1,0x7c,0xa9,0x28,0xc8]
		; CHECK-NEXT: vaddps %ymm0, %ymm2, %ymm0 ## EVEX TO VEX Compression encoding: [0xc5,0xec,0x58,0xc0]
		; CHECK-NEXT: vaddps %ymm0, %ymm1, %ymm0 ## EVEX TO VEX Compression encoding: [0xc5,0xf4,0x58,0xc0]
		; CHECK-NEXT: retq ## encoding: [0xc3]
		%res = call <8 x float> @llvm.x86.avx512.mask.shuf.f32x4.256(<8 x float> %x0, <8 x float> %x1, i32 22, <8 x float> %x3, i8 %x4)
		%res1 = call <8 x float> @llvm.x86.avx512.mask.shuf.f32x4.256(<8 x float> %x0, <8 x float> %x1, i32 22, <8 x float> %x3, i8 -1)
		%res2 = call <8 x float> @llvm.x86.avx512.mask.shuf.f32x4.256(<8 x float> %x0, <8 x float> %x1, i32 22, <8 x float> zeroinitializer, i8 %x4)
		%res3 = fadd <8 x float> %res, %res1
		%res4 = fadd <8 x float> %res2, %res3
		ret <8 x float> %res4
		}

		; Declaration of the 256-bit masked shuffle intrinsic exercised below:
		; two <4 x double> sources, an i32 immediate, a further <4 x double>
		; vector and an i8 mask.
		declare <4 x double> @llvm.x86.avx512.mask.shuf.f64x2.256(<4 x double>, <4 x double>, i32, <4 x double>, i8)

		; Calls the intrinsic three times with immediate 22: with %x3 under mask
		; %x4, with %x3 under an all-ones mask (i8 -1), and with zeroinitializer
		; under mask %x4. The three results are summed with fadd. In this file
		; the CHECK lines expect a vblendpd followed by merge- and zero-masked
		; vmovapd, not a vshuff64x2 instruction.
		define <4 x double>@test_int_x86_avx512_mask_shuf_f64x2_256(<4 x double> %x0, <4 x double> %x1, <4 x double> %x3, i8 %x4) {
		; CHECK-LABEL: test_int_x86_avx512_mask_shuf_f64x2_256:
		; CHECK: ## BB#0:
		; CHECK-NEXT: vblendpd $12, %ymm1, %ymm0, %ymm0 ## encoding: [0xc4,0xe3,0x7d,0x0d,0xc1,0x0c]
		; CHECK-NEXT: ## ymm0 = ymm0[0,1],ymm1[2,3]
		; CHECK-NEXT: kmovw %edi, %k1 ## encoding: [0xc5,0xf8,0x92,0xcf]
		; CHECK-NEXT: vmovapd %ymm0, %ymm2 {%k1} ## encoding: [0x62,0xf1,0xfd,0x29,0x28,0xd0]
		; CHECK-NEXT: vmovapd %ymm0, %ymm1 {%k1} {z} ## encoding: [0x62,0xf1,0xfd,0xa9,0x28,0xc8]
		; CHECK-NEXT: vaddpd %ymm0, %ymm2, %ymm0 ## EVEX TO VEX Compression encoding: [0xc5,0xed,0x58,0xc0]
		; CHECK-NEXT: vaddpd %ymm0, %ymm1, %ymm0 ## EVEX TO VEX Compression encoding: [0xc5,0xf5,0x58,0xc0]
		; CHECK-NEXT: retq ## encoding: [0xc3]
		%res = call <4 x double> @llvm.x86.avx512.mask.shuf.f64x2.256(<4 x double> %x0, <4 x double> %x1, i32 22, <4 x double> %x3, i8 %x4)
		%res1 = call <4 x double> @llvm.x86.avx512.mask.shuf.f64x2.256(<4 x double> %x0, <4 x double> %x1, i32 22, <4 x double> %x3, i8 -1)
		%res2 = call <4 x double> @llvm.x86.avx512.mask.shuf.f64x2.256(<4 x double> %x0, <4 x double> %x1, i32 22, <4 x double> zeroinitializer, i8 %x4)
		%res3 = fadd <4 x double> %res, %res1
		%res4 = fadd <4 x double> %res2, %res3
		ret <4 x double> %res4
		}

		; Declaration of the 256-bit masked shuffle intrinsic exercised below:
		; two <8 x i32> sources, an i32 immediate, a further <8 x i32> vector
		; and an i8 mask.
		declare <8 x i32> @llvm.x86.avx512.mask.shuf.i32x4.256(<8 x i32>, <8 x i32>, i32, <8 x i32>, i8)

		; Calls the intrinsic twice with immediate 22 and %x3 as the fourth
		; operand: under mask %x4 and under an all-ones mask (i8 -1). The two
		; results are added. In this file the CHECK lines expect a vpblendd
		; followed by a masked vmovdqa32 and vpaddd, not a vshufi32x4.
		define <8 x i32>@test_int_x86_avx512_mask_shuf_i32x4_256(<8 x i32> %x0, <8 x i32> %x1, <8 x i32> %x3, i8 %x4) {
		; CHECK-LABEL: test_int_x86_avx512_mask_shuf_i32x4_256:
		; CHECK: ## BB#0:
		; CHECK-NEXT: vpblendd $240, %ymm1, %ymm0, %ymm0 ## encoding: [0xc4,0xe3,0x7d,0x02,0xc1,0xf0]
		; CHECK-NEXT: ## ymm0 = ymm0[0,1,2,3],ymm1[4,5,6,7]
		; CHECK-NEXT: kmovw %edi, %k1 ## encoding: [0xc5,0xf8,0x92,0xcf]
		; CHECK-NEXT: vmovdqa32 %ymm0, %ymm2 {%k1} ## encoding: [0x62,0xf1,0x7d,0x29,0x6f,0xd0]
		; CHECK-NEXT: vpaddd %ymm0, %ymm2, %ymm0 ## EVEX TO VEX Compression encoding: [0xc5,0xed,0xfe,0xc0]
		; CHECK-NEXT: retq ## encoding: [0xc3]
		%res = call <8 x i32> @llvm.x86.avx512.mask.shuf.i32x4.256(<8 x i32> %x0, <8 x i32> %x1, i32 22, <8 x i32> %x3, i8 %x4)
		%res1 = call <8 x i32> @llvm.x86.avx512.mask.shuf.i32x4.256(<8 x i32> %x0, <8 x i32> %x1, i32 22, <8 x i32> %x3, i8 -1)
		%res2 = add <8 x i32> %res, %res1
		ret <8 x i32> %res2
		}

		; Declaration of the 256-bit masked shuffle intrinsic exercised below:
		; two <4 x i64> sources, an i32 immediate, a further <4 x i64> vector
		; and an i8 mask.
		declare <4 x i64> @llvm.x86.avx512.mask.shuf.i64x2.256(<4 x i64>, <4 x i64>, i32, <4 x i64>, i8)

		; Calls the intrinsic twice with immediate 22 and %x3 as the fourth
		; operand: under mask %x4 and under an all-ones mask (i8 -1). The two
		; results are added. In this file the CHECK lines expect a vpblendd
		; followed by a masked vmovdqa64 and vpaddq, not a vshufi64x2.
		define <4 x i64>@test_int_x86_avx512_mask_shuf_i64x2_256(<4 x i64> %x0, <4 x i64> %x1, <4 x i64> %x3, i8 %x4) {
		; CHECK-LABEL: test_int_x86_avx512_mask_shuf_i64x2_256:
		; CHECK: ## BB#0:
		; CHECK-NEXT: vpblendd $240, %ymm1, %ymm0, %ymm0 ## encoding: [0xc4,0xe3,0x7d,0x02,0xc1,0xf0]
		; CHECK-NEXT: ## ymm0 = ymm0[0,1,2,3],ymm1[4,5,6,7]
		; CHECK-NEXT: kmovw %edi, %k1 ## encoding: [0xc5,0xf8,0x92,0xcf]
		; CHECK-NEXT: vmovdqa64 %ymm0, %ymm2 {%k1} ## encoding: [0x62,0xf1,0xfd,0x29,0x6f,0xd0]
		; CHECK-NEXT: vpaddq %ymm0, %ymm2, %ymm0 ## EVEX TO VEX Compression encoding: [0xc5,0xed,0xd4,0xc0]
		; CHECK-NEXT: retq ## encoding: [0xc3]
		%res = call <4 x i64> @llvm.x86.avx512.mask.shuf.i64x2.256(<4 x i64> %x0, <4 x i64> %x1, i32 22, <4 x i64> %x3, i8 %x4)
		%res1 = call <4 x i64> @llvm.x86.avx512.mask.shuf.i64x2.256(<4 x i64> %x0, <4 x i64> %x1, i32 22, <4 x i64> %x3, i8 -1)
		%res2 = add <4 x i64> %res, %res1
		ret <4 x i64> %res2
		}

declare <2 x double> @llvm.x86.avx512.mask.shuf.pd.128(<2 x double>, <2 x double>, i32, <2 x double>, i8)		declare <2 x double> @llvm.x86.avx512.mask.shuf.pd.128(<2 x double>, <2 x double>, i32, <2 x double>, i8)

define <2 x double>@test_int_x86_avx512_mask_shuf_pd_128(<2 x double> %x0, <2 x double> %x1, <2 x double> %x3, i8 %x4) {		define <2 x double>@test_int_x86_avx512_mask_shuf_pd_128(<2 x double> %x0, <2 x double> %x1, <2 x double> %x3, i8 %x4) {
; CHECK-LABEL: test_int_x86_avx512_mask_shuf_pd_128:		; CHECK-LABEL: test_int_x86_avx512_mask_shuf_pd_128:
; CHECK: ## BB#0:		; CHECK: ## BB#0:
; CHECK-NEXT: vshufpd $1, %xmm1, %xmm0, %xmm3 ## EVEX TO VEX Compression encoding: [0xc5,0xf9,0xc6,0xd9,0x01]		; CHECK-NEXT: vshufpd $1, %xmm1, %xmm0, %xmm3 ## EVEX TO VEX Compression encoding: [0xc5,0xf9,0xc6,0xd9,0x01]
; CHECK-NEXT: ## xmm3 = xmm0[1],xmm1[0]		; CHECK-NEXT: ## xmm3 = xmm0[1],xmm1[0]
; CHECK-NEXT: kmovw %edi, %k1 ## encoding: [0xc5,0xf8,0x92,0xcf]		; CHECK-NEXT: kmovw %edi, %k1 ## encoding: [0xc5,0xf8,0x92,0xcf]
▲ Show 20 Lines • Show All 742 Lines • ▼ Show 20 Lines	; CHECK-NEXT: retq ## encoding: [0xc3]
ret <8 x i32> %res4		ret <8 x i32> %res4
}		}

define <8 x i32>@test_int_x86_avx512_mask_psrav8_si_const() {		define <8 x i32>@test_int_x86_avx512_mask_psrav8_si_const() {
; CHECK-LABEL: test_int_x86_avx512_mask_psrav8_si_const:		; CHECK-LABEL: test_int_x86_avx512_mask_psrav8_si_const:
; CHECK: ## BB#0:		; CHECK: ## BB#0:
; CHECK-NEXT: vmovdqa {{.*}}(%rip), %ymm0 ## EVEX TO VEX Compression ymm0 = [2,9,4294967284,23,4294967270,37,4294967256,51]		; CHECK-NEXT: vmovdqa {{.*}}(%rip), %ymm0 ## EVEX TO VEX Compression ymm0 = [2,9,4294967284,23,4294967270,37,4294967256,51]
; CHECK-NEXT: ## encoding: [0xc5,0xfd,0x6f,0x05,A,A,A,A]		; CHECK-NEXT: ## encoding: [0xc5,0xfd,0x6f,0x05,A,A,A,A]
; CHECK-NEXT: ## fixup A - offset: 4, value: LCPI280_0-4, kind: reloc_riprel_4byte		; CHECK-NEXT: ## fixup A - offset: 4, value: LCPI284_0-4, kind: reloc_riprel_4byte
; CHECK-NEXT: vpsravd {{.*}}(%rip), %ymm0, %ymm0 ## EVEX TO VEX Compression encoding: [0xc4,0xe2,0x7d,0x46,0x05,A,A,A,A]		; CHECK-NEXT: vpsravd {{.*}}(%rip), %ymm0, %ymm0 ## EVEX TO VEX Compression encoding: [0xc4,0xe2,0x7d,0x46,0x05,A,A,A,A]
; CHECK-NEXT: ## fixup A - offset: 5, value: LCPI280_1-4, kind: reloc_riprel_4byte		; CHECK-NEXT: ## fixup A - offset: 5, value: LCPI284_1-4, kind: reloc_riprel_4byte
; CHECK-NEXT: retq ## encoding: [0xc3]		; CHECK-NEXT: retq ## encoding: [0xc3]
%res = call <8 x i32> @llvm.x86.avx512.mask.psrav8.si(<8 x i32> <i32 2, i32 9, i32 -12, i32 23, i32 -26, i32 37, i32 -40, i32 51>, <8 x i32> <i32 1, i32 18, i32 35, i32 52, i32 69, i32 15, i32 32, i32 49>, <8 x i32> zeroinitializer, i8 -1)		%res = call <8 x i32> @llvm.x86.avx512.mask.psrav8.si(<8 x i32> <i32 2, i32 9, i32 -12, i32 23, i32 -26, i32 37, i32 -40, i32 51>, <8 x i32> <i32 1, i32 18, i32 35, i32 52, i32 69, i32 15, i32 32, i32 49>, <8 x i32> zeroinitializer, i8 -1)
ret <8 x i32> %res		ret <8 x i32> %res
}		}

declare <2 x i64> @llvm.x86.avx512.mask.psllv2.di(<2 x i64>, <2 x i64>, <2 x i64>, i8)		declare <2 x i64> @llvm.x86.avx512.mask.psllv2.di(<2 x i64>, <2 x i64>, <2 x i64>, i8)

define <2 x i64>@test_int_x86_avx512_mask_psllv2_di(<2 x i64> %x0, <2 x i64> %x1, <2 x i64> %x2, i8 %x3) {		define <2 x i64>@test_int_x86_avx512_mask_psllv2_di(<2 x i64> %x0, <2 x i64> %x1, <2 x i64> %x2, i8 %x3) {
▲ Show 20 Lines • Show All 564 Lines • ▼ Show 20 Lines	; CHECK-NEXT: retq ## encoding: [0xc3]
ret <2 x i64> %res4		ret <2 x i64> %res4
}		}

define <2 x i64>@test_int_x86_avx512_mask_psrav_q_128_const(i8 %x3) {		define <2 x i64>@test_int_x86_avx512_mask_psrav_q_128_const(i8 %x3) {
; CHECK-LABEL: test_int_x86_avx512_mask_psrav_q_128_const:		; CHECK-LABEL: test_int_x86_avx512_mask_psrav_q_128_const:
; CHECK: ## BB#0:		; CHECK: ## BB#0:
; CHECK-NEXT: vmovdqa {{.*}}(%rip), %xmm0 ## EVEX TO VEX Compression xmm0 = [2,18446744073709551607]		; CHECK-NEXT: vmovdqa {{.*}}(%rip), %xmm0 ## EVEX TO VEX Compression xmm0 = [2,18446744073709551607]
; CHECK-NEXT: ## encoding: [0xc5,0xf9,0x6f,0x05,A,A,A,A]		; CHECK-NEXT: ## encoding: [0xc5,0xf9,0x6f,0x05,A,A,A,A]
; CHECK-NEXT: ## fixup A - offset: 4, value: LCPI308_0-4, kind: reloc_riprel_4byte		; CHECK-NEXT: ## fixup A - offset: 4, value: LCPI312_0-4, kind: reloc_riprel_4byte
; CHECK-NEXT: vpsravq {{.*}}(%rip), %xmm0, %xmm0 ## encoding: [0x62,0xf2,0xfd,0x08,0x46,0x05,A,A,A,A]		; CHECK-NEXT: vpsravq {{.*}}(%rip), %xmm0, %xmm0 ## encoding: [0x62,0xf2,0xfd,0x08,0x46,0x05,A,A,A,A]
; CHECK-NEXT: ## fixup A - offset: 6, value: LCPI308_1-4, kind: reloc_riprel_4byte		; CHECK-NEXT: ## fixup A - offset: 6, value: LCPI312_1-4, kind: reloc_riprel_4byte
; CHECK-NEXT: retq ## encoding: [0xc3]		; CHECK-NEXT: retq ## encoding: [0xc3]
%res = call <2 x i64> @llvm.x86.avx512.mask.psrav.q.128(<2 x i64> <i64 2, i64 -9>, <2 x i64> <i64 1, i64 90>, <2 x i64> zeroinitializer, i8 -1)		%res = call <2 x i64> @llvm.x86.avx512.mask.psrav.q.128(<2 x i64> <i64 2, i64 -9>, <2 x i64> <i64 1, i64 90>, <2 x i64> zeroinitializer, i8 -1)
ret <2 x i64> %res		ret <2 x i64> %res
}		}

declare <4 x i64> @llvm.x86.avx512.mask.psrav.q.256(<4 x i64>, <4 x i64>, <4 x i64>, i8)		declare <4 x i64> @llvm.x86.avx512.mask.psrav.q.256(<4 x i64>, <4 x i64>, <4 x i64>, i8)

define <4 x i64>@test_int_x86_avx512_mask_psrav_q_256(<4 x i64> %x0, <4 x i64> %x1, <4 x i64> %x2, i8 %x3) {		define <4 x i64>@test_int_x86_avx512_mask_psrav_q_256(<4 x i64> %x0, <4 x i64> %x1, <4 x i64> %x2, i8 %x3) {
▲ Show 20 Lines • Show All 1,313 Lines • Show Last 20 Lines

llvm/trunk/test/CodeGen/X86/avx512vl-intrinsics.ll

This file is larger than 256 KB, so syntax highlighting is disabled by default.

	Show First 20 Lines • Show All 2,713 Lines • ▼ Show 20 Lines
	; CHECK-NEXT: vaddps %ymm0, %ymm1, %ymm0 ## EVEX TO VEX Compression encoding: [0xc5,0xf4,0x58,0xc0]			; CHECK-NEXT: vaddps %ymm0, %ymm1, %ymm0 ## EVEX TO VEX Compression encoding: [0xc5,0xf4,0x58,0xc0]
	; CHECK-NEXT: retq ## encoding: [0xc3]			; CHECK-NEXT: retq ## encoding: [0xc3]
	%res = call <8 x float> @llvm.x86.avx512.mask.rndscale.ps.256(<8 x float> %x0, i32 5, <8 x float> %x2, i8 %x3)			%res = call <8 x float> @llvm.x86.avx512.mask.rndscale.ps.256(<8 x float> %x0, i32 5, <8 x float> %x2, i8 %x3)
	%res1 = call <8 x float> @llvm.x86.avx512.mask.rndscale.ps.256(<8 x float> %x0, i32 66, <8 x float> %x2, i8 -1)			%res1 = call <8 x float> @llvm.x86.avx512.mask.rndscale.ps.256(<8 x float> %x0, i32 66, <8 x float> %x2, i8 -1)
	%res2 = fadd <8 x float> %res, %res1			%res2 = fadd <8 x float> %res, %res1
	ret <8 x float> %res2			ret <8 x float> %res2
	}			}

	; Declaration of the 256-bit masked shuffle intrinsic exercised below:
	; two <8 x float> sources, an i32 immediate, a further <8 x float> vector
	; and an i8 mask.
	declare <8 x float> @llvm.x86.avx512.mask.shuf.f32x4.256(<8 x float>, <8 x float>, i32, <8 x float>, i8)

	; Calls the intrinsic three times with immediate 22: with %x3 under mask
	; %x4, with %x3 under an all-ones mask (i8 -1), and with zeroinitializer
	; under mask %x4. The three results are summed with fadd. The CHECK lines
	; expect a zero-masked and a merge-masked vshuff32x4 $22, plus a
	; vperm2f128 $48 for the all-ones-mask call.
	define <8 x float>@test_int_x86_avx512_mask_shuf_f32x4_256(<8 x float> %x0, <8 x float> %x1, <8 x float> %x3, i8 %x4) {
	; CHECK-LABEL: test_int_x86_avx512_mask_shuf_f32x4_256:
	; CHECK: ## BB#0:
	; CHECK-NEXT: kmovw %edi, %k1 ## encoding: [0xc5,0xf8,0x92,0xcf]
	; CHECK-NEXT: vshuff32x4 $22, %ymm1, %ymm0, %ymm3 {%k1} {z} ## encoding: [0x62,0xf3,0x7d,0xa9,0x23,0xd9,0x16]
	; CHECK-NEXT: ## ymm3 {%k1} {z} = ymm0[0,1,2,3],ymm1[4,5,6,7]
	; CHECK-NEXT: vshuff32x4 $22, %ymm1, %ymm0, %ymm2 {%k1} ## encoding: [0x62,0xf3,0x7d,0x29,0x23,0xd1,0x16]
	; CHECK-NEXT: ## ymm2 {%k1} = ymm0[0,1,2,3],ymm1[4,5,6,7]
	; CHECK-NEXT: vperm2f128 $48, %ymm1, %ymm0, %ymm0 ## EVEX TO VEX Compression encoding: [0xc4,0xe3,0x7d,0x06,0xc1,0x30]
	; CHECK-NEXT: ## ymm0 = ymm0[0,1],ymm1[2,3]
	; CHECK-NEXT: vaddps %ymm0, %ymm2, %ymm0 ## EVEX TO VEX Compression encoding: [0xc5,0xec,0x58,0xc0]
	; CHECK-NEXT: vaddps %ymm0, %ymm3, %ymm0 ## EVEX TO VEX Compression encoding: [0xc5,0xe4,0x58,0xc0]
	; CHECK-NEXT: retq ## encoding: [0xc3]
	%res = call <8 x float> @llvm.x86.avx512.mask.shuf.f32x4.256(<8 x float> %x0, <8 x float> %x1, i32 22, <8 x float> %x3, i8 %x4)
	%res1 = call <8 x float> @llvm.x86.avx512.mask.shuf.f32x4.256(<8 x float> %x0, <8 x float> %x1, i32 22, <8 x float> %x3, i8 -1)
	%res2 = call <8 x float> @llvm.x86.avx512.mask.shuf.f32x4.256(<8 x float> %x0, <8 x float> %x1, i32 22, <8 x float> zeroinitializer, i8 %x4)
	%res3 = fadd <8 x float> %res, %res1
	%res4 = fadd <8 x float> %res2, %res3
	ret <8 x float> %res4
	}

	; Declaration of the 256-bit masked shuffle intrinsic exercised below:
	; two <4 x double> sources, an i32 immediate, a further <4 x double>
	; vector and an i8 mask.
	declare <4 x double> @llvm.x86.avx512.mask.shuf.f64x2.256(<4 x double>, <4 x double>, i32, <4 x double>, i8)

	; Calls the intrinsic three times with immediate 22: with %x3 under mask
	; %x4, with %x3 under an all-ones mask (i8 -1), and with zeroinitializer
	; under mask %x4. The three results are summed with fadd. The CHECK lines
	; expect a zero-masked and a merge-masked vshuff64x2 $22, plus a
	; vperm2f128 $48 for the all-ones-mask call.
	define <4 x double>@test_int_x86_avx512_mask_shuf_f64x2_256(<4 x double> %x0, <4 x double> %x1, <4 x double> %x3, i8 %x4) {
	; CHECK-LABEL: test_int_x86_avx512_mask_shuf_f64x2_256:
	; CHECK: ## BB#0:
	; CHECK-NEXT: kmovw %edi, %k1 ## encoding: [0xc5,0xf8,0x92,0xcf]
	; CHECK-NEXT: vshuff64x2 $22, %ymm1, %ymm0, %ymm3 {%k1} {z} ## encoding: [0x62,0xf3,0xfd,0xa9,0x23,0xd9,0x16]
	; CHECK-NEXT: ## ymm3 {%k1} {z} = ymm0[0,1],ymm1[2,3]
	; CHECK-NEXT: vshuff64x2 $22, %ymm1, %ymm0, %ymm2 {%k1} ## encoding: [0x62,0xf3,0xfd,0x29,0x23,0xd1,0x16]
	; CHECK-NEXT: ## ymm2 {%k1} = ymm0[0,1],ymm1[2,3]
	; CHECK-NEXT: vperm2f128 $48, %ymm1, %ymm0, %ymm0 ## EVEX TO VEX Compression encoding: [0xc4,0xe3,0x7d,0x06,0xc1,0x30]
	; CHECK-NEXT: ## ymm0 = ymm0[0,1],ymm1[2,3]
	; CHECK-NEXT: vaddpd %ymm0, %ymm2, %ymm0 ## EVEX TO VEX Compression encoding: [0xc5,0xed,0x58,0xc0]
	; CHECK-NEXT: vaddpd %ymm0, %ymm3, %ymm0 ## EVEX TO VEX Compression encoding: [0xc5,0xe5,0x58,0xc0]
	; CHECK-NEXT: retq ## encoding: [0xc3]
	%res = call <4 x double> @llvm.x86.avx512.mask.shuf.f64x2.256(<4 x double> %x0, <4 x double> %x1, i32 22, <4 x double> %x3, i8 %x4)
	%res1 = call <4 x double> @llvm.x86.avx512.mask.shuf.f64x2.256(<4 x double> %x0, <4 x double> %x1, i32 22, <4 x double> %x3, i8 -1)
	%res2 = call <4 x double> @llvm.x86.avx512.mask.shuf.f64x2.256(<4 x double> %x0, <4 x double> %x1, i32 22, <4 x double> zeroinitializer, i8 %x4)
	%res3 = fadd <4 x double> %res, %res1
	%res4 = fadd <4 x double> %res2, %res3
	ret <4 x double> %res4
	}

	; Declaration of the 256-bit masked shuffle intrinsic exercised below:
	; two <8 x i32> sources, an i32 immediate, a further <8 x i32> vector and
	; an i8 mask.
	declare <8 x i32> @llvm.x86.avx512.mask.shuf.i32x4.256(<8 x i32>, <8 x i32>, i32, <8 x i32>, i8)

	; Calls the intrinsic twice with immediate 22 and %x3 as the fourth
	; operand: under mask %x4 and under an all-ones mask (i8 -1). The two
	; results are added. The CHECK lines expect a merge-masked vshufi32x4 $22,
	; a vperm2i128 $48 for the all-ones-mask call, and vpaddd.
	define <8 x i32>@test_int_x86_avx512_mask_shuf_i32x4_256(<8 x i32> %x0, <8 x i32> %x1, <8 x i32> %x3, i8 %x4) {
	; CHECK-LABEL: test_int_x86_avx512_mask_shuf_i32x4_256:
	; CHECK: ## BB#0:
	; CHECK-NEXT: kmovw %edi, %k1 ## encoding: [0xc5,0xf8,0x92,0xcf]
	; CHECK-NEXT: vshufi32x4 $22, %ymm1, %ymm0, %ymm2 {%k1} ## encoding: [0x62,0xf3,0x7d,0x29,0x43,0xd1,0x16]
	; CHECK-NEXT: ## ymm2 {%k1} = ymm0[0,1,2,3],ymm1[4,5,6,7]
	; CHECK-NEXT: vperm2i128 $48, %ymm1, %ymm0, %ymm0 ## EVEX TO VEX Compression encoding: [0xc4,0xe3,0x7d,0x46,0xc1,0x30]
	; CHECK-NEXT: ## ymm0 = ymm0[0,1],ymm1[2,3]
	; CHECK-NEXT: vpaddd %ymm0, %ymm2, %ymm0 ## EVEX TO VEX Compression encoding: [0xc5,0xed,0xfe,0xc0]
	; CHECK-NEXT: retq ## encoding: [0xc3]
	%res = call <8 x i32> @llvm.x86.avx512.mask.shuf.i32x4.256(<8 x i32> %x0, <8 x i32> %x1, i32 22, <8 x i32> %x3, i8 %x4)
	%res1 = call <8 x i32> @llvm.x86.avx512.mask.shuf.i32x4.256(<8 x i32> %x0, <8 x i32> %x1, i32 22, <8 x i32> %x3, i8 -1)
	%res2 = add <8 x i32> %res, %res1
	ret <8 x i32> %res2
	}

	; Declaration of the 256-bit masked shuffle intrinsic exercised below:
	; two <4 x i64> sources, an i32 immediate, a further <4 x i64> vector and
	; an i8 mask.
	declare <4 x i64> @llvm.x86.avx512.mask.shuf.i64x2.256(<4 x i64>, <4 x i64>, i32, <4 x i64>, i8)

	; Calls the intrinsic twice with immediate 22 and %x3 as the fourth
	; operand: under mask %x4 and under an all-ones mask (i8 -1). The two
	; results are added. The CHECK lines expect a merge-masked vshufi64x2 $22,
	; a vperm2i128 $48 for the all-ones-mask call, and vpaddq.
	define <4 x i64>@test_int_x86_avx512_mask_shuf_i64x2_256(<4 x i64> %x0, <4 x i64> %x1, <4 x i64> %x3, i8 %x4) {
	; CHECK-LABEL: test_int_x86_avx512_mask_shuf_i64x2_256:
	; CHECK: ## BB#0:
	; CHECK-NEXT: kmovw %edi, %k1 ## encoding: [0xc5,0xf8,0x92,0xcf]
	; CHECK-NEXT: vshufi64x2 $22, %ymm1, %ymm0, %ymm2 {%k1} ## encoding: [0x62,0xf3,0xfd,0x29,0x43,0xd1,0x16]
	; CHECK-NEXT: ## ymm2 {%k1} = ymm0[0,1],ymm1[2,3]
	; CHECK-NEXT: vperm2i128 $48, %ymm1, %ymm0, %ymm0 ## EVEX TO VEX Compression encoding: [0xc4,0xe3,0x7d,0x46,0xc1,0x30]
	; CHECK-NEXT: ## ymm0 = ymm0[0,1],ymm1[2,3]
	; CHECK-NEXT: vpaddq %ymm0, %ymm2, %ymm0 ## EVEX TO VEX Compression encoding: [0xc5,0xed,0xd4,0xc0]
	; CHECK-NEXT: retq ## encoding: [0xc3]
	%res = call <4 x i64> @llvm.x86.avx512.mask.shuf.i64x2.256(<4 x i64> %x0, <4 x i64> %x1, i32 22, <4 x i64> %x3, i8 %x4)
	%res1 = call <4 x i64> @llvm.x86.avx512.mask.shuf.i64x2.256(<4 x i64> %x0, <4 x i64> %x1, i32 22, <4 x i64> %x3, i8 -1)
	%res2 = add <4 x i64> %res, %res1
	ret <4 x i64> %res2
	}

	declare <2 x double> @llvm.x86.avx512.mask.getmant.pd.128(<2 x double>, i32, <2 x double>, i8)			declare <2 x double> @llvm.x86.avx512.mask.getmant.pd.128(<2 x double>, i32, <2 x double>, i8)

	define <2 x double>@test_int_x86_avx512_mask_getmant_pd_128(<2 x double> %x0, <2 x double> %x2, i8 %x3) {			define <2 x double>@test_int_x86_avx512_mask_getmant_pd_128(<2 x double> %x0, <2 x double> %x2, i8 %x3) {
	; CHECK-LABEL: test_int_x86_avx512_mask_getmant_pd_128:			; CHECK-LABEL: test_int_x86_avx512_mask_getmant_pd_128:
	; CHECK: ## BB#0:			; CHECK: ## BB#0:
	; CHECK-NEXT: kmovw %edi, %k1 ## encoding: [0xc5,0xf8,0x92,0xcf]			; CHECK-NEXT: kmovw %edi, %k1 ## encoding: [0xc5,0xf8,0x92,0xcf]
	; CHECK-NEXT: vgetmantpd $11, %xmm0, %xmm2 {%k1} {z} ## encoding: [0x62,0xf3,0xfd,0x89,0x26,0xd0,0x0b]			; CHECK-NEXT: vgetmantpd $11, %xmm0, %xmm2 {%k1} {z} ## encoding: [0x62,0xf3,0xfd,0x89,0x26,0xd0,0x0b]
	; CHECK-NEXT: vgetmantpd $11, %xmm0, %xmm1 {%k1} ## encoding: [0x62,0xf3,0xfd,0x09,0x26,0xc8,0x0b]			; CHECK-NEXT: vgetmantpd $11, %xmm0, %xmm1 {%k1} ## encoding: [0x62,0xf3,0xfd,0x09,0x26,0xc8,0x0b]
	▲ Show 20 Lines • Show All 2,616 Lines • Show Last 20 Lines

This is an archive of the discontinued LLVM Phabricator instance.

[X86][AVX512] lowering shuffle i/f intrinsic - llvm part
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 122620

llvm/trunk/include/llvm/IR/IntrinsicsX86.td

llvm/trunk/lib/IR/AutoUpgrade.cpp

llvm/trunk/lib/Target/X86/X86IntrinsicsInfo.h

llvm/trunk/test/CodeGen/X86/avx512-intrinsics-fast-isel.ll

llvm/trunk/test/CodeGen/X86/avx512-intrinsics-upgrade.ll

llvm/trunk/test/CodeGen/X86/avx512-intrinsics.ll

llvm/trunk/test/CodeGen/X86/avx512vl-intrinsics-fast-isel.ll

llvm/trunk/test/CodeGen/X86/avx512vl-intrinsics-upgrade.ll

llvm/trunk/test/CodeGen/X86/avx512vl-intrinsics.ll

This is an archive of the discontinued LLVM Phabricator instance.

[X86][AVX512] lowering shuffle i/f intrinsic - llvm part
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 122620

llvm/trunk/include/llvm/IR/IntrinsicsX86.td

llvm/trunk/lib/IR/AutoUpgrade.cpp

llvm/trunk/lib/Target/X86/X86IntrinsicsInfo.h

llvm/trunk/test/CodeGen/X86/avx512-intrinsics-fast-isel.ll

llvm/trunk/test/CodeGen/X86/avx512-intrinsics-upgrade.ll

llvm/trunk/test/CodeGen/X86/avx512-intrinsics.ll

llvm/trunk/test/CodeGen/X86/avx512vl-intrinsics-fast-isel.ll

llvm/trunk/test/CodeGen/X86/avx512vl-intrinsics-upgrade.ll

llvm/trunk/test/CodeGen/X86/avx512vl-intrinsics.ll

[X86][AVX512] lowering shuffle i/f intrinsic - llvm part
ClosedPublic