Diff 14900

llvm/trunk/lib/Target/X86/InstPrinter/X86InstComments.cpp

Show First 20 Lines • Show All 193 Lines • ▼ Show 20 Lines	case X86::VMOVSHDUPrr:
Src1Name = getRegName(MI->getOperand(1).getReg());		Src1Name = getRegName(MI->getOperand(1).getReg());
// FALL THROUGH.		// FALL THROUGH.
case X86::MOVSHDUPrm:		case X86::MOVSHDUPrm:
case X86::VMOVSHDUPrm:		case X86::VMOVSHDUPrm:
DestName = getRegName(MI->getOperand(0).getReg());		DestName = getRegName(MI->getOperand(0).getReg());
DecodeMOVSHDUPMask(MVT::v4f32, ShuffleMask);		DecodeMOVSHDUPMask(MVT::v4f32, ShuffleMask);
break;		break;

		case X86::PSLLDQri:
		case X86::VPSLLDQri:
		Src1Name = getRegName(MI->getOperand(1).getReg());
		DestName = getRegName(MI->getOperand(0).getReg());
		if(MI->getOperand(MI->getNumOperands()-1).isImm())
		DecodePSLLDQMask(MVT::v16i8,
		MI->getOperand(MI->getNumOperands()-1).getImm(),
		ShuffleMask);
		break;

		case X86::VPSLLDQYri:
		Src1Name = getRegName(MI->getOperand(1).getReg());
		DestName = getRegName(MI->getOperand(0).getReg());
		if(MI->getOperand(MI->getNumOperands()-1).isImm())
		DecodePSLLDQMask(MVT::v32i8,
		MI->getOperand(MI->getNumOperands()-1).getImm(),
		ShuffleMask);
		break;

		case X86::PSRLDQri:
		case X86::VPSRLDQri:
		Src1Name = getRegName(MI->getOperand(1).getReg());
		DestName = getRegName(MI->getOperand(0).getReg());
		if(MI->getOperand(MI->getNumOperands()-1).isImm())
		DecodePSRLDQMask(MVT::v16i8,
		MI->getOperand(MI->getNumOperands()-1).getImm(),
		ShuffleMask);
		break;

		case X86::VPSRLDQYri:
		Src1Name = getRegName(MI->getOperand(1).getReg());
		DestName = getRegName(MI->getOperand(0).getReg());
		if(MI->getOperand(MI->getNumOperands()-1).isImm())
		DecodePSRLDQMask(MVT::v32i8,
		MI->getOperand(MI->getNumOperands()-1).getImm(),
		ShuffleMask);
		break;

case X86::PALIGNR128rr:		case X86::PALIGNR128rr:
case X86::VPALIGNR128rr:		case X86::VPALIGNR128rr:
Src1Name = getRegName(MI->getOperand(2).getReg());		Src1Name = getRegName(MI->getOperand(2).getReg());
// FALL THROUGH.		// FALL THROUGH.
case X86::PALIGNR128rm:		case X86::PALIGNR128rm:
case X86::VPALIGNR128rm:		case X86::VPALIGNR128rm:
Src2Name = getRegName(MI->getOperand(1).getReg());		Src2Name = getRegName(MI->getOperand(1).getReg());
DestName = getRegName(MI->getOperand(0).getReg());		DestName = getRegName(MI->getOperand(0).getReg());
▲ Show 20 Lines • Show All 477 Lines • Show Last 20 Lines

llvm/trunk/lib/Target/X86/Utils/X86ShuffleDecode.h

	Show All 34 Lines

	// <0,2> or <0,1,4,5>			// <0,2> or <0,1,4,5>
	void DecodeMOVLHPSMask(unsigned NElts, SmallVectorImpl<int> &ShuffleMask);			void DecodeMOVLHPSMask(unsigned NElts, SmallVectorImpl<int> &ShuffleMask);

	void DecodeMOVSLDUPMask(MVT VT, SmallVectorImpl<int> &ShuffleMask);			void DecodeMOVSLDUPMask(MVT VT, SmallVectorImpl<int> &ShuffleMask);

	void DecodeMOVSHDUPMask(MVT VT, SmallVectorImpl<int> &ShuffleMask);			void DecodeMOVSHDUPMask(MVT VT, SmallVectorImpl<int> &ShuffleMask);

				void DecodePSLLDQMask(MVT VT, unsigned Imm, SmallVectorImpl<int> &ShuffleMask);

				void DecodePSRLDQMask(MVT VT, unsigned Imm, SmallVectorImpl<int> &ShuffleMask);

	void DecodePALIGNRMask(MVT VT, unsigned Imm, SmallVectorImpl<int> &ShuffleMask);			void DecodePALIGNRMask(MVT VT, unsigned Imm, SmallVectorImpl<int> &ShuffleMask);

	void DecodePSHUFMask(MVT VT, unsigned Imm, SmallVectorImpl<int> &ShuffleMask);			void DecodePSHUFMask(MVT VT, unsigned Imm, SmallVectorImpl<int> &ShuffleMask);

	void DecodePSHUFHWMask(MVT VT, unsigned Imm, SmallVectorImpl<int> &ShuffleMask);			void DecodePSHUFHWMask(MVT VT, unsigned Imm, SmallVectorImpl<int> &ShuffleMask);

	void DecodePSHUFLWMask(MVT, unsigned Imm, SmallVectorImpl<int> &ShuffleMask);			void DecodePSHUFLWMask(MVT, unsigned Imm, SmallVectorImpl<int> &ShuffleMask);

	Show All 39 Lines

llvm/trunk/lib/Target/X86/Utils/X86ShuffleDecode.cpp

	Show First 20 Lines • Show All 73 Lines • ▼ Show 20 Lines
	void DecodeMOVSHDUPMask(MVT VT, SmallVectorImpl<int> &ShuffleMask) {			void DecodeMOVSHDUPMask(MVT VT, SmallVectorImpl<int> &ShuffleMask) {
	unsigned NumElts = VT.getVectorNumElements();			unsigned NumElts = VT.getVectorNumElements();
	for (int i = 0, e = NumElts / 2; i < e; ++i) {			for (int i = 0, e = NumElts / 2; i < e; ++i) {
	ShuffleMask.push_back(2 * i + 1);			ShuffleMask.push_back(2 * i + 1);
	ShuffleMask.push_back(2 * i + 1);			ShuffleMask.push_back(2 * i + 1);
	}			}
	}			}

				/// Append to \p ShuffleMask the byte-level shuffle equivalent to a
				/// per-lane left byte shift by \p Imm bytes.
				///
				/// The vector is treated as bytes grouped into 128-bit lanes. Within each
				/// lane the first \p Imm result bytes are SM_SentinelZero; every later
				/// result byte takes the source byte that sits \p Imm positions earlier in
				/// the same lane. Indices pushed are absolute byte indices into the source.
				///
				/// \param VT          Only its total size in bits is consulted. It has to
				///                    be at least 128 bits, otherwise the lane count is
				///                    zero and the per-lane division below is invalid.
				/// \param Imm         Shift amount in bytes.
				/// \param ShuffleMask Output; entries are appended, never cleared.
				void DecodePSLLDQMask(MVT VT, unsigned Imm, SmallVectorImpl<int> &ShuffleMask) {
				  const unsigned SizeInBits = VT.getSizeInBits();
				  const unsigned TotalBytes = SizeInBits / 8;
				  const unsigned LaneCount = SizeInBits / 128;
				  const unsigned BytesPerLane = TotalBytes / LaneCount;

				  for (unsigned LaneStart = 0; LaneStart < TotalBytes;
				       LaneStart += BytesPerLane) {
				    for (unsigned Idx = 0; Idx != BytesPerLane; ++Idx) {
				      // Bytes below the shift amount are shifted-in zeros.
				      if (Idx < Imm) {
				        ShuffleMask.push_back(SM_SentinelZero);
				        continue;
				      }
				      // Otherwise read the byte Imm positions lower within this lane.
				      ShuffleMask.push_back(static_cast<int>(Idx - Imm + LaneStart));
				    }
				  }
				}

				/// Append to \p ShuffleMask the byte-level shuffle equivalent to a
				/// per-lane right byte shift by \p Imm bytes.
				///
				/// The vector is treated as bytes grouped into 128-bit lanes. Each result
				/// byte takes the source byte that sits \p Imm positions later in the same
				/// lane; when that position falls past the end of the lane the entry is
				/// SM_SentinelZero. Indices pushed are absolute byte indices into the
				/// source.
				///
				/// \param VT          Only its total size in bits is consulted. It has to
				///                    be at least 128 bits, otherwise the lane count is
				///                    zero and the per-lane division below is invalid.
				/// \param Imm         Shift amount in bytes.
				/// \param ShuffleMask Output; entries are appended, never cleared.
				void DecodePSRLDQMask(MVT VT, unsigned Imm, SmallVectorImpl<int> &ShuffleMask) {
				  const unsigned SizeInBits = VT.getSizeInBits();
				  const unsigned TotalBytes = SizeInBits / 8;
				  const unsigned LaneCount = SizeInBits / 128;
				  const unsigned BytesPerLane = TotalBytes / LaneCount;

				  for (unsigned LaneStart = 0; LaneStart < TotalBytes;
				       LaneStart += BytesPerLane) {
				    for (unsigned Idx = 0; Idx != BytesPerLane; ++Idx) {
				      // Position of the source byte relative to the start of this lane.
				      const unsigned SrcInLane = Idx + Imm;
				      if (SrcInLane >= BytesPerLane) {
				        // The source would lie beyond the lane: a shifted-in zero.
				        ShuffleMask.push_back(SM_SentinelZero);
				        continue;
				      }
				      ShuffleMask.push_back(static_cast<int>(SrcInLane + LaneStart));
				    }
				  }
				}

	void DecodePALIGNRMask(MVT VT, unsigned Imm,			void DecodePALIGNRMask(MVT VT, unsigned Imm,
	SmallVectorImpl<int> &ShuffleMask) {			SmallVectorImpl<int> &ShuffleMask) {
	unsigned NumElts = VT.getVectorNumElements();			unsigned NumElts = VT.getVectorNumElements();
	unsigned Offset = Imm * (VT.getVectorElementType().getSizeInBits() / 8);			unsigned Offset = Imm * (VT.getVectorElementType().getSizeInBits() / 8);

	unsigned NumLanes = VT.getSizeInBits() / 128;			unsigned NumLanes = VT.getSizeInBits() / 128;
	unsigned NumLaneElts = NumElts / NumLanes;			unsigned NumLaneElts = NumElts / NumLanes;

	▲ Show 20 Lines • Show All 277 Lines • Show Last 20 Lines

llvm/trunk/test/CodeGen/X86/avx-intrinsics-x86.ll

	Show First 20 Lines • Show All 449 Lines • ▼ Show 20 Lines


	define <4 x i32> @test_x86_sse2_psll_d(<4 x i32> %a0, <4 x i32> %a1) {			define <4 x i32> @test_x86_sse2_psll_d(<4 x i32> %a0, <4 x i32> %a1) {
	; CHECK: vpslld			; CHECK: vpslld
	%res = call <4 x i32> @llvm.x86.sse2.psll.d(<4 x i32> %a0, <4 x i32> %a1) ; <<4 x i32>> [#uses=1]			%res = call <4 x i32> @llvm.x86.sse2.psll.d(<4 x i32> %a0, <4 x i32> %a1) ; <<4 x i32>> [#uses=1]
	ret <4 x i32> %res			ret <4 x i32> %res
	}			}
	declare <4 x i32> @llvm.x86.sse2.psll.d(<4 x i32>, <4 x i32>) nounwind readnone			declare <4 x i32> @llvm.x86.sse2.psll.d(<4 x i32>, <4 x i32>) nounwind readnone


	define <2 x i64> @test_x86_sse2_psll_dq(<2 x i64> %a0) {			define <2 x i64> @test_x86_sse2_psll_dq(<2 x i64> %a0) {
	; CHECK: vpslldq			; CHECK: vpslldq {{.*#+}} xmm0 = xmm0[0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15]
	%res = call <2 x i64> @llvm.x86.sse2.psll.dq(<2 x i64> %a0, i32 7) ; <<2 x i64>> [#uses=1]			%res = call <2 x i64> @llvm.x86.sse2.psll.dq(<2 x i64> %a0, i32 7) ; <<2 x i64>> [#uses=1]
	ret <2 x i64> %res			ret <2 x i64> %res
	}			}
	declare <2 x i64> @llvm.x86.sse2.psll.dq(<2 x i64>, i32) nounwind readnone			declare <2 x i64> @llvm.x86.sse2.psll.dq(<2 x i64>, i32) nounwind readnone


	define <2 x i64> @test_x86_sse2_psll_dq_bs(<2 x i64> %a0) {			define <2 x i64> @test_x86_sse2_psll_dq_bs(<2 x i64> %a0) {
	; CHECK: vpslldq			; CHECK: vpslldq {{.*#+}} xmm0 = zero,zero,zero,zero,zero,zero,zero,xmm0[0,1,2,3,4,5,6,7,8]
	%res = call <2 x i64> @llvm.x86.sse2.psll.dq.bs(<2 x i64> %a0, i32 7) ; <<2 x i64>> [#uses=1]			%res = call <2 x i64> @llvm.x86.sse2.psll.dq.bs(<2 x i64> %a0, i32 7) ; <<2 x i64>> [#uses=1]
	ret <2 x i64> %res			ret <2 x i64> %res
	}			}
	declare <2 x i64> @llvm.x86.sse2.psll.dq.bs(<2 x i64>, i32) nounwind readnone			declare <2 x i64> @llvm.x86.sse2.psll.dq.bs(<2 x i64>, i32) nounwind readnone


	define <2 x i64> @test_x86_sse2_psll_q(<2 x i64> %a0, <2 x i64> %a1) {			define <2 x i64> @test_x86_sse2_psll_q(<2 x i64> %a0, <2 x i64> %a1) {
	; CHECK: vpsllq			; CHECK: vpsllq
	%res = call <2 x i64> @llvm.x86.sse2.psll.q(<2 x i64> %a0, <2 x i64> %a1) ; <<2 x i64>> [#uses=1]			%res = call <2 x i64> @llvm.x86.sse2.psll.q(<2 x i64> %a0, <2 x i64> %a1) ; <<2 x i64>> [#uses=1]
	ret <2 x i64> %res			ret <2 x i64> %res
	}			}
	▲ Show 20 Lines • Show All 65 Lines • ▼ Show 20 Lines


	define <4 x i32> @test_x86_sse2_psrl_d(<4 x i32> %a0, <4 x i32> %a1) {			define <4 x i32> @test_x86_sse2_psrl_d(<4 x i32> %a0, <4 x i32> %a1) {
	; CHECK: vpsrld			; CHECK: vpsrld
	%res = call <4 x i32> @llvm.x86.sse2.psrl.d(<4 x i32> %a0, <4 x i32> %a1) ; <<4 x i32>> [#uses=1]			%res = call <4 x i32> @llvm.x86.sse2.psrl.d(<4 x i32> %a0, <4 x i32> %a1) ; <<4 x i32>> [#uses=1]
	ret <4 x i32> %res			ret <4 x i32> %res
	}			}
	declare <4 x i32> @llvm.x86.sse2.psrl.d(<4 x i32>, <4 x i32>) nounwind readnone			declare <4 x i32> @llvm.x86.sse2.psrl.d(<4 x i32>, <4 x i32>) nounwind readnone


	define <2 x i64> @test_x86_sse2_psrl_dq(<2 x i64> %a0) {			define <2 x i64> @test_x86_sse2_psrl_dq(<2 x i64> %a0) {
	; CHECK: vpsrldq			; CHECK: vpsrldq {{.*#+}} xmm0 = xmm0[0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15]
	%res = call <2 x i64> @llvm.x86.sse2.psrl.dq(<2 x i64> %a0, i32 7) ; <<2 x i64>> [#uses=1]			%res = call <2 x i64> @llvm.x86.sse2.psrl.dq(<2 x i64> %a0, i32 7) ; <<2 x i64>> [#uses=1]
	ret <2 x i64> %res			ret <2 x i64> %res
	}			}
	declare <2 x i64> @llvm.x86.sse2.psrl.dq(<2 x i64>, i32) nounwind readnone			declare <2 x i64> @llvm.x86.sse2.psrl.dq(<2 x i64>, i32) nounwind readnone


	define <2 x i64> @test_x86_sse2_psrl_dq_bs(<2 x i64> %a0) {			define <2 x i64> @test_x86_sse2_psrl_dq_bs(<2 x i64> %a0) {
	; CHECK: vpsrldq			; CHECK: vpsrldq {{.*#+}} xmm0 = xmm0[7,8,9,10,11,12,13,14,15],zero,zero,zero,zero,zero,zero,zero
	%res = call <2 x i64> @llvm.x86.sse2.psrl.dq.bs(<2 x i64> %a0, i32 7) ; <<2 x i64>> [#uses=1]			%res = call <2 x i64> @llvm.x86.sse2.psrl.dq.bs(<2 x i64> %a0, i32 7) ; <<2 x i64>> [#uses=1]
	ret <2 x i64> %res			ret <2 x i64> %res
	}			}
	declare <2 x i64> @llvm.x86.sse2.psrl.dq.bs(<2 x i64>, i32) nounwind readnone			declare <2 x i64> @llvm.x86.sse2.psrl.dq.bs(<2 x i64>, i32) nounwind readnone


	define <2 x i64> @test_x86_sse2_psrl_q(<2 x i64> %a0, <2 x i64> %a1) {			define <2 x i64> @test_x86_sse2_psrl_q(<2 x i64> %a0, <2 x i64> %a1) {
	; CHECK: vpsrlq			; CHECK: vpsrlq
	%res = call <2 x i64> @llvm.x86.sse2.psrl.q(<2 x i64> %a0, <2 x i64> %a1) ; <<2 x i64>> [#uses=1]			%res = call <2 x i64> @llvm.x86.sse2.psrl.q(<2 x i64> %a0, <2 x i64> %a1) ; <<2 x i64>> [#uses=1]
	ret <2 x i64> %res			ret <2 x i64> %res
	}			}
	▲ Show 20 Lines • Show All 2,037 Lines • Show Last 20 Lines

llvm/trunk/test/CodeGen/X86/avx2-intrinsics-x86.ll

	Show First 20 Lines • Show All 152 Lines • ▼ Show 20 Lines


	define <8 x i32> @test_x86_avx2_psll_d(<8 x i32> %a0, <4 x i32> %a1) {			define <8 x i32> @test_x86_avx2_psll_d(<8 x i32> %a0, <4 x i32> %a1) {
	; CHECK: vpslld			; CHECK: vpslld
	%res = call <8 x i32> @llvm.x86.avx2.psll.d(<8 x i32> %a0, <4 x i32> %a1) ; <<8 x i32>> [#uses=1]			%res = call <8 x i32> @llvm.x86.avx2.psll.d(<8 x i32> %a0, <4 x i32> %a1) ; <<8 x i32>> [#uses=1]
	ret <8 x i32> %res			ret <8 x i32> %res
	}			}
	declare <8 x i32> @llvm.x86.avx2.psll.d(<8 x i32>, <4 x i32>) nounwind readnone			declare <8 x i32> @llvm.x86.avx2.psll.d(<8 x i32>, <4 x i32>) nounwind readnone


	define <4 x i64> @test_x86_avx2_psll_dq(<4 x i64> %a0) {			define <4 x i64> @test_x86_avx2_psll_dq(<4 x i64> %a0) {
	; CHECK: vpslldq			; CHECK: vpslldq {{.*#+}} ymm0 = ymm0[0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31]
	%res = call <4 x i64> @llvm.x86.avx2.psll.dq(<4 x i64> %a0, i32 7) ; <<4 x i64>> [#uses=1]			%res = call <4 x i64> @llvm.x86.avx2.psll.dq(<4 x i64> %a0, i32 7) ; <<4 x i64>> [#uses=1]
	ret <4 x i64> %res			ret <4 x i64> %res
	}			}
	declare <4 x i64> @llvm.x86.avx2.psll.dq(<4 x i64>, i32) nounwind readnone			declare <4 x i64> @llvm.x86.avx2.psll.dq(<4 x i64>, i32) nounwind readnone


	define <4 x i64> @test_x86_avx2_psll_dq_bs(<4 x i64> %a0) {			define <4 x i64> @test_x86_avx2_psll_dq_bs(<4 x i64> %a0) {
	; CHECK: vpslldq			; CHECK: vpslldq {{.*#+}} ymm0 = zero,zero,zero,zero,zero,zero,zero,ymm0[0,1,2,3,4,5,6,7,8],zero,zero,zero,zero,zero,zero,zero,ymm0[16,17,18,19,20,21,22,23,24]
	%res = call <4 x i64> @llvm.x86.avx2.psll.dq.bs(<4 x i64> %a0, i32 7) ; <<4 x i64>> [#uses=1]			%res = call <4 x i64> @llvm.x86.avx2.psll.dq.bs(<4 x i64> %a0, i32 7) ; <<4 x i64>> [#uses=1]
	ret <4 x i64> %res			ret <4 x i64> %res
	}			}
	declare <4 x i64> @llvm.x86.avx2.psll.dq.bs(<4 x i64>, i32) nounwind readnone			declare <4 x i64> @llvm.x86.avx2.psll.dq.bs(<4 x i64>, i32) nounwind readnone


	define <4 x i64> @test_x86_avx2_psll_q(<4 x i64> %a0, <2 x i64> %a1) {			define <4 x i64> @test_x86_avx2_psll_q(<4 x i64> %a0, <2 x i64> %a1) {
	; CHECK: vpsllq			; CHECK: vpsllq
	%res = call <4 x i64> @llvm.x86.avx2.psll.q(<4 x i64> %a0, <2 x i64> %a1) ; <<4 x i64>> [#uses=1]			%res = call <4 x i64> @llvm.x86.avx2.psll.q(<4 x i64> %a0, <2 x i64> %a1) ; <<4 x i64>> [#uses=1]
	ret <4 x i64> %res			ret <4 x i64> %res
	}			}
	▲ Show 20 Lines • Show All 65 Lines • ▼ Show 20 Lines


	define <8 x i32> @test_x86_avx2_psrl_d(<8 x i32> %a0, <4 x i32> %a1) {			define <8 x i32> @test_x86_avx2_psrl_d(<8 x i32> %a0, <4 x i32> %a1) {
	; CHECK: vpsrld			; CHECK: vpsrld
	%res = call <8 x i32> @llvm.x86.avx2.psrl.d(<8 x i32> %a0, <4 x i32> %a1) ; <<8 x i32>> [#uses=1]			%res = call <8 x i32> @llvm.x86.avx2.psrl.d(<8 x i32> %a0, <4 x i32> %a1) ; <<8 x i32>> [#uses=1]
	ret <8 x i32> %res			ret <8 x i32> %res
	}			}
	declare <8 x i32> @llvm.x86.avx2.psrl.d(<8 x i32>, <4 x i32>) nounwind readnone			declare <8 x i32> @llvm.x86.avx2.psrl.d(<8 x i32>, <4 x i32>) nounwind readnone


	define <4 x i64> @test_x86_avx2_psrl_dq(<4 x i64> %a0) {			define <4 x i64> @test_x86_avx2_psrl_dq(<4 x i64> %a0) {
	; CHECK: vpsrldq			; CHECK: vpsrldq {{.*#+}} ymm0 = ymm0[0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31]
	%res = call <4 x i64> @llvm.x86.avx2.psrl.dq(<4 x i64> %a0, i32 7) ; <<4 x i64>> [#uses=1]			%res = call <4 x i64> @llvm.x86.avx2.psrl.dq(<4 x i64> %a0, i32 7) ; <<4 x i64>> [#uses=1]
	ret <4 x i64> %res			ret <4 x i64> %res
	}			}
	declare <4 x i64> @llvm.x86.avx2.psrl.dq(<4 x i64>, i32) nounwind readnone			declare <4 x i64> @llvm.x86.avx2.psrl.dq(<4 x i64>, i32) nounwind readnone


	define <4 x i64> @test_x86_avx2_psrl_dq_bs(<4 x i64> %a0) {			define <4 x i64> @test_x86_avx2_psrl_dq_bs(<4 x i64> %a0) {
	; CHECK: vpsrldq			; CHECK: vpsrldq {{.*#+}} ymm0 = ymm0[7,8,9,10,11,12,13,14,15],zero,zero,zero,zero,zero,zero,zero,ymm0[23,24,25,26,27,28,29,30,31],zero,zero,zero,zero,zero,zero,zero
	%res = call <4 x i64> @llvm.x86.avx2.psrl.dq.bs(<4 x i64> %a0, i32 7) ; <<4 x i64>> [#uses=1]			%res = call <4 x i64> @llvm.x86.avx2.psrl.dq.bs(<4 x i64> %a0, i32 7) ; <<4 x i64>> [#uses=1]
	ret <4 x i64> %res			ret <4 x i64> %res
	}			}
	declare <4 x i64> @llvm.x86.avx2.psrl.dq.bs(<4 x i64>, i32) nounwind readnone			declare <4 x i64> @llvm.x86.avx2.psrl.dq.bs(<4 x i64>, i32) nounwind readnone


	define <4 x i64> @test_x86_avx2_psrl_q(<4 x i64> %a0, <2 x i64> %a1) {			define <4 x i64> @test_x86_avx2_psrl_q(<4 x i64> %a0, <2 x i64> %a1) {
	; CHECK: vpsrlq			; CHECK: vpsrlq
	%res = call <4 x i64> @llvm.x86.avx2.psrl.q(<4 x i64> %a0, <2 x i64> %a1) ; <<4 x i64>> [#uses=1]			%res = call <4 x i64> @llvm.x86.avx2.psrl.q(<4 x i64> %a0, <2 x i64> %a1) ; <<4 x i64>> [#uses=1]
	ret <4 x i64> %res			ret <4 x i64> %res
	}			}
	▲ Show 20 Lines • Show All 878 Lines • Show Last 20 Lines

llvm/trunk/test/CodeGen/X86/sse2-intrinsics-x86.ll

	Show First 20 Lines • Show All 402 Lines • ▼ Show 20 Lines


	define <4 x i32> @test_x86_sse2_psll_d(<4 x i32> %a0, <4 x i32> %a1) {			define <4 x i32> @test_x86_sse2_psll_d(<4 x i32> %a0, <4 x i32> %a1) {
	; CHECK: pslld			; CHECK: pslld
	%res = call <4 x i32> @llvm.x86.sse2.psll.d(<4 x i32> %a0, <4 x i32> %a1) ; <<4 x i32>> [#uses=1]			%res = call <4 x i32> @llvm.x86.sse2.psll.d(<4 x i32> %a0, <4 x i32> %a1) ; <<4 x i32>> [#uses=1]
	ret <4 x i32> %res			ret <4 x i32> %res
	}			}
	declare <4 x i32> @llvm.x86.sse2.psll.d(<4 x i32>, <4 x i32>) nounwind readnone			declare <4 x i32> @llvm.x86.sse2.psll.d(<4 x i32>, <4 x i32>) nounwind readnone


	define <2 x i64> @test_x86_sse2_psll_dq(<2 x i64> %a0) {			define <2 x i64> @test_x86_sse2_psll_dq(<2 x i64> %a0) {
	; CHECK: pslldq			; CHECK: pslldq {{.*#+}} xmm0 = xmm0[0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15]
	%res = call <2 x i64> @llvm.x86.sse2.psll.dq(<2 x i64> %a0, i32 7) ; <<2 x i64>> [#uses=1]			%res = call <2 x i64> @llvm.x86.sse2.psll.dq(<2 x i64> %a0, i32 7) ; <<2 x i64>> [#uses=1]
	ret <2 x i64> %res			ret <2 x i64> %res
	}			}
	declare <2 x i64> @llvm.x86.sse2.psll.dq(<2 x i64>, i32) nounwind readnone			declare <2 x i64> @llvm.x86.sse2.psll.dq(<2 x i64>, i32) nounwind readnone


	define <2 x i64> @test_x86_sse2_psll_dq_bs(<2 x i64> %a0) {			define <2 x i64> @test_x86_sse2_psll_dq_bs(<2 x i64> %a0) {
	; CHECK: pslldq			; CHECK: pslldq {{.*#+}} xmm0 = zero,zero,zero,zero,zero,zero,zero,xmm0[0,1,2,3,4,5,6,7,8]
	%res = call <2 x i64> @llvm.x86.sse2.psll.dq.bs(<2 x i64> %a0, i32 7) ; <<2 x i64>> [#uses=1]			%res = call <2 x i64> @llvm.x86.sse2.psll.dq.bs(<2 x i64> %a0, i32 7) ; <<2 x i64>> [#uses=1]
	ret <2 x i64> %res			ret <2 x i64> %res
	}			}
	declare <2 x i64> @llvm.x86.sse2.psll.dq.bs(<2 x i64>, i32) nounwind readnone			declare <2 x i64> @llvm.x86.sse2.psll.dq.bs(<2 x i64>, i32) nounwind readnone


	define <2 x i64> @test_x86_sse2_psll_q(<2 x i64> %a0, <2 x i64> %a1) {			define <2 x i64> @test_x86_sse2_psll_q(<2 x i64> %a0, <2 x i64> %a1) {
	; CHECK: psllq			; CHECK: psllq
	%res = call <2 x i64> @llvm.x86.sse2.psll.q(<2 x i64> %a0, <2 x i64> %a1) ; <<2 x i64>> [#uses=1]			%res = call <2 x i64> @llvm.x86.sse2.psll.q(<2 x i64> %a0, <2 x i64> %a1) ; <<2 x i64>> [#uses=1]
	ret <2 x i64> %res			ret <2 x i64> %res
	}			}
	▲ Show 20 Lines • Show All 65 Lines • ▼ Show 20 Lines


	define <4 x i32> @test_x86_sse2_psrl_d(<4 x i32> %a0, <4 x i32> %a1) {			define <4 x i32> @test_x86_sse2_psrl_d(<4 x i32> %a0, <4 x i32> %a1) {
	; CHECK: psrld			; CHECK: psrld
	%res = call <4 x i32> @llvm.x86.sse2.psrl.d(<4 x i32> %a0, <4 x i32> %a1) ; <<4 x i32>> [#uses=1]			%res = call <4 x i32> @llvm.x86.sse2.psrl.d(<4 x i32> %a0, <4 x i32> %a1) ; <<4 x i32>> [#uses=1]
	ret <4 x i32> %res			ret <4 x i32> %res
	}			}
	declare <4 x i32> @llvm.x86.sse2.psrl.d(<4 x i32>, <4 x i32>) nounwind readnone			declare <4 x i32> @llvm.x86.sse2.psrl.d(<4 x i32>, <4 x i32>) nounwind readnone


	define <2 x i64> @test_x86_sse2_psrl_dq(<2 x i64> %a0) {			define <2 x i64> @test_x86_sse2_psrl_dq(<2 x i64> %a0) {
	; CHECK: psrldq			; CHECK: psrldq {{.*#+}} xmm0 = xmm0[0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15]
	%res = call <2 x i64> @llvm.x86.sse2.psrl.dq(<2 x i64> %a0, i32 7) ; <<2 x i64>> [#uses=1]			%res = call <2 x i64> @llvm.x86.sse2.psrl.dq(<2 x i64> %a0, i32 7) ; <<2 x i64>> [#uses=1]
	ret <2 x i64> %res			ret <2 x i64> %res
	}			}
	declare <2 x i64> @llvm.x86.sse2.psrl.dq(<2 x i64>, i32) nounwind readnone			declare <2 x i64> @llvm.x86.sse2.psrl.dq(<2 x i64>, i32) nounwind readnone


	define <2 x i64> @test_x86_sse2_psrl_dq_bs(<2 x i64> %a0) {			define <2 x i64> @test_x86_sse2_psrl_dq_bs(<2 x i64> %a0) {
	; CHECK: psrldq			; CHECK: psrldq {{.*#+}} xmm0 = xmm0[7,8,9,10,11,12,13,14,15],zero,zero,zero,zero,zero,zero,zero
	%res = call <2 x i64> @llvm.x86.sse2.psrl.dq.bs(<2 x i64> %a0, i32 7) ; <<2 x i64>> [#uses=1]			%res = call <2 x i64> @llvm.x86.sse2.psrl.dq.bs(<2 x i64> %a0, i32 7) ; <<2 x i64>> [#uses=1]
	ret <2 x i64> %res			ret <2 x i64> %res
	}			}
	declare <2 x i64> @llvm.x86.sse2.psrl.dq.bs(<2 x i64>, i32) nounwind readnone			declare <2 x i64> @llvm.x86.sse2.psrl.dq.bs(<2 x i64>, i32) nounwind readnone


	define <2 x i64> @test_x86_sse2_psrl_q(<2 x i64> %a0, <2 x i64> %a1) {			define <2 x i64> @test_x86_sse2_psrl_q(<2 x i64> %a0, <2 x i64> %a1) {
	; CHECK: psrlq			; CHECK: psrlq
	%res = call <2 x i64> @llvm.x86.sse2.psrl.q(<2 x i64> %a0, <2 x i64> %a1) ; <<2 x i64>> [#uses=1]			%res = call <2 x i64> @llvm.x86.sse2.psrl.q(<2 x i64> %a0, <2 x i64> %a1) ; <<2 x i64>> [#uses=1]
	ret <2 x i64> %res			ret <2 x i64> %res
	}			}
	▲ Show 20 Lines • Show All 217 Lines • Show Last 20 Lines

llvm/trunk/test/CodeGen/X86/vector-shuffle-128-v8.ll

	Show First 20 Lines • Show All 1,391 Lines • ▼ Show 20 Lines
	; AVX-NEXT: retq			; AVX-NEXT: retq
	%a = insertelement <8 x i16> undef, i16 %i, i32 0			%a = insertelement <8 x i16> undef, i16 %i, i32 0
	%shuffle = shufflevector <8 x i16> zeroinitializer, <8 x i16> %a, <8 x i32> <i32 8, i32 1, i32 2, i32 3, i32 4, i32 5, i32 6, i32 7>			%shuffle = shufflevector <8 x i16> zeroinitializer, <8 x i16> %a, <8 x i32> <i32 8, i32 1, i32 2, i32 3, i32 4, i32 5, i32 6, i32 7>
	ret <8 x i16> %shuffle			ret <8 x i16> %shuffle
	}			}

	define <8 x i16> @shuffle_v8i16_z8zzzzzz(i16 %i) {			define <8 x i16> @shuffle_v8i16_z8zzzzzz(i16 %i) {
	; SSE-LABEL: shuffle_v8i16_z8zzzzzz:			; SSE-LABEL: shuffle_v8i16_z8zzzzzz:
	; SSE: # BB#0:			; SSE: # BB#0:
	; SSE-NEXT: movzwl %di, %eax			; SSE-NEXT: movzwl %di, %eax
	; SSE-NEXT: movd %eax, %xmm0			; SSE-NEXT: movd %eax, %xmm0
	; SSE-NEXT: pslldq $2, %xmm0			; SSE-NEXT: pslldq {{.*#+}} xmm0 = zero,zero,xmm0[0,1,2,3,4,5,6,7,8,9,10,11,12,13]
	; SSE-NEXT: retq			; SSE-NEXT: retq
	;			;
	; AVX-LABEL: shuffle_v8i16_z8zzzzzz:			; AVX-LABEL: shuffle_v8i16_z8zzzzzz:
	; AVX: # BB#0:			; AVX: # BB#0:
	; AVX-NEXT: movzwl %di, %eax			; AVX-NEXT: movzwl %di, %eax
	; AVX-NEXT: vmovd %eax, %xmm0			; AVX-NEXT: vmovd %eax, %xmm0
	; AVX-NEXT: vpslldq $2, %xmm0, %xmm0			; AVX-NEXT: vpslldq {{.*#+}} xmm0 = zero,zero,xmm0[0,1,2,3,4,5,6,7,8,9,10,11,12,13]
	; AVX-NEXT: retq			; AVX-NEXT: retq
	%a = insertelement <8 x i16> undef, i16 %i, i32 0			%a = insertelement <8 x i16> undef, i16 %i, i32 0
	%shuffle = shufflevector <8 x i16> zeroinitializer, <8 x i16> %a, <8 x i32> <i32 2, i32 8, i32 3, i32 7, i32 6, i32 5, i32 4, i32 3>			%shuffle = shufflevector <8 x i16> zeroinitializer, <8 x i16> %a, <8 x i32> <i32 2, i32 8, i32 3, i32 7, i32 6, i32 5, i32 4, i32 3>
	ret <8 x i16> %shuffle			ret <8 x i16> %shuffle
	}			}

	define <8 x i16> @shuffle_v8i16_zzzzz8zz(i16 %i) {			define <8 x i16> @shuffle_v8i16_zzzzz8zz(i16 %i) {
	; SSE-LABEL: shuffle_v8i16_zzzzz8zz:			; SSE-LABEL: shuffle_v8i16_zzzzz8zz:
	; SSE: # BB#0:			; SSE: # BB#0:
	; SSE-NEXT: movzwl %di, %eax			; SSE-NEXT: movzwl %di, %eax
	; SSE-NEXT: movd %eax, %xmm0			; SSE-NEXT: movd %eax, %xmm0
	; SSE-NEXT: pslldq $10, %xmm0			; SSE-NEXT: pslldq {{.*#+}} xmm0 = zero,zero,zero,zero,zero,zero,zero,zero,zero,zero,xmm0[0,1,2,3,4,5]
	; SSE-NEXT: retq			; SSE-NEXT: retq
	;			;
	; AVX-LABEL: shuffle_v8i16_zzzzz8zz:			; AVX-LABEL: shuffle_v8i16_zzzzz8zz:
	; AVX: # BB#0:			; AVX: # BB#0:
	; AVX-NEXT: movzwl %di, %eax			; AVX-NEXT: movzwl %di, %eax
	; AVX-NEXT: vmovd %eax, %xmm0			; AVX-NEXT: vmovd %eax, %xmm0
	; AVX-NEXT: vpslldq $10, %xmm0, %xmm0			; AVX-NEXT: vpslldq {{.*#+}} xmm0 = zero,zero,zero,zero,zero,zero,zero,zero,zero,zero,xmm0[0,1,2,3,4,5]
	; AVX-NEXT: retq			; AVX-NEXT: retq
	%a = insertelement <8 x i16> undef, i16 %i, i32 0			%a = insertelement <8 x i16> undef, i16 %i, i32 0
	%shuffle = shufflevector <8 x i16> zeroinitializer, <8 x i16> %a, <8 x i32> <i32 0, i32 0, i32 0, i32 0, i32 0, i32 8, i32 0, i32 0>			%shuffle = shufflevector <8 x i16> zeroinitializer, <8 x i16> %a, <8 x i32> <i32 0, i32 0, i32 0, i32 0, i32 0, i32 8, i32 0, i32 0>
	ret <8 x i16> %shuffle			ret <8 x i16> %shuffle
	}			}

	define <8 x i16> @shuffle_v8i16_zuuzuuz8(i16 %i) {			define <8 x i16> @shuffle_v8i16_zuuzuuz8(i16 %i) {
	; SSE-LABEL: shuffle_v8i16_zuuzuuz8:			; SSE-LABEL: shuffle_v8i16_zuuzuuz8:
	; SSE: # BB#0:			; SSE: # BB#0:
	; SSE-NEXT: movzwl %di, %eax			; SSE-NEXT: movzwl %di, %eax
	; SSE-NEXT: movd %eax, %xmm0			; SSE-NEXT: movd %eax, %xmm0
	; SSE-NEXT: pslldq $14, %xmm0			; SSE-NEXT: pslldq {{.*#+}} xmm0 = zero,zero,zero,zero,zero,zero,zero,zero,zero,zero,zero,zero,zero,zero,xmm0[0,1]
	; SSE-NEXT: retq			; SSE-NEXT: retq
	;			;
	; AVX-LABEL: shuffle_v8i16_zuuzuuz8:			; AVX-LABEL: shuffle_v8i16_zuuzuuz8:
	; AVX: # BB#0:			; AVX: # BB#0:
	; AVX-NEXT: movzwl %di, %eax			; AVX-NEXT: movzwl %di, %eax
	; AVX-NEXT: vmovd %eax, %xmm0			; AVX-NEXT: vmovd %eax, %xmm0
	; AVX-NEXT: vpslldq $14, %xmm0, %xmm0			; AVX-NEXT: vpslldq {{.*#+}} xmm0 = zero,zero,zero,zero,zero,zero,zero,zero,zero,zero,zero,zero,zero,zero,xmm0[0,1]
	; AVX-NEXT: retq			; AVX-NEXT: retq
	%a = insertelement <8 x i16> undef, i16 %i, i32 0			%a = insertelement <8 x i16> undef, i16 %i, i32 0
	%shuffle = shufflevector <8 x i16> zeroinitializer, <8 x i16> %a, <8 x i32> <i32 0, i32 undef, i32 undef, i32 3, i32 undef, i32 undef, i32 6, i32 8>			%shuffle = shufflevector <8 x i16> zeroinitializer, <8 x i16> %a, <8 x i32> <i32 0, i32 undef, i32 undef, i32 3, i32 undef, i32 undef, i32 6, i32 8>
	ret <8 x i16> %shuffle			ret <8 x i16> %shuffle
	}			}

	define <8 x i16> @shuffle_v8i16_zzBzzzzz(i16 %i) {			define <8 x i16> @shuffle_v8i16_zzBzzzzz(i16 %i) {
	; SSE-LABEL: shuffle_v8i16_zzBzzzzz:			; SSE-LABEL: shuffle_v8i16_zzBzzzzz:
	; SSE: # BB#0:			; SSE: # BB#0:
	; SSE-NEXT: movzwl %di, %eax			; SSE-NEXT: movzwl %di, %eax
	; SSE-NEXT: movd %eax, %xmm0			; SSE-NEXT: movd %eax, %xmm0
	; SSE-NEXT: pslldq $4, %xmm0			; SSE-NEXT: pslldq {{.*#+}} xmm0 = zero,zero,zero,zero,xmm0[0,1,2,3,4,5,6,7,8,9,10,11]
	; SSE-NEXT: retq			; SSE-NEXT: retq
	;			;
	; AVX-LABEL: shuffle_v8i16_zzBzzzzz:			; AVX-LABEL: shuffle_v8i16_zzBzzzzz:
	; AVX: # BB#0:			; AVX: # BB#0:
	; AVX-NEXT: movzwl %di, %eax			; AVX-NEXT: movzwl %di, %eax
	; AVX-NEXT: vmovd %eax, %xmm0			; AVX-NEXT: vmovd %eax, %xmm0
	; AVX-NEXT: vpslldq $4, %xmm0, %xmm0			; AVX-NEXT: vpslldq {{.*#+}} xmm0 = zero,zero,zero,zero,xmm0[0,1,2,3,4,5,6,7,8,9,10,11]
	; AVX-NEXT: retq			; AVX-NEXT: retq
	%a = insertelement <8 x i16> undef, i16 %i, i32 3			%a = insertelement <8 x i16> undef, i16 %i, i32 3
	%shuffle = shufflevector <8 x i16> zeroinitializer, <8 x i16> %a, <8 x i32> <i32 0, i32 1, i32 11, i32 3, i32 4, i32 5, i32 6, i32 7>			%shuffle = shufflevector <8 x i16> zeroinitializer, <8 x i16> %a, <8 x i32> <i32 0, i32 1, i32 11, i32 3, i32 4, i32 5, i32 6, i32 7>
	ret <8 x i16> %shuffle			ret <8 x i16> %shuffle
	}			}

	define <8 x i16> @shuffle_v8i16_def01234(<8 x i16> %a, <8 x i16> %b) {			define <8 x i16> @shuffle_v8i16_def01234(<8 x i16> %a, <8 x i16> %b) {
	; SSE2-LABEL: shuffle_v8i16_def01234:			; SSE2-LABEL: shuffle_v8i16_def01234:
	; SSE2: # BB#0:			; SSE2: # BB#0:
	; SSE2-NEXT: pshufd {{.*#+}} xmm2 = xmm0[0,1,0,1]			; SSE2-NEXT: pshufd {{.*#+}} xmm2 = xmm0[0,1,0,1]
	; SSE2-NEXT: punpckhwd {{.*#+}} xmm1 = xmm1[4],xmm2[4],xmm1[5],xmm2[5],xmm1[6],xmm2[6],xmm1[7],xmm2[7]			; SSE2-NEXT: punpckhwd {{.*#+}} xmm1 = xmm1[4],xmm2[4],xmm1[5],xmm2[5],xmm1[6],xmm2[6],xmm1[7],xmm2[7]
	▲ Show 20 Lines • Show All 517 Lines • Show Last 20 Lines

This is an archive of the discontinued LLVM Phabricator instance.

SSE pslldq/psrldq shuffle mask decodes
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 14900

llvm/trunk/lib/Target/X86/InstPrinter/X86InstComments.cpp

llvm/trunk/lib/Target/X86/Utils/X86ShuffleDecode.h

llvm/trunk/lib/Target/X86/Utils/X86ShuffleDecode.cpp

llvm/trunk/test/CodeGen/X86/avx-intrinsics-x86.ll

llvm/trunk/test/CodeGen/X86/avx2-intrinsics-x86.ll

llvm/trunk/test/CodeGen/X86/sse2-intrinsics-x86.ll

llvm/trunk/test/CodeGen/X86/vector-shuffle-128-v8.ll

This is an archive of the discontinued LLVM Phabricator instance.

SSE pslldq/psrldq shuffle mask decodes (Closed, Public)

Details

Diff Detail

Event Timeline

Revision Contents

Diff 14900

llvm/trunk/lib/Target/X86/InstPrinter/X86InstComments.cpp

llvm/trunk/lib/Target/X86/Utils/X86ShuffleDecode.h

llvm/trunk/lib/Target/X86/Utils/X86ShuffleDecode.cpp

llvm/trunk/test/CodeGen/X86/avx-intrinsics-x86.ll

llvm/trunk/test/CodeGen/X86/avx2-intrinsics-x86.ll

llvm/trunk/test/CodeGen/X86/sse2-intrinsics-x86.ll

llvm/trunk/test/CodeGen/X86/vector-shuffle-128-v8.ll

SSE pslldq/psrldq shuffle mask decodes
ClosedPublic