Diff 14453

lib/Target/X86/InstPrinter/X86InstComments.cpp

Context not available.
	DecodeMOVSHDUPMask(MVT::v4f32, ShuffleMask);	DecodeMOVSHDUPMask(MVT::v4f32, ShuffleMask);
	break;	break;

		case X86::PSLLDQri:
		case X86::VPSLLDQri:
		Src1Name = getRegName(MI->getOperand(1).getReg());
		DestName = getRegName(MI->getOperand(0).getReg());
		if(MI->getOperand(MI->getNumOperands()-1).isImm())
		DecodePSLLDQMask(MVT(MVT::v16i8).getSizeInBits(),
		chandlercUnsubmitted Not Done Reply Inline Actions This code doesn't really make sense. If you know the exact type you know the exact size, just pass 128. But what I meant with my comment was still to pass the MVT down, but to do the getSizeInBits query inside the decode routine. chandlerc: This code doesn't really make sense. If you know the exact type you know the exact size, just…
		MI->getOperand(MI->getNumOperands()-1).getImm(),
		ShuffleMask);
		break;

		case X86::VPSLLDQYri:
		Src1Name = getRegName(MI->getOperand(1).getReg());
		DestName = getRegName(MI->getOperand(0).getReg());
		if(MI->getOperand(MI->getNumOperands()-1).isImm())
		DecodePSLLDQMask(MVT(MVT::v32i8).getSizeInBits(),
		MI->getOperand(MI->getNumOperands()-1).getImm(),
		ShuffleMask);
		break;

		case X86::PSRLDQri:
		case X86::VPSRLDQri:
		Src1Name = getRegName(MI->getOperand(1).getReg());
		DestName = getRegName(MI->getOperand(0).getReg());
		if(MI->getOperand(MI->getNumOperands()-1).isImm())
		DecodePSRLDQMask(MVT(MVT::v16i8).getSizeInBits(),
		MI->getOperand(MI->getNumOperands()-1).getImm(),
		ShuffleMask);
		break;

		case X86::VPSRLDQYri:
		Src1Name = getRegName(MI->getOperand(1).getReg());
		DestName = getRegName(MI->getOperand(0).getReg());
		if(MI->getOperand(MI->getNumOperands()-1).isImm())
		DecodePSRLDQMask(MVT(MVT::v32i8).getSizeInBits(),
		MI->getOperand(MI->getNumOperands()-1).getImm(),
		ShuffleMask);
		break;

	case X86::PALIGNR128rr:	case X86::PALIGNR128rr:
	case X86::VPALIGNR128rr:	case X86::VPALIGNR128rr:
	Src1Name = getRegName(MI->getOperand(2).getReg());	Src1Name = getRegName(MI->getOperand(2).getReg());
Context not available.

lib/Target/X86/Utils/X86ShuffleDecode.h

Context not available.

	void DecodeMOVSHDUPMask(MVT VT, SmallVectorImpl<int> &ShuffleMask);	void DecodeMOVSHDUPMask(MVT VT, SmallVectorImpl<int> &ShuffleMask);

		/// Appends to ShuffleMask one entry per byte of a VectorSizeInBits-wide
		/// vector, describing a left byte shift by Imm applied within each
		/// 128-bit lane. Shifted-in positions are marked SM_SentinelZero.
		void DecodePSLLDQMask(unsigned VectorSizeInBits, unsigned Imm, SmallVectorImpl<int> &ShuffleMask);

		/// Appends to ShuffleMask one entry per byte of a VectorSizeInBits-wide
		/// vector, describing a right byte shift by Imm applied within each
		/// 128-bit lane. Shifted-in positions are marked SM_SentinelZero.
		void DecodePSRLDQMask(unsigned VectorSizeInBits, unsigned Imm, SmallVectorImpl<int> &ShuffleMask);

	void DecodePALIGNRMask(MVT VT, unsigned Imm, SmallVectorImpl<int> &ShuffleMask);	void DecodePALIGNRMask(MVT VT, unsigned Imm, SmallVectorImpl<int> &ShuffleMask);

	void DecodePSHUFMask(MVT VT, unsigned Imm, SmallVectorImpl<int> &ShuffleMask);	void DecodePSHUFMask(MVT VT, unsigned Imm, SmallVectorImpl<int> &ShuffleMask);
Context not available.

lib/Target/X86/Utils/X86ShuffleDecode.cpp

Context not available.
	}	}
	}	}

		// Decodes a PSLLDQ-style byte shift into a per-byte shuffle mask.
		//
		// VectorSizeInBits is the total vector width in bits, Imm is the shift
		// amount in bytes, and ShuffleMask receives one appended entry per byte
		// of the vector (existing entries are left untouched).
		//
		// Within each 128-bit lane, the first Imm byte positions get
		// SM_SentinelZero and every later position i gets the index of byte
		// (i - Imm) of the same lane.
		//
		// NOTE(review): a VectorSizeInBits below 128 makes NumLanes zero and the
		// NumLaneElts division then divides by zero; callers visible here pass
		// 128 or 256 only.
		void DecodePSLLDQMask(unsigned VectorSizeInBits, unsigned Imm, SmallVectorImpl<int> &ShuffleMask) {
		// The mask is always expressed in bytes, independent of any element type.
		unsigned NumElts = VectorSizeInBits / 8;
		unsigned NumLanes = VectorSizeInBits / 128;
		chandlercUnsubmitted Not Done Reply Inline Actions I wouldn't decode this in terms of the vector element type. The mask should be a byte-vector mask in all cases, and VT should just provide the size of the vector (128-bit, 256-bit, 512-bit, whatever). chandlerc: I wouldn't decode this in terms of the vector element type. The mask should be a byte-vector…
		RKSimonAuthorUnsubmitted Not Done Reply Inline Actions Yes I'd be happy to do that - I just followed the pattern from palignr. This does mean that the computed ShuffleMask count might not match the number of elements in the MVT. Would it be better to change the MVT VT argument to unsigned VectorSizeInBytes to make that clear? RKSimon: Yes I'd be happy to do that - I just followed the pattern from palignr. This does mean that the…
		// Number of bytes in one 128-bit lane.
		unsigned NumLaneElts = NumElts / NumLanes;

		// l is the index of the first byte of the current lane.
		for (unsigned l = 0; l != NumElts; l += NumLaneElts) {
		chandlercUnsubmitted Not Done Reply Inline Actions No need for braces aroun the outer loop. The above loop also uses int and < which is my personal preference for these loops. chandlerc: No need for braces aroun the outer loop. The above loop also uses int and < which is my…
		for (unsigned i = 0; i != NumLaneElts; ++i) {
		// Default to zero; only positions at or beyond Imm read a source byte.
		int M = SM_SentinelZero;
		if (i >= Imm) M = i - Imm + l;
		ShuffleMask.push_back(M);
		}
		}
		}

		// Decodes a PSRLDQ-style byte shift into a per-byte shuffle mask.
		//
		// VectorSizeInBits is the total vector width in bits, Imm is the shift
		// amount in bytes, and ShuffleMask receives one appended entry per byte
		// of the vector (existing entries are left untouched).
		//
		// Within each 128-bit lane, position i gets the index of byte (i + Imm)
		// of the same lane when that byte exists, and SM_SentinelZero otherwise.
		void DecodePSRLDQMask(unsigned VectorSizeInBits, unsigned Imm,
		                      SmallVectorImpl<int> &ShuffleMask) {
		  const unsigned TotalBytes = VectorSizeInBits / 8;
		  const unsigned LaneCount = VectorSizeInBits / 128;
		  const unsigned BytesPerLane = TotalBytes / LaneCount;

		  // LaneStart is the index of the first byte of the lane being decoded.
		  for (unsigned LaneStart = 0; LaneStart != TotalBytes;
		       LaneStart += BytesPerLane)
		    for (unsigned Byte = 0; Byte != BytesPerLane; ++Byte) {
		      // Lane-relative source position for this destination byte.
		      const unsigned SrcByte = Byte + Imm;
		      int MaskElt = SM_SentinelZero;
		      if (SrcByte < BytesPerLane)
		        MaskElt = SrcByte + LaneStart;
		      ShuffleMask.push_back(MaskElt);
		    }
		}

	void DecodePALIGNRMask(MVT VT, unsigned Imm,	void DecodePALIGNRMask(MVT VT, unsigned Imm,
	SmallVectorImpl<int> &ShuffleMask) {	SmallVectorImpl<int> &ShuffleMask) {
	unsigned NumElts = VT.getVectorNumElements();	unsigned NumElts = VT.getVectorNumElements();
Context not available.

test/CodeGen/X86/vector-shuffle-128-v8.ll

Context not available.
	; SSE: # BB#0:	; SSE: # BB#0:
	; SSE-NEXT: movzwl %di, %eax	; SSE-NEXT: movzwl %di, %eax
	; SSE-NEXT: movd %eax, %xmm0	; SSE-NEXT: movd %eax, %xmm0
	; SSE-NEXT: pslldq $2, %xmm0	; SSE-NEXT: pslldq $2, %xmm0 {{.*#+}} xmm0 = zero,zero,xmm0[0,1,2,3,4,5,6,7,8,9,10,11,12,13]
		chandlercUnsubmitted Not Done Reply Inline Actions No need to give the operands here when checking the comment. It looks like all of the new comments in this file need the same treatment. chandlerc: No need to give the operands here when checking the comment. It looks like all of the new…
	; SSE-NEXT: retq	; SSE-NEXT: retq
	;	;
	; AVX-LABEL: shuffle_v8i16_z8zzzzzz:	; AVX-LABEL: shuffle_v8i16_z8zzzzzz:
Context not available.
	; AVX: # BB#0:	; AVX: # BB#0:
	; AVX-NEXT: movzwl %di, %eax	; AVX-NEXT: movzwl %di, %eax
	; AVX-NEXT: vmovd %eax, %xmm0	; AVX-NEXT: vmovd %eax, %xmm0
	; AVX-NEXT: vpslldq $2, %xmm0, %xmm0	; AVX-NEXT: vpslldq $2, %xmm0, %xmm0 {{.*#+}} xmm0 = zero,zero,xmm0[0,1,2,3,4,5,6,7,8,9,10,11,12,13]
	; AVX-NEXT: retq	; AVX-NEXT: retq
	%a = insertelement <8 x i16> undef, i16 %i, i32 0	%a = insertelement <8 x i16> undef, i16 %i, i32 0
	%shuffle = shufflevector <8 x i16> zeroinitializer, <8 x i16> %a, <8 x i32> <i32 2, i32 8, i32 3, i32 7, i32 6, i32 5, i32 4, i32 3>	%shuffle = shufflevector <8 x i16> zeroinitializer, <8 x i16> %a, <8 x i32> <i32 2, i32 8, i32 3, i32 7, i32 6, i32 5, i32 4, i32 3>
Context not available.
	; SSE: # BB#0:	; SSE: # BB#0:
	; SSE-NEXT: movzwl %di, %eax	; SSE-NEXT: movzwl %di, %eax
	; SSE-NEXT: movd %eax, %xmm0	; SSE-NEXT: movd %eax, %xmm0
	; SSE-NEXT: pslldq $10, %xmm0	; SSE-NEXT: pslldq $10, %xmm0 {{.*#+}} xmm0 = zero,zero,zero,zero,zero,zero,zero,zero,zero,zero,xmm0[0,1,2,3,4,5]
	; SSE-NEXT: retq	; SSE-NEXT: retq
	;	;
	; AVX-LABEL: shuffle_v8i16_zzzzz8zz:	; AVX-LABEL: shuffle_v8i16_zzzzz8zz:
Context not available.
	; AVX: # BB#0:	; AVX: # BB#0:
	; AVX-NEXT: movzwl %di, %eax	; AVX-NEXT: movzwl %di, %eax
	; AVX-NEXT: vmovd %eax, %xmm0	; AVX-NEXT: vmovd %eax, %xmm0
	; AVX-NEXT: vpslldq $10, %xmm0, %xmm0	; AVX-NEXT: vpslldq $10, %xmm0, %xmm0 {{.*#+}} xmm0 = zero,zero,zero,zero,zero,zero,zero,zero,zero,zero,xmm0[0,1,2,3,4,5]
	; AVX-NEXT: retq	; AVX-NEXT: retq
	%a = insertelement <8 x i16> undef, i16 %i, i32 0	%a = insertelement <8 x i16> undef, i16 %i, i32 0
	%shuffle = shufflevector <8 x i16> zeroinitializer, <8 x i16> %a, <8 x i32> <i32 0, i32 0, i32 0, i32 0, i32 0, i32 8, i32 0, i32 0>	%shuffle = shufflevector <8 x i16> zeroinitializer, <8 x i16> %a, <8 x i32> <i32 0, i32 0, i32 0, i32 0, i32 0, i32 8, i32 0, i32 0>
Context not available.
	; SSE: # BB#0:	; SSE: # BB#0:
	; SSE-NEXT: movzwl %di, %eax	; SSE-NEXT: movzwl %di, %eax
	; SSE-NEXT: movd %eax, %xmm0	; SSE-NEXT: movd %eax, %xmm0
	; SSE-NEXT: pslldq $14, %xmm0	; SSE-NEXT: pslldq $14, %xmm0 {{.*#+}} xmm0 = zero,zero,zero,zero,zero,zero,zero,zero,zero,zero,zero,zero,zero,zero,xmm0[0,1]
	; SSE-NEXT: retq	; SSE-NEXT: retq
	;	;
	; AVX-LABEL: shuffle_v8i16_zuuzuuz8:	; AVX-LABEL: shuffle_v8i16_zuuzuuz8:
Context not available.
	; AVX: # BB#0:	; AVX: # BB#0:
	; AVX-NEXT: movzwl %di, %eax	; AVX-NEXT: movzwl %di, %eax
	; AVX-NEXT: vmovd %eax, %xmm0	; AVX-NEXT: vmovd %eax, %xmm0
	; AVX-NEXT: vpslldq $14, %xmm0, %xmm0	; AVX-NEXT: vpslldq $14, %xmm0, %xmm0 {{.*#+}} xmm0 = zero,zero,zero,zero,zero,zero,zero,zero,zero,zero,zero,zero,zero,zero,xmm0[0,1]
	; AVX-NEXT: retq	; AVX-NEXT: retq
	%a = insertelement <8 x i16> undef, i16 %i, i32 0	%a = insertelement <8 x i16> undef, i16 %i, i32 0
	%shuffle = shufflevector <8 x i16> zeroinitializer, <8 x i16> %a, <8 x i32> <i32 0, i32 undef, i32 undef, i32 3, i32 undef, i32 undef, i32 6, i32 8>	%shuffle = shufflevector <8 x i16> zeroinitializer, <8 x i16> %a, <8 x i32> <i32 0, i32 undef, i32 undef, i32 3, i32 undef, i32 undef, i32 6, i32 8>
Context not available.
	; SSE: # BB#0:	; SSE: # BB#0:
	; SSE-NEXT: movzwl %di, %eax	; SSE-NEXT: movzwl %di, %eax
	; SSE-NEXT: movd %eax, %xmm0	; SSE-NEXT: movd %eax, %xmm0
	; SSE-NEXT: pslldq $4, %xmm0	; SSE-NEXT: pslldq $4, %xmm0 {{.*#+}} xmm0 = zero,zero,zero,zero,xmm0[0,1,2,3,4,5,6,7,8,9,10,11]
	; SSE-NEXT: retq	; SSE-NEXT: retq
	;	;
	; AVX-LABEL: shuffle_v8i16_zzBzzzzz:	; AVX-LABEL: shuffle_v8i16_zzBzzzzz:
Context not available.
	; AVX: # BB#0:	; AVX: # BB#0:
	; AVX-NEXT: movzwl %di, %eax	; AVX-NEXT: movzwl %di, %eax
	; AVX-NEXT: vmovd %eax, %xmm0	; AVX-NEXT: vmovd %eax, %xmm0
	; AVX-NEXT: vpslldq $4, %xmm0, %xmm0	; AVX-NEXT: vpslldq $4, %xmm0, %xmm0 {{.*#+}} xmm0 = zero,zero,zero,zero,xmm0[0,1,2,3,4,5,6,7,8,9,10,11]
	; AVX-NEXT: retq	; AVX-NEXT: retq
	%a = insertelement <8 x i16> undef, i16 %i, i32 3	%a = insertelement <8 x i16> undef, i16 %i, i32 3
	%shuffle = shufflevector <8 x i16> zeroinitializer, <8 x i16> %a, <8 x i32> <i32 0, i32 1, i32 11, i32 3, i32 4, i32 5, i32 6, i32 7>	%shuffle = shufflevector <8 x i16> zeroinitializer, <8 x i16> %a, <8 x i32> <i32 0, i32 1, i32 11, i32 3, i32 4, i32 5, i32 6, i32 7>
Context not available.

This is an archive of the discontinued LLVM Phabricator instance.

SSE pslldq/psrldq shuffle mask decodes
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 14453

lib/Target/X86/InstPrinter/X86InstComments.cpp

lib/Target/X86/Utils/X86ShuffleDecode.h

lib/Target/X86/Utils/X86ShuffleDecode.cpp

test/CodeGen/X86/vector-shuffle-128-v8.ll

This is an archive of the discontinued LLVM Phabricator instance.

SSE pslldq/psrldq shuffle mask decodes
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 14453

lib/Target/X86/InstPrinter/X86InstComments.cpp

lib/Target/X86/Utils/X86ShuffleDecode.h

lib/Target/X86/Utils/X86ShuffleDecode.cpp

test/CodeGen/X86/vector-shuffle-128-v8.ll

SSE pslldq/psrldq shuffle mask decodes
ClosedPublic