This is an archive of the discontinued LLVM Phabricator instance.

[InstCombine] try to turn shuffle into insertelement
ClosedPublic

Authored by spatel on Oct 22 2018, 9:14 AM.

Download Raw Diff

Details

Reviewers

efriedma
lebedev.ri
craig.topper
RKSimon

Commits

rGb12e410082d4: [InstCombine] try to turn shuffle into insertelement
rL345607: [InstCombine] try to turn shuffle into insertelement

Summary

shuffle (insert ?, Scalar, IndexC), V1, Mask --> insert V1, Scalar, IndexC'

The motivating case is at least a couple of steps away: I noticed that SLPVectorizer does not analyze shuffles as well as sequences of insert/extract in PR34724:
https://bugs.llvm.org/show_bug.cgi?id=34724
...so SLP may fail to vectorize when source code has shuffles to start with or instcombine has converted insert/extract to shuffles.

Independent of that, an insertelement is always a simpler op for IR analysis vs. a shuffle, so we should transform to insert when possible.

I don't think there's any codegen concern here - if a target can't insert a scalar directly to some fixed element in a vector (x86?), then this should get expanded to the insert+shuffle that we started with.

Diff Detail

Repository: rL LLVM

Event Timeline

spatel created this revision. · Oct 22 2018, 9:14 AM

Herald added a subscriber: mcrosier. · View Herald Transcript · Oct 22 2018, 9:15 AM

Ping.

LGTM with one minor comment.

lib/Transforms/InstCombine/InstCombineVectorOps.cpp
1579 ↗	(On Diff #170437)	Worth returning a ConstantInt*/nullptr instead? Mainly to remove the external IndexC being used for the match at the start of the lambda.

This revision is now accepted and ready to land. · Oct 30 2018, 4:29 AM

spatel added inline comments. · Oct 30 2018, 7:55 AM

lib/Transforms/InstCombine/InstCombineVectorOps.cpp
1579 ↗	(On Diff #170437)	We can make this more like a souped-up 'match', so pass in both of the values that we want to capture: auto isShufflingScalarIntoOp1 = [&](Value *&Scalar, ConstantInt *&IndexC) {

Closed by commit rL345607: [InstCombine] try to turn shuffle into insertelement (authored by spatel). · Explain Why · Oct 30 2018, 8:29 AM

This revision was automatically updated to reflect the committed changes.

Revision Contents

Path

Size

llvm/

trunk/

lib/

Transforms/

InstCombine/

InstCombineVectorOps.cpp

70 lines

test/

Transforms/

InstCombine/

insert-extract-shuffle.ll

39 lines

Diff 171710

llvm/trunk/lib/Transforms/InstCombine/InstCombineVectorOps.cpp

Show First 20 Lines • Show All 1,525 Lines • ▼ Show 20 Lines	static Instruction *foldIdentityExtractShuffle(ShuffleVectorInst &Shuf) {
for (unsigned i = 0; i != NumElts; ++i) {		for (unsigned i = 0; i != NumElts; ++i) {
Constant *ExtractMaskElt = Shuf.getMask()->getAggregateElement(i);		Constant *ExtractMaskElt = Shuf.getMask()->getAggregateElement(i);
Constant *MaskElt = Mask->getAggregateElement(i);		Constant *MaskElt = Mask->getAggregateElement(i);
NewMask[i] = isa<UndefValue>(ExtractMaskElt) ? ExtractMaskElt : MaskElt;		NewMask[i] = isa<UndefValue>(ExtractMaskElt) ? ExtractMaskElt : MaskElt;
}		}
return new ShuffleVectorInst(X, Y, ConstantVector::get(NewMask));		return new ShuffleVectorInst(X, Y, ConstantVector::get(NewMask));
}		}

		/// Try to replace a shuffle with an insertelement.
		///
		/// Handles a shuffle whose mask length equals the element count of its
		/// operands, where one operand is an insertelement with a constant index.
		/// If exactly one defined mask lane selects the inserted scalar and every
		/// other defined lane selects the same-numbered lane of the other operand,
		/// the shuffle is equivalent to inserting that scalar into the other operand:
		///   shuffle (insert ?, Scalar, IndexC), V1, Mask --> insert V1, Scalar, IndexC'
		/// Both operand orders are tried.
		///
		/// \param Shuf the shuffle to examine.
		/// \returns the replacement instruction produced by
		/// InsertElementInst::Create, or nullptr if the pattern does not match.
		static Instruction *foldShuffleWithInsert(ShuffleVectorInst &Shuf) {
		  Value *V0 = Shuf.getOperand(0);
		  Value *V1 = Shuf.getOperand(1);
		  SmallVector<int, 16> Mask = Shuf.getShuffleMask();

		  // The shuffle must not change vector sizes.
		  // TODO: This restriction could be removed if the insert has only one use
		  //       (because the transform would require a new length-changing shuffle).
		  int NumElts = Mask.size();
		  if (NumElts != static_cast<int>(V0->getType()->getVectorNumElements()))
		    return nullptr;

		  // shuffle (insert ?, Scalar, IndexC), V1, Mask --> insert V1, Scalar, IndexC'
		  //
		  // Scalar and IndexC are out-parameters: they are bound by the pattern match
		  // on V0, and on success IndexC is replaced by the lane the scalar lands in.
		  // V0, V1, Mask and NumElts are captured by reference, so the lambda sees
		  // the commuted values on the second attempt below.
		  auto isShufflingScalarIntoOp1 = [&](Value *&Scalar, ConstantInt *&IndexC) {
		    // We need an insertelement with a constant index.
		    if (!match(V0, m_InsertElement(m_Value(), m_Value(Scalar),
		                                   m_ConstantInt(IndexC))))
		      return false;

		    // Test the shuffle mask to see if it splices the inserted scalar into the
		    // operand 1 vector of the shuffle.
		    int NewInsIndex = -1;
		    for (int i = 0; i != NumElts; ++i) {
		      // Ignore undef mask elements.
		      if (Mask[i] == -1)
		        continue;

		      // The shuffle takes elements of operand 1 without lane changes.
		      if (Mask[i] == NumElts + i)
		        continue;

		      // The shuffle must choose the inserted scalar exactly once.
		      if (NewInsIndex != -1 || Mask[i] != IndexC->getSExtValue())
		        return false;

		      // The shuffle is placing the inserted scalar into element i.
		      NewInsIndex = i;
		    }

		    assert(NewInsIndex != -1 && "Did not fold shuffle with unused operand?");

		    // Index is updated to the potentially translated insertion lane.
		    IndexC = ConstantInt::get(IndexC->getType(), NewInsIndex);
		    return true;
		  };

		  // If the shuffle is unnecessary, insert the scalar operand directly into
		  // operand 1 of the shuffle. Example:
		  // shuffle (insert ?, S, 1), V1, <1, 5, 6, 7> --> insert V1, S, 0
		  Value *Scalar;
		  ConstantInt *IndexC;
		  if (isShufflingScalarIntoOp1(Scalar, IndexC))
		    return InsertElementInst::Create(V1, Scalar, IndexC);

		  // Try again after commuting shuffle. Example:
		  // shuffle V0, (insert ?, S, 0), <0, 1, 2, 4> -->
		  // shuffle (insert ?, S, 0), V0, <4, 5, 6, 0> --> insert V0, S, 3
		  std::swap(V0, V1);
		  ShuffleVectorInst::commuteShuffleMask(Mask, NumElts);
		  if (isShufflingScalarIntoOp1(Scalar, IndexC))
		    return InsertElementInst::Create(V1, Scalar, IndexC);

		  return nullptr;
		}

Instruction *InstCombiner::visitShuffleVectorInst(ShuffleVectorInst &SVI) {		Instruction *InstCombiner::visitShuffleVectorInst(ShuffleVectorInst &SVI) {
Value *LHS = SVI.getOperand(0);		Value *LHS = SVI.getOperand(0);
Value *RHS = SVI.getOperand(1);		Value *RHS = SVI.getOperand(1);
if (auto *V = SimplifyShuffleVectorInst(		if (auto *V = SimplifyShuffleVectorInst(
LHS, RHS, SVI.getMask(), SVI.getType(), SQ.getWithInstruction(&SVI)))		LHS, RHS, SVI.getMask(), SVI.getType(), SQ.getWithInstruction(&SVI)))
return replaceInstUsesWith(SVI, V);		return replaceInstUsesWith(SVI, V);

if (Instruction *I = foldSelectShuffle(SVI, Builder, DL))		if (Instruction *I = foldSelectShuffle(SVI, Builder, DL))
Show All 9 Lines	if (Value *V = SimplifyDemandedVectorElts(&SVI, AllOnesEltMask, UndefElts)) {
if (V != &SVI)		if (V != &SVI)
return replaceInstUsesWith(SVI, V);		return replaceInstUsesWith(SVI, V);
return &SVI;		return &SVI;
}		}

if (Instruction *I = foldIdentityExtractShuffle(SVI))		if (Instruction *I = foldIdentityExtractShuffle(SVI))
return I;		return I;

		// This transform has the potential to lose undef knowledge, so it is
		// intentionally placed after SimplifyDemandedVectorElts().
		if (Instruction *I = foldShuffleWithInsert(SVI))
		return I;

SmallVector<int, 16> Mask = SVI.getShuffleMask();		SmallVector<int, 16> Mask = SVI.getShuffleMask();
Type *Int32Ty = Type::getInt32Ty(SVI.getContext());		Type *Int32Ty = Type::getInt32Ty(SVI.getContext());
unsigned LHSWidth = LHS->getType()->getVectorNumElements();		unsigned LHSWidth = LHS->getType()->getVectorNumElements();
bool MadeChange = false;		bool MadeChange = false;

// Canonicalize shuffle(x ,x,mask) -> shuffle(x, undef,mask')		// Canonicalize shuffle(x ,x,mask) -> shuffle(x, undef,mask')
// Canonicalize shuffle(undef,x,mask) -> shuffle(x, undef,mask').		// Canonicalize shuffle(undef,x,mask) -> shuffle(x, undef,mask').
if (LHS == RHS \|\| isa<UndefValue>(LHS)) {		if (LHS == RHS \|\| isa<UndefValue>(LHS)) {
▲ Show 20 Lines • Show All 320 Lines • Show Last 20 Lines

llvm/trunk/test/Transforms/InstCombine/insert-extract-shuffle.ll

Show First 20 Lines • Show All 297 Lines • ▼ Show 20 Lines	;
%x0 = extractelement <2 x float> %x, i32 0		%x0 = extractelement <2 x float> %x, i32 0
%x1 = extractelement <2 x float> %x, i32 1		%x1 = extractelement <2 x float> %x, i32 1
%v1 = insertelement <4 x float> undef, float %x0, i32 1		%v1 = insertelement <4 x float> undef, float %x0, i32 1
%v2 = insertelement <4 x float> %v1, float %x1, i32 2		%v2 = insertelement <4 x float> %v1, float %x1, i32 2
%v3 = insertelement <4 x float> %v2, float %y, i32 3		%v3 = insertelement <4 x float> %v2, float %y, i32 3
ret <4 x float> %v3		ret <4 x float> %v3
}		}

; TODO: Simplest case - insert scalar into undef, then shuffle that value in place into another vector.		; Simplest case - insert scalar into undef, then shuffle that value in place into another vector.

define <4 x float> @insert_shuffle(float %x, <4 x float> %y) {		define <4 x float> @insert_shuffle(float %x, <4 x float> %y) {
; CHECK-LABEL: @insert_shuffle(		; CHECK-LABEL: @insert_shuffle(
; CHECK-NEXT: [[XV:%.*]] = insertelement <4 x float> undef, float [[X:%.*]], i32 0		; CHECK-NEXT: [[R:%.*]] = insertelement <4 x float> [[Y:%.*]], float [[X:%.*]], i32 0
; CHECK-NEXT: [[R:%.*]] = shufflevector <4 x float> [[XV]], <4 x float> [[Y:%.*]], <4 x i32> <i32 0, i32 5, i32 6, i32 7>
; CHECK-NEXT: ret <4 x float> [[R]]		; CHECK-NEXT: ret <4 x float> [[R]]
;		;
%xv = insertelement <4 x float> undef, float %x, i32 0		%xv = insertelement <4 x float> undef, float %x, i32 0
%r = shufflevector <4 x float> %xv, <4 x float> %y, <4 x i32> <i32 0, i32 5, i32 6, i32 7>		%r = shufflevector <4 x float> %xv, <4 x float> %y, <4 x i32> <i32 0, i32 5, i32 6, i32 7>
ret <4 x float> %r		ret <4 x float> %r
}		}

; TODO: Insert scalar into some element of a dummy vector, then move it to a different element in another vector.		; Insert scalar into some element of a dummy vector, then move it to a different element in another vector.

define <4 x float> @insert_shuffle_translate(float %x, <4 x float> %y) {		define <4 x float> @insert_shuffle_translate(float %x, <4 x float> %y) {
; CHECK-LABEL: @insert_shuffle_translate(		; CHECK-LABEL: @insert_shuffle_translate(
; CHECK-NEXT: [[XV:%.*]] = insertelement <4 x float> undef, float [[X:%.*]], i32 0		; CHECK-NEXT: [[R:%.*]] = insertelement <4 x float> [[Y:%.*]], float [[X:%.*]], i32 1
; CHECK-NEXT: [[R:%.*]] = shufflevector <4 x float> [[XV]], <4 x float> [[Y:%.*]], <4 x i32> <i32 4, i32 0, i32 6, i32 7>
; CHECK-NEXT: ret <4 x float> [[R]]		; CHECK-NEXT: ret <4 x float> [[R]]
;		;
%xv = insertelement <4 x float> undef, float %x, i32 0		%xv = insertelement <4 x float> undef, float %x, i32 0
%r = shufflevector <4 x float> %xv, <4 x float> %y, <4 x i32> <i32 4, i32 0, i32 6, i32 7>		%r = shufflevector <4 x float> %xv, <4 x float> %y, <4 x i32> <i32 4, i32 0, i32 6, i32 7>
ret <4 x float> %r		ret <4 x float> %r
}		}

; TODO: The vector operand of the insert is irrelevant.		; The vector operand of the insert is irrelevant.

define <4 x float> @insert_not_undef_shuffle_translate(float %x, <4 x float> %y, <4 x float> %q) {		define <4 x float> @insert_not_undef_shuffle_translate(float %x, <4 x float> %y, <4 x float> %q) {
; CHECK-LABEL: @insert_not_undef_shuffle_translate(		; CHECK-LABEL: @insert_not_undef_shuffle_translate(
; CHECK-NEXT: [[XV:%.*]] = insertelement <4 x float> undef, float [[X:%.*]], i32 3		; CHECK-NEXT: [[R:%.*]] = insertelement <4 x float> [[Y:%.*]], float [[X:%.*]], i32 2
; CHECK-NEXT: [[R:%.*]] = shufflevector <4 x float> [[XV]], <4 x float> [[Y:%.*]], <4 x i32> <i32 4, i32 5, i32 3, i32 7>
; CHECK-NEXT: ret <4 x float> [[R]]		; CHECK-NEXT: ret <4 x float> [[R]]
;		;
%xv = insertelement <4 x float> %q, float %x, i32 3		%xv = insertelement <4 x float> %q, float %x, i32 3
%r = shufflevector <4 x float> %xv, <4 x float> %y, <4 x i32> <i32 4, i32 5, i32 3, i32 7>		%r = shufflevector <4 x float> %xv, <4 x float> %y, <4 x i32> <i32 4, i32 5, i32 3, i32 7>
ret <4 x float> %r		ret <4 x float> %r
}		}

; TODO: The insert may be the 2nd operand of the shuffle. The shuffle mask can include undef elements.		; The insert may be the 2nd operand of the shuffle. The shuffle mask can include undef elements.

define <4 x float> @insert_not_undef_shuffle_translate_commute(float %x, <4 x float> %y, <4 x float> %q) {		define <4 x float> @insert_not_undef_shuffle_translate_commute(float %x, <4 x float> %y, <4 x float> %q) {
; CHECK-LABEL: @insert_not_undef_shuffle_translate_commute(		; CHECK-LABEL: @insert_not_undef_shuffle_translate_commute(
; CHECK-NEXT: [[XV:%.*]] = insertelement <4 x float> undef, float [[X:%.*]], i32 2		; CHECK-NEXT: [[R:%.*]] = insertelement <4 x float> [[Y:%.*]], float [[X:%.*]], i32 1
; CHECK-NEXT: [[R:%.*]] = shufflevector <4 x float> [[Y:%.*]], <4 x float> [[XV]], <4 x i32> <i32 0, i32 6, i32 2, i32 undef>
; CHECK-NEXT: ret <4 x float> [[R]]		; CHECK-NEXT: ret <4 x float> [[R]]
;		;
%xv = insertelement <4 x float> %q, float %x, i32 2		%xv = insertelement <4 x float> %q, float %x, i32 2
%r = shufflevector <4 x float> %y, <4 x float> %xv, <4 x i32> <i32 0, i32 6, i32 2, i32 undef>		%r = shufflevector <4 x float> %y, <4 x float> %xv, <4 x i32> <i32 0, i32 6, i32 2, i32 undef>
ret <4 x float> %r		ret <4 x float> %r
}		}

; TODO: Both shuffle operands may be inserts - choose the correct side.		; Both shuffle operands may be inserts - choose the correct side.

define <4 x float> @insert_insert_shuffle_translate(float %x1, float %x2, <4 x float> %q) {		define <4 x float> @insert_insert_shuffle_translate(float %x1, float %x2, <4 x float> %q) {
; CHECK-LABEL: @insert_insert_shuffle_translate(		; CHECK-LABEL: @insert_insert_shuffle_translate(
; CHECK-NEXT: [[XV1:%.*]] = insertelement <4 x float> undef, float [[X1:%.*]], i32 0
; CHECK-NEXT: [[XV2:%.*]] = insertelement <4 x float> [[Q:%.*]], float [[X2:%.*]], i32 2		; CHECK-NEXT: [[XV2:%.*]] = insertelement <4 x float> [[Q:%.*]], float [[X2:%.*]], i32 2
; CHECK-NEXT: [[R:%.*]] = shufflevector <4 x float> [[XV1]], <4 x float> [[XV2]], <4 x i32> <i32 4, i32 0, i32 6, i32 7>		; CHECK-NEXT: [[R:%.*]] = insertelement <4 x float> [[XV2]], float [[X1:%.*]], i32 1
; CHECK-NEXT: ret <4 x float> [[R]]		; CHECK-NEXT: ret <4 x float> [[R]]
;		;
%xv1 = insertelement <4 x float> %q, float %x1, i32 0		%xv1 = insertelement <4 x float> %q, float %x1, i32 0
%xv2 = insertelement <4 x float> %q, float %x2, i32 2		%xv2 = insertelement <4 x float> %q, float %x2, i32 2
%r = shufflevector <4 x float> %xv1, <4 x float> %xv2, <4 x i32> <i32 4, i32 0, i32 6, i32 7>		%r = shufflevector <4 x float> %xv1, <4 x float> %xv2, <4 x i32> <i32 4, i32 0, i32 6, i32 7>
ret <4 x float> %r		ret <4 x float> %r
}		}

; TODO: Both shuffle operands may be inserts - choose the correct side.		; Both shuffle operands may be inserts - choose the correct side.

define <4 x float> @insert_insert_shuffle_translate_commute(float %x1, float %x2, <4 x float> %q) {		define <4 x float> @insert_insert_shuffle_translate_commute(float %x1, float %x2, <4 x float> %q) {
; CHECK-LABEL: @insert_insert_shuffle_translate_commute(		; CHECK-LABEL: @insert_insert_shuffle_translate_commute(
; CHECK-NEXT: [[XV1:%.*]] = insertelement <4 x float> [[Q:%.*]], float [[X1:%.*]], i32 0		; CHECK-NEXT: [[XV1:%.*]] = insertelement <4 x float> [[Q:%.*]], float [[X1:%.*]], i32 0
; CHECK-NEXT: [[XV2:%.*]] = insertelement <4 x float> undef, float [[X2:%.*]], i32 2		; CHECK-NEXT: [[R:%.*]] = insertelement <4 x float> [[XV1]], float [[X2:%.*]], i32 1
; CHECK-NEXT: [[R:%.*]] = shufflevector <4 x float> [[XV1]], <4 x float> [[XV2]], <4 x i32> <i32 0, i32 6, i32 2, i32 3>
; CHECK-NEXT: ret <4 x float> [[R]]		; CHECK-NEXT: ret <4 x float> [[R]]
;		;
%xv1 = insertelement <4 x float> %q, float %x1, i32 0		%xv1 = insertelement <4 x float> %q, float %x1, i32 0
%xv2 = insertelement <4 x float> %q, float %x2, i32 2		%xv2 = insertelement <4 x float> %q, float %x2, i32 2
%r = shufflevector <4 x float> %xv1, <4 x float> %xv2, <4 x i32> <i32 0, i32 6, i32 2, i32 3>		%r = shufflevector <4 x float> %xv1, <4 x float> %xv2, <4 x i32> <i32 0, i32 6, i32 2, i32 3>
ret <4 x float> %r		ret <4 x float> %r
}		}

		; Negative test - this only works if the shuffle is choosing exactly 1 element from 1 of the inputs.
		; TODO: But this could be a special-case because we're inserting into the same base vector.

define <4 x float> @insert_insert_shuffle_translate_wrong_mask(float %x1, float %x2, <4 x float> %q) {		define <4 x float> @insert_insert_shuffle_translate_wrong_mask(float %x1, float %x2, <4 x float> %q) {
; CHECK-LABEL: @insert_insert_shuffle_translate_wrong_mask(		; CHECK-LABEL: @insert_insert_shuffle_translate_wrong_mask(
; CHECK-NEXT: [[XV1:%.*]] = insertelement <4 x float> [[Q:%.*]], float [[X1:%.*]], i32 0		; CHECK-NEXT: [[XV1:%.*]] = insertelement <4 x float> [[Q:%.*]], float [[X1:%.*]], i32 0
; CHECK-NEXT: [[XV2:%.*]] = insertelement <4 x float> [[Q]], float [[X2:%.*]], i32 2		; CHECK-NEXT: [[XV2:%.*]] = insertelement <4 x float> [[Q]], float [[X2:%.*]], i32 2
; CHECK-NEXT: [[R:%.*]] = shufflevector <4 x float> [[XV1]], <4 x float> [[XV2]], <4 x i32> <i32 0, i32 6, i32 2, i32 7>		; CHECK-NEXT: [[R:%.*]] = shufflevector <4 x float> [[XV1]], <4 x float> [[XV2]], <4 x i32> <i32 0, i32 6, i32 2, i32 7>
; CHECK-NEXT: ret <4 x float> [[R]]		; CHECK-NEXT: ret <4 x float> [[R]]
;		;
%xv1 = insertelement <4 x float> %q, float %x1, i32 0		%xv1 = insertelement <4 x float> %q, float %x1, i32 0
%xv2 = insertelement <4 x float> %q, float %x2, i32 2		%xv2 = insertelement <4 x float> %q, float %x2, i32 2
%r = shufflevector <4 x float> %xv1, <4 x float> %xv2, <4 x i32> <i32 0, i32 6, i32 2, i32 7>		%r = shufflevector <4 x float> %xv1, <4 x float> %xv2, <4 x i32> <i32 0, i32 6, i32 2, i32 7>
ret <4 x float> %r		ret <4 x float> %r
}		}

; TODO: The insert may have other uses.		; The insert may have other uses.

declare void @use(<4 x float>)		declare void @use(<4 x float>)

define <4 x float> @insert_not_undef_shuffle_translate_commute_uses(float %x, <4 x float> %y, <4 x float> %q) {		define <4 x float> @insert_not_undef_shuffle_translate_commute_uses(float %x, <4 x float> %y, <4 x float> %q) {
; CHECK-LABEL: @insert_not_undef_shuffle_translate_commute_uses(		; CHECK-LABEL: @insert_not_undef_shuffle_translate_commute_uses(
; CHECK-NEXT: [[XV:%.*]] = insertelement <4 x float> [[Q:%.*]], float [[X:%.*]], i32 2		; CHECK-NEXT: [[XV:%.*]] = insertelement <4 x float> [[Q:%.*]], float [[X:%.*]], i32 2
; CHECK-NEXT: call void @use(<4 x float> [[XV]])		; CHECK-NEXT: call void @use(<4 x float> [[XV]])
; CHECK-NEXT: [[R:%.*]] = shufflevector <4 x float> [[Y:%.*]], <4 x float> [[XV]], <4 x i32> <i32 6, i32 undef, i32 2, i32 3>		; CHECK-NEXT: [[R:%.*]] = insertelement <4 x float> [[Y:%.*]], float [[X]], i32 0
; CHECK-NEXT: ret <4 x float> [[R]]		; CHECK-NEXT: ret <4 x float> [[R]]
;		;
%xv = insertelement <4 x float> %q, float %x, i32 2		%xv = insertelement <4 x float> %q, float %x, i32 2
call void @use(<4 x float> %xv)		call void @use(<4 x float> %xv)
%r = shufflevector <4 x float> %y, <4 x float> %xv, <4 x i32> <i32 6, i32 undef, i32 2, i32 3>		%r = shufflevector <4 x float> %y, <4 x float> %xv, <4 x i32> <i32 6, i32 undef, i32 2, i32 3>
ret <4 x float> %r		ret <4 x float> %r
}		}

		; Negative test - size-changing shuffle.

define <5 x float> @insert_not_undef_shuffle_translate_commute_lengthen(float %x, <4 x float> %y, <4 x float> %q) {		define <5 x float> @insert_not_undef_shuffle_translate_commute_lengthen(float %x, <4 x float> %y, <4 x float> %q) {
; CHECK-LABEL: @insert_not_undef_shuffle_translate_commute_lengthen(		; CHECK-LABEL: @insert_not_undef_shuffle_translate_commute_lengthen(
; CHECK-NEXT: [[XV:%.*]] = insertelement <4 x float> undef, float [[X:%.*]], i32 2		; CHECK-NEXT: [[XV:%.*]] = insertelement <4 x float> undef, float [[X:%.*]], i32 2
; CHECK-NEXT: [[R:%.*]] = shufflevector <4 x float> [[Y:%.*]], <4 x float> [[XV]], <5 x i32> <i32 0, i32 6, i32 2, i32 undef, i32 undef>		; CHECK-NEXT: [[R:%.*]] = shufflevector <4 x float> [[Y:%.*]], <4 x float> [[XV]], <5 x i32> <i32 0, i32 6, i32 2, i32 undef, i32 undef>
; CHECK-NEXT: ret <5 x float> [[R]]		; CHECK-NEXT: ret <5 x float> [[R]]
;		;
%xv = insertelement <4 x float> %q, float %x, i32 2		%xv = insertelement <4 x float> %q, float %x, i32 2
%r = shufflevector <4 x float> %y, <4 x float> %xv, <5 x i32> <i32 0, i32 6, i32 2, i32 undef, i32 undef>		%r = shufflevector <4 x float> %y, <4 x float> %xv, <5 x i32> <i32 0, i32 6, i32 2, i32 undef, i32 undef>
ret <5 x float> %r		ret <5 x float> %r
}		}