Diff 315776

llvm/lib/Transforms/Vectorize/SLPVectorizer.cpp

This file is larger than 256 KB, so syntax highlighting is disabled by default.

	Show First 20 Lines • Show All 4,257 Lines • ▼ Show 20 Lines
	}			}

	Value *BoUpSLP::vectorizeTree(ArrayRef<Value *> VL) {			Value *BoUpSLP::vectorizeTree(ArrayRef<Value *> VL) {
	InstructionsState S = getSameOpcode(VL);			InstructionsState S = getSameOpcode(VL);
	if (S.getOpcode()) {			if (S.getOpcode()) {
	if (TreeEntry *E = getTreeEntry(S.OpValue)) {			if (TreeEntry *E = getTreeEntry(S.OpValue)) {
	if (E->isSame(VL)) {			if (E->isSame(VL)) {
	Value *V = vectorizeTree(E);			Value *V = vectorizeTree(E);
	if (VL.size() == E->Scalars.size() && !E->ReuseShuffleIndices.empty()) {			if (VL.size() == E->Scalars.size() && !E->ReuseShuffleIndices.empty()) {
	// We need to get the vectorized value but without shuffle.
	if (auto *SV = dyn_cast<ShuffleVectorInst>(V)) {
	V = SV->getOperand(0);
	} else {
	// Reshuffle to get only unique values.			// Reshuffle to get only unique values.
	SmallVector<int, 4> UniqueIdxs;			SmallVector<int, 4> UniqueIdxs;
	SmallSet<int, 4> UsedIdxs;			SmallSet<int, 4> UsedIdxs;
	for (int Idx : E->ReuseShuffleIndices)			int Pos = 0;
				for (int Idx : E->ReuseShuffleIndices) {
	if (UsedIdxs.insert(Idx).second)			if (UsedIdxs.insert(Idx).second)
	UniqueIdxs.emplace_back(Idx);			UniqueIdxs.emplace_back(Pos);
	V = Builder.CreateShuffleVector(V, UniqueIdxs);			++Pos;
				[Inline review comment — anton-afanasyev (unsubmitted, not done)]: This comment is obsolete after change.
	}			}
				V = Builder.CreateShuffleVector(V, UniqueIdxs, "shrink.shuffle");
	}			}
	return V;			return V;
	}			}
	}			}
	}			}

	// Check that every instruction appears once in this bundle.			// Check that every instruction appears once in this bundle.
	SmallVector<int, 4> ReuseShuffleIndicies;			SmallVector<int, 4> ReuseShuffleIndicies;
	▲ Show 20 Lines • Show All 3,514 Lines • Show Last 20 Lines

llvm/test/Transforms/SLPVectorizer/X86/shrink_after_reorder.ll

; NOTE: Assertions have been autogenerated by utils/update_test_checks.py		; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
; RUN: opt -slp-vectorizer -S -o - -mtriple=x86_64-unknown-linux-gnu -mcpu=haswell < %s | FileCheck %s		; RUN: opt -slp-vectorizer -S -o - -mtriple=x86_64-unknown-linux-gnu -mcpu=haswell < %s | FileCheck %s

define void @wombat(i32* %ptr, i32* %ptr1) {		define void @wombat(i32* %ptr, i32* %ptr1) {
; CHECK-LABEL: @wombat(		; CHECK-LABEL: @wombat(
; CHECK-NEXT: bb:		; CHECK-NEXT: bb:
; CHECK-NEXT: [[TMP7:%.*]] = getelementptr inbounds i32, i32* [[PTR:%.*]], i64 1		; CHECK-NEXT: [[TMP7:%.*]] = getelementptr inbounds i32, i32* [[PTR:%.*]], i64 1
; CHECK-NEXT: [[TMP8:%.*]] = getelementptr inbounds i32, i32* [[PTR]], i64 0		; CHECK-NEXT: [[TMP8:%.*]] = getelementptr inbounds i32, i32* [[PTR]], i64 0
; CHECK-NEXT: [[TMP0:%.*]] = bitcast i32* [[TMP8]] to <2 x i32>*		; CHECK-NEXT: [[TMP0:%.*]] = bitcast i32* [[TMP8]] to <2 x i32>*
; CHECK-NEXT: [[TMP1:%.*]] = load <2 x i32>, <2 x i32>* [[TMP0]], align 8		; CHECK-NEXT: [[TMP1:%.*]] = load <2 x i32>, <2 x i32>* [[TMP0]], align 8
; CHECK-NEXT: [[SHUFFLE:%.*]] = shufflevector <2 x i32> [[TMP1]], <2 x i32> poison, <4 x i32> <i32 1, i32 0, i32 1, i32 0>		; CHECK-NEXT: [[SHUFFLE:%.*]] = shufflevector <2 x i32> [[TMP1]], <2 x i32> poison, <4 x i32> <i32 1, i32 0, i32 1, i32 0>
; CHECK-NEXT: [[TMP27:%.*]] = getelementptr inbounds i32, i32* [[PTR1:%.*]], i32 3		; CHECK-NEXT: [[TMP27:%.*]] = getelementptr inbounds i32, i32* [[PTR1:%.*]], i32 3
; CHECK-NEXT: [[TMP2:%.*]] = add nsw <2 x i32> [[TMP1]], <i32 -1, i32 -1>		; CHECK-NEXT: [[SHRINK_SHUFFLE:%.*]] = shufflevector <4 x i32> [[SHUFFLE]], <4 x i32> poison, <2 x i32> <i32 0, i32 1>
		; CHECK-NEXT: [[TMP2:%.*]] = add nsw <2 x i32> [[SHRINK_SHUFFLE]], <i32 -1, i32 -1>
; CHECK-NEXT: [[SHUFFLE1:%.*]] = shufflevector <2 x i32> [[TMP2]], <2 x i32> poison, <4 x i32> <i32 0, i32 1, i32 0, i32 1>		; CHECK-NEXT: [[SHUFFLE1:%.*]] = shufflevector <2 x i32> [[TMP2]], <2 x i32> poison, <4 x i32> <i32 0, i32 1, i32 0, i32 1>
; CHECK-NEXT: [[TMP34:%.*]] = getelementptr inbounds i32, i32* [[PTR1]], i32 4		; CHECK-NEXT: [[TMP34:%.*]] = getelementptr inbounds i32, i32* [[PTR1]], i32 4
; CHECK-NEXT: [[TMP40:%.*]] = getelementptr inbounds i32, i32* [[PTR1]], i32 5		; CHECK-NEXT: [[TMP40:%.*]] = getelementptr inbounds i32, i32* [[PTR1]], i32 5
; CHECK-NEXT: [[TMP3:%.*]] = icmp sgt <4 x i32> [[SHUFFLE]], undef		; CHECK-NEXT: [[TMP3:%.*]] = icmp sgt <4 x i32> [[SHUFFLE]], undef
; CHECK-NEXT: [[TMP4:%.*]] = select <4 x i1> [[TMP3]], <4 x i32> undef, <4 x i32> [[SHUFFLE1]]		; CHECK-NEXT: [[TMP4:%.*]] = select <4 x i1> [[TMP3]], <4 x i32> undef, <4 x i32> [[SHUFFLE1]]
; CHECK-NEXT: [[TMP5:%.*]] = select <4 x i1> zeroinitializer, <4 x i32> zeroinitializer, <4 x i32> [[TMP4]]		; CHECK-NEXT: [[TMP5:%.*]] = select <4 x i1> zeroinitializer, <4 x i32> zeroinitializer, <4 x i32> [[TMP4]]
; CHECK-NEXT: [[TMP46:%.*]] = getelementptr inbounds i32, i32* [[PTR1]], i32 6		; CHECK-NEXT: [[TMP46:%.*]] = getelementptr inbounds i32, i32* [[PTR1]], i32 6
; CHECK-NEXT: [[TMP6:%.*]] = bitcast i32* [[TMP27]] to <4 x i32>*		; CHECK-NEXT: [[TMP6:%.*]] = bitcast i32* [[TMP27]] to <4 x i32>*
Show All 38 Lines	bb:
ret void		ret void
}		}

define internal i32 @ipvideo_decode_block_opcode_0xD_16() {		define internal i32 @ipvideo_decode_block_opcode_0xD_16() {
; CHECK-LABEL: @ipvideo_decode_block_opcode_0xD_16(		; CHECK-LABEL: @ipvideo_decode_block_opcode_0xD_16(
; CHECK-NEXT: entry:		; CHECK-NEXT: entry:
; CHECK-NEXT: br label [[FOR_BODY:%.*]]		; CHECK-NEXT: br label [[FOR_BODY:%.*]]
; CHECK: for.body:		; CHECK: for.body:
; CHECK-NEXT: [[TMP0:%.*]] = phi <2 x i16> [ undef, [[ENTRY:%.*]] ], [ [[TMP0]], [[IF_END:%.*]] ]		; CHECK-NEXT: [[TMP0:%.*]] = phi <2 x i16> [ undef, [[ENTRY:%.*]] ], [ [[SHRINK_SHUFFLE:%.*]], [[IF_END:%.*]] ]
; CHECK-NEXT: [[SHUFFLE:%.*]] = shufflevector <2 x i16> [[TMP0]], <2 x i16> poison, <8 x i32> <i32 0, i32 0, i32 0, i32 0, i32 1, i32 1, i32 1, i32 1>		; CHECK-NEXT: [[SHUFFLE:%.*]] = shufflevector <2 x i16> [[TMP0]], <2 x i16> poison, <8 x i32> <i32 0, i32 0, i32 0, i32 0, i32 1, i32 1, i32 1, i32 1>
; CHECK-NEXT: br label [[IF_END]]		; CHECK-NEXT: br label [[IF_END]]
; CHECK: if.end:		; CHECK: if.end:
; CHECK-NEXT: [[ARRAYIDX11_1:%.*]] = getelementptr inbounds i16, i16* undef, i32 1		; CHECK-NEXT: [[ARRAYIDX11_1:%.*]] = getelementptr inbounds i16, i16* undef, i32 1
; CHECK-NEXT: [[ARRAYIDX11_2:%.*]] = getelementptr inbounds i16, i16* undef, i32 2		; CHECK-NEXT: [[ARRAYIDX11_2:%.*]] = getelementptr inbounds i16, i16* undef, i32 2
; CHECK-NEXT: [[ARRAYIDX11_3:%.*]] = getelementptr inbounds i16, i16* undef, i32 3		; CHECK-NEXT: [[ARRAYIDX11_3:%.*]] = getelementptr inbounds i16, i16* undef, i32 3
; CHECK-NEXT: [[ARRAYIDX11_4:%.*]] = getelementptr inbounds i16, i16* undef, i32 4		; CHECK-NEXT: [[ARRAYIDX11_4:%.*]] = getelementptr inbounds i16, i16* undef, i32 4
; CHECK-NEXT: [[ARRAYIDX11_5:%.*]] = getelementptr inbounds i16, i16* undef, i32 5		; CHECK-NEXT: [[ARRAYIDX11_5:%.*]] = getelementptr inbounds i16, i16* undef, i32 5
; CHECK-NEXT: [[ARRAYIDX11_6:%.*]] = getelementptr inbounds i16, i16* undef, i32 6		; CHECK-NEXT: [[ARRAYIDX11_6:%.*]] = getelementptr inbounds i16, i16* undef, i32 6
; CHECK-NEXT: [[ARRAYIDX11_7:%.*]] = getelementptr inbounds i16, i16* undef, i32 7		; CHECK-NEXT: [[ARRAYIDX11_7:%.*]] = getelementptr inbounds i16, i16* undef, i32 7
; CHECK-NEXT: store <8 x i16> [[SHUFFLE]], <8 x i16>* undef, align 2		; CHECK-NEXT: store <8 x i16> [[SHUFFLE]], <8 x i16>* undef, align 2
		; CHECK-NEXT: [[SHRINK_SHUFFLE]] = shufflevector <8 x i16> [[SHUFFLE]], <8 x i16> poison, <2 x i32> <i32 0, i32 4>
; CHECK-NEXT: br label [[FOR_BODY]]		; CHECK-NEXT: br label [[FOR_BODY]]
;		;
entry:		entry:
br label %for.body		br label %for.body

for.body: ; preds = %if.end, %entry		for.body: ; preds = %if.end, %entry
%P.sroa.7.0 = phi i16 [ undef, %entry ], [ %P.sroa.7.0, %if.end ]		%P.sroa.7.0 = phi i16 [ undef, %entry ], [ %P.sroa.7.0, %if.end ]
%P.sroa.0.0 = phi i16 [ undef, %entry ], [ %P.sroa.0.0, %if.end ]		%P.sroa.0.0 = phi i16 [ undef, %entry ], [ %P.sroa.0.0, %if.end ]
Show All 20 Lines

This is an archive of the discontinued LLVM Phabricator instance.

[SLP]Need shrink the load vector after reordering.
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 315776

llvm/lib/Transforms/Vectorize/SLPVectorizer.cpp

llvm/test/Transforms/SLPVectorizer/X86/shrink_after_reorder.ll

This is an archive of the discontinued LLVM Phabricator instance.

[SLP]Need shrink the load vector after reordering. ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 315776

llvm/lib/Transforms/Vectorize/SLPVectorizer.cpp

llvm/test/Transforms/SLPVectorizer/X86/shrink_after_reorder.ll

[SLP]Need shrink the load vector after reordering.
ClosedPublic