This is an archive of the discontinued LLVM Phabricator instance.

Value t0 = mm256UnpackLoPs(ib, vs[0], vs[1]);
Value t1 = mm256UnpackHiPs(ib, vs[0], vs[1]);
Value t2 = mm256UnpackLoPs(ib, vs[2], vs[3]);
Value t3 = mm256UnpackHiPs(ib, vs[2], vs[3]);
Value t4 = mm256UnpackLoPs(ib, vs[4], vs[5]);
Value t5 = mm256UnpackHiPs(ib, vs[4], vs[5]);
Value t6 = mm256UnpackLoPs(ib, vs[6], vs[7]);
Value t7 = mm256UnpackHiPs(ib, vs[6], vs[7]);

It should be relatively easy to enable these AVX2 lowering patterns for i32 as well, since i32 and f32 elements have the same size (32 bits).

This revision was landed with ongoing or failed builds. (Feb 25 2022, 11:30 AM)

Closed by commit rG875bbce9f720: [mlir][Vector] Prevent AVX2 lowering for non-f32 transpose ops (authored by dcaballe). · Explain Why

This revision was automatically updated to reflect the committed changes.

dcaballe added a commit: rG875bbce9f720: [mlir][Vector] Prevent AVX2 lowering for non-f32 transpose ops.

Revision Contents

Path

Size

mlir/

lib/

Dialect/

X86Vector/

Transforms/

AVXTranspose.cpp

5 lines

test/

Dialect/

Vector/

vector-transpose-lowering.mlir

9 lines

Diff 411479

mlir/lib/Dialect/X86Vector/Transforms/AVXTranspose.cpp

Show First 20 Lines • Show All 244 Lines • ▼ Show 20 Lines	TransposeOpLowering(LoweringOptions loweringOptions, MLIRContext *context,
: OpRewritePattern<vector::TransposeOp>(context, benefit),		: OpRewritePattern<vector::TransposeOp>(context, benefit),
loweringOptions(loweringOptions) {}		loweringOptions(loweringOptions) {}

LogicalResult matchAndRewrite(vector::TransposeOp op,		LogicalResult matchAndRewrite(vector::TransposeOp op,
PatternRewriter &rewriter) const override {		PatternRewriter &rewriter) const override {
auto loc = op.getLoc();		auto loc = op.getLoc();

// Check if the source vector type is supported. AVX2 patterns can only be		// Check if the source vector type is supported. AVX2 patterns can only be
// applied if the vector type has two dimensions greater than one.		// applied to f32 vector types with two dimensions greater than one.
VectorType srcType = op.getVectorType();		VectorType srcType = op.getVectorType();
		if (!srcType.getElementType().isF32())
		return rewriter.notifyMatchFailure(op, "Unsupported vector element type");

SmallVector<int64_t> srcGtOneDims;		SmallVector<int64_t> srcGtOneDims;
for (auto &en : llvm::enumerate(srcType.getShape()))		for (auto &en : llvm::enumerate(srcType.getShape()))
if (en.value() > 1)		if (en.value() > 1)
srcGtOneDims.push_back(en.index());		srcGtOneDims.push_back(en.index());

if (srcGtOneDims.size() != 2)		if (srcGtOneDims.size() != 2)
return rewriter.notifyMatchFailure(op, "Unsupported vector type");		return rewriter.notifyMatchFailure(op, "Unsupported vector type");

▲ Show 20 Lines • Show All 71 Lines • Show Last 20 Lines

mlir/test/Dialect/Vector/vector-transpose-lowering.mlir

Show First 20 Lines • Show All 542 Lines • ▼ Show 20 Lines	func @transpose210_1x8x8xf32(%arg0: vector<1x8x8xf32>) -> vector<8x8x1xf32> {
// AVX2-NEXT: vector.insert {{.*}}[7]		// AVX2-NEXT: vector.insert {{.*}}[7]
// AVX2-NEXT: vector.shape_cast %{{.*}} : vector<8x8xf32> to vector<8x8x1xf32>		// AVX2-NEXT: vector.shape_cast %{{.*}} : vector<8x8xf32> to vector<8x8x1xf32>
%0 = vector.transpose %arg0, [2, 1, 0] : vector<1x8x8xf32> to vector<8x8x1xf32>		%0 = vector.transpose %arg0, [2, 1, 0] : vector<1x8x8xf32> to vector<8x8x1xf32>
return %0 : vector<8x8x1xf32>		return %0 : vector<8x8x1xf32>
}		}

// -----		// -----

		func @do_not_lower_nonf32_to_avx2(%arg0: vector<4x8xi32>) -> vector<8x4xi32> {
		%0 = vector.transpose %arg0, [1, 0] : vector<4x8xi32> to vector<8x4xi32>
		return %0 : vector<8x4xi32>
		}

		// AVX2-NOT: vector.shuffle

		// -----

// AVX2-LABEL: func @transpose021_8x1x8		// AVX2-LABEL: func @transpose021_8x1x8
func @transpose021_8x1x8xf32(%arg0: vector<8x1x8xf32>) -> vector<8x8x1xf32> {		func @transpose021_8x1x8xf32(%arg0: vector<8x1x8xf32>) -> vector<8x8x1xf32> {
%0 = vector.transpose %arg0, [0, 2, 1] : vector<8x1x8xf32> to vector<8x8x1xf32>		%0 = vector.transpose %arg0, [0, 2, 1] : vector<8x1x8xf32> to vector<8x8x1xf32>
return %0 : vector<8x8x1xf32>		return %0 : vector<8x8x1xf32>
}		}

// AVX2-NOT: vector.shuffle		// AVX2-NOT: vector.shuffle

▲ Show 20 Lines • Show All 51 Lines • Show Last 20 Lines

This is an archive of the discontinued LLVM Phabricator instance.

[mlir][Vector] Prevent AVX2 lowering for non-f32 transpose ops (Closed, Public)

Details

Diff Detail

Event Timeline

Revision Contents

Diff 411479

mlir/lib/Dialect/X86Vector/Transforms/AVXTranspose.cpp

mlir/test/Dialect/Vector/vector-transpose-lowering.mlir

[mlir][Vector] Prevent AVX2 lowering for non-f32 transpose ops
Closed, Public