This is an archive of the discontinued LLVM Phabricator instance.

[mlir][linalg] Fix lowering of tensor.pack operations
ClosedPublic

Authored by sabauma on Sep 1 2023, 2:01 PM.

Download Raw Diff

Details

Reviewers

hanchung
qedawkins
chelini
nicolasvasilache

Commits

rGf32427e0447c: [mlir][linalg] Fix lowering of tensor.pack operations

Summary

Tensor pack operations are optimistically lowered to pad + insert_slice
when the pack operation only pads the input tensor. The existing
lowering emits insert_slice operations which do not meet the
rank-reducibility requirements of insert_slice.

This change updates the logic in linalg::lowerPack to first check the
rank-reducibility requirement. When the requirement is not met, the
lowering will emit the full sequence of pad + expand + transpose.

Diff Detail

Repository: rG LLVM Github Monorepo

Event Timeline

sabauma created this revision.Sep 1 2023, 2:01 PM

Herald added a project: Restricted Project. · View Herald TranscriptSep 1 2023, 2:01 PM

Herald added subscribers: bviyer, Moerafaat, bzcheeseman and 24 others. · View Herald Transcript

sabauma added reviewers: hanchung, qedawkins, chelini.Sep 1 2023, 2:11 PM

sabauma published this revision for review.Sep 1 2023, 2:13 PM

Herald added a reviewer: nicolasvasilache. · View Herald TranscriptSep 1 2023, 2:13 PM

Herald added a project: Restricted Project. · View Herald Transcript

Herald added subscribers: limo1996, stephenneuendorffer, nicolasvasilache. · View Herald Transcript

Thanks, looks good to me.

mlir/lib/Dialect/Linalg/Transforms/Transforms.cpp
326	nit: tot -> to

This revision is now accepted and ready to land.Sep 4 2023, 4:32 PM

Spelling fix

@chelini If there are no other comments, would you mind submitting the change? I do not have commit access.

This revision was landed with ongoing or failed builds.Sep 5 2023, 12:14 PM

Closed by commit rGf32427e0447c: [mlir][linalg] Fix lowering of tensor.pack operations (authored by sabauma, committed by chelini). · Explain Why

This revision was automatically updated to reflect the committed changes.

chelini added a commit: rGf32427e0447c: [mlir][linalg] Fix lowering of tensor.pack operations.

Revision Contents

Path

Size

mlir/

lib/

Dialect/

Linalg/

Transforms/

Transforms.cpp

52 lines

test/

Dialect/

Linalg/

transform-lower-pack.mlir

34 lines

Diff 555863

mlir/lib/Dialect/Linalg/Transforms/Transforms.cpp

Show First 20 Lines • Show All 315 Lines • ▼ Show 20 Lines	LLVM_DEBUG(
[&](ReassociationIndices ri) {		[&](ReassociationIndices ri) {
llvm::interleaveComma(ri, llvm::dbgs() << "|");		llvm::interleaveComma(ri, llvm::dbgs() << "|");
});		});
DBGSNL();		DBGSNL();
llvm::interleaveComma(stripMinedShape, DBGS() << "stripMinedShape: ");		llvm::interleaveComma(stripMinedShape, DBGS() << "stripMinedShape: ");
DBGSNL(); DBGS() << "collapsed type: " << collapsed; DBGSNL(););		DBGSNL(); DBGS() << "collapsed type: " << collapsed; DBGSNL(););

if (packOp.isLikePad()) {		if (packOp.isLikePad()) {
		// Pack ops which operate as simple pads may not produce legal
		// tensor.insert_slice operations when the packed type does not rank reduce
		// to the padded type.
		chelini (inline comment, unsubmitted, not done): nit: tot -> to
		SliceVerificationResult rankReduces =
		isRankReducedType(packedTensorType, padOp.getResultType());

		if (rankReduces == SliceVerificationResult::Success) {
// This pack is just a plain pad.		// This pack is just a plain pad.
// Just insert the pad in the higher ranked tensor.		// Just insert the pad in the higher ranked tensor.
auto emptyOp =		auto emptyOp =
rewriter.create<tensor::EmptyOp>(loc, packedTensorType, ValueRange{});		rewriter.create<tensor::EmptyOp>(loc, packedTensorType, ValueRange{});
// Offsets.		// Offsets.
SmallVector<OpFoldResult> zeros(packedRank, rewriter.getIndexAttr(0));		SmallVector<OpFoldResult> zeros(packedRank, rewriter.getIndexAttr(0));
// Strides.		// Strides.
SmallVector<OpFoldResult> ones(packedRank, rewriter.getIndexAttr(1));		SmallVector<OpFoldResult> ones(packedRank, rewriter.getIndexAttr(1));
SmallVector<OpFoldResult> sizes =		SmallVector<OpFoldResult> sizes =
tensor::getMixedSizes(rewriter, loc, packOp.getDest());		tensor::getMixedSizes(rewriter, loc, packOp.getDest());

auto insertSliceOp = rewriter.create<tensor::InsertSliceOp>(		auto insertSliceOp = rewriter.create<tensor::InsertSliceOp>(
loc, /*source=*/padOp, /*dest=*/emptyOp,		loc, /*source=*/padOp, /*dest=*/emptyOp,
/*offsets=*/zeros, sizes,		/*offsets=*/zeros, sizes,
/*strides=*/ones);		/*strides=*/ones);

LLVM_DEBUG(DBGS() << "insert_slice op: " << insertSliceOp; DBGSNL(););		LLVM_DEBUG(DBGS() << "insert_slice op: " << insertSliceOp; DBGSNL(););

rewriter.replaceOp(packOp, insertSliceOp->getResults());		rewriter.replaceOp(packOp, insertSliceOp->getResults());

return LowerPackResult{padOp, /*reshapeOp=*/nullptr,		return LowerPackResult{padOp, /*reshapeOp=*/nullptr,
/*transposeOp=*/nullptr};		/*transposeOp=*/nullptr};
}		}
		}
// 5. Expand from the padded result to the stripMinedShape.		// 5. Expand from the padded result to the stripMinedShape.
auto reshapeOp = rewriter.create<tensor::ExpandShapeOp>(		auto reshapeOp = rewriter.create<tensor::ExpandShapeOp>(
loc,		loc,
RankedTensorType::Builder(packedTensorType).setShape(stripMinedShape),		RankedTensorType::Builder(packedTensorType).setShape(stripMinedShape),
padOp.getResult(), packingMetadata.reassociations);		padOp.getResult(), packingMetadata.reassociations);

// 6. Transpose stripMinedShape to packedShape.		// 6. Transpose stripMinedShape to packedShape.
SmallVector<int64_t> transpPerm =		SmallVector<int64_t> transpPerm =
▲ Show 20 Lines • Show All 1,245 Lines • Show Last 20 Lines

mlir/test/Dialect/Linalg/transform-lower-pack.mlir

	Show First 20 Lines • Show All 357 Lines • ▼ Show 20 Lines

	transform.sequence failures(propagate) {			transform.sequence failures(propagate) {
	^bb1(%module_op: !transform.any_op):			^bb1(%module_op: !transform.any_op):
	%pack = transform.structured.match ops{["tensor.pack"]} in %module_op			%pack = transform.structured.match ops{["tensor.pack"]} in %module_op
	: (!transform.any_op) -> !transform.op<"tensor.pack">			: (!transform.any_op) -> !transform.op<"tensor.pack">
	transform.structured.lower_pack %pack : (!transform.op<"tensor.pack">)			transform.structured.lower_pack %pack : (!transform.op<"tensor.pack">)
	-> (!transform.op<"tensor.pad">, !transform.op<"tensor.expand_shape">, !transform.op<"linalg.transpose">)			-> (!transform.op<"tensor.pad">, !transform.op<"tensor.expand_shape">, !transform.op<"linalg.transpose">)
	}			}

				// -----

				// CHECK-LABEL: func.func @pack_as_pad_with_unit_dims(
				// CHECK: %[[SRC:.+]]: tensor<3x1x1x1xf32>,
				// CHECK: %[[OUT:.+]]: tensor<1x1x1x1x8x1xf32>)
				func.func @pack_as_pad_with_unit_dims(%arg0: tensor<3x1x1x1xf32>, %arg1: tensor<1x1x1x1x8x1xf32>) -> (tensor<1x1x1x1x8x1xf32>) {
				%zero = arith.constant 0.0 : f32

				// CHECK: %[[PAD:.+]] = tensor.pad %[[SRC]] low[0, 0, 0, 0] high[5, 0, 0, 0] {
				// CHECK: : tensor<3x1x1x1xf32> to tensor<8x1x1x1xf32>
				// CHECK: %[[EXPAND:.+]] = tensor.expand_shape %[[PAD]] [{{.*}}[0, 1], [2, 3], [4], [5]]
				// CHECK-SAME: tensor<8x1x1x1xf32> into tensor<1x8x1x1x1x1xf32>
				// CHECK: %[[TRANSPOSED:.+]] = linalg.transpose
				// CHECK-SAME: ins(%[[EXPAND]] : tensor<1x8x1x1x1x1xf32>)
				// CHECK-SAME: outs(%[[OUT]] : tensor<1x1x1x1x8x1xf32>)
				// CHECK-SAME: permutation = [0, 2, 4, 5, 1, 3]
				// CHECK: return %[[TRANSPOSED]] : tensor<1x1x1x1x8x1xf32>
				%pack = tensor.pack %arg0
				padding_value(%zero : f32)
				inner_dims_pos = [0, 1]
				inner_tiles = [8, 1] into %arg1 : tensor<3x1x1x1xf32> -> tensor<1x1x1x1x8x1xf32>

				return %pack : tensor<1x1x1x1x8x1xf32>
				}


				transform.sequence failures(propagate) {
				^bb1(%module_op: !transform.any_op):
				%pack = transform.structured.match ops{["tensor.pack"]} in %module_op
				: (!transform.any_op) -> !transform.op<"tensor.pack">
				transform.structured.lower_pack %pack : (!transform.op<"tensor.pack">)
				-> (!transform.op<"tensor.pad">, !transform.op<"tensor.expand_shape">, !transform.op<"linalg.transpose">)
				}