The original implementation does not take reassociation indices into account,
which leads to bugs.
Details
Diff Detail
- Repository
- rG LLVM Github Monorepo
Event Timeline
mlir/include/mlir/Dialect/Utils/ReshapeOpsUtils.h

- Lines 237–239: You need to bail on non-identity layout for MemRefType atm.
- Line 292: You need to bail on non-identity layout for MemRefType atm.

mlir/lib/Dialect/MemRef/IR/MemRefOps.cpp

- Lines 1962–1963: I don't think this can be correct in the absence of explicit layout map handling.
- Lines 2003–2004: I don't think this can be correct in the absence of explicit layout map handling.
mlir/include/mlir/Dialect/Utils/ReshapeOpsUtils.h, line 259:

The complexity of the double-loop logic + case disjunction looks unnecessary to me.

```cpp
DenseMap<unsigned, unsigned> map1;
unsigned index = 0, group = 0;
for (auto &reassoc : op1.getReassociationIndices()) {
  for (unsigned i = 0, e = reassoc.size(); i < e; ++i)
    map1.insert(std::pair<unsigned, unsigned>(index++, group));
  ++group;
}
// Same for map2; this could become a separate reshape util by itself.
```

Then you can simply:

```cpp
SmallVector<ReassociationIndices> composedReassociation(targetRank);
for (unsigned i = 0, e = sourceRank; i < e; ++i)
  composedReassociation[map2[map1[i]]].push_back(i);
```

This should work for all 4 cases (Collapse+Collapse, Collapse+Expand, Expand+Collapse, Expand+Expand).

```cpp
if (rankExpanding)
  rewriter.replaceOpWithNewOp<ExpandOpTy>(
      secondOp, resultType, firstOp.src(), composedReassociation);
else
  rewriter.replaceOpWithNewOp<CollapseOpTy>(
      secondOp, resultType, firstOp.src(), composedReassociation);
```
mlir/test/Dialect/MemRef/canonicalize.mlir, lines 388–389:

Please add a test case with memref + layout and make sure it does not canonicalize.
Rewrite of the expand(collapse
mlir/include/mlir/Dialect/Utils/ReshapeOpsUtils.h, line 259:

I am not sure how this approach would work for the cases when the composition is impossible, something like 2x5xf32 -> [0, 1] collapse to 10xf32 -> [0, 1] expand to 5x2xf32. Or ?x?xf32 -> [0], [1, 2] expand to ?x?x2xf32 -> [0, 1], [2] collapse to ?x2xf32.
mlir/include/mlir/Dialect/Utils/ReshapeOpsUtils.h, line 259:

You could factor out the relevant parts of the verifier to ensure the resulting Expand/Collapse is valid, and bail on invalid rewrites.
mlir/include/mlir/Dialect/Utils/ReshapeOpsUtils.h, line 259:

Please disregard my suggestion; the intuition was wrong and too simplistic, my apologies for the noise. Still, if there are ways to reuse parts of the verifier (and rewrite where necessary if the AffineMap handling is too annoying), please consider that rather than introducing new non-trivial code. Thanks!
mlir/include/mlir/Dialect/Utils/ReshapeOpsUtils.h, line 259:

I reused parts of getReassociationIndicesForReshape.
@nicolasvasilache I pushed the commit to fix the bugs. If you have further suggestions/comments, I'll be happy to address them.
I think there are still bugs in the commit: the verifier fails on the following input. To repro:
```
$ mlir-opt -canonicalize a.mlir
```

where a.mlir is:

```mlir
func @foo(%0: tensor<1x1xf32>, %1: tensor<1x1xf32>, %2: tensor<1x1xf32>) -> tensor<1x1xf32> {
  %cst = arith.constant 0.000000e+00 : f32
  %3 = linalg.init_tensor [8, 1] : tensor<8x1xf32>
  %4 = linalg.fill ins(%cst : f32) outs(%3 : tensor<8x1xf32>) -> tensor<8x1xf32>
  %5 = tensor.collapse_shape %0 [] : tensor<1x1xf32> into tensor<f32>
  %6 = tensor.insert_slice %5 into %4[0, 0] [1, 1] [1, 1] : tensor<f32> into tensor<8x1xf32>
  %7 = linalg.init_tensor [8, 1] : tensor<8x1xf32>
  %8 = linalg.fill ins(%cst : f32) outs(%7 : tensor<8x1xf32>) -> tensor<8x1xf32>
  %9 = tensor.collapse_shape %2 [] : tensor<1x1xf32> into tensor<f32>
  %10 = tensor.insert_slice %9 into %8[0, 0] [1, 1] [1, 1] : tensor<f32> into tensor<8x1xf32>
  %11 = tensor.collapse_shape %6 [[0, 1]] : tensor<8x1xf32> into tensor<8xf32>
  %12 = linalg.init_tensor [8] : tensor<8xf32>
  %13 = linalg.generic {indexing_maps = [affine_map<(d0) -> (d0)>, affine_map<(d0) -> (d0)>], iterator_types = ["parallel"]} ins(%11 : tensor<8xf32>) outs(%12 : tensor<8xf32>) {
  ^bb0(%arg3: f32, %arg4: f32):
    linalg.yield %arg3 : f32
  } -> tensor<8xf32>
  %14 = tensor.expand_shape %13 [[0, 1, 2, 3]] : tensor<8xf32> into tensor<1x1x8x1xf32>
  %15 = tensor.collapse_shape %1 [] : tensor<1x1xf32> into tensor<f32>
  %16 = linalg.init_tensor [] : tensor<f32>
  %17 = linalg.generic {indexing_maps = [affine_map<() -> ()>, affine_map<() -> ()>], iterator_types = []} ins(%15 : tensor<f32>) outs(%16 : tensor<f32>) {
  ^bb0(%arg3: f32, %arg4: f32):
    linalg.yield %arg3 : f32
  } -> tensor<f32>
  %18 = tensor.expand_shape %17 [] : tensor<f32> into tensor<1x1x1x1xf32>
  %19 = tensor.collapse_shape %10 [[0, 1]] : tensor<8x1xf32> into tensor<8xf32>
  %20 = linalg.init_tensor [8] : tensor<8xf32>
  %21 = linalg.generic {indexing_maps = [affine_map<(d0) -> (d0)>, affine_map<(d0) -> (d0)>], iterator_types = ["parallel"]} ins(%19 : tensor<8xf32>) outs(%20 : tensor<8xf32>) {
  ^bb0(%arg3: f32, %arg4: f32):
    linalg.yield %arg3 : f32
  } -> tensor<8xf32>
  %22 = tensor.expand_shape %21 [[0, 1, 2, 3]] : tensor<8xf32> into tensor<1x1x8x1xf32>
  %23 = linalg.mmt4d {comment = "f32*f32->f32, aarch64, matrix*vector"} ins(%14, %18 : tensor<1x1x8x1xf32>, tensor<1x1x1x1xf32>) outs(%22 : tensor<1x1x8x1xf32>) -> tensor<1x1x8x1xf32>
  %24 = tensor.collapse_shape %23 [[0, 1, 2, 3]] : tensor<1x1x8x1xf32> into tensor<8xf32>
  %25 = linalg.init_tensor [8] : tensor<8xf32>
  %26 = linalg.generic {indexing_maps = [affine_map<(d0) -> (d0)>, affine_map<(d0) -> (d0)>], iterator_types = ["parallel"]} ins(%24 : tensor<8xf32>) outs(%25 : tensor<8xf32>) {
  ^bb0(%arg3: f32, %arg4: f32):
    linalg.yield %arg3 : f32
  } -> tensor<8xf32>
  %27 = tensor.expand_shape %26 [[0, 1]] : tensor<8xf32> into tensor<8x1xf32>
  %28 = tensor.extract_slice %27[0, 0] [1, 1] [1, 1] : tensor<8x1xf32> to tensor<f32>
  %29 = tensor.expand_shape %28 [] : tensor<f32> into tensor<1x1xf32>
  return %29 : tensor<1x1xf32>
}
```
results in
```
a.mlir:24:9: error: 'tensor.expand_shape' op expected rank of the collapsed type(2) to be the number of reassociation maps(0)
  %18 = tensor.expand_shape %17 [] : tensor<f32> into tensor<1x1x1x1xf32>
        ^
a.mlir:24:9: note: see current operation: %10 = "tensor.expand_shape"(%arg1) {reassociation = []} : (tensor<1x1xf32>) -> tensor<1x1x1x1xf32>
```
You need to bail on non-identity layout for MemRefType atm.
You can use a simple templated hasNonIdentityLayout helper specialization to bail out early.