This is an archive of the discontinued LLVM Phabricator instance.

[mlir][Linalg] Add canonicalization of linalg op -> dim op.
ClosedPublic

Authored by mravishankar on Dec 10 2020, 4:39 PM.

Details

Summary

Add a canonicalization that replaces a dim operation on the result of a
linalg operation on tensors with a dim operation on one of the operands of
that linalg op. This allows the linalg op itself to be deleted once all of
its non-dim uses are removed (say, through tiling, etc.).
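
For illustration, a minimal sketch of what such a pattern can look like. This is not the committed code: inferDimFromInputs is the interface method proposed in the review below, and accessor spellings such as memrefOrTensor() and getConstantIndex() are assumptions about the std-dialect dim op of the time.

  // Sketch only: replace dim(linalg_result, c) with the same dimension
  // computed from the linalg op's operands.
  struct ReplaceDimOfLinalgOpResult : public OpRewritePattern<DimOp> {
    using OpRewritePattern<DimOp>::OpRewritePattern;

    LogicalResult matchAndRewrite(DimOp dimOp,
                                  PatternRewriter &rewriter) const override {
      Value src = dimOp.memrefOrTensor();
      auto linalgOp = src.getDefiningOp<linalg::LinalgOp>();
      Optional<int64_t> dimIndex = dimOp.getConstantIndex();
      if (!linalgOp || !dimIndex)
        return failure();
      unsigned resultIdx = src.cast<OpResult>().getResultNumber();
      // Express the queried result dimension via the operands; bail out
      // (no rewrite) when it cannot be inferred.
      Optional<Value> replacement = inferDimFromInputs(
          linalgOp, rewriter, dimOp.getLoc(), resultIdx, *dimIndex);
      if (!replacement)
        return failure();
      rewriter.replaceOp(dimOp, *replacement);
      return success();
    }
  };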

Diff Detail

Event Timeline

mravishankar created this revision. Dec 10 2020, 4:39 PM
mravishankar requested review of this revision. Dec 10 2020, 4:39 PM
nicolasvasilache requested changes to this revision. Dec 11 2020, 2:58 AM
nicolasvasilache added a subscriber: pifon2a.
mlir/lib/Dialect/Linalg/IR/LinalgOps.cpp
2117

prevent

2131

A recent revision introduced OpInterface support for getLoopsToShapesMap and getShapesToLoopsMap and dropped special-case logic.

Let's please use those instead of reintroducing special-case logic, this will be more future-proof.

This should probably take the form of a new interface method Value inferDimFromInputs(unsigned resultIdx, unsigned dim) which (sketched in C++ after the worked example below):

  1. computes the index of result(resultIdx)[dim] in the flattened list of shapes (i.e. the sum of the ranks of all input operands, plus the ranks of all results < resultIdx, plus dim). Let's call this "IDX".
  2. extracts the submap consisting of the single result IDX from getLoopsToShapesMap.
  3. composes 2. with getShapesToLoopsMap; that is the expression of the output dim you want in terms of the input dims.
  4. calls applyMapToValues with 3. and the flattened list of dims.

e.g. assume some hypothetical op that resembles matmul with a twist: O(i + j, j) += A(i, k) * B(k, j):

  • getLoopsToShapesMap is (i, j, k) -> (i, k, k, j, i + j, j)
  • getShapesToLoopsMap is (d0, d1, d2, d3, d4, d5) -> (d0, d3, d1)

Assume you wanted the expression of dim res, 0 (i.e. i + j, a.k.a dim A, 0 + dim B, 1).

Step 1. IDX = 4
Step 2. extract result IDX from getLoopsToShapesMap, i.e. (i, j, k) -> (i + j)
Step 3. compute ([(i, j, k) -> (i + j)]).compose([(d0, d1, d2, d3, d4, d5) -> (d0, d3, d1)]), which returns [(d0, d1, d2, d3, d4, d5) -> (d0 + d3)] (d0 is dim A, 0 and d3 is dim B, 1)
Step 4. call applyMapToValues(b, loc, [(d0, d1, d2, d3, d4, d5) -> (d0 + d3)], op.createFlatListOfOperandDims())

In step 4. you will probably need to adjust to only take the input operands.
By default we also capture the outputs because of output buffers.
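
A hedged C++ sketch of these four steps. getLoopsToShapesMap, getShapesToLoopsMap, createFlatListOfOperandDims and applyMapToValues are the entities named in this review; the Optional return, the builder/location parameters, and the exact accessor spellings are assumptions rather than the committed signature.

  static Optional<Value> inferDimFromInputs(linalg::LinalgOp op, OpBuilder &b,
                                            Location loc, unsigned resultIdx,
                                            unsigned dim) {
    // Step 1: IDX = position of result(resultIdx)[dim] in the flattened
    // list of shape dimensions: all input ranks, plus the ranks of results
    // preceding resultIdx, plus dim.
    unsigned idx = dim;
    for (Value input : op.getInputs())
      idx += input.getType().cast<ShapedType>().getRank();
    for (unsigned i = 0; i < resultIdx; ++i)
      idx += op.getOperation()->getResult(i).getType()
                 .cast<ShapedType>().getRank();

    // Guard for the corner case raised below: if the shapes-to-loops map
    // does not exist (loop bounds depend on the result's own shape), fail
    // instead of sending the rewriter into a loop.
    AffineMap shapesToLoops = op.getShapesToLoopsMap();
    if (!shapesToLoops)
      return llvm::None;

    // Step 2: extract the single-result submap at position IDX.
    AffineMap resultShapeMap = op.getLoopsToShapesMap().getSubMap({idx});

    // Step 3: compose, yielding the result dim as a function of operand dims.
    AffineMap operandDimsToResultDim = resultShapeMap.compose(shapesToLoops);

    // Step 4: materialize the affine expression on the actual dim values.
    return applyMapToValues(b, loc, operandDimsToResultDim,
                            op.createFlatListOfOperandDims(b, loc))[0];
  }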

Does this make sense?

This revision now requires changes to proceed. Dec 11 2020, 2:58 AM
hanchung added inline comments. Dec 11 2020, 7:50 AM
mlir/lib/Dialect/Linalg/IR/LinalgOps.cpp
2165–2166
mravishankar added inline comments. Dec 11 2020, 12:17 PM
mlir/lib/Dialect/Linalg/IR/LinalgOps.cpp
2131

I think it makes sense. But there is a corner case here that might make the pattern rewriter go into a loop, and it doesn't happen today. Take an op where the loop shape actually depends on the shape of the output:

%cst = constant 0.0 : f32
%1 = linalg.generic {indexing_maps = [affine_map<(d0, d1) -> (d0, d1)>],
                     iterator_types = ["parallel", "parallel"]}
       ins() {
       ^bb0():
         linalg.yield %cst : f32
       } -> tensor<?x?xf32>

Today, the loop computation fails to get the right loop shape for such ops: the method createLoopRanges, I think, will throw an error because createFlatListOfOperandDims does not append the shapes of the results, which makes applyMapToValues(b, loc, getShapesToLoopsMap(), createFlatListOfOperandDims()) fail due to a mismatch between the number of values passed and the number of dims of the map. (The next CL in the stack fixes that issue.)
So here we need to guard against that. I like the approach you described above, but this canonicalization should fail in such cases, otherwise it will put the rewriter in a loop. (It doesn't happen today because of what I described in the previous paragraph.)
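
A sketch of that guard as a fragment from inside the pattern's matchAndRewrite, assuming (as in the sketch above) that getShapesToLoopsMap returns a null AffineMap when the shapes-to-loops inversion fails:

  // Refuse to canonicalize ops whose loop bounds can only be recovered from
  // their results; rewriting those would let the pattern fire forever. The
  // arity check mirrors the mismatch described above: the map expects one
  // value per shape dimension, but the flat dim list only covers operands.
  AffineMap shapesToLoops = linalgOp.getShapesToLoopsMap();
  if (!shapesToLoops ||
      shapesToLoops.getNumDims() !=
          linalgOp.createFlatListOfOperandDims(rewriter, linalgOp.getLoc())
              .size())
    return failure();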

mravishankar marked 3 inline comments as done.

Address comments.

hanchung accepted this revision. Dec 12 2020, 12:23 AM
hanchung added inline comments.
mlir/lib/Dialect/Linalg/IR/LinalgOps.cpp
91

IIRC, Value can be nullptr, so we don't need optional here?

116–120

Let's initialize resultDimSubMapPos with dim, so we don't need the last statement ...+=dim?
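
Illustratively, the two variants being discussed (resultDimSubMapPos is a variable in the patch under review; this reconstruction of the surrounding code is an assumption):

  // As written in the patch (reconstructed): accumulate operand ranks
  // first, then add the queried dimension at the end.
  unsigned resultDimSubMapPos = 0;
  for (Value input : linalgOp.getInputs())
    resultDimSubMapPos += input.getType().cast<ShapedType>().getRank();
  resultDimSubMapPos += dim;

  // Suggested: seed with dim so the trailing statement disappears.
  unsigned seeded = dim;
  for (Value input : linalgOp.getInputs())
    seeded += input.getType().cast<ShapedType>().getRank();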

mravishankar marked an inline comment as done. Dec 13 2020, 9:31 AM
mravishankar added inline comments.
mlir/lib/Dialect/Linalg/IR/LinalgOps.cpp
91

That's true, but the signature with Optional makes it explicit that this can return llvm::None. It's easier to follow that. We can document that it returns nullptr on failure, but that might just be easier to miss. This makes it more explicit. WDYT?

116–120

I feel like that would make the logic more complicated. This is easier to follow IMO. Will leave it as is if that's OK.

hanchung accepted this revision. Dec 14 2020, 2:11 AM
hanchung added inline comments.
mlir/lib/Dialect/Linalg/IR/LinalgOps.cpp
91

Yes, you are right on that. It is indeed more explicit. Personally, I don't have a strong feeling on this because I know Value can be nullptr and it could end up with an assertion at some point. It already has Optional semantics to me.

Another point is that Optional introduces a bit more memory usage (i.e. a sizeof(bool), and padding may be added). If Value itself carries this information and people commonly use it, I'd prefer returning nullptr on failure.

However, I went through some usages, and found that some people use Optional<Value> and some use Value directly. There is no convention here. So I'll leave the decision to you.
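
Schematically, the two conventions being weighed (signatures illustrative, not from the patch):

  // Failure is explicit in the return type; callers have to unwrap it.
  Optional<Value> inferDimFromInputs(unsigned resultIdx, unsigned dim);

  // Failure is a null Value; no extra bool/padding, but the null case is
  // only visible in comments and at the eventual assertion.
  Value inferDimFromInputsOrNull(unsigned resultIdx, unsigned dim);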

116–120

Sure, both are okay to me. I just feel that the comment states what it's doing and it looks simpler to me. But both look good to me.

mravishankar marked an inline comment as done.

Adapting this to work with the current setup of linalg operations. The
specifics might change based on
https://llvm.discourse.group/t/linalg-and-shapes/2421.

Going through my unreviewed stack. Note that with the revamp of linalg on tensors, @pifon2a sent a diff today that implements the functionality with out tensors.

Ok, I'll leave it up to you whether this needs to be pushed in. I rebased it on top of the linalg on tensors changes. It still describes the shape in terms of "ins". That might still be worth it. PTAL and let me know.

ok, my apologies, this looks great, I'll do a proper review in a bit but consider it landed :)

Thanks!

mlir/lib/Dialect/Linalg/IR/LinalgOps.cpp
129

Please give this a good name and add to the LinalgStructuredOpInterface.

130

inferred

134

Just iterate over getInputShapes?
If it's not in the LinalgStructuredOpsInterface, just add it too, plz

This revision is now accepted and ready to land. Jan 14 2021, 11:33 AM
mravishankar marked 2 inline comments as done.

Address comments

mravishankar added inline comments. Jan 14 2021, 3:49 PM
mlir/lib/Dialect/Linalg/IR/LinalgOps.cpp
134

Not needed anymore after the interface method is added.