Diff 419503

mlir/include/mlir/Dialect/Linalg/Transforms/Transforms.h

	Show First 20 Lines • Show All 113 Lines • ▼ Show 20 Lines

	/// Patterns to fold unit-extent dimensions in operands/results of linalg ops on			/// Patterns to fold unit-extent dimensions in operands/results of linalg ops on
	/// tensors.			/// tensors.
	void populateFoldUnitExtentDimsPatterns(RewritePatternSet &patterns);			void populateFoldUnitExtentDimsPatterns(RewritePatternSet &patterns);

	/// Patterns that are used to inline constant operands into linalg generic ops.			/// Patterns that are used to inline constant operands into linalg generic ops.
	void populateInlineConstantOperandsPatterns(RewritePatternSet &patterns);			void populateInlineConstantOperandsPatterns(RewritePatternSet &patterns);

				/// Patterns that are used to bubble up extract slice op above linalg op.
				gysitUnsubmitted Done Reply Inline Actions nit: typo gysit: nit: typo
				void populateBubbleUpExtractSliceOpPatterns(RewritePatternSet &patterns);

	/// Options that control fusion of elementwise operations.			/// Options that control fusion of elementwise operations.
	struct LinalgElementwiseFusionOptions {			struct LinalgElementwiseFusionOptions {
	/// Enable fusion of reshapes into the shape with elementwise operations. By			/// Enable fusion of reshapes into the shape with elementwise operations. By
	/// default it is disabled for unit dimensions reshape.			/// default it is disabled for unit dimensions reshape.
	ControlElementwiseOpsFusionFn controlFoldingReshapesFn = skipUnitDimReshape;			ControlElementwiseOpsFusionFn controlFoldingReshapesFn = skipUnitDimReshape;

	LinalgElementwiseFusionOptions &			LinalgElementwiseFusionOptions &
	setControlFoldingReshapes(ControlElementwiseOpsFusionFn fun) {			setControlFoldingReshapes(ControlElementwiseOpsFusionFn fun) {
	▲ Show 20 Lines • Show All 1,352 Lines • Show Last 20 Lines

mlir/include/mlir/Dialect/Linalg/Utils/Utils.h

	Show First 20 Lines • Show All 160 Lines • ▼ Show 20 Lines
	/// corresponding result size is the corresponding value from `sizeBounds`.			/// corresponding result size is the corresponding value from `sizeBounds`.
	/// Note: The returned tile sizes are closed intervals.			/// Note: The returned tile sizes are closed intervals.
	SmallVector<Value> computeTileSizes(OpBuilder &b, Location loc, ValueRange ivs,			SmallVector<Value> computeTileSizes(OpBuilder &b, Location loc, ValueRange ivs,
	ValueRange tileSizes,			ValueRange tileSizes,
	ArrayRef<Value> sizeBounds);			ArrayRef<Value> sizeBounds);

	/// Creates an extract_slice/subview op for a single `valueToTile` with			/// Creates an extract_slice/subview op for a single `valueToTile` with
	/// `builder`. This new operation extracts a tile of `valueToTile`, starting			/// `builder`. This new operation extracts a tile of `valueToTile`, starting
	/// at offsets `lbs` and with sizes `subShapeSizes`.			/// at offsets `lbs` and with sizes `subShapeSizes`. `omitPartialTileCheck`
				/// controls whether to omit the partial/boundary tile condition check in cases
				/// where we statically know that it is unnecessary.
	Value makeTiledShape(OpBuilder &builder, Location loc, Value valueToTile,			Value makeTiledShape(OpBuilder &builder, Location loc, Value valueToTile,
	ValueRange tileSizes, AffineMap map, ValueRange lbs,			ValueRange tileSizes, AffineMap map, ValueRange lbs,
	ValueRange ubs, ValueRange subShapeSizes);			ValueRange ubs, ValueRange subShapeSizes,
				bool omitPartialTileCheck);
				mravishankarUnsubmitted Done Reply Inline Actions Do you want this value to be default `true` ? mravishankar: Do you want this value to be default `true` ?
				okkwonAuthorUnsubmitted Done Reply Inline Actions Initially I set it to `true` by default. But I found there are only few cases I need to modify, so I just modified the places instead. okkwon: Initially I set it to `true` by default. But I found there are only few cases I need to modify…
				nicolasvasilacheUnsubmitted Done Reply Inline Actions Can we rename this `omitPartialTileCheck` and rewrite the comment using this terminology? Something like: "In cases where we statically know that the partial/boundary tile condition is unnecessary, we can omit the emission of " nicolasvasilache: Can we rename this `omitPartialTileCheck` and rewrite the comment using this terminology?

	/// Creates extract_slice/subview ops for all `valuesToTile` of the given			/// Creates extract_slice/subview ops for all `valuesToTile` of the given
	/// `linalgOp` with `builder`, assuming `linalgOp` is being fused into a loop			/// `linalgOp` with `builder`, assuming `linalgOp` is being fused into a loop
	/// nest for tiling with the given induction variables `ivs` and tile sizes			/// nest for tiling with the given induction variables `ivs` and tile sizes
	/// `tileSizes`. `sizeBounds` are the iteration space bounds for all the			/// `tileSizes`. `sizeBounds` are the iteration space bounds for all the
	/// implicit loops in `linalgOp`.			/// implicit loops in `linalgOp`. `omitPartialTileCheck` controls whether to
				/// omit the partial/boundary tile condition check in cases where we statically
				/// know that it is unnecessary.
	///			///
	/// Note that a constant zero in `tileSizes` means no tiling at that implicit			/// Note that a constant zero in `tileSizes` means no tiling at that implicit
	/// loop. The number of non-zero values in `tileSizes` should be equal to the			/// loop. The number of non-zero values in `tileSizes` should be equal to the
	/// number of values in `ivs`.			/// number of values in `ivs`.
	SmallVector<Value, 4> makeTiledShapes(OpBuilder &builder, Location loc,			SmallVector<Value, 4> makeTiledShapes(OpBuilder &builder, Location loc,
	LinalgOp linalgOp,			LinalgOp linalgOp,
	ArrayRef<Value> valuesToTile,			ArrayRef<Value> valuesToTile,
	ValueRange ivs, ValueRange tileSizes,			ValueRange ivs, ValueRange tileSizes,
	ArrayRef<Value> sizeBounds);			ArrayRef<Value> sizeBounds,
				bool omitPartialTileCheck);

	/// Add the tile loop induction variables `ivs` to the IndexOp results found in			/// Add the tile loop induction variables `ivs` to the IndexOp results found in
	/// the body of the `tiledOp` to account for the tile offset.			/// the body of the `tiledOp` to account for the tile offset.
	void addTileLoopIvsToIndexOpResults(OpBuilder &b, LinalgOp tiledOp,			void addTileLoopIvsToIndexOpResults(OpBuilder &b, LinalgOp tiledOp,
	ArrayRef<Value> ivs);			ArrayRef<Value> ivs);

	using FusableOpDependencesTy = llvm::MapVector<			using FusableOpDependencesTy = llvm::MapVector<
	Operation *,			Operation *,
	▲ Show 20 Lines • Show All 240 Lines • Show Last 20 Lines

mlir/include/mlir/IR/AffineMap.h

	Show First 20 Lines • Show All 474 Lines • ▼ Show 20 Lines
	/// affine_map<(d0, d1, d2) -> (d0, 0)>			/// affine_map<(d0, d1, d2) -> (d0, 0)>
	/// ```			/// ```
	///			///
	/// returns:			/// returns:
	///			///
	/// ```mlir			/// ```mlir
	/// affine_map<(d0, d1) -> (d0, 0, 0)>			/// affine_map<(d0, d1) -> (d0, 0, 0)>
	/// ```			/// ```
	AffineMap inverseAndBroadcastProjectedPermuation(AffineMap map);			AffineMap inverseAndBroadcastProjectedPermutation(AffineMap map);

	/// Concatenates a list of `maps` into a single AffineMap, stepping over			/// Concatenates a list of `maps` into a single AffineMap, stepping over
	/// potentially empty maps. Assumes each of the underlying map has 0 symbols.			/// potentially empty maps. Assumes each of the underlying map has 0 symbols.
	/// The resulting map has a number of dims equal to the max of `maps`' dims and			/// The resulting map has a number of dims equal to the max of `maps`' dims and
	/// the concatenated results as its results.			/// the concatenated results as its results.
	/// Returns an empty map if all input `maps` are empty.			/// Returns an empty map if all input `maps` are empty.
	///			///
	/// Example:			/// Example:
	▲ Show 20 Lines • Show All 105 Lines • Show Last 20 Lines

mlir/lib/Dialect/Linalg/Transforms/BubbleUpExtractSlice.cpp

This file was added.

				//===- BubbleUpExtractSlice.cpp - bubble up tensor.extract_slice ----------===//
				//
				// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
				// See https://llvm.org/LICENSE.txt for license information.
				// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
				//
				//===----------------------------------------------------------------------===//
				//
				// This file implements patterns that transform linalg.<op> +
				// tensor.extract_slice into tensor.extract_slice + linalg.<op> to reduce
				// the computation for the linalg op.
				//
				//===----------------------------------------------------------------------===//

				#include "PassDetail.h"
				#include "mlir/Dialect/Affine/IR/AffineOps.h"
				#include "mlir/Dialect/Arithmetic/Utils/Utils.h"
				#include "mlir/Dialect/Linalg/IR/Linalg.h"
				#include "mlir/Dialect/Linalg/Passes.h"
				#include "mlir/Dialect/Linalg/Transforms/Transforms.h"
				#include "mlir/Transforms/GreedyPatternRewriteDriver.h"

				using namespace mlir;
				using namespace mlir::linalg;

				namespace {
				/// Bubble up extract_slice above Linalg operation.
				///
				/// A sequence of operations
				mravishankarUnsubmitted Done Reply Inline Actions You could use this https://github.com/llvm/llvm-project/blob/6168b422258e41087a5393b7b77a7349a8922a68/mlir/include/mlir/Dialect/Arithmetic/Utils/Utils.h#L92 mravishankar: You could use this https://github.com/llvm/llvm-project/blob/6168b422258e41087a5393b7b77a7349a8…
				///
				/// ```mlir
				/// %0 = linalg.<op> ... arg0, arg1, ...
				/// %1 = tensor.extract_slice %0 ...
				/// ```
				///
				/// can be replaced with
				///
				/// ```mlir
				/// %0 = tensor.extract_slice %arg0
				/// %1 = tensor.extract_slice %arg1
				/// %2 = linalg.<op> ... %0, %1, ...
				/// ```
				///
				/// This reduces the amount of computation done by the linalg operation.
				///
				struct BubbleUpExtractSliceOpPattern
				: OpRewritePattern<tensor::ExtractSliceOp> {
				using OpRewritePattern<tensor::ExtractSliceOp>::OpRewritePattern;

				LogicalResult matchAndRewrite(tensor::ExtractSliceOp sliceOp,
				PatternRewriter &rewriter) const final {
				Value source = sliceOp.source();
				auto linalgOp = source.getDefiningOp<LinalgOp>();
				if (!linalgOp) {
				return rewriter.notifyMatchFailure(sliceOp,
				"expected source to be linalg op");
				}

				// TODO: we might relax this if we want heuristics to detect that all uses
				// are small portions of the output.
				nicolasvasilacheUnsubmitted Done Reply Inline Actions Add a TODO that we could relax this in the future if we want heuristics to detect that all uses are "small" portions of the output ? nicolasvasilache: Add a TODO that we could relax this in the future if we want heuristics to detect that all uses…
				if (!linalgOp->hasOneUse()) {
				return rewriter.notifyMatchFailure(sliceOp,
				"expected single use of linalg op");
				}

				if (linalgOp.getNumOutputs() != 1) {
				return rewriter.notifyMatchFailure(sliceOp,
				"expected single output of linalg op");
				}

				if (!linalgOp.hasTensorSemantics()) {
				return rewriter.notifyMatchFailure(sliceOp,
				"expected tensor of linalg op");
				}

				if (!sliceOp.hasUnitStride())
				return rewriter.notifyMatchFailure(sliceOp, "expected unit stride");

				OpOperand *outOperand = linalgOp.getOutputOperand(0);
				AffineMap indexingMap = linalgOp.getTiedIndexingMap(outOperand);
				if (!indexingMap.isProjectedPermutation()) {
				return rewriter.notifyMatchFailure(
				nicolasvasilacheUnsubmitted Done Reply Inline Actions typo: projected nicolasvasilache: typo: projected
				sliceOp, "expected a projected permutation for output");
				}

				auto linalgLoc = linalgOp.getLoc();
				auto allShapeSizes =
				linalgOp.createFlatListOfOperandDims(rewriter, linalgLoc);
				AffineMap shapeSizesToLoopsMap = linalgOp.getShapesToLoopsMap();
				if (!shapeSizesToLoopsMap) {
				return rewriter.notifyMatchFailure(
				linalgOp, "failed to get loops map from shape sizes");
				}
				auto sizeBounds = applyMapToValues(rewriter, linalgLoc,
				shapeSizesToLoopsMap, allShapeSizes);

				auto sliceLoc = sliceOp.getLoc();
				auto offsetVals = getValueOrCreateConstantIndexOp(
				rewriter, sliceLoc, sliceOp.getMixedOffsets());
				auto sizeVals = getValueOrCreateConstantIndexOp(rewriter, sliceLoc,
				sliceOp.getMixedSizes());

				// The offsets and sizes from the slice operation only give you the tile
				// size of the output. Use that to compute the tile sizes and offsets of the
				// loops. For loops not used to access the output, set the tile sizes to
				// loop bounds and set the offset to 0.
				Value zero = rewriter.create<arith::ConstantIndexOp>(linalgLoc, 0);
				SmallVector<Value, 4> tileOffsets(sizeBounds.size(), zero);
				SmallVector<Value, 4> tileSizes = sizeBounds;
				for (auto const &result : enumerate(indexingMap.getResults())) {
				unsigned position = result.value().cast<AffineDimExpr>().getPosition();
				tileOffsets[position] = offsetVals[result.index()];
				tileSizes[position] = sizeVals[result.index()];
				}

				SmallVector<Value> valuesToTile = linalgOp.getInputAndOutputOperands();

				SmallVector<Value, 4> tiledOperands = makeTiledShapes(
				rewriter, linalgLoc, linalgOp, valuesToTile, tileOffsets, tileSizes,
				sizeBounds, /*omitPartialTileCheck=*/true);

				SmallVector<Type, 4> resultTensorTypes;
				for (OpOperand *opOperand : linalgOp.getOutputTensorOperands())
				resultTensorTypes.push_back(
				tiledOperands[opOperand->getOperandNumber()].getType());

				Operation *newOp =
				linalgOp.clone(rewriter, linalgLoc, resultTensorTypes, tiledOperands);
				rewriter.replaceOp(sliceOp, newOp->getResults());
				return success();
				}
				};
				} // namespace

				/// Adds `BubbleUpExtractSliceOpPattern` to `patterns`, constructing it with
				/// the context that `patterns` itself reports.
				void mlir::linalg::populateBubbleUpExtractSliceOpPatterns(
				    RewritePatternSet &patterns) {
				  patterns.add<BubbleUpExtractSliceOpPattern>(patterns.getContext());
				}

mlir/lib/Dialect/Linalg/Transforms/CMakeLists.txt

	add_mlir_dialect_library(MLIRLinalgTransforms			add_mlir_dialect_library(MLIRLinalgTransforms
				BubbleUpExtractSlice.cpp
	BufferizableOpInterfaceImpl.cpp			BufferizableOpInterfaceImpl.cpp
	Bufferize.cpp			Bufferize.cpp
	CodegenStrategy.cpp			CodegenStrategy.cpp
	ComprehensiveBufferizePass.cpp			ComprehensiveBufferizePass.cpp
	Detensorize.cpp			Detensorize.cpp
	DropUnitDims.cpp			DropUnitDims.cpp
	ElementwiseOpFusion.cpp			ElementwiseOpFusion.cpp
	ElementwiseToLinalg.cpp			ElementwiseToLinalg.cpp
	▲ Show 20 Lines • Show All 58 Lines • Show Last 20 Lines

mlir/lib/Dialect/Linalg/Transforms/Fusion.cpp

Show First 20 Lines • Show All 136 Lines • ▼ Show 20 Lines	if (it != fusedLoopsAndRanges.end()) {
<< loopRanges.back() << "\n");		<< loopRanges.back() << "\n");
}		}
}		}

SmallVector<Value, 8> clonedShapes;		SmallVector<Value, 8> clonedShapes;
clonedShapes.reserve(producer.getNumInputsAndOutputs());		clonedShapes.reserve(producer.getNumInputsAndOutputs());

// Compute subranges for all tensor input/output operands.		// Compute subranges for all tensor input/output operands.
clonedShapes.append(makeTiledShapes(b, loc, producer,		clonedShapes.append(makeTiledShapes(
getTiledOperands(producer), ivs,		b, loc, producer, getTiledOperands(producer), ivs, tileSizes, sizeBounds,
tileSizes, sizeBounds));		/*omitPartialTileCheck=*/false));

// Iterate over the results in order.		// Iterate over the results in order.
// Extract the subtensor type from the linearized range.		// Extract the subtensor type from the linearized range.
// Since we do not enforce any canonicalizations on the fly, this is always		// Since we do not enforce any canonicalizations on the fly, this is always
// fully dynamic at construction time.		// fully dynamic at construction time.
SmallVector<Type, 4> resultTypes;		SmallVector<Type, 4> resultTypes;
resultTypes.reserve(producer->getNumResults());		resultTypes.reserve(producer->getNumResults());
for (RankedTensorType t : producer.getOutputTensorTypes()) {		for (RankedTensorType t : producer.getOutputTensorTypes()) {
▲ Show 20 Lines • Show All 743 Lines • Show Last 20 Lines

mlir/lib/Dialect/Linalg/Transforms/FusionOnTensors.cpp

Show First 20 Lines • Show All 157 Lines • ▼ Show 20 Lines	for (auto it : zip(tiledSliceDimIndices, tiledProducerLoopIndices)) {
int64_t tiledProducerLoop = std::get<1>(it);		int64_t tiledProducerLoop = std::get<1>(it);
tileIvs[tiledProducerLoop] = sliceOpRanges[tiledSliceDim].offset;		tileIvs[tiledProducerLoop] = sliceOpRanges[tiledSliceDim].offset;
tileSizes[tiledProducerLoop] = sliceOpRanges[tiledSliceDim].size;		tileSizes[tiledProducerLoop] = sliceOpRanges[tiledSliceDim].size;
allIvs[tiledProducerLoop] = tileIvs[tiledProducerLoop];		allIvs[tiledProducerLoop] = tileIvs[tiledProducerLoop];
}		}
erase_value(tileIvs, nullptr);		erase_value(tileIvs, nullptr);
SmallVector<Value> tiledOperands = producerOp.getInputAndOutputOperands();		SmallVector<Value> tiledOperands = producerOp.getInputAndOutputOperands();
tiledOperands = makeTiledShapes(b, loc, producerOp, tiledOperands, tileIvs,		tiledOperands = makeTiledShapes(b, loc, producerOp, tiledOperands, tileIvs,
tileSizes, producerLoopBounds);		tileSizes, producerLoopBounds,
		/*omitPartialTileCheck=*/false);

// Output fusion has to update the iteration arguments of the tile loop nest.		// Output fusion has to update the iteration arguments of the tile loop nest.
// In particular, the iteration argument of the outermost tile loop needs to		// In particular, the iteration argument of the outermost tile loop needs to
// be set to the producer output instead of the producer result and `clonedOp`		// be set to the producer output instead of the producer result and `clonedOp`
// shall use the existing `sliceOp` result instead of the tiled producer		// shall use the existing `sliceOp` result instead of the tiled producer
// output operand.		// output operand.
if (iterArg) {		if (iterArg) {
OpOperand *outputOperand =		OpOperand *outputOperand =
▲ Show 20 Lines • Show All 305 Lines • Show Last 20 Lines

mlir/lib/Dialect/Linalg/Transforms/Tiling.cpp

Show First 20 Lines • Show All 172 Lines • ▼ Show 20 Lines	auto tiledLoopBodyBuilder =
// Tile the `operandValuesToUse` that either match the `op` operands		// Tile the `operandValuesToUse` that either match the `op` operands
// themselves or the tile loop arguments forwarding them.		// themselves or the tile loop arguments forwarding them.
assert(operandValuesToUse.size() ==		assert(operandValuesToUse.size() ==
static_cast<size_t>(op.getNumInputsAndOutputs()) &&		static_cast<size_t>(op.getNumInputsAndOutputs()) &&
"expect the number of operands and inputs and outputs to match");		"expect the number of operands and inputs and outputs to match");
SmallVector<Value> valuesToTile = operandValuesToUse;		SmallVector<Value> valuesToTile = operandValuesToUse;
auto sizeBounds =		auto sizeBounds =
applyMapToValues(b, loc, shapeSizesToLoopsMap, allShapeSizes);		applyMapToValues(b, loc, shapeSizesToLoopsMap, allShapeSizes);
SmallVector<Value, 4> tiledOperands = makeTiledShapes(		SmallVector<Value, 4> tiledOperands =
b, loc, op, valuesToTile, interchangedIvs, tileSizes, sizeBounds);		makeTiledShapes(b, loc, op, valuesToTile, interchangedIvs, tileSizes,
		sizeBounds, /*omitPartialTileCheck=*/false);

// TODO: use an interface/adaptor to avoid leaking position in		// TODO: use an interface/adaptor to avoid leaking position in
// `tiledOperands`.		// `tiledOperands`.
SmallVector<Type, 4> resultTensorTypes;		SmallVector<Type, 4> resultTensorTypes;
for (OpOperand *opOperand : op.getOutputTensorOperands())		for (OpOperand *opOperand : op.getOutputTensorOperands())
resultTensorTypes.push_back(		resultTensorTypes.push_back(
tiledOperands[opOperand->getOperandNumber()].getType());		tiledOperands[opOperand->getOperandNumber()].getType());

▲ Show 20 Lines • Show All 129 Lines • ▼ Show 20 Lines	loopNest = mlir::scf::buildLoopNest(
SmallVector<Value> offsets =		SmallVector<Value> offsets =
computeTileOffsets(b, loc, localIvs, tileSizes);		computeTileOffsets(b, loc, localIvs, tileSizes);
SmallVector<Value> sizes =		SmallVector<Value> sizes =
computeTileSizes(b, loc, localIvs, tileSizes, allDims);		computeTileSizes(b, loc, localIvs, tileSizes, allDims);
// Create ExtractSliceOp: Extract a tile from the tensor::PadOp.		// Create ExtractSliceOp: Extract a tile from the tensor::PadOp.
// Note: The tensor::PadOp is located outside of the loop nest. It is		// Note: The tensor::PadOp is located outside of the loop nest. It is
// later moved inside by ExtractSliceOfPadTensorSwapPattern.		// later moved inside by ExtractSliceOfPadTensorSwapPattern.
auto map = AffineMap::getMultiDimIdentityMap(rank, b.getContext());		auto map = AffineMap::getMultiDimIdentityMap(rank, b.getContext());
Value tiledOutput =		Value tiledOutput = makeTiledShape(
makeTiledShape(b, loc, newPadOp->getResult(0), tileSizes, map,		b, loc, newPadOp->getResult(0), tileSizes, map, offsets, allDims,
offsets, allDims, sizes);		sizes, /*omitPartialTileCheck=*/false);
auto sliceOp = tiledOutput.getDefiningOp<tensor::ExtractSliceOp>();		auto sliceOp = tiledOutput.getDefiningOp<tensor::ExtractSliceOp>();
assert(sliceOp && "expected ExtractSliceOp");		assert(sliceOp && "expected ExtractSliceOp");
// Insert the tile into the output tensor.		// Insert the tile into the output tensor.
// TODO: Propagate RewriterBase everywhere.		// TODO: Propagate RewriterBase everywhere.
IRRewriter rewriter(b);		IRRewriter rewriter(b);
Value yieldValue =		Value yieldValue =
insertSliceIntoTensor(rewriter, loc, sliceOp, sliceOp, iterArgs[0]);		insertSliceIntoTensor(rewriter, loc, sliceOp, sliceOp, iterArgs[0]);
return scf::ValueVector({yieldValue});		return scf::ValueVector({yieldValue});
▲ Show 20 Lines • Show All 159 Lines • Show Last 20 Lines

mlir/lib/Dialect/Linalg/Transforms/Vectorization.cpp

Show First 20 Lines • Show All 498 Lines • ▼ Show 20 Lines	for (OpOperand *opOperand : linalgOp.getInputAndOutputOperands()) {
}		}
VectorType readType;		VectorType readType;
AffineMap map;		AffineMap map;
// TODO: can we keep this simplification?		// TODO: can we keep this simplification?
// if (linalgOp.getShape(opOperand).empty()) {		// if (linalgOp.getShape(opOperand).empty()) {
// readType = VectorType::get({}, bbarg.getType());		// readType = VectorType::get({}, bbarg.getType());
// } else {		// } else {
if (opOperand->getOperandNumber() < linalgOp.getNumInputs()) {		if (opOperand->getOperandNumber() < linalgOp.getNumInputs()) {
map = inverseAndBroadcastProjectedPermuation(		map = inverseAndBroadcastProjectedPermutation(
linalgOp.getTiedIndexingMap(opOperand));		linalgOp.getTiedIndexingMap(opOperand));
readType = VectorType::get(commonVectorShape,		readType = VectorType::get(commonVectorShape,
getElementTypeOrSelf(opOperand->get()));		getElementTypeOrSelf(opOperand->get()));
} else {		} else {
map = inversePermutation(		map = inversePermutation(
reindexIndexingMap(linalgOp.getTiedIndexingMap(opOperand)));		reindexIndexingMap(linalgOp.getTiedIndexingMap(opOperand)));
readType = VectorType::get(map.compose(linalgOp.getShape(opOperand)),		readType = VectorType::get(map.compose(linalgOp.getShape(opOperand)),
getElementTypeOrSelf(opOperand->get()));		getElementTypeOrSelf(opOperand->get()));
▲ Show 20 Lines • Show All 1,192 Lines • Show Last 20 Lines

mlir/lib/Dialect/Linalg/Utils/Utils.cpp

Show First 20 Lines • Show All 739 Lines • ▼ Show 20 Lines	static Value fullyComposeAndAffineApply(OpBuilder &b, Location loc,
SmallVector<Value> normalizedOperands(operands.begin(), operands.end());		SmallVector<Value> normalizedOperands(operands.begin(), operands.end());
mlir::fullyComposeAffineMapAndOperands(&map, &normalizedOperands);		mlir::fullyComposeAffineMapAndOperands(&map, &normalizedOperands);
canonicalizeMapAndOperands(&map, &normalizedOperands);		canonicalizeMapAndOperands(&map, &normalizedOperands);
return b.createOrFold<AffineApplyOp>(loc, map, normalizedOperands);		return b.createOrFold<AffineApplyOp>(loc, map, normalizedOperands);
}		}

Value makeTiledShape(OpBuilder &builder, Location loc, Value valueToTile,		Value makeTiledShape(OpBuilder &builder, Location loc, Value valueToTile,
ValueRange tileSizes, AffineMap map, ValueRange lbs,		ValueRange tileSizes, AffineMap map, ValueRange lbs,
ValueRange ubs, ValueRange subShapeSizes) {		ValueRange ubs, ValueRange subShapeSizes,
		bool omitPartialTileCheck) {
auto shapedType = valueToTile.getType().dyn_cast<ShapedType>();		auto shapedType = valueToTile.getType().dyn_cast<ShapedType>();
assert(shapedType && "only shaped types can be tiled");		assert(shapedType && "only shaped types can be tiled");
ArrayRef<int64_t> shape = shapedType.getShape();		ArrayRef<int64_t> shape = shapedType.getShape();
int64_t rank = shapedType.getRank();		int64_t rank = shapedType.getRank();

// Construct a new subview / extract_slice for the tile.		// Construct a new subview / extract_slice for the tile.
SmallVector<OpFoldResult, 4> offsets, sizes, strides;		SmallVector<OpFoldResult, 4> offsets, sizes, strides;
offsets.reserve(rank);		offsets.reserve(rank);
Show All 11 Lines	for (unsigned r = 0; r < rank; ++r) {
}		}
LLVM_DEBUG(llvm::dbgs() << ": tiled: figure out subsize...\n");		LLVM_DEBUG(llvm::dbgs() << ": tiled: figure out subsize...\n");

// Tiling creates a new slice at the proper index, the slice step is 1		// Tiling creates a new slice at the proper index, the slice step is 1
// (i.e. the op does not subsample, stepping occurs in the loop).		// (i.e. the op does not subsample, stepping occurs in the loop).
auto m = map.getSubMap({r});		auto m = map.getSubMap({r});
LLVM_DEBUG(llvm::dbgs() << "makeTiledShape: submap: " << m << "\n");		LLVM_DEBUG(llvm::dbgs() << "makeTiledShape: submap: " << m << "\n");
auto offset = applyMapToValues(builder, loc, m, lbs).front();		auto offset = applyMapToValues(builder, loc, m, lbs).front();
offsets.push_back(offset);		offsets.push_back(getAsOpFoldResult(offset));
auto closedIntSize =		auto closedIntSize =
applyMapToValues(builder, loc, m, subShapeSizes).front();		applyMapToValues(builder, loc, m, subShapeSizes).front();
// Resulting size needs to be made half open interval again.		// Resulting size needs to be made half open interval again.
AffineExpr s0 = getAffineSymbolExpr(0, builder.getContext());		AffineExpr s0 = getAffineSymbolExpr(0, builder.getContext());
Value size =		Value size =
fullyComposeAndAffineApply(builder, loc, s0 + 1, closedIntSize);		fullyComposeAndAffineApply(builder, loc, s0 + 1, closedIntSize);
LLVM_DEBUG(llvm::dbgs() << "makeTiledShape: raw size: " << size << "\n");		LLVM_DEBUG(llvm::dbgs() << "makeTiledShape: raw size: " << size << "\n");
		LLVM_DEBUG(llvm::dbgs()
		<< "makeTiledShape: new offset: " << offset << "\n");
		strides.push_back(builder.getIndexAttr(1));

		if (omitPartialTileCheck) {
		// We statically know that the partial/boundary tile condition is
		// unnecessary.
		LLVM_DEBUG(llvm::dbgs() << "makeTiledShape: new size: " << size << "\n");
		sizes.push_back(getAsOpFoldResult(size));
		continue;
		}

// The size of the subview / extract_slice should be trimmed to avoid		// The size of the subview / extract_slice should be trimmed to avoid
// out-of-bounds accesses, unless:		// out-of-bounds accesses, unless:
// a. We statically know the subshape size divides the shape size evenly.		// a. We statically know the subshape size divides the shape size evenly.
// b. The subshape size is 1. According to the way the loops are set up,		// b. The subshape size is 1. According to the way the loops are set up,
// tensors with "0" dimensions would never be constructed.		// tensors with "0" dimensions would never be constructed.
int64_t shapeSize = shape[r];		int64_t shapeSize = shape[r];
auto sizeCst = size.getDefiningOp<arith::ConstantIndexOp>();		auto sizeCst = size.getDefiningOp<arith::ConstantIndexOp>();
Show All 30 Lines	if (!hasTileSizeOne && !dividesEvenly) {
// Compute min(dim - offset, size) to avoid out-of-bounds accesses.		// Compute min(dim - offset, size) to avoid out-of-bounds accesses.
AffineMap minMap = AffineMap::inferFromExprList(		AffineMap minMap = AffineMap::inferFromExprList(
{ArrayRef<AffineExpr>{dim1 - dim2, dim0}})		{ArrayRef<AffineExpr>{dim1 - dim2, dim0}})
.front();		.front();
SmallVector<Value, 4> operands{size, d, offset};		SmallVector<Value, 4> operands{size, d, offset};
fullyComposeAffineMapAndOperands(&minMap, &operands);		fullyComposeAffineMapAndOperands(&minMap, &operands);
canonicalizeMapAndOperands(&minMap, &operands);		canonicalizeMapAndOperands(&minMap, &operands);
size = builder.create<AffineMinOp>(loc, builder.getIndexType(), minMap,		size = builder.create<AffineMinOp>(loc, builder.getIndexType(), minMap,
operands);		operands);
		nicolasvasilacheUnsubmitted Done Reply Inline Actions Can we invert the logic and create an early exit + comments in the simpler case? nicolasvasilache: Can we invert the logic and create an early exit + comments in the simpler case?
}		}

sizes.push_back(size);
LLVM_DEBUG(llvm::dbgs()
<< "makeTiledShape: new offset: " << offset << "\n");
LLVM_DEBUG(llvm::dbgs() << "makeTiledShape: new size: " << size << "\n");		LLVM_DEBUG(llvm::dbgs() << "makeTiledShape: new size: " << size << "\n");
strides.push_back(builder.getIndexAttr(1));		sizes.push_back(getAsOpFoldResult(size));
}		}

auto sliceOp = TypeSwitch<ShapedType, Operation *>(shapedType)		auto sliceOp = TypeSwitch<ShapedType, Operation *>(shapedType)
.Case([&](MemRefType) {		.Case([&](MemRefType) {
return builder.create<memref::SubViewOp>(		return builder.create<memref::SubViewOp>(
loc, valueToTile, offsets, sizes, strides);		loc, valueToTile, offsets, sizes, strides);
})		})
.Case([&](RankedTensorType) {		.Case([&](RankedTensorType) {
Show All 35 Lines	SmallVector<Value> computeTileSizes(OpBuilder &b, Location loc, ValueRange ivs,
}		}
return sizes;		return sizes;
}		}

SmallVector<Value, 4> makeTiledShapes(OpBuilder &b, Location loc,		SmallVector<Value, 4> makeTiledShapes(OpBuilder &b, Location loc,
LinalgOp linalgOp,		LinalgOp linalgOp,
ArrayRef<Value> valuesToTile,		ArrayRef<Value> valuesToTile,
ValueRange ivs, ValueRange tileSizes,		ValueRange ivs, ValueRange tileSizes,
ArrayRef<Value> sizeBounds) {		ArrayRef<Value> sizeBounds,
		bool omitPartialTileCheck) {
assert(ivs.size() == static_cast<size_t>(llvm::count_if(		assert(ivs.size() == static_cast<size_t>(llvm::count_if(
llvm::make_range(tileSizes.begin(), tileSizes.end()),		llvm::make_range(tileSizes.begin(), tileSizes.end()),
[](Value v) { return !isZero(v); })) &&		[](Value v) { return !isZero(v); })) &&
"expected as many ivs as non-zero sizes");		"expected as many ivs as non-zero sizes");

// Construct (potentially temporary) mins and maxes on which to apply maps		// Construct (potentially temporary) mins and maxes on which to apply maps
// that define tile subshapes.		// that define tile subshapes.
SmallVector<Value> lbs = computeTileOffsets(b, loc, ivs, tileSizes);		SmallVector<Value> lbs = computeTileOffsets(b, loc, ivs, tileSizes);
Show All 18 Lines	if (!isTiled(map, tileSizes) && !linalgOp.isOutputTensor(opOperand)) {
tiledShapes.push_back(shapedOp);		tiledShapes.push_back(shapedOp);
LLVM_DEBUG(llvm::dbgs() << ": not tiled: use shape: "		LLVM_DEBUG(llvm::dbgs() << ": not tiled: use shape: "
<< opOperand->get().getType() << "\n");		<< opOperand->get().getType() << "\n");
continue;		continue;
}		}
LLVM_DEBUG(llvm::dbgs() << ": tiled: figure out subshape...\n");		LLVM_DEBUG(llvm::dbgs() << ": tiled: figure out subshape...\n");

tiledShapes.push_back(makeTiledShape(b, loc, shapedOp, tileSizes, map, lbs,		tiledShapes.push_back(makeTiledShape(b, loc, shapedOp, tileSizes, map, lbs,
sizeBounds, subShapeSizes));		sizeBounds, subShapeSizes,
		omitPartialTileCheck));
}		}

return tiledShapes;		return tiledShapes;
}		}

void addTileLoopIvsToIndexOpResults(OpBuilder &b, LinalgOp tiledOp,		void addTileLoopIvsToIndexOpResults(OpBuilder &b, LinalgOp tiledOp,
ArrayRef<Value> ivs) {		ArrayRef<Value> ivs) {
if (tiledOp.hasIndexSemantics()) {		if (tiledOp.hasIndexSemantics()) {
Show All 17 Lines

mlir/lib/IR/AffineMap.cpp

Show First 20 Lines • Show All 673 Lines • ▼ Show 20 Lines	AffineMap mlir::inversePermutation(AffineMap map) {
for (auto expr : exprs)		for (auto expr : exprs)
if (expr)		if (expr)
seenExprs.push_back(expr);		seenExprs.push_back(expr);
if (seenExprs.size() != map.getNumInputs())		if (seenExprs.size() != map.getNumInputs())
return AffineMap();		return AffineMap();
return AffineMap::get(map.getNumResults(), 0, seenExprs, map.getContext());		return AffineMap::get(map.getNumResults(), 0, seenExprs, map.getContext());
}		}

AffineMap mlir::inverseAndBroadcastProjectedPermuation(AffineMap map) {		AffineMap mlir::inverseAndBroadcastProjectedPermutation(AffineMap map) {
assert(map.isProjectedPermutation(/*allowZeroInResults=*/true));		assert(map.isProjectedPermutation(/*allowZeroInResults=*/true));
MLIRContext *context = map.getContext();		MLIRContext *context = map.getContext();
AffineExpr zero = mlir::getAffineConstantExpr(0, context);		AffineExpr zero = mlir::getAffineConstantExpr(0, context);
// Start with all the results as 0.		// Start with all the results as 0.
SmallVector<AffineExpr, 4> exprs(map.getNumInputs(), zero);		SmallVector<AffineExpr, 4> exprs(map.getNumInputs(), zero);
for (unsigned i : llvm::seq(unsigned(0), map.getNumResults())) {		for (unsigned i : llvm::seq(unsigned(0), map.getNumResults())) {
// Skip zeros from input map. 'exprs' is already initialized to zero.		// Skip zeros from input map. 'exprs' is already initialized to zero.
if (auto constExpr = map.getResult(i).dyn_cast<AffineConstantExpr>()) {		if (auto constExpr = map.getResult(i).dyn_cast<AffineConstantExpr>()) {
▲ Show 20 Lines • Show All 73 Lines • Show Last 20 Lines

mlir/test/Dialect/Linalg/bubble-up-extract-slice-op.mlir

This file was added.

				//RUN: mlir-opt -test-linalg-transform-patterns=test-bubble-up-extract-slice-op-pattern -split-input-file %s | FileCheck %s

				func @dynamic(%arg0: tensor<?x?xf32>, %arg1: tensor<?xf32>, %arg2: index, %arg3: index, %arg4: index, %arg5:index) -> tensor<?x?xf32> {
				%0 = linalg.generic {
				indexing_maps = [affine_map<(d0, d1) -> (d0, d1)>,
				affine_map<(d0, d1) -> (d1)>,
				affine_map<(d0, d1) -> (d0, d1)>],
				iterator_types = ["parallel", "parallel"]
				} ins(%arg0, %arg1 : tensor<?x?xf32>, tensor<?xf32>)
				outs(%arg0 : tensor<?x?xf32>) {
				^bb0(%b0 : f32, %b1 : f32, %b2 : f32):
				%add = arith.addf %b0, %b1 : f32
				linalg.yield %add : f32
				} -> tensor<?x?xf32>
				%1 = tensor.extract_slice %0 [%arg2, %arg3] [%arg4, %arg5] [1, 1]
				: tensor<?x?xf32> to tensor<?x?xf32>
				return %1 : tensor<?x?xf32>
				}

				// CHECK: func @dynamic
				// CHECK: %[[SLICE0:.+]] = tensor.extract_slice %arg0[%arg2, %arg3] [%arg4, %arg5] [1, 1] : tensor<?x?xf32> to tensor<?x?xf32>
				// CHECK: %[[SLICE1:.+]] = tensor.extract_slice %arg1[%arg3] [%arg5] [1] : tensor<?xf32> to tensor<?xf32>
				// CHECK: %[[SLICE2:.+]] = tensor.extract_slice %arg0[%arg2, %arg3] [%arg4, %arg5] [1, 1] : tensor<?x?xf32> to tensor<?x?xf32>
				// CHECK: %[[GENERIC:.+]] = linalg.generic {indexing_maps = [#map0, #map1, #map0], iterator_types = ["parallel", "parallel"]}
				// CHECK-SAME: ins(%[[SLICE0]], %[[SLICE1]] : tensor<?x?xf32>, tensor<?xf32>) outs(%[[SLICE2]] : tensor<?x?xf32>)
				// CHECK: return %[[GENERIC]] : tensor<?x?xf32>

				//-----

				func @static(%arg0: tensor<16x8xf32>, %arg1: tensor<8xf32>) -> tensor<4x2xf32> {
				%0 = linalg.generic {
				indexing_maps = [affine_map<(d0, d1) -> (d0, d1)>,
				affine_map<(d0, d1) -> (d1)>,
				affine_map<(d0, d1) -> (d0, d1)>],
				iterator_types = ["parallel", "parallel"]
				} ins(%arg0, %arg1 : tensor<16x8xf32>, tensor<8xf32>)
				outs(%arg0 : tensor<16x8xf32>) {
				^bb0(%b0 : f32, %b1 : f32, %b2 : f32):
				%add = arith.addf %b0, %b1 : f32
				linalg.yield %add : f32
				} -> tensor<16x8xf32>
				%1 = tensor.extract_slice %0 [8, 4] [4, 2] [1, 1]
				: tensor<16x8xf32> to tensor<4x2xf32>
				return %1 : tensor<4x2xf32>
				}

				// CHECK: func @static
				// CHECK: %[[SLICE0:.+]] = tensor.extract_slice %arg0[8, 4] [4, 2] [1, 1] : tensor<16x8xf32> to tensor<4x2xf32>
				// CHECK: %[[SLICE1:.+]] = tensor.extract_slice %arg1[4] [2] [1] : tensor<8xf32> to tensor<2xf32>
				// CHECK: %[[SLICE2:.+]] = tensor.extract_slice %arg0[8, 4] [4, 2] [1, 1] : tensor<16x8xf32> to tensor<4x2xf32>
				// CHECK: %[[GENERIC:.+]] = linalg.generic {indexing_maps = [#map0, #map1, #map0], iterator_types = ["parallel", "parallel"]}
				// CHECK-SAME: ins(%[[SLICE0]], %[[SLICE1]] : tensor<4x2xf32>, tensor<2xf32>) outs(%[[SLICE2]] : tensor<4x2xf32>)
				// CHECK: return %[[GENERIC]] : tensor<4x2xf32>

				//-----

				func @mixed(%arg0: tensor<?x8xf32>, %arg1: tensor<8xf32>, %arg2: index, %arg3: index) -> tensor<?x2xf32> {
				%0 = linalg.generic {
				indexing_maps = [affine_map<(d0, d1) -> (d0, d1)>,
				affine_map<(d0, d1) -> (d1)>,
				affine_map<(d0, d1) -> (d0, d1)>],
				iterator_types = ["parallel", "parallel"]
				} ins(%arg0, %arg1 : tensor<?x8xf32>, tensor<8xf32>)
				outs(%arg0 : tensor<?x8xf32>) {
				^bb0(%b0 : f32, %b1 : f32, %b2 : f32):
				%add = arith.addf %b0, %b1 : f32
				linalg.yield %add : f32
				} -> tensor<?x8xf32>
				%1 = tensor.extract_slice %0 [8, %arg2] [%arg3, 2] [1, 1]
				: tensor<?x8xf32> to tensor<?x2xf32>
				return %1 : tensor<?x2xf32>
				}

				// CHECK: func @mixed
				// CHECK: %[[SLICE0:.+]] = tensor.extract_slice %arg0[8, %arg2] [%arg3, 2] [1, 1] : tensor<?x8xf32> to tensor<?x2xf32>
				// CHECK: %[[SLICE1:.+]] = tensor.extract_slice %arg1[%arg2] [2] [1] : tensor<8xf32> to tensor<2xf32>
				// CHECK: %[[SLICE2:.+]] = tensor.extract_slice %arg0[8, %arg2] [%arg3, 2] [1, 1] : tensor<?x8xf32> to tensor<?x2xf32>
				// CHECK: %[[GENERIC:.+]] = linalg.generic {indexing_maps = [#map0, #map1, #map0], iterator_types = ["parallel", "parallel"]}
				// CHECK-SAME: ins(%[[SLICE0]], %[[SLICE1]] : tensor<?x2xf32>, tensor<2xf32>) outs(%[[SLICE2]] : tensor<?x2xf32>)
				// CHECK: return %[[GENERIC]] : tensor<?x2xf32>

				//-----

				func @dynamic_to_static(%arg0: tensor<?x?xf32>, %arg1: tensor<?xf32>) -> tensor<4x2xf32> {
				%0 = linalg.generic {
				indexing_maps = [affine_map<(d0, d1) -> (d0, d1)>,
				affine_map<(d0, d1) -> (d1)>,
				affine_map<(d0, d1) -> (d0, d1)>],
				iterator_types = ["parallel", "parallel"]
				} ins(%arg0, %arg1 : tensor<?x?xf32>, tensor<?xf32>)
				outs(%arg0 : tensor<?x?xf32>) {
				^bb0(%b0 : f32, %b1 : f32, %b2 : f32):
				%add = arith.addf %b0, %b1 : f32
				linalg.yield %add : f32
				} -> tensor<?x?xf32>
				%1 = tensor.extract_slice %0 [8, 4] [4, 2] [1, 1]
				: tensor<?x?xf32> to tensor<4x2xf32>
				return %1 : tensor<4x2xf32>
				}

				// CHECK: func @dynamic_to_static
				// CHECK: %[[SLICE0:.+]] = tensor.extract_slice %arg0[8, 4] [4, 2] [1, 1] : tensor<?x?xf32> to tensor<4x2xf32>
				// CHECK: %[[SLICE1:.+]] = tensor.extract_slice %arg1[4] [2] [1] : tensor<?xf32> to tensor<2xf32>
				// CHECK: %[[SLICE2:.+]] = tensor.extract_slice %arg0[8, 4] [4, 2] [1, 1] : tensor<?x?xf32> to tensor<4x2xf32>
				// CHECK: %[[GENERIC:.+]] = linalg.generic {indexing_maps = [#map0, #map1, #map0], iterator_types = ["parallel", "parallel"]}
				// CHECK-SAME: ins(%[[SLICE0]], %[[SLICE1]] : tensor<4x2xf32>, tensor<2xf32>) outs(%[[SLICE2]] : tensor<4x2xf32>)
				// CHECK: return %[[GENERIC]] : tensor<4x2xf32>

				//-----

				func @matmul_slice() -> tensor<2x2xf32> {
				%lhs = arith.constant dense<1.0> : tensor<4x4xf32>
				%rhs = arith.constant dense<1.0> : tensor<4x4xf32>
				%dst = arith.constant dense<[[0.0, 1.0, 2.0, 3.0], [4.0, 5.0, 6.0, 7.0], [8.0, 9.0, 10.0, 11.0], [12.0, 13.0, 14.0, 15.0]]> : tensor<4x4xf32>
				%0 = linalg.matmul ins(%lhs, %rhs : tensor<4x4xf32>, tensor<4x4xf32>) outs(%dst : tensor<4x4xf32>) -> tensor<4x4xf32>
				%1 = tensor.extract_slice %0[1,1][2,2][1,1] : tensor<4x4xf32> to tensor<2x2xf32>
				return %1 : tensor<2x2xf32>
				}

				// CHECK: func @matmul_slice
				// CHECK: %[[SLICE0:.+]] = arith.constant dense<1.000000e+00> : tensor<2x4xf32>
				// CHECK: %[[SLICE1:.+]] = arith.constant dense<1.000000e+00> : tensor<4x2xf32>
				// CHECK: %[[SLICE3:.+]] = tensor.extract_slice %[[CST:.+]][1, 1] [2, 2] [1, 1] : tensor<4x4xf32> to tensor<2x2xf32>
				// CHECK: %[[MATMUL:.+]] = linalg.matmul ins(%[[SLICE0]], %[[SLICE1]] : tensor<2x4xf32>, tensor<4x2xf32>) outs(%[[SLICE3]] : tensor<2x2xf32>) -> tensor<2x2xf32>
				// CHECK: return %[[MATMUL]] : tensor<2x2xf32>

				//-----

				func @conv_slice(%input: tensor<1x225x225x3xf32>, %filter: tensor<3x3x3x32xf32>) -> tensor<1x32x32x16xf32> {
				%c112 = arith.constant 112 : index
				%c32 = arith.constant 32 : index
				%c16 = arith.constant 16 : index
				%c8 = arith.constant 8 : index
				%c4 = arith.constant 4 : index
				%c0 = arith.constant 0 : index
				%cst = arith.constant 0.0 : f32

				%init = linalg.init_tensor [1, 112, 112, 32] : tensor<1x112x112x32xf32>
				%fill = linalg.fill ins(%cst : f32) outs(%init : tensor<1x112x112x32xf32>) -> tensor<1x112x112x32xf32>

				%conv = linalg.conv_2d_nhwc_hwcf
				{dilations = dense<1> : tensor<2xi64>, strides = dense<2> : tensor<2xi64>}
				ins(%input, %filter : tensor<1x225x225x3xf32>, tensor<3x3x3x32xf32>)
				outs(%fill : tensor<1x112x112x32xf32>) -> tensor<1x112x112x32xf32>

				%slice = tensor.extract_slice %conv [0, 64, 64, 16] [1, 32, 32, 16] [1, 1, 1, 1] : tensor<1x112x112x32xf32> to tensor<1x32x32x16xf32>

				return %slice : tensor<1x32x32x16xf32>
				}

				// CHECK: func @conv_slice
				// CHECK: %[[INIT:.+]] = linalg.init_tensor [1, 112, 112, 32] : tensor<1x112x112x32xf32>
				// CHECK: %[[SLICE0:.+]] = tensor.extract_slice %arg0[0, 128, 128, 0] [1, 65, 65, 3] [1, 1, 1, 1] : tensor<1x225x225x3xf32> to tensor<1x65x65x3xf32>
				// CHECK: %[[SLICE1:.+]] = tensor.extract_slice %arg1[0, 0, 0, 16] [3, 3, 3, 16] [1, 1, 1, 1] : tensor<3x3x3x32xf32> to tensor<3x3x3x16xf32>
				// CHECK: %[[SLICE2:.+]] = tensor.extract_slice %[[INIT]][0, 64, 64, 16] [1, 32, 32, 16] [1, 1, 1, 1] : tensor<1x112x112x32xf32> to tensor<1x32x32x16xf32>
				// CHECK: %[[FILL:.+]] = linalg.fill ins(%[[CST:.+]] : f32) outs(%[[SLICE2]] : tensor<1x32x32x16xf32>) -> tensor<1x32x32x16xf32>
				// CHECK: %[[CONV:.+]] = linalg.conv_2d_nhwc_hwcf {dilations = dense<1> : tensor<2xi64>, strides = dense<2> : tensor<2xi64>} ins(%[[SLICE0]], %[[SLICE1]] : tensor<1x65x65x3xf32>, tensor<3x3x3x16xf32>) outs(%[[FILL]] : tensor<1x32x32x16xf32>) -> tensor<1x32x32x16xf32>
				// CHECK: return %[[CONV]] : tensor<1x32x32x16xf32>

mlir/test/lib/Dialect/Linalg/TestLinalgTransforms.cpp

Show First 20 Lines • Show All 126 Lines • ▼ Show 20 Lines	Option<bool> skipPartial{
*this, "skip-partial",		*this, "skip-partial",
llvm::cl::desc("Skip loops inside partial iterations during peeling"),		llvm::cl::desc("Skip loops inside partial iterations during peeling"),
llvm::cl::init(false)};		llvm::cl::init(false)};
Option<std::string> loopType{		Option<std::string> loopType{
*this, "loop-type",		*this, "loop-type",
llvm::cl::desc("Specify the type of loops to generate: for, parallel or "		llvm::cl::desc("Specify the type of loops to generate: for, parallel or "
"tiled_loop"),		"tiled_loop"),
llvm::cl::init("for")};		llvm::cl::init("for")};
		Option<bool> testBubbleUpExtractSliceOpPattern{
		*this, "test-bubble-up-extract-slice-op-pattern",
		llvm::cl::desc("Test rewrite of linalgOp + extract_slice into "
		"extract_slice + linalgOp"),
		llvm::cl::init(false)};
};		};
} // namespace		} // namespace

static void applyPatterns(FuncOp funcOp) {		static void applyPatterns(FuncOp funcOp) {
MLIRContext *ctx = funcOp.getContext();		MLIRContext *ctx = funcOp.getContext();
RewritePatternSet patterns(ctx);		RewritePatternSet patterns(ctx);

//===--------------------------------------------------------------------===//		//===--------------------------------------------------------------------===//
▲ Show 20 Lines • Show All 487 Lines • ▼ Show 20 Lines	linalg::populateSplitReductionPattern(
return std::make_pair(4, insertDimIndex);		return std::make_pair(4, insertDimIndex);
},		},
LinalgTransformationFilter(		LinalgTransformationFilter(
ArrayRef<StringAttr>{},		ArrayRef<StringAttr>{},
StringAttr::get(funcOp.getContext(), "SPLIT")));		StringAttr::get(funcOp.getContext(), "SPLIT")));
(void)applyPatternsAndFoldGreedily(funcOp, std::move(patterns));		(void)applyPatternsAndFoldGreedily(funcOp, std::move(patterns));
}		}

		static void applyBubbleUpExtractSliceOpPattern(FuncOp funcOp) {
		RewritePatternSet patterns(funcOp.getContext());
		populateBubbleUpExtractSliceOpPatterns(patterns);
		(void)applyPatternsAndFoldGreedily(funcOp, std::move(patterns));
		}

/// Apply transformations specified as patterns.		/// Apply transformations specified as patterns.
void TestLinalgTransforms::runOnOperation() {		void TestLinalgTransforms::runOnOperation() {
auto lambda = [&](void *) {		auto lambda = [&](void *) {
getOperation().walk([](LinalgOp op) {		getOperation().walk([](LinalgOp op) {
op->removeAttr(LinalgTransforms::kLinalgTransformMarker);		op->removeAttr(LinalgTransforms::kLinalgTransformMarker);
});		});
};		};
std::unique_ptr<void, decltype(lambda)> cleanupGuard{(void *)1, lambda};		std::unique_ptr<void, decltype(lambda)> cleanupGuard{(void *)1, lambda};
Show All 35 Lines	void TestLinalgTransforms::runOnOperation() {
if (testTilePattern)		if (testTilePattern)
return applyTilePattern(getOperation(), loopType, tileSizes, peeledLoops,		return applyTilePattern(getOperation(), loopType, tileSizes, peeledLoops,
/*scalarizeDynamicDims=*/false);		/*scalarizeDynamicDims=*/false);
if (testTileScalarizeDynamicDims)		if (testTileScalarizeDynamicDims)
return applyTilePattern(getOperation(), loopType, tileSizes,		return applyTilePattern(getOperation(), loopType, tileSizes,
/*peeledLoops=*/{}, /*scalarizeDynamicDims=*/true);		/*peeledLoops=*/{}, /*scalarizeDynamicDims=*/true);
if (testSplitReduction)		if (testSplitReduction)
return applySplitReduction(getOperation());		return applySplitReduction(getOperation());
		if (testBubbleUpExtractSliceOpPattern)
		return applyBubbleUpExtractSliceOpPattern(getOperation());
}		}

namespace mlir {		namespace mlir {
namespace test {		namespace test {
void registerTestLinalgTransforms() {		void registerTestLinalgTransforms() {
PassRegistration<TestLinalgTransforms>();		PassRegistration<TestLinalgTransforms>();
}		}
} // namespace test		} // namespace test
} // namespace mlir		} // namespace mlir

This is an archive of the discontinued LLVM Phabricator instance.

[mlir] Bubble up tensor.extract_slice above linalg operation
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 419503

mlir/include/mlir/Dialect/Linalg/Transforms/Transforms.h

mlir/include/mlir/Dialect/Linalg/Utils/Utils.h

mlir/include/mlir/IR/AffineMap.h

mlir/lib/Dialect/Linalg/Transforms/BubbleUpExtractSlice.cpp

mlir/lib/Dialect/Linalg/Transforms/CMakeLists.txt

mlir/lib/Dialect/Linalg/Transforms/Fusion.cpp

mlir/lib/Dialect/Linalg/Transforms/FusionOnTensors.cpp

mlir/lib/Dialect/Linalg/Transforms/Tiling.cpp

mlir/lib/Dialect/Linalg/Transforms/Vectorization.cpp

mlir/lib/Dialect/Linalg/Utils/Utils.cpp

mlir/lib/IR/AffineMap.cpp

mlir/test/Dialect/Linalg/bubble-up-extract-slice-op.mlir

mlir/test/lib/Dialect/Linalg/TestLinalgTransforms.cpp

This is an archive of the discontinued LLVM Phabricator instance.

[mlir] Bubble up tensor.extract_slice above linalg operation
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 419503

mlir/include/mlir/Dialect/Linalg/Transforms/Transforms.h

mlir/include/mlir/Dialect/Linalg/Utils/Utils.h

mlir/include/mlir/IR/AffineMap.h

mlir/lib/Dialect/Linalg/Transforms/BubbleUpExtractSlice.cpp

mlir/lib/Dialect/Linalg/Transforms/CMakeLists.txt

mlir/lib/Dialect/Linalg/Transforms/Fusion.cpp

mlir/lib/Dialect/Linalg/Transforms/FusionOnTensors.cpp

mlir/lib/Dialect/Linalg/Transforms/Tiling.cpp

mlir/lib/Dialect/Linalg/Transforms/Vectorization.cpp

mlir/lib/Dialect/Linalg/Utils/Utils.cpp

mlir/lib/IR/AffineMap.cpp

mlir/test/Dialect/Linalg/bubble-up-extract-slice-op.mlir

mlir/test/lib/Dialect/Linalg/TestLinalgTransforms.cpp

[mlir] Bubble up tensor.extract_slice above linalg operation
ClosedPublic