Diff 503871

mlir/include/mlir/Dialect/NVGPU/Utils/MMAUtils.h

Show First 20 Lines • Show All 87 Lines • ▼ Show 20 Lines	FailureOr<LdMatrixParams> getLdMatrixParams(const WarpMatrixInfo &type,
bool transpose);		bool transpose);
/// Returns an AffineMap which maps a single dimension representing the laneId		/// Returns an AffineMap which maps a single dimension representing the laneId
/// to two results representing offsets within the matrix operand that should		/// to two results representing offsets within the matrix operand that should
/// be the pointer locations a thread should pass to the ldmatrix instruction.		/// be the pointer locations a thread should pass to the ldmatrix instruction.
FailureOr<AffineMap>		FailureOr<AffineMap>
getLaneIdToLdMatrixMatrixCoord(OpBuilder &builder, Location loc,		getLaneIdToLdMatrixMatrixCoord(OpBuilder &builder, Location loc,
const LdMatrixParams &params);		const LdMatrixParams &params);

/// Rewrite pattern that transforms a `vector.contract` into the
/// (m,k)x(n,k)x(m,n) form so that it can be converted to `nvgpu.mma.sync`.
/// In this form both operands are indexed with the reduction dimension `k`
/// last, i.e. the vector operands are organized such that the reduction
/// dimension is contiguous.
struct PrepareContractToGPUMMASync
: public OpRewritePattern<vector::ContractionOp> {
using OpRewritePattern<vector::ContractionOp>::OpRewritePattern;

/// Matches contractions with exactly three iterators
/// (parallel, parallel, reduction) and rewrites them into the target form by
/// transposing and/or swapping the LHS and RHS operands. Returns failure when
/// the iterators do not match, when `op` is already in the target form, or
/// when the indexing maps are not one of the handled combinations.
LogicalResult matchAndRewrite(vector::ContractionOp op,
PatternRewriter &rewriter) const override;
};

} // namespace nvgpu		} // namespace nvgpu
} // namespace mlir		} // namespace mlir

#endif // MLIR_DIALECT_NVGPU_UTILS_MMAUTILS_H		#endif // MLIR_DIALECT_NVGPU_UTILS_MMAUTILS_H

mlir/include/mlir/Dialect/Vector/Transforms/VectorRewritePatterns.h

Show All 11 Lines
#include <utility>		#include <utility>
#include <optional>		#include <optional>

#include "mlir/Dialect/Vector/IR/VectorOps.h"		#include "mlir/Dialect/Vector/IR/VectorOps.h"
#include "mlir/Dialect/Vector/Transforms/VectorTransformsEnums.h.inc"		#include "mlir/Dialect/Vector/Transforms/VectorTransformsEnums.h.inc"
#include "mlir/Dialect/Vector/Utils/VectorUtils.h"		#include "mlir/Dialect/Vector/Utils/VectorUtils.h"
#include "mlir/IR/BuiltinOps.h"		#include "mlir/IR/BuiltinOps.h"
#include "mlir/IR/PatternMatch.h"		#include "mlir/IR/PatternMatch.h"
		#include "mlir/Support/LogicalResult.h"

namespace mlir {		namespace mlir {
class RewritePatternSet;		class RewritePatternSet;

namespace vector {		namespace vector {

//===----------------------------------------------------------------------===//		//===----------------------------------------------------------------------===//
// Vector transformation options exposed as auxiliary structs.		// Vector transformation options exposed as auxiliary structs.
▲ Show 20 Lines • Show All 114 Lines • ▼ Show 20 Lines

/// Collects patterns to progressively lower vector contraction ops on high-D		/// Collects patterns to progressively lower vector contraction ops on high-D
/// into low-D reduction and product ops.		/// into low-D reduction and product ops.
void populateVectorContractLoweringPatterns(		void populateVectorContractLoweringPatterns(
RewritePatternSet &patterns,		RewritePatternSet &patterns,
VectorTransformsOptions options = VectorTransformsOptions(),		VectorTransformsOptions options = VectorTransformsOptions(),
PatternBenefit benefit = 1);		PatternBenefit benefit = 1);

		/// Canonicalization of a `vector.contract %a, %b, %c` with row-major matmul
		/// semantics to a contraction with MMT semantics (matrix matrix multiplication
		/// with the RHS transposed). In this form the vector operands are organized
		/// such that the reduction dimension is contiguous.
		/// Example of the resulting MMT form:
		/// ```
		/// vector.contract {indexing_maps = [affine_map<(m, n, k) -> (m, k)>,
		/// affine_map<(m, n, k) -> (n, k)>,
		/// affine_map<(m, n, k) -> (m, n)>],
		/// iterator_types = ["parallel", "parallel", "reduction"],
		/// kind = #vector.kind<add>} %a, %b, %c : ...
		/// ```
		///
		/// The `constraint` predicate selects which `vector.contract` ops are
		/// rewritten: ops for which it returns failure are left untouched. The
		/// default predicate accepts every op.
		void populateVectorContractCanonicalizeMatmulToMMT(
		RewritePatternSet &patterns,
		std::function<LogicalResult(vector::ContractionOp)> constraint =
		[](vector::ContractionOp) { return success(); },
		PatternBenefit = 1);

/// Collect patterns to convert reduction op to vector.contract and fold		/// Collect patterns to convert reduction op to vector.contract and fold
/// transpose/broadcast ops into the contract.		/// transpose/broadcast ops into the contract.
void populateVectorReductionToContractPatterns(RewritePatternSet &patterns,		void populateVectorReductionToContractPatterns(RewritePatternSet &patterns,
PatternBenefit benefit = 1);		PatternBenefit benefit = 1);

/// Collect patterns to convert scan op		/// Collect patterns to convert scan op
void populateVectorScanLoweringPatterns(RewritePatternSet &patterns,		void populateVectorScanLoweringPatterns(RewritePatternSet &patterns,
PatternBenefit benefit = 1);		PatternBenefit benefit = 1);
▲ Show 20 Lines • Show All 356 Lines • ▼ Show 20 Lines	FailureOr<Value> lowerParallel(PatternRewriter &rewriter,
vector::ContractionOp op, int64_t lhsIndex,		vector::ContractionOp op, int64_t lhsIndex,
int64_t rhsIndex, Value mask) const;		int64_t rhsIndex, Value mask) const;
// Lower one reduction dimension.		// Lower one reduction dimension.
FailureOr<Value> lowerReduction(PatternRewriter &rewriter,		FailureOr<Value> lowerReduction(PatternRewriter &rewriter,
vector::ContractionOp op, Value mask) const;		vector::ContractionOp op, Value mask) const;
};		};

} // namespace vector		} // namespace vector
} // namespace mlir		} // namespace mlir
		dcaballeUnsubmitted Done Reply Inline Actions Excuse my ignorance... What is MMT and TNT? Perhaps adding a comment would help. dcaballe: Excuse my ignorance... What is MMT and TNT? Perhaps adding a comment would help.
		kuharAuthorUnsubmitted Done Reply Inline Actions It's probably my ignorance, I wasn't sure if there's some standard nomenclature for this. The goal is to have the contraction in the matrix x matrix-transposed form (LHS row-major, RHS col-major, OUT row-major). The original code called it MMA (matrix multiply-accumulate), but I thought that was too nvidia-specific because it doesn't suggest anything about the canonical form outside of the context of the nvidia isa, IIUC. Do you have any concrete suggestions or pointers to relevant documentation/literature? kuhar: It's probably my ignorance, I wasn't sure if there's some standard nomenclature for this. The…
		ThomasRaouxUnsubmitted Done Reply Inline Actions Since it is an important piece I would spell it out and expand MMT to matmul with rhs transpose and the following IR example should be enough to explain what the transformation does. ThomasRaoux: Since it is an important piece I would spell it out and expand MMT to matmul with rhs transpose…

#endif // MLIR_DIALECT_VECTOR_TRANSFORMS_VECTORREWRITEPATTERNS_H		#endif // MLIR_DIALECT_VECTOR_TRANSFORMS_VECTORREWRITEPATTERNS_H
		ThomasRaouxUnsubmitted Done Reply Inline Actions can we expose a `populate*` function instead of having the class in the public header? ThomasRaoux: can we expose a `populate*` function instead of having the class in the public header?
		kuharAuthorUnsubmitted Done Reply Inline Actions I wanted to keep this move simple and decided to follow the way this pattern was implemented (and also how the neighboring vector patterns are exposed). I wanted to move it to a 'populate' function in a subsequent review, but I can do it in one step if that's preferred. WDYT? kuhar: I wanted to keep this move simple and decided to follow the way this pattern was implemented…
		ThomasRaouxUnsubmitted Done Reply Inline Actions Since it is better to not change what we expose publicly multiple times I would suggest adding the `populate` function right away. It should be a minimal amount of changes. ThomasRaoux: Since it is better to not change what we expose publicly multiple times I would suggest adding…

mlir/lib/Conversion/VectorToGPU/VectorToGPU.cpp

	Show All 18 Lines
	#include "mlir/Dialect/Arith/IR/Arith.h"			#include "mlir/Dialect/Arith/IR/Arith.h"
	#include "mlir/Dialect/GPU/IR/GPUDialect.h"			#include "mlir/Dialect/GPU/IR/GPUDialect.h"
	#include "mlir/Dialect/MemRef/IR/MemRef.h"			#include "mlir/Dialect/MemRef/IR/MemRef.h"
	#include "mlir/Dialect/NVGPU/IR/NVGPUDialect.h"			#include "mlir/Dialect/NVGPU/IR/NVGPUDialect.h"
	#include "mlir/Dialect/NVGPU/Utils/MMAUtils.h"			#include "mlir/Dialect/NVGPU/Utils/MMAUtils.h"
	#include "mlir/Dialect/SCF/IR/SCF.h"			#include "mlir/Dialect/SCF/IR/SCF.h"
	#include "mlir/Dialect/Utils/StructuredOpsUtils.h"			#include "mlir/Dialect/Utils/StructuredOpsUtils.h"
	#include "mlir/Dialect/Vector/IR/VectorOps.h"			#include "mlir/Dialect/Vector/IR/VectorOps.h"
				#include "mlir/Dialect/Vector/Transforms/VectorRewritePatterns.h"
	#include "mlir/Dialect/Vector/Utils/VectorUtils.h"			#include "mlir/Dialect/Vector/Utils/VectorUtils.h"
	#include "mlir/IR/Builders.h"			#include "mlir/IR/Builders.h"
	#include "mlir/IR/BuiltinOps.h"			#include "mlir/IR/BuiltinOps.h"
	#include "mlir/IR/Region.h"			#include "mlir/IR/Region.h"
	#include "mlir/Pass/Pass.h"			#include "mlir/Pass/Pass.h"
	#include "mlir/Support/LogicalResult.h"			#include "mlir/Support/LogicalResult.h"
	#include "mlir/Transforms/GreedyPatternRewriteDriver.h"			#include "mlir/Transforms/GreedyPatternRewriteDriver.h"
	#include "mlir/Transforms/Passes.h"			#include "mlir/Transforms/Passes.h"
	▲ Show 20 Lines • Show All 1,133 Lines • ▼ Show 20 Lines

	void mlir::populatePrepareVectorToMMAPatterns(RewritePatternSet &patterns,			void mlir::populatePrepareVectorToMMAPatterns(RewritePatternSet &patterns,
	bool useNvGpu) {			bool useNvGpu) {
	if (!useNvGpu) {			if (!useNvGpu) {
	patterns.add<PrepareContractToGPUMMA, CombineTransferReadOpTranspose>(			patterns.add<PrepareContractToGPUMMA, CombineTransferReadOpTranspose>(
	patterns.getContext());			patterns.getContext());
	return;			return;
	}			}
	patterns			vector::populateVectorContractCanonicalizeMatmulToMMT(patterns);
	.add<nvgpu::PrepareContractToGPUMMASync, CombineTransferReadOpTranspose>(			patterns.add<CombineTransferReadOpTranspose>(patterns.getContext());
	patterns.getContext());
	}			}

	LogicalResult mlir::convertVectorToMMAOps(RewriterBase &rewriter,			LogicalResult mlir::convertVectorToMMAOps(RewriterBase &rewriter,
	Operation *rootOp) {			Operation *rootOp) {
	SetVector<Operation > ops = getOpToConvert(rootOp, /useNvGpu=*/false);			SetVector<Operation > ops = getOpToConvert(rootOp, /useNvGpu=*/false);
	llvm::DenseMap<Value, Value> valueMapping;			llvm::DenseMap<Value, Value> valueMapping;

	auto globalRes = LogicalResult::success();			auto globalRes = LogicalResult::success();
	▲ Show 20 Lines • Show All 99 Lines • Show Last 20 Lines

mlir/lib/Dialect/NVGPU/Utils/MMAUtils.cpp

Show First 20 Lines • Show All 266 Lines • ▼ Show 20 Lines	nvgpu::getLaneIdToLdMatrixMatrixCoord(OpBuilder &builder, Location loc,
// This case corresponds to col-major matrixA or row-major matrixB or		// This case corresponds to col-major matrixA or row-major matrixB or
// col-major matrixC. This is when the memory layout in `srcMemref` does not		// col-major matrixC. This is when the memory layout in `srcMemref` does not
// match mma.sync hardware vector register operand layout.		// match mma.sync hardware vector register operand layout.
if (params.contiguousDimType == vector::IteratorType::parallel)		if (params.contiguousDimType == vector::IteratorType::parallel)
return makeMap({contiguous, strided});		return makeMap({contiguous, strided});

return failure();		return failure();
}		}

/// Rewrites a matmul-like `vector.contract` into the canonical
/// (m,k)x(n,k)x(m,n) form by transposing and/or swapping the LHS and RHS
/// operands.
///
/// Returns failure (leaving `op` untouched) when:
///   * the op does not have exactly the iterators
///     (parallel, parallel, reduction);
///   * the op is already in the canonical form;
///   * the indexing maps are not one of the handled layout combinations.
/// Otherwise replaces `op` with a new contraction that uses the canonical
/// indexing maps and returns success.
LogicalResult nvgpu::PrepareContractToGPUMMASync::matchAndRewrite(
    vector::ContractionOp op, PatternRewriter &rewriter) const {
  Location loc = op.getLoc();
  Value lhs = op.getLhs();
  Value rhs = op.getRhs();
  Value res = op.getAcc();

  // Set up the parallel/reduction structure in right form.
  using MapList = ArrayRef<ArrayRef<AffineExpr>>;
  auto infer = [](MapList m) { return AffineMap::inferFromExprList(m); };
  AffineExpr m;
  AffineExpr n;
  AffineExpr k;
  bindDims(rewriter.getContext(), m, n, k);
  static constexpr std::array<int64_t, 2> perm = {1, 0};
  auto iteratorTypes = op.getIteratorTypes().getValue();
  SmallVector<AffineMap, 4> maps = op.getIndexingMapsArray();
  if (iteratorTypes.size() != 3)
    return failure();
  if (!(vector::isParallelIterator(iteratorTypes[0]) &&
        vector::isParallelIterator(iteratorTypes[1]) &&
        vector::isReductionIterator(iteratorTypes[2])))
    return failure();

  // The canonical form is "TNT" = A row-major, B col-major, C row-major.
  const auto canonicalForm = infer({{m, k}, {n, k}, {m, n}});
  if (maps == canonicalForm) {
    return failure();
  }
  if (maps == infer({{m, k}, {k, n}, {m, n}})) {
    // Only the RHS has the reduction dimension first.
    rhs = rewriter.create<vector::TransposeOp>(loc, rhs, perm);
  } else if (maps == infer({{k, m}, {n, k}, {m, n}})) {
    // Only the LHS has the reduction dimension first. This case must test
    // (k,m)x(n,k); testing (k,m)x(k,n) here would shadow the next branch and
    // transpose just one of the two operands that need it.
    lhs = rewriter.create<vector::TransposeOp>(loc, lhs, perm);
  } else if (maps == infer({{k, m}, {k, n}, {m, n}})) {
    // Both operands have the reduction dimension first.
    rhs = rewriter.create<vector::TransposeOp>(loc, rhs, perm);
    lhs = rewriter.create<vector::TransposeOp>(loc, lhs, perm);
  } else if (maps == infer({{k, m}, {k, n}, {n, m}})) {
    // The remaining cases produce an (n, m) result: swap the operands so the
    // result becomes (m, n), then transpose whichever operands need it.
    std::swap(rhs, lhs);
    rhs = rewriter.create<vector::TransposeOp>(loc, rhs, perm);
    lhs = rewriter.create<vector::TransposeOp>(loc, lhs, perm);
  } else if (maps == infer({{k, m}, {n, k}, {n, m}})) {
    std::swap(rhs, lhs);
    rhs = rewriter.create<vector::TransposeOp>(loc, rhs, perm);
  } else if (maps == infer({{m, k}, {k, n}, {n, m}})) {
    std::swap(lhs, rhs);
    lhs = rewriter.create<vector::TransposeOp>(loc, lhs, perm);
  } else if (maps == infer({{m, k}, {n, k}, {n, m}})) {
    std::swap(lhs, rhs);
  } else {
    return failure();
  }
  rewriter.replaceOpWithNewOp<vector::ContractionOp>(
      op, lhs, rhs, res, rewriter.getAffineMapArrayAttr(canonicalForm),
      op.getIteratorTypes());
  return success();
}

mlir/lib/Dialect/Vector/Transforms/VectorTransforms.cpp

//===- VectorTransforms.cpp - Conversion within the Vector dialect --------===//		//===- VectorTransforms.cpp - Conversion within the Vector dialect --------===//
//		//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.		// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.		// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception		// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//		//
//===----------------------------------------------------------------------===//		//===----------------------------------------------------------------------===//
//		//
// This file implements target-independent rewrites as 1->N patterns.		// This file implements target-independent rewrites as 1->N patterns.
//		//
//===----------------------------------------------------------------------===//		//===----------------------------------------------------------------------===//

#include "mlir/Dialect/Vector/Transforms/VectorTransforms.h"		#include "mlir/Dialect/Vector/Transforms/VectorTransforms.h"

		#include <functional>
#include <optional>		#include <optional>
#include <type_traits>		#include <type_traits>

#include "mlir/Dialect/Affine/IR/AffineOps.h"		#include "mlir/Dialect/Affine/IR/AffineOps.h"
#include "mlir/Dialect/Arith/IR/Arith.h"		#include "mlir/Dialect/Arith/IR/Arith.h"
#include "mlir/Dialect/Arith/Utils/Utils.h"		#include "mlir/Dialect/Arith/Utils/Utils.h"
#include "mlir/Dialect/Linalg/IR/Linalg.h"		#include "mlir/Dialect/Linalg/IR/Linalg.h"
#include "mlir/Dialect/MemRef/IR/MemRef.h"		#include "mlir/Dialect/MemRef/IR/MemRef.h"
#include "mlir/Dialect/SCF/IR/SCF.h"		#include "mlir/Dialect/SCF/IR/SCF.h"
#include "mlir/Dialect/Utils/IndexingUtils.h"		#include "mlir/Dialect/Utils/IndexingUtils.h"
#include "mlir/Dialect/Utils/StructuredOpsUtils.h"		#include "mlir/Dialect/Utils/StructuredOpsUtils.h"
#include "mlir/Dialect/Vector/IR/VectorOps.h"		#include "mlir/Dialect/Vector/IR/VectorOps.h"
		#include "mlir/Dialect/Vector/TransformOps/VectorTransformOps.h"
		#include "mlir/Dialect/Vector/Transforms/VectorRewritePatterns.h"
#include "mlir/Dialect/Vector/Utils/VectorUtils.h"		#include "mlir/Dialect/Vector/Utils/VectorUtils.h"
#include "mlir/IR/BuiltinAttributeInterfaces.h"		#include "mlir/IR/BuiltinAttributeInterfaces.h"
#include "mlir/IR/BuiltinTypes.h"		#include "mlir/IR/BuiltinTypes.h"
#include "mlir/IR/ImplicitLocOpBuilder.h"		#include "mlir/IR/ImplicitLocOpBuilder.h"
#include "mlir/IR/Matchers.h"		#include "mlir/IR/Matchers.h"
#include "mlir/IR/PatternMatch.h"		#include "mlir/IR/PatternMatch.h"
#include "mlir/Interfaces/VectorInterfaces.h"		#include "mlir/Interfaces/VectorInterfaces.h"
		#include "mlir/Support/LogicalResult.h"

#include "llvm/ADT/DenseSet.h"		#include "llvm/ADT/DenseSet.h"
#include "llvm/ADT/MapVector.h"		#include "llvm/ADT/MapVector.h"
#include "llvm/ADT/STLExtras.h"		#include "llvm/ADT/STLExtras.h"
#include "llvm/Support/CommandLine.h"		#include "llvm/Support/CommandLine.h"
#include "llvm/Support/Debug.h"		#include "llvm/Support/Debug.h"
#include "llvm/Support/raw_ostream.h"		#include "llvm/Support/raw_ostream.h"

▲ Show 20 Lines • Show All 3,006 Lines • ▼ Show 20 Lines	if (initialValueRank == 0) {
lastOutput);		lastOutput);
}		}

rewriter.replaceOp(scanOp, {result, reduction});		rewriter.replaceOp(scanOp, {result, reduction});
return success();		return success();
}		}
};		};

		/// Canonicalization of a `vector.contract %a, %b, %c` with row-major matmul
		/// semantics to a contraction suitable for MMT (matrix matrix multiplication
		/// with the RHS transposed) lowering.
		///
		/// The rewrite only applies to contractions without masks whose iterators
		/// are exactly (parallel, parallel, reduction). Ops rejected by the optional
		/// filter constraint are left untouched.
		struct CanonicalizeContractMatmulToMMT final
		    : OpRewritePattern<vector::ContractionOp> {
		  using OpRewritePattern::OpRewritePattern;

		  /// Predicate deciding whether a given contraction may be rewritten;
		  /// returning failure skips the op.
		  using FilterConstraintType =
		      std::function<LogicalResult(vector::ContractionOp op)>;

		  CanonicalizeContractMatmulToMMT(MLIRContext *context, PatternBenefit benefit,
		                                  FilterConstraintType constraint)
		      : OpRewritePattern<vector::ContractionOp>(context, benefit),
		        filter(std::move(constraint)) {}

		  /// Rewrites `op` into the (m,k)x(n,k)x(m,n) form by transposing and/or
		  /// swapping its LHS and RHS operands. Reports a match failure when the op
		  /// is masked, rejected by the filter, not a 3-iterator gemm, already
		  /// canonical, or uses an unhandled indexing-map combination.
		  LogicalResult matchAndRewrite(vector::ContractionOp op,
		                                PatternRewriter &rewriter) const override {
		    // TODO: Remove native masks from contraction op?
		    if (!op.getMasks().empty())
		      return failure();

		    // The inherited constructors leave `filter` empty, and callers may also
		    // pass an empty std::function. Treat that as "accept every op" instead
		    // of invoking an empty target.
		    if (filter && failed(filter(op)))
		      return failure();

		    Location loc = op.getLoc();
		    Value lhs = op.getLhs();
		    Value rhs = op.getRhs();
		    Value res = op.getAcc();

		    // Set up the parallel/reduction structure in right form.
		    using MapList = ArrayRef<ArrayRef<AffineExpr>>;
		    auto infer = [](MapList m) { return AffineMap::inferFromExprList(m); };
		    AffineExpr m;
		    AffineExpr n;
		    AffineExpr k;
		    bindDims(rewriter.getContext(), m, n, k);
		    static constexpr std::array<int64_t, 2> perm = {1, 0};
		    auto iteratorTypes = op.getIteratorTypes().getValue();
		    SmallVector<AffineMap, 4> maps = op.getIndexingMapsArray();
		    if (iteratorTypes.size() != 3 ||
		        !vector::isParallelIterator(iteratorTypes[0]) ||
		        !vector::isParallelIterator(iteratorTypes[1]) ||
		        !vector::isReductionIterator(iteratorTypes[2]))
		      return rewriter.notifyMatchFailure(op, "contraction is not a gemm");

		    // The canonical form is "TNT" = A row-major, B col-major, C row-major.
		    const auto canonicalForm = infer({{m, k}, {n, k}, {m, n}});
		    if (maps == canonicalForm)
		      return rewriter.notifyMatchFailure(op, "already in the canonical form");

		    // Create a vector transpose making sure to emit zero/sign-extend at the
		    // end: when the operand is produced by an extension op, transpose the
		    // extension's input and re-create the extension on the transposed value.
		    auto createTranspose = [&rewriter, loc](Value mat) -> Value {
		      if (auto sext = mat.getDefiningOp<arith::ExtSIOp>()) {
		        Value trans =
		            rewriter.create<vector::TransposeOp>(loc, sext.getIn(), perm);
		        return rewriter.create<arith::ExtSIOp>(loc, mat.getType(), trans);
		      }
		      if (auto zext = mat.getDefiningOp<arith::ExtUIOp>()) {
		        Value trans =
		            rewriter.create<vector::TransposeOp>(loc, zext.getIn(), perm);
		        return rewriter.create<arith::ExtUIOp>(loc, mat.getType(), trans);
		      }
		      return rewriter.create<vector::TransposeOp>(loc, mat, perm);
		    };

		    if (maps == infer({{m, k}, {k, n}, {m, n}})) {
		      rhs = createTranspose(rhs);
		    } else if (maps == infer({{k, m}, {n, k}, {m, n}})) {
		      lhs = createTranspose(lhs);
		    } else if (maps == infer({{k, m}, {k, n}, {m, n}})) {
		      rhs = createTranspose(rhs);
		      lhs = createTranspose(lhs);
		    } else if (maps == infer({{k, m}, {k, n}, {n, m}})) {
		      // The remaining cases produce an (n, m) result: swap the operands
		      // first, then transpose whichever operands need it.
		      std::swap(rhs, lhs);
		      rhs = createTranspose(rhs);
		      lhs = createTranspose(lhs);
		    } else if (maps == infer({{k, m}, {n, k}, {n, m}})) {
		      std::swap(rhs, lhs);
		      rhs = createTranspose(rhs);
		    } else if (maps == infer({{m, k}, {k, n}, {n, m}})) {
		      std::swap(lhs, rhs);
		      lhs = createTranspose(lhs);
		    } else if (maps == infer({{m, k}, {n, k}, {n, m}})) {
		      std::swap(lhs, rhs);
		    } else {
		      return rewriter.notifyMatchFailure(op, "unhandled contraction form");
		    }
		    rewriter.replaceOpWithNewOp<vector::ContractionOp>(
		        op, lhs, rhs, res, rewriter.getAffineMapArrayAttr(canonicalForm),
		        op.getIteratorTypes());
		    return success();
		  }

		private:
		  /// Optional user-provided constraint; empty means no filtering.
		  FilterConstraintType filter;
		};

} // namespace		} // namespace

void mlir::vector::populateVectorMaskMaterializationPatterns(		void mlir::vector::populateVectorMaskMaterializationPatterns(
RewritePatternSet &patterns, bool force32BitVectorIndices,		RewritePatternSet &patterns, bool force32BitVectorIndices,
PatternBenefit benefit) {		PatternBenefit benefit) {
patterns.add<VectorCreateMaskOpConversion,		patterns.add<VectorCreateMaskOpConversion,
MaterializeTransferMask<vector::TransferReadOp>,		MaterializeTransferMask<vector::TransferReadOp>,
MaterializeTransferMask<vector::TransferWriteOp>>(		MaterializeTransferMask<vector::TransferWriteOp>>(
Show All 35 Lines	void mlir::vector::populateVectorContractLoweringPatterns(
RewritePatternSet &patterns, VectorTransformsOptions options,		RewritePatternSet &patterns, VectorTransformsOptions options,
PatternBenefit benefit) {		PatternBenefit benefit) {
patterns.add<OuterProductOpLowering>(patterns.getContext(), benefit);		patterns.add<OuterProductOpLowering>(patterns.getContext(), benefit);
patterns.add<ContractionOpLowering, ContractionOpToMatmulOpLowering,		patterns.add<ContractionOpLowering, ContractionOpToMatmulOpLowering,
ContractionOpToOuterProductOpLowering>(		ContractionOpToOuterProductOpLowering>(
options, patterns.getContext(), benefit);		options, patterns.getContext(), benefit);
}		}

		/// Adds the matmul-to-MMT contraction canonicalization pattern to `patterns`
		/// with the given `benefit`, handing `constraint` over to the pattern.
		void mlir::vector::populateVectorContractCanonicalizeMatmulToMMT(
		    RewritePatternSet &patterns,
		    std::function<LogicalResult(vector::ContractionOp)> constraint,
		    PatternBenefit benefit) {
		  MLIRContext *context = patterns.getContext();
		  patterns.add<CanonicalizeContractMatmulToMMT>(context, benefit,
		                                                std::move(constraint));
		}

void mlir::vector::populateVectorTransposeLoweringPatterns(		void mlir::vector::populateVectorTransposeLoweringPatterns(
RewritePatternSet &patterns, VectorTransformsOptions options,		RewritePatternSet &patterns, VectorTransformsOptions options,
PatternBenefit benefit) {		PatternBenefit benefit) {
patterns.add<TransposeOpLowering, TransposeOp2DToShuffleLowering>(		patterns.add<TransposeOpLowering, TransposeOp2DToShuffleLowering>(
options, patterns.getContext(), benefit);		options, patterns.getContext(), benefit);
}		}

void mlir::vector::populateVectorReductionToContractPatterns(		void mlir::vector::populateVectorReductionToContractPatterns(
Show All 34 Lines

mlir/test/Dialect/Vector/vector-contract-matmul-transforms.mlir

This file was added.

				// RUN: mlir-opt %s -test-vector-contraction-prepare-for-mmt-lowering \| FileCheck %s

				// A 1-D contraction with a single reduction iterator is not a matmul; the
				// checks below expect it to be left unchanged.
				// CHECK-LABEL: func.func @not_matmul
				// CHECK-SAME: ([[ARG0:%.+]]: vector<4xf32>, [[ARG1:%.+]]: vector<4xf32>, [[ARG2:%.+]]: f32)
				// CHECK-NEXT: vector.contract
				// CHECK-NEXT: return
				func.func @not_matmul(%arg0: vector<4xf32>, %arg1: vector<4xf32>, %arg2: f32) -> f32 {
				%0 = vector.contract {indexing_maps = [affine_map<(d0) -> (d0)>,
				affine_map<(d0) -> (d0)>,
				affine_map<(d0) -> ()>],
				iterator_types = ["reduction"],
				kind = #vector.kind<add>} %arg0, %arg1, %arg2 :
				vector<4xf32>, vector<4xf32> into f32
				return %0 : f32
				}

				// This contraction is already in the canonical (m,k)x(n,k)->(m,n) form, so
				// the operands are expected to be used as-is with no transpose inserted.
				// CHECK-LABEL: func.func @matmul_mk_nk_mn_4x4xi32
				// CHECK-SAME: ([[ARG0:%.+]]: vector<4x4xi32>, [[ARG1:%.+]]: vector<4x4xi32>, [[ARG2:%.+]]: vector<4x4xi32>)
				// CHECK-NEXT: [[RES:%.+]] = vector.contract {{.+}} [[ARG0]], [[ARG1]], [[ARG2]]
				// CHECK-NEXT: return [[RES]]
				func.func @matmul_mk_nk_mn_4x4xi32(%arg0: vector<4x4xi32>, %arg1: vector<4x4xi32>, %arg2: vector<4x4xi32>) -> vector<4x4xi32> {
				%res = vector.contract {indexing_maps = [affine_map<(d0, d1, d2) -> (d0, d2)>,
				affine_map<(d0, d1, d2) -> (d1, d2)>,
				affine_map<(d0, d1, d2) -> (d0, d1)>],
				iterator_types = ["parallel", "parallel", "reduction"],
				kind = #vector.kind<add>} %arg0, %arg1, %arg2 : vector<4x4xi32>, vector<4x4xi32> into vector<4x4xi32>
				return %res : vector<4x4xi32>
				}

				// (m,k)x(k,n)->(m,n): only the RHS is expected to be transposed.
				// CHECK-LABEL: func.func @matmul_mk_kn_mn_4x4xi32
				// CHECK-SAME: ([[ARG0:%.+]]: vector<4x4xi32>, [[ARG1:%.+]]: vector<4x4xi32>, [[ARG2:%.+]]: vector<4x4xi32>)
				// CHECK-NEXT: [[TRANS:%.+]] = vector.transpose [[ARG1]], [1, 0] : vector<4x4xi32> to vector<4x4xi32>
				// CHECK-NEXT: [[RES:%.+]] = vector.contract {{.+}} [[ARG0]], [[TRANS]], [[ARG2]]
				// CHECK-NEXT: return [[RES]]
				func.func @matmul_mk_kn_mn_4x4xi32(%arg0: vector<4x4xi32>, %arg1: vector<4x4xi32>, %arg2: vector<4x4xi32>) -> vector<4x4xi32> {
				%res = vector.contract {indexing_maps = [affine_map<(d0, d1, d2) -> (d0, d2)>,
				affine_map<(d0, d1, d2) -> (d2, d1)>,
				affine_map<(d0, d1, d2) -> (d0, d1)>],
				iterator_types = ["parallel", "parallel", "reduction"],
				kind = #vector.kind<add>} %arg0, %arg1, %arg2 : vector<4x4xi32>, vector<4x4xi32> into vector<4x4xi32>
				return %res : vector<4x4xi32>
				}

				// (m,k)x(k,n)->(m,n) with sign-extended i8 operands: the transpose is
				// expected on the narrow i8 RHS, with the extsi re-created after it.
				// CHECK-LABEL: func.func @matmul_mk_kn_mn_4x4xi8_extsi_i32
				// CHECK-SAME: ([[ARG0:%.+]]: vector<4x4xi8>, [[ARG1:%.+]]: vector<4x4xi8>, [[ARG2:%.+]]: vector<4x4xi32>)
				// CHECK-NEXT: [[LHS:%.+]] = arith.extsi [[ARG0]] : vector<4x4xi8> to vector<4x4xi32>
				// CHECK-NEXT: [[TRANS:%.+]] = vector.transpose [[ARG1]], [1, 0] : vector<4x4xi8> to vector<4x4xi8>
				// CHECK-NEXT: [[RHS:%.+]] = arith.extsi [[TRANS]] : vector<4x4xi8> to vector<4x4xi32>
				// CHECK-NEXT: [[RES:%.+]] = vector.contract {{.+}} [[LHS]], [[RHS]], [[ARG2]]
				// CHECK-NEXT: return [[RES]]
				func.func @matmul_mk_kn_mn_4x4xi8_extsi_i32(%arg0: vector<4x4xi8>, %arg1: vector<4x4xi8>, %arg2: vector<4x4xi32>) -> vector<4x4xi32> {
				%lhs = arith.extsi %arg0: vector<4x4xi8> to vector<4x4xi32>
				%rhs = arith.extsi %arg1: vector<4x4xi8> to vector<4x4xi32>
				%res = vector.contract {indexing_maps = [affine_map<(d0, d1, d2) -> (d0, d2)>,
				affine_map<(d0, d1, d2) -> (d2, d1)>,
				affine_map<(d0, d1, d2) -> (d0, d1)>],
				iterator_types = ["parallel", "parallel", "reduction"],
				kind = #vector.kind<add>} %lhs, %rhs, %arg2 : vector<4x4xi32>, vector<4x4xi32> into vector<4x4xi32>
				return %res : vector<4x4xi32>
				}

				// Check that non-square shapes are also handled: the 16x4 RHS is expected
				// to be transposed to 4x16.
				// CHECK-LABEL: func.func @matmul_mk_kn_mn_4x16xi32
				// CHECK-SAME: ([[ARG0:%.+]]: vector<4x16xi32>, [[ARG1:%.+]]: vector<16x4xi32>, [[ARG2:%.+]]: vector<4x4xi32>)
				// CHECK-NEXT: [[TRANS:%.+]] = vector.transpose [[ARG1]], [1, 0] : vector<16x4xi32> to vector<4x16xi32>
				// CHECK-NEXT: [[RES:%.+]] = vector.contract {{.+}} [[ARG0]], [[TRANS]], [[ARG2]]
				// CHECK-NEXT: return [[RES]]
				func.func @matmul_mk_kn_mn_4x16xi32(%arg0: vector<4x16xi32>, %arg1: vector<16x4xi32>, %arg2: vector<4x4xi32>) -> vector<4x4xi32> {
				%res = vector.contract {indexing_maps = [affine_map<(d0, d1, d2) -> (d0, d2)>,
				affine_map<(d0, d1, d2) -> (d2, d1)>,
				affine_map<(d0, d1, d2) -> (d0, d1)>],
				iterator_types = ["parallel", "parallel", "reduction"],
				kind = #vector.kind<add>} %arg0, %arg1, %arg2 : vector<4x16xi32>, vector<16x4xi32> into vector<4x4xi32>
				return %res : vector<4x4xi32>
				}

				// (m,k)x(k,n)->(m,n) with zero-extended i8 operands: the transpose is
				// expected on the narrow i8 RHS, with the extui re-created after it.
				// CHECK-LABEL: func.func @matmul_mk_kn_mn_4x4xi8_extui_i32
				// CHECK-SAME: ([[ARG0:%.+]]: vector<4x4xi8>, [[ARG1:%.+]]: vector<4x4xi8>, [[ARG2:%.+]]: vector<4x4xi32>)
				// CHECK-NEXT: [[LHS:%.+]] = arith.extui [[ARG0]] : vector<4x4xi8> to vector<4x4xi32>
				// CHECK-NEXT: [[TRANS:%.+]] = vector.transpose [[ARG1]], [1, 0] : vector<4x4xi8> to vector<4x4xi8>
				// CHECK-NEXT: [[RHS:%.+]] = arith.extui [[TRANS]] : vector<4x4xi8> to vector<4x4xi32>
				// CHECK-NEXT: [[RES:%.+]] = vector.contract {{.+}} [[LHS]], [[RHS]], [[ARG2]]
				// CHECK-NEXT: return [[RES]]
				func.func @matmul_mk_kn_mn_4x4xi8_extui_i32(%arg0: vector<4x4xi8>, %arg1: vector<4x4xi8>, %arg2: vector<4x4xi32>) -> vector<4x4xi32> {
				%lhs = arith.extui %arg0: vector<4x4xi8> to vector<4x4xi32>
				%rhs = arith.extui %arg1: vector<4x4xi8> to vector<4x4xi32>
				%res = vector.contract {indexing_maps = [affine_map<(d0, d1, d2) -> (d0, d2)>,
				affine_map<(d0, d1, d2) -> (d2, d1)>,
				affine_map<(d0, d1, d2) -> (d0, d1)>],
				iterator_types = ["parallel", "parallel", "reduction"],
				kind = #vector.kind<add>} %lhs, %rhs, %arg2 : vector<4x4xi32>, vector<4x4xi32> into vector<4x4xi32>
				return %res : vector<4x4xi32>
				}

				// (k,m)x(n,k)->(m,n): only the LHS is expected to be transposed.
				// CHECK-LABEL: func.func @matmul_km_nk_mn_4x4xi32
				// CHECK-SAME: ([[ARG0:%.+]]: vector<4x4xi32>, [[ARG1:%.+]]: vector<4x4xi32>, [[ARG2:%.+]]: vector<4x4xi32>)
				// CHECK-NEXT: [[TRANS:%.+]] = vector.transpose [[ARG0]], [1, 0] : vector<4x4xi32> to vector<4x4xi32>
				// CHECK-NEXT: [[RES:%.+]] = vector.contract {{.+}} [[TRANS]], [[ARG1]], [[ARG2]]
				// CHECK-NEXT: return [[RES]]
				func.func @matmul_km_nk_mn_4x4xi32(%arg0: vector<4x4xi32>, %arg1: vector<4x4xi32>, %arg2: vector<4x4xi32>) -> vector<4x4xi32> {
				%res = vector.contract {indexing_maps = [affine_map<(d0, d1, d2) -> (d2, d0)>,
				affine_map<(d0, d1, d2) -> (d1, d2)>,
				affine_map<(d0, d1, d2) -> (d0, d1)>],
				iterator_types = ["parallel", "parallel", "reduction"],
				kind = #vector.kind<add>} %arg0, %arg1, %arg2 : vector<4x4xi32>, vector<4x4xi32> into vector<4x4xi32>
				return %res : vector<4x4xi32>
				}

				// (k,m)x(k,n)->(m,n): both operands are expected to be transposed. The
				// DAG checks allow the two transposes to appear in either order.
				// CHECK-LABEL: func.func @matmul_km_kn_mn_4x4xi32
				// CHECK-SAME: ([[ARG0:%.+]]: vector<4x4xi32>, [[ARG1:%.+]]: vector<4x4xi32>, [[ARG2:%.+]]: vector<4x4xi32>)
				// CHECK-DAG: [[LHS:%.+]] = vector.transpose [[ARG0]], [1, 0] : vector<4x4xi32> to vector<4x4xi32>
				// CHECK-DAG: [[RHS:%.+]] = vector.transpose [[ARG1]], [1, 0] : vector<4x4xi32> to vector<4x4xi32>
				// CHECK-NEXT: [[RES:%.+]] = vector.contract {{.+}} [[LHS]], [[RHS]], [[ARG2]]
				// CHECK-NEXT: return [[RES]]
				func.func @matmul_km_kn_mn_4x4xi32(%arg0: vector<4x4xi32>, %arg1: vector<4x4xi32>, %arg2: vector<4x4xi32>) -> vector<4x4xi32> {
				%res = vector.contract {indexing_maps = [affine_map<(d0, d1, d2) -> (d2, d0)>,
				affine_map<(d0, d1, d2) -> (d2, d1)>,
				affine_map<(d0, d1, d2) -> (d0, d1)>],
				iterator_types = ["parallel", "parallel", "reduction"],
				kind = #vector.kind<add>} %arg0, %arg1, %arg2 : vector<4x4xi32>, vector<4x4xi32> into vector<4x4xi32>
				return %res : vector<4x4xi32>
				}

				// (k,m)x(k,n)->(m,n) with a sign-extended LHS and a zero-extended RHS: each
				// operand is expected to be transposed as i8 and then extended with its
				// original extension kind.
				// CHECK-LABEL: func.func @matmul_km_kn_mn_4x4xi8_mixed_ext_i32
				// CHECK-SAME: ([[ARG0:%.+]]: vector<4x4xi8>, [[ARG1:%.+]]: vector<4x4xi8>, [[ARG2:%.+]]: vector<4x4xi32>)
				// CHECK-DAG: [[LHST:%.+]] = vector.transpose [[ARG0]], [1, 0] : vector<4x4xi8> to vector<4x4xi8>
				// CHECK-DAG: [[LHS:%.+]] = arith.extsi [[LHST]] : vector<4x4xi8> to vector<4x4xi32>
				// CHECK-DAG: [[RHST:%.+]] = vector.transpose [[ARG1]], [1, 0] : vector<4x4xi8> to vector<4x4xi8>
				// CHECK-DAG: [[RHS:%.+]] = arith.extui [[RHST]] : vector<4x4xi8> to vector<4x4xi32>
				// CHECK-NEXT: [[RES:%.+]] = vector.contract {{.+}} [[LHS]], [[RHS]], [[ARG2]]
				// CHECK-NEXT: return [[RES]]
				func.func @matmul_km_kn_mn_4x4xi8_mixed_ext_i32(%arg0: vector<4x4xi8>, %arg1: vector<4x4xi8>, %arg2: vector<4x4xi32>) -> vector<4x4xi32> {
				%lhs = arith.extsi %arg0 : vector<4x4xi8> to vector<4x4xi32>
				%rhs = arith.extui %arg1 : vector<4x4xi8> to vector<4x4xi32>
				%res = vector.contract {indexing_maps = [affine_map<(d0, d1, d2) -> (d2, d0)>,
				affine_map<(d0, d1, d2) -> (d2, d1)>,
				affine_map<(d0, d1, d2) -> (d0, d1)>],
				iterator_types = ["parallel", "parallel", "reduction"],
				kind = #vector.kind<add>} %lhs, %rhs, %arg2 : vector<4x4xi32>, vector<4x4xi32> into vector<4x4xi32>
				return %res : vector<4x4xi32>
				}

				// Operand maps are LHS (d0, d2), RHS (d1, d2), accumulator (d1, d0): the
				// reduction dimension d2 is already last in both operands, but the
				// accumulator map is (d1, d0). Expected: no transpose is emitted; the
				// contract simply takes the two operands in swapped order.
				// CHECK-LABEL: func.func @matmul_mk_nk_nm_4x4xi32
				// CHECK-SAME: ([[ARG0:%.+]]: vector<4x4xi32>, [[ARG1:%.+]]: vector<4x4xi32>, [[ARG2:%.+]]: vector<4x4xi32>)
				// CHECK-NEXT: [[RES:%.+]] = vector.contract {{.+}} [[ARG1]], [[ARG0]], [[ARG2]]
				// CHECK-NEXT: return [[RES]]
				func.func @matmul_mk_nk_nm_4x4xi32(%arg0: vector<4x4xi32>, %arg1: vector<4x4xi32>, %arg2: vector<4x4xi32>) -> vector<4x4xi32> {
				%res = vector.contract {indexing_maps = [affine_map<(d0, d1, d2) -> (d0, d2)>,
				affine_map<(d0, d1, d2) -> (d1, d2)>,
				affine_map<(d0, d1, d2) -> (d1, d0)>],
				iterator_types = ["parallel", "parallel", "reduction"],
				kind = #vector.kind<add>} %arg0, %arg1, %arg2 : vector<4x4xi32>, vector<4x4xi32> into vector<4x4xi32>
				return %res : vector<4x4xi32>
				}

				// Operand maps are LHS (d2, d0), RHS (d2, d1), accumulator (d1, d0): the
				// reduction dimension d2 is first in both operands and the accumulator map
				// is (d1, d0). Expected: both operands are transposed with [1, 0] and then
				// passed to the contract in swapped order.
				// CHECK-LABEL: func.func @matmul_km_kn_nm_4x4xi32
				// CHECK-SAME: ([[ARG0:%.+]]: vector<4x4xi32>, [[ARG1:%.+]]: vector<4x4xi32>, [[ARG2:%.+]]: vector<4x4xi32>)
				// CHECK-DAG: [[LHS:%.+]] = vector.transpose [[ARG0]], [1, 0] : vector<4x4xi32> to vector<4x4xi32>
				// CHECK-DAG: [[RHS:%.+]] = vector.transpose [[ARG1]], [1, 0] : vector<4x4xi32> to vector<4x4xi32>
				// CHECK-NEXT: [[RES:%.+]] = vector.contract {{.+}} [[RHS]], [[LHS]], [[ARG2]]
				// CHECK-NEXT: return [[RES]]
				func.func @matmul_km_kn_nm_4x4xi32(%arg0: vector<4x4xi32>, %arg1: vector<4x4xi32>, %arg2: vector<4x4xi32>) -> vector<4x4xi32> {
				%res = vector.contract {indexing_maps = [affine_map<(d0, d1, d2) -> (d2, d0)>,
				affine_map<(d0, d1, d2) -> (d2, d1)>,
				affine_map<(d0, d1, d2) -> (d1, d0)>],
				iterator_types = ["parallel", "parallel", "reduction"],
				kind = #vector.kind<add>} %arg0, %arg1, %arg2 : vector<4x4xi32>, vector<4x4xi32> into vector<4x4xi32>
				return %res : vector<4x4xi32>
				}

				// Operand maps are LHS (d0, d2), RHS (d2, d1), accumulator (d1, d0): only the
				// RHS has the reduction dimension d2 first. Expected: only the second
				// argument is transposed, and the contract takes the transposed RHS first,
				// followed by the untouched first argument.
				// CHECK-LABEL: func.func @matmul_mk_kn_nm_4x4xi32
				// CHECK-SAME: ([[ARG0:%.+]]: vector<4x4xi32>, [[ARG1:%.+]]: vector<4x4xi32>, [[ARG2:%.+]]: vector<4x4xi32>)
				// CHECK-DAG: [[RHS:%.+]] = vector.transpose [[ARG1]], [1, 0] : vector<4x4xi32> to vector<4x4xi32>
				// CHECK-NEXT: [[RES:%.+]] = vector.contract {{.+}} [[RHS]], [[ARG0]], [[ARG2]]
				// CHECK-NEXT: return [[RES]]
				func.func @matmul_mk_kn_nm_4x4xi32(%arg0: vector<4x4xi32>, %arg1: vector<4x4xi32>, %arg2: vector<4x4xi32>) -> vector<4x4xi32> {
				%res = vector.contract {indexing_maps = [affine_map<(d0, d1, d2) -> (d0, d2)>,
				affine_map<(d0, d1, d2) -> (d2, d1)>,
				affine_map<(d0, d1, d2) -> (d1, d0)>],
				iterator_types = ["parallel", "parallel", "reduction"],
				kind = #vector.kind<add>} %arg0, %arg1, %arg2 : vector<4x4xi32>, vector<4x4xi32> into vector<4x4xi32>
				return %res : vector<4x4xi32>
				}

				// Operand maps are LHS (d2, d0), RHS (d1, d2), accumulator (d1, d0): only the
				// LHS has the reduction dimension d2 first. Expected: only the first
				// argument is transposed, and the contract takes the untouched second
				// argument first, followed by the transposed LHS.
				// CHECK-LABEL: func.func @matmul_km_nk_nm_4x4xi32
				// CHECK-SAME: ([[ARG0:%.+]]: vector<4x4xi32>, [[ARG1:%.+]]: vector<4x4xi32>, [[ARG2:%.+]]: vector<4x4xi32>)
				// CHECK-DAG: [[LHS:%.+]] = vector.transpose [[ARG0]], [1, 0] : vector<4x4xi32> to vector<4x4xi32>
				// CHECK-NEXT: [[RES:%.+]] = vector.contract {{.+}} [[ARG1]], [[LHS]], [[ARG2]]
				// CHECK-NEXT: return [[RES]]
				func.func @matmul_km_nk_nm_4x4xi32(%arg0: vector<4x4xi32>, %arg1: vector<4x4xi32>, %arg2: vector<4x4xi32>) -> vector<4x4xi32> {
				%res = vector.contract {indexing_maps = [affine_map<(d0, d1, d2) -> (d2, d0)>,
				affine_map<(d0, d1, d2) -> (d1, d2)>,
				affine_map<(d0, d1, d2) -> (d1, d0)>],
				iterator_types = ["parallel", "parallel", "reduction"],
				kind = #vector.kind<add>} %arg0, %arg1, %arg2 : vector<4x4xi32>, vector<4x4xi32> into vector<4x4xi32>
				return %res : vector<4x4xi32>
				}

mlir/test/lib/Dialect/Vector/TestVectorTransforms.cpp

//===- TestVectorTransforms.cpp - Test Vector transforms and lowerings ----===//		//===- TestVectorTransforms.cpp - Test Vector transforms and lowerings ----===//
//		//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.		// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.		// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception		// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//		//
//===----------------------------------------------------------------------===//		//===----------------------------------------------------------------------===//

#include <type_traits>		#include <type_traits>
#include <optional>		#include <optional>

#include "mlir/Analysis/SliceAnalysis.h"		#include "mlir/Analysis/SliceAnalysis.h"
#include "mlir/Dialect/Affine/IR/AffineOps.h"		#include "mlir/Dialect/Affine/IR/AffineOps.h"
		#include "mlir/Dialect/Arith/IR/Arith.h"
#include "mlir/Dialect/Func/IR/FuncOps.h"		#include "mlir/Dialect/Func/IR/FuncOps.h"
#include "mlir/Dialect/GPU/IR/GPUDialect.h"		#include "mlir/Dialect/GPU/IR/GPUDialect.h"
#include "mlir/Dialect/LLVMIR/LLVMDialect.h"		#include "mlir/Dialect/LLVMIR/LLVMDialect.h"
#include "mlir/Dialect/Linalg/IR/Linalg.h"		#include "mlir/Dialect/Linalg/IR/Linalg.h"
#include "mlir/Dialect/Linalg/Passes.h"		#include "mlir/Dialect/Linalg/Passes.h"
#include "mlir/Dialect/Linalg/Transforms/Transforms.h"		#include "mlir/Dialect/Linalg/Transforms/Transforms.h"
#include "mlir/Dialect/MemRef/IR/MemRef.h"		#include "mlir/Dialect/MemRef/IR/MemRef.h"
#include "mlir/Dialect/SCF/IR/SCF.h"		#include "mlir/Dialect/SCF/IR/SCF.h"
▲ Show 20 Lines • Show All 172 Lines • ▼ Show 20 Lines	void runOnOperation() override {
populateVectorBroadcastLoweringPatterns(patterns);		populateVectorBroadcastLoweringPatterns(patterns);
populateVectorContractLoweringPatterns(patterns, options);		populateVectorContractLoweringPatterns(patterns, options);
populateVectorMaskOpLoweringPatterns(patterns);		populateVectorMaskOpLoweringPatterns(patterns);
populateVectorShapeCastLoweringPatterns(patterns);		populateVectorShapeCastLoweringPatterns(patterns);
(void)applyPatternsAndFoldGreedily(getOperation(), std::move(patterns));		(void)applyPatternsAndFoldGreedily(getOperation(), std::move(patterns));
}		}
};		};

		/// Test-only function pass that greedily applies the patterns registered by
		/// `vector::populateVectorContractCanonicalizeMatmulToMMT` to each
		/// `func::FuncOp` it runs on.
		struct TestVectorContractionPrepareForMMTLowering
		    : public PassWrapper<TestVectorContractionPrepareForMMTLowering,
		                         OperationPass<func::FuncOp>> {
		  MLIR_DEFINE_EXPLICIT_INTERNAL_INLINE_TYPE_ID(
		      TestVectorContractionPrepareForMMTLowering)

		  TestVectorContractionPrepareForMMTLowering() = default;

		  /// Command-line flag under which the pass is registered.
		  StringRef getArgument() const final {
		    return "test-vector-contraction-prepare-for-mmt-lowering";
		  }

		  /// One-line summary reported for the pass.
		  StringRef getDescription() const final {
		    return "Test vector.contraction matmul canonicalization for MMT lowering.";
		  }

		  /// Declares the dialects that must be loaded before the pass runs.
		  void getDependentDialects(DialectRegistry &registry) const override {
		    registry.insert<AffineDialect>();
		    registry.insert<arith::ArithDialect>();
		    registry.insert<vector::VectorDialect>();
		  }

		  /// Collects the matmul-to-MMT canonicalization patterns and runs the greedy
		  /// rewrite driver over the current function.
		  void runOnOperation() override {
		    RewritePatternSet patterns(&getContext());
		    vector::populateVectorContractCanonicalizeMatmulToMMT(patterns);
		    // The driver's result is explicitly discarded.
		    (void)applyPatternsAndFoldGreedily(getOperation(), std::move(patterns));
		  }
		};

struct TestVectorTransposeLowering		struct TestVectorTransposeLowering
: public PassWrapper<TestVectorTransposeLowering,		: public PassWrapper<TestVectorTransposeLowering,
OperationPass<func::FuncOp>> {		OperationPass<func::FuncOp>> {
MLIR_DEFINE_EXPLICIT_INTERNAL_INLINE_TYPE_ID(TestVectorTransposeLowering)		MLIR_DEFINE_EXPLICIT_INTERNAL_INLINE_TYPE_ID(TestVectorTransposeLowering)

StringRef getArgument() const final {		StringRef getArgument() const final {
return "test-vector-transpose-lowering";		return "test-vector-transpose-lowering";
}		}
▲ Show 20 Lines • Show All 677 Lines • ▼ Show 20 Lines

namespace mlir {		namespace mlir {
namespace test {		namespace test {
void registerTestVectorLowerings() {		void registerTestVectorLowerings() {
PassRegistration<TestVectorToVectorLowering>();		PassRegistration<TestVectorToVectorLowering>();

PassRegistration<TestVectorContractionLowering>();		PassRegistration<TestVectorContractionLowering>();

		PassRegistration<TestVectorContractionPrepareForMMTLowering>();

PassRegistration<TestVectorTransposeLowering>();		PassRegistration<TestVectorTransposeLowering>();

PassRegistration<TestVectorUnrollingPatterns>();		PassRegistration<TestVectorUnrollingPatterns>();

PassRegistration<TestVectorTransferUnrollingPatterns>();		PassRegistration<TestVectorTransferUnrollingPatterns>();

PassRegistration<TestVectorTransferFullPartialSplitPatterns>();		PassRegistration<TestVectorTransferFullPartialSplitPatterns>();

Show All 26 Lines

This is an archive of the discontinued LLVM Phabricator instance.

[mlir][vector][nvgpu] Move MMA contraction preparation to VectorUtils
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 503871

mlir/include/mlir/Dialect/NVGPU/Utils/MMAUtils.h

mlir/include/mlir/Dialect/Vector/Transforms/VectorRewritePatterns.h

mlir/lib/Conversion/VectorToGPU/VectorToGPU.cpp

mlir/lib/Dialect/NVGPU/Utils/MMAUtils.cpp

mlir/lib/Dialect/Vector/Transforms/VectorTransforms.cpp

mlir/test/Dialect/Vector/vector-contract-matmul-transforms.mlir

mlir/test/lib/Dialect/Vector/TestVectorTransforms.cpp

This is an archive of the discontinued LLVM Phabricator instance.

[mlir][vector][nvgpu] Move MMA contraction preparation to VectorUtils
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 503871

mlir/include/mlir/Dialect/NVGPU/Utils/MMAUtils.h

mlir/include/mlir/Dialect/Vector/Transforms/VectorRewritePatterns.h

mlir/lib/Conversion/VectorToGPU/VectorToGPU.cpp

mlir/lib/Dialect/NVGPU/Utils/MMAUtils.cpp

mlir/lib/Dialect/Vector/Transforms/VectorTransforms.cpp

mlir/test/Dialect/Vector/vector-contract-matmul-transforms.mlir

mlir/test/lib/Dialect/Vector/TestVectorTransforms.cpp

[mlir][vector][nvgpu] Move MMA contraction preparation to VectorUtils
ClosedPublic