Transpose operations on constant data were being folded during canonicalization. That folding has a compile-time cost proportional to the size of the constant. This change moves the folding into a separate pass, making it optional and giving more flexibility in how such cases are handled.
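For context, a minimal sketch of what such a folding pattern can look like; this is not the patch's actual code. The pattern name, the accessor names (getInput1, getPerms), and the perms-as-operand form are assumptions matching the TOSA dialect of the time, and transposeElements is a hypothetical helper.

```cpp
#include "mlir/Dialect/Tosa/IR/TosaOps.h"
#include "mlir/IR/Matchers.h"
#include "mlir/IR/PatternMatch.h"

using namespace mlir;

// Hypothetical helper (declaration only): materializes the permuted copy of
// the data. This is the step whose compile-time cost grows with the size of
// the constant.
DenseElementsAttr transposeElements(DenseElementsAttr input,
                                    DenseElementsAttr perms, Type resultType);

namespace {
// Fold tosa.transpose when both its data and its permutation are constants.
struct FoldConstantTranspose : public OpRewritePattern<tosa::TransposeOp> {
  using OpRewritePattern::OpRewritePattern;

  LogicalResult matchAndRewrite(tosa::TransposeOp op,
                                PatternRewriter &rewriter) const override {
    DenseElementsAttr input, perms;
    if (!matchPattern(op.getInput1(), m_Constant(&input)) ||
        !matchPattern(op.getPerms(), m_Constant(&perms)))
      return failure();

    // Replace the transpose with a single constant holding the permuted data.
    DenseElementsAttr folded = transposeElements(input, perms, op.getType());
    rewriter.replaceOpWithNewOp<tosa::ConstOp>(op, op.getType(), folded);
    return success();
  }
};
} // namespace
```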
Event Timeline
mlir/lib/Dialect/Tosa/Transforms/TosaConstantFoldPass.cpp:33
> You will want to include the canonicalization patterns as well. It is valuable to run the ConstantFoldPass separately; however, when we do finally apply it, we will want it alternating with canonicalizations to guarantee the patterns run to completion.
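A sketch of how that could look, mirroring the way the generic Canonicalizer pass gathers patterns; populateTosaFoldConstantPatterns is a hypothetical entry point standing in for the folding patterns this patch adds.

```cpp
#include "mlir/IR/MLIRContext.h"
#include "mlir/IR/PatternMatch.h"
#include "mlir/Transforms/GreedyPatternRewriteDriver.h"

using namespace mlir;

// Hypothetical entry point for the pass's own constant-folding patterns.
void populateTosaFoldConstantPatterns(MLIRContext *ctx,
                                      RewritePatternSet &patterns);

static LogicalResult foldAndCanonicalize(Operation *root) {
  MLIRContext *ctx = root->getContext();
  RewritePatternSet patterns(ctx);
  populateTosaFoldConstantPatterns(ctx, patterns);
  // The same loop the Canonicalizer pass uses: collect every registered op's
  // canonicalization patterns so the greedy driver can alternate them with
  // the folding patterns until a fixed point is reached.
  for (RegisteredOperationName op : ctx->getRegisteredOperations())
    op.getCanonicalizationPatterns(patterns, ctx);
  return applyPatternsAndFoldGreedily(root, std::move(patterns));
}
```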
mlir/lib/Dialect/Tosa/Transforms/TosaFoldConstantTranspose.cpp:92
> Add newline.
mlir/test/Dialect/Tosa/canonicalize.mlir:411
> Add newline back.
mlir/test/Dialect/Tosa/consant-op-fold.mlir:118 (On Diff #426107)
> Add newline back.
mlir/lib/Dialect/Tosa/Transforms/TosaConstantFoldPass.cpp:33
> Are you suggesting, @rsuderman, that we register the TOSA-related canonicalization patterns here as well?
Second observation: can you include this pass after the canonicalizer when lowering to linalg?
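For concreteness, the ordering being asked about might be assembled as below; createTosaConstantFoldPass and buildTosaLoweringPipeline are hypothetical names, while the canonicalizer and TOSA-to-linalg create functions are the existing entry points.

```cpp
#include "mlir/Conversion/TosaToLinalg/TosaToLinalg.h"
#include "mlir/Dialect/Func/IR/FuncOps.h"
#include "mlir/Pass/PassManager.h"
#include "mlir/Transforms/Passes.h"

// Canonicalize first, fold constants next, and only then lower to linalg.
void buildTosaLoweringPipeline(mlir::OpPassManager &pm) {
  pm.addNestedPass<mlir::func::FuncOp>(mlir::createCanonicalizerPass());
  pm.addNestedPass<mlir::func::FuncOp>(
      mlir::tosa::createTosaConstantFoldPass()); // hypothetical create function
  pm.addNestedPass<mlir::func::FuncOp>(mlir::tosa::createTosaToLinalg());
}
```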
mlir/lib/Dialect/Tosa/Transforms/TosaConstantFoldPass.cpp:33
> Yes, I believe so. I'll break down the logic: it is reasonably common to see the pattern transpose-reshape-transpose. If we only run the transpose constant propagation, the first transpose will be constant folded and the next reshape will be canonicalized, but the second transpose will never have an opportunity to constant propagate. It sounds silly, but this may actually significantly affect codegen performance.
Good point about potentially expensive operations here. I wonder: why is/was this a canonicalization pattern rather than a fold() implementation?
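For reference on the alternative being raised: a fold() hook body would compute roughly the following, sketched here as a free function (a real hook would require `let hasFolder = 1;` on the op, and this assumes the pre-FoldAdaptor signature of the time and the same hypothetical transposeElements helper as above). Since fold() runs implicitly inside canonicalization and most rewrite drivers, its size-proportional cost could not be opted out of.

```cpp
#include "mlir/Dialect/Tosa/IR/TosaOps.h"

using namespace mlir;

// Hypothetical helper (declaration only), as in the earlier sketch.
DenseElementsAttr transposeElements(DenseElementsAttr input,
                                    DenseElementsAttr perms, Type resultType);

// What a folder would do: constant operands arrive pre-materialized as
// attributes, and returning an attribute replaces the op's result in place.
static OpFoldResult foldConstantTranspose(tosa::TransposeOp op,
                                          ArrayRef<Attribute> operands) {
  auto input = operands[0].dyn_cast_or_null<DenseElementsAttr>();
  auto perms = operands[1].dyn_cast_or_null<DenseElementsAttr>();
  if (!input || !perms)
    return {};
  return transposeElements(input, perms, op.getType());
}
```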
mlir/lib/Dialect/Tosa/Transforms/TosaConstantFoldPass.cpp:33
> An expansion like https://github.com/llvm/llvm-project/blob/12e41d9264b6f84213be86aab75016fb82ebc1d1/mlir/lib/Dialect/Tosa/IR/TosaOps.cpp#L78 may help ease adding all the canonicalization patterns in here without needing to duplicate them.
mlir/lib/Dialect/Tosa/Transforms/TosaFoldConstantTranspose.cpp:30
> I'd move this closer to its first use: in general, the preference is for the smallest scope/live range possible.
Not sure, @jpienaar, why this was registered as a canonicalization originally. I can say, though, that I have noticed it being quite expensive. Moreover, from what I recall, a similar folding step takes place at the Linalg level.
This folding operation predates the Linalg folding by roughly six months. It is likely we want to maintain the TOSA folding anyway, as not every TOSA device is guaranteed to use Linalg.
LGTM (and yay for usage of LITERAL ;-))
mlir/include/mlir/Dialect/Tosa/Transforms/Passes.td:21
> Is element-wise a restriction of this pass?
mlir/include/mlir/Dialect/Tosa/Transforms/Passes.td:21
> As it stands now, it doesn't really have any restrictions; I was trying to limit its scope ahead of time. Happy to rephrase, or to leave it as is and change its scope if needed in the future.
Can you clarify the revision description? You refer to some "unbound computation", which isn't clear to me. I think the whole motivation and rationale could be better spelled out.
(Also, please remove the Change-Id: I7ec0f8b15ca6bc9aa2116488dcf6c684c9826ddd part, which seems to be a leftover from some other system?)
Hey @mehdi_amini, thanks for your comments. I simplified the commit message a bit and removed the Change-Id part.
Generally LGTM, although we may want to further constrain this in a follow-up. In general, I am pro having optimization passes and having them be truly optional. I would be tempted to name this "TensorDataConstantOptimizationPass".
mlir/lib/Conversion/TosaToLinalg/TosaToLinalgPass.cpp:79
> I am fairly certain that we will want to remove this -- optimizations like this are orthogonal to actually lowering to linalg, and it is fairly important that optimization passes be kept separate from lowerings. This qualifies to me as an optimization because it has a cost model (i.e., only apply if the constant has a single use) which we will likely want to vary.
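The cost model referenced here, sketched as a hypothetical predicate: folding materializes a second copy of the data, so it only clearly pays off when the transpose is the constant's sole user.

```cpp
#include "mlir/Dialect/Tosa/IR/TosaOps.h"

// Hypothetical profitability check: if the source constant has other users,
// folding duplicates the tensor data rather than replacing it.
static bool isProfitableToFold(mlir::tosa::TransposeOp op) {
  return op.getInput1().hasOneUse();
}
```

Varying that predicate, for example with a size threshold, is the kind of adjustment the comment anticipates.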
Will make the change and rename per your suggestion, @stellaraccident.
mlir/lib/Conversion/TosaToLinalg/TosaToLinalgPass.cpp:79
> Agreed. In my original patch this wasn't registered in the TosaToLinalg conversion pipeline; it was added back after a suggestion from @rsuderman. Happy to remove it.
mlir/lib/Conversion/TosaToLinalg/TosaToLinalgPass.cpp:79
> It looks like this pipeline has some potential phase-ordering concerns, so I'll defer to @rsuderman on the next step. If this is a temporary step to preserve current behavior, I am fine keeping it (to be removed in a future cleanup), but if that is the case, let's add a TODO.
mlir/lib/Conversion/TosaToLinalg/TosaToLinalgPass.cpp:79
> We should be good having it inlined here. If we see a regression related to convolutional models, we may have to adjust the constant folding. Overall it should still be fine with the linalg constant folding, but this should be good enough for now.