Diff 337977

mlir/include/mlir/Dialect/Vector/VectorOps.td

Show First 20 Lines • Show All 1,415 Lines • ▼ Show 20 Lines	OpBuilder<(ins "Value":$vector, "Value":$source, "ValueRange":$indices,
"AffineMapAttr":$permutationMap, "ArrayAttr":$inBounds)>,		"AffineMapAttr":$permutationMap, "ArrayAttr":$inBounds)>,
OpBuilder<(ins "Value":$vector, "Value":$source, "ValueRange":$indices,		OpBuilder<(ins "Value":$vector, "Value":$source, "ValueRange":$indices,
"AffineMap":$permutationMap, "Value":$mask, "ArrayAttr":$inBounds)>,		"AffineMap":$permutationMap, "Value":$mask, "ArrayAttr":$inBounds)>,
OpBuilder<(ins "Value":$vector, "Value":$source, "ValueRange":$indices,		OpBuilder<(ins "Value":$vector, "Value":$source, "ValueRange":$indices,
"AffineMap":$permutationMap, "ArrayAttr":$inBounds)>,		"AffineMap":$permutationMap, "ArrayAttr":$inBounds)>,
];		];

let hasFolder = 1;		let hasFolder = 1;
		let hasCanonicalizer = 1;
}		}

def Vector_LoadOp : Vector_Op<"load"> {		def Vector_LoadOp : Vector_Op<"load"> {
let summary = "reads an n-D slice of memory into an n-D vector";		let summary = "reads an n-D slice of memory into an n-D vector";
let description = [{		let description = [{
The 'vector.load' operation reads an n-D slice of memory into an n-D		The 'vector.load' operation reads an n-D slice of memory into an n-D
vector. It takes a 'base' memref, an index for each memref dimension and a		vector. It takes a 'base' memref, an index for each memref dimension and a
result vector type as arguments. It returns a value of the result vector		result vector type as arguments. It returns a value of the result vector
▲ Show 20 Lines • Show All 975 Lines • Show Last 20 Lines

mlir/include/mlir/Dialect/Vector/VectorUtils.h

Show All 22 Lines
class Location;		class Location;
class OpBuilder;		class OpBuilder;
class Operation;		class Operation;
class ShapedType;		class ShapedType;
class Value;		class Value;
class VectorType;		class VectorType;
class VectorTransferOpInterface;		class VectorTransferOpInterface;

		namespace vector {
		class TransferWriteOp;
		class TransferReadOp;
		} // namespace vector

/// Return the number of elements of basis, `0` if empty.		/// Return the number of elements of basis, `0` if empty.
int64_t computeMaxLinearIndex(ArrayRef<int64_t> basis);		int64_t computeMaxLinearIndex(ArrayRef<int64_t> basis);

/// Given a shape with sizes greater than 0 along all dimensions,		/// Given a shape with sizes greater than 0 along all dimensions,
/// return the distance, in number of elements, between a slice in a dimension		/// return the distance, in number of elements, between a slice in a dimension
/// and the next slice in the same dimension.		/// and the next slice in the same dimension.
/// e.g. shape[3, 4, 5] -> linearization_basis[20, 5, 1]		/// e.g. shape[3, 4, 5] -> linearization_basis[20, 5, 1]
SmallVector<int64_t, 8> computeStrides(ArrayRef<int64_t> shape);		SmallVector<int64_t, 8> computeStrides(ArrayRef<int64_t> shape);
▲ Show 20 Lines • Show All 133 Lines • ▼ Show 20 Lines	bool isDisjointTransferSet(VectorTransferOpInterface transferA,
VectorTransferOpInterface transferB);		VectorTransferOpInterface transferB);

/// Same behavior as `isDisjointTransferSet` but doesn't require the operations		/// Same behavior as `isDisjointTransferSet` but doesn't require the operations
/// to have the same tensor/memref. This allows comparing operations accessing		/// to have the same tensor/memref. This allows comparing operations accessing
/// different tensors.		/// different tensors.
bool isDisjointTransferIndices(VectorTransferOpInterface transferA,		bool isDisjointTransferIndices(VectorTransferOpInterface transferA,
VectorTransferOpInterface transferB);		VectorTransferOpInterface transferB);

		/// Return true if the transfer_write fully writes the data accessed by the
		/// transfer_read.
		bool transferEncompasses(vector::TransferWriteOp defWrite,
		vector::TransferReadOp read);

		/// Return true if the write op fully overwrites the priorWrite transfer_write
		/// op.
		bool transferEncompasses(vector::TransferWriteOp write,
		vector::TransferWriteOp priorWrite);

namespace matcher {		namespace matcher {

/// Matches vector.transfer_read, vector.transfer_write and ops that return a		/// Matches vector.transfer_read, vector.transfer_write and ops that return a
/// vector type that is a multiple of the sub-vector type. This allows passing		/// vector type that is a multiple of the sub-vector type. This allows passing
/// over other smaller vector types in the function and avoids interfering with		/// over other smaller vector types in the function and avoids interfering with
/// operations on those.		/// operations on those.
/// This is a first approximation, it can easily be extended in the future.		/// This is a first approximation, it can easily be extended in the future.
/// TODO: this could all be much simpler if we added a bit that a vector type to		/// TODO: this could all be much simpler if we added a bit that a vector type to
/// mark that a vector is a strict super-vector but it still does not warrant		/// mark that a vector is a strict super-vector but it still does not warrant
/// adding even 1 extra bit in the IR for now.		/// adding even 1 extra bit in the IR for now.
bool operatesOnSuperVectorsOf(Operation &op, VectorType subVectorType);		bool operatesOnSuperVectorsOf(Operation &op, VectorType subVectorType);

} // end namespace matcher		} // end namespace matcher
} // end namespace mlir		} // end namespace mlir

#endif // MLIR_DIALECT_VECTOR_VECTORUTILS_H_		#endif // MLIR_DIALECT_VECTOR_VECTORUTILS_H_

mlir/lib/Dialect/Vector/VectorOps.cpp

Show First 20 Lines • Show All 2,506 Lines • ▼ Show 20 Lines	if (!changed)
return failure();		return failure();
// OpBuilder is only used as a helper to build an I64ArrayAttr.		// OpBuilder is only used as a helper to build an I64ArrayAttr.
OpBuilder b(op.getContext());		OpBuilder b(op.getContext());
op->setAttr(TransferOp::getInBoundsAttrName(),		op->setAttr(TransferOp::getInBoundsAttrName(),
b.getBoolArrayAttr(newInBounds));		b.getBoolArrayAttr(newInBounds));
return success();		return success();
}		}

		/// Fold a transfer_read on a ranked tensor into the vector stored by a
		/// preceding transfer_write (read after write). The chain of transfer_write
		/// ops defining the read source is walked upwards: a write that fully covers
		/// the read provides the result, writes whose indices are disjoint from the
		/// read are skipped, and the walk stops at the first write that is neither.
		/// Returns a null Value when no fold applies.
		/// ```
		/// %w0 = vector.transfer_write %v0, %arg0[%c1, %c0] {in_bounds = [true, true]}
		/// : vector<1x4xf32>, tensor<4x4xf32>
		/// %0 = vector.transfer_read %w0[%c1, %c0], %cf0 {in_bounds = [true, true]}
		Lint: Pre-merge checks Inline Actions clang-format: please reformat the code -/// %0 = vector.transfer_read %w0[%c1, %c0], %cf0 {in_bounds = [true, true]} +/// %0 = vector.transfer_read %w0[%c1, %c0], %cf0 {in_bounds = [true, true]} Lint: Pre-merge checks: clang-format: please reformat the code ``` -/// %0 = vector.transfer_read %w0[%c1, %c0], %cf0…
		/// : tensor<4x4xf32>, vector<1x4xf32>
		/// ```
		/// -> Folds into
		/// ```
		/// %v0
		/// ```
		static Value foldTransferWriteIntoTransferRead(TransferReadOp readOp) {
		nicolasvasilacheUnsubmitted Done Reply Inline Actions I'd suggest to rename `foldRAW` so it becomes very clear what type of folding this is and how it relates to the others. nicolasvasilache: I'd suggest to rename `foldRAW` so it becomes very clear what type of folding this is and how…
		// Only reads from ranked tensors are handled by this fold.
		if (!readOp.getShapedType().isa<RankedTensorType>())
		return {};
		auto defWrite = readOp.source().getDefiningOp<vector::TransferWriteOp>();
		while (defWrite) {
		// The write fully covers the read: forward the written vector.
		if (transferEncompasses(defWrite, readOp))
		nicolasvasilacheUnsubmitted Done Reply Inline Actions I'd suggest to rename `checkSameValueRAW` (or a better name but with RAW in it) so it becomes very clear what type of folding this is and how it relates to the others. nicolasvasilache: I'd suggest to rename `checkSameValueRAW` (or a better name but with RAW in it) so it becomes…
		return defWrite.vector();
		// Give up unless the write is known not to overlap the data being read.
		if (!isDisjointTransferIndices(
		cast<VectorTransferOpInterface>(defWrite.getOperation()),
		cast<VectorTransferOpInterface>(readOp.getOperation())))
		break;
		// Disjoint write: keep looking at the write that produced its source.
		defWrite = defWrite.source().getDefiningOp<vector::TransferWriteOp>();
		}
		return {};
		}

OpFoldResult TransferReadOp::fold(ArrayRef<Attribute>) {		OpFoldResult TransferReadOp::fold(ArrayRef<Attribute>) {
		if (Value vec = foldTransferWriteIntoTransferRead(*this))
		return vec;
/// transfer_read(memrefcast) -> transfer_read		/// transfer_read(memrefcast) -> transfer_read
if (succeeded(foldTransferInBoundsAttribute(*this)))		if (succeeded(foldTransferInBoundsAttribute(*this)))
return getResult();		return getResult();
if (succeeded(foldMemRefCast(*this)))		if (succeeded(foldMemRefCast(*this)))
return getResult();		return getResult();
if (succeeded(foldTensorCast(*this)))		if (succeeded(foldTensorCast(*this)))
return getResult();		return getResult();
return OpFoldResult();		return OpFoldResult();
▲ Show 20 Lines • Show All 195 Lines • ▼ Show 20 Lines	static LogicalResult foldReadInitWrite(TransferWriteOp write,
if (llvm::any_of(read.indices(), isNotConstantZero) \|\|		if (llvm::any_of(read.indices(), isNotConstantZero) \|\|
llvm::any_of(write.indices(), isNotConstantZero))		llvm::any_of(write.indices(), isNotConstantZero))
return failure();		return failure();
// Success.		// Success.
results.push_back(read.source());		results.push_back(read.source());
return success();		return success();
}		}

		/// Fold transfer_write write after read:
		/// ```
		/// %t0 = ...
		/// %v = vector.transfer_read %t0[%c0...] :
		/// tensor<static_sizesxf32>, vector<static_sizesxf32>
		/// %t1 = vector.transfer_write %v, %t0[%c0...] :
		/// vector<static_sizesxf32>, tensor<static_sizesxf32>
		/// ```
		///
		/// into:
		///
		/// ```
		/// %t0
		/// ```
		///
		/// On success the source of the read is appended to `results`; otherwise
		/// failure is returned and `results` is left untouched.
		static LogicalResult
		foldWriteAfterRead(TransferWriteOp write,
		nicolasvasilacheUnsubmitted Done Reply Inline Actions I'd suggest to rename `foldWAR` so it becomes very clear what type of folding this is and how it relates to the others. nicolasvasilache: I'd suggest to rename `foldWAR` so it becomes very clear what type of folding this is and how…
		SmallVectorImpl<OpFoldResult> &results) {
		// Only writes whose destination is a ranked tensor are folded.
		if (!write.source().getType().isa<RankedTensorType>())
		return failure();
		// The written vector must come directly from a transfer_read.
		auto read = write.vector().getDefiningOp<vector::TransferReadOp>();
		if (!read)
		return failure();

		// The read and the write must access the same tensor with the same indices,
		// permutation map and vector type, and neither may be masked.
		if (read.source() != write.source() \|\| read.indices() != write.indices() \|\|
		nicolasvasilacheUnsubmitted Done Reply Inline Actions I'd suggest hoisting that in a helper `checkSameValueWAR` (or a better name but with RAW in it) so it becomes very clear what type of folding this is and how it relates to the others. nicolasvasilache: I'd suggest hoisting that in a helper `checkSameValueWAR` (or a better name but with RAW in it)…
		read.permutation_map() != write.permutation_map() \|\|
		read.getVectorType() != write.getVectorType() \|\| read.mask() \|\|
		write.mask())
		return failure();
		results.push_back(read.source());
		return success();
		}

LogicalResult TransferWriteOp::fold(ArrayRef<Attribute> operands,		LogicalResult TransferWriteOp::fold(ArrayRef<Attribute> operands,
SmallVectorImpl<OpFoldResult> &results) {		SmallVectorImpl<OpFoldResult> &results) {
if (succeeded(foldReadInitWrite(*this, operands, results)))		if (succeeded(foldReadInitWrite(*this, operands, results)))
return success();		return success();
		if (succeeded(foldWriteAfterRead(*this, results)))
		return success();
if (succeeded(foldTransferInBoundsAttribute(*this)))		if (succeeded(foldTransferInBoundsAttribute(*this)))
return success();		return success();
return foldMemRefCast(*this);		return foldMemRefCast(*this);
}		}

Optional<SmallVector<int64_t, 4>> TransferWriteOp::getShapeForUnroll() {		Optional<SmallVector<int64_t, 4>> TransferWriteOp::getShapeForUnroll() {
return llvm::to_vector<4>(getVectorType().getShape());		return llvm::to_vector<4>(getVectorType().getShape());
}		}

void TransferWriteOp::getEffects(		void TransferWriteOp::getEffects(
SmallVectorImpl<SideEffects::EffectInstance<MemoryEffects::Effect>>		SmallVectorImpl<SideEffects::EffectInstance<MemoryEffects::Effect>>
&effects) {		&effects) {
if (getShapedType().isa<MemRefType>())		if (getShapedType().isa<MemRefType>())
effects.emplace_back(MemoryEffects::Write::get(), source(),		effects.emplace_back(MemoryEffects::Write::get(), source(),
SideEffects::DefaultResource::get());		SideEffects::DefaultResource::get());
}		}

		namespace {
		/// Remove dead transfer write from the SSA chain so that it can be eliminated
		/// by DCE.
		/// ```
		/// %w0 = vector.transfer_write %v0, %arg0[%c1, %c0] {in_bounds = [true, true]}
		/// : vector<1x4xf32>, tensor<4x4xf32>
		/// %w1 = vector.transfer_write %v0, %w0[%c2, %c0] {in_bounds = [true, true]}
		/// : vector<1x4xf32>, tensor<4x4xf32>
		/// %w2 = vector.transfer_write %v1, %w1[%c1, %c0] {in_bounds = [true, true]}
		/// : vector<1x4xf32>, tensor<4x4xf32>
		/// ```
		///
		/// into:
		///
		/// ```
		/// %w0 = vector.transfer_write %v0, %arg0[%c1, %c0] {in_bounds = [true, true]}
		/// : vector<1x4xf32>, tensor<4x4xf32>
		/// %w1 = vector.transfer_write %v0, %arg0[%c2, %c0] {in_bounds = [true, true]}
		/// : vector<1x4xf32>, tensor<4x4xf32>
		/// %w2 = vector.transfer_write %v1, %w1[%c1, %c0] {in_bounds = [true, true]}
		/// : vector<1x4xf32>, tensor<4x4xf32>
		/// ```
		///
		/// `%w0 = vector.transfer_write` op will be removed by DCE if it doesn't have
		/// any other uses.
		class DeadTransferWrite final : public OpRewritePattern<TransferWriteOp> {
		nicolasvasilacheUnsubmitted Done Reply Inline Actions I'd suggest to rename foldRAW so it becomes very clear what type of folding this is and how it relates to the others. nicolasvasilache: I'd suggest to rename foldRAW so it becomes very clear what type of folding this is and how it…
		public:
		  using OpRewritePattern<TransferWriteOp>::OpRewritePattern;
		  /// Walk up the chain of transfer_write ops feeding `writeOp`. When a prior
		  /// write is fully overwritten by `writeOp`, bypass it by rewiring the source
		  /// of the write sitting directly above it in the chain. Returns success only
		  /// when the IR was modified.
		  LogicalResult matchAndRewrite(TransferWriteOp writeOp,
		nicolasvasilacheUnsubmitted Not Done Reply Inline Actions Why does this need to be a canonicalization pattern and not a simple fold ? At some point in space time, https://reviews.llvm.org/D100586 had it working as a folder. nicolasvasilache: Why does this need to be a canonicalization pattern and not a simple fold ? At some point in…
		ThomasRaouxAuthorUnsubmitted Done Reply Inline Actions If we want to support looking more than one level up in the WaW case we need to modify a Transfer_write that isn't the root like in the example here: %w0 = vector.transfer_write %v0, %arg0[%c1, %c0] {in_bounds = [true, true]} : vector<1x4xf32>, tensor<4x4xf32> %w1 = vector.transfer_write %v0, %arg0[%c2, %c0] {in_bounds = [true, true]} : vector<1x4xf32>, tensor<4x4xf32> %w2 = vector.transfer_write %v1, %w1[%c1, %c0] {in_bounds = [true, true]} : vector<1x4xf32>, tensor<4x4xf32> In this case we need to update %w1. It could be implemented as a folding starting from %w0 considering only the case where the write has a single use and going through the SSA chain in the other direction. Do you think this is better? ThomasRaoux: If we want to support looking more than one level up in the WaW case we need to modify a…
		nicolasvasilacheUnsubmitted Not Done Reply Inline Actions I had missed that is more powerful than what you could get with a folder and hop-1 use-def. This is great as is, thanks! nicolasvasilache: I had missed that is more powerful than what you could get with a folder and hop-1 use-def.
		                                PatternRewriter &rewriter) const override {
		    // Only tensor-semantics writes form an SSA chain that can be rewired.
		    if (!writeOp.getShapedType().isa<RankedTensorType>())
		      return failure();
		    // The write whose source operand is rewired once a dead write is found;
		    // it is always the op directly above `defWrite` in the chain.
		    vector::TransferWriteOp writeToModify = writeOp;
		    auto defWrite = writeOp.source().getDefiningOp<vector::TransferWriteOp>();
		    while (defWrite) {
		      if (transferEncompasses(writeOp, defWrite)) {
		nicolasvasilacheUnsubmitted Done Reply Inline Actions I'd suggest to rename `checkSameValueWAW` (or a better name but with WAW in it) so it becomes very clear what type of folding this is and how it relates to the others. nicolasvasilache: I'd suggest to rename `checkSameValueWAW` (or a better name but with WAW in it) so it becomes…
		        // In-place operand changes must be reported to the rewriter so the
		        // driver knows the op was modified; `writeToModify` may be an op other
		        // than the pattern root.
		        rewriter.updateRootInPlace(writeToModify, [&]() {
		          writeToModify.sourceMutable().assign(defWrite.source());
		        });
		        return success();
		      }
		      if (!isDisjointTransferIndices(
		              cast<VectorTransferOpInterface>(defWrite.getOperation()),
		              cast<VectorTransferOpInterface>(writeOp.getOperation())))
		        break;
		      // If the previous write op doesn't have any other use we can safely look
		      // at the previous store to see if it can be removed.
		      if (!defWrite->hasOneUse())
		        break;
		      writeToModify = defWrite;
		      defWrite = defWrite.source().getDefiningOp<vector::TransferWriteOp>();
		    }
		    return failure();
		  }
		};
		} // namespace

		/// Register the canonicalization patterns of TransferWriteOp into `results`;
		/// the only pattern added here is DeadTransferWrite.
		void TransferWriteOp::getCanonicalizationPatterns(RewritePatternSet &results,
		MLIRContext *context) {
		results.add<DeadTransferWrite>(context);
		}

//===----------------------------------------------------------------------===//		//===----------------------------------------------------------------------===//
// LoadOp		// LoadOp
//===----------------------------------------------------------------------===//		//===----------------------------------------------------------------------===//

static LogicalResult verifyLoadStoreMemRefLayout(Operation *op,		static LogicalResult verifyLoadStoreMemRefLayout(Operation *op,
MemRefType memRefTy) {		MemRefType memRefTy) {
auto affineMaps = memRefTy.getAffineMaps();		auto affineMaps = memRefTy.getAffineMaps();
if (!affineMaps.empty())		if (!affineMaps.empty())
▲ Show 20 Lines • Show All 863 Lines • Show Last 20 Lines

mlir/lib/Dialect/Vector/VectorTransferOpTransforms.cpp

Show All 28 Lines
/// an ancestor of the op.		/// an ancestor of the op.
static Operation findAncestorOpInRegion(Region region, Operation *op) {		static Operation findAncestorOpInRegion(Region region, Operation *op) {
for (; op != nullptr && op->getParentRegion() != region;		for (; op != nullptr && op->getParentRegion() != region;
op = op->getParentOp())		op = op->getParentOp())
;		;
return op;		return op;
}		}

/// Return true if the transfer_write fully writes the data accessed by the
/// transfer_read.
///
/// This requires that the write has no out-of-bounds dimension, that neither
/// op carries a mask, and that both ops use the same indices, vector type and
/// permutation map. Masked ops are rejected because a mask means only part of
/// the vector is transferred, so the written vector cannot be assumed to equal
/// the value the read would produce.
static bool transferEncompasses(vector::TransferWriteOp defWrite,
                                vector::TransferReadOp read) {
  return !defWrite.hasOutOfBoundsDim() && !defWrite.mask() && !read.mask() &&
         defWrite.indices() == read.indices() &&
         defWrite.getVectorType() == read.getVectorType() &&
         defWrite.permutation_map() == read.permutation_map();
}

/// Return true if the write op fully overwrites the priorWrite transfer_write
/// op.
///
/// Both ops must use the same indices, mask, vector type and permutation map.
/// The mask comparison matters: a write with a different mask (or a masked
/// write following an unmasked one) may leave part of the prior write visible.
static bool transferEncompasses(vector::TransferWriteOp write,
                                vector::TransferWriteOp priorWrite) {
  return priorWrite.indices() == write.indices() &&
         priorWrite.mask() == write.mask() &&
         priorWrite.getVectorType() == write.getVectorType() &&
         priorWrite.permutation_map() == write.permutation_map();
}

namespace {		namespace {

class TransferOptimization {		class TransferOptimization {
public:		public:
TransferOptimization(FuncOp func) : dominators(func), postDominators(func) {}		TransferOptimization(FuncOp func) : dominators(func), postDominators(func) {}
void deadStoreOp(vector::TransferWriteOp);		void deadStoreOp(vector::TransferWriteOp);
void deadStoreOpTensor(vector::TransferWriteOp);
void storeToLoadForwarding(vector::TransferReadOp);		void storeToLoadForwarding(vector::TransferReadOp);
void storeToLoadForwardingTensor(vector::TransferReadOp);
void removeDeadOp() {		void removeDeadOp() {
for (Operation *op : opToErase)		for (Operation *op : opToErase)
op->erase();		op->erase();
opToErase.clear();		opToErase.clear();
}		}

private:		private:
bool isReachable(Operation start, Operation dest);		bool isReachable(Operation start, Operation dest);
▲ Show 20 Lines • Show All 153 Lines • ▼ Show 20 Lines	void TransferOptimization::storeToLoadForwarding(vector::TransferReadOp read) {
}		}

LLVM_DEBUG(DBGS() << "Forward value from " << *lastwrite.getOperation()		LLVM_DEBUG(DBGS() << "Forward value from " << *lastwrite.getOperation()
<< " to: " << *read.getOperation() << "\n");		<< " to: " << *read.getOperation() << "\n");
read.replaceAllUsesWith(lastwrite.vector());		read.replaceAllUsesWith(lastwrite.vector());
opToErase.push_back(read.getOperation());		opToErase.push_back(read.getOperation());
}		}

/// Walk up the SSA links, if any write gets fully overwritten we can skip it.
/// If it has no more uses it becomes dead.
///
/// The overwritten write is bypassed by rewiring the source of the write that
/// sits directly above it in the chain, so that disjoint writes skipped during
/// the walk stay part of the chain.
void TransferOptimization::deadStoreOpTensor(vector::TransferWriteOp write) {
  // The op whose source operand is rewired once a dead write is found; it is
  // always the op directly above `defWrite` in the chain.
  vector::TransferWriteOp writeToModify = write;
  auto defWrite = write.source().getDefiningOp<vector::TransferWriteOp>();
  while (defWrite) {
    if (transferEncompasses(write, defWrite)) {
      writeToModify.sourceMutable().assign(defWrite.source());
      if (defWrite->use_empty())
        opToErase.push_back(defWrite.getOperation());
      return;
    }
    if (!isDisjointTransferIndices(
            cast<VectorTransferOpInterface>(defWrite.getOperation()),
            cast<VectorTransferOpInterface>(write.getOperation())))
      break;
    // Rewiring an intermediate write changes the tensor seen by all of its
    // users, so only continue through writes used solely by this chain.
    if (!defWrite->hasOneUse())
      break;
    writeToModify = defWrite;
    defWrite = defWrite.source().getDefiningOp<vector::TransferWriteOp>();
  }
}

/// Follow the chain of transfer_write ops that produced the tensor being read.
/// The first write that fully covers the read supplies its vector as the
/// replacement for the read, which is then queued for erasure. Writes that are
/// disjoint from the read are stepped over; any other write ends the search.
void TransferOptimization::storeToLoadForwardingTensor(
    vector::TransferReadOp read) {
  for (auto producer = read.source().getDefiningOp<vector::TransferWriteOp>();
       producer;
       producer = producer.source().getDefiningOp<vector::TransferWriteOp>()) {
    if (transferEncompasses(producer, read)) {
      // Forward the stored vector and mark the now-unused read as dead.
      read.replaceAllUsesWith(producer.vector());
      opToErase.push_back(read.getOperation());
      return;
    }
    const bool disjoint = isDisjointTransferIndices(
        cast<VectorTransferOpInterface>(producer.getOperation()),
        cast<VectorTransferOpInterface>(read.getOperation()));
    // A possibly overlapping write blocks any forwarding from further up.
    if (!disjoint)
      return;
  }
}

} // namespace		} // namespace

void mlir::vector::transferOpflowOpt(FuncOp func) {		void mlir::vector::transferOpflowOpt(FuncOp func) {
TransferOptimization opt(func);		TransferOptimization opt(func);
// Run store to load forwarding first since it can expose more dead store		// Run store to load forwarding first since it can expose more dead store
// opportunity.		// opportunity.
func.walk([&](vector::TransferReadOp read) {		func.walk([&](vector::TransferReadOp read) {
if (read.getShapedType().isa<MemRefType>())		if (read.getShapedType().isa<MemRefType>())
opt.storeToLoadForwarding(read);		opt.storeToLoadForwarding(read);
else
opt.storeToLoadForwardingTensor(read);
});		});
opt.removeDeadOp();		opt.removeDeadOp();
func.walk([&](vector::TransferWriteOp write) {		func.walk([&](vector::TransferWriteOp write) {
if (write.getShapedType().isa<MemRefType>())		if (write.getShapedType().isa<MemRefType>())
opt.deadStoreOp(write);		opt.deadStoreOp(write);
else
opt.deadStoreOpTensor(write);
});		});
opt.removeDeadOp();		opt.removeDeadOp();
}		}

mlir/lib/Dialect/Vector/VectorUtils.cpp

	Show First 20 Lines • Show All 350 Lines • ▼ Show 20 Lines
	}			}

	bool mlir::isDisjointTransferSet(VectorTransferOpInterface transferA,			bool mlir::isDisjointTransferSet(VectorTransferOpInterface transferA,
	VectorTransferOpInterface transferB) {			VectorTransferOpInterface transferB) {
	if (transferA.source() != transferB.source())			if (transferA.source() != transferB.source())
	return false;			return false;
	return isDisjointTransferIndices(transferA, transferB);			return isDisjointTransferIndices(transferA, transferB);
	}			}

				// Read-after-write check: the write covers the read only when the write is
				// fully in bounds, neither op is masked, and indices, vector type and
				// permutation map all agree.
				bool mlir::transferEncompasses(vector::TransferWriteOp defWrite,
				                               vector::TransferReadOp read) {
				  if (defWrite.hasOutOfBoundsDim())
				    return false;
				  if (defWrite.mask() || read.mask())
				    return false;
				  if (defWrite.indices() != read.indices())
				    return false;
				  if (defWrite.getVectorType() != read.getVectorType())
				    return false;
				  return defWrite.permutation_map() == read.permutation_map();
				}

				// Write-after-write check: the later write replaces the prior one only when
				// indices, mask, vector type and permutation map are all identical.
				bool mlir::transferEncompasses(vector::TransferWriteOp write,
				                               vector::TransferWriteOp priorWrite) {
				  if (priorWrite.indices() != write.indices())
				    return false;
				  if (priorWrite.mask() != write.mask())
				    return false;
				  if (priorWrite.getVectorType() != write.getVectorType())
				    return false;
				  return priorWrite.permutation_map() == write.permutation_map();
				}

mlir/test/Dialect/Vector/canonicalize.mlir

Show First 20 Lines • Show All 793 Lines • ▼ Show 20 Lines	func @transfer_folding_1(%t0: tensor<2x3x4xf32>, %t1: tensor<2x3x4xf32>)
// CHECK-NEXT: some_op_that_may_have_side_effects		// CHECK-NEXT: some_op_that_may_have_side_effects
%t3 = "some_op_that_may_have_side_effects"() : () -> (tensor<2x3x4xf32>)		%t3 = "some_op_that_may_have_side_effects"() : () -> (tensor<2x3x4xf32>)
%r2 = vector.transfer_write %v, %t0[%c0, %c0, %c0] {in_bounds = [true, true, true]} :		%r2 = vector.transfer_write %v, %t0[%c0, %c0, %c0] {in_bounds = [true, true, true]} :
vector<2x3x4xf32>, tensor<2x3x4xf32>		vector<2x3x4xf32>, tensor<2x3x4xf32>

// CHECK-NEXT: return %[[T0]], %[[T0]], %[[T0]]		// CHECK-NEXT: return %[[T0]], %[[T0]], %[[T0]]
return %r0, %r1, %r2: tensor<2x3x4xf32>, tensor<2x3x4xf32>, tensor<2x3x4xf32>		return %r0, %r1, %r2: tensor<2x3x4xf32>, tensor<2x3x4xf32>, tensor<2x3x4xf32>
}		}

		// -----

		// CHECK-LABEL: func @store_after_load_tensor
		// CHECK-SAME: (%[[ARG:.*]]: tensor<4x4xf32>)
		// CHECK-NOT: vector.transfer_read
		// CHECK-NOT: vector.transfer_write
		// CHECK: return %[[ARG]] : tensor<4x4xf32>
		func @store_after_load_tensor(%arg0 : tensor<4x4xf32>) -> tensor<4x4xf32> {
		%c1 = constant 1 : index
		%c0 = constant 0 : index
		%cf0 = constant 0.0 : f32
		%0 = vector.transfer_read %arg0[%c1, %c0], %cf0 :
		tensor<4x4xf32>, vector<1x4xf32>
		%w0 = vector.transfer_write %0, %arg0[%c1, %c0] :
		vector<1x4xf32>, tensor<4x4xf32>
		return %w0 : tensor<4x4xf32>
		}

		// -----

		// CHECK-LABEL: func @store_after_load_tensor_negative
		// CHECK: vector.transfer_read
		// CHECK: vector.transfer_write
		// CHECK: return
		func @store_after_load_tensor_negative(%arg0 : tensor<4x4xf32>) -> tensor<4x4xf32> {
		%c1 = constant 1 : index
		%c0 = constant 0 : index
		%cf0 = constant 0.0 : f32
		%0 = vector.transfer_read %arg0[%c1, %c0], %cf0 :
		tensor<4x4xf32>, vector<1x4xf32>
		%w0 = vector.transfer_write %0, %arg0[%c0, %c0] :
		vector<1x4xf32>, tensor<4x4xf32>
		return %w0 : tensor<4x4xf32>
		}

		// -----

		// CHECK-LABEL: func @store_to_load_tensor
		// CHECK-SAME: (%[[ARG:.*]]: tensor<4x4xf32>, %[[V0:.*]]: vector<1x4xf32>, %[[V1:.*]]: vector<1x4xf32>)
		// CHECK-NOT: vector.transfer_write
		// CHECK-NOT: vector.transfer_read
		// CHECK: return %[[V0]] : vector<1x4xf32>
		func @store_to_load_tensor(%arg0 : tensor<4x4xf32>,
		%v0 : vector<1x4xf32>, %v1 : vector<1x4xf32>) -> vector<1x4xf32> {
		%c1 = constant 1 : index
		%c2 = constant 2 : index
		%c0 = constant 0 : index
		%cf0 = constant 0.0 : f32
		%w0 = vector.transfer_write %v0, %arg0[%c1, %c0] {in_bounds = [true, true]} :
		vector<1x4xf32>, tensor<4x4xf32>
		%w1 = vector.transfer_write %v1, %w0[%c2, %c0] {in_bounds = [true, true]} :
		vector<1x4xf32>, tensor<4x4xf32>
		%0 = vector.transfer_read %w1[%c1, %c0], %cf0 {in_bounds = [true, true]} :
		tensor<4x4xf32>, vector<1x4xf32>
		return %0 : vector<1x4xf32>
		}

		// -----

		// CHECK-LABEL: func @store_to_load_negative_tensor
		// CHECK: vector.transfer_write
		// CHECK: vector.transfer_write
		// CHECK: %[[V:.*]] = vector.transfer_read
		// CHECK: return %[[V]] : vector<1x4xf32>
		func @store_to_load_negative_tensor(%arg0 : tensor<4x4xf32>,
		%v0 : vector<1x4xf32>, %v1 : vector<1x4xf32>, %i : index) -> vector<1x4xf32> {
		%c1 = constant 1 : index
		%c2 = constant 2 : index
		%c0 = constant 0 : index
		%cf0 = constant 0.0 : f32
		%w0 = vector.transfer_write %v0, %arg0[%c1, %c0] {in_bounds = [true, true]} :
		vector<1x4xf32>, tensor<4x4xf32>
		%w1 = vector.transfer_write %v0, %w0[%i, %i] {in_bounds = [true, true]} :
		vector<1x4xf32>, tensor<4x4xf32>
		%0 = vector.transfer_read %w1[%c1, %c0], %cf0 {in_bounds = [true, true]} :
		tensor<4x4xf32>, vector<1x4xf32>
		return %0 : vector<1x4xf32>
		}

		// -----


		// CHECK-LABEL: func @dead_store_tensor
		// CHECK-DAG: %[[C0:.*]] = constant 0 : index
		// CHECK-DAG: %[[C1:.*]] = constant 1 : index
		// CHECK-DAG: %[[C2:.*]] = constant 2 : index
		// CHECK-NOT: vector.transfer_write {{.*}}, {{.*}}[%[[C1]], %[[C0]]
		// CHECK: vector.transfer_write {{.*}}, {{.*}}[%[[C2]], %[[C0]]
		// CHECK: %[[VTW:.*]] = vector.transfer_write {{.*}}, {{.*}}[%[[C1]], %[[C0]]
		// CHECK: return %[[VTW]] : tensor<4x4xf32>
		func @dead_store_tensor(%arg0 : tensor<4x4xf32>,
		%v0 : vector<1x4xf32>, %v1 : vector<1x4xf32>, %i : index) -> tensor<4x4xf32> {
		%c1 = constant 1 : index
		%c2 = constant 2 : index
		%c0 = constant 0 : index
		%cf0 = constant 0.0 : f32
		%w0 = vector.transfer_write %v0, %arg0[%c1, %c0] {in_bounds = [true, true]} :
		vector<1x4xf32>, tensor<4x4xf32>
		%w1 = vector.transfer_write %v0, %w0[%c2, %c0] {in_bounds = [true, true]} :
		vector<1x4xf32>, tensor<4x4xf32>
		%w2 = vector.transfer_write %v1, %w1[%c1, %c0] {in_bounds = [true, true]} :
		vector<1x4xf32>, tensor<4x4xf32>
		return %w2 : tensor<4x4xf32>
		}

		// -----

		// CHECK-LABEL: func @dead_store_tensor_negative
		// CHECK-DAG: %[[C0:.*]] = constant 0 : index
		// CHECK-DAG: %[[C1:.*]] = constant 1 : index
		// CHECK: vector.transfer_write
		// CHECK: vector.transfer_write
		// CHECK: vector.transfer_read
		// CHECK: %[[VTW:.*]] = vector.transfer_write {{.*}}, {{.*}}[%[[C1]], %[[C0]]]
		// CHECK: return %[[VTW]] : tensor<4x4xf32>
		func @dead_store_tensor_negative(%arg0 : tensor<4x4xf32>,
		%v0 : vector<1x4xf32>, %v1 : vector<1x4xf32>, %i : index) -> tensor<4x4xf32> {
		%c1 = constant 1 : index
		%c2 = constant 2 : index
		%c0 = constant 0 : index
		%cf0 = constant 0.0 : f32
		%w0 = vector.transfer_write %v0, %arg0[%c1, %c0] {in_bounds = [true, true]} :
		vector<1x4xf32>, tensor<4x4xf32>
		%w1 = vector.transfer_write %v0, %w0[%c2, %c0] {in_bounds = [true, true]} :
		vector<1x4xf32>, tensor<4x4xf32>
		%0 = vector.transfer_read %w1[%i, %i], %cf0 {in_bounds = [true, true]} :
		tensor<4x4xf32>, vector<1x4xf32>
		%x = addf %0, %0 : vector<1x4xf32>
		%w2 = vector.transfer_write %x, %w0[%c1, %c0] {in_bounds = [true, true]} :
		vector<1x4xf32>, tensor<4x4xf32>
		return %w2 : tensor<4x4xf32>
		}

mlir/test/Dialect/Vector/vector-transfer-unroll.mlir

	Show First 20 Lines • Show All 106 Lines • ▼ Show 20 Lines
	// CHECK-NEXT: %[[VTR2:.]] = vector.transfer_read {{.}}[%[[C2]], %[[C0]]], %{{.*}} : tensor<4x4xf32>, vector<2x2xf32>			// CHECK-NEXT: %[[VTR2:.]] = vector.transfer_read {{.}}[%[[C2]], %[[C0]]], %{{.*}} : tensor<4x4xf32>, vector<2x2xf32>
	// CHECK-NEXT: %[[VTR3:.]] = vector.transfer_read {{.}}[%[[C2]], %[[C2]]], %{{.*}} : tensor<4x4xf32>, vector<2x2xf32>			// CHECK-NEXT: %[[VTR3:.]] = vector.transfer_read {{.}}[%[[C2]], %[[C2]]], %{{.*}} : tensor<4x4xf32>, vector<2x2xf32>
	// CHECK-NEXT: %[[VTW0:.]] = vector.transfer_write %[[VTR0]], {{.}}[%[[C0]], %[[C0]]] {{.*}} : vector<2x2xf32>, tensor<4x4xf32>			// CHECK-NEXT: %[[VTW0:.]] = vector.transfer_write %[[VTR0]], {{.}}[%[[C0]], %[[C0]]] {{.*}} : vector<2x2xf32>, tensor<4x4xf32>
	// CHECK-NEXT: %[[VTW1:.]] = vector.transfer_write %[[VTR1]], %[[VTW0]][%[[C0]], %[[C2]]] {{.}} : vector<2x2xf32>, tensor<4x4xf32>			// CHECK-NEXT: %[[VTW1:.]] = vector.transfer_write %[[VTR1]], %[[VTW0]][%[[C0]], %[[C2]]] {{.}} : vector<2x2xf32>, tensor<4x4xf32>
	// CHECK-NEXT: %[[VTW2:.]] = vector.transfer_write %[[VTR2]], %[[VTW1]][%[[C2]], %[[C0]]] {{.}} : vector<2x2xf32>, tensor<4x4xf32>			// CHECK-NEXT: %[[VTW2:.]] = vector.transfer_write %[[VTR2]], %[[VTW1]][%[[C2]], %[[C0]]] {{.}} : vector<2x2xf32>, tensor<4x4xf32>
	// CHECK-NEXT: %[[VTW3:.]] = vector.transfer_write %[[VTR3]], %[[VTW2]][%[[C2]], %[[C2]]] {{.}} : vector<2x2xf32>, tensor<4x4xf32>			// CHECK-NEXT: %[[VTW3:.]] = vector.transfer_write %[[VTR3]], %[[VTW2]][%[[C2]], %[[C2]]] {{.}} : vector<2x2xf32>, tensor<4x4xf32>
	// CHECK-NEXT: return %[[VTW3]] : tensor<4x4xf32>			// CHECK-NEXT: return %[[VTW3]] : tensor<4x4xf32>

	func @transfer_readwrite_unroll_tensor(%arg0 : tensor<4x4xf32>) ->			func @transfer_readwrite_unroll_tensor(%arg0 : tensor<4x4xf32>, %arg1 : tensor<4x4xf32>) ->
	tensor<4x4xf32> {			tensor<4x4xf32> {
	%c0 = constant 0 : index			%c0 = constant 0 : index
	%cf0 = constant 0.0 : f32			%cf0 = constant 0.0 : f32
	%0 = vector.transfer_read %arg0[%c0, %c0], %cf0 : tensor<4x4xf32>, vector<4x4xf32>			%0 = vector.transfer_read %arg0[%c0, %c0], %cf0 : tensor<4x4xf32>, vector<4x4xf32>
	%r = vector.transfer_write %0, %arg0[%c0, %c0] : vector<4x4xf32>, tensor<4x4xf32>			%r = vector.transfer_write %0, %arg1[%c0, %c0] : vector<4x4xf32>, tensor<4x4xf32>
	return %r: tensor<4x4xf32>			return %r: tensor<4x4xf32>
	}			}

mlir/test/Dialect/Vector/vector-transferop-opt.mlir

Show First 20 Lines • Show All 178 Lines • ▼ Show 20 Lines	scf.if %arg1 {
vector<1x4xf32>, memref<4x4xf32>		vector<1x4xf32>, memref<4x4xf32>
}		}
vector.transfer_write %v0, %arg2[%c1, %c0] {in_bounds = [true, true]} :		vector.transfer_write %v0, %arg2[%c1, %c0] {in_bounds = [true, true]} :
vector<1x4xf32>, memref<4x4xf32>		vector<1x4xf32>, memref<4x4xf32>
}		}
return		return
}		}

// CHECK-LABEL: func @forward_dead_store_tensor
// CHECK-NOT: vector.transfer_write
// CHECK-NOT: vector.transfer_read
// CHECK: scf.for
// CHECK: }
// CHECK: %[[VTW:.*]] = vector.transfer_write
// CHECK: return %[[VTW]] : tensor<4x4xf32>
func @forward_dead_store_tensor(%arg0: i1, %arg1 : tensor<4x4xf32>,
%v0 : vector<1x4xf32>, %v1 : vector<1x4xf32>, %i : index) -> tensor<4x4xf32> {
%c1 = constant 1 : index
%c4 = constant 4 : index
%c0 = constant 0 : index
%cf0 = constant 0.0 : f32
%w0 = vector.transfer_write %v0, %arg1[%c1, %c0] {in_bounds = [true, true]} :
vector<1x4xf32>, tensor<4x4xf32>
%0 = vector.transfer_read %w0[%c1, %c0], %cf0 {in_bounds = [true, true]} :
tensor<4x4xf32>, vector<1x4xf32>
%x = scf.for %i0 = %c0 to %c4 step %c1 iter_args(%acc = %0)
-> (vector<1x4xf32>) {
%1 = addf %acc, %acc : vector<1x4xf32>
scf.yield %1 : vector<1x4xf32>
}
%w1 = vector.transfer_write %x, %w0[%c1, %c0] {in_bounds = [true, true]} :
vector<1x4xf32>, tensor<4x4xf32>
return %w1 : tensor<4x4xf32>
}

// CHECK-LABEL: func @forward_dead_store_negative_tensor
// CHECK: vector.transfer_write
// CHECK: vector.transfer_read
// CHECK: scf.for
// CHECK: }
// CHECK: %[[VTW:.*]] = vector.transfer_write
// CHECK: return %[[VTW]] : tensor<4x4xf32>
func @forward_dead_store_negative_tensor(%arg0: i1, %arg1 : tensor<4x4xf32>,
%v0 : vector<1x4xf32>, %v1 : vector<1x4xf32>, %i : index) -> tensor<4x4xf32> {
%c1 = constant 1 : index
%c4 = constant 4 : index
%c0 = constant 0 : index
%cf0 = constant 0.0 : f32
%w0 = vector.transfer_write %v0, %arg1[%c1, %i] {in_bounds = [true, true]} :
vector<1x4xf32>, tensor<4x4xf32>
%0 = vector.transfer_read %w0[%c1, %c0], %cf0 {in_bounds = [true, true]} :
tensor<4x4xf32>, vector<1x4xf32>
%x = scf.for %i0 = %c0 to %c4 step %c1 iter_args(%acc = %0)
-> (vector<1x4xf32>) {
%1 = addf %acc, %acc : vector<1x4xf32>
scf.yield %1 : vector<1x4xf32>
}
%w1 = vector.transfer_write %x, %w0[%c1, %c0] {in_bounds = [true, true]} :
vector<1x4xf32>, tensor<4x4xf32>
return %w1 : tensor<4x4xf32>
}

This is an archive of the discontinued LLVM Phabricator instance.

[mlir][vector] Move transferOp on tensor opt to folder/canonicalization
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 337977

mlir/include/mlir/Dialect/Vector/VectorOps.td

mlir/include/mlir/Dialect/Vector/VectorUtils.h

mlir/lib/Dialect/Vector/VectorOps.cpp

mlir/lib/Dialect/Vector/VectorTransferOpTransforms.cpp

mlir/lib/Dialect/Vector/VectorUtils.cpp

mlir/test/Dialect/Vector/canonicalize.mlir

mlir/test/Dialect/Vector/vector-transfer-unroll.mlir

mlir/test/Dialect/Vector/vector-transferop-opt.mlir

This is an archive of the discontinued LLVM Phabricator instance.

[mlir][vector] Move transferOp on tensor opt to folder/canonicalization
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 337977

mlir/include/mlir/Dialect/Vector/VectorOps.td

mlir/include/mlir/Dialect/Vector/VectorUtils.h

mlir/lib/Dialect/Vector/VectorOps.cpp

mlir/lib/Dialect/Vector/VectorTransferOpTransforms.cpp

mlir/lib/Dialect/Vector/VectorUtils.cpp

mlir/test/Dialect/Vector/canonicalize.mlir

mlir/test/Dialect/Vector/vector-transfer-unroll.mlir

mlir/test/Dialect/Vector/vector-transferop-opt.mlir

[mlir][vector] Move transferOp on tensor opt to folder/canonicalization
ClosedPublic