This is required for bufferization of scf::IfOp, which is added in a subsequent commit.
Some ops (scf::ForOp, TiledLoopOp) require PreOrder traversal to make sure that bbArgs are mapped before bufferizing the loop body.
Differential D111924
[mlir][linalg][bufferize] Bufferize using PostOrder traversal
Authored by springerm on Oct 15 2021, 8:22 PM.
Details: This is required for bufferization of scf::IfOp, which is added in a subsequent commit. Some ops (scf::ForOp, TiledLoopOp) require PreOrder traversal to make sure that bbArgs are mapped before bufferizing the loop body.
Diff Detail
Event Timeline

Comment Actions: Bufferization crashes in various ways on the following example.

module {
  func @reduction_2d_on_tensors(%arg0: tensor<4096x1024xf32> {linalg.buffer_layout = affine_map<(d0, d1) -> (d0, d1)>, linalg.inplaceable = false}, %arg1: tensor<4096xf32> {linalg.buffer_layout = affine_map<(d0) -> (d0)>, linalg.inplaceable = true}) -> tensor<4096xf32> attributes {passthrough = ["noinline", ["target-cpu", "skylake-avx512"], ["prefer-vector-width", "512"]]} {
    %cst = arith.constant 0.000000e+00 : f32
    %c16 = arith.constant 16 : index
    %c4096 = arith.constant 4096 : index
    %c1024 = arith.constant 1024 : index
    %c0 = arith.constant 0 : index
    %0 = linalg.fill(%cst, %arg1) : f32, tensor<4096xf32> -> tensor<4096xf32>
    %1 = linalg.init_tensor [16] : tensor<16xf32>
    %2 = linalg.fill(%cst, %1) : f32, tensor<16xf32> -> tensor<16xf32>
    %3 = vector.transfer_read %2[%c0], %cst {in_bounds = [true]} : tensor<16xf32>, vector<16xf32>
    %4 = scf.for %arg2 = %c0 to %c4096 step %c16 iter_args(%arg3 = %0) -> (tensor<4096xf32>) {
      %5 = vector.transfer_read %0[%arg2], %cst {in_bounds = [true]} : tensor<4096xf32>, vector<16xf32>
      %6 = scf.for %arg4 = %c0 to %c1024 step %c16 iter_args(%arg5 = %arg3) -> (tensor<4096xf32>) {
        %7 = vector.transfer_read %arg0[%arg2, %arg4], %cst {in_bounds = [true, true]} : tensor<4096x1024xf32>, vector<16x16xf32>
        %8 = vector.multi_reduction #vector.kind<add>, %7 [1] : vector<16x16xf32> to vector<16xf32>
        %9 = arith.addf %8, %3 : vector<16xf32>
        %10 = arith.addf %5, %9 : vector<16xf32>
        %11 = vector.transfer_write %10, %arg5[%arg2] {in_bounds = [true]} : vector<16xf32>, tensor<4096xf32>
        scf.yield %11 : tensor<4096xf32>
      }
      scf.yield %6 : tensor<4096xf32>
    }
    return %4 : tensor<4096xf32>
  }
  func public @main(%arg0: tensor<4096x1024xf32> {linalg.buffer_layout = affine_map<(d0, d1) -> (d0, d1)>, linalg.inplaceable = false}, %arg1: tensor<4096xf32> {linalg.buffer_layout = affine_map<(d0) -> (d0)>, linalg.inplaceable = true}, %arg2: index) -> tensor<4096xf32> attributes {llvm.emit_c_interface} {
    %c0 = arith.constant 0 : index
    %c1 = arith.constant 1 : index
    %0 = scf.for %arg3 = %c0 to %arg2 step %c1 iter_args(%arg4 = %arg1) -> (tensor<4096xf32>) {
      %1 = call @reduction_2d_on_tensors(%arg0, %arg4) : (tensor<4096x1024xf32>, tensor<4096xf32>) -> tensor<4096xf32>
      scf.yield %1 : tensor<4096xf32>
    }
    return %0 : tensor<4096xf32>
  }
}