Diff 297873

mlir/include/mlir/Dialect/GPU/GPUOps.td

Show First 20 Lines • Show All 750 Lines • ▼ Show 20 Lines	let description = [{
launched afterwards. Writes from the device are guaranteed to be visible on		launched afterwards. Writes from the device are guaranteed to be visible on
the host after synchronizing with the device kernel completion.		the host after synchronizing with the device kernel completion.
}];		}];

let assemblyFormat = "$value attr-dict `:` type($value)";		let assemblyFormat = "$value attr-dict `:` type($value)";
let verifier = [{ return success(); }];		let verifier = [{ return success(); }];
}		}

		// Definition of the `gpu.wait` op. It implements GPU_AsyncOpInterface, takes
		// any number of async-token operands and optionally yields one async token.
		def GPU_WaitOp : GPU_Op<"wait", [GPU_AsyncOpInterface]> {
		let summary = "Wait for async gpu ops to complete.";
		let description = [{
		This op synchronizes the host or the device with a list of dependent ops.

		If the op contains the `async` keyword, it returns a new async token which
		is synchronized with the op arguments. This new token is merely a shortcut
		to the argument list, and one could replace the uses of the result with the
		arguments for the same effect. The async version of this op is primarily
		used to make each async token have a single use during lowering and
		thereby make forks in async execution explicit. Example usage:

		```mlir
		%t0 = gpu.foo async : !gpu.async.token
		%t1 = gpu.bar async : !gpu.async.token
		%t2 = gpu.wait async [%t0, %t1]
		// gpu.baz doesn't run until gpu.foo and gpu.bar have both completed, just
		// as if the async dependencies were [%t0, %t1].
		%t3 = gpu.baz async [%t2]
		```

		If the op does not contain the `async` keyword, it does not return a new
		async token but blocks until all ops producing the async dependency tokens
		finished execution. All dependent memory operations are visible to the host
		once this op completes. Example usage:

		```mlir
		%t0 = gpu.foo async : !gpu.async.token
		%t1 = gpu.bar async : !gpu.async.token
		// The gpu.wait op blocks until gpu.foo and gpu.bar have completed.
		gpu.wait [%t0, %t1]
		```
		}];

		// Operands: the (possibly empty) list of tokens to wait on.
		// Result: present only for the `async` form of the op.
		let arguments = (ins Variadic<GPU_AsyncToken>:$asyncDependencies);
		let results = (outs Optional<GPU_AsyncToken>:$asyncToken);

		// The `async` keyword and the bracketed dependency list are handled by the
		// custom `AsyncDependencies` directive, i.e. parseAsyncDependencies and
		// printAsyncDependencies in GPUDialect.cpp.
		let assemblyFormat = [{
		custom<AsyncDependencies>(type($asyncToken), $asyncDependencies) attr-dict
		}];
		}

#endif // GPU_OPS		#endif // GPU_OPS

mlir/lib/Dialect/GPU/IR/GPUDialect.cpp

Show First 20 Lines • Show All 812 Lines • ▼ Show 20 Lines	static void print(OpAsmPrinter &p, GPUModuleOp op) {
p << op.getOperationName() << ' ';		p << op.getOperationName() << ' ';
p.printSymbolName(op.getName());		p.printSymbolName(op.getName());
p.printOptionalAttrDictWithKeyword(op.getAttrs(),		p.printOptionalAttrDictWithKeyword(op.getAttrs(),
{SymbolTable::getSymbolAttrName()});		{SymbolTable::getSymbolAttrName()});
p.printRegion(op.getOperation()->getRegion(0), /*printEntryBlockArgs=*/false,		p.printRegion(op.getOperation()->getRegion(0), /*printEntryBlockArgs=*/false,
/*printBlockTerminators=*/false);		/*printBlockTerminators=*/false);
}		}

		/// Parses the `AsyncDependencies` custom directive: an optional `async`
		/// keyword followed by an optional square-bracketed operand list.
		///
		/// When `async` is present, `asyncTokenType` is set to the async token type;
		/// otherwise it is left untouched. An error is emitted if `async` is used on
		/// an op that was written without any result name.
		static ParseResult parseAsyncDependencies(
		    OpAsmParser &parser, Type &asyncTokenType,
		    SmallVectorImpl<OpAsmParser::OperandType> &asyncDependencies) {
		  // Remember where the directive starts so a diagnostic points at it.
		  auto directiveLoc = parser.getCurrentLocation();
		  const bool sawAsync = succeeded(parser.parseOptionalKeyword("async"));

		  // An async op yields a token, so the textual form must bind a result.
		  if (sawAsync && parser.getNumResults() == 0)
		    return parser.emitError(directiveLoc,
		                            "needs to be named when marked 'async'");
		  if (sawAsync)
		    asyncTokenType = parser.getBuilder().getType<AsyncTokenType>();

		  constexpr auto delimiter = OpAsmParser::Delimiter::OptionalSquare;
		  return parser.parseOperandList(asyncDependencies, delimiter);
		}

		/// Prints the `AsyncDependencies` custom directive: the `async` keyword when
		/// the op has an async token result, followed by the dependency operands in
		/// square brackets when there are any.
		///
		/// \param printer            Stream the assembly is written to.
		/// \param asyncTokenType     Type of the optional result; null when absent.
		/// \param asyncDependencies  Operands the op depends on; may be empty.
		static void printAsyncDependencies(OpAsmPrinter &printer, Type asyncTokenType,
		                                   OperandRange asyncDependencies) {
		  // A non-null type means the optional async token result is present.
		  if (asyncTokenType)
		    printer << "async";
		  if (asyncDependencies.empty())
		    return;
		  // Emit the separator only when a list follows the keyword, so that a bare
		  // `async` is not printed with a trailing space.
		  if (asyncTokenType)
		    printer << ' ';
		  printer << "[";
		  llvm::interleaveComma(asyncDependencies, printer);
		  printer << "]";
		}

#include "mlir/Dialect/GPU/GPUOpInterfaces.cpp.inc"		#include "mlir/Dialect/GPU/GPUOpInterfaces.cpp.inc"

#define GET_OP_CLASSES		#define GET_OP_CLASSES
#include "mlir/Dialect/GPU/GPUOps.cpp.inc"		#include "mlir/Dialect/GPU/GPUOps.cpp.inc"

mlir/test/Dialect/GPU/invalid.mlir

Show First 20 Lines • Show All 429 Lines • ▼ Show 20 Lines	module {
gpu.module @gpu_funcs {		gpu.module @gpu_funcs {
// expected-error @+1 {{'gpu.func' op expected at least 5 arguments to body region}}		// expected-error @+1 {{'gpu.func' op expected at least 5 arguments to body region}}
"gpu.func"() ( {		"gpu.func"() ( {
^bb0(%arg0: f32, %arg1: memref<?xf32>, %arg2: memref<5xf32, 3>, %arg3: memref<5xf32, 5>):		^bb0(%arg0: f32, %arg1: memref<?xf32>, %arg2: memref<5xf32, 3>, %arg3: memref<5xf32, 5>):
"gpu.return"() : () -> ()		"gpu.return"() : () -> ()
} ) {gpu.kernel, sym_name = "kernel_1", type = (f32, memref<?xf32>) -> (), workgroup_attributions = 3: i64} : () -> ()		} ) {gpu.kernel, sym_name = "kernel_1", type = (f32, memref<?xf32>) -> (), workgroup_attributions = 3: i64} : () -> ()
}		}
}		}

		// -----

		// Negative test: `gpu.wait` written without the `async` keyword is given a
		// result name, and the diagnostic below is expected on the op line.
		func @sync_wait_with_result() {
		// expected-error @+1 {{cannot name an operation with no results}}
		%t = gpu.wait
		}

		// -----

		// Negative test: `gpu.wait async` is written without binding a result name,
		// which parseAsyncDependencies rejects with the diagnostic below.
		func @async_wait_without_result() {
		// expected-error @+1 {{custom op 'gpu.wait' needs to be named when marked 'async'}}
		gpu.wait async
		}

mlir/test/Dialect/GPU/ops.mlir

Show First 20 Lines • Show All 143 Lines • ▼ Show 20 Lines	gpu.module @explicit_attributions {
} ) {gpu.kernel, sym_name = "kernel_1", type = (f32, memref<?xf32>) -> (), workgroup_attributions = 1: i64} : () -> ()		} ) {gpu.kernel, sym_name = "kernel_1", type = (f32, memref<?xf32>) -> (), workgroup_attributions = 1: i64} : () -> ()
}		}

func @async_token(%arg0 : !gpu.async.token) -> !gpu.async.token {		func @async_token(%arg0 : !gpu.async.token) -> !gpu.async.token {
// CHECK-LABEL: func @async_token({{.*}}: !gpu.async.token)		// CHECK-LABEL: func @async_token({{.*}}: !gpu.async.token)
// CHECK: return {{.*}} : !gpu.async.token		// CHECK: return {{.*}} : !gpu.async.token
return %arg0 : !gpu.async.token		return %arg0 : !gpu.async.token
}		}

		// Exercises the textual form of `gpu.wait`: the async variant with zero, one
		// and two dependencies, then the blocking variant with and without a
		// dependency list. The negative directives make sure the blocking variants
		// are not printed with the `async` keyword.
		func @async_wait() {
		// CHECK-LABEL: func @async_wait
		// CHECK: %[[t0:.*]] = gpu.wait async
		%0 = gpu.wait async
		// CHECK: %[[t1:.*]] = gpu.wait async [%[[t0]]]
		%1 = gpu.wait async [%0]
		// CHECK: %{{.*}} = gpu.wait async [%[[t0]], %[[t1]]]
		%2 = gpu.wait async [%0, %1]
		// CHECK: gpu.wait [%[[t0]], %[[t1]]]
		// CHECK-NOT: async
		gpu.wait [%0, %1]
		// CHECK: gpu.wait
		// CHECK-NOT: async
		gpu.wait // Valid, but a no-op.
		return
		}
}		}

This is an archive of the discontinued LLVM Phabricator instance.

[mlir][gpu] Add `gpu.wait` op.
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 297873

mlir/include/mlir/Dialect/GPU/GPUOps.td

mlir/lib/Dialect/GPU/IR/GPUDialect.cpp

mlir/test/Dialect/GPU/invalid.mlir

mlir/test/Dialect/GPU/ops.mlir

This is an archive of the discontinued LLVM Phabricator instance.

[mlir][gpu] Add `gpu.wait` op.
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 297873

mlir/include/mlir/Dialect/GPU/GPUOps.td

mlir/lib/Dialect/GPU/IR/GPUDialect.cpp

mlir/test/Dialect/GPU/invalid.mlir

mlir/test/Dialect/GPU/ops.mlir

[mlir][gpu] Add `gpu.wait` op.
ClosedPublic