This is an archive of the discontinued LLVM Phabricator instance.

Separate SerializeToCubin from GPUTransforms.
ClosedPublic

Authored by tra on Mar 17 2023, 1:52 PM.

Download Raw Diff

Details

Reviewers

ThomasRaoux
csigg
GMNGeoffrey

Commits

rGfea8faa705b4: Separate SerializeToCubin from GPUTransforms.

Summary

SerializeToCubin depends on CUDA at *runtime* which is undesirable for MLIR's
general use case, as compilation should be doable on any host, regardless of
whether it has a GPU.

SerializeToCubin is needed to run some GPU tests, so when we build mlir-opt,
the SerializeToCubin pass is linked directly into mlir-opt.

Diff Detail

Repository: rG LLVM Github Monorepo

Event Timeline

tra created this revision. · Mar 17 2023, 1:52 PM

Herald added a reviewer: ThomasRaoux. · View Herald Transcript · Mar 17 2023, 1:52 PM

Herald added a project: Restricted Project. · View Herald Transcript

Herald added subscribers: Moerafaat, zero9178, bzcheeseman and 22 others. · View Herald Transcript

tra published this revision for review. · Mar 17 2023, 1:55 PM

tra added reviewers: csigg, GMNGeoffrey.

Herald added a project: Restricted Project. · View Herald Transcript · Mar 17 2023, 1:55 PM

Herald added subscribers: llvm-commits, stephenneuendorffer, nicolasvasilache. · View Herald Transcript

Thanks Artem!

This revision is now accepted and ready to land. · Mar 17 2023, 2:00 PM

Harbormaster completed remote builds in B220144: Diff 506193. · Mar 17 2023, 2:13 PM

This revision was landed with ongoing or failed builds. · Mar 17 2023, 2:14 PM

Closed by commit rGfea8faa705b4: Separate SerializeToCubin from GPUTransforms. (authored by tra). · Explain Why

This revision was automatically updated to reflect the committed changes.

tra added a commit: rGfea8faa705b4: Separate SerializeToCubin from GPUTransforms.

Revision Contents

Path

Size

utils/

bazel/

llvm-project-overlay/

mlir/

BUILD.bazel

58 lines

Diff 506196

utils/bazel/llvm-project-overlay/mlir/BUILD.bazel

This file is larger than 256 KB, so syntax highlighting is disabled by default.

# This file is licensed under the Apache License v2.0 with LLVM Exceptions.		# This file is licensed under the Apache License v2.0 with LLVM Exceptions.
# See https://llvm.org/LICENSE.txt for license information.		# See https://llvm.org/LICENSE.txt for license information.
# SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception		# SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

# Description:		# Description:
# The MLIR "Multi-Level Intermediate Representation" Compiler Infrastructure		# The MLIR "Multi-Level Intermediate Representation" Compiler Infrastructure

		load("@bazel_skylib//rules:write_file.bzl", "write_file")
load(":tblgen.bzl", "gentbl_cc_library", "td_library")		load(":tblgen.bzl", "gentbl_cc_library", "td_library")
load(":linalggen.bzl", "genlinalg")		load(":linalggen.bzl", "genlinalg")
load(		load(
":build_defs.bzl",		":build_defs.bzl",
"cc_headers_only",		"cc_headers_only",
"if_cuda_available",		"if_cuda_available",
"mlir_c_api_cc_library",		"mlir_c_api_cc_library",
)		)
▲ Show 20 Lines • Show All 4,010 Lines • ▼ Show 20 Lines

cc_library(		cc_library(
name = "GPUTransforms",		name = "GPUTransforms",
srcs = glob(		srcs = glob(
[		[
"lib/Dialect/GPU/Transforms/*.cpp",		"lib/Dialect/GPU/Transforms/*.cpp",
"lib/Dialect/GPU/Transforms/*.h",		"lib/Dialect/GPU/Transforms/*.h",
],		],
		exclude = [
		"lib/Dialect/GPU/Transforms/SerializeToCubin.cpp",
		],
),		),
hdrs = glob(["include/mlir/Dialect/GPU/Transforms/*.h"]),		hdrs = glob(["include/mlir/Dialect/GPU/Transforms/*.h"]),
includes = ["include"],		includes = ["include"],
local_defines = if_cuda_available(["MLIR_GPU_TO_CUBIN_PASS_ENABLE"]),		local_defines = if_cuda_available(["MLIR_GPU_TO_CUBIN_PASS_ENABLE"]),
deps = [		deps = [
":ArithDialect",		":ArithDialect",
":AsmParser",		":AsmParser",
":AsyncDialect",		":AsyncDialect",
":ControlFlowDialect",		":ControlFlowDialect",
":DLTIDialect",		":DLTIDialect",
":AffineUtils",		":AffineUtils",
":GPUDialect",		":GPUDialect",
":GPUPassIncGen",		":GPUPassIncGen",
":MemRefDialect",		":MemRefDialect",
":IR",		":IR",
":Pass",		":Pass",
":ROCDLToLLVMIRTranslation",		":ROCDLToLLVMIRTranslation",
":SCFDialect",		":SCFDialect",
":FuncDialect",		":FuncDialect",
		":SerializeToCubin_stub",
":SideEffectInterfaces",		":SideEffectInterfaces",
":Support",		":Support",
":Transforms",		":Transforms",
":ToLLVMIRTranslation",		":ToLLVMIRTranslation",
":LLVMToLLVMIRTranslation",		":LLVMToLLVMIRTranslation",
"//llvm:Core",		"//llvm:Core",
"//llvm:MC",		"//llvm:MC",
"//llvm:Support",		"//llvm:Support",
"//llvm:Target",		"//llvm:Target",
] + if_cuda_available([		] + if_cuda_available([
# Dependencies for SerializeToCubin.cpp with
# -DMLIR_GPU_TO_CUBIN_PASS_ENABLE
":NVVMToLLVMIRTranslation",		":NVVMToLLVMIRTranslation",
"//llvm:NVPTXCodeGen",		"//llvm:NVPTXCodeGen",
		]),
		)

		cc_library(
		name = "SerializeToCubin",
		srcs = [
		"lib/Dialect/GPU/Transforms/SerializeToCubin.cpp",
		],
		local_defines = if_cuda_available(["MLIR_GPU_TO_CUBIN_PASS_ENABLE"]),
		deps = [
		":NVVMToLLVMIRTranslation",
		":ToLLVMIRTranslation",
		":GPUDialect",
		":GPUPassIncGen",
		":GPUTransforms",
		":Pass",
		":Support",
		"//llvm:Support",
		] + if_cuda_available([
"@cuda//:cuda_headers",		"@cuda//:cuda_headers",
"@cuda//:libcuda",		"@cuda//:libcuda",
]),		])
		)

		write_file(
		name = "SerializeToCubin_stub_cc",
		out = "SerializeToCubin_stub.cc",
		content = [
		"""
		#include "mlir/Dialect/GPU/Transforms/Passes.h"

		// Provide a weak registration stub in case the real SerializeToCubin is not
		// linked in.

		__attribute__((weak)) void mlir::registerGpuSerializeToCubinPass() {}
		"""
		]
		)

		cc_library(
		name = "SerializeToCubin_stub",
		srcs = [":SerializeToCubin_stub_cc"],
		hdrs = glob(["include/mlir/Dialect/GPU/Transforms/*.h"]),
		includes = ["include"],
		deps = [
		":GPUDialect",
		":GPUPassIncGen",
		":Pass",
		":Support",
		"//llvm:Support",
		],
)		)

td_library(		td_library(
name = "GPUTransformOpsTdFiles",		name = "GPUTransformOpsTdFiles",
srcs = [		srcs = [
"include/mlir/Dialect/GPU/TransformOps/GPUTransformOps.td",		"include/mlir/Dialect/GPU/TransformOps/GPUTransformOps.td",
],		],
includes = ["include"],		includes = ["include"],
▲ Show 20 Lines • Show All 2,978 Lines • ▼ Show 20 Lines	cc_binary(
deps = [		deps = [
":AllPassesAndDialects",		":AllPassesAndDialects",
":Analysis",		":Analysis",
":IR",		":IR",
":MlirOptLib",		":MlirOptLib",
":OpenMPDialect",		":OpenMPDialect",
":Pass",		":Pass",
":QuantOps",		":QuantOps",
		":SerializeToCubin",
":SCFToGPU",		":SCFToGPU",
":Support",		":Support",
":Transforms",		":Transforms",
"//llvm:AllTargetsCodeGens",		"//llvm:AllTargetsCodeGens",
"//llvm:Support",		"//llvm:Support",
"//mlir/test:TestAffine",		"//mlir/test:TestAffine",
"//mlir/test:TestAnalysis",		"//mlir/test:TestAnalysis",
"//mlir/test:TestArith",		"//mlir/test:TestArith",
▲ Show 20 Lines • Show All 3,578 Lines • Show Last 20 Lines