This is an archive of the discontinued LLVM Phabricator instance.

lib/Driver/ToolChains/Cuda.cpp
255–257	The purpose of the original assert was to catch a programming error and this change negates that purpose. Perhaps I'm missing something. Could you elaborate on what's the motivation for this particular change? I don't understand why it would be OK to end up with an unknown GPU architecture if -nocudalib is specified. You still do want to pass some specific GPU arch to ptxas and that has nothing to do with whether you happen to have suitable libdevice.

Don't take unknown CUDA archs into account, not even for testing purposes.

One small nit. LGTM otherwise.

test/Driver/openmp-offload-gpu.c
133	Please split this RUN line further.

This revision is now accepted and ready to land. Sep 20 2017, 9:37 AM

Split line.

gtbercea closed this revision. Sep 25 2017, 2:58 PM

Revision Contents

Path

Size

lib/

Driver/

ToolChains/

Cuda.cpp

9 lines

test/

Driver/

openmp-offload-gpu.c

9 lines

Diff 115692

lib/Driver/ToolChains/Cuda.cpp

Show First 20 Lines • Show All 246 Lines • ▼ Show 20 Lines	void NVPTX::Assembler::ConstructJob(Compilation &C, const JobAction &JA,
// flag or the default value.		// flag or the default value.
if (JA.isDeviceOffloading(Action::OFK_OpenMP)) {		if (JA.isDeviceOffloading(Action::OFK_OpenMP)) {
GPUArchName = Args.getLastArgValue(options::OPT_march_EQ);		GPUArchName = Args.getLastArgValue(options::OPT_march_EQ);
assert(!GPUArchName.empty() && "Must have an architecture passed in.");		assert(!GPUArchName.empty() && "Must have an architecture passed in.");
} else		} else
GPUArchName = JA.getOffloadingArch();		GPUArchName = JA.getOffloadingArch();

// Obtain architecture from the action.		// Obtain architecture from the action.
CudaArch gpu_arch = StringToCudaArch(GPUArchName);		CudaArch gpu_arch = StringToCudaArch(GPUArchName);
assert(gpu_arch != CudaArch::UNKNOWN &&		assert((gpu_arch != CudaArch::UNKNOWN ||
		Args.hasArg(options::OPT_nocudalib)) &&
		tra (Unsubmitted, Not Done) · Reply · Inline Actions: The purpose of the original assert was to catch a programming error and this change negates that purpose. Perhaps I'm missing something. Could you elaborate on what's the motivation for this particular change? I don't understand why it would be OK to end up with an unknown GPU architecture if -nocudalib is specified. You still do want to pass some specific GPU arch to ptxas and that has nothing to do with whether you happen to have suitable libdevice. tra: The purpose of the original assert was to catch a programming error and this change negates…
"Device action expected to have an architecture.");		"Device action expected to have an architecture.");

// Check that our installation's ptxas supports gpu_arch.		// Check that our installation's ptxas supports gpu_arch.
if (!Args.hasArg(options::OPT_no_cuda_version_check)) {		if (!Args.hasArg(options::OPT_no_cuda_version_check)) {
TC.CudaInstallation.CheckCudaVersionSupportsArch(gpu_arch);		TC.CudaInstallation.CheckCudaVersionSupportsArch(gpu_arch);
}		}

ArgStringList CmdArgs;		ArgStringList CmdArgs;
▲ Show 20 Lines • Show All 222 Lines • ▼ Show 20 Lines	if (DeviceOffloadingKind == Action::OFK_Cuda) {

if (DriverArgs.hasFlag(options::OPT_fcuda_flush_denormals_to_zero,		if (DriverArgs.hasFlag(options::OPT_fcuda_flush_denormals_to_zero,
options::OPT_fno_cuda_flush_denormals_to_zero, false))		options::OPT_fno_cuda_flush_denormals_to_zero, false))
CC1Args.push_back("-fcuda-flush-denormals-to-zero");		CC1Args.push_back("-fcuda-flush-denormals-to-zero");

if (DriverArgs.hasFlag(options::OPT_fcuda_approx_transcendentals,		if (DriverArgs.hasFlag(options::OPT_fcuda_approx_transcendentals,
options::OPT_fno_cuda_approx_transcendentals, false))		options::OPT_fno_cuda_approx_transcendentals, false))
CC1Args.push_back("-fcuda-approx-transcendentals");		CC1Args.push_back("-fcuda-approx-transcendentals");
		}

if (DriverArgs.hasArg(options::OPT_nocudalib))		if (DriverArgs.hasArg(options::OPT_nocudalib))
return;		return;
}

std::string LibDeviceFile = CudaInstallation.getLibDeviceFile(GpuArch);		std::string LibDeviceFile = CudaInstallation.getLibDeviceFile(GpuArch);

if (LibDeviceFile.empty()) {		if (LibDeviceFile.empty()) {
getDriver().Diag(diag::err_drv_no_cuda_libdevice) << GpuArch;		getDriver().Diag(diag::err_drv_no_cuda_libdevice) << GpuArch;
return;		return;
}		}

▲ Show 20 Lines • Show All 154 Lines • Show Last 20 Lines

test/Driver/openmp-offload-gpu.c

	Show First 20 Lines • Show All 119 Lines • ▼ Show 20 Lines
	/// ###########################################################################			/// ###########################################################################

	/// PTXAS is passed -c flag by default when offloading to an NVIDIA device using OpenMP			/// PTXAS is passed -c flag by default when offloading to an NVIDIA device using OpenMP
	/// Check that the flag is passed when -fopenmp-relocatable-target is used.			/// Check that the flag is passed when -fopenmp-relocatable-target is used.
	// RUN: %clang -### -fopenmp=libomp -fopenmp-targets=nvptx64-nvidia-cuda -fopenmp-relocatable-target -save-temps -no-canonical-prefixes %s 2>&1 \			// RUN: %clang -### -fopenmp=libomp -fopenmp-targets=nvptx64-nvidia-cuda -fopenmp-relocatable-target -save-temps -no-canonical-prefixes %s 2>&1 \
	// RUN: | FileCheck -check-prefix=CHK-PTXAS-RELO %s			// RUN: | FileCheck -check-prefix=CHK-PTXAS-RELO %s

	// CHK-PTXAS-RELO: ptxas{{.*}}" "-c"			// CHK-PTXAS-RELO: ptxas{{.*}}" "-c"

				/// ###########################################################################

				/// Check that error is not thrown by toolchain when no cuda lib flag is used.
				/// Check that the flag is passed when -fopenmp-relocatable-target is used.
				// RUN: %clang -### -fopenmp=libomp -fopenmp-targets=nvptx64-nvidia-cuda -Xopenmp-target -march=sm_99 -nocudalib -fopenmp-relocatable-target -save-temps -no-canonical-prefixes %s 2>&1 \
				tra (Unsubmitted, Not Done) · Reply · Inline Actions: Please split this RUN line further. tra: Please split this RUN line further.
				// RUN: | FileCheck -check-prefix=CHK-FLAG-NOLIBDEVICE %s

				// CHK-FLAG-NOLIBDEVICE-NOT: error:{{.*}}sm_99

This is an archive of the discontinued LLVM Phabricator instance.

[OpenMP] Enable the existing nocudalib flag for OpenMP offloading toolchain. (Closed, Public)

Details

Diff Detail

Event Timeline

Revision Contents

Diff 115692

lib/Driver/ToolChains/Cuda.cpp

test/Driver/openmp-offload-gpu.c

[OpenMP] Enable the existing nocudalib flag for OpenMP offloading toolchain.
ClosedPublic