Diff 317664

clang/lib/Headers/__clang_cuda_builtin_vars.h

	Show All 21 Lines
	//			//
	// Example:			// Example:
	// int x = threadIdx.x;			// int x = threadIdx.x;
	// IR output:			// IR output:
	// %0 = call i32 @llvm.nvvm.read.ptx.sreg.tid.x() #3			// %0 = call i32 @llvm.nvvm.read.ptx.sreg.tid.x() #3
	// PTX output:			// PTX output:
	// mov.u32 %r2, %tid.x;			// mov.u32 %r2, %tid.x;

				#ifdef __OPENMP_NVPTX__
				traUnsubmitted Done Reply Inline Actions Perhaps we should move all C++-related code under `#ifdef __cplusplus` instead of cherry-picking them all one by one and let the compilation fail if some C code references builtin vars. tra: Perhaps we should move all C++-related code under `#ifdef __cplusplus` instead of cherry-picking…
				tianshilei1992AuthorUnsubmitted Done Reply Inline Actions Finally I decided to only include the header in C++ mode. For C mode, everything is unchanged, which means a compilation error will still be emitted because the variables are not defined. tianshilei1992: Finally I decided to only include the header in C++ mode. For C mode, everything is unchanged…
				#define __DEVICE__
				traUnsubmitted Done Reply Inline Actions You should use `__` prefix to avoid unintentional clashes with user-defined macros. `__DEVICE__` ? tra: You should use `__` prefix to avoid unintentional clashes with user-defined macros.
				#else
				#define __DEVICE__ __attribute__((device))
				#endif

	#define __CUDA_DEVICE_BUILTIN(FIELD, INTRINSIC) \			#define __CUDA_DEVICE_BUILTIN(FIELD, INTRINSIC) \
	__declspec(property(get = __fetch_builtin_##FIELD)) unsigned int FIELD; \			__declspec(property(get = __fetch_builtin_##FIELD)) unsigned int FIELD; \
	static inline __attribute__((always_inline)) \			static inline __attribute__((always_inline)) \
	__attribute__((device)) unsigned int __fetch_builtin_##FIELD(void) { \			__DEVICE__ unsigned int __fetch_builtin_##FIELD(void) { \
	return INTRINSIC; \			return INTRINSIC; \
	}			}

	#if __cplusplus >= 201103L			#if __cplusplus >= 201103L
				traUnsubmitted Done Reply Inline Actions Can we generate a sensible error instead? I'd rather fail in an obvious way during compilation than compile successfully into something that will not do what the user expected. tra: Can we generate a sensible error instead? I'd rather fail in an obvious way during compilation…
	#define __DELETE =delete			#define __DELETE =delete
	#else			#else
				jdoerfertUnsubmitted Done Reply Inline Actions Why do we need these `__fetch_builtins` (for C). They have a different name than in the C++ variant anyway. In C we could just not define the fetch stuff but only the Field. So `gridDim.x` will work fine. jdoerfert: Why do we need these __fetch_builtins (for C). They have a different name than in the C++…
				tianshilei1992AuthorUnsubmitted Done Reply Inline Actions `__declspec(property)` doesn't support C so that code was removed. tianshilei1992: `__declspec(property)` doesn't support C so that code was removed.
	#define __DELETE			#define __DELETE
	#endif			#endif

	// Make sure nobody can create instances of the special variable types. nvcc			// Make sure nobody can create instances of the special variable types. nvcc
	// also disallows taking address of special variables, so we disable address-of			// also disallows taking address of special variables, so we disable address-of
	// operator as well.			// operator as well.
	#define __CUDA_DISALLOW_BUILTINVAR_ACCESS(TypeName) \			#define __CUDA_DISALLOW_BUILTINVAR_ACCESS(TypeName) \
	__attribute__((device)) TypeName() __DELETE; \			__DEVICE__ TypeName() __DELETE; \
	__attribute__((device)) TypeName(const TypeName &) __DELETE; \			__DEVICE__ TypeName(const TypeName &) __DELETE; \
	__attribute__((device)) void operator=(const TypeName &) const __DELETE; \			__DEVICE__ void operator=(const TypeName &) const __DELETE; \
	__attribute__((device)) TypeName *operator&() const __DELETE			__DEVICE__ TypeName *operator&() const __DELETE

	struct __cuda_builtin_threadIdx_t {			struct __cuda_builtin_threadIdx_t {
	__CUDA_DEVICE_BUILTIN(x,__nvvm_read_ptx_sreg_tid_x());			__CUDA_DEVICE_BUILTIN(x,__nvvm_read_ptx_sreg_tid_x());
				Lint: Pre-merge checks Inline Actions clang-tidy: error: '__declspec' attributes are not enabled; use '-fdeclspec' or '-fms-extensions' to enable support for __declspec attributes [clang-diagnostic-error] not useful clang-tidy: error: use of undeclared identifier '__nvvm_read_ptx_sreg_tid_x' [clang-diagnostic-error] not useful Lint: Pre-merge checks: clang-tidy: error: '__declspec' attributes are not enabled; use '-fdeclspec' or '-fms…
	__CUDA_DEVICE_BUILTIN(y,__nvvm_read_ptx_sreg_tid_y());			__CUDA_DEVICE_BUILTIN(y,__nvvm_read_ptx_sreg_tid_y());
				Lint: Pre-merge checks Inline Actions clang-tidy: error: '__declspec' attributes are not enabled; use '-fdeclspec' or '-fms-extensions' to enable support for __declspec attributes [clang-diagnostic-error] not useful clang-tidy: error: use of undeclared identifier '__nvvm_read_ptx_sreg_tid_y' [clang-diagnostic-error] not useful Lint: Pre-merge checks: clang-tidy: error: '__declspec' attributes are not enabled; use '-fdeclspec' or '-fms…
	__CUDA_DEVICE_BUILTIN(z,__nvvm_read_ptx_sreg_tid_z());			__CUDA_DEVICE_BUILTIN(z,__nvvm_read_ptx_sreg_tid_z());
				Lint: Pre-merge checks Inline Actions clang-tidy: error: '__declspec' attributes are not enabled; use '-fdeclspec' or '-fms-extensions' to enable support for __declspec attributes [clang-diagnostic-error] not useful clang-tidy: error: use of undeclared identifier '__nvvm_read_ptx_sreg_tid_z' [clang-diagnostic-error] not useful Lint: Pre-merge checks: clang-tidy: error: '__declspec' attributes are not enabled; use '-fdeclspec' or '-fms…
	// threadIdx should be convertible to uint3 (in fact in nvcc, it is a			// threadIdx should be convertible to uint3 (in fact in nvcc, it is a
	// uint3). This function is defined after we pull in vector_types.h.			// uint3). This function is defined after we pull in vector_types.h.
	__attribute__((device)) operator dim3() const;			__DEVICE__ operator dim3() const;
				Lint: Pre-merge checks Inline Actions clang-tidy: warning: 'device' attribute ignored [clang-diagnostic-ignored-attributes] not useful Lint: Pre-merge checks: clang-tidy: warning: 'device' attribute ignored [clang-diagnostic-ignored-attributes] [[https…
	__attribute__((device)) operator uint3() const;			__DEVICE__ operator uint3() const;
				Lint: Pre-merge checks Inline Actions clang-tidy: warning: 'device' attribute ignored [clang-diagnostic-ignored-attributes] not useful Lint: Pre-merge checks: clang-tidy: warning: 'device' attribute ignored [clang-diagnostic-ignored-attributes] [[https…
				tianshilei1992AuthorUnsubmitted Done Reply Inline Actions How can we deal with the conversion in C? tianshilei1992: How can we deal with the conversion in C?
				jdoerfertUnsubmitted Done Reply Inline Actions We don't. Given that CUDA is C++ we can just limit ourselves to the C subset. jdoerfert: We don't. Given that CUDA is C++ we can just limit ourselves to the C subset.

	private:			private:
	__CUDA_DISALLOW_BUILTINVAR_ACCESS(__cuda_builtin_threadIdx_t);			__CUDA_DISALLOW_BUILTINVAR_ACCESS(__cuda_builtin_threadIdx_t);
	};			};

	struct __cuda_builtin_blockIdx_t {			struct __cuda_builtin_blockIdx_t {
	__CUDA_DEVICE_BUILTIN(x,__nvvm_read_ptx_sreg_ctaid_x());			__CUDA_DEVICE_BUILTIN(x,__nvvm_read_ptx_sreg_ctaid_x());
				Lint: Pre-merge checks Inline Actions clang-tidy: error: '__declspec' attributes are not enabled; use '-fdeclspec' or '-fms-extensions' to enable support for __declspec attributes [clang-diagnostic-error] not useful clang-tidy: error: use of undeclared identifier '__nvvm_read_ptx_sreg_ctaid_x' [clang-diagnostic-error] not useful Lint: Pre-merge checks: clang-tidy: error: '__declspec' attributes are not enabled; use '-fdeclspec' or '-fms…
	__CUDA_DEVICE_BUILTIN(y,__nvvm_read_ptx_sreg_ctaid_y());			__CUDA_DEVICE_BUILTIN(y,__nvvm_read_ptx_sreg_ctaid_y());
				Lint: Pre-merge checks Inline Actions clang-tidy: error: '__declspec' attributes are not enabled; use '-fdeclspec' or '-fms-extensions' to enable support for __declspec attributes [clang-diagnostic-error] not useful clang-tidy: error: use of undeclared identifier '__nvvm_read_ptx_sreg_ctaid_y' [clang-diagnostic-error] not useful Lint: Pre-merge checks: clang-tidy: error: '__declspec' attributes are not enabled; use '-fdeclspec' or '-fms…
	__CUDA_DEVICE_BUILTIN(z,__nvvm_read_ptx_sreg_ctaid_z());			__CUDA_DEVICE_BUILTIN(z,__nvvm_read_ptx_sreg_ctaid_z());
				Lint: Pre-merge checks Inline Actions clang-tidy: error: '__declspec' attributes are not enabled; use '-fdeclspec' or '-fms-extensions' to enable support for __declspec attributes [clang-diagnostic-error] not useful clang-tidy: error: use of undeclared identifier '__nvvm_read_ptx_sreg_ctaid_z' [clang-diagnostic-error] not useful Lint: Pre-merge checks: clang-tidy: error: '__declspec' attributes are not enabled; use '-fdeclspec' or '-fms…
	// blockIdx should be convertible to uint3 (in fact in nvcc, it is a			// blockIdx should be convertible to uint3 (in fact in nvcc, it is a
	// uint3). This function is defined after we pull in vector_types.h.			// uint3). This function is defined after we pull in vector_types.h.
	__attribute__((device)) operator dim3() const;			__DEVICE__ operator dim3() const;
				Lint: Pre-merge checks Inline Actions clang-tidy: warning: 'device' attribute ignored [clang-diagnostic-ignored-attributes] not useful Lint: Pre-merge checks: clang-tidy: warning: 'device' attribute ignored [clang-diagnostic-ignored-attributes] [[https…
	__attribute__((device)) operator uint3() const;			__DEVICE__ operator uint3() const;
				Lint: Pre-merge checks Inline Actions clang-tidy: warning: 'device' attribute ignored [clang-diagnostic-ignored-attributes] not useful Lint: Pre-merge checks: clang-tidy: warning: 'device' attribute ignored [clang-diagnostic-ignored-attributes] [[https…

	private:			private:
	__CUDA_DISALLOW_BUILTINVAR_ACCESS(__cuda_builtin_blockIdx_t);			__CUDA_DISALLOW_BUILTINVAR_ACCESS(__cuda_builtin_blockIdx_t);
	};			};

	struct __cuda_builtin_blockDim_t {			struct __cuda_builtin_blockDim_t {
	__CUDA_DEVICE_BUILTIN(x,__nvvm_read_ptx_sreg_ntid_x());			__CUDA_DEVICE_BUILTIN(x,__nvvm_read_ptx_sreg_ntid_x());
				Lint: Pre-merge checks Inline Actions clang-tidy: error: '__declspec' attributes are not enabled; use '-fdeclspec' or '-fms-extensions' to enable support for __declspec attributes [clang-diagnostic-error] not useful clang-tidy: error: use of undeclared identifier '__nvvm_read_ptx_sreg_ntid_x' [clang-diagnostic-error] not useful Lint: Pre-merge checks: clang-tidy: error: '__declspec' attributes are not enabled; use '-fdeclspec' or '-fms…
	__CUDA_DEVICE_BUILTIN(y,__nvvm_read_ptx_sreg_ntid_y());			__CUDA_DEVICE_BUILTIN(y,__nvvm_read_ptx_sreg_ntid_y());
				Lint: Pre-merge checks Inline Actions clang-tidy: error: '__declspec' attributes are not enabled; use '-fdeclspec' or '-fms-extensions' to enable support for __declspec attributes [clang-diagnostic-error] not useful clang-tidy: error: use of undeclared identifier '__nvvm_read_ptx_sreg_ntid_y' [clang-diagnostic-error] not useful Lint: Pre-merge checks: clang-tidy: error: '__declspec' attributes are not enabled; use '-fdeclspec' or '-fms…
	__CUDA_DEVICE_BUILTIN(z,__nvvm_read_ptx_sreg_ntid_z());			__CUDA_DEVICE_BUILTIN(z,__nvvm_read_ptx_sreg_ntid_z());
				Lint: Pre-merge checks Inline Actions clang-tidy: error: '__declspec' attributes are not enabled; use '-fdeclspec' or '-fms-extensions' to enable support for __declspec attributes [clang-diagnostic-error] not useful clang-tidy: error: use of undeclared identifier '__nvvm_read_ptx_sreg_ntid_z' [clang-diagnostic-error] not useful Lint: Pre-merge checks: clang-tidy: error: '__declspec' attributes are not enabled; use '-fdeclspec' or '-fms…
	// blockDim should be convertible to dim3 (in fact in nvcc, it is a			// blockDim should be convertible to dim3 (in fact in nvcc, it is a
	// dim3). This function is defined after we pull in vector_types.h.			// dim3). This function is defined after we pull in vector_types.h.
	__attribute__((device)) operator dim3() const;			__DEVICE__ operator dim3() const;
				Lint: Pre-merge checks Inline Actions clang-tidy: warning: 'device' attribute ignored [clang-diagnostic-ignored-attributes] not useful Lint: Pre-merge checks: clang-tidy: warning: 'device' attribute ignored [clang-diagnostic-ignored-attributes] [[https…
	__attribute__((device)) operator uint3() const;			__DEVICE__ operator uint3() const;
				Lint: Pre-merge checks Inline Actions clang-tidy: warning: 'device' attribute ignored [clang-diagnostic-ignored-attributes] not useful Lint: Pre-merge checks: clang-tidy: warning: 'device' attribute ignored [clang-diagnostic-ignored-attributes] [[https…

	private:			private:
	__CUDA_DISALLOW_BUILTINVAR_ACCESS(__cuda_builtin_blockDim_t);			__CUDA_DISALLOW_BUILTINVAR_ACCESS(__cuda_builtin_blockDim_t);
	};			};

	struct __cuda_builtin_gridDim_t {			struct __cuda_builtin_gridDim_t {
	__CUDA_DEVICE_BUILTIN(x,__nvvm_read_ptx_sreg_nctaid_x());			__CUDA_DEVICE_BUILTIN(x,__nvvm_read_ptx_sreg_nctaid_x());
				Lint: Pre-merge checks Inline Actions clang-tidy: error: '__declspec' attributes are not enabled; use '-fdeclspec' or '-fms-extensions' to enable support for __declspec attributes [clang-diagnostic-error] not useful Lint: Pre-merge checks: clang-tidy: error: '__declspec' attributes are not enabled; use '-fdeclspec' or '-fms…
	__CUDA_DEVICE_BUILTIN(y,__nvvm_read_ptx_sreg_nctaid_y());			__CUDA_DEVICE_BUILTIN(y,__nvvm_read_ptx_sreg_nctaid_y());
	__CUDA_DEVICE_BUILTIN(z,__nvvm_read_ptx_sreg_nctaid_z());			__CUDA_DEVICE_BUILTIN(z,__nvvm_read_ptx_sreg_nctaid_z());
	// gridDim should be convertible to dim3 (in fact in nvcc, it is a			// gridDim should be convertible to dim3 (in fact in nvcc, it is a
	// dim3). This function is defined after we pull in vector_types.h.			// dim3). This function is defined after we pull in vector_types.h.
	__attribute__((device)) operator dim3() const;			__DEVICE__ operator dim3() const;
	__attribute__((device)) operator uint3() const;			__DEVICE__ operator uint3() const;

	private:			private:
	__CUDA_DISALLOW_BUILTINVAR_ACCESS(__cuda_builtin_gridDim_t);			__CUDA_DISALLOW_BUILTINVAR_ACCESS(__cuda_builtin_gridDim_t);
	};			};

	#define __CUDA_BUILTIN_VAR \			#define __CUDA_BUILTIN_VAR extern const __DEVICE__ __attribute__((weak))
	extern const __attribute__((device)) __attribute__((weak))
	__CUDA_BUILTIN_VAR __cuda_builtin_threadIdx_t threadIdx;			__CUDA_BUILTIN_VAR __cuda_builtin_threadIdx_t threadIdx;
	__CUDA_BUILTIN_VAR __cuda_builtin_blockIdx_t blockIdx;			__CUDA_BUILTIN_VAR __cuda_builtin_blockIdx_t blockIdx;
	__CUDA_BUILTIN_VAR __cuda_builtin_blockDim_t blockDim;			__CUDA_BUILTIN_VAR __cuda_builtin_blockDim_t blockDim;
	__CUDA_BUILTIN_VAR __cuda_builtin_gridDim_t gridDim;			__CUDA_BUILTIN_VAR __cuda_builtin_gridDim_t gridDim;

	// warpSize should translate to read of %WARP_SZ but there's currently no			// warpSize should translate to read of %WARP_SZ but there's currently no
	// builtin to do so. According to PTX v4.2 docs 'to date, all target			// builtin to do so. According to PTX v4.2 docs 'to date, all target
	// architectures have a WARP_SZ value of 32'.			// architectures have a WARP_SZ value of 32'.
	__attribute__((device)) const int warpSize = 32;			__DEVICE__ const int warpSize = 32;
				jdoerfertUnsubmitted Done Reply Inline Actions Do we need to do something wrt the attribute here and above? jdoerfert: Do we need to do something wrt the attribute here and above?

	#undef __CUDA_DEVICE_BUILTIN			#undef __CUDA_DEVICE_BUILTIN
	#undef __CUDA_BUILTIN_VAR			#undef __CUDA_BUILTIN_VAR
	#undef __CUDA_DISALLOW_BUILTINVAR_ACCESS			#undef __CUDA_DISALLOW_BUILTINVAR_ACCESS
	#undef __DELETE			#undef __DELETE
				#undef __DEVICE__
				traUnsubmitted Done Reply Inline Actions You need to `#undef` the DEVICE macro here. tra: You need to `#undef` the DEVICE macro here.

	#endif /* __CUDA_BUILTIN_VARS_H */			#endif /* __CUDA_BUILTIN_VARS_H */

clang/lib/Headers/openmp_wrappers/__clang_openmp_device_functions.h

	/*===- __clang_openmp_device_functions.h - OpenMP device function declares -===			/*===- __clang_openmp_device_functions.h - OpenMP device function declares -===
	*			*
	* Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.			* Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
	* See https://llvm.org/LICENSE.txt for license information.			* See https://llvm.org/LICENSE.txt for license information.
	* SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception			* SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
	*			*
	*===-----------------------------------------------------------------------===			*===-----------------------------------------------------------------------===
	*/			*/

	#ifndef __CLANG_OPENMP_DEVICE_FUNCTIONS_H__			#ifndef __CLANG_OPENMP_DEVICE_FUNCTIONS_H__
	#define __CLANG_OPENMP_DEVICE_FUNCTIONS_H__			#define __CLANG_OPENMP_DEVICE_FUNCTIONS_H__

	#ifndef _OPENMP			#ifndef _OPENMP
	#error "This file is for OpenMP compilation only."			#error "This file is for OpenMP compilation only."
				Lint: Pre-merge checks Inline Actions clang-tidy: error: "This file is for OpenMP compilation only." [clang-diagnostic-error] not useful Lint: Pre-merge checks: clang-tidy: error: "This file is for OpenMP compilation only." [clang-diagnostic-error] [[https…
	#endif			#endif

	#pragma omp begin declare variant match( \			#pragma omp begin declare variant match( \
	device = {arch(nvptx, nvptx64)}, implementation = {extension(match_any)})			device = {arch(nvptx, nvptx64)}, implementation = {extension(match_any)})

	#ifdef __cplusplus			#ifdef __cplusplus
	extern "C" {			extern "C" {
	#endif			#endif

	#define __CUDA__			#define __CUDA__
	#define __OPENMP_NVPTX__			#define __OPENMP_NVPTX__

	/// Include declarations for libdevice functions.			/// Include declarations for libdevice functions.
	#include <__clang_cuda_libdevice_declares.h>			#include <__clang_cuda_libdevice_declares.h>

	/// Provide definitions for these functions.			/// Provide definitions for these functions.
	#include <__clang_cuda_device_functions.h>			#include <__clang_cuda_device_functions.h>

				/// Provide definition for CUDA builtin variables.
				/// The header is using features only available in C++ so we only include it in
				/// C++ mode.
				#ifdef __cplusplus
				#include <__clang_cuda_builtin_vars.h>
				#endif

	#undef __OPENMP_NVPTX__			#undef __OPENMP_NVPTX__
	#undef __CUDA__			#undef __CUDA__

	#ifdef __cplusplus			#ifdef __cplusplus
	} // extern "C"			} // extern "C"
	#endif			#endif

	#pragma omp end declare variant			#pragma omp end declare variant

	#endif			#endif

clang/test/Headers/nvptx_device_cmath_functions.cpp

	// Test calling of device math functions.			// Test calling of device math functions.
	///==========================================================================///			///==========================================================================///

	// REQUIRES: nvptx-registered-target			// REQUIRES: nvptx-registered-target

	// RUN: %clang_cc1 -internal-isystem %S/Inputs/include -x c++ -fopenmp -triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm-bc %s -o %t-ppc-host.bc			// RUN: %clang_cc1 -internal-isystem %S/Inputs/include -x c++ -fopenmp -triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm-bc %s -o %t-ppc-host.bc
	// RUN: %clang_cc1 -internal-isystem %S/../../lib/Headers/openmp_wrappers -include __clang_openmp_device_functions.h -internal-isystem %S/Inputs/include -x c++ -fopenmp -triple nvptx64-nvidia-cuda -aux-triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm %s -fopenmp-is-device -fopenmp-host-ir-file-path %t-ppc-host.bc -o - \| FileCheck -check-prefix CHECK-YES %s			// RUN: %clang_cc1 -internal-isystem %S/../../lib/Headers/openmp_wrappers -include __clang_openmp_device_functions.h -fdeclspec -internal-isystem %S/Inputs/include -x c++ -fopenmp -triple nvptx64-nvidia-cuda -aux-triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm %s -fopenmp-is-device -fopenmp-host-ir-file-path %t-ppc-host.bc -o - \| FileCheck -check-prefix CHECK-YES %s

	#include <cmath>			#include <cmath>
	#include <cstdlib>			#include <cstdlib>

	void test_sqrt(double a1) {			void test_sqrt(double a1) {
	#pragma omp target			#pragma omp target
	{			{
	// CHECK-YES: call double @__nv_sqrt(double			// CHECK-YES: call double @__nv_sqrt(double
	Show All 11 Lines

clang/test/Headers/nvptx_device_cmath_functions_cxx17.cpp

	// Test calling of device math functions.			// Test calling of device math functions.
	///==========================================================================///			///==========================================================================///

	// REQUIRES: nvptx-registered-target			// REQUIRES: nvptx-registered-target

	// RUN: %clang_cc1 -internal-isystem %S/Inputs/include -x c++ -fopenmp -triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm-bc %s -o %t-ppc-host.bc -std=c++17			// RUN: %clang_cc1 -internal-isystem %S/Inputs/include -x c++ -fopenmp -triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm-bc %s -o %t-ppc-host.bc -std=c++17
	// RUN: %clang_cc1 -internal-isystem %S/../../lib/Headers/openmp_wrappers -include __clang_openmp_device_functions.h -internal-isystem %S/../../lib/Headers/openmp_wrappers -internal-isystem %S/Inputs/include -x c++ -fopenmp -triple nvptx64-nvidia-cuda -aux-triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm %s -fopenmp-is-device -fopenmp-host-ir-file-path %t-ppc-host.bc -std=c++17 -o - \| FileCheck -check-prefix CHECK-YES %s			// RUN: %clang_cc1 -internal-isystem %S/../../lib/Headers/openmp_wrappers -include __clang_openmp_device_functions.h -fdeclspec -internal-isystem %S/../../lib/Headers/openmp_wrappers -internal-isystem %S/Inputs/include -x c++ -fopenmp -triple nvptx64-nvidia-cuda -aux-triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm %s -fopenmp-is-device -fopenmp-host-ir-file-path %t-ppc-host.bc -std=c++17 -o - \| FileCheck -check-prefix CHECK-YES %s

	#include <cmath>			#include <cmath>
	#include <cstdlib>			#include <cstdlib>

	void test_sqrt(double a1) {			void test_sqrt(double a1) {
	#pragma omp target			#pragma omp target
	{			{
	// CHECK-YES: call double @__nv_sqrt(double			// CHECK-YES: call double @__nv_sqrt(double
	Show All 11 Lines

clang/test/Headers/nvptx_device_math_complex.c

	// REQUIRES: nvptx-registered-target			// REQUIRES: nvptx-registered-target
	// RUN: %clang_cc1 -verify -internal-isystem %S/Inputs/include -fopenmp -x c -triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm-bc %s -o %t-ppc-host.bc			// RUN: %clang_cc1 -verify -internal-isystem %S/Inputs/include -fopenmp -x c -triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm-bc %s -o %t-ppc-host.bc
	// RUN: %clang_cc1 -verify -internal-isystem %S/../../lib/Headers/openmp_wrappers -include __clang_openmp_device_functions.h -internal-isystem %S/Inputs/include -fopenmp -x c -triple nvptx64-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm %s -fopenmp-is-device -fopenmp-host-ir-file-path %t-ppc-host.bc -aux-triple powerpc64le-unknown-unknown -o - \| FileCheck %s			// RUN: %clang_cc1 -verify -internal-isystem %S/../../lib/Headers/openmp_wrappers -include __clang_openmp_device_functions.h -internal-isystem %S/Inputs/include -fopenmp -x c -triple nvptx64-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm %s -fopenmp-is-device -fopenmp-host-ir-file-path %t-ppc-host.bc -aux-triple powerpc64le-unknown-unknown -o - \| FileCheck %s
	// RUN: %clang_cc1 -verify -internal-isystem %S/Inputs/include -fopenmp -x c++ -triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm-bc %s -o %t-ppc-host.bc			// RUN: %clang_cc1 -verify -internal-isystem %S/Inputs/include -fopenmp -x c++ -triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm-bc %s -o %t-ppc-host.bc
	// RUN: %clang_cc1 -verify -internal-isystem %S/../../lib/Headers/openmp_wrappers -include __clang_openmp_device_functions.h -internal-isystem %S/Inputs/include -fopenmp -x c++ -triple nvptx64-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm %s -fopenmp-is-device -fopenmp-host-ir-file-path %t-ppc-host.bc -aux-triple powerpc64le-unknown-unknown -o - \| FileCheck %s			// RUN: %clang_cc1 -verify -internal-isystem %S/../../lib/Headers/openmp_wrappers -include __clang_openmp_device_functions.h -fdeclspec -internal-isystem %S/Inputs/include -fopenmp -x c++ -triple nvptx64-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm %s -fopenmp-is-device -fopenmp-host-ir-file-path %t-ppc-host.bc -aux-triple powerpc64le-unknown-unknown -o - \| FileCheck %s
	// expected-no-diagnostics			// expected-no-diagnostics

	#ifdef __cplusplus			#ifdef __cplusplus
	#include <complex>			#include <complex>
	#else			#else
	#include <complex.h>			#include <complex.h>
	#endif			#endif

	▲ Show 20 Lines • Show All 41 Lines • Show Last 20 Lines

clang/test/Headers/nvptx_device_math_complex.cpp

	// REQUIRES: nvptx-registered-target			// REQUIRES: nvptx-registered-target
	// RUN: %clang_cc1 -verify -internal-isystem %S/Inputs/include -fopenmp -x c++ -triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm-bc %s -o %t-ppc-host.bc			// RUN: %clang_cc1 -verify -internal-isystem %S/Inputs/include -fopenmp -x c++ -triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm-bc %s -o %t-ppc-host.bc
	// RUN: %clang_cc1 -verify -internal-isystem %S/../../lib/Headers/openmp_wrappers -include __clang_openmp_device_functions.h -internal-isystem %S/Inputs/include -fopenmp -x c++ -triple nvptx64-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm %s -fopenmp-is-device -fopenmp-host-ir-file-path %t-ppc-host.bc -aux-triple powerpc64le-unknown-unknown -o - \| FileCheck %s			// RUN: %clang_cc1 -verify -internal-isystem %S/../../lib/Headers/openmp_wrappers -include __clang_openmp_device_functions.h -fdeclspec -internal-isystem %S/Inputs/include -fopenmp -x c++ -triple nvptx64-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm %s -fopenmp-is-device -fopenmp-host-ir-file-path %t-ppc-host.bc -aux-triple powerpc64le-unknown-unknown -o - \| FileCheck %s
	// expected-no-diagnostics			// expected-no-diagnostics

	#include <cmath>			#include <cmath>
	#include <complex>			#include <complex>

	// CHECK: define weak {{.*}} @__muldc3			// CHECK: define weak {{.*}} @__muldc3
	// CHECK-DAG: call i32 @__nv_isnand(			// CHECK-DAG: call i32 @__nv_isnand(
	// CHECK-DAG: call i32 @__nv_isinfd(			// CHECK-DAG: call i32 @__nv_isinfd(
	▲ Show 20 Lines • Show All 76 Lines • Show Last 20 Lines

clang/test/Headers/nvptx_device_math_functions.c

	// Test calling of device math functions.			// Test calling of device math functions.
	///==========================================================================///			///==========================================================================///

	// REQUIRES: nvptx-registered-target			// REQUIRES: nvptx-registered-target

	// RUN: %clang_cc1 -x c -internal-isystem %S/Inputs/include -fopenmp -triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm-bc %s -o %t-ppc-host.bc			// RUN: %clang_cc1 -x c -internal-isystem %S/Inputs/include -fopenmp -triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm-bc %s -o %t-ppc-host.bc
	// RUN: %clang_cc1 -x c -internal-isystem %S/../../lib/Headers/openmp_wrappers -include __clang_openmp_device_functions.h -internal-isystem %S/Inputs/include -fopenmp -triple nvptx64-nvidia-cuda -aux-triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm %s -fopenmp-is-device -fopenmp-host-ir-file-path %t-ppc-host.bc -o - \| FileCheck %s			// RUN: %clang_cc1 -x c -internal-isystem %S/../../lib/Headers/openmp_wrappers -include __clang_openmp_device_functions.h -internal-isystem %S/Inputs/include -fopenmp -triple nvptx64-nvidia-cuda -aux-triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm %s -fopenmp-is-device -fopenmp-host-ir-file-path %t-ppc-host.bc -o - \| FileCheck %s
	// RUN: %clang_cc1 -x c++ -internal-isystem %S/Inputs/include -fopenmp -triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm-bc %s -o %t-ppc-host.bc			// RUN: %clang_cc1 -x c++ -internal-isystem %S/Inputs/include -fopenmp -triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm-bc %s -o %t-ppc-host.bc
	// RUN: %clang_cc1 -x c++ -internal-isystem %S/../../lib/Headers/openmp_wrappers -include __clang_openmp_device_functions.h -internal-isystem %S/Inputs/include -fopenmp -triple nvptx64-nvidia-cuda -aux-triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm %s -fopenmp-is-device -fopenmp-host-ir-file-path %t-ppc-host.bc -o - \| FileCheck %s			// RUN: %clang_cc1 -x c++ -internal-isystem %S/../../lib/Headers/openmp_wrappers -include __clang_openmp_device_functions.h -fdeclspec -internal-isystem %S/Inputs/include -fopenmp -triple nvptx64-nvidia-cuda -aux-triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm %s -fopenmp-is-device -fopenmp-host-ir-file-path %t-ppc-host.bc -o - \| FileCheck %s

	#ifdef __cplusplus			#ifdef __cplusplus
	#include <cstdlib>			#include <cstdlib>
	#include <cmath>			#include <cmath>
	#else			#else
	#include <stdlib.h>			#include <stdlib.h>
	#include <math.h>			#include <math.h>
	#endif			#endif
	Show All 16 Lines

clang/test/Headers/nvptx_device_math_functions.cpp

	// Test calling of device math functions.			// Test calling of device math functions.
	///==========================================================================///			///==========================================================================///

	// REQUIRES: nvptx-registered-target			// REQUIRES: nvptx-registered-target

	// RUN: %clang_cc1 -internal-isystem %S/Inputs/include -x c++ -fopenmp -triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm-bc %s -o %t-ppc-host.bc			// RUN: %clang_cc1 -internal-isystem %S/Inputs/include -x c++ -fopenmp -triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm-bc %s -o %t-ppc-host.bc
	// RUN: %clang_cc1 -internal-isystem %S/../../lib/Headers/openmp_wrappers -include __clang_openmp_device_functions.h -internal-isystem %S/../../lib/Headers/openmp_wrappers -internal-isystem %S/Inputs/include -x c++ -fopenmp -triple nvptx64-nvidia-cuda -aux-triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm %s -fopenmp-is-device -fopenmp-host-ir-file-path %t-ppc-host.bc -o - \| FileCheck -check-prefix CHECK-YES %s			// RUN: %clang_cc1 -internal-isystem %S/../../lib/Headers/openmp_wrappers -include __clang_openmp_device_functions.h -fdeclspec -internal-isystem %S/../../lib/Headers/openmp_wrappers -internal-isystem %S/Inputs/include -x c++ -fopenmp -triple nvptx64-nvidia-cuda -aux-triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm %s -fopenmp-is-device -fopenmp-host-ir-file-path %t-ppc-host.bc -o - \| FileCheck -check-prefix CHECK-YES %s

	#include <cstdlib>			#include <cstdlib>
	#include <cmath>			#include <cmath>

	void test_sqrt(double a1) {			void test_sqrt(double a1) {
	#pragma omp target			#pragma omp target
	{			{
	// CHECK-YES: call double @__nv_sqrt(double			// CHECK-YES: call double @__nv_sqrt(double
	Show All 11 Lines

clang/test/Headers/nvptx_device_math_functions_cxx17.cpp

	// Test calling of device math functions.			// Test calling of device math functions.
	///==========================================================================///			///==========================================================================///

	// REQUIRES: nvptx-registered-target			// REQUIRES: nvptx-registered-target

	// RUN: %clang_cc1 -internal-isystem %S/Inputs/include -x c++ -fopenmp -triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm-bc %s -o %t-ppc-host.bc -std=c++17			// RUN: %clang_cc1 -internal-isystem %S/Inputs/include -x c++ -fopenmp -triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm-bc %s -o %t-ppc-host.bc -std=c++17
	// RUN: %clang_cc1 -internal-isystem %S/../../lib/Headers/openmp_wrappers -include __clang_openmp_device_functions.h -internal-isystem %S/../../lib/Headers/openmp_wrappers -internal-isystem %S/Inputs/include -x c++ -fopenmp -triple nvptx64-nvidia-cuda -aux-triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm %s -fopenmp-is-device -fopenmp-host-ir-file-path %t-ppc-host.bc -std=c++17 -o - \| FileCheck -check-prefix CHECK-YES %s			// RUN: %clang_cc1 -internal-isystem %S/../../lib/Headers/openmp_wrappers -include __clang_openmp_device_functions.h -fdeclspec -internal-isystem %S/../../lib/Headers/openmp_wrappers -internal-isystem %S/Inputs/include -x c++ -fopenmp -triple nvptx64-nvidia-cuda -aux-triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm %s -fopenmp-is-device -fopenmp-host-ir-file-path %t-ppc-host.bc -std=c++17 -o - \| FileCheck -check-prefix CHECK-YES %s

	#include <cstdlib>			#include <cstdlib>
	#include <cmath>			#include <cmath>

	void test_sqrt(double a1) {			void test_sqrt(double a1) {
	#pragma omp target			#pragma omp target
	{			{
	// CHECK-YES: call double @__nv_sqrt(double			// CHECK-YES: call double @__nv_sqrt(double
	Show All 11 Lines

clang/test/Headers/nvptx_device_math_macro.cpp

	// REQUIRES: nvptx-registered-target			// REQUIRES: nvptx-registered-target
	// RUN: %clang_cc1 -x c++ -internal-isystem %S/Inputs/include -fopenmp -triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm-bc %s -o %t-ppc-host.bc			// RUN: %clang_cc1 -x c++ -internal-isystem %S/Inputs/include -fopenmp -triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm-bc %s -o %t-ppc-host.bc
	// RUN: %clang_cc1 -x c++ -include __clang_openmp_device_functions.h -internal-isystem %S/../../lib/Headers/openmp_wrappers -internal-isystem %S/Inputs/include -fopenmp -triple nvptx64-nvidia-cuda -aux-triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm %s -fopenmp-is-device -fopenmp-host-ir-file-path %t-ppc-host.bc -o - \| FileCheck %s			// RUN: %clang_cc1 -x c++ -include __clang_openmp_device_functions.h -fdeclspec -internal-isystem %S/../../lib/Headers/openmp_wrappers -internal-isystem %S/Inputs/include -fopenmp -triple nvptx64-nvidia-cuda -aux-triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm %s -fopenmp-is-device -fopenmp-host-ir-file-path %t-ppc-host.bc -o - \| FileCheck %s
	// expected-no-diagnostics			// expected-no-diagnostics

	#include <cmath>			#include <cmath>

	#pragma omp declare target			#pragma omp declare target
	int use_macro() {			int use_macro() {
	double a(0);			double a(0);
	// CHECK-NOT: call {{.*}}			// CHECK-NOT: call {{.*}}
	// CHECK: call double @llvm.fabs.f64(double			// CHECK: call double @llvm.fabs.f64(double
	// CHECK-NOT: call {{.*}}			// CHECK-NOT: call {{.*}}
	// CHECK: ret i32 %conv			// CHECK: ret i32 %conv
	return (std::fpclassify(a) != FP_ZERO);			return (std::fpclassify(a) != FP_ZERO);
	}			}
	#pragma omp end declare target			#pragma omp end declare target

clang/test/Headers/nvptx_device_math_modf.cpp

	// REQUIRES: nvptx-registered-target			// REQUIRES: nvptx-registered-target
	// RUN: %clang_cc1 -internal-isystem %S/Inputs/include -fopenmp -triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm-bc %s -o %t-ppc-host.bc			// RUN: %clang_cc1 -internal-isystem %S/Inputs/include -fopenmp -triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm-bc %s -o %t-ppc-host.bc
	// RUN: %clang_cc1 -internal-isystem %S/../../lib/Headers/openmp_wrappers -include __clang_openmp_device_functions.h -internal-isystem %S/Inputs/include -fopenmp -triple nvptx64-nvidia-cuda -aux-triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm %s -fopenmp-is-device -fopenmp-host-ir-file-path %t-ppc-host.bc -o - \| FileCheck %s			// RUN: %clang_cc1 -internal-isystem %S/../../lib/Headers/openmp_wrappers -include __clang_openmp_device_functions.h -fdeclspec -internal-isystem %S/Inputs/include -fopenmp -triple nvptx64-nvidia-cuda -aux-triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm %s -fopenmp-is-device -fopenmp-host-ir-file-path %t-ppc-host.bc -o - \| FileCheck %s

	#include <cmath>			#include <cmath>

	// 4 calls to modf(f), all translated to __nv_modf calls:			// 4 calls to modf(f), all translated to __nv_modf calls:

	// CHECK-NOT: _Z.modf			// CHECK-NOT: _Z.modf
	// CHECK: call double @__nv_modf(double			// CHECK: call double @__nv_modf(double
	// CHECK-NOT: _Z.modf			// CHECK-NOT: _Z.modf
	▲ Show 20 Lines • Show All 42 Lines • Show Last 20 Lines

clang/test/Headers/nvptx_device_math_sin.cpp

	// REQUIRES: nvptx-registered-target			// REQUIRES: nvptx-registered-target
	// RUN: %clang_cc1 -x c++ -internal-isystem %S/Inputs/include -fopenmp -triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm-bc %s -o %t-ppc-host.bc			// RUN: %clang_cc1 -x c++ -internal-isystem %S/Inputs/include -fopenmp -triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm-bc %s -o %t-ppc-host.bc
	// RUN: %clang_cc1 -x c++ -include __clang_openmp_device_functions.h -internal-isystem %S/../../lib/Headers/openmp_wrappers -internal-isystem %S/Inputs/include -fopenmp -triple nvptx64-nvidia-cuda -aux-triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm %s -fopenmp-is-device -fopenmp-host-ir-file-path %t-ppc-host.bc -o - \| FileCheck %s --check-prefix=SLOW			// RUN: %clang_cc1 -x c++ -include __clang_openmp_device_functions.h -fdeclspec -internal-isystem %S/../../lib/Headers/openmp_wrappers -internal-isystem %S/Inputs/include -fopenmp -triple nvptx64-nvidia-cuda -aux-triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm %s -fopenmp-is-device -fopenmp-host-ir-file-path %t-ppc-host.bc -o - \| FileCheck %s --check-prefix=SLOW
	// RUN: %clang_cc1 -x c++ -internal-isystem %S/Inputs/include -fopenmp -triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm-bc %s -o %t-ppc-host.bc -ffast-math -ffp-contract=fast			// RUN: %clang_cc1 -x c++ -internal-isystem %S/Inputs/include -fopenmp -triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm-bc %s -o %t-ppc-host.bc -ffast-math -ffp-contract=fast
	// RUN: %clang_cc1 -x c++ -include __clang_openmp_device_functions.h -internal-isystem %S/../../lib/Headers/openmp_wrappers -internal-isystem %S/Inputs/include -fopenmp -triple nvptx64-nvidia-cuda -aux-triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm %s -fopenmp-is-device -fopenmp-host-ir-file-path %t-ppc-host.bc -o - -ffast-math -ffp-contract=fast \| FileCheck %s --check-prefix=FAST			// RUN: %clang_cc1 -x c++ -include __clang_openmp_device_functions.h -fdeclspec -internal-isystem %S/../../lib/Headers/openmp_wrappers -internal-isystem %S/Inputs/include -fopenmp -triple nvptx64-nvidia-cuda -aux-triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm %s -fopenmp-is-device -fopenmp-host-ir-file-path %t-ppc-host.bc -o - -ffast-math -ffp-contract=fast \| FileCheck %s --check-prefix=FAST
	// expected-no-diagnostics			// expected-no-diagnostics

	#include <cmath>			#include <cmath>

	double math(float f, double d) {			double math(float f, double d) {
	double r = 0;			double r = 0;
	// SLOW: call float @__nv_sinf(float			// SLOW: call float @__nv_sinf(float
	// FAST: call fast float @__nv_fast_sinf(float			// FAST: call fast float @__nv_fast_sinf(float
	Show All 14 Lines

clang/test/Headers/nvptx_device_math_sin_cos.cpp

	// REQUIRES: nvptx-registered-target			// REQUIRES: nvptx-registered-target
	// RUN: %clang_cc1 -internal-isystem %S/Inputs/include -fopenmp -triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm-bc %s -o %t-ppc-host.bc			// RUN: %clang_cc1 -internal-isystem %S/Inputs/include -fopenmp -triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm-bc %s -o %t-ppc-host.bc
	// RUN: %clang_cc1 -internal-isystem %S/../../lib/Headers/openmp_wrappers -include __clang_openmp_device_functions.h -internal-isystem %S/Inputs/include -fopenmp -triple nvptx64-nvidia-cuda -aux-triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm %s -fopenmp-is-device -fopenmp-host-ir-file-path %t-ppc-host.bc -o - \| FileCheck %s			// RUN: %clang_cc1 -internal-isystem %S/../../lib/Headers/openmp_wrappers -include __clang_openmp_device_functions.h -fdeclspec -internal-isystem %S/Inputs/include -fopenmp -triple nvptx64-nvidia-cuda -aux-triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm %s -fopenmp-is-device -fopenmp-host-ir-file-path %t-ppc-host.bc -o - \| FileCheck %s

	#include <cmath>			#include <cmath>

	// 6 calls to sin/cos(f), all translated to __nv_sin/__nv_cos calls:			// 6 calls to sin/cos(f), all translated to __nv_sin/__nv_cos calls:

	// CHECK-NOT: _Z.sin			// CHECK-NOT: _Z.sin
	// CHECK-NOT: _Z.cos			// CHECK-NOT: _Z.cos
	// CHECK: call double @__nv_sin(double			// CHECK: call double @__nv_sin(double
	▲ Show 20 Lines • Show All 52 Lines • Show Last 20 Lines

clang/test/Headers/nvptx_device_math_sincos.cpp

	// REQUIRES: nvptx-registered-target			// REQUIRES: nvptx-registered-target
	// RUN: %clang_cc1 -internal-isystem %S/Inputs/include -fopenmp -triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm-bc %s -o %t-ppc-host.bc			// RUN: %clang_cc1 -internal-isystem %S/Inputs/include -fopenmp -triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm-bc %s -o %t-ppc-host.bc
	// RUN: %clang_cc1 -internal-isystem %S/../../lib/Headers/openmp_wrappers -include __clang_openmp_device_functions.h -internal-isystem %S/Inputs/include -fopenmp -triple nvptx64-nvidia-cuda -aux-triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm %s -fopenmp-is-device -fopenmp-host-ir-file-path %t-ppc-host.bc -o - \| FileCheck %s			// RUN: %clang_cc1 -internal-isystem %S/../../lib/Headers/openmp_wrappers -include __clang_openmp_device_functions.h -fdeclspec -internal-isystem %S/Inputs/include -fopenmp -triple nvptx64-nvidia-cuda -aux-triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm %s -fopenmp-is-device -fopenmp-host-ir-file-path %t-ppc-host.bc -o - \| FileCheck %s
	// RUN: %clang_cc1 -internal-isystem %S/../../lib/Headers/openmp_wrappers -DCMATH -include __clang_openmp_device_functions.h -internal-isystem %S/Inputs/include -fopenmp -triple nvptx64-nvidia-cuda -aux-triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm %s -fopenmp-is-device -fopenmp-host-ir-file-path %t-ppc-host.bc -o - \| FileCheck %s			// RUN: %clang_cc1 -internal-isystem %S/../../lib/Headers/openmp_wrappers -DCMATH -include __clang_openmp_device_functions.h -fdeclspec -internal-isystem %S/Inputs/include -fopenmp -triple nvptx64-nvidia-cuda -aux-triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm %s -fopenmp-is-device -fopenmp-host-ir-file-path %t-ppc-host.bc -o - \| FileCheck %s

	#ifdef CMATH			#ifdef CMATH
	#include <cmath>			#include <cmath>
	#else			#else
	#include <math.h>			#include <math.h>
	#endif			#endif

	// 4 calls to sincos(f), all translated to __nv_sincos calls:			// 4 calls to sincos(f), all translated to __nv_sincos calls:
	▲ Show 20 Lines • Show All 51 Lines • Show Last 20 Lines

clang/test/Headers/openmp_device_math_isnan.cpp

	// RUN: %clang_cc1 -x c++ -internal-isystem %S/Inputs/include -fopenmp -triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm-bc %s -o %t-ppc-host.bc			// RUN: %clang_cc1 -x c++ -internal-isystem %S/Inputs/include -fopenmp -triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm-bc %s -o %t-ppc-host.bc
	// RUN: %clang_cc1 -x c++ -include __clang_openmp_device_functions.h -internal-isystem %S/../../lib/Headers/openmp_wrappers -internal-isystem %S/Inputs/include -fopenmp -triple nvptx64-nvidia-cuda -aux-triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm %s -fopenmp-is-device -fopenmp-host-ir-file-path %t-ppc-host.bc -o - \| FileCheck %s --check-prefix=BOOL_RETURN			// RUN: %clang_cc1 -x c++ -include __clang_openmp_device_functions.h -fdeclspec -internal-isystem %S/../../lib/Headers/openmp_wrappers -internal-isystem %S/Inputs/include -fopenmp -triple nvptx64-nvidia-cuda -aux-triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm %s -fopenmp-is-device -fopenmp-host-ir-file-path %t-ppc-host.bc -o - \| FileCheck %s --check-prefix=BOOL_RETURN
	// RUN: %clang_cc1 -x c++ -internal-isystem %S/Inputs/include -fopenmp -triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm-bc %s -o %t-ppc-host.bc -ffast-math -ffp-contract=fast			// RUN: %clang_cc1 -x c++ -internal-isystem %S/Inputs/include -fopenmp -triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm-bc %s -o %t-ppc-host.bc -ffast-math -ffp-contract=fast
	// RUN: %clang_cc1 -x c++ -include __clang_openmp_device_functions.h -internal-isystem %S/../../lib/Headers/openmp_wrappers -internal-isystem %S/Inputs/include -fopenmp -triple nvptx64-nvidia-cuda -aux-triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm %s -fopenmp-is-device -fopenmp-host-ir-file-path %t-ppc-host.bc -o - -ffast-math -ffp-contract=fast \| FileCheck %s --check-prefix=BOOL_RETURN			// RUN: %clang_cc1 -x c++ -include __clang_openmp_device_functions.h -fdeclspec -internal-isystem %S/../../lib/Headers/openmp_wrappers -internal-isystem %S/Inputs/include -fopenmp -triple nvptx64-nvidia-cuda -aux-triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm %s -fopenmp-is-device -fopenmp-host-ir-file-path %t-ppc-host.bc -o - -ffast-math -ffp-contract=fast \| FileCheck %s --check-prefix=BOOL_RETURN
	// RUN: %clang_cc1 -x c++ -internal-isystem %S/Inputs/include -fopenmp -triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm-bc %s -o %t-ppc-host.bc -DUSE_ISNAN_WITH_INT_RETURN			// RUN: %clang_cc1 -x c++ -internal-isystem %S/Inputs/include -fopenmp -triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm-bc %s -o %t-ppc-host.bc -DUSE_ISNAN_WITH_INT_RETURN
	// RUN: %clang_cc1 -x c++ -include __clang_openmp_device_functions.h -internal-isystem %S/../../lib/Headers/openmp_wrappers -internal-isystem %S/Inputs/include -fopenmp -triple nvptx64-nvidia-cuda -aux-triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm %s -fopenmp-is-device -fopenmp-host-ir-file-path %t-ppc-host.bc -o - -DUSE_ISNAN_WITH_INT_RETURN \| FileCheck %s --check-prefix=INT_RETURN			// RUN: %clang_cc1 -x c++ -include __clang_openmp_device_functions.h -fdeclspec -internal-isystem %S/../../lib/Headers/openmp_wrappers -internal-isystem %S/Inputs/include -fopenmp -triple nvptx64-nvidia-cuda -aux-triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm %s -fopenmp-is-device -fopenmp-host-ir-file-path %t-ppc-host.bc -o - -DUSE_ISNAN_WITH_INT_RETURN \| FileCheck %s --check-prefix=INT_RETURN
	// RUN: %clang_cc1 -x c++ -internal-isystem %S/Inputs/include -fopenmp -triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm-bc %s -o %t-ppc-host.bc -ffast-math -ffp-contract=fast -DUSE_ISNAN_WITH_INT_RETURN			// RUN: %clang_cc1 -x c++ -internal-isystem %S/Inputs/include -fopenmp -triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm-bc %s -o %t-ppc-host.bc -ffast-math -ffp-contract=fast -DUSE_ISNAN_WITH_INT_RETURN
	// RUN: %clang_cc1 -x c++ -include __clang_openmp_device_functions.h -internal-isystem %S/../../lib/Headers/openmp_wrappers -internal-isystem %S/Inputs/include -fopenmp -triple nvptx64-nvidia-cuda -aux-triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm %s -fopenmp-is-device -fopenmp-host-ir-file-path %t-ppc-host.bc -o - -ffast-math -ffp-contract=fast -DUSE_ISNAN_WITH_INT_RETURN \| FileCheck %s --check-prefix=INT_RETURN			// RUN: %clang_cc1 -x c++ -include __clang_openmp_device_functions.h -fdeclspec -internal-isystem %S/../../lib/Headers/openmp_wrappers -internal-isystem %S/Inputs/include -fopenmp -triple nvptx64-nvidia-cuda -aux-triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm %s -fopenmp-is-device -fopenmp-host-ir-file-path %t-ppc-host.bc -o - -ffast-math -ffp-contract=fast -DUSE_ISNAN_WITH_INT_RETURN \| FileCheck %s --check-prefix=INT_RETURN
	// expected-no-diagnostics			// expected-no-diagnostics

	#include <cmath>			#include <cmath>

	double math(float f, double d) {			double math(float f, double d) {
	double r = 0;			double r = 0;
	// INT_RETURN: call i32 @__nv_isnanf(float			// INT_RETURN: call i32 @__nv_isnanf(float
	// BOOL_RETURN: call i32 @__nv_isnanf(float			// BOOL_RETURN: call i32 @__nv_isnanf(float
	Show All 14 Lines

clang/test/OpenMP/assumes_include_nvptx.cpp

	// RUN: %clang_cc1 -x c++ -O1 -disable-llvm-optzns -verify -fopenmp -internal-isystem %S/../Headers/Inputs/include -internal-isystem %S/../../lib/Headers/openmp_wrappers -include __clang_openmp_device_functions.h -triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm-bc %s -o %t-ppc-host.bc			// RUN: %clang_cc1 -x c++ -O1 -disable-llvm-optzns -verify -fopenmp -internal-isystem %S/../Headers/Inputs/include -internal-isystem %S/../../lib/Headers/openmp_wrappers -include __clang_openmp_device_functions.h -fdeclspec -triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm-bc %s -o %t-ppc-host.bc
	// RUN: %clang_cc1 -x c++ -O1 -disable-llvm-optzns -verify -fopenmp -internal-isystem %S/../Headers/Inputs/include -internal-isystem %S/../../lib/Headers/openmp_wrappers -include __clang_openmp_device_functions.h -triple nvptx64-unknown-unknown -aux-triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm %s -fopenmp-is-device -fopenmp-host-ir-file-path %t-ppc-host.bc -o - \| FileCheck %s			// RUN: %clang_cc1 -x c++ -O1 -disable-llvm-optzns -verify -fopenmp -internal-isystem %S/../Headers/Inputs/include -internal-isystem %S/../../lib/Headers/openmp_wrappers -include __clang_openmp_device_functions.h -fdeclspec -triple nvptx64-unknown-unknown -aux-triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm %s -fopenmp-is-device -fopenmp-host-ir-file-path %t-ppc-host.bc -o - \| FileCheck %s
	// RUN: %clang_cc1 -x c++ -O1 -disable-llvm-optzns -verify -fopenmp -internal-isystem %S/../Headers/Inputs/include -internal-isystem %S/../../lib/Headers/openmp_wrappers -include __clang_openmp_device_functions.h -triple i386-unknown-unknown -fopenmp-targets=nvptx-nvidia-cuda -emit-llvm-bc %s -o %t-x86-host.bc			// RUN: %clang_cc1 -x c++ -O1 -disable-llvm-optzns -verify -fopenmp -internal-isystem %S/../Headers/Inputs/include -internal-isystem %S/../../lib/Headers/openmp_wrappers -include __clang_openmp_device_functions.h -fdeclspec -triple i386-unknown-unknown -fopenmp-targets=nvptx-nvidia-cuda -emit-llvm-bc %s -o %t-x86-host.bc
	// RUN: %clang_cc1 -x c++ -O1 -disable-llvm-optzns -verify -fopenmp -internal-isystem %S/../Headers/Inputs/include -internal-isystem %S/../../lib/Headers/openmp_wrappers -include __clang_openmp_device_functions.h -triple nvptx64-unknown-unknown -aux-triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm %s -fopenmp-is-device -fopenmp-host-ir-file-path %t-x86-host.bc -o - \| FileCheck %s			// RUN: %clang_cc1 -x c++ -O1 -disable-llvm-optzns -verify -fopenmp -internal-isystem %S/../Headers/Inputs/include -internal-isystem %S/../../lib/Headers/openmp_wrappers -include __clang_openmp_device_functions.h -fdeclspec -triple nvptx64-unknown-unknown -aux-triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm %s -fopenmp-is-device -fopenmp-host-ir-file-path %t-x86-host.bc -o - \| FileCheck %s
	// RUN: %clang_cc1 -x c++ -O1 -disable-llvm-optzns -verify -fopenmp -internal-isystem %S/../Headers/Inputs/include -internal-isystem %S/../../lib/Headers/openmp_wrappers -include __clang_openmp_device_functions.h -fexceptions -fcxx-exceptions -aux-triple powerpc64le-unknown-unknown -triple nvptx64-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm %s -fopenmp-is-device -fopenmp-host-ir-file-path %t-x86-host.bc -o - \| FileCheck %s			// RUN: %clang_cc1 -x c++ -O1 -disable-llvm-optzns -verify -fopenmp -internal-isystem %S/../Headers/Inputs/include -internal-isystem %S/../../lib/Headers/openmp_wrappers -include __clang_openmp_device_functions.h -fdeclspec -fexceptions -fcxx-exceptions -aux-triple powerpc64le-unknown-unknown -triple nvptx64-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm %s -fopenmp-is-device -fopenmp-host-ir-file-path %t-x86-host.bc -o - \| FileCheck %s
	// expected-no-diagnostics			// expected-no-diagnostics
	#ifndef HEADER			#ifndef HEADER
	#define HEADER			#define HEADER

	#include <cmath>			#include <cmath>

	// TODO: Think about teaching the OMPIRBuilder about default attributes as well so the __kmpc* declarations are annotated.			// TODO: Think about teaching the OMPIRBuilder about default attributes as well so the __kmpc* declarations are annotated.

	▲ Show 20 Lines • Show All 57 Lines • Show Last 20 Lines

clang/test/OpenMP/nvptx_target_parallel_reduction_codegen_tbaa_PR46146.cpp

	// RUN: %clang_cc1 -x c++ -O1 -disable-llvm-optzns -verify -fopenmp -internal-isystem %S/../Headers/Inputs/include -internal-isystem %S/../../lib/Headers/openmp_wrappers -include __clang_openmp_device_functions.h -triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm-bc %s -o %t-ppc-host.bc			// RUN: %clang_cc1 -x c++ -O1 -disable-llvm-optzns -verify -fopenmp -internal-isystem %S/../Headers/Inputs/include -internal-isystem %S/../../lib/Headers/openmp_wrappers -include __clang_openmp_device_functions.h -fdeclspec -triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm-bc %s -o %t-ppc-host.bc
	// RUN: %clang_cc1 -x c++ -O1 -disable-llvm-optzns -verify -fopenmp -internal-isystem %S/../Headers/Inputs/include -internal-isystem %S/../../lib/Headers/openmp_wrappers -include __clang_openmp_device_functions.h -triple nvptx64-unknown-unknown -aux-triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm %s -fopenmp-is-device -fopenmp-host-ir-file-path %t-ppc-host.bc -o - \| FileCheck %s			// RUN: %clang_cc1 -x c++ -O1 -disable-llvm-optzns -verify -fopenmp -internal-isystem %S/../Headers/Inputs/include -internal-isystem %S/../../lib/Headers/openmp_wrappers -include __clang_openmp_device_functions.h -fdeclspec -triple nvptx64-unknown-unknown -aux-triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm %s -fopenmp-is-device -fopenmp-host-ir-file-path %t-ppc-host.bc -o - \| FileCheck %s
	// RUN: %clang_cc1 -x c++ -O1 -disable-llvm-optzns -verify -fopenmp -internal-isystem %S/../Headers/Inputs/include -internal-isystem %S/../../lib/Headers/openmp_wrappers -include __clang_openmp_device_functions.h -triple i386-unknown-unknown -fopenmp-targets=nvptx-nvidia-cuda -emit-llvm-bc %s -o %t-x86-host.bc			// RUN: %clang_cc1 -x c++ -O1 -disable-llvm-optzns -verify -fopenmp -internal-isystem %S/../Headers/Inputs/include -internal-isystem %S/../../lib/Headers/openmp_wrappers -include __clang_openmp_device_functions.h -fdeclspec -triple i386-unknown-unknown -fopenmp-targets=nvptx-nvidia-cuda -emit-llvm-bc %s -o %t-x86-host.bc
	// RUN: %clang_cc1 -x c++ -O1 -disable-llvm-optzns -verify -fopenmp -internal-isystem %S/../Headers/Inputs/include -internal-isystem %S/../../lib/Headers/openmp_wrappers -include __clang_openmp_device_functions.h -triple nvptx64-unknown-unknown -aux-triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm %s -fopenmp-is-device -fopenmp-host-ir-file-path %t-x86-host.bc -o - \| FileCheck %s			// RUN: %clang_cc1 -x c++ -O1 -disable-llvm-optzns -verify -fopenmp -internal-isystem %S/../Headers/Inputs/include -internal-isystem %S/../../lib/Headers/openmp_wrappers -include __clang_openmp_device_functions.h -fdeclspec -triple nvptx64-unknown-unknown -aux-triple powerpc64le-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm %s -fopenmp-is-device -fopenmp-host-ir-file-path %t-x86-host.bc -o - \| FileCheck %s
	// RUN: %clang_cc1 -x c++ -O1 -disable-llvm-optzns -verify -fopenmp -internal-isystem %S/../Headers/Inputs/include -internal-isystem %S/../../lib/Headers/openmp_wrappers -include __clang_openmp_device_functions.h -fexceptions -fcxx-exceptions -aux-triple powerpc64le-unknown-unknown -triple nvptx64-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm %s -fopenmp-is-device -fopenmp-host-ir-file-path %t-x86-host.bc -o - \| FileCheck %s			// RUN: %clang_cc1 -x c++ -O1 -disable-llvm-optzns -verify -fopenmp -internal-isystem %S/../Headers/Inputs/include -internal-isystem %S/../../lib/Headers/openmp_wrappers -include __clang_openmp_device_functions.h -fdeclspec -fexceptions -fcxx-exceptions -aux-triple powerpc64le-unknown-unknown -triple nvptx64-unknown-unknown -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm %s -fopenmp-is-device -fopenmp-host-ir-file-path %t-x86-host.bc -o - \| FileCheck %s
	// expected-no-diagnostics			// expected-no-diagnostics
	#ifndef HEADER			#ifndef HEADER
	#define HEADER			#define HEADER

	#include <complex>			#include <complex>

	// Verify we do not add tbaa metadata to type punned memory operations:			// Verify we do not add tbaa metadata to type punned memory operations:

	Show All 25 Lines

This is an archive of the discontinued LLVM Phabricator instance.

[Clang][OpenMP] Include header for CUDA builtin vars into OpenMP wrapper header
AbandonedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 317664

clang/lib/Headers/__clang_cuda_builtin_vars.h

clang/lib/Headers/openmp_wrappers/__clang_openmp_device_functions.h

clang/test/Headers/nvptx_device_cmath_functions.cpp

clang/test/Headers/nvptx_device_cmath_functions_cxx17.cpp

clang/test/Headers/nvptx_device_math_complex.c

clang/test/Headers/nvptx_device_math_complex.cpp

clang/test/Headers/nvptx_device_math_functions.c

clang/test/Headers/nvptx_device_math_functions.cpp

clang/test/Headers/nvptx_device_math_functions_cxx17.cpp

clang/test/Headers/nvptx_device_math_macro.cpp

clang/test/Headers/nvptx_device_math_modf.cpp

clang/test/Headers/nvptx_device_math_sin.cpp

clang/test/Headers/nvptx_device_math_sin_cos.cpp

clang/test/Headers/nvptx_device_math_sincos.cpp

clang/test/Headers/openmp_device_math_isnan.cpp

clang/test/OpenMP/assumes_include_nvptx.cpp

clang/test/OpenMP/nvptx_target_parallel_reduction_codegen_tbaa_PR46146.cpp

This is an archive of the discontinued LLVM Phabricator instance.

[Clang][OpenMP] Include header for CUDA builtin vars into OpenMP wrapper header
AbandonedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 317664

clang/lib/Headers/__clang_cuda_builtin_vars.h

clang/lib/Headers/openmp_wrappers/__clang_openmp_device_functions.h

clang/test/Headers/nvptx_device_cmath_functions.cpp

clang/test/Headers/nvptx_device_cmath_functions_cxx17.cpp

clang/test/Headers/nvptx_device_math_complex.c

clang/test/Headers/nvptx_device_math_complex.cpp

clang/test/Headers/nvptx_device_math_functions.c

clang/test/Headers/nvptx_device_math_functions.cpp

clang/test/Headers/nvptx_device_math_functions_cxx17.cpp

clang/test/Headers/nvptx_device_math_macro.cpp

clang/test/Headers/nvptx_device_math_modf.cpp

clang/test/Headers/nvptx_device_math_sin.cpp

clang/test/Headers/nvptx_device_math_sin_cos.cpp

clang/test/Headers/nvptx_device_math_sincos.cpp

clang/test/Headers/openmp_device_math_isnan.cpp

clang/test/OpenMP/assumes_include_nvptx.cpp

clang/test/OpenMP/nvptx_target_parallel_reduction_codegen_tbaa_PR46146.cpp

[Clang][OpenMP] Include header for CUDA builtin vars into OpenMP wrapper header
AbandonedPublic