Diff 47819

cfe/trunk/include/clang/Sema/Sema.h

This file is larger than 256 KB, so syntax highlighting is disabled by default.

Show First 20 Lines • Show All 8,788 Lines • ▼ Show 20 Lines	enum CUDAFunctionTarget {
CFT_Global,		CFT_Global,
CFT_Host,		CFT_Host,
CFT_HostDevice,		CFT_HostDevice,
CFT_InvalidTarget		CFT_InvalidTarget
};		};

CUDAFunctionTarget IdentifyCUDATarget(const FunctionDecl *D);		CUDAFunctionTarget IdentifyCUDATarget(const FunctionDecl *D);

		// CUDA function call preference. Must be ordered numerically from
		// worst to best.
enum CUDAFunctionPreference {		enum CUDAFunctionPreference {
CFP_Never, // Invalid caller/callee combination.		CFP_Never, // Invalid caller/callee combination.
CFP_LastResort, // Lowest priority. Only in effect if		CFP_WrongSide, // Calls from host-device to host or device
		// functions that do not match current compilation
		// mode. Only in effect if
// LangOpts.CUDADisableTargetCallChecks is true.		// LangOpts.CUDADisableTargetCallChecks is true.
CFP_Fallback, // Low priority caller/callee combination		CFP_HostDevice, // Any calls to host/device functions.
CFP_Best, // Preferred caller/callee combination		CFP_SameSide, // Calls from host-device to host or device
		// function matching current compilation mode.
		CFP_Native, // host-to-host or device-to-device calls.
};		};

/// Identifies relative preference of a given Caller/Callee		/// Identifies relative preference of a given Caller/Callee
/// combination, based on their host/device attributes.		/// combination, based on their host/device attributes.
/// \param Caller function which needs address of \p Callee.		/// \param Caller function which needs address of \p Callee.
/// nullptr in case of global context.		/// nullptr in case of global context.
/// \param Callee target function		/// \param Callee target function
///		///
▲ Show 20 Lines • Show All 518 Lines • Show Last 20 Lines

cfe/trunk/lib/Sema/SemaCUDA.cpp

	Show First 20 Lines • Show All 62 Lines • ▼ Show 20 Lines

	// * CUDA Call preference table			// * CUDA Call preference table
	//			//
	// F - from,			// F - from,
	// T - to			// T - to
	// Ph - preference in host mode			// Ph - preference in host mode
	// Pd - preference in device mode			// Pd - preference in device mode
	// H - handled in (x)			// H - handled in (x)
	// Preferences: b-best, f-fallback, l-last resort, n-never.			// Preferences: N:native, HD:host-device, SS:same side, WS:wrong side, --:never.
	//			//
	// \| F \| T \| Ph \| Pd \| H \|			// \| F \| T \| Ph \| Pd \| H \|
	// \|----+----+----+----+-----+			// \|----+----+-----+-----+-----+
	// \| d \| d \| b \| b \| (b) \|			// \| d \| d \| N \| N \| (c) \|
	// \| d \| g \| n \| n \| (a) \|			// \| d \| g \| -- \| -- \| (a) \|
	// \| d \| h \| l \| l \| (e) \|			// \| d \| h \| -- \| -- \| (e) \|
	// \| d \| hd \| f \| f \| (c) \|			// \| d \| hd \| HD \| HD \| (b) \|
	// \| g \| d \| b \| b \| (b) \|			// \| g \| d \| N \| N \| (c) \|
	// \| g \| g \| n \| n \| (a) \|			// \| g \| g \| -- \| -- \| (a) \|
	// \| g \| h \| l \| l \| (e) \|			// \| g \| h \| -- \| -- \| (e) \|
	// \| g \| hd \| f \| f \| (c) \|			// \| g \| hd \| HD \| HD \| (b) \|
	// \| h \| d \| l \| l \| (e) \|			// \| h \| d \| -- \| -- \| (e) \|
	// \| h \| g \| b \| b \| (b) \|			// \| h \| g \| N \| N \| (c) \|
	// \| h \| h \| b \| b \| (b) \|			// \| h \| h \| N \| N \| (c) \|
	// \| h \| hd \| f \| f \| (c) \|			// \| h \| hd \| HD \| HD \| (b) \|
	// \| hd \| d \| l \| f \| (d) \|			// \| hd \| d \| WS \| SS \| (d) \|
	// \| hd \| g \| f \| n \|(d/a)\|			// \| hd \| g \| SS \| -- \|(d/a)\|
	// \| hd \| h \| f \| l \| (d) \|			// \| hd \| h \| SS \| WS \| (d) \|
	// \| hd \| hd \| b \| b \| (b) \|			// \| hd \| hd \| HD \| HD \| (b) \|

	Sema::CUDAFunctionPreference			Sema::CUDAFunctionPreference
	Sema::IdentifyCUDAPreference(const FunctionDecl *Caller,			Sema::IdentifyCUDAPreference(const FunctionDecl *Caller,
	const FunctionDecl *Callee) {			const FunctionDecl *Callee) {
	assert(getLangOpts().CUDATargetOverloads &&			assert(getLangOpts().CUDATargetOverloads &&
	"Should not be called w/o enabled target overloads.");			"Should not be called w/o enabled target overloads.");

	assert(Callee && "Callee must be valid.");			assert(Callee && "Callee must be valid.");
	CUDAFunctionTarget CalleeTarget = IdentifyCUDATarget(Callee);			CUDAFunctionTarget CalleeTarget = IdentifyCUDATarget(Callee);
	CUDAFunctionTarget CallerTarget =			CUDAFunctionTarget CallerTarget =
	(Caller != nullptr) ? IdentifyCUDATarget(Caller) : Sema::CFT_Host;			(Caller != nullptr) ? IdentifyCUDATarget(Caller) : Sema::CFT_Host;

	// If one of the targets is invalid, the check always fails, no matter what			// If one of the targets is invalid, the check always fails, no matter what
	// the other target is.			// the other target is.
	if (CallerTarget == CFT_InvalidTarget \|\| CalleeTarget == CFT_InvalidTarget)			if (CallerTarget == CFT_InvalidTarget \|\| CalleeTarget == CFT_InvalidTarget)
	return CFP_Never;			return CFP_Never;

	// (a) Can't call global from some contexts until we support CUDA's			// (a) Can't call global from some contexts until we support CUDA's
	// dynamic parallelism.			// dynamic parallelism.
	if (CalleeTarget == CFT_Global &&			if (CalleeTarget == CFT_Global &&
	(CallerTarget == CFT_Global \|\| CallerTarget == CFT_Device \|\|			(CallerTarget == CFT_Global \|\| CallerTarget == CFT_Device \|\|
	(CallerTarget == CFT_HostDevice && getLangOpts().CUDAIsDevice)))			(CallerTarget == CFT_HostDevice && getLangOpts().CUDAIsDevice)))
	return CFP_Never;			return CFP_Never;

	// (b) Best case scenarios			// (b) Calling HostDevice is OK for everyone.
				if (CalleeTarget == CFT_HostDevice)
				return CFP_HostDevice;

				// (c) Best case scenarios
	if (CalleeTarget == CallerTarget \|\|			if (CalleeTarget == CallerTarget \|\|
	(CallerTarget == CFT_Host && CalleeTarget == CFT_Global) \|\|			(CallerTarget == CFT_Host && CalleeTarget == CFT_Global) \|\|
	(CallerTarget == CFT_Global && CalleeTarget == CFT_Device))			(CallerTarget == CFT_Global && CalleeTarget == CFT_Device))
	return CFP_Best;			return CFP_Native;

	// (c) Calling HostDevice is OK as a fallback that works for everyone.
	if (CalleeTarget == CFT_HostDevice)
	return CFP_Fallback;

	// Figure out what should be returned for 'last resort' cases. Normally
	// those would not be allowed, but we'll consider them if
	// CUDADisableTargetCallChecks is true.
	CUDAFunctionPreference QuestionableResult =
	getLangOpts().CUDADisableTargetCallChecks ? CFP_LastResort : CFP_Never;

	// (d) HostDevice behavior depends on compilation mode.			// (d) HostDevice behavior depends on compilation mode.
	if (CallerTarget == CFT_HostDevice) {			if (CallerTarget == CFT_HostDevice) {
	// Calling a function that matches compilation mode is OK.			// It's OK to call a compilation-mode matching function from an HD one.
	// Calling a function from the other side is frowned upon.			if ((getLangOpts().CUDAIsDevice && CalleeTarget == CFT_Device) \|\|
	if (getLangOpts().CUDAIsDevice)			(!getLangOpts().CUDAIsDevice &&
	return CalleeTarget == CFT_Device ? CFP_Fallback : QuestionableResult;			(CalleeTarget == CFT_Host \|\| CalleeTarget == CFT_Global)))
	else			return CFP_SameSide;
	return (CalleeTarget == CFT_Host \|\| CalleeTarget == CFT_Global)
	? CFP_Fallback			// We'll allow calls to non-mode-matching functions if target call
	: QuestionableResult;			// checks are disabled. This is needed to avoid complaining about
				// HD->H calls when we compile for device side and vice versa.
				if (getLangOpts().CUDADisableTargetCallChecks)
				return CFP_WrongSide;

				return CFP_Never;
	}			}

	// (e) Calling across device/host boundary is not something you should do.			// (e) Calling across device/host boundary is not something you should do.
	if ((CallerTarget == CFT_Host && CalleeTarget == CFT_Device) \|\|			if ((CallerTarget == CFT_Host && CalleeTarget == CFT_Device) \|\|
	(CallerTarget == CFT_Device && CalleeTarget == CFT_Host) \|\|			(CallerTarget == CFT_Device && CalleeTarget == CFT_Host) \|\|
	(CallerTarget == CFT_Global && CalleeTarget == CFT_Host))			(CallerTarget == CFT_Global && CalleeTarget == CFT_Host))
	return QuestionableResult;			return CFP_Never;

	llvm_unreachable("All cases should've been handled by now.");			llvm_unreachable("All cases should've been handled by now.");
	}			}

	bool Sema::CheckCUDATarget(const FunctionDecl *Caller,			bool Sema::CheckCUDATarget(const FunctionDecl *Caller,
	const FunctionDecl *Callee) {			const FunctionDecl *Callee) {
	// With target overloads enabled, we only disallow calling			// With target overloads enabled, we only disallow calling
	// combinations with CFP_Never.			// combinations with CFP_Never.
	▲ Show 20 Lines • Show All 301 Lines • Show Last 20 Lines

cfe/trunk/lib/Sema/SemaOverload.cpp

This file is larger than 256 KB, so syntax highlighting is disabled by default.

	Show First 20 Lines • Show All 8,716 Lines • ▼ Show 20 Lines
	/// \param Best If overload resolution was successful or found a deleted			/// \param Best If overload resolution was successful or found a deleted
	/// function, \p Best points to the candidate function found.			/// function, \p Best points to the candidate function found.
	///			///
	/// \returns The result of overload resolution.			/// \returns The result of overload resolution.
	OverloadingResult			OverloadingResult
	OverloadCandidateSet::BestViableFunction(Sema &S, SourceLocation Loc,			OverloadCandidateSet::BestViableFunction(Sema &S, SourceLocation Loc,
	iterator &Best,			iterator &Best,
	bool UserDefinedConversion) {			bool UserDefinedConversion) {
				llvm::SmallVector<OverloadCandidate *, 16> Candidates;
				std::transform(begin(), end(), std::back_inserter(Candidates),
				[](OverloadCandidate &Cand) { return &Cand; });

				// [CUDA] HD->H or HD->D calls are technically not allowed by CUDA
				// but accepted by both clang and NVCC. However during a particular
				// compilation mode only one call variant is viable. We need to
				// exclude non-viable overload candidates from consideration based
				// only on their host/device attributes. Specifically, if one
				// candidate call is WrongSide and the other is SameSide, we ignore
				// the WrongSide candidate.
				if (S.getLangOpts().CUDA && S.getLangOpts().CUDATargetOverloads) {
				const FunctionDecl *Caller = dyn_cast<FunctionDecl>(S.CurContext);
				bool ContainsSameSideCandidate =
				llvm::any_of(Candidates, [&](OverloadCandidate *Cand) {
				return Cand->Function &&
				S.IdentifyCUDAPreference(Caller, Cand->Function) ==
				Sema::CFP_SameSide;
				});
				if (ContainsSameSideCandidate) {
				auto IsWrongSideCandidate = [&](OverloadCandidate *Cand) {
				return Cand->Function &&
				S.IdentifyCUDAPreference(Caller, Cand->Function) ==
				Sema::CFP_WrongSide;
				};
				Candidates.erase(std::remove_if(Candidates.begin(), Candidates.end(),
				IsWrongSideCandidate),
				Candidates.end());
				}
				}

	// Find the best viable function.			// Find the best viable function.
	Best = end();			Best = end();
	for (iterator Cand = begin(); Cand != end(); ++Cand) {			for (auto *Cand : Candidates)
	if (Cand->Viable)			if (Cand->Viable)
	if (Best == end() \|\| isBetterOverloadCandidate(S, Cand, Best, Loc,			if (Best == end() \|\| isBetterOverloadCandidate(S, Cand, Best, Loc,
	UserDefinedConversion))			UserDefinedConversion))
	Best = Cand;			Best = Cand;
	}

	// If we didn't find any viable functions, abort.			// If we didn't find any viable functions, abort.
	if (Best == end())			if (Best == end())
	return OR_No_Viable_Function;			return OR_No_Viable_Function;

	llvm::SmallVector<const NamedDecl *, 4> EquivalentCands;			llvm::SmallVector<const NamedDecl *, 4> EquivalentCands;

	// Make sure that this function is better than every other viable			// Make sure that this function is better than every other viable
	// function. If not, we have an ambiguity.			// function. If not, we have an ambiguity.
	for (iterator Cand = begin(); Cand != end(); ++Cand) {			for (auto *Cand : Candidates) {
	if (Cand->Viable &&			if (Cand->Viable &&
	Cand != Best &&			Cand != Best &&
	!isBetterOverloadCandidate(S, Best, Cand, Loc,			!isBetterOverloadCandidate(S, Best, Cand, Loc,
	UserDefinedConversion)) {			UserDefinedConversion)) {
	if (S.isEquivalentInternalLinkageDeclaration(Best->Function,			if (S.isEquivalentInternalLinkageDeclaration(Best->Function,
	Cand->Function)) {			Cand->Function)) {
	EquivalentCands.push_back(Cand->Function);			EquivalentCands.push_back(Cand->Function);
	continue;			continue;
	▲ Show 20 Lines • Show All 4,212 Lines • Show Last 20 Lines

cfe/trunk/test/CodeGenCUDA/function-overload.cu

	// REQUIRES: x86-registered-target			// REQUIRES: x86-registered-target
	// REQUIRES: nvptx-registered-target			// REQUIRES: nvptx-registered-target

	// Make sure we handle target overloads correctly.			// Make sure we handle target overloads correctly.
	// RUN: %clang_cc1 -triple x86_64-unknown-linux-gnu \			// RUN: %clang_cc1 -triple x86_64-unknown-linux-gnu \
	// RUN: -fcuda-target-overloads -emit-llvm -o - %s \			// RUN: -fcuda-target-overloads -emit-llvm -o - %s \
	// RUN: \| FileCheck -check-prefix=CHECK-BOTH -check-prefix=CHECK-HOST %s			// RUN: \| FileCheck -check-prefix=CHECK-BOTH -check-prefix=CHECK-HOST %s
	// RUN: %clang_cc1 -triple nvptx64-nvidia-cuda -fcuda-is-device \			// RUN: %clang_cc1 -triple nvptx64-nvidia-cuda -fcuda-is-device \
	// RUN: -fcuda-target-overloads -emit-llvm -o - %s \			// RUN: -fcuda-target-overloads -emit-llvm -o - %s \
	// RUN: \| FileCheck -check-prefix=CHECK-BOTH -check-prefix=CHECK-DEVICE %s			// RUN: \| FileCheck -check-prefix=CHECK-BOTH -check-prefix=CHECK-DEVICE \
				// RUN: -check-prefix=CHECK-DEVICE-STRICT %s

	// Check target overloads handling with disabled call target checks.			// Check target overloads handling with disabled call target checks.
	// RUN: %clang_cc1 -DNOCHECKS -triple x86_64-unknown-linux-gnu -emit-llvm \			// RUN: %clang_cc1 -DNOCHECKS -triple x86_64-unknown-linux-gnu -emit-llvm \
	// RUN: -fcuda-disable-target-call-checks -fcuda-target-overloads -o - %s \			// RUN: -fcuda-disable-target-call-checks -fcuda-target-overloads -o - %s \
	// RUN: \| FileCheck -check-prefix=CHECK-BOTH -check-prefix=CHECK-HOST \			// RUN: \| FileCheck -check-prefix=CHECK-BOTH -check-prefix=CHECK-HOST \
	// RUN: -check-prefix=CHECK-BOTH-NC -check-prefix=CHECK-HOST-NC %s			// RUN: -check-prefix=CHECK-BOTH-NC -check-prefix=CHECK-HOST-NC %s
	// RUN: %clang_cc1 -DNOCHECKS -triple nvptx64-nvidia-cuda -emit-llvm \			// RUN: %clang_cc1 -DNOCHECKS -triple nvptx64-nvidia-cuda -emit-llvm \
	// RUN: -fcuda-disable-target-call-checks -fcuda-target-overloads \			// RUN: -fcuda-disable-target-call-checks -fcuda-target-overloads \
	▲ Show 20 Lines • Show All 53 Lines • ▼ Show 20 Lines
	// CHECK-HOST-LABEL: define i32 @ch()			// CHECK-HOST-LABEL: define i32 @ch()
	extern "C" __host__ int ch(void) {return 13;}			extern "C" __host__ int ch(void) {return 13;}
	// CHECK-HOST: ret i32 13			// CHECK-HOST: ret i32 13

	// CHECK-BOTH-LABEL: define i32 @chd()			// CHECK-BOTH-LABEL: define i32 @chd()
	extern "C" __host__ __device__ int chd(void) {return 14;}			extern "C" __host__ __device__ int chd(void) {return 14;}
	// CHECK-BOTH: ret i32 14			// CHECK-BOTH: ret i32 14

				// HD functions are sometimes allowed to call H or D functions -- this
				// is an artifact of the source-to-source splitting performed by nvcc
				// that we need to mimic. During device mode compilation in nvcc, host
				// functions aren't present at all, so don't participate in
				// overloading. But in clang, H and D functions are present in both
				// compilation modes. Clang normally uses the target attribute as a
				// tiebreaker between overloads with otherwise identical priority, but
				// in order to match nvcc's behavior, we sometimes need to wholly
				// discard overloads that would not be present during compilation
				// under nvcc.

				template <typename T> T template_vs_function(T arg) { return 15; }
				__device__ float template_vs_function(float arg) { return 16; }

				// Here we expect to call the templated function during host
				// compilation, even if -fcuda-disable-target-call-checks is passed,
				// and even though C++ overload rules prefer the non-templated
				// function.
				// CHECK-BOTH-LABEL: define void @_Z5hd_tfv()
				__host__ __device__ void hd_tf(void) {
				template_vs_function(1.0f);
				// CHECK-HOST: call float @_Z20template_vs_functionIfET_S0_(float
				// CHECK-DEVICE: call float @_Z20template_vs_functionf(float
				template_vs_function(2.0);
				// CHECK-HOST: call double @_Z20template_vs_functionIdET_S0_(double
				// CHECK-DEVICE: call float @_Z20template_vs_functionf(float
				}

				// Calls from __host__ and __device__ functions should always call the
				// overloaded function that matches their mode.
				// CHECK-HOST-LABEL: define void @_Z4h_tfv()
				__host__ void h_tf() {
				template_vs_function(1.0f);
				// CHECK-HOST: call float @_Z20template_vs_functionIfET_S0_(float
				template_vs_function(2.0);
				// CHECK-HOST: call double @_Z20template_vs_functionIdET_S0_(double
				}

				// CHECK-DEVICE-LABEL: define void @_Z4d_tfv()
				__device__ void d_tf() {
				template_vs_function(1.0f);
				// CHECK-DEVICE: call float @_Z20template_vs_functionf(float
				template_vs_function(2.0);
				// CHECK-DEVICE: call float @_Z20template_vs_functionf(float
				}

				// In case we have a mix of HD and H-only or D-only candidates in the
				// overload set, normal C++ overload resolution rules apply first.
				template <typename T> T template_vs_hd_function(T arg) { return 15; }
				__host__ __device__ float template_vs_hd_function(float arg) { return 16; }

				// CHECK-BOTH-LABEL: define void @_Z7hd_thdfv()
				__host__ __device__ void hd_thdf() {
				template_vs_hd_function(1.0f);
				// CHECK-HOST: call float @_Z23template_vs_hd_functionf(float
				// CHECK-DEVICE: call float @_Z23template_vs_hd_functionf(float
				template_vs_hd_function(1);
				// CHECK-HOST: call i32 @_Z23template_vs_hd_functionIiET_S0_(i32
				// CHECK-DEVICE-STRICT: call float @_Z23template_vs_hd_functionf(float
				// CHECK-DEVICE-NC: call i32 @_Z23template_vs_hd_functionIiET_S0_(i32
				}

				// CHECK-HOST-LABEL: define void @_Z6h_thdfv()
				__host__ void h_thdf() {
				template_vs_hd_function(1.0f);
				// CHECK-HOST: call float @_Z23template_vs_hd_functionf(float
				template_vs_hd_function(1);
				// CHECK-HOST: call i32 @_Z23template_vs_hd_functionIiET_S0_(i32
				}

				// CHECK-DEVICE-LABEL: define void @_Z6d_thdfv()
				__device__ void d_thdf() {
				template_vs_hd_function(1.0f);
				// CHECK-DEVICE: call float @_Z23template_vs_hd_functionf(float
				template_vs_hd_function(1);
				// The host-only function template is not callable with strict call
				// checks, so on the device side the HD function is the only choice.
				// CHECK-DEVICE: call float @_Z23template_vs_hd_functionf(float
				}

				// Check that overloads still work the same way on both host and
				// device side when the overload set contains only functions from one
				// side of compilation.
				__device__ float device_only_function(int arg) { return 17; }
				__device__ float device_only_function(float arg) { return 18; }

				__host__ float host_only_function(int arg) { return 19; }
				__host__ float host_only_function(float arg) { return 20; }

				// CHECK-BOTH-LABEL: define void @_Z6hd_dofv()
				__host__ __device__ void hd_dof() {
				#ifdef NOCHECKS
				device_only_function(1.0f);
				// CHECK-BOTH-NC: call float @_Z20device_only_functionf(float
				device_only_function(1);
				// CHECK-BOTH-NC: call float @_Z20device_only_functioni(i32
				host_only_function(1.0f);
				// CHECK-BOTH-NC: call float @_Z18host_only_functionf(float
				host_only_function(1);
				// CHECK-BOTH-NC: call float @_Z18host_only_functioni(i32
				#endif
				}


	// CHECK-HOST-LABEL: define void @_Z5hostfv()			// CHECK-HOST-LABEL: define void @_Z5hostfv()
	__host__ void hostf(void) {			__host__ void hostf(void) {
	#if defined (NOCHECKS)
	fp_t dp = d; // CHECK-HOST-NC: store {{.}} @_Z1dv, {{.}} %dp,
	fp_t cdp = cd; // CHECK-HOST-NC: store {{.}} @cd, {{.}} %cdp,
	#endif
	fp_t hp = h; // CHECK-HOST: store {{.}} @_Z1hv, {{.}} %hp,			fp_t hp = h; // CHECK-HOST: store {{.}} @_Z1hv, {{.}} %hp,
	fp_t chp = ch; // CHECK-HOST: store {{.}} @ch, {{.}} %chp,			fp_t chp = ch; // CHECK-HOST: store {{.}} @ch, {{.}} %chp,
	fp_t dhp = dh; // CHECK-HOST: store {{.}} @_Z2dhv, {{.}} %dhp,			fp_t dhp = dh; // CHECK-HOST: store {{.}} @_Z2dhv, {{.}} %dhp,
	fp_t cdhp = cdh; // CHECK-HOST: store {{.}} @cdh, {{.}} %cdhp,			fp_t cdhp = cdh; // CHECK-HOST: store {{.}} @cdh, {{.}} %cdhp,
	fp_t hdp = hd; // CHECK-HOST: store {{.}} @_Z2hdv, {{.}} %hdp,			fp_t hdp = hd; // CHECK-HOST: store {{.}} @_Z2hdv, {{.}} %hdp,
	fp_t chdp = chd; // CHECK-HOST: store {{.}} @chd, {{.}} %chdp,			fp_t chdp = chd; // CHECK-HOST: store {{.}} @chd, {{.}} %chdp,
	gp_t gp = g; // CHECK-HOST: store {{.}} @_Z1gv, {{.}} %gp,			gp_t gp = g; // CHECK-HOST: store {{.}} @_Z1gv, {{.}} %gp,

	#if defined (NOCHECKS)
	d(); // CHECK-HOST-NC: call i32 @_Z1dv()
	cd(); // CHECK-HOST-NC: call i32 @cd()
	#endif
	h(); // CHECK-HOST: call i32 @_Z1hv()			h(); // CHECK-HOST: call i32 @_Z1hv()
	ch(); // CHECK-HOST: call i32 @ch()			ch(); // CHECK-HOST: call i32 @ch()
	dh(); // CHECK-HOST: call i32 @_Z2dhv()			dh(); // CHECK-HOST: call i32 @_Z2dhv()
	cdh(); // CHECK-HOST: call i32 @cdh()			cdh(); // CHECK-HOST: call i32 @cdh()
	g<<<0,0>>>(); // CHECK-HOST: call void @_Z1gv()			g<<<0,0>>>(); // CHECK-HOST: call void @_Z1gv()
	}			}

	// CHECK-DEVICE-LABEL: define void @_Z7devicefv()			// CHECK-DEVICE-LABEL: define void @_Z7devicefv()
	__device__ void devicef(void) {			__device__ void devicef(void) {
	fp_t dp = d; // CHECK-DEVICE: store {{.}} @_Z1dv, {{.}} %dp,			fp_t dp = d; // CHECK-DEVICE: store {{.}} @_Z1dv, {{.}} %dp,
	fp_t cdp = cd; // CHECK-DEVICE: store {{.}} @cd, {{.}} %cdp,			fp_t cdp = cd; // CHECK-DEVICE: store {{.}} @cd, {{.}} %cdp,
	#if defined (NOCHECKS)
	fp_t hp = h; // CHECK-DEVICE-NC: store {{.}} @_Z1hv, {{.}} %hp,
	fp_t chp = ch; // CHECK-DEVICE-NC: store {{.}} @ch, {{.}} %chp,
	#endif
	fp_t dhp = dh; // CHECK-DEVICE: store {{.}} @_Z2dhv, {{.}} %dhp,			fp_t dhp = dh; // CHECK-DEVICE: store {{.}} @_Z2dhv, {{.}} %dhp,
	fp_t cdhp = cdh; // CHECK-DEVICE: store {{.}} @cdh, {{.}} %cdhp,			fp_t cdhp = cdh; // CHECK-DEVICE: store {{.}} @cdh, {{.}} %cdhp,
	fp_t hdp = hd; // CHECK-DEVICE: store {{.}} @_Z2hdv, {{.}} %hdp,			fp_t hdp = hd; // CHECK-DEVICE: store {{.}} @_Z2hdv, {{.}} %hdp,
	fp_t chdp = chd; // CHECK-DEVICE: store {{.}} @chd, {{.}} %chdp,			fp_t chdp = chd; // CHECK-DEVICE: store {{.}} @chd, {{.}} %chdp,

	d(); // CHECK-DEVICE: call i32 @_Z1dv()			d(); // CHECK-DEVICE: call i32 @_Z1dv()
	cd(); // CHECK-DEVICE: call i32 @cd()			cd(); // CHECK-DEVICE: call i32 @cd()
	#if defined (NOCHECKS)
	h(); // CHECK-DEVICE-NC: call i32 @_Z1hv()
	ch(); // CHECK-DEVICE-NC: call i32 @ch()
	#endif
	dh(); // CHECK-DEVICE: call i32 @_Z2dhv()			dh(); // CHECK-DEVICE: call i32 @_Z2dhv()
	cdh(); // CHECK-DEVICE: call i32 @cdh()			cdh(); // CHECK-DEVICE: call i32 @cdh()
	}			}

	// CHECK-BOTH-LABEL: define void @_Z11hostdevicefv()			// CHECK-BOTH-LABEL: define void @_Z11hostdevicefv()
	__host__ __device__ void hostdevicef(void) {			__host__ __device__ void hostdevicef(void) {
	#if defined (NOCHECKS)			#if defined (NOCHECKS)
	fp_t dp = d; // CHECK-BOTH-NC: store {{.}} @_Z1dv, {{.}} %dp,			fp_t dp = d; // CHECK-BOTH-NC: store {{.}} @_Z1dv, {{.}} %dp,
	▲ Show 20 Lines • Show All 83 Lines • Show Last 20 Lines

cfe/trunk/test/SemaCUDA/function-overload.cu

	Show First 20 Lines • Show All 64 Lines • ▼ Show 20 Lines
	__device__ int d(void) { return 8; }			__device__ int d(void) { return 8; }
	__host__ int h(void) { return 9; }			__host__ int h(void) { return 9; }
	__global__ void g(void) {}			__global__ void g(void) {}
	extern "C" __device__ int cd(void) {return 10;}			extern "C" __device__ int cd(void) {return 10;}
	extern "C" __host__ int ch(void) {return 11;}			extern "C" __host__ int ch(void) {return 11;}

	__host__ void hostf(void) {			__host__ void hostf(void) {
	fp_t dp = d;			fp_t dp = d;
	fp_t cdp = cd;			// expected-error@-1 {{reference to __device__ function 'd' in __host__ function}}
	#if !defined(NOCHECKS)
	// expected-error@-3 {{reference to __device__ function 'd' in __host__ function}}
	// expected-note@65 {{'d' declared here}}			// expected-note@65 {{'d' declared here}}
	// expected-error@-4 {{reference to __device__ function 'cd' in __host__ function}}			fp_t cdp = cd;
				// expected-error@-1 {{reference to __device__ function 'cd' in __host__ function}}
	// expected-note@68 {{'cd' declared here}}			// expected-note@68 {{'cd' declared here}}
	#endif
	fp_t hp = h;			fp_t hp = h;
	fp_t chp = ch;			fp_t chp = ch;
	fp_t dhp = dh;			fp_t dhp = dh;
	fp_t cdhp = cdh;			fp_t cdhp = cdh;
	gp_t gp = g;			gp_t gp = g;

	d();			d();
	cd();			// expected-error@-1 {{no matching function for call to 'd'}}
	#if !defined(NOCHECKS)
	// expected-error@-3 {{no matching function for call to 'd'}}
	// expected-note@65 {{candidate function not viable: call to __device__ function from __host__ function}}			// expected-note@65 {{candidate function not viable: call to __device__ function from __host__ function}}
	// expected-error@-4 {{no matching function for call to 'cd'}}			cd();
				// expected-error@-1 {{no matching function for call to 'cd'}}
	// expected-note@68 {{candidate function not viable: call to __device__ function from __host__ function}}			// expected-note@68 {{candidate function not viable: call to __device__ function from __host__ function}}
	#endif
	h();			h();
	ch();			ch();
	dh();			dh();
	cdh();			cdh();
	g(); // expected-error {{call to global function g not configured}}			g(); // expected-error {{call to global function g not configured}}
	g<<<0,0>>>();			g<<<0,0>>>();
	}			}


	__device__ void devicef(void) {			__device__ void devicef(void) {
	fp_t dp = d;			fp_t dp = d;
	fp_t cdp = cd;			fp_t cdp = cd;
	fp_t hp = h;			fp_t hp = h;
	fp_t chp = ch;			// expected-error@-1 {{reference to __host__ function 'h' in __device__ function}}
	#if !defined(NOCHECKS)
	// expected-error@-3 {{reference to __host__ function 'h' in __device__ function}}
	// expected-note@66 {{'h' declared here}}			// expected-note@66 {{'h' declared here}}
	// expected-error@-4 {{reference to __host__ function 'ch' in __device__ function}}			fp_t chp = ch;
				// expected-error@-1 {{reference to __host__ function 'ch' in __device__ function}}
	// expected-note@69 {{'ch' declared here}}			// expected-note@69 {{'ch' declared here}}
	#endif
	fp_t dhp = dh;			fp_t dhp = dh;
	fp_t cdhp = cdh;			fp_t cdhp = cdh;
	gp_t gp = g; // expected-error {{reference to __global__ function 'g' in __device__ function}}			gp_t gp = g; // expected-error {{reference to __global__ function 'g' in __device__ function}}
	// expected-note@67 {{'g' declared here}}			// expected-note@67 {{'g' declared here}}

	d();			d();
	cd();			cd();
	h();			h(); // expected-error {{no matching function for call to 'h'}}
	ch();
	#if !defined(NOCHECKS)
	// expected-error@-3 {{no matching function for call to 'h'}}
	// expected-note@66 {{candidate function not viable: call to __host__ function from __device__ function}}			// expected-note@66 {{candidate function not viable: call to __host__ function from __device__ function}}
	// expected-error@-4 {{no matching function for call to 'ch'}}			ch(); // expected-error {{no matching function for call to 'ch'}}
	// expected-note@69 {{candidate function not viable: call to __host__ function from __device__ function}}			// expected-note@69 {{candidate function not viable: call to __host__ function from __device__ function}}
	#endif
	dh();			dh();
	cdh();			cdh();
	g(); // expected-error {{no matching function for call to 'g'}}			g(); // expected-error {{no matching function for call to 'g'}}
	// expected-note@67 {{candidate function not viable: call to __global__ function from __device__ function}}			// expected-note@67 {{candidate function not viable: call to __global__ function from __device__ function}}
	g<<<0,0>>>(); // expected-error {{reference to __global__ function 'g' in __device__ function}}			g<<<0,0>>>(); // expected-error {{reference to __global__ function 'g' in __device__ function}}
	// expected-note@67 {{'g' declared here}}			// expected-note@67 {{'g' declared here}}
	}			}

	__global__ void globalf(void) {			__global__ void globalf(void) {
	fp_t dp = d;			fp_t dp = d;
	fp_t cdp = cd;			fp_t cdp = cd;
	fp_t hp = h;			fp_t hp = h;
	fp_t chp = ch;			// expected-error@-1 {{reference to __host__ function 'h' in __global__ function}}
	#if !defined(NOCHECKS)
	// expected-error@-3 {{reference to __host__ function 'h' in __global__ function}}
	// expected-note@66 {{'h' declared here}}			// expected-note@66 {{'h' declared here}}
	// expected-error@-4 {{reference to __host__ function 'ch' in __global__ function}}			fp_t chp = ch;
				// expected-error@-1 {{reference to __host__ function 'ch' in __global__ function}}
	// expected-note@69 {{'ch' declared here}}			// expected-note@69 {{'ch' declared here}}
	#endif
	fp_t dhp = dh;			fp_t dhp = dh;
	fp_t cdhp = cdh;			fp_t cdhp = cdh;
	gp_t gp = g; // expected-error {{reference to __global__ function 'g' in __global__ function}}			gp_t gp = g;
				// expected-error@-1 {{reference to __global__ function 'g' in __global__ function}}
	// expected-note@67 {{'g' declared here}}			// expected-note@67 {{'g' declared here}}

	d();			d();
	cd();			cd();
	h();			h();
	ch();			// expected-error@-1 {{no matching function for call to 'h'}}
	#if !defined(NOCHECKS)
	// expected-error@-3 {{no matching function for call to 'h'}}
	// expected-note@66 {{candidate function not viable: call to __host__ function from __global__ function}}			// expected-note@66 {{candidate function not viable: call to __host__ function from __global__ function}}
	// expected-error@-4 {{no matching function for call to 'ch'}}			ch();
				// expected-error@-1 {{no matching function for call to 'ch'}}
	// expected-note@69 {{candidate function not viable: call to __host__ function from __global__ function}}			// expected-note@69 {{candidate function not viable: call to __host__ function from __global__ function}}
	#endif
	dh();			dh();
	cdh();			cdh();
	g(); // expected-error {{no matching function for call to 'g'}}			g(); // expected-error {{no matching function for call to 'g'}}
	// expected-note@67 {{candidate function not viable: call to __global__ function from __global__ function}}			// expected-note@67 {{candidate function not viable: call to __global__ function from __global__ function}}
	g<<<0,0>>>(); // expected-error {{reference to __global__ function 'g' in __global__ function}}			g<<<0,0>>>(); // expected-error {{reference to __global__ function 'g' in __global__ function}}
	// expected-note@67 {{'g' declared here}}			// expected-note@67 {{'g' declared here}}
	}			}

	▲ Show 20 Lines • Show All 147 Lines • Show Last 20 Lines

This is an archive of the discontinued LLVM Phabricator instance.

[CUDA] Tweak attribute-based overload resolution to match nvcc behavior.
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 47819

cfe/trunk/include/clang/Sema/Sema.h

cfe/trunk/lib/Sema/SemaCUDA.cpp

cfe/trunk/lib/Sema/SemaOverload.cpp

cfe/trunk/test/CodeGenCUDA/function-overload.cu

cfe/trunk/test/SemaCUDA/function-overload.cu

This is an archive of the discontinued LLVM Phabricator instance.

[CUDA] Tweak attribute-based overload resolution to match nvcc behavior. ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 47819

cfe/trunk/include/clang/Sema/Sema.h

cfe/trunk/lib/Sema/SemaCUDA.cpp

cfe/trunk/lib/Sema/SemaOverload.cpp

cfe/trunk/test/CodeGenCUDA/function-overload.cu

cfe/trunk/test/SemaCUDA/function-overload.cu

[CUDA] Tweak attribute-based overload resolution to match nvcc behavior.
ClosedPublic