This is an archive of the discontinued LLVM Phabricator instance.

[CUDA] Create __host__ and __device__ variants of standard allocator declarations.
ClosedPublic

Authored by tra on Oct 19 2016, 2:36 PM.

Download Raw Diff

Details

Reviewers

Summary

Implicit functions are treated as if they were __host__ __device__, and clang does not allow overloading
those with __host__ or __device__ variants.

In order for users to provide their own standard allocators, we must create host and device variants of these declarations during CUDA compilation.

Diff Detail

Build Status

Buildable 699
Build 699: arc lint + arc unit

Event Timeline

tra updated this revision to Diff 75229.Oct 19 2016, 2:36 PM

tra retitled this revision from to [CUDA] Create __host__ and __device__ variants of standard allocator declarations..

tra updated this object.

tra added a reviewer: jlebar.

tra added a subscriber: cfe-commits.

tra added a child revision: D25809: [CUDA] Improved target attribute-based overloading..Oct 20 2016, 2:00 PM

Is it not possible to write a testcase for this?

jlebar added inline comments.Oct 21 2016, 9:30 AM

lib/Sema/SemaExprCXX.cpp
2596–2601	Nit, no need for empty parens.
2628–2629	I kind of feel like it would be easier to add a boolean parameter to CreateAllocationFunctionDecl, then you don't need to repeat these two lines.

Addressed jlebar's comments.

jlebar accepted this revision.Oct 21 2016, 12:54 PM

jlebar edited edge metadata.

jlebar added inline comments.

lib/Sema/SemaExprCXX.cpp
2596	Oh, I like this way better than a bool arg.

This revision is now accepted and ready to land.Oct 21 2016, 12:54 PM

Landed in r284879.

Revision Contents

Path

Size

lib/

Sema/

SemaExprCXX.cpp

49 lines

test/

SemaCUDA/

overloaded-delete.cu

46 lines

Diff 75462

lib/Sema/SemaExprCXX.cpp

This file is larger than 256 KB, so syntax highlighting is disabled by default.

Show First 20 Lines • Show All 2,587 Lines • ▼ Show 20 Lines	if (!getLangOpts().CPlusPlus11) {
EPI.ExceptionSpec.Type = EST_Dynamic;		EPI.ExceptionSpec.Type = EST_Dynamic;
EPI.ExceptionSpec.Exceptions = llvm::makeArrayRef(BadAllocType);		EPI.ExceptionSpec.Exceptions = llvm::makeArrayRef(BadAllocType);
}		}
} else {		} else {
EPI.ExceptionSpec =		EPI.ExceptionSpec =
getLangOpts().CPlusPlus11 ? EST_BasicNoexcept : EST_DynamicNone;		getLangOpts().CPlusPlus11 ? EST_BasicNoexcept : EST_DynamicNone;
}		}

		auto CreateAllocationFunctionDecl = [&](Attr *ExtraAttr) {
		jlebarUnsubmitted Not Done Reply Inline Actions Oh, I like this way better than a bool arg. jlebar: Oh, I like this way better than a bool arg.
QualType FnType = Context.getFunctionType(Return, Params, EPI);		QualType FnType = Context.getFunctionType(Return, Params, EPI);
FunctionDecl *Alloc =		FunctionDecl *Alloc = FunctionDecl::Create(
FunctionDecl::Create(Context, GlobalCtx, SourceLocation(),		Context, GlobalCtx, SourceLocation(), SourceLocation(), Name,
SourceLocation(), Name,
FnType, /*TInfo=*/nullptr, SC_None, false, true);		FnType, /*TInfo=*/nullptr, SC_None, false, true);
Alloc->setImplicit();		Alloc->setImplicit();
		jlebarUnsubmitted Not Done Reply Inline Actions Nit, no need for empty parens. jlebar: Nit, no need for empty parens.

// Implicit sized deallocation functions always have default visibility.		// Implicit sized deallocation functions always have default visibility.
Alloc->addAttr(VisibilityAttr::CreateImplicit(Context,		Alloc->addAttr(
VisibilityAttr::Default));		VisibilityAttr::CreateImplicit(Context, VisibilityAttr::Default));

llvm::SmallVector<ParmVarDecl*, 3> ParamDecls;		llvm::SmallVector<ParmVarDecl *, 3> ParamDecls;
for (QualType T : Params) {		for (QualType T : Params) {
ParamDecls.push_back(		ParamDecls.push_back(ParmVarDecl::Create(
ParmVarDecl::Create(Context, Alloc, SourceLocation(), SourceLocation(),		Context, Alloc, SourceLocation(), SourceLocation(), nullptr, T,
nullptr, T, /*TInfo=*/nullptr, SC_None, nullptr));		/*TInfo=*/nullptr, SC_None, nullptr));
ParamDecls.back()->setImplicit();		ParamDecls.back()->setImplicit();
}		}
Alloc->setParams(ParamDecls);		Alloc->setParams(ParamDecls);
		if (ExtraAttr)
		Alloc->addAttr(ExtraAttr);
Context.getTranslationUnitDecl()->addDecl(Alloc);		Context.getTranslationUnitDecl()->addDecl(Alloc);
IdResolver.tryAddTopLevelDecl(Alloc, Name);		IdResolver.tryAddTopLevelDecl(Alloc, Name);
		};

		if (!LangOpts.CUDA)
		CreateAllocationFunctionDecl(nullptr);
		else {
		// Host and device get their own declaration so each can be
		// defined or re-declared independently.
		CreateAllocationFunctionDecl(CUDAHostAttr::CreateImplicit(Context));
		CreateAllocationFunctionDecl(CUDADeviceAttr::CreateImplicit(Context));
		}
}		}
		jlebarUnsubmitted Not Done Reply Inline Actions I kind of feel like it would be easier to add a boolean parameter to CreateAllocationFunctionDecl, then you don't need to repeat these two lines. jlebar: I kind of feel like it would be easier to add a boolean parameter to…

FunctionDecl *Sema::FindUsualDeallocationFunction(SourceLocation StartLoc,		FunctionDecl *Sema::FindUsualDeallocationFunction(SourceLocation StartLoc,
bool CanProvideSize,		bool CanProvideSize,
bool Overaligned,		bool Overaligned,
DeclarationName Name) {		DeclarationName Name) {
DeclareGlobalNewDelete();		DeclareGlobalNewDelete();

LookupResult FoundDelete(*this, Name, StartLoc, LookupOrdinaryName);		LookupResult FoundDelete(*this, Name, StartLoc, LookupOrdinaryName);
▲ Show 20 Lines • Show All 4,813 Lines • Show Last 20 Lines

test/SemaCUDA/overloaded-delete.cu

	Show All 10 Lines
	};			};

	__host__ __device__ void test(S* s) {			__host__ __device__ void test(S* s) {
	// This shouldn't be ambiguous -- we call the host overload in host mode and			// This shouldn't be ambiguous -- we call the host overload in host mode and
	// the device overload in device mode.			// the device overload in device mode.
	delete s;			delete s;
	}			}

				// Code should work with no explicit declarations/definitions of
				// allocator functions.
				__host__ __device__ void test_default_global_delete_hd(int *ptr) {
				// Again, there should be no ambiguity between which operator delete we call.
				::delete ptr;
				}

				__device__ void test_default_global_delete(int *ptr) {
				// Again, there should be no ambiguity between which operator delete we call.
				::delete ptr;
				}
				__host__ void test_default_global_delete(int *ptr) {
				// Again, there should be no ambiguity between which operator delete we call.
				::delete ptr;
				}

				// It should work with only some of allocators (re-)declared.
				__device__ void operator delete(void *ptr);

				__host__ __device__ void test_partial_global_delete_hd(int *ptr) {
				// Again, there should be no ambiguity between which operator delete we call.
				::delete ptr;
				}

				__device__ void test_partial_global_delete(int *ptr) {
				// Again, there should be no ambiguity between which operator delete we call.
				::delete ptr;
				}
				__host__ void test_partial_global_delete(int *ptr) {
				// Again, there should be no ambiguity between which operator delete we call.
				::delete ptr;
				}


				// We should be able to define both host and device variants.
	__host__ void operator delete(void *ptr) {}			__host__ void operator delete(void *ptr) {}
	__device__ void operator delete(void *ptr) {}			__device__ void operator delete(void *ptr) {}

	__host__ __device__ void test_global_delete(int *ptr) {			__host__ __device__ void test_overloaded_global_delete_hd(int *ptr) {
				// Again, there should be no ambiguity between which operator delete we call.
				::delete ptr;
				}

				__device__ void test_overloaded_global_delete(int *ptr) {
				// Again, there should be no ambiguity between which operator delete we call.
				::delete ptr;
				}
				__host__ void test_overloaded_global_delete(int *ptr) {
	// Again, there should be no ambiguity between which operator delete we call.			// Again, there should be no ambiguity between which operator delete we call.
	::delete ptr;			::delete ptr;
	}			}