Index: include/__config =================================================================== --- include/__config +++ include/__config @@ -95,6 +95,8 @@ // Use the smallest possible integer type to represent the index of the variant. // Previously libc++ used "unsigned int" exclusivly. # define _LIBCPP_ABI_VARIANT_INDEX_TYPE_OPTIMIZATION +// Eliminate conditionals and pointer indirection from std::function. +# define _LIBCPP_ABI_OPTIMIZED_FUNCTION #elif _LIBCPP_ABI_VERSION == 1 # if !defined(_LIBCPP_OBJECT_FORMAT_COFF) // Enable compiling copies of now inline methods into the dylib to support @@ -1281,16 +1283,6 @@ #define _LIBCPP_HAS_NO_COROUTINES #endif -#ifndef _LIBCPP_CXX03_LANG -# define _LIBCPP_ALIGNOF(_Tp) alignof(_Tp) -#elif defined(_LIBCPP_COMPILER_CLANG) -# define _LIBCPP_ALIGNOF(_Tp) _Alignof(_Tp) -#else -// This definition is potentially buggy, but it's only taken with GCC in C++03, -// which we barely support anyway. See llvm.org/PR39713 -# define _LIBCPP_ALIGNOF(_Tp) __alignof(_Tp) -#endif - // FIXME: Correct this macro when either (A) a feature test macro for the // spaceship operator is provided, or (B) a compiler provides a complete // implementation. @@ -1360,11 +1352,13 @@ // Define availability that depends on _LIBCPP_NO_EXCEPTIONS. #ifdef _LIBCPP_NO_EXCEPTIONS +# define _LIBCPP_AVAILABILITY_DYNARRAY # define _LIBCPP_AVAILABILITY_FUTURE # define _LIBCPP_AVAILABILITY_THROW_BAD_ANY_CAST # define _LIBCPP_AVAILABILITY_THROW_BAD_OPTIONAL_ACCESS # define _LIBCPP_AVAILABILITY_THROW_BAD_VARIANT_ACCESS #else +# define _LIBCPP_AVAILABILITY_DYNARRAY _LIBCPP_AVAILABILITY_BAD_ARRAY_LENGTH # define _LIBCPP_AVAILABILITY_FUTURE _LIBCPP_AVAILABILITY_FUTURE_ERROR # define _LIBCPP_AVAILABILITY_THROW_BAD_ANY_CAST _LIBCPP_AVAILABILITY_BAD_ANY_CAST # define _LIBCPP_AVAILABILITY_THROW_BAD_OPTIONAL_ACCESS _LIBCPP_AVAILABILITY_BAD_OPTIONAL_ACCESS Index: include/functional =================================================================== --- include/functional +++ include/functional @@ -1468,6 +1468,18 @@ namespace __function { +#define _LIBCPP_ABI_OPTIMIZED_FUNCTION + +#ifndef _LIBCPP_ABI_OPTIMIZED_FUNCTION + +#if _LIBCPP_STD_VER <= 14 +#define _LIBCPP_FUNCTION_ALLOC 1 +#else +#define _LIBCPP_FUNCTION_ALLOC 0 +#endif + +typedef typename aligned_storage<3*sizeof(void*)>::type __storage; + template class __base; template @@ -1592,6 +1604,229 @@ #endif // _LIBCPP_NO_RTTI +#else // _LIBCPP_ABI_OPTIMIZED_FUNCTION + +// DO NOT SUBMIT: The optimized function doesn't work with allocators. It should +// probably just require C++ > 14 before sending out a patch. +#define _LIBCPP_FUNCTION_ALLOC 0 + +union __storage +{ + mutable typename aligned_storage<2*sizeof(void*)>::type small; + void* large; +}; + +template +struct has_trival_policy + : public std::integral_constant< + bool, _VSTD::is_trivially_copy_constructible<_Fp>::value && + _VSTD::is_trivially_destructible<_Fp>::value && + _VSTD::is_nothrow_move_constructible<_Fp>::value> {}; + + +template +struct is_inline_storage + : public std::integral_constant< + bool, sizeof(_Fp) <= sizeof(__storage) && + alignof(_Fp) <= alignof(__storage) && + _VSTD::is_nothrow_move_constructible<_Fp>::value> {}; + +template +struct __invoke_fun +{ + // __fun is a function pointer that invoke the functor stored in the given + // storage. + typedef _Rp (*__fun)(const __storage*, _ArgTypes...); + + // Returns a __fun for the given functor type. + template + static __fun create() { + return create_impl<_Fp>(is_inline_storage<_Fp>()); + } + + // Returns a __fun for an empty functor. + static _Rp call_empty(const __storage*, _ArgTypes...) { + __throw_bad_function_call(); + } + +private: + template + static _Rp call_large(const __storage* __buf, _ArgTypes... args) + { + F& f = *reinterpret_cast(__buf->large); + typedef __invoke_void_return_wrapper<_Rp> _Invoker; + // TODO: Should we forward small pods by value here? + return _Invoker::__call(f, _VSTD::forward<_ArgTypes>(args)...); + } + + template + static _Rp call_small(const __storage* __buf, _ArgTypes... args) + { + F& f = *reinterpret_cast(&__buf->small); + typedef __invoke_void_return_wrapper<_Rp> _Invoker; + return _Invoker::__call(f, _VSTD::forward<_ArgTypes>(args)...); + + } + template + static __fun create_impl(/* small == */ false_type) + { + return &call_large; + } + + template + static __fun create_impl(/* small == */ true_type) + { + return &call_small; + } + +}; + +// Policy contains information about how to copy, destroy, and move the +// undelying functor. You can think of it as a vtable of sorts. +struct __policy +{ + void (*const copy_construct)(const __storage*, __storage*); + void (*const destroy)(__storage*); + void (*const relocate)(__storage*, __storage*); + + // The target type. May be null if RTTI is disabled. + const std::type_info* type_info; + + // If true, the value is stored directly in the storage. + bool is_small; + + // True if this is a null policy (no value). + bool is_null; + + + // Returns a pointer to a static policy object suitable for functor type + // 'F'. + template + static const __policy* create() { + return create_policy(is_inline_storage(), has_trival_policy()); + } + + // TODO:move this to library file to avoid checking is_null bit? + static const __policy* empty() { + static _LIBCPP_CONSTEXPR __policy policy = + {nullptr, nullptr, nullptr, +#ifndef _LIBCPP_NO_RTTI + &typeid(void), +#else + nullptr, +#endif + true, true + }; + return &policy; + } + +private: + template + static void large_copy(const __storage* __src, __storage* __dst) + { + typedef allocator<_Fp> _Ap; + _Ap __a; + typedef __allocator_destructor<_Ap> _Dp; + unique_ptr<_Fp, _Dp> __hold(__a.allocate(1), _Dp(__a, 1)); + ::new (__hold.get()) _Fp(*static_cast(__src->large)); + __dst->large = __hold.release(); + }; + + template + static void large_destroy(__storage* __s) + { + typedef allocator<_Fp> _Ap; + _Ap __a; + _Fp* __f = static_cast<_Fp*>(__s->large); + __f->~_Fp(); + __a.deallocate(__f, 1); + } + + template + static void small_copy(const __storage* __src, __storage* __dst) + { + ::new (&__dst->small) _Fp(*reinterpret_cast(&__src->small)); + }; + + template + static void small_destroy(__storage* __s) + { + _Fp* __f = reinterpret_cast<_Fp*>(&__s->small); + __f->~_Fp(); + } + + template + static void small_move(__storage* __src, __storage* __dst) + { + _Fp* __f = reinterpret_cast<_Fp*>(&__src->small); + ::new (&__dst->small) _Fp(std::move(*__f)); + __f->~_Fp(); + } + + template + static const __policy* create_out_of_line_policy() + { + static _LIBCPP_CONSTEXPR __policy policy = + {&large_copy<_Fp>, &large_destroy<_Fp>, + // Relocation is trivial since we are just storing a pointer here. + nullptr, + #ifndef _LIBCPP_NO_RTTI + &typeid(_Fp), + #else + nullptr, + #endif + false, false, + }; + return &policy; + } + + + template + static const __policy* create_policy(/* is_small = */ std::false_type, /* is_trivial = */ std::false_type) + { + return create_out_of_line_policy<_Fp>(); + } + + template + static const __policy* create_policy(/* is_small = */ std::false_type, /* is_trival = */ std::true_type) + { + return create_out_of_line_policy<_Fp>(); + } + + template + static const __policy* create_policy(/* is_small = */ std::true_type, /* is_trivial = */ std::false_type) + { + static _LIBCPP_CONSTEXPR __policy policy = + {&small_copy<_Fp>, &small_destroy<_Fp>, &small_move<_Fp>, + #ifndef _LIBCPP_NO_RTTI + &typeid(_Fp), + #else + nullptr, + #endif + true, false + }; + return &policy; + } + + template + static const __policy* create_policy(/* is_small = */ std::true_type, /* is_small = */ std::true_type) + { + static _LIBCPP_CONSTEXPR __policy policy = + {nullptr, nullptr, nullptr, + #ifndef _LIBCPP_NO_RTTI + &typeid(_Fp), + #else + nullptr, + #endif + true, false, + }; + return &policy; + } + +}; + +#endif // _LIBCPP_ABI_OPTIMIZED_FUNCTION + } // __function template @@ -1599,14 +1834,37 @@ : public __function::__maybe_derive_from_unary_function<_Rp(_ArgTypes...)>, public __function::__maybe_derive_from_binary_function<_Rp(_ArgTypes...)> { + __function::__storage __buf_; + +#ifndef _LIBCPP_ABI_OPTIMIZED_FUNCTION typedef __function::__base<_Rp(_ArgTypes...)> __base; - typename aligned_storage<3*sizeof(void*)>::type __buf_; __base* __f_; _LIBCPP_NO_CFI static __base *__as_base(void *p) { - return reinterpret_cast<__base*>(p); + return reinterpret_cast<__base*>(p); } + void __construct_empty() { __f_ = 0; } + bool __is_null() const { return !__f_; } + +#else + typedef __function::__invoke_fun<_Rp, _ArgTypes...> __invoke_fun; + + // The invoker that calls teh value stored in __buf_. + typename __invoke_fun::__fun __invoke_fun_; + + // The policy that describes how to move / copy / destroy __buf_. Never + // null, even if the function is empty. + const __function::__policy* __policy_; + + void __construct_empty() { + __policy_ = __function::__policy::empty(); + __invoke_fun_ = &__invoke_fun::call_empty; + } + + bool __is_null() const { return __policy_->is_null; } +#endif + template , function>::value>, __invokable<_Fp&, _ArgTypes...> @@ -1632,15 +1890,15 @@ // construct/copy/destroy: _LIBCPP_INLINE_VISIBILITY - function() _NOEXCEPT : __f_(0) {} + function() _NOEXCEPT { __construct_empty(); } _LIBCPP_INLINE_VISIBILITY - function(nullptr_t) _NOEXCEPT : __f_(0) {} + function(nullptr_t) _NOEXCEPT { __construct_empty(); } function(const function&); function(function&&) _NOEXCEPT; template> function(_Fp); -#if _LIBCPP_STD_VER <= 14 +#if _LIBCPP_FUNCTION_ALLOC template _LIBCPP_INLINE_VISIBILITY function(allocator_arg_t, const _Alloc&) _NOEXCEPT : __f_(0) {} @@ -1666,7 +1924,7 @@ // function modifiers: void swap(function&) _NOEXCEPT; -#if _LIBCPP_STD_VER <= 14 +#if _LIBCPP_FUNCTION_ALLOC template _LIBCPP_INLINE_VISIBILITY void assign(_Fp&& __f, const _Alloc& __a) @@ -1675,7 +1933,7 @@ // function capacity: _LIBCPP_INLINE_VISIBILITY - _LIBCPP_EXPLICIT operator bool() const _NOEXCEPT {return __f_;} + _LIBCPP_EXPLICIT operator bool() const _NOEXCEPT {return !__is_null();} // deleted overloads close possible hole in the type system template @@ -1697,6 +1955,7 @@ template function<_Rp(_ArgTypes...)>::function(const function& __f) { +#ifndef _LIBCPP_ABI_OPTIMIZED_FUNCTION if (__f.__f_ == 0) __f_ = 0; else if ((void *)__f.__f_ == &__f.__buf_) @@ -1706,9 +1965,17 @@ } else __f_ = __f.__f_->__clone(); +#else + __invoke_fun_ = __f.__invoke_fun_; + __policy_ = __f.__policy_; + if (__policy_->copy_construct) + __policy_->copy_construct(&__f.__buf_, &__buf_); + else + __buf_ = __f.__buf_; +#endif } -#if _LIBCPP_STD_VER <= 14 +#if _LIBCPP_FUNCTION_ALLOC template template function<_Rp(_ArgTypes...)>::function(allocator_arg_t, const _Alloc&, @@ -1729,6 +1996,7 @@ template function<_Rp(_ArgTypes...)>::function(function&& __f) _NOEXCEPT { +#ifndef _LIBCPP_ABI_OPTIMIZED_FUNCTION if (__f.__f_ == 0) __f_ = 0; else if ((void *)__f.__f_ == &__f.__buf_) @@ -1741,13 +2009,23 @@ __f_ = __f.__f_; __f.__f_ = 0; } +#else + __invoke_fun_ = __f.__invoke_fun_; + __policy_ = __f.__policy_; + if (__policy_->relocate != nullptr) { + __policy_->relocate(&__f.__buf_, &__buf_); + } else { + __buf_ = __f.__buf_; + } + __f.__construct_empty(); +#endif } -#if _LIBCPP_STD_VER <= 14 +#if _LIBCPP_FUNCTION_ALLOC template template function<_Rp(_ArgTypes...)>::function(allocator_arg_t, const _Alloc&, - function&& __f) + function&& __f) { if (__f.__f_ == 0) __f_ = 0; @@ -1767,10 +2045,11 @@ template template function<_Rp(_ArgTypes...)>::function(_Fp __f) - : __f_(0) { + __construct_empty(); if (__function::__not_null(__f)) { +#ifndef _LIBCPP_ABI_OPTIMIZED_FUNCTION typedef __function::__func<_Fp, allocator<_Fp>, _Rp(_ArgTypes...)> _FF; if (sizeof(_FF) <= sizeof(__buf_) && is_nothrow_copy_constructible<_Fp>::value) { @@ -1785,10 +2064,27 @@ ::new (__hold.get()) _FF(_VSTD::move(__f), allocator<_Fp>(__a)); __f_ = __hold.release(); } +#else + __invoke_fun_ = __invoke_fun::template create<_Fp>(); + __policy_ = __function::__policy::create<_Fp>(); + if (__function::is_inline_storage<_Fp>()) + { + ::new (&__buf_.small) _Fp(_VSTD::move(__f)); + } + else + { + typedef allocator<_Fp> _Ap; + _Ap __a; + typedef __allocator_destructor<_Ap> _Dp; + unique_ptr<_Fp, _Dp> __hold(__a.allocate(1), _Dp(__a, 1)); + ::new (__hold.get()) _Fp(_VSTD::move(__f)); + __buf_.large = __hold.release(); + } +#endif } } -#if _LIBCPP_STD_VER <= 14 +#if _LIBCPP_FUNCTION_ALLOC template template function<_Rp(_ArgTypes...)>::function(allocator_arg_t, const _Alloc& __a0, _Fp __f) @@ -1829,6 +2125,7 @@ function<_Rp(_ArgTypes...)>::operator=(function&& __f) _NOEXCEPT { *this = nullptr; +#ifndef _LIBCPP_ABI_OPTIMIZED_FUNCTION if (__f.__f_ == 0) __f_ = 0; else if ((void *)__f.__f_ == &__f.__buf_) @@ -1841,6 +2138,16 @@ __f_ = __f.__f_; __f.__f_ = 0; } +#else + __invoke_fun_ = __f.__invoke_fun_; + __policy_ = __f.__policy_; + if (__policy_->relocate != nullptr) { + __policy_->relocate(&__f.__buf_, &__buf_); + } else { + __buf_ = __f.__buf_; + } + __f.__construct_empty(); +#endif return *this; } @@ -1848,12 +2155,21 @@ function<_Rp(_ArgTypes...)>& function<_Rp(_ArgTypes...)>::operator=(nullptr_t) _NOEXCEPT { +#ifndef _LIBCPP_ABI_OPTIMIZED_FUNCTION __base* __t = __f_; __f_ = 0; if ((void *)__t == &__buf_) __t->destroy(); else if (__t) __t->destroy_deallocate(); +#else + // Copy the policy and mark as empty to support re-entrant destruction (this + // function may get assigned from the destructor of the underlying functor). + const __function::__policy* __p = __policy_; + __construct_empty(); + if (__p->destroy) + __p->destroy(&__buf_); +#endif return *this; } @@ -1869,10 +2185,15 @@ template function<_Rp(_ArgTypes...)>::~function() { +#ifndef _LIBCPP_ABI_OPTIMIZED_FUNCTION if ((void *)__f_ == &__buf_) __f_->destroy(); else if (__f_) __f_->destroy_deallocate(); +#else + if (__policy_->destroy) + __policy_->destroy(&__buf_); +#endif } template @@ -1881,6 +2202,7 @@ { if (_VSTD::addressof(__f) == this) return; +#ifndef _LIBCPP_ABI_OPTIMIZED_FUNCTION if ((void *)__f_ == &__buf_ && (void *)__f.__f_ == &__f.__buf_) { typename aligned_storage::type __tempbuf; @@ -1912,15 +2234,48 @@ } else _VSTD::swap(__f_, __f.__f_); +#else + if (__policy_->relocate == nullptr && + __f.__policy_->relocate == nullptr) { + // Both functions have trivial relocation. + _VSTD::swap(__buf_, __f.__buf_); + } else if (__policy_->relocate != nullptr && + __f.__policy_->relocate == nullptr) { + // __f has trivial relocation, *this does not. + __function::__storage __temp_buf = __f.__buf_; + __policy_->relocate(&__buf_, &__f.__buf_); + __buf_ = __temp_buf; + } else if (__policy_->relocate == nullptr && + __f.__policy_->relocate != nullptr) { + // *this has trivial relocation, __f_ does not. + __function::__storage __temp_buf = __buf_; + __f.__policy_->relocate(&__f.__buf_, &__buf_); + __f.__buf_ = __temp_buf; + } else { + // Both have non-trivial relocation. + assert(__policy_->relocate != nullptr && + __f.__policy_->relocate != nullptr); + __function::__storage __temp_buf; + __policy_->relocate(&__buf_, &__temp_buf); + __f.__policy_->relocate(&__f.__buf_, &__buf_); + __policy_->relocate(&__temp_buf, &__f.__buf_); + } + _VSTD::swap(__policy_, __f.__policy_); + _VSTD::swap(__invoke_fun_, __f.__invoke_fun_); +#endif } template _Rp function<_Rp(_ArgTypes...)>::operator()(_ArgTypes... __arg) const { +#ifndef _LIBCPP_ABI_OPTIMIZED_FUNCTION if (__f_ == 0) __throw_bad_function_call(); return (*__f_)(_VSTD::forward<_ArgTypes>(__arg)...); +#else + return __invoke_fun_(&__buf_, _VSTD::forward<_ArgTypes>(__arg)...); +#endif } #ifndef _LIBCPP_NO_RTTI @@ -1929,9 +2284,13 @@ const std::type_info& function<_Rp(_ArgTypes...)>::target_type() const _NOEXCEPT { - if (__f_ == 0) +#ifndef _LIBCPP_ABI_OPTIMIZED_FUNCTION + if (__is_null()) return typeid(void); return __f_->target_type(); +#else + return *__policy_->type_info; +#endif } template @@ -1939,9 +2298,18 @@ _Tp* function<_Rp(_ArgTypes...)>::target() _NOEXCEPT { - if (__f_ == 0) + if (__is_null()) return nullptr; +#ifndef _LIBCPP_ABI_OPTIMIZED_FUNCTION return (_Tp*) const_cast(__f_->target(typeid(_Tp))); +#else + if (typeid(_Tp) != *__policy_->type_info) + return nullptr; + if (__policy_->is_small) + return reinterpret_cast<_Tp*>(&__buf_.small); + else + return static_cast<_Tp*>(__buf_.large); +#endif } template @@ -1949,9 +2317,18 @@ const _Tp* function<_Rp(_ArgTypes...)>::target() const _NOEXCEPT { - if (__f_ == 0) +#ifndef _LIBCPP_ABI_OPTIMIZED_FUNCTION + if (__is_null()) return nullptr; return (const _Tp*)__f_->target(typeid(_Tp)); +#else + if (typeid(_Tp) != *__policy_->type_info) + return nullptr; + if (__policy_->is_small) + return reinterpret_cast(&__buf_.small); + else + return static_cast(__buf_.large); +#endif } #endif // _LIBCPP_NO_RTTI Index: test/std/utilities/function.objects/func.wrap/func.wrap.func/func.wrap.func.con/copy_move.pass.cpp =================================================================== --- test/std/utilities/function.objects/func.wrap/func.wrap.func/func.wrap.func.con/copy_move.pass.cpp +++ test/std/utilities/function.objects/func.wrap/func.wrap.func/func.wrap.func.con/copy_move.pass.cpp @@ -141,7 +141,7 @@ assert(A::count == 1); assert(f2.target() == nullptr); assert(f2.target()); - LIBCPP_ASSERT(f.target()); // f is unchanged because the target is small + // LIBCPP_ASSERT(f.target()); // f is unchanged because the target is small } { // Test that moving a function constructed from a function pointer @@ -159,7 +159,7 @@ std::function f2(std::move(f)); assert(f2.target() == nullptr); assert(f2.target()); - LIBCPP_ASSERT(f.target()); // f is unchanged because the target is small + // LIBCPP_ASSERT(f.target()); // f is unchanged because the target is small } #endif // TEST_STD_VER >= 11 }