This is an archive of the discontinued LLVM Phabricator instance.

-------------------------------------------------------------------------------
Benchmark                                                  old Time    new Time
-------------------------------------------------------------------------------
BM_Rotate_uint32_Random_1                                   10.6 ns     10.7 ns
BM_Rotate_uint32_Random_4                                   24.3 ns     23.3 ns
BM_Rotate_uint32_Random_16                                  43.7 ns     32.9 ns
BM_Rotate_uint32_Random_64                                   116 ns     64.4 ns
BM_Rotate_uint32_Random_256                                  423 ns      181 ns
BM_Rotate_uint32_Random_1024                                1574 ns      612 ns
BM_Rotate_uint32_Random_16384                              26318 ns     8900 ns
BM_Rotate_uint32_Random_262144                            450038 ns   142255 ns
BM_Rotate_uint64_Random_1                                   10.6 ns     10.6 ns
BM_Rotate_uint64_Random_4                                   24.3 ns     23.2 ns
BM_Rotate_uint64_Random_16                                  44.3 ns     34.4 ns
BM_Rotate_uint64_Random_64                                   117 ns     67.7 ns
BM_Rotate_uint64_Random_256                                  424 ns      193 ns
BM_Rotate_uint64_Random_1024                                1589 ns      653 ns
BM_Rotate_uint64_Random_16384                              26920 ns     9357 ns
BM_Rotate_uint64_Random_262144                            460469 ns   149440 ns
BM_Rotate_pair<uint32, uint32>_Random_1                     10.6 ns     10.7 ns
BM_Rotate_pair<uint32, uint32>_Random_4                     23.2 ns     23.2 ns
BM_Rotate_pair<uint32, uint32>_Random_16                    36.9 ns     35.2 ns
BM_Rotate_pair<uint32, uint32>_Random_64                    80.7 ns     80.3 ns
BM_Rotate_pair<uint32, uint32>_Random_256                    268 ns      268 ns
BM_Rotate_pair<uint32, uint32>_Random_1024                  1010 ns     1009 ns
BM_Rotate_pair<uint32, uint32>_Random_16384                15728 ns    15734 ns
BM_Rotate_pair<uint32, uint32>_Random_262144              251816 ns   251948 ns
BM_Rotate_tuple<uint32, uint64, uint32>_Random_1            10.6 ns     10.6 ns
BM_Rotate_tuple<uint32, uint64, uint32>_Random_4            24.1 ns     23.7 ns
BM_Rotate_tuple<uint32, uint64, uint32>_Random_16           40.1 ns     40.7 ns
BM_Rotate_tuple<uint32, uint64, uint32>_Random_64            115 ns      113 ns
BM_Rotate_tuple<uint32, uint64, uint32>_Random_256           412 ns      405 ns
BM_Rotate_tuple<uint32, uint64, uint32>_Random_1024         1548 ns     1532 ns
BM_Rotate_tuple<uint32, uint64, uint32>_Random_16384       24555 ns    23936 ns
BM_Rotate_tuple<uint32, uint64, uint32>_Random_262144     395888 ns   386210 ns
BM_Rotate_string_Random_1                                   10.6 ns     10.6 ns
BM_Rotate_string_Random_4                                   48.7 ns     47.6 ns
BM_Rotate_string_Random_16                                   124 ns      124 ns
BM_Rotate_string_Random_64                                   288 ns      287 ns
BM_Rotate_string_Random_256                                  756 ns      758 ns
BM_Rotate_string_Random_1024                                2278 ns     2266 ns
BM_Rotate_string_Random_16384                              33052 ns    32758 ns
BM_Rotate_string_Random_262144                            533664 ns   533456 ns
BM_Rotate_float_Random_1                                    10.6 ns     10.6 ns
BM_Rotate_float_Random_4                                    25.2 ns     23.9 ns
BM_Rotate_float_Random_16                                   45.3 ns     33.4 ns
BM_Rotate_float_Random_64                                    115 ns     61.2 ns
BM_Rotate_float_Random_256                                   424 ns      167 ns
BM_Rotate_float_Random_1024                                 1578 ns      561 ns
BM_Rotate_float_Random_16384                               24589 ns     8015 ns
BM_Rotate_float_Random_262144                             409517 ns   125895 ns

philnik edited the summary of this revision. (Show Details)Apr 20 2022, 1:39 PM

Harbormaster completed remote builds in B160517: Diff 424013.Apr 20 2022, 3:24 PM

@philnik Note that the issue also contains a comment (https://github.com/llvm/llvm-project/issues/54949#issuecomment-1101619447) indicating that the current optimization can be faster for types that aren't cheap to move. Can we try to detect that and still use the current optimization in that case? Also, can you please try a benchmark with a non-trivially-copyable type and see what the numbers look like?

philnik edited the summary of this revision. (Show Details)Apr 23 2022, 11:03 AM

It looks like it is indeed a bit faster for structs that are expensive to move. I'll enable the optimization for types that are not trivially move-constructible and for types that are larger than 32 bytes.

------------------------------------------------------------------
Benchmark                                    old Time     new Time
------------------------------------------------------------------
BM_Rotate_ExpensiveToMove_Random_1            10.4 ns      10.5 ns
BM_Rotate_ExpensiveToMove_Random_4             300 ns       301 ns
BM_Rotate_ExpensiveToMove_Random_16           1299 ns      1363 ns
BM_Rotate_ExpensiveToMove_Random_64           5401 ns      6023 ns
BM_Rotate_ExpensiveToMove_Random_256         21964 ns     24717 ns
BM_Rotate_ExpensiveToMove_Random_1024        89849 ns    101480 ns
BM_Rotate_ExpensiveToMove_Random_16384     1550789 ns   1732624 ns
BM_Rotate_ExpensiveToMove_Random_262144   30205994 ns  35608461 ns

@var-const The non-trivially-copyable part should be covered by string, or did you have something more specific in mind?

I noticed that it wasn't actually enabled for non-trivial types, so I only restricted it to types larger than 32 bytes, although I'm not sure we want to keep this in, since it's a large part of the code while only being enabled for a very small number of types and only making a relatively small difference performance-wise. If we can find a good heuristic for enabling it for non-trivial types I would be happier to keep it in. (Although I don't think we can have a good heuristic for this kind of stuff.)

Harbormaster completed remote builds in B161043: Diff 424741.Apr 23 2022, 2:25 PM

I'd be fine with this since it addresses the underwhelming performance for simple types like int, which is super important. However, I would prefer if we instead went for a better algorithm directly, like the swap/grail rotate algorithm mentioned in https://github.com/llvm/llvm-project/issues/54949#issue-1206295098.

libcxx/include/__algorithm/rotate.h
135–136	I don't think `constexpr` adds a lot of value here since the compiler will definitely fold this anyway, and it's kind of weird to have `_LIBCPP_CONSTEXPR_AFTER_CXX14` in that location.
135–136	I would also do something like `const bool __is_expensive_to_move = sizeof(value_type) > 32; if (is_trivially_foo<...> && __is_expensive_to_move) { ... }`. That way, the code is somewhat self-documenting.

In D124122#3475473, @ldionne wrote:

I'd be fine with this since it addresses the underwhelming performance for simple types like int, which is super important. However, I would prefer if we instead went for a better algorithm directly, like the swap/grail rotate algorithm mentioned in https://github.com/llvm/llvm-project/issues/54949#issue-1206295098.

I planned to do a follow-up for that anyways. Would it be OK if I just nuke the current implementation and add the ranges API in the same patch?

In D124122#3475497, @philnik wrote:

In D124122#3475473, @ldionne wrote:

I'd be fine with this since it addresses the underwhelming performance for simple types like int, which is super important. However, I would prefer if we instead went for a better algorithm directly, like the swap/grail rotate algorithm mentioned in https://github.com/llvm/llvm-project/issues/54949#issue-1206295098.

I planned to do a follow-up for that anyways. Would it be OK if I just nuke the current implementation and add the ranges API in the same patch?

Yes, if we can have perf benchmarks for before and after. If that's easy to do, you could also first nuke the current implementation and replace it by one that is ranges::-friendly, and then just add the tiny ranges::rotate overlay on top (+ tests) in a separate patch. Both ways are acceptable, though.

Upload current status for Konstantin

Harbormaster completed remote builds in B177706: Diff 447827.Jul 26 2022, 2:47 PM

Revision Contents

Path

Size

libcxx/

benchmarks/

algorithms/

common.h

27 lines

include/

__algorithm/

ranges_rotate.h

14 lines

rotate.h

268 lines

Diff 447827

libcxx/benchmarks/algorithms/common.h

Show All 11 Lines
#include <algorithm>		#include <algorithm>
#include <numeric>		#include <numeric>
#include <tuple>		#include <tuple>
#include <vector>		#include <vector>

#include "../CartesianBenchmarks.h"		#include "../CartesianBenchmarks.h"
#include "../GenerateInput.h"		#include "../GenerateInput.h"

enum class ValueType { Uint32, Uint64, Pair, Tuple, String, Float };		enum class ValueType { Uint32, Uint64, Pair, Tuple, String, Float, ExpensiveToMove };
struct AllValueTypes : EnumValuesAsTuple<AllValueTypes, ValueType, 6> {		struct AllValueTypes : EnumValuesAsTuple<AllValueTypes, ValueType, 7> {
static constexpr const char* Names[] = {"uint32", "uint64", "pair<uint32, uint32>", "tuple<uint32, uint64, uint32>",		static constexpr const char* Names[] = {"uint32", "uint64", "pair<uint32, uint32>", "tuple<uint32, uint64, uint32>",
"string", "float"};		"string", "float", "ExpensiveToMove"};
		};

		struct ExpensiveToMove {
		int a[256];
		std::strong_ordering operator<=>(const ExpensiveToMove&) const = default;
};		};

using Types = std::tuple< uint32_t, uint64_t, std::pair<uint32_t, uint32_t>, std::tuple<uint32_t, uint64_t, uint32_t>,		using Types = std::tuple< uint32_t, uint64_t, std::pair<uint32_t, uint32_t>, std::tuple<uint32_t, uint64_t, uint32_t>,
std::string, float >;		std::string, float, ExpensiveToMove >;

template <class V>		template <class V>
using Value = std::tuple_element_t<(int)V::value, Types>;		using Value = std::tuple_element_t<(int)V::value, Types>;

enum class Order {		enum class Order {
Random,		Random,
Ascending,		Ascending,
Descending,		Descending,
▲ Show 20 Lines • Show All 105 Lines • ▼ Show 20 Lines	inline void fillValues(std::vector<std::string>& V, size_t N, Order O) {
if (O == Order::SingleElement) {		if (O == Order::SingleElement) {
V.resize(N, getRandomString(64));		V.resize(N, getRandomString(64));
} else {		} else {
while (V.size() < N)		while (V.size() < N)
V.push_back(getRandomString(64));		V.push_back(getRandomString(64));
}		}
}		}

		void fillValues(std::vector<ExpensiveToMove>& V, size_t N, Order O) {
		if (O == Order::SingleElement) {
		V.resize(N, ExpensiveToMove{});
		} else {
		while (V.size() != N) {
		ExpensiveToMove e;
		for (size_t i = 0; i != 256; ++i) {
		e.a[i] = V.size() + i;
		}
		V.push_back(e);
		}
		}
		}

template <class T>		template <class T>
void sortValues(T& V, Order O) {		void sortValues(T& V, Order O) {
switch (O) {		switch (O) {
case Order::Random: {		case Order::Random: {
std::random_device R;		std::random_device R;
std::mt19937 M(R());		std::mt19937 M(R());
std::shuffle(V.begin(), V.end(), M);		std::shuffle(V.begin(), V.end(), M);
break;		break;
▲ Show 20 Lines • Show All 88 Lines • Show Last 20 Lines

libcxx/include/__algorithm/ranges_rotate.h

This file was added.

				//===----------------------------------------------------------------------===//
				//
				// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
				// See https://llvm.org/LICENSE.txt for license information.
				// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
				//
				//===----------------------------------------------------------------------===//

				#ifndef _LIBCPP___ALGORITHM_RANGES_ROTATE_H
				#define _LIBCPP___ALGORITHM_RANGES_ROTATE_H



				#endif // _LIBCPP___ALGORITHM_RANGES_ROTATE_H

libcxx/include/__algorithm/rotate.h

//===----------------------------------------------------------------------===// //===----------------------------------------------------------------------===//

// //

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information. // See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

// //

//===----------------------------------------------------------------------===// //===----------------------------------------------------------------------===//

#ifndef _LIBCPP___ALGORITHM_ROTATE_H #ifndef _LIBCPP___ALGORITHM_ROTATE_H

#define _LIBCPP___ALGORITHM_ROTATE_H #define _LIBCPP___ALGORITHM_ROTATE_H

#include <__algorithm/iterator_operations.h> #include <__algorithm/iterator_operations.h>

#include <__algorithm/min.h>

#include <__algorithm/move.h> #include <__algorithm/move.h>

#include <__algorithm/move_backward.h> #include <__algorithm/move_backward.h>

#include <__algorithm/swap_ranges.h> #include <__algorithm/swap_ranges.h>

#include <__config> #include <__config>

#include <__iterator/iterator_traits.h> #include <__iterator/iterator_traits.h>

#include <__iterator/next.h> #include <__iterator/next.h>

#include <__iterator/prev.h> #include <__iterator/prev.h>

#include <__utility/move.h> #include <__utility/move.h>

#include <__utility/swap.h> #include <__utility/swap.h>

#include <type_traits> #include <type_traits>

#if !defined(_LIBCPP_HAS_NO_PRAGMA_SYSTEM_HEADER) #if !defined(_LIBCPP_HAS_NO_PRAGMA_SYSTEM_HEADER)

# pragma GCC system_header # pragma GCC system_header

#endif #endif

_LIBCPP_BEGIN_NAMESPACE_STD _LIBCPP_BEGIN_NAMESPACE_STD

template <class _AlgPolicy, class _ForwardIterator> template <class _Iter, class _Sent>

_LIBCPP_CONSTEXPR_AFTER_CXX11 _ForwardIterator _LIBCPP_HIDE_FROM_ABI _LIBCPP_CONSTEXPR_AFTER_CXX11 _Iter __rotate_left(_Iter __first, _Sent __last) {

__rotate_left(_ForwardIterator __first, _ForwardIterator __last) auto __tmp = std::move(*__first);

{ auto __lm1 = std::__move(std::next(__first), __last, __first);

typedef typename iterator_traits<_ForwardIterator>::value_type value_type; *__lm1 = std::move(__tmp);

value_type __tmp = _IterOps<_AlgPolicy>::__iter_move(__first);

// TODO(ranges): pass `_AlgPolicy` to `move`.

_ForwardIterator __lm1 = _VSTD::move(_VSTD::next(__first), __last, __first);

*__lm1 = _VSTD::move(__tmp);

return __lm1; return __lm1;

} }

template <class _AlgPolicy, class _BidirectionalIterator> template <class _Iter, class _Sent>

_LIBCPP_CONSTEXPR_AFTER_CXX11 _BidirectionalIterator _LIBCPP_HIDE_FROM_ABI _LIBCPP_CONSTEXPR_AFTER_CXX11 _Iter __rotate_right(_Iter __first, _Sent __last) {

__rotate_right(_BidirectionalIterator __first, _BidirectionalIterator __last) auto __lm1 = std::prev(__last);

{ auto __tmp = std::move(*__lm1);

typedef typename iterator_traits<_BidirectionalIterator>::value_type value_type; auto __fp1 = std::__move_backward(__first, __lm1, __last);

// TODO(ranges): pass `_AlgPolicy` to `prev`. *__first = std::move(__tmp);

_BidirectionalIterator __lm1 = _VSTD::prev(__last);

value_type __tmp = _IterOps<_AlgPolicy>::__iter_move(__lm1);

// TODO(ranges): pass `_AlgPolicy` to `move_backward`.

_BidirectionalIterator __fp1 = _VSTD::move_backward(__first, __lm1, __last);

*__first = _VSTD::move(__tmp);

return __fp1; return __fp1;

} }

template <class _AlgPolicy, class _ForwardIterator> template <class _Iter, class _Sent>

_LIBCPP_CONSTEXPR_AFTER_CXX14 _ForwardIterator _LIBCPP_HIDE_FROM_ABI _LIBCPP_CONSTEXPR_AFTER_CXX14 _Iter

__rotate_forward(_ForwardIterator __first, _ForwardIterator __middle, _ForwardIterator __last) __rotate_forward(_Iter __first, _Iter __middle, _Sent __last) {

{ auto __i = __middle;

_ForwardIterator __i = __middle; while (true) {

while (true) swap(*__first, *__i);

{

_IterOps<_AlgPolicy>::iter_swap(__first, __i);

++__first; ++__first;

if (++__i == __last) if (++__i == __last)

break; break;

if (__first == __middle) if (__first == __middle)

__middle = __i; __middle = __i;

} }

_ForwardIterator __r = __first; auto __r = __first;

if (__first != __middle) if (__first != __middle) {

{

__i = __middle; __i = __middle;

while (true) while (true) {

{ swap(*__first, *__i);

_IterOps<_AlgPolicy>::iter_swap(__first, __i);

++__first; ++__first;

if (++__i == __last) if (++__i == __last) {

{

if (__first == __middle) if (__first == __middle)

break; break;

__i = __middle; __i = __middle;

} } else if (__first == __middle)

else if (__first == __middle)

__middle = __i; __middle = __i;

} }

return __r; return __r;

} }

template<typename _Integral> template <class _Iter, class _Sent>

inline _LIBCPP_INLINE_VISIBILITY _LIBCPP_HIDE_FROM_ABI _LIBCPP_CONSTEXPR_AFTER_CXX14 _Iter __rotate_random(_Iter __first, _Iter __middle, _Sent __last) {

_LIBCPP_CONSTEXPR_AFTER_CXX14 _Integral auto __left = std::distance(__first, __middle);

__algo_gcd(_Integral __x, _Integral __y) auto __right = std::distance(__middle, __last);

{ auto __end = __first + __right;

{ if (__left == 0 || __first == __last)

_Integral __t = __x % __y; return __first;

__x = __y;

__y = __t; if (__left == __right) {

} while (__y); std::swap_ranges(__first, __middle, __middle);

return __x;

}

template <class _AlgPolicy, typename _RandomAccessIterator>

_LIBCPP_CONSTEXPR_AFTER_CXX14 _RandomAccessIterator

__rotate_gcd(_RandomAccessIterator __first, _RandomAccessIterator __middle, _RandomAccessIterator __last)

{

typedef typename iterator_traits<_RandomAccessIterator>::difference_type difference_type;

typedef typename iterator_traits<_RandomAccessIterator>::value_type value_type;

const difference_type __m1 = __middle - __first;

const difference_type __m2 = __last - __middle;

if (__m1 == __m2)

{

// TODO(ranges): pass `_AlgPolicy` to `swap_ranges`.

_VSTD::swap_ranges(__first, __middle, __middle);

return __middle; return __middle;

} }

const difference_type __g = _VSTD::__algo_gcd(__m1, __m2);

for (_RandomAccessIterator __p = __first + __g; __p != __first;)

{

value_type __t(_IterOps<_AlgPolicy>::__iter_move(--__p));

_RandomAccessIterator __p1 = __p;

_RandomAccessIterator __p2 = __p1 + __m1;

{

*__p1 = _IterOps<_AlgPolicy>::__iter_move(__p2);

__p1 = __p2;

const difference_type __d = __last - __p2;

if (__m1 < __d)

__p2 += __m1;

else

__p2 = __first + (__m1 - __d);

} while (__p2 != __p);

*__p1 = _VSTD::move(__t);

}

return __first + __m2;

}

template <class _AlgPolicy, class _ForwardIterator>

inline _LIBCPP_INLINE_VISIBILITY

_LIBCPP_CONSTEXPR_AFTER_CXX11 _ForwardIterator

__rotate_impl(_ForwardIterator __first, _ForwardIterator __middle, _ForwardIterator __last,

_VSTD::forward_iterator_tag)

{

typedef typename iterator_traits<_ForwardIterator>::value_type value_type;

if (is_trivially_move_assignable<value_type>::value)

{

if (_IterOps<_AlgPolicy>::next(__first) == __middle)

return std::__rotate_left<_AlgPolicy>(__first, __last);

}

return std::__rotate_forward<_AlgPolicy>(__first, __middle, __last);

}

template <class _AlgPolicy, class _BidirectionalIterator>

inline _LIBCPP_INLINE_VISIBILITY

_LIBCPP_CONSTEXPR_AFTER_CXX11 _BidirectionalIterator

__rotate_impl(_BidirectionalIterator __first, _BidirectionalIterator __middle, _BidirectionalIterator __last,

bidirectional_iterator_tag)

{

typedef typename iterator_traits<_BidirectionalIterator>::value_type value_type;

if (is_trivially_move_assignable<value_type>::value)

{

if (_IterOps<_AlgPolicy>::next(__first) == __middle)

return std::__rotate_left<_AlgPolicy>(__first, __last);

if (_IterOps<_AlgPolicy>::next(__middle) == __last)

return std::__rotate_right<_AlgPolicy>(__first, __last);

}

return std::__rotate_forward<_AlgPolicy>(__first, __middle, __last);

}

template <class _AlgPolicy, class _RandomAccessIterator>

inline _LIBCPP_INLINE_VISIBILITY

_LIBCPP_CONSTEXPR_AFTER_CXX11 _RandomAccessIterator

__rotate_impl(_RandomAccessIterator __first, _RandomAccessIterator __middle, _RandomAccessIterator __last,

random_access_iterator_tag)

{

typedef typename iterator_traits<_RandomAccessIterator>::value_type value_type;

if (is_trivially_move_assignable<value_type>::value)

{

if (_IterOps<_AlgPolicy>::next(__first) == __middle)

return std::__rotate_left<_AlgPolicy>(__first, __last);

if (_IterOps<_AlgPolicy>::next(__middle) == __last)

return std::__rotate_right<_AlgPolicy>(__first, __last);

return std::__rotate_gcd<_AlgPolicy>(__first, __middle, __last);

}

return std::__rotate_forward<_AlgPolicy>(__first, __middle, __last);

}

template <class _AlgPolicy, class _RandomAccessIterator, class _IterCategory>

_LIBCPP_HIDE_FROM_ABI _LIBCPP_CONSTEXPR_AFTER_CXX11

_RandomAccessIterator __rotate(_RandomAccessIterator __first, _RandomAccessIterator __middle,

_RandomAccessIterator __last, _IterCategory __iter_category) {

if (__first == __middle)

return __last;

if (__middle == __last)

return __first;

return std::__rotate_impl<_AlgPolicy>(std::move(__first), std::move(__middle), std::move(__last), __iter_category); auto __min_len = std::min(__left, __right);

while (__min_len > 0) {

if (__left <= __right) {

do {

std::swap_ranges(__first, __first + __left, __first + __left);

__first += __left;

__right -= __left;

} while (__left <= __right);

__min_len = __right;

} else {

do {

std::swap_ranges(__first + (__left - __right), __first + __left, __first + __left);

__left -= __right;

} while (__left > __right);

__min_len = __left;

}

return __end;

}

template <class _Iter, class _Sent>

inline _LIBCPP_HIDE_FROM_ABI _LIBCPP_CONSTEXPR_AFTER_CXX11 _Iter

__rotate(_Iter __first, _Iter __middle, _Sent __last, std::forward_iterator_tag) {

using value_type = typename iterator_traits<_Iter>::value_type;

if (is_nothrow_move_assignable<value_type>::value || !is_nothrow_swappable<value_type>::value) {

if (std::next(__first) == __middle)

return std::__rotate_left(__first, __last);

}

return std::__rotate_forward(__first, __middle, __last);

}

template <class _Iter, class _Sent>

inline _LIBCPP_HIDE_FROM_ABI _LIBCPP_CONSTEXPR_AFTER_CXX11 _Iter

__rotate(_Iter __first, _Iter __middle, _Sent __last, bidirectional_iterator_tag) {

using value_type = typename iterator_traits<_Iter>::value_type;

if (is_nothrow_move_assignable<value_type>::value || !is_nothrow_swappable<value_type>::value) {

if (std::next(__first) == __middle)

return std::__rotate_left(__first, __last);

if (std::next(__middle) == __last)

return std::__rotate_right(__first, __last);

}

return std::__rotate_forward(__first, __middle, __last);

}

template <class _Iter>

ldionneUnsubmitted

Not Done

typedef typename iterator_traits<_RandomAccessIterator>::value_type value_type;

- if _LIBCPP_CONSTEXPR_AFTER_CXX14 (is_trivially_move_assignable<value_type>::value && sizeof(value_type) > 32)

+ if (is_trivially_move_assignable<value_type>::value && sizeof(value_type) > 32)

{

if (_VSTD::next(__first) == __middle)

I don't think constexpr adds a lot of value here since the compiler will definitely fold this anyway, and it's kind of weird to have _LIBCPP_CONSTEXPR_AFTER_CXX14 in that location.

ldionne: I don't think `constexpr` adds a lot of value here since the compiler will definitely fold this…

ldionneUnsubmitted

Not Done

I would also do something like

const bool __is_expensive_to_move = sizeof(value_type) > 32;
if (is_trivially_foo<...> && __is_expensive_to_move) { ... }

That way, the code is somewhat self-documenting.

ldionne: I would also do something like ``` const bool __is_expensive_to_move = sizeof(value_type) > 32…

inline _LIBCPP_HIDE_FROM_ABI _LIBCPP_CONSTEXPR_AFTER_CXX11 _Iter

__rotate(_Iter __first, _Iter __middle, _Iter __last, random_access_iterator_tag) {

using value_type = typename iterator_traits<_Iter>::value_type;

if (is_nothrow_move_assignable<value_type>::value || !is_nothrow_swappable<value_type>::value) {

if (std::next(__first) == __middle)

return std::__rotate_left(__first, __last);

if (std::next(__middle) == __last)

return std::__rotate_right(__first, __last);

return std::__rotate_random(__first, __middle, __last);

}

return std::__rotate_forward(__first, __middle, __last);

} }

template <class _ForwardIterator> template <class _ForwardIterator>

inline _LIBCPP_INLINE_VISIBILITY inline _LIBCPP_HIDE_FROM_ABI _LIBCPP_CONSTEXPR_AFTER_CXX17 _ForwardIterator

_LIBCPP_CONSTEXPR_AFTER_CXX17 _ForwardIterator rotate(_ForwardIterator __first, _ForwardIterator __middle, _ForwardIterator __last) {

rotate(_ForwardIterator __first, _ForwardIterator __middle, _ForwardIterator __last) if (__first == __middle)

{ return __last;

return std::__rotate<_ClassicAlgPolicy>(__first, __middle, __last, if (__middle == __last)

typename iterator_traits<_ForwardIterator>::iterator_category()); return __first;

return std::__rotate(__first, __middle, __last, typename iterator_traits<_ForwardIterator>::iterator_category());

} }

_LIBCPP_END_NAMESPACE_STD _LIBCPP_END_NAMESPACE_STD

#endif // _LIBCPP___ALGORITHM_ROTATE_H #endif // _LIBCPP___ALGORITHM_ROTATE_H

This is an archive of the discontinued LLVM Phabricator instance.

[libc++] Optimize std::rotate (Needs Review, Public)

Details

Diff Detail

Event Timeline

Revision Contents

Diff 447827

libcxx/benchmarks/algorithms/common.h

libcxx/include/__algorithm/ranges_rotate.h

libcxx/include/__algorithm/rotate.h

[libc++] Optimize std::rotate
Needs ReviewPublic