From 162a1a76364904eb971bf26adbb229b1aa067f44 Mon Sep 17 00:00:00 2001 From: Michael Schellenberger Costa Date: Tue, 30 Apr 2024 19:10:51 +0200 Subject: [PATCH] Try to ensure that `thrust::tuple` and `thrust::pair` work with CTAD --- libcudacxx/include/cuda/std/__utility/pair.h | 47 ++++---- .../cuda/std/detail/libcxx/include/tuple | 13 --- thrust/testing/pair.cu | 14 ++- thrust/testing/tuple.cu | 16 ++- thrust/thrust/detail/functional/actor.h | 2 +- thrust/thrust/detail/functional/actor.inl | 5 - .../detail/tuple_of_iterator_references.h | 14 +-- thrust/thrust/optional.h | 7 +- thrust/thrust/pair.h | 86 +++++++++++++- thrust/thrust/tuple.h | 107 ++++++++++++++++-- 10 files changed, 242 insertions(+), 69 deletions(-) diff --git a/libcudacxx/include/cuda/std/__utility/pair.h b/libcudacxx/include/cuda/std/__utility/pair.h index 9269a09c745..8b17881446a 100644 --- a/libcudacxx/include/cuda/std/__utility/pair.h +++ b/libcudacxx/include/cuda/std/__utility/pair.h @@ -283,18 +283,21 @@ struct _LIBCUDACXX_TEMPLATE_VIS pair : public __pair_base<_T1, _T2> : __base(__t1, __t2) {} - template ::template __constructible<_U1, _U2>, + template + using __pair_constructible = typename __pair_constraints<_T1, _T2>::template __constructible<_U1, _U2>; + + template , __enable_if_t<_Constraints::__explicit_constructible, int> = 0> _LIBCUDACXX_INLINE_VISIBILITY explicit constexpr pair(_U1&& __u1, _U2&& __u2) noexcept( _LIBCUDACXX_TRAIT(is_nothrow_constructible, _T1, _U1) && _LIBCUDACXX_TRAIT(is_nothrow_constructible, _T2, _U2)) : __base(_CUDA_VSTD::forward<_U1>(__u1), _CUDA_VSTD::forward<_U2>(__u2)) {} - template ::template __constructible<_U1, _U2>, + template , __enable_if_t<_Constraints::__implicit_constructible, int> = 0> _LIBCUDACXX_INLINE_VISIBILITY constexpr pair(_U1&& __u1, _U2&& __u2) noexcept( _LIBCUDACXX_TRAIT(is_nothrow_constructible, _T1, _U1) && _LIBCUDACXX_TRAIT(is_nothrow_constructible, _T2, _U2)) @@ -316,9 +319,9 @@ struct _LIBCUDACXX_TEMPLATE_VIS pair : public __pair_base<_T1, _T2> pair(pair const&) = default; pair(pair&&) = default; - template ::template __constructible, + template , __enable_if_t<_Constraints::__explicit_constructible, int> = 0> _LIBCUDACXX_INLINE_VISIBILITY explicit _CCCL_CONSTEXPR_CXX14 pair(const pair<_U1, _U2>& __p) noexcept( _LIBCUDACXX_TRAIT(is_nothrow_constructible, _T1, const _U1&) @@ -326,9 +329,9 @@ struct _LIBCUDACXX_TEMPLATE_VIS pair : public __pair_base<_T1, _T2> : __base(__p.first, __p.second) {} - template ::template __constructible, + template , __enable_if_t<_Constraints::__implicit_constructible, int> = 0> _LIBCUDACXX_INLINE_VISIBILITY _CCCL_CONSTEXPR_CXX14 pair(const pair<_U1, _U2>& __p) noexcept( _LIBCUDACXX_TRAIT(is_nothrow_constructible, _T1, const _U1&) @@ -337,18 +340,18 @@ struct _LIBCUDACXX_TEMPLATE_VIS pair : public __pair_base<_T1, _T2> {} // move constructors - template ::template __constructible<_U1, _U2>, + template , __enable_if_t<_Constraints::__explicit_constructible, int> = 0> _LIBCUDACXX_INLINE_VISIBILITY explicit _CCCL_CONSTEXPR_CXX14 pair(pair<_U1, _U2>&& __p) noexcept( _LIBCUDACXX_TRAIT(is_nothrow_constructible, _T1, _U1) && _LIBCUDACXX_TRAIT(is_nothrow_constructible, _T2, _U2)) : __base(_CUDA_VSTD::forward<_U1>(__p.first), _CUDA_VSTD::forward<_U2>(__p.second)) {} - template ::template __constructible<_U1, _U2>, + template , __enable_if_t<_Constraints::__implicit_constructible, int> = 0> _LIBCUDACXX_INLINE_VISIBILITY _CCCL_CONSTEXPR_CXX14 pair(pair<_U1, _U2>&& __p) noexcept( _LIBCUDACXX_TRAIT(is_nothrow_constructible, _T1, _U1) && _LIBCUDACXX_TRAIT(is_nothrow_constructible, _T2, _U2)) @@ -359,7 +362,7 @@ struct _LIBCUDACXX_TEMPLATE_VIS pair : public __pair_base<_T1, _T2> #if defined(__cuda_std__) && !defined(_CCCL_COMPILER_NVRTC) template ::template __constructible, + class _Constraints = __pair_constructible, __enable_if_t<_Constraints::__explicit_constructible, int> = 0> _CCCL_HOST _LIBCUDACXX_HIDE_FROM_ABI explicit _CCCL_CONSTEXPR_CXX14 pair(const ::std::pair<_U1, _U2>& __p) noexcept( _LIBCUDACXX_TRAIT(is_nothrow_constructible, _T1, const _U1&) @@ -369,7 +372,7 @@ struct _LIBCUDACXX_TEMPLATE_VIS pair : public __pair_base<_T1, _T2> template ::template __constructible, + class _Constraints = __pair_constructible, __enable_if_t<_Constraints::__implicit_constructible, int> = 0> _CCCL_HOST _LIBCUDACXX_HIDE_FROM_ABI _CCCL_CONSTEXPR_CXX14 pair(const ::std::pair<_U1, _U2>& __p) noexcept( _LIBCUDACXX_TRAIT(is_nothrow_constructible, _T1, const _U1&) @@ -379,7 +382,7 @@ struct _LIBCUDACXX_TEMPLATE_VIS pair : public __pair_base<_T1, _T2> template ::template __constructible<_U1, _U2>, + class _Constraints = __pair_constructible<_U1, _U2>, __enable_if_t<_Constraints::__explicit_constructible, int> = 0> _CCCL_HOST _LIBCUDACXX_HIDE_FROM_ABI explicit _CCCL_CONSTEXPR_CXX14 pair(::std::pair<_U1, _U2>&& __p) noexcept( _LIBCUDACXX_TRAIT(is_nothrow_constructible, _T1, _U1) && _LIBCUDACXX_TRAIT(is_nothrow_constructible, _T2, _U2)) @@ -388,7 +391,7 @@ struct _LIBCUDACXX_TEMPLATE_VIS pair : public __pair_base<_T1, _T2> template ::template __constructible<_U1, _U2>, + class _Constraints = __pair_constructible<_U1, _U2>, __enable_if_t<_Constraints::__implicit_constructible, int> = 0> _CCCL_HOST _LIBCUDACXX_HIDE_FROM_ABI _CCCL_CONSTEXPR_CXX14 pair(::std::pair<_U1, _U2>&& __p) noexcept( _LIBCUDACXX_TRAIT(is_nothrow_constructible, _T1, _U1) && _LIBCUDACXX_TRAIT(is_nothrow_constructible, _T2, _U2)) diff --git a/libcudacxx/include/cuda/std/detail/libcxx/include/tuple b/libcudacxx/include/cuda/std/detail/libcxx/include/tuple index 22cb1d51fe8..f1dadac04b7 100644 --- a/libcudacxx/include/cuda/std/detail/libcxx/include/tuple +++ b/libcudacxx/include/cuda/std/detail/libcxx/include/tuple @@ -194,10 +194,6 @@ template _LIBCUDACXX_BEGIN_NAMESPACE_STD -template -struct __is_tuple_of_iterator_references : false_type -{}; - // __tuple_leaf struct __tuple_leaf_default_constructor_tag {}; @@ -808,15 +804,6 @@ public: typename __tuple_constraints<_Tp...>::template __tuple_like_constraints<_Tuple>, __invalid_tuple_constraints>; - // Horrible hack to make tuple_of_iterator_references work - template ::value, int> = 0, - __enable_if_t<(tuple_size<_TupleOfIteratorReferences>::value == sizeof...(_Tp)), int> = 0> - _LIBCUDACXX_INLINE_VISIBILITY _CCCL_CONSTEXPR_CXX14 tuple(_TupleOfIteratorReferences&& __t) - : tuple(_CUDA_VSTD::forward<_TupleOfIteratorReferences>(__t).template __to_tuple<_Tp...>( - __make_tuple_indices_t())) - {} - template , __enable_if_t::value, int> = 0, diff --git a/thrust/testing/pair.cu b/thrust/testing/pair.cu index 1f1ddcf4d2e..cab025444bd 100644 --- a/thrust/testing/pair.cu +++ b/thrust/testing/pair.cu @@ -322,4 +322,16 @@ void TestPairStructuredBindings(void) ASSERT_EQUAL(b, b2); } DECLARE_UNITTEST(TestPairStructuredBindings); -#endif + +void TestPairCTAD(void) +{ + const int a = 42; + const int b = 1337; + thrust::pair p(a, b); + + auto [a2, b2] = p; + ASSERT_EQUAL(a, a2); + ASSERT_EQUAL(b, b2); +} +DECLARE_UNITTEST(TestPairCTAD); +#endif // _CCCL_STD_VER >= 2017 diff --git a/thrust/testing/tuple.cu b/thrust/testing/tuple.cu index c3cb1b23bab..879d920a011 100644 --- a/thrust/testing/tuple.cu +++ b/thrust/testing/tuple.cu @@ -511,7 +511,21 @@ void TestTupleStructuredBindings(void) ASSERT_EQUAL(c, c2); } DECLARE_UNITTEST(TestTupleStructuredBindings); -#endif + +void TestTupleCTAD(void) +{ + const int a = 0; + const char b = 42; + const short c = 1337; + thrust::tuple t(a, b, c); + + auto [a2, b2, c2] = t; + ASSERT_EQUAL(a, a2); + ASSERT_EQUAL(b, b2); + ASSERT_EQUAL(c, c2); +} +DECLARE_UNITTEST(TestTupleCTAD); +#endif // _CCCL_STD_VER >= 2017 // Ensure that we are backwards compatible with the old thrust::tuple implementation static_assert( diff --git a/thrust/thrust/detail/functional/actor.h b/thrust/thrust/detail/functional/actor.h index 0dd0560e69e..3f30d0a1570 100644 --- a/thrust/thrust/detail/functional/actor.h +++ b/thrust/thrust/detail/functional/actor.h @@ -65,7 +65,7 @@ struct actor : Eval { typedef Eval eval_type; - _CCCL_HOST_DEVICE constexpr actor(); + constexpr actor() = default; _CCCL_HOST_DEVICE actor(const Eval& base); diff --git a/thrust/thrust/detail/functional/actor.inl b/thrust/thrust/detail/functional/actor.inl index 81146a594c6..64d367ed15f 100644 --- a/thrust/thrust/detail/functional/actor.inl +++ b/thrust/thrust/detail/functional/actor.inl @@ -48,11 +48,6 @@ namespace detail namespace functional { -template -_CCCL_HOST_DEVICE constexpr actor::actor() - : eval_type() -{} - template _CCCL_HOST_DEVICE actor::actor(const Eval& base) : eval_type(base) diff --git a/thrust/thrust/iterator/detail/tuple_of_iterator_references.h b/thrust/thrust/iterator/detail/tuple_of_iterator_references.h index 574715e4a77..bb43c9d1c4b 100644 --- a/thrust/thrust/iterator/detail/tuple_of_iterator_references.h +++ b/thrust/thrust/iterator/detail/tuple_of_iterator_references.h @@ -67,9 +67,7 @@ class tuple_of_iterator_references : public thrust::tuple using super_t = thrust::tuple; using super_t::super_t; - inline _CCCL_HOST_DEVICE tuple_of_iterator_references() - : super_t() - {} + tuple_of_iterator_references() = default; // allow implicit construction from tuple inline _CCCL_HOST_DEVICE tuple_of_iterator_references(const super_t& other) @@ -138,15 +136,15 @@ class tuple_of_iterator_references : public thrust::tuple } // namespace detail -THRUST_NAMESPACE_END - -_LIBCUDACXX_BEGIN_NAMESPACE_STD - template struct __is_tuple_of_iterator_references> - : integral_constant + : _CUDA_VSTD::true_type {}; +THRUST_NAMESPACE_END + +_LIBCUDACXX_BEGIN_NAMESPACE_STD + // define tuple_size, tuple_element, etc. template struct tuple_size> diff --git a/thrust/thrust/optional.h b/thrust/thrust/optional.h index be186a9d78a..f7822324907 100644 --- a/thrust/thrust/optional.h +++ b/thrust/thrust/optional.h @@ -838,7 +838,12 @@ struct nullopt_t /// void foo (thrust::optional); /// foo(thrust::nullopt); //pass an empty optional /// ``` -static constexpr nullopt_t nullopt{nullopt_t::do_not_use{}, nullopt_t::do_not_use{}}; +#ifdef __CUDA_ARCH__ +__device__ static _LIBCUDACXX_CONSTEXPR_GLOBAL +#else +static constexpr +#endif // __CUDA_ARCH__ + nullopt_t nullopt{nullopt_t::do_not_use{}, nullopt_t::do_not_use{}}; class bad_optional_access : public std::exception { diff --git a/thrust/thrust/pair.h b/thrust/thrust/pair.h index 4fd2e8f8333..53d5cc93edf 100644 --- a/thrust/thrust/pair.h +++ b/thrust/thrust/pair.h @@ -50,7 +50,7 @@ THRUST_NAMESPACE_BEGIN * \tparam T A \c pair type of interest. */ template -using tuple_element = ::cuda::std::tuple_element; +using tuple_element = _CUDA_VSTD::tuple_element; /*! This convenience metafunction is included for compatibility with * \p tuple. It returns \c 2, the number of elements of a \p pair, @@ -59,7 +59,7 @@ using tuple_element = ::cuda::std::tuple_element; * \tparam Pair A \c pair type of interest. */ template -using tuple_size = ::cuda::std::tuple_size; +using tuple_size = _CUDA_VSTD::tuple_size; /*! \p pair is a generic data structure encapsulating a heterogeneous * pair of values. @@ -73,10 +73,49 @@ using tuple_size = ::cuda::std::tuple_size; * provided by pair::second_type. */ template -using pair = ::cuda::std::pair; - -using ::cuda::std::get; -using ::cuda::std::make_pair; +struct pair : public _CUDA_VSTD::pair +{ + using super_t = _CUDA_VSTD::pair; + using super_t::super_t; + +#if (defined(_CCCL_COMPILER_GCC) && __GNUC__ < 9) || (defined(_CCCL_COMPILER_CLANG) && __clang_major__ < 12) + // For whatever reason nvcc complains about that constructor being used before being defined in a constexpr variable + constexpr pair() = default; + + template ::template __constructible<_U1, _U2>, + _CUDA_VSTD::__enable_if_t<_Constraints::__implicit_constructible, int> = 0> + _CCCL_HOST_DEVICE constexpr pair(_U1&& __u1, _U2&& __u2) + : super_t(_CUDA_VSTD::forward<_U1>(__u1), _CUDA_VSTD::forward<_U2>(__u2)) + {} +#endif // _CCCL_COMPILER_GCC < 9 || _CCCL_COMPILER_CLANG < 12 +}; + +#if _CCCL_STD_VER >= 2017 +template +_CCCL_HOST_DEVICE pair(_T1, _T2) -> pair<_T1, _T2>; +#endif // _CCCL_STD_VER >= 2017 + +template +inline _CCCL_HOST_DEVICE + _CUDA_VSTD::__enable_if_t<_CUDA_VSTD::__is_swappable::value && _CUDA_VSTD::__is_swappable::value, void> + swap(pair& lhs, pair& rhs) noexcept( + (_CUDA_VSTD::__is_nothrow_swappable::value && _CUDA_VSTD::__is_nothrow_swappable::value)) +{ + lhs.swap(rhs); +} + +template +inline _CCCL_HOST_DEVICE + pair::type, typename _CUDA_VSTD::__unwrap_ref_decay::type> + make_pair(T1&& t1, T2&& t2) +{ + return pair::type, typename _CUDA_VSTD::__unwrap_ref_decay::type>( + _CUDA_VSTD::forward(t1), _CUDA_VSTD::forward(t2)); +} + +using _CUDA_VSTD::get; /*! \endcond */ @@ -88,3 +127,38 @@ using ::cuda::std::make_pair; */ THRUST_NAMESPACE_END + +_LIBCUDACXX_BEGIN_NAMESPACE_STD + +template +struct tuple_size> : tuple_size> +{}; + +template +struct tuple_element> : tuple_element> +{}; + +template +struct __tuple_like_ext> : true_type +{}; + +_LIBCUDACXX_END_NAMESPACE_STD + +// This is a workaround for the fact that structured bindings require that the specializations of +// `tuple_size` and `tuple_element` reside in namespace std (https://eel.is/c++draft/dcl.struct.bind#4). +// See https://github.com/NVIDIA/libcudacxx/issues/316 for a short discussion +#if _CCCL_STD_VER >= 2017 + +# include + +namespace std +{ +template +struct tuple_size> : tuple_size> +{}; + +template +struct tuple_element> : tuple_element> +{}; +} // namespace std +#endif // _CCCL_STD_VER >= 2017 diff --git a/thrust/thrust/tuple.h b/thrust/thrust/tuple.h index 5fa1d7f2f7c..4313df83fbd 100644 --- a/thrust/thrust/tuple.h +++ b/thrust/thrust/tuple.h @@ -94,28 +94,32 @@ _CCCL_HOST_DEVICE inline bool operator>(const null_type&, const null_type&) * \tparam N This parameter selects the element of interest. * \tparam T A \c tuple type of interest. * - * \see pair + * \see tuple * \see tuple */ template -using tuple_element = ::cuda::std::tuple_element; +using tuple_element = _CUDA_VSTD::tuple_element; /*! This metafunction returns the number of elements * of a \p tuple type of interest. * * \tparam T A \c tuple type of interest. * - * \see pair + * \see tuple * \see tuple */ template -using tuple_size = ::cuda::std::tuple_size; +using tuple_size = _CUDA_VSTD::tuple_size; + +template +struct __is_tuple_of_iterator_references : _CUDA_VSTD::false_type +{}; /*! \brief \p tuple is a class template that can be instantiated with up to ten * arguments. Each template argument specifies the type of element in the \p * tuple. Consequently, tuples are heterogeneous, fixed-size collections of * values. An instantiation of \p tuple with two arguments is similar to an - * instantiation of \p pair with the same two arguments. Individual elements + * instantiation of \p tuple with the same two arguments. Individual elements * of a \p tuple may be accessed with the \p get function. * * \tparam TN The type of the N \c tuple element. Thrust's \p tuple @@ -143,19 +147,72 @@ using tuple_size = ::cuda::std::tuple_size; * } * \endcode * - * \see pair + * \see tuple * \see get * \see make_tuple * \see tuple_element * \see tuple_size * \see tie */ -template -using tuple = ::cuda::std::tuple; +template +struct tuple : public _CUDA_VSTD::tuple +{ + using super_t = _CUDA_VSTD::tuple; + using super_t::super_t; + + tuple() = default; + + template ::value, int> = 0, + _CUDA_VSTD::__enable_if_t<(tuple_size<_TupleOfIteratorReferences>::value == sizeof...(Ts)), int> = 0> + _CCCL_HOST_DEVICE tuple(_TupleOfIteratorReferences&& tup) + : tuple(_CUDA_VSTD::forward<_TupleOfIteratorReferences>(tup).template __to_tuple( + _CUDA_VSTD::__make_tuple_indices_t())) + {} + + _CCCL_EXEC_CHECK_DISABLE + template ::value, int> = 0> + _CCCL_HOST_DEVICE tuple& operator=(TupleLike&& other) + { + super_t::operator=(_CUDA_VSTD::forward(other)); + return *this; + } +}; + +#if _CCCL_STD_VER >= 2017 +template +_CCCL_HOST_DEVICE tuple(Ts...) -> tuple; + +template +struct pair; + +template +_CCCL_HOST_DEVICE tuple(pair) -> tuple; +#endif // _CCCL_STD_VER >= 2017 + +template +inline _CCCL_HOST_DEVICE + _CUDA_VSTD::__enable_if_t<_CUDA_VSTD::__all<_CUDA_VSTD::__is_swappable::value...>::value, void> + swap(tuple& __x, + tuple& __y) noexcept((_CUDA_VSTD::__all<_CUDA_VSTD::__is_nothrow_swappable::value...>::value)) +{ + __x.swap(__y); +} + +template +inline _CCCL_HOST_DEVICE tuple::type...> make_tuple(Ts&&... __t) +{ + return tuple::type...>(_CUDA_VSTD::forward(__t)...); +} -using ::cuda::std::get; -using ::cuda::std::make_tuple; -using ::cuda::std::tie; +template +inline _CCCL_HOST_DEVICE tuple tie(Ts&... ts) noexcept +{ + return tuple(ts...); +} + +using _CUDA_VSTD::get; /*! \endcond */ @@ -170,6 +227,18 @@ THRUST_NAMESPACE_END _LIBCUDACXX_BEGIN_NAMESPACE_STD +template +struct tuple_size> : tuple_size> +{}; + +template +struct tuple_element> : tuple_element> +{}; + +template +struct __tuple_like_ext> : true_type +{}; + template <> struct tuple_size= 2017 +namespace std +{ +template +struct tuple_size> : tuple_size> +{}; + +template +struct tuple_element> : tuple_element> +{}; +} // namespace std +#endif // _CCCL_STD_VER >= 2017