On Fri, 27 Jun 2025 at 15:15, Patrick Palka <ppa...@redhat.com> wrote:
>
> On Fri, 27 Jun 2025, Jonathan Wakely wrote:
>
> > On 26/06/25 22:25 -0400, Patrick Palka wrote:
> > >     PR libstdc++/100795
> > >
> > > libstdc++-v3/ChangeLog:
> > >
> > >     * include/bits/ranges_algo.h (__detail::__move_merge): New,
> > >     based on the stl_algo.h implementation.
> > >     (__detail::__merge_sort_loop): Likewise.
> > >     (__detail::__chunk_insertion_sort): Likewise.
> > >     (__detail::__merge_sort_with_buffer): Likewise.
> > >     (__detail::__stable_sort_adaptive): Likewise.
> > >     (__detail::__stable_sort_adaptive_resize): Likewise.
> > >     (__detail::__inplace_stable_sort): Likewise.
> > >     (__stable_sort_fn::operator()): Reimplement in terms of the above.
> > >     * testsuite/25_algorithms/stable_sort/constrained.cc:
> > > ---
> > > libstdc++-v3/include/bits/ranges_algo.h       | 207 +++++++++++++++++-
> > > .../25_algorithms/stable_sort/constrained.cc  |  30 +++
> > > 2 files changed, 233 insertions(+), 4 deletions(-)
> > >
> > > diff --git a/libstdc++-v3/include/bits/ranges_algo.h
> > > b/libstdc++-v3/include/bits/ranges_algo.h
> > > index b0357600adbc..7dfd4e7ed64c 100644
> > > --- a/libstdc++-v3/include/bits/ranges_algo.h
> > > +++ b/libstdc++-v3/include/bits/ranges_algo.h
> > > @@ -2388,6 +2388,170 @@ namespace ranges
> > >
> > >   inline constexpr __sort_fn sort{};
> > >
> > > +  namespace __detail
> > > +  {
> > > +    /// This is a helper function for the __merge_sort_loop routines.
> > > +    template<typename _Iter, typename _Out, typename _Comp>
> > > +      _Out
> > > +      __move_merge(_Iter __first1, _Iter __last1,
> > > +              _Iter __first2, _Iter __last2,
> > > +              _Out __result, _Comp __comp)
> > > +      {
> > > +   while (__first1 != __last1 && __first2 != __last2)
> > > +     {
> > > +       if (__comp(*__first2, *__first1))
> > > +         {
> > > +           *__result = ranges::iter_move(__first2);
> > > +           ++__first2;
> > > +         }
> > > +       else
> > > +         {
> > > +           *__result = ranges::iter_move(__first1);
> > > +           ++__first1;
> > > +         }
> > > +       ++__result;
> > > +     }
> > > +   return ranges::move(__first2, __last2,
> > > +                       ranges::move(__first1, __last1,
> > > __result).out).out;
> > > +      }
> > > +
> > > +    template<typename _Iter, typename _Out, typename _Distance, typename
> > > _Comp>
> > > +      void
> > > +      __merge_sort_loop(_Iter __first, _Iter __last, _Out __result,
> > > +                   _Distance __step_size, _Comp __comp)
> > > +      {
> > > +   const _Distance __two_step = 2 * __step_size;
> > > +
> > > +   while (__last - __first >= __two_step)
> > > +     {
> > > +       __result = __detail::__move_merge(__first, __first + __step_size,
> > > +                                         __first + __step_size,
> > > +                                         __first + __two_step,
> > > +                                         __result, __comp);
> > > +       __first += __two_step;
> > > +     }
> > > +   __step_size = ranges::min(_Distance(__last - __first), __step_size);
> > > +
> > > +   __detail::__move_merge(__first, __first + __step_size,
> > > +                          __first + __step_size, __last, __result,
> > > __comp);
> > > +      }
> > > +
> > > +    template<typename _Iter, typename _Distance, typename _Compare>
> > > +      constexpr void
> > > +      __chunk_insertion_sort(_Iter __first, _Iter __last,
> > > +                        _Distance __chunk_size, _Compare __comp)
> > > +      {
> > > +   while (__last - __first >= __chunk_size)
> > > +     {
> > > +       __detail::__insertion_sort(__first, __first + __chunk_size,
> > > __comp);
> > > +       __first += __chunk_size;
> > > +     }
> > > +   __detail::__insertion_sort(__first, __last, __comp);
> > > +      }
> > > +
> > > +    template<typename _Iter, typename _Pointer, typename _Comp>
> > > +      void
> > > +      __merge_sort_with_buffer(_Iter __first, _Iter __last,
> > > +                          _Pointer __buffer, _Comp __comp)
> > > +      {
> > > +   using _Distance = iter_difference_t<_Iter>;
> > > +
> > > +   const _Distance __len = __last - __first;
> > > +   const _Pointer __buffer_last = __buffer + ptrdiff_t(__len);
> > > +
> > > +   constexpr int __chunk_size = 7;
> > > +   _Distance __step_size = __chunk_size;
> > > +   __detail::__chunk_insertion_sort(__first, __last, __step_size,
> > > __comp);
> > > +
> > > +   while (__step_size < __len)
> > > +     {
> > > +       __detail::__merge_sort_loop(__first, __last, __buffer,
> > > +                                   __step_size, __comp);
> > > +       __step_size *= 2;
> > > +       __detail::__merge_sort_loop(__buffer, __buffer_last, __first,
> > > +                                   ptrdiff_t(__step_size), __comp);
> > > +       __step_size *= 2;
> > > +     }
> > > +      }
> > > +
> > > +    template<typename _Iter, typename _Pointer, typename _Comp>
> > > +      void
> > > +      __merge_adaptive(_Iter __first, _Iter __middle, _Iter __last,
> > > +                  iter_difference_t<_Iter> __len1,
> > > +                  iter_difference_t<_Iter> __len2,
> > > +                  _Pointer __buffer, _Comp __comp); // defined near
> > > inplace_merge
> > > +
> > > +    template<typename _Iter, typename _Distance, typename _Pointer,
> > > typename _Comp>
> > > +      void
> > > +      __merge_adaptive_resize(_Iter __first, _Iter __middle, _Iter 
> > > __last,
> > > +                         _Distance __len1, _Distance __len2,
> > > +                         _Pointer __buffer, _Distance __buffer_size,
> > > +                         _Comp __comp); // defined near inplace_merge
> > > +
> > > +    template<typename _Iter, typename _Distance, typename _Comp>
> > > +      constexpr void
> > > +      __merge_without_buffer(_Iter __first, _Iter __middle, _Iter __last,
> > > +                        _Distance __len1, _Distance __len2,
> > > +                        _Comp __comp); // defined near inplace_merge
> > > +
> > > +    template<typename _Iter, typename _Pointer, typename _Comp>
> > > +      void
> > > +      __stable_sort_adaptive(_Iter __first, _Iter __middle, _Iter __last,
> > > +                        _Pointer __buffer, _Comp __comp)
> > > +      {
> > > +   __detail::__merge_sort_with_buffer(__first, __middle, __buffer,
> > > __comp);
> > > +   __detail::__merge_sort_with_buffer(__middle, __last, __buffer,
> > > __comp);
> > > +
> > > +   __detail::__merge_adaptive(__first, __middle, __last,
> > > +                              __middle - __first, __last - __middle,
> > > +                              __buffer, __comp);
> > > +      }
> > > +
> > > +    template<typename _Iter, typename _Pointer, typename _Distance,
> > > typename _Comp>
> > > +      void
> > > +      __stable_sort_adaptive_resize(_Iter __first, _Iter __last,
> > > +                               _Pointer __buffer, _Distance
> > > __buffer_size,
> > > +                               _Comp __comp)
> > > +      {
> > > +   const _Distance __len = (__last - __first + 1) / 2;
> > > +   const _Iter __middle = __first + __len;
> > > +   if (__len > __buffer_size)
> > > +     {
> > > +       __detail::__stable_sort_adaptive_resize(__first, __middle,
> > > __buffer,
> > > +                                               __buffer_size, __comp);
> > > +       __detail::__stable_sort_adaptive_resize(__middle, __last,
> > > __buffer,
> > > +                                               __buffer_size, __comp);
> > > +       __detail::__merge_adaptive_resize(__first, __middle, __last,
> > > +                                         _Distance(__middle - __first),
> > > +                                         _Distance(__last - __middle),
> > > +                                         __buffer, __buffer_size,
> > > +                                         __comp);
> > > +     }
> > > +   else
> > > +     __detail::__stable_sort_adaptive(__first, __middle, __last,
> > > +                                      __buffer, __comp);
> > > +      }
> > > +
> > > +    template<typename _Iter, typename _Comp>
> > > +      _GLIBCXX26_CONSTEXPR
> >
> > I think this could be unconditionally constexpr. It will never be used
> > during constant evaluation before C++26, but we can avoid the ugly
> > macro. Or do you think the macro serves as documentation for when we
> > expect to be constexpr? ... I suppose the 26_CONSTEXPR macro it makes
> > it clear that it could potentially use 'if consteval' in the body for
> > any constexpr paths, whereas it couldn't do that if it was used in
> > C++20.
>
> I think I prefer making it unconditionally constexpr, and also
> __stable_partition_adaptive in the ranges::stable_partition patch.

Ack - OK for trunk with those changes.

> >
> > > +      void
> > > +      __inplace_stable_sort(_Iter __first, _Iter __last, _Comp __comp)
> > > +      {
> > > +   if (__last - __first < 15)
> > > +     {
> > > +       __detail::__insertion_sort(__first, __last, __comp);
> > > +       return;
> > > +     }
> > > +   _Iter __middle = __first + (__last - __first) / 2;
> > > +   __detail::__inplace_stable_sort(__first, __middle, __comp);
> > > +   __detail::__inplace_stable_sort(__middle, __last, __comp);
> > > +   __detail::__merge_without_buffer(__first, __middle, __last,
> > > +                                    __middle - __first,
> > > +                                    __last - __middle,
> > > +                                    __comp);
> > > +      }
> > > +  } // namespace __detail
> > > +
> > >   struct __stable_sort_fn
> > >   {
> > >     template<random_access_iterator _Iter, sentinel_for<_Iter> _Sent,
> > > @@ -2398,10 +2562,45 @@ namespace ranges
> > >       operator()(_Iter __first, _Sent __last,
> > >              _Comp __comp = {}, _Proj __proj = {}) const
> > >       {
> > > -   auto __lasti = ranges::next(__first, __last);
> > > -   std::stable_sort(std::move(__first), __lasti,
> > > -                    __detail::__make_comp_proj(__comp, __proj));
> > > -   return __lasti;
> > > +   if constexpr (!same_as<_Iter, _Sent>)
> > > +     return (*this)(__first, ranges::next(__first, __last),
> > > +                    std::move(__comp), std::move(__proj));
> > > +   else
> > > +     {
> > > +       using _DistanceType = iter_difference_t<_Iter>;
> > > +
> > > +       if (__first == __last)
> > > +         return __last;
> > > +
> > > +#if _GLIBCXX_HOSTED
> > > +# if __glibcxx_constexpr_algorithms >= 202306L // >= C++26
> > > +       if consteval {
> > > +         __detail::__inplace_stable_sort(__first, __last, __comp);
> > > +         return __last;
> > > +       }
> > > +# endif
> > > +
> > > +       typedef _Temporary_buffer<_Iter, iter_value_t<_Iter>> _TmpBuf;
> > > +       // __stable_sort_adaptive sorts the range in two halves,
> > > +       // so the buffer only needs to fit half the range at once.
> > > +       _TmpBuf __buf(__first, ptrdiff_t((__last - __first + 1) / 2));
> > > +
> > > +       auto __comp_proj = __detail::__make_comp_proj(__comp, __proj);
> > > +       if (__buf._M_requested_size() == __buf.size()) [[likely]]
> > > +         __detail::__stable_sort_adaptive(__first,
> > > +                                          __first +
> > > _DistanceType(__buf.size()),
> > > +                                          __last, __buf.begin(),
> > > __comp_proj);
> > > +       else if (__buf.begin()) [[unlikely]]
> > > +         __detail::__inplace_stable_sort(__first, __last, __comp_proj);
> > > +       else
> > > +         __detail::__stable_sort_adaptive_resize(__first, __last,
> > > __buf.begin(),
> > > +
> > > _DistanceType(__buf.size()),
> > > +                                                 __comp_proj);
> > > +#else
> > > +       __detail::__inplace_stable_sort(__first, __last, __comp_proj);
> > > +#endif
> > > +       return __last;
> > > +     }
> > >       }
> > >
> > >     template<random_access_range _Range,
> > > diff --git 
> > > a/libstdc++-v3/testsuite/25_algorithms/stable_sort/constrained.cc
> > > b/libstdc++-v3/testsuite/25_algorithms/stable_sort/constrained.cc
> > > index 0bd438fa5f29..55043442f4be 100644
> > > --- a/libstdc++-v3/testsuite/25_algorithms/stable_sort/constrained.cc
> > > +++ b/libstdc++-v3/testsuite/25_algorithms/stable_sort/constrained.cc
> > > @@ -20,6 +20,7 @@
> > >
> > > #include <algorithm>
> > > #include <random>
> > > +#include <ranges>
> > > #include <vector>
> > > #include <testsuite_hooks.h>
> > > #include <testsuite_iterators.h>
> > > @@ -62,8 +63,37 @@ test01()
> > >     }
> > > }
> > >
> > > +void
> > > +test02()
> > > +{
> > > +  // PR libstdc++/100795 - ranges::stable_sort should not use
> > > std::stable_sort
> > > +  // directly
> > > +#if __SIZEOF_INT128__
> > > +  auto v = std::views::iota(__int128(0), __int128(20));
> > > +#else
> > > +  auto v = std::views::iota(0ll, 20ll);
> > > +#endif
> > > +
> > > +  int storage[20] = {2,5,4,3,1,6,7,9,10,8,11,14,12,13,15,16,18,0,19,17};
> > > +  auto w = v | std::views::transform([&](auto i) -> int& { return
> > > storage[i]; });
> > > +  using type = decltype(w);
> > > +  using cat =
> > > std::iterator_traits<std::ranges::iterator_t<type>>::iterator_category;
> > > +  static_assert( std::same_as<cat, std::output_iterator_tag> );
> > > +  static_assert( std::ranges::random_access_range<type> );
> > > +
> > > +  ranges::stable_sort(w);
> > > +  VERIFY( ranges::equal(w, v) );
> > > +
> > > +  ranges::stable_sort(w, std::ranges::greater{});
> > > +  VERIFY( ranges::equal(w, v | std::views::reverse) );
> > > +
> > > +  ranges::stable_sort(w, std::ranges::greater{}, std::negate{});
> > > +  VERIFY( ranges::equal(w, v) );
> > > +}
> > > +
> > > int
> > > main()
> > > {
> > >   test01();
> > > +  test02();
> > > }
> > > --
> > > 2.50.0.131.gcf6f63ea6b
> > >
> > >
> >
> >
>

Reply via email to