On Thu, 26 Jun 2025, Patrick Palka wrote:

>       PR libstdc++/100795
> 
> libstdc++-v3/ChangeLog:
> 
>       * include/bits/ranges_algo.h (__sample_fn::operator()):
>       Reimplement the forward_iterator branch directly.
>       * testsuite/25_algorithms/sample/constrained.cc (test02):
>       New test.
> ---
>  libstdc++-v3/include/bits/ranges_algo.h       | 70 +++++++++++++++++--
>  .../25_algorithms/sample/constrained.cc       | 28 ++++++++
>  2 files changed, 91 insertions(+), 7 deletions(-)
> 
> diff --git a/libstdc++-v3/include/bits/ranges_algo.h 
> b/libstdc++-v3/include/bits/ranges_algo.h
> index b12da2af1263..672a0ebce0de 100644
> --- a/libstdc++-v3/include/bits/ranges_algo.h
> +++ b/libstdc++-v3/include/bits/ranges_algo.h
> @@ -1839,14 +1839,70 @@ namespace ranges
>        operator()(_Iter __first, _Sent __last, _Out __out,
>                iter_difference_t<_Iter> __n, _Gen&& __g) const
>        {
> +     // FIXME: Correctly handle integer-class difference types.

On second thought maybe we don't need to teach uniform_int_distribution
to handle integer-class difference types.  We could just assert that
__n fits inside a long long and use that as the difference type?  Same
for shuffle.

>       if constexpr (forward_iterator<_Iter>)
>         {
> -         // FIXME: Forwarding to std::sample here requires computing __lasti
> -         // which may take linear time.
> -         auto __lasti = ranges::next(__first, __last);
> -         return _GLIBCXX_STD_A::
> -           sample(std::move(__first), std::move(__lasti), std::move(__out),
> -                  __n, std::forward<_Gen>(__g));
> +         using _Size = iter_difference_t<_Iter>;
> +         using __distrib_type = uniform_int_distribution<_Size>;
> +         using __param_type = typename __distrib_type::param_type;
> +         using _USize = __detail::__make_unsigned_like_t<_Size>;
> +         using __uc_type
> +           = common_type_t<typename remove_reference_t<_Gen>::result_type, 
> _USize>;
> +
> +         if (__first == __last)
> +           return __out;
> +
> +         __distrib_type __d{};
> +         _Size __unsampled_sz = ranges::distance(__first, __last);
> +         __n = std::min(__n, __unsampled_sz);
> +
> +         // If possible, we use __gen_two_uniform_ints to efficiently produce
> +         // two random numbers using a single distribution invocation:
> +
> +         const __uc_type __urngrange = __g.max() - __g.min();
> +         if (__urngrange / __uc_type(__unsampled_sz) >= 
> __uc_type(__unsampled_sz))
> +           // I.e. (__urngrange >= __unsampled_sz * __unsampled_sz) but 
> without
> +           // wrapping issues.
> +           {
> +             while (__n != 0 && __unsampled_sz >= 2)
> +               {
> +                 const pair<_Size, _Size> __p =
> +                   __gen_two_uniform_ints(__unsampled_sz, __unsampled_sz - 
> 1, __g);
> +
> +                 --__unsampled_sz;
> +                 if (__p.first < __n)
> +                   {
> +                     *__out = *__first;
> +                     ++__out;
> +                     --__n;
> +                   }
> +
> +                 ++__first;
> +
> +                 if (__n == 0) break;
> +
> +                 --__unsampled_sz;
> +                 if (__p.second < __n)
> +                   {
> +                     *__out = *__first;
> +                     ++__out;
> +                     --__n;
> +                   }
> +
> +                 ++__first;
> +               }
> +           }
> +
> +         // The loop above is otherwise equivalent to this one-at-a-time 
> version:
> +
> +         for (; __n != 0; ++__first)
> +           if (__d(__g, __param_type{0, --__unsampled_sz}) < __n)
> +             {
> +               *__out = *__first;
> +               ++__out;
> +               --__n;
> +             }
> +         return __out;
>         }
>       else
>         {
> @@ -1867,7 +1923,7 @@ namespace ranges
>               if (__k < __n)
>                 __out[__k] = *__first;
>             }
> -         return __out + __sample_sz;
> +         return __out + iter_difference_t<_Out>(__sample_sz);
>         }
>        }
>  
> diff --git a/libstdc++-v3/testsuite/25_algorithms/sample/constrained.cc 
> b/libstdc++-v3/testsuite/25_algorithms/sample/constrained.cc
> index b9945b164903..150e2d2036e0 100644
> --- a/libstdc++-v3/testsuite/25_algorithms/sample/constrained.cc
> +++ b/libstdc++-v3/testsuite/25_algorithms/sample/constrained.cc
> @@ -20,6 +20,7 @@
>  
>  #include <algorithm>
>  #include <random>
> +#include <ranges>
>  #include <testsuite_hooks.h>
>  #include <testsuite_iterators.h>
>  
> @@ -59,9 +60,36 @@ test01()
>      }
>  }
>  
> +void
> +test02()
> +{
> +  // PR libstdc++/100795 - ranges::sample should not use std::sample
> +#if 0 // FIXME: ranges::sample rejects integer-class difference types.
> +#if __SIZEOF_INT128__
> +  auto v = std::views::iota(__int128(0), __int128(20));
> +#else
> +  auto v = std::views::iota(0ll, 20ll);
> +#endif
> +#else
> +  auto v = std::views::iota(0, 20);
> +#endif
> +
> +  int storage[20] = {2,5,4,3,1,6,7,9,10,8,11,14,12,13,15,16,18,0,19,17};
> +  auto w = v | std::views::transform([&](auto i) -> int& { return 
> storage[i]; });
> +  using type = decltype(w);
> +  using cat = 
> std::iterator_traits<std::ranges::iterator_t<type>>::iterator_category;
> +  static_assert( std::same_as<cat, std::output_iterator_tag> );
> +  static_assert( std::ranges::random_access_range<type> );
> +
> +  ranges::sample(v, w.begin(), 20, rng);
> +  ranges::sort(w);
> +  VERIFY( ranges::equal(w, v) );
> +}
> +
>  int
>  main()
>  {
>    test01<forward_iterator_wrapper, output_iterator_wrapper>();
>    test01<input_iterator_wrapper, random_access_iterator_wrapper>();
> +  test02();
>  }
> -- 
> 2.50.0.131.gcf6f63ea6b
> 
> 

Reply via email to