On Thu, 26 Jun 2025, Patrick Palka wrote:
> PR libstdc++/100795
>
> libstdc++-v3/ChangeLog:
>
> * include/bits/ranges_algo.h (__sample_fn::operator()):
> Reimplement the forward_iterator branch directly.
> * testsuite/25_algorithms/sample/constrained.cc (test02):
> New test.
> ---
> libstdc++-v3/include/bits/ranges_algo.h | 70 +++++++++++++++++--
> .../25_algorithms/sample/constrained.cc | 28 ++++++++
> 2 files changed, 91 insertions(+), 7 deletions(-)
>
> diff --git a/libstdc++-v3/include/bits/ranges_algo.h
> b/libstdc++-v3/include/bits/ranges_algo.h
> index b12da2af1263..672a0ebce0de 100644
> --- a/libstdc++-v3/include/bits/ranges_algo.h
> +++ b/libstdc++-v3/include/bits/ranges_algo.h
> @@ -1839,14 +1839,70 @@ namespace ranges
> operator()(_Iter __first, _Sent __last, _Out __out,
> iter_difference_t<_Iter> __n, _Gen&& __g) const
> {
> + // FIXME: Correctly handle integer-class difference types.
On second thought maybe we don't need to teach uniform_int_distribution
to handle integer-class difference types. We could just assert that
__n fits inside a long long and use that as the difference type? Same
for shuffle.
> if constexpr (forward_iterator<_Iter>)
> {
> - // FIXME: Forwarding to std::sample here requires computing __lasti
> - // which may take linear time.
> - auto __lasti = ranges::next(__first, __last);
> - return _GLIBCXX_STD_A::
> - sample(std::move(__first), std::move(__lasti), std::move(__out),
> - __n, std::forward<_Gen>(__g));
> + using _Size = iter_difference_t<_Iter>;
> + using __distrib_type = uniform_int_distribution<_Size>;
> + using __param_type = typename __distrib_type::param_type;
> + using _USize = __detail::__make_unsigned_like_t<_Size>;
> + using __uc_type
> + = common_type_t<typename remove_reference_t<_Gen>::result_type,
> _USize>;
> +
> + if (__first == __last)
> + return __out;
> +
> + __distrib_type __d{};
> + _Size __unsampled_sz = ranges::distance(__first, __last);
> + __n = std::min(__n, __unsampled_sz);
> +
> + // If possible, we use __gen_two_uniform_ints to efficiently produce
> + // two random numbers using a single distribution invocation:
> +
> + const __uc_type __urngrange = __g.max() - __g.min();
> + if (__urngrange / __uc_type(__unsampled_sz) >=
> __uc_type(__unsampled_sz))
> + // I.e. (__urngrange >= __unsampled_sz * __unsampled_sz) but
> without
> + // wrapping issues.
> + {
> + while (__n != 0 && __unsampled_sz >= 2)
> + {
> + const pair<_Size, _Size> __p =
> + __gen_two_uniform_ints(__unsampled_sz, __unsampled_sz -
> 1, __g);
> +
> + --__unsampled_sz;
> + if (__p.first < __n)
> + {
> + *__out = *__first;
> + ++__out;
> + --__n;
> + }
> +
> + ++__first;
> +
> + if (__n == 0) break;
> +
> + --__unsampled_sz;
> + if (__p.second < __n)
> + {
> + *__out = *__first;
> + ++__out;
> + --__n;
> + }
> +
> + ++__first;
> + }
> + }
> +
> + // The loop above is otherwise equivalent to this one-at-a-time
> version:
> +
> + for (; __n != 0; ++__first)
> + if (__d(__g, __param_type{0, --__unsampled_sz}) < __n)
> + {
> + *__out = *__first;
> + ++__out;
> + --__n;
> + }
> + return __out;
> }
> else
> {
> @@ -1867,7 +1923,7 @@ namespace ranges
> if (__k < __n)
> __out[__k] = *__first;
> }
> - return __out + __sample_sz;
> + return __out + iter_difference_t<_Out>(__sample_sz);
> }
> }
>
> diff --git a/libstdc++-v3/testsuite/25_algorithms/sample/constrained.cc
> b/libstdc++-v3/testsuite/25_algorithms/sample/constrained.cc
> index b9945b164903..150e2d2036e0 100644
> --- a/libstdc++-v3/testsuite/25_algorithms/sample/constrained.cc
> +++ b/libstdc++-v3/testsuite/25_algorithms/sample/constrained.cc
> @@ -20,6 +20,7 @@
>
> #include <algorithm>
> #include <random>
> +#include <ranges>
> #include <testsuite_hooks.h>
> #include <testsuite_iterators.h>
>
> @@ -59,9 +60,36 @@ test01()
> }
> }
>
> +void
> +test02()
> +{
> + // PR libstdc++/100795 - ranges::sample should not use std::sample
> +#if 0 // FIXME: ranges::sample rejects integer-class difference types.
> +#if __SIZEOF_INT128__
> + auto v = std::views::iota(__int128(0), __int128(20));
> +#else
> + auto v = std::views::iota(0ll, 20ll);
> +#endif
> +#else
> + auto v = std::views::iota(0, 20);
> +#endif
> +
> + int storage[20] = {2,5,4,3,1,6,7,9,10,8,11,14,12,13,15,16,18,0,19,17};
> + auto w = v | std::views::transform([&](auto i) -> int& { return
> storage[i]; });
> + using type = decltype(w);
> + using cat =
> std::iterator_traits<std::ranges::iterator_t<type>>::iterator_category;
> + static_assert( std::same_as<cat, std::output_iterator_tag> );
> + static_assert( std::ranges::random_access_range<type> );
> +
> + ranges::sample(v, w.begin(), 20, rng);
> + ranges::sort(w);
> + VERIFY( ranges::equal(w, v) );
> +}
> +
> int
> main()
> {
> test01<forward_iterator_wrapper, output_iterator_wrapper>();
> test01<input_iterator_wrapper, random_access_iterator_wrapper>();
> + test02();
> }
> --
> 2.50.0.131.gcf6f63ea6b
>
>