On Thu, Jun 12, 2025 at 4:56 PM Patrick Palka <ppa...@redhat.com> wrote:

> On Wed, 11 Jun 2025, Tomasz Kaminski wrote:
>
> >
> >
> > On Wed, Jun 11, 2025 at 1:56 PM Jonathan Wakely <jwak...@redhat.com>
> wrote:
> >       On Wed, 11 Jun 2025 at 12:42, Tomasz Kaminski <tkami...@redhat.com>
> wrote:
> >       >
> >       >
> >       >
> >       > On Tue, Jun 10, 2025 at 3:05 AM Patrick Palka <ppa...@redhat.com>
> wrote:
> >       >>
> >       >> ranges::push_heap, ranges::pop_heap, ranges::make_heap and
> >       >> ranges::sort_heap are currently defined in terms of the
> corresponding
> >       >> STL-style algorithms, but this is incorrect because the
> STL-style
> >       >> algorithms rely on the legacy iterator system, and so misbehave
> when
> >       >> passed a narrowly C++20 random access iterator.  The other
> ranges heap
> >       >> algos, ranges::is_heap and ranges::is_heap_until, are
> implemented
> >       >> directly already and have no known issues.
> >       >>
> >       >> This patch reimplements these ranges:: algos directly instead,
> based
> >       >> closely on the legacy stl_algo.h implementation, with the
> following
> >       >> changes for compatibility with the C++20 iterator system:
> >       >>
> >       >>   - handle non-common ranges by computing the corresponding end
> iterator
> >       >>   - pass and invoke a projection function as necessary
> >       >>   - use std::__invoke when invoking the comparator
> >       >>   - use ranges::iter_move instead of std::move(*iter)
> >       >>   - use iter_value_t / iter_difference_t instead of
> iterator_traits
> >       >>
> >       >> Besides these changes, the implementation of these algorithms is
> >       >> intended to mirror the stl_algo.h implementations, for ease of
> >       >> maintenance and review.
> >       >>
> >       >>         PR libstdc++/100795
> >       >>
> >       >> libstdc++-v3/ChangeLog:
> >       >>
> >       >>         * include/bits/ranges_algo.h (__detail::__push_heap):
> New,
> >       >>         based on the stl_algo.h implementation.
> >       >>         (__push_heap_fn::operator()): Reimplement in terms of
> the above.
> >       >>         (__detail::__adjust_heap): New, based on the stl_algo.h
> >       >>         implementation.
> >       >>         (__deatil::__pop_heap): Likewise.
> >       >>         (__pop_heap_fn::operator()): Reimplement in terms of
> the above.
> >       >>         (__make_heap_fn::operator()): Likewise.
> >       >>         (__sort_heap_fn::operator()): Likewise.
> >       >>         * testsuite/25_algorithms/heap/constrained.cc (test03):
> New
> >       >>         test.
> >       >> ---
> >       >>  libstdc++-v3/include/bits/ranges_algo.h       | 138
> ++++++++++++++++--
> >       >>  .../25_algorithms/heap/constrained.cc         |  46 ++++++
> >       >>  2 files changed, 168 insertions(+), 16 deletions(-)
> >       >
> >       > LGTM, only requests to pass the predicates by reference to match
> stl_heap.
> >
> >       That was done by  r7-6137-g437f43cc78d460 for  PR67085
> >
> > So the PR does not seem relevant for the range algorithm, and given that
> helper sort functions
> > pass comparator by value via multiple layers, I think we should default
> by-value, given no reason
> > to do otherwise.
>
> Ack.  Also I think by-value is optimal (in terms of codegen) for the
> common case where the comparator/projection are empty types, if the
> helper functions for some reason don't get inlined.
>
LGTM. Thanks.

>
> >
> >
> >
> >       > I have validated the impl against the stl_heap, and
> implementations are the same modulo described changes.
> >       >>
> >       >>
> >       >> diff --git a/libstdc++-v3/include/bits/ranges_algo.h
> b/libstdc++-v3/include/bits/ranges_algo.h
> >       >> index a62c3cd3954d..f84e0c42d76a 100644
> >       >> --- a/libstdc++-v3/include/bits/ranges_algo.h
> >       >> +++ b/libstdc++-v3/include/bits/ranges_algo.h
> >       >> @@ -1881,6 +1881,30 @@ namespace ranges
> >       >>
> >       >>    inline constexpr __shuffle_fn shuffle{};
> >       >>
> >       >> +  namespace __detail
> >       >> +  {
> >       >> +    template<typename _Iter, typename _Comp, typename _Proj>
> >       >> +      constexpr void
> >       >> +      __push_heap(_Iter __first,
> >       >> +                 iter_difference_t<_Iter> __holeIndex,
> >       >> +                 iter_difference_t<_Iter> __topIndex,
> >       >> +                 iter_value_t<_Iter> __value,
> >       >> +                 _Comp __comp, _Proj __proj)
> >       >
> >       > stl_heap implementation does not copy __comp and __proj, and uses
> >       > _Comp& instead. I think I would do that also here.
> >       >>
> >       >> +      {
> >       >> +       auto __parent = (__holeIndex - 1) / 2;
> >       >> +       while (__holeIndex > __topIndex
> >       >> +              && std::__invoke(__comp,
> >       >> +                               std::__invoke(__proj, *(__first
> + __parent)),
> >       >> +                               std::__invoke(__proj, __value)))
> >       >> +         {
> >       >> +           *(__first + __holeIndex) =
> ranges::iter_move(__first + __parent);
> >       >> +           __holeIndex = __parent;
> >       >> +           __parent = (__holeIndex - 1) / 2;
> >       >> +         }
> >       >> +       *(__first + __holeIndex) = std::move(__value);
> >       >> +      }
> >       >> +  } // namespace __detail
> >       >> +
> >       >>    struct __push_heap_fn
> >       >>    {
> >       >>      template<random_access_iterator _Iter, sentinel_for<_Iter>
> _Sent,
> >       >> @@ -1890,10 +1914,16 @@ namespace ranges
> >       >>        operator()(_Iter __first, _Sent __last,
> >       >>                  _Comp __comp = {}, _Proj __proj = {}) const
> >       >>        {
> >       >> -       auto __lasti = ranges::next(__first, __last);
> >       >> -       std::push_heap(__first, __lasti,
> >       >> -                      __detail::__make_comp_proj(__comp,
> __proj));
> >       >> -       return __lasti;
> >       >> +       if constexpr (!same_as<_Iter, _Sent>)
> >       >> +         return (*this)(__first, ranges::next(__first, __last),
> >       >> +                        std::move(__comp), std::move(__proj));
> >       >
> >       >
> >       >> +       else
> >       >> +         {
> >       >> +           __detail::__push_heap(__first, (__last - __first) -
> 1,
> >       >> +                                 0, ranges::iter_move(__last -
> 1),
> >       >> +                                 __comp, __proj);
> >       >> +           return __last;
> >       >> +         }
> >       >>        }
> >       >>
> >       >>      template<random_access_range _Range,
> >       >> @@ -1909,6 +1939,50 @@ namespace ranges
> >       >>
> >       >>    inline constexpr __push_heap_fn push_heap{};
> >       >>
> >       >> +  namespace __detail
> >       >> +  {
> >       >> +    template<typename _Iter, typename _Comp, typename _Proj>
> >       >> +      constexpr void
> >       >> +      __adjust_heap(_Iter __first,
> >       >> +                   iter_difference_t<_Iter> __holeIndex,
> >       >> +                   iter_difference_t<_Iter> __len,
> >       >> +                   iter_value_t<_Iter> __value,
> >       >> +                   _Comp __comp, _Proj __proj)
> >       >
> >       > Same comment about references.
> >       >>
> >       >> +      {
> >       >> +       auto __topIndex = __holeIndex;
> >       >> +       auto __secondChild = __holeIndex;
> >       >> +       while (__secondChild < (__len - 1) / 2)
> >       >> +         {
> >       >> +           __secondChild = 2 * (__secondChild + 1);
> >       >> +           if (std::__invoke(__comp,
> >       >> +                             std::__invoke(__proj, *(__first +
> __secondChild)),
> >       >> +                             std::__invoke(__proj, *(__first +
> (__secondChild - 1)))))
> >       >> +             __secondChild--;
> >       >> +           *(__first + __holeIndex) =
> ranges::iter_move(__first + __secondChild);
> >       >> +           __holeIndex = __secondChild;
> >       >> +         }
> >       >> +       if ((__len & 1) == 0 && __secondChild == (__len - 2) /
> 2)
> >       >> +         {
> >       >> +           __secondChild = 2 * (__secondChild + 1);
> >       >> +           *(__first + __holeIndex) =
> ranges::iter_move(__first + (__secondChild - 1));
> >       >> +           __holeIndex = __secondChild - 1;
> >       >> +         }
> >       >> +       __detail::__push_heap(__first, __holeIndex, __topIndex,
> >       >> +                             std::move(__value), __comp,
> __proj);
> >       >> +      }
> >       >> +
> >       >> +    template<typename _Iter, typename _Comp, typename _Proj>
> >       >> +      constexpr void
> >       >> +      __pop_heap(_Iter __first, _Iter __last, _Iter __result,
> >       >> +                _Comp __comp, _Proj __proj)
> >       >
> >       > Also here.
> >       >>
> >       >> +      {
> >       >> +       iter_value_t<_Iter> __value =
> ranges::iter_move(__result);
> >       >> +       *__result = ranges::iter_move(__first);
> >       >> +       __detail::__adjust_heap(__first, 0, __last - __first,
> >       >> +                               std::move(__value), __comp,
> __proj);
> >       >> +      }
> >       >> +  } // namespace __detail
> >       >> +
> >       >>    struct __pop_heap_fn
> >       >>    {
> >       >>      template<random_access_iterator _Iter, sentinel_for<_Iter>
> _Sent,
> >       >> @@ -1918,10 +1992,15 @@ namespace ranges
> >       >>        operator()(_Iter __first, _Sent __last,
> >       >>                  _Comp __comp = {}, _Proj __proj = {}) const
> >       >>        {
> >       >> -       auto __lasti = ranges::next(__first, __last);
> >       >> -       std::pop_heap(__first, __lasti,
> >       >> -                     __detail::__make_comp_proj(__comp,
> __proj));
> >       >> -       return __lasti;
> >       >> +       if constexpr (!same_as<_Iter, _Sent>)
> >       >> +         return (*this)(__first, ranges::next(__first, __last),
> >       >> +                        std::move(__comp), std::move(__proj));
> >       >> +       else
> >       >> +         {
> >       >> +           if (__last - __first > 1)
> >       >> +             __detail::__pop_heap(__first, __last - 1, __last
> - 1, __comp, __proj);
> >       >> +           return __last;
> >       >> +         }
> >       >>        }
> >       >>
> >       >>      template<random_access_range _Range,
> >       >> @@ -1946,10 +2025,28 @@ namespace ranges
> >       >>        operator()(_Iter __first, _Sent __last,
> >       >>                  _Comp __comp = {}, _Proj __proj = {}) const
> >       >>        {
> >       >> -       auto __lasti = ranges::next(__first, __last);
> >       >> -       std::make_heap(__first, __lasti,
> >       >> -                      __detail::__make_comp_proj(__comp,
> __proj));
> >       >> -       return __lasti;
> >       >> +       if constexpr (!same_as<_Iter, _Sent>)
> >       >> +         return (*this)(__first, ranges::next(__first, __last),
> >       >> +                        std::move(__comp), std::move(__proj));
> >       >> +       else
> >       >> +         {
> >       >> +           if (__last - __first > 1)
> >       >
> >       > I would prefer early if, matching the stl_heap closer:
> >       >  const auto __len = __last - __first;
> >       >   if (__len < 2)
> >       >      return __last;
>
> Fixed.
>
> Here's an updated patch, with the above early if change and also
> changed stl_algo.h mentions to stl_heap.h in the commit message.
>
> -- >8 --
>
> Subject: [PATCH 1/2] libstdc++: Directly implement ranges::heap algos
>  [PR100795]
>
> ranges::push_heap, ranges::pop_heap, ranges::make_heap and
> ranges::sort_heap are currently defined in terms of the corresponding
> STL-style algorithms, but this is incorrect because the STL-style
> algorithms rely on the legacy iterator system, and so misbehave when
> passed a narrowly C++20 random access iterator.  The other ranges heap
> algos, ranges::is_heap and ranges::is_heap_until, are implemented
> directly already and have no known issues.
>
> This patch reimplements these ranges:: algos directly instead, based
> closely on the legacy stl_heap.h implementation, with the following
> changes for compatibility with the C++20 iterator system:
>
>   - handle non-common ranges by computing the corresponding end iterator
>   - pass and invoke a projection function as necessary
>   - use std::__invoke when invoking the comparator
>   - use ranges::iter_move instead of std::move(*iter)
>   - use iter_value_t / iter_difference_t instead of iterator_traits
>
> Besides these changes, the implementation of these algorithms is
> intended to mirror the stl_heap.h implementations, for ease of
> maintenance and review.
>
>         PR libstdc++/100795
>
> libstdc++-v3/ChangeLog:
>
>         * include/bits/ranges_algo.h (__detail::__push_heap): New,
>         based on the stl_heap.h implementation.
>         (__push_heap_fn::operator()): Reimplement in terms of the above.
>         (__detail::__adjust_heap): New, based on the stl_heap.h
>         implementation.
>         (__deatil::__pop_heap): Likewise.
>         (__pop_heap_fn::operator()): Reimplement in terms of the above.
>         (__make_heap_fn::operator()): Likewise.
>         (__sort_heap_fn::operator()): Likewise.
>         * testsuite/25_algorithms/heap/constrained.cc (test03): New
>         test.
> ---
>  libstdc++-v3/include/bits/ranges_algo.h       | 138 ++++++++++++++++--
>  .../25_algorithms/heap/constrained.cc         |  46 ++++++
>  2 files changed, 168 insertions(+), 16 deletions(-)
>
> diff --git a/libstdc++-v3/include/bits/ranges_algo.h
> b/libstdc++-v3/include/bits/ranges_algo.h
> index a62c3cd3954d..ca86f63812f4 100644
> --- a/libstdc++-v3/include/bits/ranges_algo.h
> +++ b/libstdc++-v3/include/bits/ranges_algo.h
> @@ -1881,6 +1881,30 @@ namespace ranges
>
>    inline constexpr __shuffle_fn shuffle{};
>
> +  namespace __detail
> +  {
> +    template<typename _Iter, typename _Comp, typename _Proj>
> +      constexpr void
> +      __push_heap(_Iter __first,
> +                 iter_difference_t<_Iter> __holeIndex,
> +                 iter_difference_t<_Iter> __topIndex,
> +                 iter_value_t<_Iter> __value,
> +                 _Comp __comp, _Proj __proj)
> +      {
> +       auto __parent = (__holeIndex - 1) / 2;
> +       while (__holeIndex > __topIndex
> +              && std::__invoke(__comp,
> +                               std::__invoke(__proj, *(__first +
> __parent)),
> +                               std::__invoke(__proj, __value)))
> +         {
> +           *(__first + __holeIndex) = ranges::iter_move(__first +
> __parent);
> +           __holeIndex = __parent;
> +           __parent = (__holeIndex - 1) / 2;
> +         }
> +       *(__first + __holeIndex) = std::move(__value);
> +      }
> +  } // namespace __detail
> +
>    struct __push_heap_fn
>    {
>      template<random_access_iterator _Iter, sentinel_for<_Iter> _Sent,
> @@ -1890,10 +1914,16 @@ namespace ranges
>        operator()(_Iter __first, _Sent __last,
>                  _Comp __comp = {}, _Proj __proj = {}) const
>        {
> -       auto __lasti = ranges::next(__first, __last);
> -       std::push_heap(__first, __lasti,
> -                      __detail::__make_comp_proj(__comp, __proj));
> -       return __lasti;
> +       if constexpr (!same_as<_Iter, _Sent>)
> +         return (*this)(__first, ranges::next(__first, __last),
> +                        std::move(__comp), std::move(__proj));
> +       else
> +         {
> +           __detail::__push_heap(__first, (__last - __first) - 1,
> +                                 0, ranges::iter_move(__last - 1),
> +                                 __comp, __proj);
> +           return __last;
> +         }
>        }
>
>      template<random_access_range _Range,
> @@ -1909,6 +1939,50 @@ namespace ranges
>
>    inline constexpr __push_heap_fn push_heap{};
>
> +  namespace __detail
> +  {
> +    template<typename _Iter, typename _Comp, typename _Proj>
> +      constexpr void
> +      __adjust_heap(_Iter __first,
> +                   iter_difference_t<_Iter> __holeIndex,
> +                   iter_difference_t<_Iter> __len,
> +                   iter_value_t<_Iter> __value,
> +                   _Comp __comp, _Proj __proj)
> +      {
> +       auto __topIndex = __holeIndex;
> +       auto __secondChild = __holeIndex;
> +       while (__secondChild < (__len - 1) / 2)
> +         {
> +           __secondChild = 2 * (__secondChild + 1);
> +           if (std::__invoke(__comp,
> +                             std::__invoke(__proj, *(__first +
> __secondChild)),
> +                             std::__invoke(__proj, *(__first +
> (__secondChild - 1)))))
> +             __secondChild--;
> +           *(__first + __holeIndex) = ranges::iter_move(__first +
> __secondChild);
> +           __holeIndex = __secondChild;
> +         }
> +       if ((__len & 1) == 0 && __secondChild == (__len - 2) / 2)
> +         {
> +           __secondChild = 2 * (__secondChild + 1);
> +           *(__first + __holeIndex) = ranges::iter_move(__first +
> (__secondChild - 1));
> +           __holeIndex = __secondChild - 1;
> +         }
> +       __detail::__push_heap(__first, __holeIndex, __topIndex,
> +                             std::move(__value), __comp, __proj);
> +      }
> +
> +    template<typename _Iter, typename _Comp, typename _Proj>
> +      constexpr void
> +      __pop_heap(_Iter __first, _Iter __last, _Iter __result,
> +                _Comp __comp, _Proj __proj)
> +      {
> +       iter_value_t<_Iter> __value = ranges::iter_move(__result);
> +       *__result = ranges::iter_move(__first);
> +       __detail::__adjust_heap(__first, 0, __last - __first,
> +                               std::move(__value), __comp, __proj);
> +      }
> +  } // namespace __detail
> +
>    struct __pop_heap_fn
>    {
>      template<random_access_iterator _Iter, sentinel_for<_Iter> _Sent,
> @@ -1918,10 +1992,15 @@ namespace ranges
>        operator()(_Iter __first, _Sent __last,
>                  _Comp __comp = {}, _Proj __proj = {}) const
>        {
> -       auto __lasti = ranges::next(__first, __last);
> -       std::pop_heap(__first, __lasti,
> -                     __detail::__make_comp_proj(__comp, __proj));
> -       return __lasti;
> +       if constexpr (!same_as<_Iter, _Sent>)
> +         return (*this)(__first, ranges::next(__first, __last),
> +                        std::move(__comp), std::move(__proj));
> +       else
> +         {
> +           if (__last - __first > 1)
> +             __detail::__pop_heap(__first, __last - 1, __last - 1,
> __comp, __proj);
> +           return __last;
> +         }
>        }
>
>      template<random_access_range _Range,
> @@ -1946,10 +2025,28 @@ namespace ranges
>        operator()(_Iter __first, _Sent __last,
>                  _Comp __comp = {}, _Proj __proj = {}) const
>        {
> -       auto __lasti = ranges::next(__first, __last);
> -       std::make_heap(__first, __lasti,
> -                      __detail::__make_comp_proj(__comp, __proj));
> -       return __lasti;
> +       if constexpr (!same_as<_Iter, _Sent>)
> +         return (*this)(__first, ranges::next(__first, __last),
> +                        std::move(__comp), std::move(__proj));
> +       else
> +         {
> +           const auto __len = __last - __first;
> +           if (__len < 2)
> +             return __last;
> +
> +           auto __parent = (__len - 2) / 2;
> +           while (true)
> +             {
> +               iter_value_t<_Iter> __value = ranges::iter_move(__first +
> __parent);
> +               __detail::__adjust_heap(__first, __parent, __len,
> +                                       std::move(__value),
> +                                       __comp, __proj);
> +               if (__parent == 0)
> +                 break;
> +               __parent--;
> +             }
> +           return __last;
> +         }
>        }
>
>      template<random_access_range _Range,
> @@ -1974,10 +2071,19 @@ namespace ranges
>        operator()(_Iter __first, _Sent __last,
>                  _Comp __comp = {}, _Proj __proj = {}) const
>        {
> -       auto __lasti = ranges::next(__first, __last);
> -       std::sort_heap(__first, __lasti,
> -                      __detail::__make_comp_proj(__comp, __proj));
> -       return __lasti;
> +       if constexpr (!same_as<_Iter, _Sent>)
> +         return (*this)(__first, ranges::next(__first, __last),
> +                        std::move(__comp), std::move(__proj));
> +       else
> +         {
> +           _Iter __ret = __last;
> +           while (__last - __first > 1)
> +             {
> +               --__last;
> +               __detail::__pop_heap(__first, __last, __last, __comp,
> __proj);
> +             }
> +           return __ret;
> +         }
>        }
>
>      template<random_access_range _Range,
> diff --git a/libstdc++-v3/testsuite/25_algorithms/heap/constrained.cc
> b/libstdc++-v3/testsuite/25_algorithms/heap/constrained.cc
> index 8037a2db6b80..5486c8552d03 100644
> --- a/libstdc++-v3/testsuite/25_algorithms/heap/constrained.cc
> +++ b/libstdc++-v3/testsuite/25_algorithms/heap/constrained.cc
> @@ -20,6 +20,7 @@
>
>  #include <algorithm>
>  #include <random>
> +#include <ranges>
>  #include <testsuite_hooks.h>
>  #include <testsuite_iterators.h>
>
> @@ -97,10 +98,55 @@ test02()
>    return ok;
>  }
>
> +constexpr bool
> +test03()
> +{
> +  // PR libstdc++/100795 - ranges::heap algos should not use std::heap
> directly
> +#if __SIZEOF_INT128__
> +  auto v = std::views::iota(__int128(0), __int128(20));
> +#else
> +  auto v = std::views::iota(0ll, 20ll);
> +#endif
> +
> +  int storage[20] = {2,5,4,3,1,6,7,9,10,8,11,14,12,13,15,16,18,0,19,17};
> +  auto w = v | std::views::transform([&](auto i) -> int& { return
> storage[i]; });
> +  using type = decltype(w);
> +  using cat =
> std::iterator_traits<std::ranges::iterator_t<type>>::iterator_category;
> +  static_assert( std::same_as<cat, std::output_iterator_tag> );
> +  static_assert( std::ranges::random_access_range<type> );
> +
> +  for (int i = 1; i < 20; i++)
> +    ranges::push_heap(w.begin(), w.begin() + i);
> +  ranges::sort_heap(w);
> +  VERIFY( ranges::equal(w, v) );
> +  ranges::make_heap(w);
> +  auto it = ranges::pop_heap(w);
> +  VERIFY( it[-1] == 19 );
> +
> +  for (int i = 1; i < 20; i++)
> +    ranges::push_heap(w.begin(), w.begin() + i, std::ranges::greater{});
> +  ranges::sort_heap(w, std::ranges::greater{});
> +  VERIFY( ranges::equal(w, v | std::views::reverse) );
> +  ranges::make_heap(w, std::ranges::greater{});
> +  it = ranges::pop_heap(w, std::ranges::greater{});
> +  VERIFY( it[-1] == 0 );
> +
> +  for (int i = 1; i < 20; i++)
> +    ranges::push_heap(w.begin(), w.begin() + i, std::ranges::greater{},
> std::negate{});
> +  ranges::sort_heap(w, std::ranges::greater{}, std::negate{});
> +  VERIFY( ranges::equal(w, v) );
> +  ranges::make_heap(w, std::ranges::greater{}, std::negate{});
> +  it = ranges::pop_heap(w, std::ranges::greater{}, std::negate{});
> +  VERIFY( it[-1] == 19 );
> +
> +  return true;
> +}
> +
>  int
>  main()
>  {
>    test01<test_range>();
>    test01<test_container>();
>    static_assert(test02());
> +  static_assert(test03());
>  }
> --
> 2.50.0.rc2
>

Reply via email to