git.ipfire.org Git - thirdparty/gcc.git/commitdiff
libstdc++: Reduce ranges::minmax/minmax_element comparison complexity
author Patrick Palka <ppalka@redhat.com>
Fri, 18 Jun 2021 23:33:39 +0000 (19:33 -0400)
committer Patrick Palka <ppalka@redhat.com>
Fri, 18 Jun 2021 23:33:39 +0000 (19:33 -0400)
This rewrites ranges::minmax and ranges::minmax_element so that they
perform at most 3*N/2 comparisons, as required by the standard.
In passing, this also fixes PR100387 by avoiding a premature std::move
in ranges::minmax and in std::shift_right.

PR libstdc++/100387

libstdc++-v3/ChangeLog:

* include/bits/ranges_algo.h (__minmax_fn::operator()): Rewrite
to limit comparison complexity to 3*N/2.
(__minmax_element_fn::operator()): Likewise.
(shift_right): Avoid premature std::move of __result.
* testsuite/25_algorithms/minmax/constrained.cc (test04, test05):
New tests.
* testsuite/25_algorithms/minmax_element/constrained.cc (test02):
Likewise.

libstdc++-v3/include/bits/ranges_algo.h
libstdc++-v3/testsuite/25_algorithms/minmax/constrained.cc
libstdc++-v3/testsuite/25_algorithms/minmax_element/constrained.cc

index 9eeebff65258623aac7e0db859c64b220106a64b..83371a4bdf0a113fc042eaf400f43e5a36e05ad4 100644 (file)
@@ -3076,26 +3076,59 @@ namespace ranges
     template<input_range _Range, typename _Proj = identity,
             indirect_strict_weak_order<projected<iterator_t<_Range>, _Proj>>
               _Comp = ranges::less>
-      requires indirectly_copyable_storable<iterator_t<_Range>,
-      range_value_t<_Range>*>
+      requires indirectly_copyable_storable<iterator_t<_Range>, range_value_t<_Range>*>
       constexpr minmax_result<range_value_t<_Range>>
       operator()(_Range&& __r, _Comp __comp = {}, _Proj __proj = {}) const
       {
        auto __first = ranges::begin(__r);
        auto __last = ranges::end(__r);
        __glibcxx_assert(__first != __last);
+       auto __comp_proj = __detail::__make_comp_proj(__comp, __proj);
        minmax_result<range_value_t<_Range>> __result = {*__first, *__first};
+       if (++__first == __last)
+         return __result;
+       else
+         {
+           // At this point __result.min == __result.max, so a single
+           // comparison with the next element suffices.
+           auto&& __val = *__first;
+           if (__comp_proj(__val, __result.min))
+             __result.min = std::forward<decltype(__val)>(__val);
+           else
+             __result.max = std::forward<decltype(__val)>(__val);
+         }
        while (++__first != __last)
          {
-           auto __tmp = *__first;
-           if (std::__invoke(__comp,
-                             std::__invoke(__proj, __tmp),
-                             std::__invoke(__proj, __result.min)))
-             __result.min = std::move(__tmp);
-           if (!(bool)std::__invoke(__comp,
-                                    std::__invoke(__proj, __tmp),
-                                    std::__invoke(__proj, __result.max)))
-             __result.max = std::move(__tmp);
+           // Now process two elements at a time so that we perform at most
+           // 1 + 3*(N-2)/2 comparisons in total (each of the (N-2)/2
+           // iterations of this loop performs three comparisons).
+           range_value_t<_Range> __val1 = *__first;
+           if (++__first == __last)
+             {
+               // N is odd; in this final iteration, we perform at most two
+               // comparisons, for a total of 1 + 3*(N-3)/2 + 2 comparisons,
+               // which is not more than 3*N/2, as required.
+               if (__comp_proj(__val1, __result.min))
+                 __result.min = std::move(__val1);
+               else if (!__comp_proj(__val1, __result.max))
+                 __result.max = std::move(__val1);
+               break;
+             }
+           auto&& __val2 = *__first;
+           if (!__comp_proj(__val2, __val1))
+             {
+               if (__comp_proj(__val1, __result.min))
+                 __result.min = std::move(__val1);
+               if (!__comp_proj(__val2, __result.max))
+                 __result.max = std::forward<decltype(__val2)>(__val2);
+             }
+           else
+             {
+               if (__comp_proj(__val2, __result.min))
+                 __result.min = std::forward<decltype(__val2)>(__val2);
+               if (!__comp_proj(__val1, __result.max))
+                 __result.max = std::move(__val1);
+             }
          }
        return __result;
       }
@@ -3201,21 +3234,50 @@ namespace ranges
       operator()(_Iter __first, _Sent __last,
                 _Comp __comp = {}, _Proj __proj = {}) const
       {
-       if (__first == __last)
-         return {__first, __first};
-
+       auto __comp_proj = __detail::__make_comp_proj(__comp, __proj);
        minmax_element_result<_Iter> __result = {__first, __first};
-       auto __i = __first;
-       while (++__i != __last)
+       if (__first == __last || ++__first == __last)
+         return __result;
+       else
          {
-           if (std::__invoke(__comp,
-                             std::__invoke(__proj, *__i),
-                             std::__invoke(__proj, *__result.min)))
-             __result.min = __i;
-           if (!(bool)std::__invoke(__comp,
-                                    std::__invoke(__proj, *__i),
-                                    std::__invoke(__proj, *__result.max)))
-             __result.max = __i;
+           // At this point __result.min == __result.max, so a single
+           // comparison with the next element suffices.
+           if (__comp_proj(*__first, *__result.min))
+             __result.min = __first;
+           else
+             __result.max = __first;
+         }
+       while (++__first != __last)
+         {
+           // Now process two elements at a time so that we perform at most
+           // 1 + 3*(N-2)/2 comparisons in total (each of the (N-2)/2
+           // iterations of this loop performs three comparisons).
+           auto __prev = __first;
+           if (++__first == __last)
+             {
+               // N is odd; in this final iteration, we perform at most two
+               // comparisons, for a total of 1 + 3*(N-3)/2 + 2 comparisons,
+               // which is not more than 3*N/2, as required.
+               if (__comp_proj(*__prev, *__result.min))
+                 __result.min = __prev;
+               else if (!__comp_proj(*__prev, *__result.max))
+                 __result.max = __prev;
+               break;
+             }
+           if (!__comp_proj(*__first, *__prev))
+             {
+               if (__comp_proj(*__prev, *__result.min))
+                 __result.min = __prev;
+               if (!__comp_proj(*__first, *__result.max))
+                 __result.max = __first;
+             }
+           else
+             {
+               if (__comp_proj(*__first, *__result.min))
+                 __result.min = __first;
+               if (!__comp_proj(*__prev, *__result.max))
+                 __result.max = __prev;
+             }
          }
        return __result;
       }
@@ -3542,8 +3604,7 @@ namespace ranges
                  // i.e. we are shifting out at least half of the range.  In
                  // this case we can safely perform the shift with a single
                  // move.
-                 std::move(std::move(__first), std::move(__dest_head),
-                           std::move(__result));
+                 std::move(std::move(__first), std::move(__dest_head), __result);
                  return __result;
                }
              ++__dest_head;
index 786922414b59adce6b50d3e5359c36d6b76ac83b..c365152bf2bce39af2e996b40d9bdd05b94734e0 100644 (file)
@@ -19,6 +19,8 @@
 // { dg-do run { target c++2a } }
 
 #include <algorithm>
+#include <string>
+#include <vector>
 #include <testsuite_hooks.h>
 #include <testsuite_iterators.h>
 
@@ -89,10 +91,50 @@ test03()
          == res_t(1,4) );
 }
 
+void
+test04()
+{
+  // Verify we perform at most 3*N/2 applications of the comparison predicate.
+  static int counter;
+  struct counted_less
+  { bool operator()(int a, int b) { ++counter; return a < b; } };
+
+  ranges::minmax({1,2}, counted_less{});
+  VERIFY( counter == 1 );
+
+  counter = 0;
+  ranges::minmax({1,2,3}, counted_less{});
+  VERIFY( counter == 3 );
+
+  counter = 0;
+  ranges::minmax({1,2,3,4,5,6,7,8,9,10}, counted_less{});
+  VERIFY( counter <= 15 );
+
+  counter = 0;
+  ranges::minmax({10,9,8,7,6,5,4,3,2,1}, counted_less{});
+  VERIFY( counter <= 15 );
+}
+
+void
+test05()
+{
+  // PR libstdc++/100387
+  using namespace std::literals::string_literals;
+  auto comp = [](const auto& a, const auto& b) {
+    return a.size() == b.size() ? a.front() < b.front() : a.size() > b.size();
+  };
+  auto result = ranges::minmax({"b"s, "a"s}, comp);
+  VERIFY( result.min == "a"s && result.max == "b"s );
+  result = ranges::minmax({"c"s, "b"s, "a"s}, comp);
+  VERIFY( result.min == "a"s && result.max == "c"s );
+}
+
 int
 main()
 {
   test01();
   test02();
   test03();
+  test04();
+  test05();
 }
index 3b11c0dd96c2812d50163de97cb5e1b5f35518d3..0919f7dda8f9adc8c3725ff11ad7320c2878a2f2 100644 (file)
@@ -61,8 +61,35 @@ test01()
   static_assert(ranges::minmax_element(y, y+3, {}, &X::i).max->j == 3);
 }
 
+void
+test02()
+{
+  // Verify we perform at most 3*N/2 applications of the comparison predicate.
+  static int counter;
+  struct counted_less
+  { bool operator()(int a, int b) { ++counter; return a < b; } };
+
+  int x[] = {1,2,3,4,5,6,7,8,9,10};
+  ranges::minmax_element(x, x+2, counted_less{});
+  VERIFY( counter == 1 );
+
+  counter = 0;
+  ranges::minmax_element(x, x+3, counted_less{});
+  VERIFY( counter == 3 );
+
+  counter = 0;
+  ranges::minmax_element(x, counted_less{});
+  VERIFY( counter <= 15 );
+
+  ranges::reverse(x);
+  counter = 0;
+  ranges::minmax_element(x, counted_less{});
+  VERIFY( counter <= 15 );
+}
+
 int
 main()
 {
   test01();
+  test02();
 }