]>
Commit | Line | Data |
---|---|---|
1 | // -*- C++ -*- | |
2 | //===-- algorithm_impl.h --------------------------------------------------===// | |
3 | // | |
4 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. | |
5 | // See https://llvm.org/LICENSE.txt for license information. | |
6 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception | |
7 | // | |
8 | //===----------------------------------------------------------------------===// | |
9 | ||
10 | #ifndef _PSTL_ALGORITHM_IMPL_H | |
11 | #define _PSTL_ALGORITHM_IMPL_H | |
12 | ||
13 | #include <iterator> | |
14 | #include <type_traits> | |
15 | #include <utility> | |
16 | #include <functional> | |
17 | #include <algorithm> | |
18 | ||
19 | #include "execution_impl.h" | |
20 | #include "memory_impl.h" | |
21 | #include "parallel_backend_utils.h" | |
22 | #include "parallel_backend.h" | |
23 | #include "parallel_impl.h" | |
24 | #include "unseq_backend_simd.h" | |
25 | ||
26 | ||
27 | namespace __pstl | |
28 | { | |
29 | namespace __internal | |
30 | { | |
31 | ||
32 | //------------------------------------------------------------------------ | |
33 | // any_of | |
34 | //------------------------------------------------------------------------ | |
35 | ||
36 | template <class _ForwardIterator, class _Pred> | |
37 | bool | |
38 | __brick_any_of(const _ForwardIterator __first, const _ForwardIterator __last, _Pred __pred, | |
39 | /*__is_vector=*/std::false_type) noexcept | |
40 | { | |
41 | return std::any_of(__first, __last, __pred); | |
42 | }; | |
43 | ||
44 | template <class _RandomAccessIterator, class _Pred> | |
45 | bool | |
46 | __brick_any_of(const _RandomAccessIterator __first, const _RandomAccessIterator __last, _Pred __pred, | |
47 | /*__is_vector=*/std::true_type) noexcept | |
48 | { | |
49 | return __unseq_backend::__simd_or(__first, __last - __first, __pred); | |
50 | }; | |
51 | ||
52 | template <class _Tag, class _ExecutionPolicy, class _ForwardIterator, class _Pred> | |
53 | bool | |
54 | __pattern_any_of(_Tag, _ExecutionPolicy&&, _ForwardIterator __first, _ForwardIterator __last, _Pred __pred) noexcept | |
55 | { | |
56 | return __internal::__brick_any_of(__first, __last, __pred, typename _Tag::__is_vector{}); | |
57 | } | |
58 | ||
59 | template <class _IsVector, class _ExecutionPolicy, class _RandomAccessIterator, class _Pred> | |
60 | bool | |
61 | __pattern_any_of(__parallel_tag<_IsVector> __tag, _ExecutionPolicy&& __exec, _RandomAccessIterator __first, | |
62 | _RandomAccessIterator __last, _Pred __pred) | |
63 | { | |
64 | using __backend_tag = typename decltype(__tag)::__backend_tag; | |
65 | ||
66 | return __internal::__except_handler( | |
67 | [&]() | |
68 | { | |
69 | return __internal::__parallel_or(__backend_tag{}, std::forward<_ExecutionPolicy>(__exec), __first, __last, | |
70 | [__pred](_RandomAccessIterator __i, _RandomAccessIterator __j) | |
71 | { return __internal::__brick_any_of(__i, __j, __pred, _IsVector{}); }); | |
72 | }); | |
73 | } | |
74 | ||
75 | // [alg.foreach] | |
76 | // for_each_n with no policy | |
77 | ||
78 | template <class _ForwardIterator, class _Size, class _Function> | |
79 | _ForwardIterator | |
80 | __for_each_n_it_serial(_ForwardIterator __first, _Size __n, _Function __f) | |
81 | { | |
82 | for (; __n > 0; ++__first, --__n) | |
83 | __f(__first); | |
84 | return __first; | |
85 | } | |
86 | ||
87 | //------------------------------------------------------------------------ | |
88 | // walk1 (pseudo) | |
89 | // | |
90 | // walk1 evaluates f(x) for each dereferenced value x drawn from [first,last) | |
91 | //------------------------------------------------------------------------ | |
92 | template <class _ForwardIterator, class _Function> | |
93 | void | |
94 | __brick_walk1(_ForwardIterator __first, _ForwardIterator __last, _Function __f, /*vector=*/std::false_type) noexcept | |
95 | { | |
96 | std::for_each(__first, __last, __f); | |
97 | } | |
98 | ||
99 | template <class _RandomAccessIterator, class _Function> | |
100 | void | |
101 | __brick_walk1(_RandomAccessIterator __first, _RandomAccessIterator __last, _Function __f, | |
102 | /*vector=*/std::true_type) noexcept | |
103 | { | |
104 | __unseq_backend::__simd_walk_1(__first, __last - __first, __f); | |
105 | } | |
106 | ||
107 | template <class _Tag, class _ExecutionPolicy, class _ForwardIterator, class _Function> | |
108 | void | |
109 | __pattern_walk1(_Tag, _ExecutionPolicy&&, _ForwardIterator __first, _ForwardIterator __last, _Function __f) noexcept | |
110 | { | |
111 | __internal::__brick_walk1(__first, __last, __f, typename _Tag::__is_vector{}); | |
112 | } | |
113 | ||
114 | template <class _IsVector, class _ExecutionPolicy, class _RandomAccessIterator, class _Function> | |
115 | void | |
116 | __pattern_walk1(__parallel_tag<_IsVector> __tag, _ExecutionPolicy&& __exec, _RandomAccessIterator __first, | |
117 | _RandomAccessIterator __last, _Function __f) | |
118 | { | |
119 | using __backend_tag = typename decltype(__tag)::__backend_tag; | |
120 | ||
121 | __internal::__except_handler( | |
122 | [&]() | |
123 | { | |
124 | __par_backend::__parallel_for(__backend_tag{}, std::forward<_ExecutionPolicy>(__exec), __first, __last, | |
125 | [__f](_RandomAccessIterator __i, _RandomAccessIterator __j) | |
126 | { __internal::__brick_walk1(__i, __j, __f, _IsVector{}); }); | |
127 | }); | |
128 | } | |
129 | ||
130 | template <class _Tag, class _ExecutionPolicy, class _ForwardIterator, class _Brick> | |
131 | void | |
132 | __pattern_walk_brick(_Tag, _ExecutionPolicy&&, _ForwardIterator __first, _ForwardIterator __last, | |
133 | _Brick __brick) noexcept | |
134 | { | |
135 | __brick(__first, __last); | |
136 | } | |
137 | ||
138 | template <class _IsVector, class _ExecutionPolicy, class _RandomAccessIterator, class _Brick> | |
139 | void | |
140 | __pattern_walk_brick(__parallel_tag<_IsVector> __tag, _ExecutionPolicy&& __exec, _RandomAccessIterator __first, | |
141 | _RandomAccessIterator __last, _Brick __brick) | |
142 | { | |
143 | using __backend_tag = typename decltype(__tag)::__backend_tag; | |
144 | ||
145 | __internal::__except_handler( | |
146 | [&]() | |
147 | { | |
148 | __par_backend::__parallel_for(__backend_tag{}, std::forward<_ExecutionPolicy>(__exec), __first, __last, | |
149 | [__brick](_RandomAccessIterator __i, _RandomAccessIterator __j) | |
150 | { __brick(__i, __j); }); | |
151 | }); | |
152 | } | |
153 | ||
154 | //------------------------------------------------------------------------ | |
155 | // walk1_n | |
156 | //------------------------------------------------------------------------ | |
157 | template <class _ForwardIterator, class _Size, class _Function> | |
158 | _ForwardIterator | |
159 | __brick_walk1_n(_ForwardIterator __first, _Size __n, _Function __f, /*_IsVectorTag=*/std::false_type) | |
160 | { | |
161 | return __internal::__for_each_n_it_serial(__first, __n, | |
162 | [&__f](_ForwardIterator __it) { __f(*__it); }); // calling serial version | |
163 | } | |
164 | ||
165 | template <class _RandomAccessIterator, class _DifferenceType, class _Function> | |
166 | _RandomAccessIterator | |
167 | __brick_walk1_n(_RandomAccessIterator __first, _DifferenceType __n, _Function __f, | |
168 | /*vectorTag=*/std::true_type) noexcept | |
169 | { | |
170 | return __unseq_backend::__simd_walk_1(__first, __n, __f); | |
171 | } | |
172 | ||
173 | template <class _Tag, class _ExecutionPolicy, class _ForwardIterator, class _Size, class _Function> | |
174 | _ForwardIterator | |
175 | __pattern_walk1_n(_Tag, _ExecutionPolicy&&, _ForwardIterator __first, _Size __n, _Function __f) noexcept | |
176 | { | |
177 | return __internal::__brick_walk1_n(__first, __n, __f, typename _Tag::__is_vector{}); | |
178 | } | |
179 | ||
180 | template <class _IsVector, class _ExecutionPolicy, class _RandomAccessIterator, class _Size, class _Function> | |
181 | _RandomAccessIterator | |
182 | __pattern_walk1_n(__parallel_tag<_IsVector> __tag, _ExecutionPolicy&& __exec, _RandomAccessIterator __first, _Size __n, | |
183 | _Function __f) | |
184 | { | |
185 | __internal::__pattern_walk1(__tag, std::forward<_ExecutionPolicy>(__exec), __first, __first + __n, __f); | |
186 | ||
187 | return __first + __n; | |
188 | } | |
189 | ||
190 | template <class _Tag, class _ExecutionPolicy, class _ForwardIterator, class _Size, class _Brick> | |
191 | _ForwardIterator | |
192 | __pattern_walk_brick_n(_Tag, _ExecutionPolicy&&, _ForwardIterator __first, _Size __n, _Brick __brick) noexcept | |
193 | { | |
194 | return __brick(__first, __n); | |
195 | } | |
196 | ||
197 | template <class _IsVector, class _ExecutionPolicy, class _RandomAccessIterator, class _Size, class _Brick> | |
198 | _RandomAccessIterator | |
199 | __pattern_walk_brick_n(__parallel_tag<_IsVector> __tag, _ExecutionPolicy&& __exec, _RandomAccessIterator __first, | |
200 | _Size __n, _Brick __brick) | |
201 | { | |
202 | using __backend_tag = typename decltype(__tag)::__backend_tag; | |
203 | ||
204 | return __internal::__except_handler( | |
205 | [&]() | |
206 | { | |
207 | __par_backend::__parallel_for( | |
208 | __backend_tag{}, std::forward<_ExecutionPolicy>(__exec), __first, __first + __n, | |
209 | [__brick](_RandomAccessIterator __i, _RandomAccessIterator __j) { __brick(__i, __j - __i); }); | |
210 | return __first + __n; | |
211 | }); | |
212 | } | |
213 | ||
214 | //------------------------------------------------------------------------ | |
215 | // walk2 (pseudo) | |
216 | // | |
217 | // walk2 evaluates f(x,y) for deferenced values (x,y) drawn from [first1,last1) and [first2,...) | |
218 | //------------------------------------------------------------------------ | |
219 | template <class _ForwardIterator1, class _ForwardIterator2, class _Function> | |
220 | _ForwardIterator2 | |
221 | __brick_walk2(_ForwardIterator1 __first1, _ForwardIterator1 __last1, _ForwardIterator2 __first2, _Function __f, | |
222 | /*vector=*/std::false_type) noexcept | |
223 | { | |
224 | for (; __first1 != __last1; ++__first1, ++__first2) | |
225 | __f(*__first1, *__first2); | |
226 | return __first2; | |
227 | } | |
228 | ||
229 | template <class _RandomAccessIterator1, class _RandomAccessIterator2, class _Function> | |
230 | _RandomAccessIterator2 | |
231 | __brick_walk2(_RandomAccessIterator1 __first1, _RandomAccessIterator1 __last1, _RandomAccessIterator2 __first2, | |
232 | _Function __f, | |
233 | /*vector=*/std::true_type) noexcept | |
234 | { | |
235 | return __unseq_backend::__simd_walk_2(__first1, __last1 - __first1, __first2, __f); | |
236 | } | |
237 | ||
238 | template <class _ForwardIterator1, class _Size, class _ForwardIterator2, class _Function> | |
239 | _ForwardIterator2 | |
240 | __brick_walk2_n(_ForwardIterator1 __first1, _Size __n, _ForwardIterator2 __first2, _Function __f, | |
241 | /*vector=*/std::false_type) noexcept | |
242 | { | |
243 | for (; __n > 0; --__n, ++__first1, ++__first2) | |
244 | __f(*__first1, *__first2); | |
245 | return __first2; | |
246 | } | |
247 | ||
248 | template <class _RandomAccessIterator1, class _Size, class _RandomAccessIterator2, class _Function> | |
249 | _RandomAccessIterator2 | |
250 | __brick_walk2_n(_RandomAccessIterator1 __first1, _Size __n, _RandomAccessIterator2 __first2, _Function __f, | |
251 | /*vector=*/std::true_type) noexcept | |
252 | { | |
253 | return __unseq_backend::__simd_walk_2(__first1, __n, __first2, __f); | |
254 | } | |
255 | ||
256 | template <class _Tag, class _ExecutionPolicy, class _ForwardIterator1, class _ForwardIterator2, class _Function> | |
257 | _ForwardIterator2 | |
258 | __pattern_walk2(_Tag, _ExecutionPolicy&&, _ForwardIterator1 __first1, _ForwardIterator1 __last1, | |
259 | _ForwardIterator2 __first2, _Function __f) noexcept | |
260 | { | |
261 | return __internal::__brick_walk2(__first1, __last1, __first2, __f, typename _Tag::__is_vector{}); | |
262 | } | |
263 | ||
264 | template <class _IsVector, class _ExecutionPolicy, class _RandomAccessIterator1, class _RandomAccessIterator2, | |
265 | class _Function> | |
266 | _RandomAccessIterator2 | |
267 | __pattern_walk2(__parallel_tag<_IsVector> __tag, _ExecutionPolicy&& __exec, _RandomAccessIterator1 __first1, | |
268 | _RandomAccessIterator1 __last1, _RandomAccessIterator2 __first2, _Function __f) | |
269 | { | |
270 | using __backend_tag = typename decltype(__tag)::__backend_tag; | |
271 | ||
272 | return __internal::__except_handler( | |
273 | [&]() | |
274 | { | |
275 | __par_backend::__parallel_for( | |
276 | __backend_tag{}, std::forward<_ExecutionPolicy>(__exec), __first1, __last1, | |
277 | [__f, __first1, __first2](_RandomAccessIterator1 __i, _RandomAccessIterator1 __j) | |
278 | { __internal::__brick_walk2(__i, __j, __first2 + (__i - __first1), __f, _IsVector{}); }); | |
279 | return __first2 + (__last1 - __first1); | |
280 | }); | |
281 | } | |
282 | ||
283 | template <class _Tag, class _ExecutionPolicy, class _ForwardIterator1, class _Size, class _ForwardIterator2, | |
284 | class _Function> | |
285 | _ForwardIterator2 | |
286 | __pattern_walk2_n(_Tag, _ExecutionPolicy&&, _ForwardIterator1 __first1, _Size __n, _ForwardIterator2 __first2, | |
287 | _Function __f) noexcept | |
288 | { | |
289 | return __internal::__brick_walk2_n(__first1, __n, __first2, __f, typename _Tag::__is_vector{}); | |
290 | } | |
291 | ||
292 | template <class _IsVector, class _ExecutionPolicy, class _RandomAccessIterator1, class _Size, | |
293 | class _RandomAccessIterator2, class _Function> | |
294 | _RandomAccessIterator2 | |
295 | __pattern_walk2_n(__parallel_tag<_IsVector> __tag, _ExecutionPolicy&& __exec, _RandomAccessIterator1 __first1, | |
296 | _Size __n, _RandomAccessIterator2 __first2, _Function __f) | |
297 | { | |
298 | return __internal::__pattern_walk2(__tag, std::forward<_ExecutionPolicy>(__exec), __first1, __first1 + __n, | |
299 | __first2, __f); | |
300 | } | |
301 | ||
302 | template <class _Tag, class _ExecutionPolicy, class _ForwardIterator1, class _ForwardIterator2, class _Brick> | |
303 | _ForwardIterator2 | |
304 | __pattern_walk2_brick(_Tag, _ExecutionPolicy&&, _ForwardIterator1 __first1, _ForwardIterator1 __last1, | |
305 | _ForwardIterator2 __first2, _Brick __brick) noexcept | |
306 | { | |
307 | return __brick(__first1, __last1, __first2); | |
308 | } | |
309 | ||
310 | template <class _IsVector, class _ExecutionPolicy, class _RandomAccessIterator1, class _RandomAccessIterator2, | |
311 | class _Brick> | |
312 | _RandomAccessIterator2 | |
313 | __pattern_walk2_brick(__parallel_tag<_IsVector> __tag, _ExecutionPolicy&& __exec, _RandomAccessIterator1 __first1, | |
314 | _RandomAccessIterator1 __last1, _RandomAccessIterator2 __first2, _Brick __brick) | |
315 | { | |
316 | using __backend_tag = typename decltype(__tag)::__backend_tag; | |
317 | ||
318 | return __internal::__except_handler( | |
319 | [&]() | |
320 | { | |
321 | __par_backend::__parallel_for( | |
322 | __backend_tag{}, std::forward<_ExecutionPolicy>(__exec), __first1, __last1, | |
323 | [__first1, __first2, __brick](_RandomAccessIterator1 __i, _RandomAccessIterator1 __j) | |
324 | { __brick(__i, __j, __first2 + (__i - __first1)); }); | |
325 | return __first2 + (__last1 - __first1); | |
326 | }); | |
327 | } | |
328 | ||
329 | template <class _Tag, class _ExecutionPolicy, class _ForwardIterator1, class _Size, class _ForwardIterator2, | |
330 | class _Brick> | |
331 | _ForwardIterator2 | |
332 | __pattern_walk2_brick_n(_Tag, _ExecutionPolicy&&, _ForwardIterator1 __first1, _Size __n, _ForwardIterator2 __first2, | |
333 | _Brick __brick) noexcept | |
334 | { | |
335 | return __brick(__first1, __n, __first2); | |
336 | } | |
337 | ||
338 | template <class _IsVector, class _ExecutionPolicy, class _RandomAccessIterator1, class _Size, | |
339 | class _RandomAccessIterator2, class _Brick> | |
340 | _RandomAccessIterator2 | |
341 | __pattern_walk2_brick_n(__parallel_tag<_IsVector> __tag, _ExecutionPolicy&& __exec, _RandomAccessIterator1 __first1, | |
342 | _Size __n, _RandomAccessIterator2 __first2, _Brick __brick) | |
343 | { | |
344 | using __backend_tag = typename decltype(__tag)::__backend_tag; | |
345 | ||
346 | return __internal::__except_handler( | |
347 | [&]() | |
348 | { | |
349 | __par_backend::__parallel_for( | |
350 | __backend_tag{}, std::forward<_ExecutionPolicy>(__exec), __first1, __first1 + __n, | |
351 | [__first1, __first2, __brick](_RandomAccessIterator1 __i, _RandomAccessIterator1 __j) | |
352 | { __brick(__i, __j - __i, __first2 + (__i - __first1)); }); | |
353 | return __first2 + __n; | |
354 | }); | |
355 | } | |
356 | ||
357 | //------------------------------------------------------------------------ | |
358 | // walk3 (pseudo) | |
359 | // | |
360 | // walk3 evaluates f(x,y,z) for (x,y,z) drawn from [first1,last1), [first2,...), [first3,...) | |
361 | //------------------------------------------------------------------------ | |
362 | template <class _ForwardIterator1, class _ForwardIterator2, class _ForwardIterator3, class _Function> | |
363 | _ForwardIterator3 | |
364 | __brick_walk3(_ForwardIterator1 __first1, _ForwardIterator1 __last1, _ForwardIterator2 __first2, | |
365 | _ForwardIterator3 __first3, _Function __f, /*vector=*/std::false_type) noexcept | |
366 | { | |
367 | for (; __first1 != __last1; ++__first1, ++__first2, ++__first3) | |
368 | __f(*__first1, *__first2, *__first3); | |
369 | return __first3; | |
370 | } | |
371 | ||
372 | template <class _RandomAccessIterator1, class _RandomAccessIterator2, class _RandomAccessIterator3, class _Function> | |
373 | _RandomAccessIterator3 | |
374 | __brick_walk3(_RandomAccessIterator1 __first1, _RandomAccessIterator1 __last1, _RandomAccessIterator2 __first2, | |
375 | _RandomAccessIterator3 __first3, _Function __f, /*vector=*/std::true_type) noexcept | |
376 | { | |
377 | return __unseq_backend::__simd_walk_3(__first1, __last1 - __first1, __first2, __first3, __f); | |
378 | } | |
379 | ||
380 | template <class _Tag, class _ExecutionPolicy, class _ForwardIterator1, class _ForwardIterator2, class _ForwardIterator3, | |
381 | class _Function> | |
382 | _ForwardIterator3 | |
383 | __pattern_walk3(_Tag, _ExecutionPolicy&&, _ForwardIterator1 __first1, _ForwardIterator1 __last1, | |
384 | _ForwardIterator2 __first2, _ForwardIterator3 __first3, _Function __f) noexcept | |
385 | { | |
386 | return __internal::__brick_walk3(__first1, __last1, __first2, __first3, __f, typename _Tag::__is_vector{}); | |
387 | } | |
388 | ||
389 | template <class _IsVector, class _ExecutionPolicy, class _RandomAccessIterator1, class _RandomAccessIterator2, | |
390 | class _RandomAccessIterator3, class _Function> | |
391 | _RandomAccessIterator3 | |
392 | __pattern_walk3(__parallel_tag<_IsVector> __tag, _ExecutionPolicy&& __exec, _RandomAccessIterator1 __first1, | |
393 | _RandomAccessIterator1 __last1, _RandomAccessIterator2 __first2, _RandomAccessIterator3 __first3, | |
394 | _Function __f) | |
395 | { | |
396 | using __backend_tag = typename decltype(__tag)::__backend_tag; | |
397 | ||
398 | return __internal::__except_handler( | |
399 | [&]() | |
400 | { | |
401 | __par_backend::__parallel_for( | |
402 | __backend_tag{}, std::forward<_ExecutionPolicy>(__exec), __first1, __last1, | |
403 | [__f, __first1, __first2, __first3](_RandomAccessIterator1 __i, _RandomAccessIterator1 __j) { | |
404 | __internal::__brick_walk3(__i, __j, __first2 + (__i - __first1), __first3 + (__i - __first1), __f, | |
405 | _IsVector{}); | |
406 | }); | |
407 | return __first3 + (__last1 - __first1); | |
408 | }); | |
409 | } | |
410 | ||
411 | //------------------------------------------------------------------------ | |
412 | // equal | |
413 | //------------------------------------------------------------------------ | |
414 | ||
415 | template <class _ForwardIterator1, class _ForwardIterator2, class _BinaryPredicate> | |
416 | bool | |
417 | __brick_equal(_ForwardIterator1 __first1, _ForwardIterator1 __last1, _ForwardIterator2 __first2, | |
418 | _ForwardIterator2 __last2, _BinaryPredicate __p, /* IsVector = */ std::false_type) noexcept | |
419 | { | |
420 | return std::equal(__first1, __last1, __first2, __last2, __p); | |
421 | } | |
422 | ||
423 | template <class _RandomAccessIterator1, class _RandomAccessIterator2, class _BinaryPredicate> | |
424 | bool | |
425 | __brick_equal(_RandomAccessIterator1 __first1, _RandomAccessIterator1 __last1, _RandomAccessIterator2 __first2, | |
426 | _RandomAccessIterator2 __last2, _BinaryPredicate __p, /* is_vector = */ std::true_type) noexcept | |
427 | { | |
428 | if (__last1 - __first1 != __last2 - __first2) | |
429 | return false; | |
430 | ||
431 | return __unseq_backend::__simd_first(__first1, __last1 - __first1, __first2, std::not_fn(__p)).first == __last1; | |
432 | } | |
433 | ||
434 | template <class _Tag, class _ExecutionPolicy, class _ForwardIterator1, class _ForwardIterator2, class _BinaryPredicate> | |
435 | bool | |
436 | __pattern_equal(_Tag, _ExecutionPolicy&&, _ForwardIterator1 __first1, _ForwardIterator1 __last1, | |
437 | _ForwardIterator2 __first2, _ForwardIterator2 __last2, _BinaryPredicate __p) noexcept | |
438 | { | |
439 | return __internal::__brick_equal(__first1, __last1, __first2, __last2, __p, typename _Tag::__is_vector{}); | |
440 | } | |
441 | ||
442 | template <class _IsVector, class _ExecutionPolicy, class _RandomAccessIterator1, class _RandomAccessIterator2, | |
443 | class _BinaryPredicate> | |
444 | bool | |
445 | __pattern_equal(__parallel_tag<_IsVector> __tag, _ExecutionPolicy&& __exec, _RandomAccessIterator1 __first1, | |
446 | _RandomAccessIterator1 __last1, _RandomAccessIterator2 __first2, _RandomAccessIterator2 __last2, | |
447 | _BinaryPredicate __p) | |
448 | { | |
449 | using __backend_tag = typename decltype(__tag)::__backend_tag; | |
450 | ||
451 | if (__last1 - __first1 != __last2 - __first2) | |
452 | return false; | |
453 | ||
454 | return __internal::__except_handler( | |
455 | [&]() | |
456 | { | |
457 | return !__internal::__parallel_or( | |
458 | __backend_tag{}, std::forward<_ExecutionPolicy>(__exec), __first1, __last1, | |
459 | [__first1, __first2, __p](_RandomAccessIterator1 __i, _RandomAccessIterator1 __j) | |
460 | { | |
461 | return !__internal::__brick_equal(__i, __j, __first2 + (__i - __first1), | |
462 | __first2 + (__j - __first1), __p, _IsVector{}); | |
463 | }); | |
464 | }); | |
465 | } | |
466 | ||
467 | //------------------------------------------------------------------------ | |
468 | // equal version for sequences with equal length | |
469 | //------------------------------------------------------------------------ | |
470 | ||
471 | template <class _ForwardIterator1, class _ForwardIterator2, class _BinaryPredicate> | |
472 | bool | |
473 | __brick_equal(_ForwardIterator1 __first1, _ForwardIterator1 __last1, _ForwardIterator2 __first2, _BinaryPredicate __p, | |
474 | /* IsVector = */ std::false_type) noexcept | |
475 | { | |
476 | return std::equal(__first1, __last1, __first2, __p); | |
477 | } | |
478 | ||
479 | template <class _RandomAccessIterator1, class _RandomAccessIterator2, class _BinaryPredicate> | |
480 | bool | |
481 | __brick_equal(_RandomAccessIterator1 __first1, _RandomAccessIterator1 __last1, _RandomAccessIterator2 __first2, | |
482 | _BinaryPredicate __p, /* is_vector = */ std::true_type) noexcept | |
483 | { | |
484 | return __unseq_backend::__simd_first(__first1, __last1 - __first1, __first2, std::not_fn(__p)).first == __last1; | |
485 | } | |
486 | ||
487 | template <class _Tag, class _ExecutionPolicy, class _ForwardIterator1, class _ForwardIterator2, class _BinaryPredicate> | |
488 | bool | |
489 | __pattern_equal(_Tag, _ExecutionPolicy&&, _ForwardIterator1 __first1, _ForwardIterator1 __last1, | |
490 | _ForwardIterator2 __first2, _BinaryPredicate __p) noexcept | |
491 | { | |
492 | return __internal::__brick_equal(__first1, __last1, __first2, __p, typename _Tag::__is_vector{}); | |
493 | } | |
494 | ||
495 | template <class _IsVector, class _ExecutionPolicy, class _RandomAccessIterator1, class _RandomAccessIterator2, | |
496 | class _BinaryPredicate> | |
497 | bool | |
498 | __pattern_equal(__parallel_tag<_IsVector> __tag, _ExecutionPolicy&& __exec, _RandomAccessIterator1 __first1, | |
499 | _RandomAccessIterator1 __last1, _RandomAccessIterator2 __first2, _BinaryPredicate __p) | |
500 | { | |
501 | using __backend_tag = typename decltype(__tag)::__backend_tag; | |
502 | ||
503 | return __internal::__except_handler( | |
504 | [&]() | |
505 | { | |
506 | return !__internal::__parallel_or( | |
507 | __backend_tag{}, std::forward<_ExecutionPolicy>(__exec), __first1, __last1, | |
508 | [__first1, __first2, __p](_RandomAccessIterator1 __i, _RandomAccessIterator1 __j) | |
509 | { return !__internal::__brick_equal(__i, __j, __first2 + (__i - __first1), __p, _IsVector{}); }); | |
510 | }); | |
511 | } | |
512 | ||
513 | //------------------------------------------------------------------------ | |
514 | // find_if | |
515 | //------------------------------------------------------------------------ | |
516 | template <class _ForwardIterator, class _Predicate> | |
517 | _ForwardIterator | |
518 | __brick_find_if(_ForwardIterator __first, _ForwardIterator __last, _Predicate __pred, | |
519 | /*is_vector=*/std::false_type) noexcept | |
520 | { | |
521 | return std::find_if(__first, __last, __pred); | |
522 | } | |
523 | ||
524 | template <class _RandomAccessIterator, class _Predicate> | |
525 | _RandomAccessIterator | |
526 | __brick_find_if(_RandomAccessIterator __first, _RandomAccessIterator __last, _Predicate __pred, | |
527 | /*is_vector=*/std::true_type) noexcept | |
528 | { | |
529 | typedef typename std::iterator_traits<_RandomAccessIterator>::difference_type _SizeType; | |
530 | return __unseq_backend::__simd_first( | |
531 | __first, _SizeType(0), __last - __first, | |
532 | [&__pred](_RandomAccessIterator __it, _SizeType __i) { return __pred(__it[__i]); }); | |
533 | } | |
534 | ||
535 | template <class _Tag, class _ExecutionPolicy, class _ForwardIterator, class _Predicate> | |
536 | _ForwardIterator | |
537 | __pattern_find_if(_Tag __tag, _ExecutionPolicy&&, _ForwardIterator __first, _ForwardIterator __last, | |
538 | _Predicate __pred) noexcept | |
539 | { | |
540 | return __internal::__brick_find_if(__first, __last, __pred, typename _Tag::__is_vector{}); | |
541 | } | |
542 | ||
543 | template <class _IsVector, class _ExecutionPolicy, class _RandomAccessIterator, class _Predicate> | |
544 | _RandomAccessIterator | |
545 | __pattern_find_if(__parallel_tag<_IsVector> __tag, _ExecutionPolicy&& __exec, _RandomAccessIterator __first, | |
546 | _RandomAccessIterator __last, _Predicate __pred) | |
547 | { | |
548 | using __backend_tag = typename decltype(__tag)::__backend_tag; | |
549 | ||
550 | return __internal::__except_handler( | |
551 | [&]() | |
552 | { | |
553 | return __internal::__parallel_find( | |
554 | __backend_tag{}, std::forward<_ExecutionPolicy>(__exec), __first, __last, | |
555 | [__pred](_RandomAccessIterator __i, _RandomAccessIterator __j) | |
556 | { return __internal::__brick_find_if(__i, __j, __pred, _IsVector{}); }, | |
557 | std::less<typename std::iterator_traits<_RandomAccessIterator>::difference_type>(), | |
558 | /*is_first=*/true); | |
559 | }); | |
560 | } | |
561 | ||
562 | //------------------------------------------------------------------------ | |
563 | // find_end | |
564 | //------------------------------------------------------------------------ | |
565 | ||
566 | // find the first occurrence of the subsequence [s_first, s_last) | |
567 | // or the last occurrence of the subsequence in the range [first, last) | |
568 | // b_first determines what occurrence we want to find (first or last) | |
569 | template <class _RandomAccessIterator1, class _RandomAccessIterator2, class _BinaryPredicate, class _IsVector> | |
570 | _RandomAccessIterator1 | |
571 | __find_subrange(_RandomAccessIterator1 __first, _RandomAccessIterator1 __last, _RandomAccessIterator1 __global_last, | |
572 | _RandomAccessIterator2 __s_first, _RandomAccessIterator2 __s_last, _BinaryPredicate __pred, | |
573 | bool __b_first, _IsVector __is_vector) noexcept | |
574 | { | |
575 | typedef typename std::iterator_traits<_RandomAccessIterator2>::value_type _ValueType; | |
576 | auto __n2 = __s_last - __s_first; | |
577 | if (__n2 < 1) | |
578 | { | |
579 | return __b_first ? __first : __last; | |
580 | } | |
581 | ||
582 | auto __n1 = __global_last - __first; | |
583 | if (__n1 < __n2) | |
584 | { | |
585 | return __last; | |
586 | } | |
587 | ||
588 | auto __cur = __last; | |
589 | while (__first != __last && (__global_last - __first >= __n2)) | |
590 | { | |
591 | // find position of *s_first in [first, last) (it can be start of subsequence) | |
592 | __first = __internal::__brick_find_if( | |
593 | __first, __last, __equal_value_by_pred<_ValueType, _BinaryPredicate>(*__s_first, __pred), __is_vector); | |
594 | ||
595 | // if position that was found previously is the start of subsequence | |
596 | // then we can exit the loop (b_first == true) or keep the position | |
597 | // (b_first == false) | |
598 | if (__first != __last && (__global_last - __first >= __n2) && | |
599 | __internal::__brick_equal(__s_first + 1, __s_last, __first + 1, __pred, __is_vector)) | |
600 | { | |
601 | if (__b_first) | |
602 | { | |
603 | return __first; | |
604 | } | |
605 | else | |
606 | { | |
607 | __cur = __first; | |
608 | } | |
609 | } | |
610 | else if (__first == __last) | |
611 | { | |
612 | break; | |
613 | } | |
614 | else | |
615 | { | |
616 | } | |
617 | ||
618 | // in case of b_first == false we try to find new start position | |
619 | // for the next subsequence | |
620 | ++__first; | |
621 | } | |
622 | return __cur; | |
623 | } | |
624 | ||
625 | template <class _RandomAccessIterator, class _Size, class _Tp, class _BinaryPredicate, class _IsVector> | |
626 | _RandomAccessIterator | |
627 | __find_subrange(_RandomAccessIterator __first, _RandomAccessIterator __last, _RandomAccessIterator __global_last, | |
628 | _Size __count, const _Tp& __value, _BinaryPredicate __pred, _IsVector __is_vector) noexcept | |
629 | { | |
630 | if (static_cast<_Size>(__global_last - __first) < __count || __count < 1) | |
631 | { | |
632 | return __last; // According to the standard last shall be returned when count < 1 | |
633 | } | |
634 | ||
635 | auto __unary_pred = __equal_value_by_pred<_Tp, _BinaryPredicate>(__value, __pred); | |
636 | while (__first != __last && (static_cast<_Size>(__global_last - __first) >= __count)) | |
637 | { | |
638 | __first = __internal::__brick_find_if(__first, __last, __unary_pred, __is_vector); | |
639 | ||
640 | // check that all of elements in [first+1, first+count) equal to value | |
641 | if (__first != __last && (static_cast<_Size>(__global_last - __first) >= __count) && | |
642 | !__internal::__brick_any_of(__first + 1, __first + __count, std::not_fn(__unary_pred), __is_vector)) | |
643 | { | |
644 | return __first; | |
645 | } | |
646 | else if (__first == __last) | |
647 | { | |
648 | break; | |
649 | } | |
650 | else | |
651 | { | |
652 | ++__first; | |
653 | } | |
654 | } | |
655 | return __last; | |
656 | } | |
657 | ||
658 | template <class _ForwardIterator1, class _ForwardIterator2, class _BinaryPredicate> | |
659 | _ForwardIterator1 | |
660 | __brick_find_end(_ForwardIterator1 __first, _ForwardIterator1 __last, _ForwardIterator2 __s_first, | |
661 | _ForwardIterator2 __s_last, _BinaryPredicate __pred, /*__is_vector=*/std::false_type) noexcept | |
662 | { | |
663 | return std::find_end(__first, __last, __s_first, __s_last, __pred); | |
664 | } | |
665 | ||
666 | template <class _RandomAccessIterator1, class _RandomAccessIterator2, class _BinaryPredicate> | |
667 | _RandomAccessIterator1 | |
668 | __brick_find_end(_RandomAccessIterator1 __first, _RandomAccessIterator1 __last, _RandomAccessIterator2 __s_first, | |
669 | _RandomAccessIterator2 __s_last, _BinaryPredicate __pred, /*__is_vector=*/std::true_type) noexcept | |
670 | { | |
671 | return __find_subrange(__first, __last, __last, __s_first, __s_last, __pred, false, std::true_type()); | |
672 | } | |
673 | ||
674 | template <class _Tag, class _ExecutionPolicy, class _ForwardIterator1, class _ForwardIterator2, class _BinaryPredicate> | |
675 | _ForwardIterator1 | |
676 | __pattern_find_end(_Tag, _ExecutionPolicy&&, _ForwardIterator1 __first, _ForwardIterator1 __last, | |
677 | _ForwardIterator2 __s_first, _ForwardIterator2 __s_last, _BinaryPredicate __pred) noexcept | |
678 | { | |
679 | return __internal::__brick_find_end(__first, __last, __s_first, __s_last, __pred, typename _Tag::__is_vector{}); | |
680 | } | |
681 | ||
682 | template <class _IsVector, class _ExecutionPolicy, class _RandomAccessIterator1, class _RandomAccessIterator2, | |
683 | class _BinaryPredicate> | |
684 | _RandomAccessIterator1 | |
685 | __pattern_find_end(__parallel_tag<_IsVector> __tag, _ExecutionPolicy&& __exec, _RandomAccessIterator1 __first, | |
686 | _RandomAccessIterator1 __last, _RandomAccessIterator2 __s_first, _RandomAccessIterator2 __s_last, | |
687 | _BinaryPredicate __pred) noexcept | |
688 | { | |
689 | using __backend_tag = typename decltype(__tag)::__backend_tag; | |
690 | ||
691 | if (__last - __first == __s_last - __s_first) | |
692 | { | |
693 | const bool __res = __internal::__pattern_equal(__tag, std::forward<_ExecutionPolicy>(__exec), __first, __last, | |
694 | __s_first, __pred); | |
695 | return __res ? __first : __last; | |
696 | } | |
697 | else | |
698 | { | |
699 | return __internal::__except_handler( | |
700 | [&]() | |
701 | { | |
702 | return __internal::__parallel_find( | |
703 | __backend_tag{}, std::forward<_ExecutionPolicy>(__exec), __first, __last, | |
704 | [__last, __s_first, __s_last, __pred](_RandomAccessIterator1 __i, _RandomAccessIterator1 __j) { | |
705 | return __internal::__find_subrange(__i, __j, __last, __s_first, __s_last, __pred, false, | |
706 | _IsVector{}); | |
707 | }, | |
708 | std::greater<typename std::iterator_traits<_RandomAccessIterator1>::difference_type>(), | |
709 | /*is_first=*/false); | |
710 | }); | |
711 | } | |
712 | } | |
713 | ||
714 | //------------------------------------------------------------------------ | |
715 | // find_first_of | |
716 | //------------------------------------------------------------------------ | |
717 | template <class _ForwardIterator1, class _ForwardIterator2, class _BinaryPredicate> | |
718 | _ForwardIterator1 | |
719 | __brick_find_first_of(_ForwardIterator1 __first, _ForwardIterator1 __last, _ForwardIterator2 __s_first, | |
720 | _ForwardIterator2 __s_last, _BinaryPredicate __pred, /*__is_vector=*/std::false_type) noexcept | |
721 | { | |
722 | return std::find_first_of(__first, __last, __s_first, __s_last, __pred); | |
723 | } | |
724 | ||
725 | template <class _RandomAccessIterator1, class _RandomAccessIterator2, class _BinaryPredicate> | |
726 | _RandomAccessIterator1 | |
727 | __brick_find_first_of(_RandomAccessIterator1 __first, _RandomAccessIterator1 __last, _RandomAccessIterator2 __s_first, | |
728 | _RandomAccessIterator2 __s_last, _BinaryPredicate __pred, /*__is_vector=*/std::true_type) noexcept | |
729 | { | |
730 | return __unseq_backend::__simd_find_first_of(__first, __last, __s_first, __s_last, __pred); | |
731 | } | |
732 | ||
733 | template <class _Tag, class _ExecutionPolicy, class _ForwardIterator1, class _ForwardIterator2, class _BinaryPredicate> | |
734 | _ForwardIterator1 | |
735 | __pattern_find_first_of(_Tag, _ExecutionPolicy&&, _ForwardIterator1 __first, _ForwardIterator1 __last, | |
736 | _ForwardIterator2 __s_first, _ForwardIterator2 __s_last, _BinaryPredicate __pred) noexcept | |
737 | { | |
738 | return __internal::__brick_find_first_of(__first, __last, __s_first, __s_last, __pred, | |
739 | typename _Tag::__is_vector{}); | |
740 | } | |
741 | ||
742 | template <class _IsVector, class _ExecutionPolicy, class _RandomAccessIterator1, class _RandomAccessIterator2, | |
743 | class _BinaryPredicate> | |
744 | _RandomAccessIterator1 | |
745 | __pattern_find_first_of(__parallel_tag<_IsVector> __tag, _ExecutionPolicy&& __exec, _RandomAccessIterator1 __first, | |
746 | _RandomAccessIterator1 __last, _RandomAccessIterator2 __s_first, | |
747 | _RandomAccessIterator2 __s_last, _BinaryPredicate __pred) noexcept | |
748 | { | |
749 | using __backend_tag = typename decltype(__tag)::__backend_tag; | |
750 | ||
751 | return __internal::__except_handler( | |
752 | [&]() | |
753 | { | |
754 | return __internal::__parallel_find( | |
755 | __backend_tag{}, std::forward<_ExecutionPolicy>(__exec), __first, __last, | |
756 | [__s_first, __s_last, __pred](_RandomAccessIterator1 __i, _RandomAccessIterator1 __j) | |
757 | { return __internal::__brick_find_first_of(__i, __j, __s_first, __s_last, __pred, _IsVector{}); }, | |
758 | std::less<typename std::iterator_traits<_RandomAccessIterator1>::difference_type>(), /*is_first=*/true); | |
759 | }); | |
760 | } | |
761 | ||
762 | //------------------------------------------------------------------------ | |
763 | // search | |
764 | //------------------------------------------------------------------------ | |
765 | template <class _RandomAccessIterator1, class _RandomAccessIterator2, class _BinaryPredicate> | |
766 | _RandomAccessIterator1 | |
767 | __brick_search(_RandomAccessIterator1 __first, _RandomAccessIterator1 __last, _RandomAccessIterator2 __s_first, | |
768 | _RandomAccessIterator2 __s_last, _BinaryPredicate __pred, /*vector=*/std::false_type) noexcept | |
769 | { | |
770 | return std::search(__first, __last, __s_first, __s_last, __pred); | |
771 | } | |
772 | ||
773 | template <class _RandomAccessIterator1, class _RandomAccessIterator2, class _BinaryPredicate> | |
774 | _RandomAccessIterator1 | |
775 | __brick_search(_RandomAccessIterator1 __first, _RandomAccessIterator1 __last, _RandomAccessIterator2 __s_first, | |
776 | _RandomAccessIterator2 __s_last, _BinaryPredicate __pred, /*vector=*/std::true_type) noexcept | |
777 | { | |
778 | return __internal::__find_subrange(__first, __last, __last, __s_first, __s_last, __pred, true, std::true_type()); | |
779 | } | |
780 | ||
781 | template <class _Tag, class _ExecutionPolicy, class _ForwardIterator1, class _ForwardIterator2, class _BinaryPredicate> | |
782 | _ForwardIterator1 | |
783 | __pattern_search(_Tag, _ExecutionPolicy&&, _ForwardIterator1 __first, _ForwardIterator1 __last, | |
784 | _ForwardIterator2 __s_first, _ForwardIterator2 __s_last, _BinaryPredicate __pred) noexcept | |
785 | { | |
786 | return __internal::__brick_search(__first, __last, __s_first, __s_last, __pred, typename _Tag::__is_vector{}); | |
787 | } | |
788 | ||
789 | template <class _IsVector, class _ExecutionPolicy, class _RandomAccessIterator1, class _RandomAccessIterator2, | |
790 | class _BinaryPredicate> | |
791 | _RandomAccessIterator1 | |
792 | __pattern_search(__parallel_tag<_IsVector> __tag, _ExecutionPolicy&& __exec, _RandomAccessIterator1 __first, | |
793 | _RandomAccessIterator1 __last, _RandomAccessIterator2 __s_first, _RandomAccessIterator2 __s_last, | |
794 | _BinaryPredicate __pred) noexcept | |
795 | { | |
796 | using __backend_tag = typename decltype(__tag)::__backend_tag; | |
797 | ||
798 | if (__last - __first == __s_last - __s_first) | |
799 | { | |
800 | const bool __res = __internal::__pattern_equal(__tag, std::forward<_ExecutionPolicy>(__exec), __first, __last, | |
801 | __s_first, __pred); | |
802 | return __res ? __first : __last; | |
803 | } | |
804 | else | |
805 | { | |
806 | return __internal::__except_handler( | |
807 | [&]() | |
808 | { | |
809 | return __internal::__parallel_find( | |
810 | __backend_tag{}, std::forward<_ExecutionPolicy>(__exec), __first, __last, | |
811 | [__last, __s_first, __s_last, __pred](_RandomAccessIterator1 __i, _RandomAccessIterator1 __j) { | |
812 | return __internal::__find_subrange(__i, __j, __last, __s_first, __s_last, __pred, true, | |
813 | _IsVector{}); | |
814 | }, | |
815 | std::less<typename std::iterator_traits<_RandomAccessIterator1>::difference_type>(), | |
816 | /*is_first=*/true); | |
817 | }); | |
818 | } | |
819 | } | |
820 | ||
821 | //------------------------------------------------------------------------ | |
822 | // search_n | |
823 | //------------------------------------------------------------------------ | |
824 | template <class _ForwardIterator, class _Size, class _Tp, class _BinaryPredicate> | |
825 | _ForwardIterator | |
826 | __brick_search_n(_ForwardIterator __first, _ForwardIterator __last, _Size __count, const _Tp& __value, | |
827 | _BinaryPredicate __pred, /*vector=*/std::false_type) noexcept | |
828 | { | |
829 | return std::search_n(__first, __last, __count, __value, __pred); | |
830 | } | |
831 | ||
832 | template <class _RandomAccessIterator, class _Size, class _Tp, class _BinaryPredicate> | |
833 | _RandomAccessIterator | |
834 | __brick_search_n(_RandomAccessIterator __first, _RandomAccessIterator __last, _Size __count, const _Tp& __value, | |
835 | _BinaryPredicate __pred, /*vector=*/std::true_type) noexcept | |
836 | { | |
837 | return __internal::__find_subrange(__first, __last, __last, __count, __value, __pred, std::true_type()); | |
838 | } | |
839 | ||
840 | template <class _Tag, class _ExecutionPolicy, class _ForwardIterator, class _Size, class _Tp, class _BinaryPredicate> | |
841 | _ForwardIterator | |
842 | __pattern_search_n(_Tag, _ExecutionPolicy&&, _ForwardIterator __first, _ForwardIterator __last, _Size __count, | |
843 | const _Tp& __value, _BinaryPredicate __pred) noexcept | |
844 | { | |
845 | return __internal::__brick_search_n(__first, __last, __count, __value, __pred, typename _Tag::__is_vector{}); | |
846 | } | |
847 | ||
848 | template <class _IsVector, class _ExecutionPolicy, class _RandomAccessIterator, class _Size, class _Tp, | |
849 | class _BinaryPredicate> | |
850 | _RandomAccessIterator | |
851 | __pattern_search_n(__parallel_tag<_IsVector> __tag, _ExecutionPolicy&& __exec, _RandomAccessIterator __first, | |
852 | _RandomAccessIterator __last, _Size __count, const _Tp& __value, _BinaryPredicate __pred) noexcept | |
853 | { | |
854 | using __backend_tag = typename decltype(__tag)::__backend_tag; | |
855 | ||
856 | if (static_cast<_Size>(__last - __first) == __count) | |
857 | { | |
858 | const bool __result = | |
859 | !__internal::__pattern_any_of(__tag, std::forward<_ExecutionPolicy>(__exec), __first, __last, | |
860 | [&__value, &__pred](const _Tp& __val) { return !__pred(__val, __value); }); | |
861 | return __result ? __first : __last; | |
862 | } | |
863 | else | |
864 | { | |
865 | return __internal::__except_handler( | |
866 | [&__exec, __first, __last, __count, &__value, __pred]() | |
867 | { | |
868 | return __internal::__parallel_find( | |
869 | __backend_tag{}, std::forward<_ExecutionPolicy>(__exec), __first, __last, | |
870 | [__last, __count, &__value, __pred](_RandomAccessIterator __i, _RandomAccessIterator __j) | |
871 | { return __internal::__find_subrange(__i, __j, __last, __count, __value, __pred, _IsVector{}); }, | |
872 | std::less<typename std::iterator_traits<_RandomAccessIterator>::difference_type>(), | |
873 | /*is_first=*/true); | |
874 | }); | |
875 | } | |
876 | } | |
877 | ||
878 | //------------------------------------------------------------------------ | |
879 | // copy_n | |
880 | //------------------------------------------------------------------------ | |
881 | ||
882 | template <class _ForwardIterator, class _Size, class _OutputIterator> | |
883 | _OutputIterator | |
884 | __brick_copy_n(_ForwardIterator __first, _Size __n, _OutputIterator __result, /*vector=*/std::false_type) noexcept | |
885 | { | |
886 | return std::copy_n(__first, __n, __result); | |
887 | } | |
888 | ||
889 | template <class _RandomAccessIterator1, class _Size, class _RandomAccessIterator2> | |
890 | _RandomAccessIterator2 | |
891 | __brick_copy_n(_RandomAccessIterator1 __first, _Size __n, _RandomAccessIterator2 __result, | |
892 | /*vector=*/std::true_type) noexcept | |
893 | { | |
894 | return __unseq_backend::__simd_assign( | |
895 | __first, __n, __result, | |
896 | [](_RandomAccessIterator1 __first, _RandomAccessIterator2 __result) { *__result = *__first; }); | |
897 | } | |
898 | ||
899 | //------------------------------------------------------------------------ | |
900 | // copy | |
901 | //------------------------------------------------------------------------ | |
902 | template <class _ForwardIterator, class _OutputIterator> | |
903 | _OutputIterator | |
904 | __brick_copy(_ForwardIterator __first, _ForwardIterator __last, _OutputIterator __result, | |
905 | /*vector=*/std::false_type) noexcept | |
906 | { | |
907 | return std::copy(__first, __last, __result); | |
908 | } | |
909 | ||
910 | template <class _RandomAccessIterator1, class _RandomAccessIterator2> | |
911 | _RandomAccessIterator2 | |
912 | __brick_copy(_RandomAccessIterator1 __first, _RandomAccessIterator1 __last, _RandomAccessIterator2 __result, | |
913 | /*vector=*/std::true_type) noexcept | |
914 | { | |
915 | return __unseq_backend::__simd_assign( | |
916 | __first, __last - __first, __result, | |
917 | [](_RandomAccessIterator1 __first, _RandomAccessIterator2 __result) { *__result = *__first; }); | |
918 | } | |
919 | ||
920 | //------------------------------------------------------------------------ | |
921 | // move | |
922 | //------------------------------------------------------------------------ | |
923 | template <class _ForwardIterator, class _OutputIterator> | |
924 | _OutputIterator | |
925 | __brick_move(_ForwardIterator __first, _ForwardIterator __last, _OutputIterator __result, | |
926 | /*vector=*/std::false_type) noexcept | |
927 | { | |
928 | return std::move(__first, __last, __result); | |
929 | } | |
930 | ||
931 | template <class _RandomAccessIterator1, class _RandomAccessIterator2> | |
932 | _RandomAccessIterator2 | |
933 | __brick_move(_RandomAccessIterator1 __first, _RandomAccessIterator1 __last, _RandomAccessIterator2 __result, | |
934 | /*vector=*/std::true_type) noexcept | |
935 | { | |
936 | return __unseq_backend::__simd_assign( | |
937 | __first, __last - __first, __result, | |
938 | [](_RandomAccessIterator1 __first, _RandomAccessIterator2 __result) { *__result = std::move(*__first); }); | |
939 | } | |
940 | ||
941 | struct __brick_move_destroy | |
942 | { | |
943 | template <typename _RandomAccessIterator1, typename _RandomAccessIterator2> | |
944 | _RandomAccessIterator2 | |
945 | operator()(_RandomAccessIterator1 __first, _RandomAccessIterator1 __last, _RandomAccessIterator2 __result, | |
946 | /*vec*/ std::true_type) const | |
947 | { | |
948 | using _IteratorValueType = typename std::iterator_traits<_RandomAccessIterator1>::value_type; | |
949 | ||
950 | return __unseq_backend::__simd_assign(__first, __last - __first, __result, | |
951 | [](_RandomAccessIterator1 __first, _RandomAccessIterator2 __result) { | |
952 | *__result = std::move(*__first); | |
953 | (*__first).~_IteratorValueType(); | |
954 | }); | |
955 | } | |
956 | ||
957 | template <typename _RandomAccessIterator1, typename _RandomAccessIterator2> | |
958 | _RandomAccessIterator2 | |
959 | operator()(_RandomAccessIterator1 __first, _RandomAccessIterator1 __last, _RandomAccessIterator2 __result, | |
960 | /*vec*/ std::false_type) const | |
961 | { | |
962 | using _IteratorValueType = typename std::iterator_traits<_RandomAccessIterator1>::value_type; | |
963 | ||
964 | for (; __first != __last; ++__first, ++__result) | |
965 | { | |
966 | *__result = std::move(*__first); | |
967 | (*__first).~_IteratorValueType(); | |
968 | } | |
969 | return __result; | |
970 | } | |
971 | }; | |
972 | ||
973 | //------------------------------------------------------------------------ | |
974 | // swap_ranges | |
975 | //------------------------------------------------------------------------ | |
976 | template <class _ForwardIterator, class _OutputIterator> | |
977 | _OutputIterator | |
978 | __brick_swap_ranges(_ForwardIterator __first, _ForwardIterator __last, _OutputIterator __result, | |
979 | /*vector=*/std::false_type) noexcept | |
980 | { | |
981 | return std::swap_ranges(__first, __last, __result); | |
982 | } | |
983 | ||
984 | template <class _RandomAccessIterator1, class _RandomAccessIterator2> | |
985 | _RandomAccessIterator2 | |
986 | __brick_swap_ranges(_RandomAccessIterator1 __first, _RandomAccessIterator1 __last, _RandomAccessIterator2 __result, | |
987 | /*vector=*/std::true_type) noexcept | |
988 | { | |
989 | using std::iter_swap; | |
990 | return __unseq_backend::__simd_assign(__first, __last - __first, __result, | |
991 | iter_swap<_RandomAccessIterator1, _RandomAccessIterator2>); | |
992 | } | |
993 | ||
994 | //------------------------------------------------------------------------ | |
995 | // copy_if | |
996 | //------------------------------------------------------------------------ | |
997 | template <class _ForwardIterator, class _OutputIterator, class _UnaryPredicate> | |
998 | _OutputIterator | |
999 | __brick_copy_if(_ForwardIterator __first, _ForwardIterator __last, _OutputIterator __result, _UnaryPredicate __pred, | |
1000 | /*vector=*/std::false_type) noexcept | |
1001 | { | |
1002 | return std::copy_if(__first, __last, __result, __pred); | |
1003 | } | |
1004 | ||
1005 | template <class _RandomAccessIterator1, class _RandomAccessIterator2, class _UnaryPredicate> | |
1006 | _RandomAccessIterator2 | |
1007 | __brick_copy_if(_RandomAccessIterator1 __first, _RandomAccessIterator1 __last, _RandomAccessIterator2 __result, | |
1008 | _UnaryPredicate __pred, | |
1009 | /*vector=*/std::true_type) noexcept | |
1010 | { | |
1011 | #if defined(_PSTL_MONOTONIC_PRESENT) | |
1012 | return __unseq_backend::__simd_copy_if(__first, __last - __first, __result, __pred); | |
1013 | #else | |
1014 | return std::copy_if(__first, __last, __result, __pred); | |
1015 | #endif | |
1016 | } | |
1017 | ||
1018 | // TODO: Try to use transform_reduce for combining __brick_copy_if_phase1 on IsVector. | |
1019 | template <class _DifferenceType, class _ForwardIterator, class _UnaryPredicate> | |
1020 | std::pair<_DifferenceType, _DifferenceType> | |
1021 | __brick_calc_mask_1(_ForwardIterator __first, _ForwardIterator __last, bool* __restrict __mask, _UnaryPredicate __pred, | |
1022 | /*vector=*/std::false_type) noexcept | |
1023 | { | |
1024 | auto __count_true = _DifferenceType(0); | |
1025 | auto __size = __last - __first; | |
1026 | ||
1027 | static_assert(__are_random_access_iterators<_ForwardIterator>::value, | |
1028 | "Pattern-brick error. Should be a random access iterator."); | |
1029 | ||
1030 | for (; __first != __last; ++__first, ++__mask) | |
1031 | { | |
1032 | *__mask = __pred(*__first); | |
1033 | if (*__mask) | |
1034 | { | |
1035 | ++__count_true; | |
1036 | } | |
1037 | } | |
1038 | return std::make_pair(__count_true, __size - __count_true); | |
1039 | } | |
1040 | ||
1041 | template <class _DifferenceType, class _RandomAccessIterator, class _UnaryPredicate> | |
1042 | std::pair<_DifferenceType, _DifferenceType> | |
1043 | __brick_calc_mask_1(_RandomAccessIterator __first, _RandomAccessIterator __last, bool* __mask, _UnaryPredicate __pred, | |
1044 | /*vector=*/std::true_type) noexcept | |
1045 | { | |
1046 | auto __result = __unseq_backend::__simd_calc_mask_1(__first, __last - __first, __mask, __pred); | |
1047 | return std::make_pair(__result, (__last - __first) - __result); | |
1048 | } | |
1049 | ||
1050 | template <class _ForwardIterator, class _OutputIterator, class _Assigner> | |
1051 | void | |
1052 | __brick_copy_by_mask(_ForwardIterator __first, _ForwardIterator __last, _OutputIterator __result, bool* __mask, | |
1053 | _Assigner __assigner, /*vector=*/std::false_type) noexcept | |
1054 | { | |
1055 | for (; __first != __last; ++__first, ++__mask) | |
1056 | { | |
1057 | if (*__mask) | |
1058 | { | |
1059 | __assigner(__first, __result); | |
1060 | ++__result; | |
1061 | } | |
1062 | } | |
1063 | } | |
1064 | ||
1065 | template <class _RandomAccessIterator1, class _RandomAccessIterator2, class _Assigner> | |
1066 | void | |
1067 | __brick_copy_by_mask(_RandomAccessIterator1 __first, _RandomAccessIterator1 __last, _RandomAccessIterator2 __result, | |
1068 | bool* __restrict __mask, _Assigner __assigner, /*vector=*/std::true_type) noexcept | |
1069 | { | |
1070 | #if defined(_PSTL_MONOTONIC_PRESENT) | |
1071 | __unseq_backend::__simd_copy_by_mask(__first, __last - __first, __result, __mask, __assigner); | |
1072 | #else | |
1073 | __internal::__brick_copy_by_mask(__first, __last, __result, __mask, __assigner, std::false_type()); | |
1074 | #endif | |
1075 | } | |
1076 | ||
1077 | template <class _ForwardIterator, class _OutputIterator1, class _OutputIterator2> | |
1078 | void | |
1079 | __brick_partition_by_mask(_ForwardIterator __first, _ForwardIterator __last, _OutputIterator1 __out_true, | |
1080 | _OutputIterator2 __out_false, bool* __mask, /*vector=*/std::false_type) noexcept | |
1081 | { | |
1082 | for (; __first != __last; ++__first, ++__mask) | |
1083 | { | |
1084 | if (*__mask) | |
1085 | { | |
1086 | *__out_true = *__first; | |
1087 | ++__out_true; | |
1088 | } | |
1089 | else | |
1090 | { | |
1091 | *__out_false = *__first; | |
1092 | ++__out_false; | |
1093 | } | |
1094 | } | |
1095 | } | |
1096 | ||
1097 | template <class _RandomAccessIterator1, class _RandomAccessIterator2, class _RandomAccessIterator3> | |
1098 | void | |
1099 | __brick_partition_by_mask(_RandomAccessIterator1 __first, _RandomAccessIterator1 __last, | |
1100 | _RandomAccessIterator2 __out_true, _RandomAccessIterator3 __out_false, bool* __mask, | |
1101 | /*vector=*/std::true_type) noexcept | |
1102 | { | |
1103 | #if defined(_PSTL_MONOTONIC_PRESENT) | |
1104 | __unseq_backend::__simd_partition_by_mask(__first, __last - __first, __out_true, __out_false, __mask); | |
1105 | #else | |
1106 | __internal::__brick_partition_by_mask(__first, __last, __out_true, __out_false, __mask, std::false_type()); | |
1107 | #endif | |
1108 | } | |
1109 | ||
1110 | template <class _Tag, class _ExecutionPolicy, class _ForwardIterator, class _OutputIterator, class _UnaryPredicate> | |
1111 | _OutputIterator | |
1112 | __pattern_copy_if(_Tag, _ExecutionPolicy&&, _ForwardIterator __first, _ForwardIterator __last, _OutputIterator __result, | |
1113 | _UnaryPredicate __pred) noexcept | |
1114 | { | |
1115 | return __internal::__brick_copy_if(__first, __last, __result, __pred, typename _Tag::__is_vector{}); | |
1116 | } | |
1117 | ||
1118 | template <class _IsVector, class _ExecutionPolicy, class _RandomAccessIterator1, class _RandomAccessIterator2, | |
1119 | class _UnaryPredicate> | |
1120 | _RandomAccessIterator2 | |
1121 | __pattern_copy_if(__parallel_tag<_IsVector> __tag, _ExecutionPolicy&& __exec, _RandomAccessIterator1 __first, | |
1122 | _RandomAccessIterator1 __last, _RandomAccessIterator2 __result, _UnaryPredicate __pred) | |
1123 | { | |
1124 | using __backend_tag = typename decltype(__tag)::__backend_tag; | |
1125 | ||
1126 | typedef typename std::iterator_traits<_RandomAccessIterator1>::difference_type _DifferenceType; | |
1127 | const _DifferenceType __n = __last - __first; | |
1128 | if (_DifferenceType(1) < __n) | |
1129 | { | |
1130 | __par_backend::__buffer<bool> __mask_buf(__n); | |
1131 | return __internal::__except_handler( | |
1132 | [&__exec, __n, __first, __result, __pred, &__mask_buf]() | |
1133 | { | |
1134 | bool* __mask = __mask_buf.get(); | |
1135 | _DifferenceType __m{}; | |
1136 | __par_backend::__parallel_strict_scan( | |
1137 | __backend_tag{}, std::forward<_ExecutionPolicy>(__exec), __n, _DifferenceType(0), | |
1138 | [=](_DifferenceType __i, _DifferenceType __len) { // Reduce | |
1139 | return __internal::__brick_calc_mask_1<_DifferenceType>(__first + __i, __first + (__i + __len), | |
1140 | __mask + __i, __pred, _IsVector{}) | |
1141 | .first; | |
1142 | }, | |
1143 | std::plus<_DifferenceType>(), // Combine | |
1144 | [=](_DifferenceType __i, _DifferenceType __len, _DifferenceType __initial) { // Scan | |
1145 | __internal::__brick_copy_by_mask( | |
1146 | __first + __i, __first + (__i + __len), __result + __initial, __mask + __i, | |
1147 | [](_RandomAccessIterator1 __x, _RandomAccessIterator2 __z) { *__z = *__x; }, _IsVector{}); | |
1148 | }, | |
1149 | [&__m](_DifferenceType __total) { __m = __total; }); | |
1150 | return __result + __m; | |
1151 | }); | |
1152 | } | |
1153 | // trivial sequence - use serial algorithm | |
1154 | return __internal::__brick_copy_if(__first, __last, __result, __pred, _IsVector{}); | |
1155 | } | |
1156 | ||
1157 | //------------------------------------------------------------------------ | |
1158 | // count | |
1159 | //------------------------------------------------------------------------ | |
1160 | template <class _RandomAccessIterator, class _Predicate> | |
1161 | typename std::iterator_traits<_RandomAccessIterator>::difference_type | |
1162 | __brick_count(_RandomAccessIterator __first, _RandomAccessIterator __last, _Predicate __pred, | |
1163 | /* is_vector = */ std::true_type) noexcept | |
1164 | { | |
1165 | return __unseq_backend::__simd_count(__first, __last - __first, __pred); | |
1166 | } | |
1167 | ||
1168 | template <class _ForwardIterator, class _Predicate> | |
1169 | typename std::iterator_traits<_ForwardIterator>::difference_type | |
1170 | __brick_count(_ForwardIterator __first, _ForwardIterator __last, _Predicate __pred, | |
1171 | /* is_vector = */ std::false_type) noexcept | |
1172 | { | |
1173 | return std::count_if(__first, __last, __pred); | |
1174 | } | |
1175 | ||
1176 | template <class _Tag, class _ExecutionPolicy, class _ForwardIterator, class _Predicate> | |
1177 | typename std::iterator_traits<_ForwardIterator>::difference_type | |
1178 | __pattern_count(_Tag, _ExecutionPolicy&&, _ForwardIterator __first, _ForwardIterator __last, _Predicate __pred) noexcept | |
1179 | { | |
1180 | return __internal::__brick_count(__first, __last, __pred, typename _Tag::__is_vector{}); | |
1181 | } | |
1182 | ||
1183 | template <class _IsVector, class _ExecutionPolicy, class _RandomAccessIterator, class _Predicate> | |
1184 | typename std::iterator_traits<_RandomAccessIterator>::difference_type | |
1185 | __pattern_count(__parallel_tag<_IsVector> __tag, _ExecutionPolicy&& __exec, _RandomAccessIterator __first, | |
1186 | _RandomAccessIterator __last, _Predicate __pred) | |
1187 | { | |
1188 | using __backend_tag = typename decltype(__tag)::__backend_tag; | |
1189 | ||
1190 | typedef typename std::iterator_traits<_RandomAccessIterator>::difference_type _SizeType; | |
1191 | return __internal::__except_handler( | |
1192 | [&]() | |
1193 | { | |
1194 | return __par_backend::__parallel_reduce( | |
1195 | __backend_tag{}, std::forward<_ExecutionPolicy>(__exec), __first, __last, _SizeType(0), | |
1196 | [__pred](_RandomAccessIterator __begin, _RandomAccessIterator __end, _SizeType __value) -> _SizeType | |
1197 | { return __value + __internal::__brick_count(__begin, __end, __pred, _IsVector{}); }, | |
1198 | std::plus<_SizeType>()); | |
1199 | }); | |
1200 | } | |
1201 | ||
1202 | //------------------------------------------------------------------------ | |
1203 | // unique | |
1204 | //------------------------------------------------------------------------ | |
1205 | ||
1206 | template <class _RandomAccessIterator, class _BinaryPredicate> | |
1207 | _RandomAccessIterator | |
1208 | __brick_unique(_RandomAccessIterator __first, _RandomAccessIterator __last, _BinaryPredicate __pred, | |
1209 | /*is_vector=*/std::false_type) noexcept | |
1210 | { | |
1211 | return std::unique(__first, __last, __pred); | |
1212 | } | |
1213 | ||
1214 | template <class _RandomAccessIterator, class _BinaryPredicate> | |
1215 | _RandomAccessIterator | |
1216 | __brick_unique(_RandomAccessIterator __first, _RandomAccessIterator __last, _BinaryPredicate __pred, | |
1217 | /*is_vector=*/std::true_type) noexcept | |
1218 | { | |
1219 | _PSTL_PRAGMA_MESSAGE("Vectorized algorithm unimplemented, redirected to serial"); | |
1220 | return std::unique(__first, __last, __pred); | |
1221 | } | |
1222 | ||
1223 | template <class _Tag, class _ExecutionPolicy, class _ForwardIterator, class _BinaryPredicate> | |
1224 | _ForwardIterator | |
1225 | __pattern_unique(_Tag, _ExecutionPolicy&&, _ForwardIterator __first, _ForwardIterator __last, | |
1226 | _BinaryPredicate __pred) noexcept | |
1227 | { | |
1228 | return __internal::__brick_unique(__first, __last, __pred, typename _Tag::__is_vector{}); | |
1229 | } | |
1230 | ||
1231 | // That function is shared between two algorithms - remove_if (__pattern_remove_if) and unique (pattern unique). But a mask calculation is different. | |
1232 | // So, a caller passes _CalcMask brick into remove_elements. | |
1233 | template <class _IsVector, class _ExecutionPolicy, class _ForwardIterator, class _CalcMask> | |
1234 | _ForwardIterator | |
1235 | __remove_elements(__parallel_tag<_IsVector> __tag, _ExecutionPolicy&& __exec, _ForwardIterator __first, | |
1236 | _ForwardIterator __last, _CalcMask __calc_mask) | |
1237 | { | |
1238 | using __backend_tag = typename decltype(__tag)::__backend_tag; | |
1239 | ||
1240 | typedef typename std::iterator_traits<_ForwardIterator>::difference_type _DifferenceType; | |
1241 | typedef typename std::iterator_traits<_ForwardIterator>::value_type _Tp; | |
1242 | _DifferenceType __n = __last - __first; | |
1243 | __par_backend::__buffer<bool> __mask_buf(__n); | |
1244 | // 1. find a first iterator that should be removed | |
1245 | return __internal::__except_handler([&]() { | |
1246 | bool* __mask = __mask_buf.get(); | |
1247 | _DifferenceType __min = __par_backend::__parallel_reduce( | |
1248 | __backend_tag{}, std::forward<_ExecutionPolicy>(__exec), _DifferenceType(0), __n, __n, | |
1249 | [__first, __mask, &__calc_mask](_DifferenceType __i, _DifferenceType __j, | |
1250 | _DifferenceType __local_min) -> _DifferenceType | |
1251 | { | |
1252 | // Create mask | |
1253 | __calc_mask(__mask + __i, __mask + __j, __first + __i); | |
1254 | ||
1255 | // if minimum was found in a previous range we shouldn't do anymore | |
1256 | if (__local_min < __i) | |
1257 | { | |
1258 | return __local_min; | |
1259 | } | |
1260 | // find first iterator that should be removed | |
1261 | bool* __result = __internal::__brick_find_if( | |
1262 | __mask + __i, __mask + __j, [](bool __val) { return !__val; }, _IsVector{}); | |
1263 | if (__result - __mask == __j) | |
1264 | { | |
1265 | return __local_min; | |
1266 | } | |
1267 | return std::min(__local_min, _DifferenceType(__result - __mask)); | |
1268 | }, | |
1269 | [](_DifferenceType __local_min1, _DifferenceType __local_min2) -> _DifferenceType | |
1270 | { return std::min(__local_min1, __local_min2); }); | |
1271 | ||
1272 | // No elements to remove - exit | |
1273 | if (__min == __n) | |
1274 | { | |
1275 | return __last; | |
1276 | } | |
1277 | __n -= __min; | |
1278 | __first += __min; | |
1279 | ||
1280 | __par_backend::__buffer<_Tp> __buf(__n); | |
1281 | _Tp* __result = __buf.get(); | |
1282 | __mask += __min; | |
1283 | _DifferenceType __m{}; | |
1284 | // 2. Elements that doesn't satisfy pred are moved to result | |
1285 | __par_backend::__parallel_strict_scan( | |
1286 | __backend_tag{}, std::forward<_ExecutionPolicy>(__exec), __n, _DifferenceType(0), | |
1287 | [__mask](_DifferenceType __i, _DifferenceType __len) | |
1288 | { | |
1289 | return __internal::__brick_count( | |
1290 | __mask + __i, __mask + __i + __len, [](bool __val) { return __val; }, _IsVector{}); | |
1291 | }, | |
1292 | std::plus<_DifferenceType>(), | |
1293 | [=](_DifferenceType __i, _DifferenceType __len, _DifferenceType __initial) | |
1294 | { | |
1295 | __internal::__brick_copy_by_mask( | |
1296 | __first + __i, __first + __i + __len, __result + __initial, __mask + __i, | |
1297 | [](_ForwardIterator __x, _Tp* __z) | |
1298 | { | |
1299 | __internal::__invoke_if_else( | |
1300 | std::conjunction<std::is_trivially_copyable<_Tp>, std::is_trivially_default_constructible<_Tp>>(), | |
1301 | [&]() { *__z = std::move(*__x); }, | |
1302 | [&]() { ::new (std::addressof(*__z)) _Tp(std::move(*__x)); }); | |
1303 | }, | |
1304 | _IsVector{}); | |
1305 | }, | |
1306 | [&__m](_DifferenceType __total) { __m = __total; }); | |
1307 | ||
1308 | // 3. Elements from result are moved to [first, last) | |
1309 | __par_backend::__parallel_for( | |
1310 | __backend_tag{}, std::forward<_ExecutionPolicy>(__exec), __result, __result + __m, | |
1311 | [__result, __first](_Tp* __i, _Tp* __j) | |
1312 | { | |
1313 | __invoke_if_else( | |
1314 | std::conjunction<std::is_trivially_copyable<_Tp>, std::is_trivially_default_constructible<_Tp>>(), | |
1315 | [&]() { __brick_move(__i, __j, __first + (__i - __result), _IsVector{}); }, | |
1316 | [&]() { __brick_move_destroy()(__i, __j, __first + (__i - __result), _IsVector{}); }); | |
1317 | }); | |
1318 | return __first + __m; | |
1319 | }); | |
1320 | } | |
1321 | ||
1322 | template <class _IsVector, class _ExecutionPolicy, class _RandomAccessIterator, class _BinaryPredicate> | |
1323 | _RandomAccessIterator | |
1324 | __pattern_unique(__parallel_tag<_IsVector> __tag, _ExecutionPolicy&& __exec, _RandomAccessIterator __first, | |
1325 | _RandomAccessIterator __last, _BinaryPredicate __pred) noexcept | |
1326 | { | |
1327 | typedef typename std::iterator_traits<_RandomAccessIterator>::reference _ReferenceType; | |
1328 | ||
1329 | if (__first == __last) | |
1330 | { | |
1331 | return __last; | |
1332 | } | |
1333 | if (__first + 1 == __last || __first + 2 == __last) | |
1334 | { | |
1335 | // Trivial sequence - use serial algorithm | |
1336 | return __internal::__brick_unique(__first, __last, __pred, _IsVector{}); | |
1337 | } | |
1338 | return __internal::__remove_elements( | |
1339 | __tag, std::forward<_ExecutionPolicy>(__exec), ++__first, __last, | |
1340 | [&__pred](bool* __b, bool* __e, _RandomAccessIterator __it) | |
1341 | { | |
1342 | __internal::__brick_walk3( | |
1343 | __b, __e, __it - 1, __it, | |
1344 | [&__pred](bool& __x, _ReferenceType __y, _ReferenceType __z) { __x = !__pred(__y, __z); }, _IsVector{}); | |
1345 | }); | |
1346 | } | |
1347 | ||
1348 | //------------------------------------------------------------------------ | |
1349 | // unique_copy | |
1350 | //------------------------------------------------------------------------ | |
1351 | ||
1352 | template <class _ForwardIterator, class _OutputIterator, class _BinaryPredicate> | |
1353 | _OutputIterator | |
1354 | __brick_unique_copy(_ForwardIterator __first, _ForwardIterator __last, _OutputIterator __result, _BinaryPredicate __pred, | |
1355 | /*vector=*/std::false_type) noexcept | |
1356 | { | |
1357 | return std::unique_copy(__first, __last, __result, __pred); | |
1358 | } | |
1359 | ||
1360 | template <class _RandomAccessIterator1, class _RandomAccessIterator2, class _BinaryPredicate> | |
1361 | _RandomAccessIterator2 | |
1362 | __brick_unique_copy(_RandomAccessIterator1 __first, _RandomAccessIterator1 __last, _RandomAccessIterator2 __result, | |
1363 | _BinaryPredicate __pred, /*vector=*/std::true_type) noexcept | |
1364 | { | |
1365 | #if defined(_PSTL_MONOTONIC_PRESENT) | |
1366 | return __unseq_backend::__simd_unique_copy(__first, __last - __first, __result, __pred); | |
1367 | #else | |
1368 | return std::unique_copy(__first, __last, __result, __pred); | |
1369 | #endif | |
1370 | } | |
1371 | ||
1372 | template <class _Tag, class _ExecutionPolicy, class _ForwardIterator, class _OutputIterator, class _BinaryPredicate> | |
1373 | _OutputIterator | |
1374 | __pattern_unique_copy(_Tag, _ExecutionPolicy&&, _ForwardIterator __first, _ForwardIterator __last, | |
1375 | _OutputIterator __result, _BinaryPredicate __pred) noexcept | |
1376 | { | |
1377 | return __internal::__brick_unique_copy(__first, __last, __result, __pred, typename _Tag::__is_vector{}); | |
1378 | } | |
1379 | ||
1380 | template <class _DifferenceType, class _RandomAccessIterator, class _BinaryPredicate> | |
1381 | _DifferenceType | |
1382 | __brick_calc_mask_2(_RandomAccessIterator __first, _RandomAccessIterator __last, bool* __restrict __mask, | |
1383 | _BinaryPredicate __pred, /*vector=*/std::false_type) noexcept | |
1384 | { | |
1385 | _DifferenceType __count = 0; | |
1386 | for (; __first != __last; ++__first, ++__mask) | |
1387 | { | |
1388 | *__mask = !__pred(*__first, *(__first - 1)); | |
1389 | __count += *__mask; | |
1390 | } | |
1391 | return __count; | |
1392 | } | |
1393 | ||
1394 | template <class _DifferenceType, class _RandomAccessIterator, class _BinaryPredicate> | |
1395 | _DifferenceType | |
1396 | __brick_calc_mask_2(_RandomAccessIterator __first, _RandomAccessIterator __last, bool* __restrict __mask, | |
1397 | _BinaryPredicate __pred, /*vector=*/std::true_type) noexcept | |
1398 | { | |
1399 | return __unseq_backend::__simd_calc_mask_2(__first, __last - __first, __mask, __pred); | |
1400 | } | |
1401 | ||
1402 | template <class _IsVector, class _ExecutionPolicy, class _RandomAccessIterator1, class _RandomAccessIterator2, | |
1403 | class _BinaryPredicate> | |
1404 | _RandomAccessIterator2 | |
1405 | __pattern_unique_copy(__parallel_tag<_IsVector> __tag, _ExecutionPolicy&& __exec, _RandomAccessIterator1 __first, | |
1406 | _RandomAccessIterator1 __last, _RandomAccessIterator2 __result, _BinaryPredicate __pred) | |
1407 | { | |
1408 | using __backend_tag = typename decltype(__tag)::__backend_tag; | |
1409 | ||
1410 | typedef typename std::iterator_traits<_RandomAccessIterator1>::difference_type _DifferenceType; | |
1411 | const _DifferenceType __n = __last - __first; | |
1412 | if (_DifferenceType(2) < __n) | |
1413 | { | |
1414 | __par_backend::__buffer<bool> __mask_buf(__n); | |
1415 | if (_DifferenceType(2) < __n) | |
1416 | { | |
1417 | return __internal::__except_handler( | |
1418 | [&__exec, __n, __first, __result, __pred, &__mask_buf]() | |
1419 | { | |
1420 | bool* __mask = __mask_buf.get(); | |
1421 | _DifferenceType __m{}; | |
1422 | __par_backend::__parallel_strict_scan( | |
1423 | __backend_tag{}, std::forward<_ExecutionPolicy>(__exec), __n, _DifferenceType(0), | |
1424 | [=](_DifferenceType __i, _DifferenceType __len) -> _DifferenceType { // Reduce | |
1425 | _DifferenceType __extra = 0; | |
1426 | if (__i == 0) | |
1427 | { | |
1428 | // Special boundary case | |
1429 | __mask[__i] = true; | |
1430 | if (--__len == 0) | |
1431 | return 1; | |
1432 | ++__i; | |
1433 | ++__extra; | |
1434 | } | |
1435 | return __internal::__brick_calc_mask_2<_DifferenceType>( | |
1436 | __first + __i, __first + (__i + __len), __mask + __i, __pred, _IsVector{}) + | |
1437 | __extra; | |
1438 | }, | |
1439 | std::plus<_DifferenceType>(), // Combine | |
1440 | [=](_DifferenceType __i, _DifferenceType __len, _DifferenceType __initial) { // Scan | |
1441 | // Phase 2 is same as for __pattern_copy_if | |
1442 | __internal::__brick_copy_by_mask( | |
1443 | __first + __i, __first + (__i + __len), __result + __initial, __mask + __i, | |
1444 | [](_RandomAccessIterator1 __x, _RandomAccessIterator2 __z) { *__z = *__x; }, | |
1445 | _IsVector{}); | |
1446 | }, | |
1447 | [&__m](_DifferenceType __total) { __m = __total; }); | |
1448 | return __result + __m; | |
1449 | }); | |
1450 | } | |
1451 | } | |
1452 | // trivial sequence - use serial algorithm | |
1453 | return __internal::__brick_unique_copy(__first, __last, __result, __pred, _IsVector{}); | |
1454 | } | |
1455 | ||
1456 | //------------------------------------------------------------------------ | |
1457 | // reverse | |
1458 | //------------------------------------------------------------------------ | |
1459 | template <class _BidirectionalIterator> | |
1460 | void | |
1461 | __brick_reverse(_BidirectionalIterator __first, _BidirectionalIterator __last, /*__is_vector=*/std::false_type) noexcept | |
1462 | { | |
1463 | std::reverse(__first, __last); | |
1464 | } | |
1465 | ||
1466 | template <class _RandomAccessIterator> | |
1467 | void | |
1468 | __brick_reverse(_RandomAccessIterator __first, _RandomAccessIterator __last, /*__is_vector=*/std::true_type) noexcept | |
1469 | { | |
1470 | typedef typename std::iterator_traits<_RandomAccessIterator>::reference _ReferenceType; | |
1471 | ||
1472 | const auto __n = (__last - __first) / 2; | |
1473 | __unseq_backend::__simd_walk_2(__first, __n, std::reverse_iterator<_RandomAccessIterator>(__last), | |
1474 | [](_ReferenceType __x, _ReferenceType __y) { | |
1475 | using std::swap; | |
1476 | swap(__x, __y); | |
1477 | }); | |
1478 | } | |
1479 | ||
1480 | // this brick is called in parallel version, so we can use iterator arithmetic | |
1481 | template <class _BidirectionalIterator> | |
1482 | void | |
1483 | __brick_reverse(_BidirectionalIterator __first, _BidirectionalIterator __last, _BidirectionalIterator __d_last, | |
1484 | /*is_vector=*/std::false_type) noexcept | |
1485 | { | |
1486 | for (--__d_last; __first != __last; ++__first, --__d_last) | |
1487 | { | |
1488 | using std::iter_swap; | |
1489 | iter_swap(__first, __d_last); | |
1490 | } | |
1491 | } | |
1492 | ||
1493 | // this brick is called in parallel version, so we can use iterator arithmetic | |
1494 | template <class _RandomAccessIterator> | |
1495 | void | |
1496 | __brick_reverse(_RandomAccessIterator __first, _RandomAccessIterator __last, _RandomAccessIterator __d_last, | |
1497 | /*is_vector=*/std::true_type) noexcept | |
1498 | { | |
1499 | typedef typename std::iterator_traits<_RandomAccessIterator>::reference _ReferenceType; | |
1500 | ||
1501 | __unseq_backend::__simd_walk_2(__first, __last - __first, std::reverse_iterator<_RandomAccessIterator>(__d_last), | |
1502 | [](_ReferenceType __x, _ReferenceType __y) { | |
1503 | using std::swap; | |
1504 | swap(__x, __y); | |
1505 | }); | |
1506 | } | |
1507 | ||
1508 | template <class _Tag, class _ExecutionPolicy, class _BidirectionalIterator> | |
1509 | void | |
1510 | __pattern_reverse(_Tag, _ExecutionPolicy&&, _BidirectionalIterator __first, _BidirectionalIterator __last) noexcept | |
1511 | { | |
1512 | __internal::__brick_reverse(__first, __last, typename _Tag::__is_vector{}); | |
1513 | } | |
1514 | ||
1515 | template <class _IsVector, class _ExecutionPolicy, class _RandomAccessIterator> | |
1516 | void | |
1517 | __pattern_reverse(__parallel_tag<_IsVector> __tag, _ExecutionPolicy&& __exec, _RandomAccessIterator __first, | |
1518 | _RandomAccessIterator __last) | |
1519 | { | |
1520 | using __backend_tag = typename decltype(__tag)::__backend_tag; | |
1521 | ||
1522 | __par_backend::__parallel_for( | |
1523 | __backend_tag{}, std::forward<_ExecutionPolicy>(__exec), __first, __first + (__last - __first) / 2, | |
1524 | [__first, __last](_RandomAccessIterator __inner_first, _RandomAccessIterator __inner_last) | |
1525 | { __internal::__brick_reverse(__inner_first, __inner_last, __last - (__inner_first - __first), _IsVector{}); }); | |
1526 | } | |
1527 | ||
1528 | //------------------------------------------------------------------------ | |
1529 | // reverse_copy | |
1530 | //------------------------------------------------------------------------ | |
1531 | ||
1532 | template <class _BidirectionalIterator, class _OutputIterator> | |
1533 | _OutputIterator | |
1534 | __brick_reverse_copy(_BidirectionalIterator __first, _BidirectionalIterator __last, _OutputIterator __d_first, | |
1535 | /*is_vector=*/std::false_type) noexcept | |
1536 | { | |
1537 | return std::reverse_copy(__first, __last, __d_first); | |
1538 | } | |
1539 | ||
1540 | template <class _RandomAccessIterator1, class _RandomAccessIterator2> | |
1541 | _RandomAccessIterator2 | |
1542 | __brick_reverse_copy(_RandomAccessIterator1 __first, _RandomAccessIterator1 __last, _RandomAccessIterator2 __d_first, | |
1543 | /*is_vector=*/std::true_type) noexcept | |
1544 | { | |
1545 | typedef typename std::iterator_traits<_RandomAccessIterator1>::reference _ReferenceType1; | |
1546 | typedef typename std::iterator_traits<_RandomAccessIterator2>::reference _ReferenceType2; | |
1547 | ||
1548 | return __unseq_backend::__simd_walk_2(std::reverse_iterator<_RandomAccessIterator1>(__last), __last - __first, | |
1549 | __d_first, [](_ReferenceType1 __x, _ReferenceType2 __y) { __y = __x; }); | |
1550 | } | |
1551 | ||
1552 | template <class _Tag, class _ExecutionPolicy, class _BidirectionalIterator, class _OutputIterator> | |
1553 | _OutputIterator | |
1554 | __pattern_reverse_copy(_Tag, _ExecutionPolicy&&, _BidirectionalIterator __first, _BidirectionalIterator __last, | |
1555 | _OutputIterator __d_first) noexcept | |
1556 | { | |
1557 | return __internal::__brick_reverse_copy(__first, __last, __d_first, typename _Tag::__is_vector{}); | |
1558 | } | |
1559 | ||
1560 | template <class _IsVector, class _ExecutionPolicy, class _RandomAccessIterator1, class _RandomAccessIterator2> | |
1561 | _RandomAccessIterator2 | |
1562 | __pattern_reverse_copy(__parallel_tag<_IsVector> __tag, _ExecutionPolicy&& __exec, _RandomAccessIterator1 __first, | |
1563 | _RandomAccessIterator1 __last, _RandomAccessIterator2 __d_first) | |
1564 | { | |
1565 | using __backend_tag = typename decltype(__tag)::__backend_tag; | |
1566 | ||
1567 | auto __len = __last - __first; | |
1568 | __par_backend::__parallel_for( | |
1569 | __backend_tag{}, std::forward<_ExecutionPolicy>(__exec), __first, __last, | |
1570 | [__first, __len, __d_first](_RandomAccessIterator1 __inner_first, _RandomAccessIterator1 __inner_last) | |
1571 | { | |
1572 | __internal::__brick_reverse_copy(__inner_first, __inner_last, | |
1573 | __d_first + (__len - (__inner_last - __first)), _IsVector{}); | |
1574 | }); | |
1575 | return __d_first + __len; | |
1576 | } | |
1577 | ||
1578 | //------------------------------------------------------------------------ | |
1579 | // rotate | |
1580 | //------------------------------------------------------------------------ | |
1581 | template <class _ForwardIterator> | |
1582 | _ForwardIterator | |
1583 | __brick_rotate(_ForwardIterator __first, _ForwardIterator __middle, _ForwardIterator __last, | |
1584 | /*is_vector=*/std::false_type) noexcept | |
1585 | { | |
1586 | #if defined(_PSTL_CPP11_STD_ROTATE_BROKEN) | |
1587 | std::rotate(__first, __middle, __last); | |
1588 | return std::next(__first, std::distance(__middle, __last)); | |
1589 | #else | |
1590 | return std::rotate(__first, __middle, __last); | |
1591 | #endif | |
1592 | } | |
1593 | ||
1594 | template <class _RandomAccessIterator> | |
1595 | _RandomAccessIterator | |
1596 | __brick_rotate(_RandomAccessIterator __first, _RandomAccessIterator __middle, _RandomAccessIterator __last, | |
1597 | /*is_vector=*/std::true_type) noexcept | |
1598 | { | |
1599 | auto __n = __last - __first; | |
1600 | auto __m = __middle - __first; | |
1601 | const _RandomAccessIterator __ret = __first + (__last - __middle); | |
1602 | ||
1603 | bool __is_left = (__m <= __n / 2); | |
1604 | if (!__is_left) | |
1605 | __m = __n - __m; | |
1606 | ||
1607 | while (__n > 1 && __m > 0) | |
1608 | { | |
1609 | using std::iter_swap; | |
1610 | const auto __m_2 = __m * 2; | |
1611 | if (__is_left) | |
1612 | { | |
1613 | for (; __last - __first >= __m_2; __first += __m) | |
1614 | { | |
1615 | __unseq_backend::__simd_assign(__first, __m, __first + __m, | |
1616 | iter_swap<_RandomAccessIterator, _RandomAccessIterator>); | |
1617 | } | |
1618 | } | |
1619 | else | |
1620 | { | |
1621 | for (; __last - __first >= __m_2; __last -= __m) | |
1622 | { | |
1623 | __unseq_backend::__simd_assign(__last - __m, __m, __last - __m_2, | |
1624 | iter_swap<_RandomAccessIterator, _RandomAccessIterator>); | |
1625 | } | |
1626 | } | |
1627 | __is_left = !__is_left; | |
1628 | __m = __n % __m; | |
1629 | __n = __last - __first; | |
1630 | } | |
1631 | ||
1632 | return __ret; | |
1633 | } | |
1634 | ||
1635 | template <class _Tag, class _ExecutionPolicy, class _ForwardIterator> | |
1636 | _ForwardIterator | |
1637 | __pattern_rotate(_Tag, _ExecutionPolicy&&, _ForwardIterator __first, _ForwardIterator __middle, | |
1638 | _ForwardIterator __last) noexcept | |
1639 | { | |
1640 | return __internal::__brick_rotate(__first, __middle, __last, typename _Tag::__is_vector{}); | |
1641 | } | |
1642 | ||
1643 | template <class _IsVector, class _ExecutionPolicy, class _RandomAccessIterator> | |
1644 | _RandomAccessIterator | |
1645 | __pattern_rotate(__parallel_tag<_IsVector> __tag, _ExecutionPolicy&& __exec, _RandomAccessIterator __first, | |
1646 | _RandomAccessIterator __middle, _RandomAccessIterator __last) | |
1647 | { | |
1648 | using __backend_tag = typename decltype(__tag)::__backend_tag; | |
1649 | ||
1650 | typedef typename std::iterator_traits<_RandomAccessIterator>::value_type _Tp; | |
1651 | auto __n = __last - __first; | |
1652 | auto __m = __middle - __first; | |
1653 | if (__m <= __n / 2) | |
1654 | { | |
1655 | __par_backend::__buffer<_Tp> __buf(__n - __m); | |
1656 | return __internal::__except_handler( | |
1657 | [&__exec, __n, __m, __first, __middle, __last, &__buf]() | |
1658 | { | |
1659 | _Tp* __result = __buf.get(); | |
1660 | __par_backend::__parallel_for( | |
1661 | __backend_tag{}, std::forward<_ExecutionPolicy>(__exec), __middle, __last, | |
1662 | [__middle, __result](_RandomAccessIterator __b, _RandomAccessIterator __e) | |
1663 | { __internal::__brick_uninitialized_move(__b, __e, __result + (__b - __middle), _IsVector{}); }); | |
1664 | ||
1665 | __par_backend::__parallel_for( | |
1666 | __backend_tag{}, std::forward<_ExecutionPolicy>(__exec), __first, __middle, | |
1667 | [__last, __middle](_RandomAccessIterator __b, _RandomAccessIterator __e) | |
1668 | { __internal::__brick_move(__b, __e, __b + (__last - __middle), _IsVector{}); }); | |
1669 | ||
1670 | __par_backend::__parallel_for( | |
1671 | __backend_tag{}, std::forward<_ExecutionPolicy>(__exec), __result, __result + (__n - __m), | |
1672 | [__first, __result](_Tp* __b, _Tp* __e) | |
1673 | { __brick_move_destroy()(__b, __e, __first + (__b - __result), _IsVector{}); }); | |
1674 | ||
1675 | return __first + (__last - __middle); | |
1676 | }); | |
1677 | } | |
1678 | else | |
1679 | { | |
1680 | __par_backend::__buffer<_Tp> __buf(__m); | |
1681 | return __internal::__except_handler( | |
1682 | [&__exec, __n, __m, __first, __middle, __last, &__buf]() | |
1683 | { | |
1684 | _Tp* __result = __buf.get(); | |
1685 | __par_backend::__parallel_for( | |
1686 | __backend_tag{}, std::forward<_ExecutionPolicy>(__exec), __first, __middle, | |
1687 | [__first, __result](_RandomAccessIterator __b, _RandomAccessIterator __e) | |
1688 | { __internal::__brick_uninitialized_move(__b, __e, __result + (__b - __first), _IsVector{}); }); | |
1689 | ||
1690 | __par_backend::__parallel_for( | |
1691 | __backend_tag{}, std::forward<_ExecutionPolicy>(__exec), __middle, __last, | |
1692 | [__first, __middle](_RandomAccessIterator __b, _RandomAccessIterator __e) | |
1693 | { __internal::__brick_move(__b, __e, __first + (__b - __middle), _IsVector{}); }); | |
1694 | ||
1695 | __par_backend::__parallel_for( | |
1696 | __backend_tag{}, std::forward<_ExecutionPolicy>(__exec), __result, __result + __m, | |
1697 | [__n, __m, __first, __result](_Tp* __b, _Tp* __e) | |
1698 | { __brick_move_destroy()(__b, __e, __first + ((__n - __m) + (__b - __result)), _IsVector{}); }); | |
1699 | ||
1700 | return __first + (__last - __middle); | |
1701 | }); | |
1702 | } | |
1703 | } | |
1704 | ||
1705 | //------------------------------------------------------------------------ | |
1706 | // rotate_copy | |
1707 | //------------------------------------------------------------------------ | |
1708 | ||
1709 | template <class _ForwardIterator, class _OutputIterator> | |
1710 | _OutputIterator | |
1711 | __brick_rotate_copy(_ForwardIterator __first, _ForwardIterator __middle, _ForwardIterator __last, | |
1712 | _OutputIterator __result, /*__is_vector=*/std::false_type) noexcept | |
1713 | { | |
1714 | return std::rotate_copy(__first, __middle, __last, __result); | |
1715 | } | |
1716 | ||
1717 | template <class _RandomAccessIterator1, class _RandomAccessIterator2> | |
1718 | _RandomAccessIterator2 | |
1719 | __brick_rotate_copy(_RandomAccessIterator1 __first, _RandomAccessIterator1 __middle, _RandomAccessIterator1 __last, | |
1720 | _RandomAccessIterator2 __result, /*__is_vector=*/std::true_type) noexcept | |
1721 | { | |
1722 | _RandomAccessIterator2 __res = __internal::__brick_copy(__middle, __last, __result, std::true_type()); | |
1723 | return __internal::__brick_copy(__first, __middle, __res, std::true_type()); | |
1724 | } | |
1725 | ||
1726 | template <class _Tag, class _ExecutionPolicy, class _ForwardIterator, class _OutputIterator> | |
1727 | _OutputIterator | |
1728 | __pattern_rotate_copy(_Tag, _ExecutionPolicy&&, _ForwardIterator __first, _ForwardIterator __middle, | |
1729 | _ForwardIterator __last, _OutputIterator __result) noexcept | |
1730 | { | |
1731 | return __internal::__brick_rotate_copy(__first, __middle, __last, __result, typename _Tag::__is_vector{}); | |
1732 | } | |
1733 | ||
1734 | template <class _IsVector, class _ExecutionPolicy, class _RandomAccessIterator1, class _RandomAccessIterator2> | |
1735 | _RandomAccessIterator2 | |
1736 | __pattern_rotate_copy(__parallel_tag<_IsVector> __tag, _ExecutionPolicy&& __exec, _RandomAccessIterator1 __first, | |
1737 | _RandomAccessIterator1 __middle, _RandomAccessIterator1 __last, _RandomAccessIterator2 __result) | |
1738 | { | |
1739 | using __backend_tag = typename decltype(__tag)::__backend_tag; | |
1740 | ||
1741 | __par_backend::__parallel_for( | |
1742 | __backend_tag{}, std::forward<_ExecutionPolicy>(__exec), __first, __last, | |
1743 | [__first, __last, __middle, __result](_RandomAccessIterator1 __b, _RandomAccessIterator1 __e) | |
1744 | { | |
1745 | if (__b > __middle) | |
1746 | { | |
1747 | __internal::__brick_copy(__b, __e, __result + (__b - __middle), _IsVector{}); | |
1748 | } | |
1749 | else | |
1750 | { | |
1751 | _RandomAccessIterator2 __new_result = __result + ((__last - __middle) + (__b - __first)); | |
1752 | if (__e < __middle) | |
1753 | { | |
1754 | __internal::__brick_copy(__b, __e, __new_result, _IsVector{}); | |
1755 | } | |
1756 | else | |
1757 | { | |
1758 | __internal::__brick_copy(__b, __middle, __new_result, _IsVector{}); | |
1759 | __internal::__brick_copy(__middle, __e, __result, _IsVector{}); | |
1760 | } | |
1761 | } | |
1762 | }); | |
1763 | return __result + (__last - __first); | |
1764 | } | |
1765 | ||
1766 | //------------------------------------------------------------------------ | |
1767 | // is_partitioned | |
1768 | //------------------------------------------------------------------------ | |
1769 | ||
1770 | template <class _ForwardIterator, class _UnaryPredicate> | |
1771 | bool | |
1772 | __brick_is_partitioned(_ForwardIterator __first, _ForwardIterator __last, _UnaryPredicate __pred, | |
1773 | /*is_vector=*/std::false_type) noexcept | |
1774 | { | |
1775 | return std::is_partitioned(__first, __last, __pred); | |
1776 | } | |
1777 | ||
1778 | template <class _RandomAccessIterator, class _UnaryPredicate> | |
1779 | bool | |
1780 | __brick_is_partitioned(_RandomAccessIterator __first, _RandomAccessIterator __last, _UnaryPredicate __pred, | |
1781 | /*is_vector=*/std::true_type) noexcept | |
1782 | { | |
1783 | typedef typename std::iterator_traits<_RandomAccessIterator>::difference_type _SizeType; | |
1784 | if (__first == __last) | |
1785 | { | |
1786 | return true; | |
1787 | } | |
1788 | else | |
1789 | { | |
1790 | _RandomAccessIterator __result = __unseq_backend::__simd_first( | |
1791 | __first, _SizeType(0), __last - __first, | |
1792 | [&__pred](_RandomAccessIterator __it, _SizeType __i) { return !__pred(__it[__i]); }); | |
1793 | if (__result == __last) | |
1794 | { | |
1795 | return true; | |
1796 | } | |
1797 | else | |
1798 | { | |
1799 | ++__result; | |
1800 | return !__unseq_backend::__simd_or(__result, __last - __result, __pred); | |
1801 | } | |
1802 | } | |
1803 | } | |
1804 | ||
1805 | template <class _Tag, class _ExecutionPolicy, class _ForwardIterator, class _UnaryPredicate> | |
1806 | bool | |
1807 | __pattern_is_partitioned(_Tag, _ExecutionPolicy&&, _ForwardIterator __first, _ForwardIterator __last, | |
1808 | _UnaryPredicate __pred) noexcept | |
1809 | { | |
1810 | return __internal::__brick_is_partitioned(__first, __last, __pred, typename _Tag::__is_vector{}); | |
1811 | } | |
1812 | ||
1813 | template <class _IsVector, class _ExecutionPolicy, class _RandomAccessIterator, class _UnaryPredicate> | |
1814 | bool | |
1815 | __pattern_is_partitioned(__parallel_tag<_IsVector> __tag, _ExecutionPolicy&& __exec, _RandomAccessIterator __first, | |
1816 | _RandomAccessIterator __last, _UnaryPredicate __pred) | |
1817 | { | |
1818 | if (__first == __last) | |
1819 | { | |
1820 | return true; | |
1821 | } | |
1822 | else | |
1823 | { | |
1824 | using __backend_tag = typename decltype(__tag)::__backend_tag; | |
1825 | ||
1826 | return __internal::__except_handler([&]() { | |
1827 | // State of current range: | |
1828 | // broken - current range is not partitioned by pred | |
1829 | // all_true - all elements in current range satisfy pred | |
1830 | // all_false - all elements in current range don't satisfy pred | |
1831 | // true_false - elements satisfy pred are placed before elements that don't satisfy pred | |
1832 | enum _ReduceType | |
1833 | { | |
1834 | __not_init = -1, | |
1835 | __broken, | |
1836 | __all_true, | |
1837 | __all_false, | |
1838 | __true_false | |
1839 | }; | |
1840 | _ReduceType __init = __not_init; | |
1841 | ||
1842 | // Array with states that we'll have when state from the left branch is merged with state from the right branch. | |
1843 | // State is calculated by formula: new_state = table[left_state * 4 + right_state] | |
1844 | _ReduceType __table[] = {__broken, __broken, __broken, __broken, __broken, __all_true, | |
1845 | __true_false, __true_false, __broken, __broken, __all_false, __broken, | |
1846 | __broken, __broken, __true_false, __broken}; | |
1847 | ||
1848 | __init = __par_backend::__parallel_reduce( | |
1849 | __backend_tag{}, std::forward<_ExecutionPolicy>(__exec), __first, __last, __init, | |
1850 | [&__pred, &__table](_RandomAccessIterator __i, _RandomAccessIterator __j, | |
1851 | _ReduceType __value) -> _ReduceType | |
1852 | { | |
1853 | if (__value == __broken) | |
1854 | { | |
1855 | return __broken; | |
1856 | } | |
1857 | _ReduceType __res = __not_init; | |
1858 | // if first element satisfy pred | |
1859 | if (__pred(*__i)) | |
1860 | { | |
1861 | // find first element that don't satisfy pred | |
1862 | _RandomAccessIterator __x = | |
1863 | __internal::__brick_find_if(__i + 1, __j, std::not_fn(__pred), _IsVector{}); | |
1864 | if (__x != __j) | |
1865 | { | |
1866 | // find first element after "x" that satisfy pred | |
1867 | _RandomAccessIterator __y = __internal::__brick_find_if(__x + 1, __j, __pred, _IsVector{}); | |
1868 | // if it was found then range isn't partitioned by pred | |
1869 | if (__y != __j) | |
1870 | { | |
1871 | return __broken; | |
1872 | } | |
1873 | else | |
1874 | { | |
1875 | __res = __true_false; | |
1876 | } | |
1877 | } | |
1878 | else | |
1879 | { | |
1880 | __res = __all_true; | |
1881 | } | |
1882 | } | |
1883 | else | |
1884 | { // if first element doesn't satisfy pred | |
1885 | // then we should find the first element that satisfy pred. | |
1886 | // If we found it then range isn't partitioned by pred | |
1887 | if (__internal::__brick_find_if(__i + 1, __j, __pred, _IsVector{}) != __j) | |
1888 | { | |
1889 | return __broken; | |
1890 | } | |
1891 | else | |
1892 | { | |
1893 | __res = __all_false; | |
1894 | } | |
1895 | } | |
1896 | // if we have value from left range then we should calculate the result | |
1897 | return (__value == -1) ? __res : __table[__value * 4 + __res]; | |
1898 | }, | |
1899 | ||
1900 | [&__table](_ReduceType __val1, _ReduceType __val2) -> _ReduceType | |
1901 | { | |
1902 | if (__val1 == __broken || __val2 == __broken) | |
1903 | { | |
1904 | return __broken; | |
1905 | } | |
1906 | // calculate the result for new big range | |
1907 | return __table[__val1 * 4 + __val2]; | |
1908 | }); | |
1909 | return __init != __broken; | |
1910 | }); | |
1911 | } | |
1912 | } | |
1913 | ||
1914 | //------------------------------------------------------------------------ | |
1915 | // partition | |
1916 | //------------------------------------------------------------------------ | |
1917 | ||
1918 | template <class _ForwardIterator, class _UnaryPredicate> | |
1919 | _ForwardIterator | |
1920 | __brick_partition(_ForwardIterator __first, _ForwardIterator __last, _UnaryPredicate __pred, | |
1921 | /*is_vector=*/std::false_type) noexcept | |
1922 | { | |
1923 | return std::partition(__first, __last, __pred); | |
1924 | } | |
1925 | ||
1926 | template <class _RandomAccessIterator, class _UnaryPredicate> | |
1927 | _RandomAccessIterator | |
1928 | __brick_partition(_RandomAccessIterator __first, _RandomAccessIterator __last, _UnaryPredicate __pred, | |
1929 | /*is_vector=*/std::true_type) noexcept | |
1930 | { | |
1931 | _PSTL_PRAGMA_MESSAGE("Vectorized algorithm unimplemented, redirected to serial"); | |
1932 | return std::partition(__first, __last, __pred); | |
1933 | } | |
1934 | ||
1935 | template <class _Tag, class _ExecutionPolicy, class _ForwardIterator, class _UnaryPredicate> | |
1936 | _ForwardIterator | |
1937 | __pattern_partition(_Tag, _ExecutionPolicy&&, _ForwardIterator __first, _ForwardIterator __last, | |
1938 | _UnaryPredicate __pred) noexcept | |
1939 | { | |
1940 | return __internal::__brick_partition(__first, __last, __pred, typename _Tag::__is_vector{}); | |
1941 | } | |
1942 | ||
1943 | template <class _IsVector, class _ExecutionPolicy, class _RandomAccessIterator, class _UnaryPredicate> | |
1944 | _RandomAccessIterator | |
1945 | __pattern_partition(__parallel_tag<_IsVector> __tag, _ExecutionPolicy&& __exec, _RandomAccessIterator __first, | |
1946 | _RandomAccessIterator __last, _UnaryPredicate __pred) | |
1947 | { | |
1948 | using __backend_tag = typename decltype(__tag)::__backend_tag; | |
1949 | ||
1950 | // partitioned range: elements before pivot satisfy pred (true part), | |
1951 | // elements after pivot don't satisfy pred (false part) | |
1952 | struct _PartitionRange | |
1953 | { | |
1954 | _RandomAccessIterator __begin; | |
1955 | _RandomAccessIterator __pivot; | |
1956 | _RandomAccessIterator __end; | |
1957 | }; | |
1958 | ||
1959 | return __internal::__except_handler([&]() { | |
1960 | _PartitionRange __init{__last, __last, __last}; | |
1961 | ||
1962 | // lambda for merging two partitioned ranges to one partitioned range | |
1963 | auto __reductor = [&__exec](_PartitionRange __val1, _PartitionRange __val2) -> _PartitionRange | |
1964 | { | |
1965 | auto __size1 = __val1.__end - __val1.__pivot; | |
1966 | auto __size2 = __val2.__pivot - __val2.__begin; | |
1967 | auto __new_begin = __val2.__begin - (__val1.__end - __val1.__begin); | |
1968 | ||
1969 | // if all elements in left range satisfy pred then we can move new pivot to pivot of right range | |
1970 | if (__val1.__end == __val1.__pivot) | |
1971 | { | |
1972 | return {__new_begin, __val2.__pivot, __val2.__end}; | |
1973 | } | |
1974 | // if true part of right range greater than false part of left range | |
1975 | // then we should swap the false part of left range and last part of true part of right range | |
1976 | else if (__size2 > __size1) | |
1977 | { | |
1978 | __par_backend::__parallel_for( | |
1979 | __backend_tag{}, std::forward<_ExecutionPolicy>(__exec), __val1.__pivot, __val1.__pivot + __size1, | |
1980 | [__val1, __val2, __size1](_RandomAccessIterator __i, _RandomAccessIterator __j) { | |
1981 | __internal::__brick_swap_ranges(__i, __j, (__val2.__pivot - __size1) + (__i - __val1.__pivot), | |
1982 | _IsVector{}); | |
1983 | }); | |
1984 | return {__new_begin, __val2.__pivot - __size1, __val2.__end}; | |
1985 | } | |
1986 | // else we should swap the first part of false part of left range and true part of right range | |
1987 | else | |
1988 | { | |
1989 | __par_backend::__parallel_for( | |
1990 | __backend_tag{}, std::forward<_ExecutionPolicy>(__exec), __val1.__pivot, __val1.__pivot + __size2, | |
1991 | [__val1, __val2](_RandomAccessIterator __i, _RandomAccessIterator __j) { | |
1992 | __internal::__brick_swap_ranges(__i, __j, __val2.__begin + (__i - __val1.__pivot), _IsVector{}); | |
1993 | }); | |
1994 | return {__new_begin, __val1.__pivot + __size2, __val2.__end}; | |
1995 | } | |
1996 | }; | |
1997 | ||
1998 | _PartitionRange __result = __par_backend::__parallel_reduce( | |
1999 | __backend_tag{}, std::forward<_ExecutionPolicy>(__exec), __first, __last, __init, | |
2000 | [__pred, __reductor](_RandomAccessIterator __i, _RandomAccessIterator __j, | |
2001 | _PartitionRange __value) -> _PartitionRange | |
2002 | { | |
2003 | //1. serial partition | |
2004 | _RandomAccessIterator __pivot = __internal::__brick_partition(__i, __j, __pred, _IsVector{}); | |
2005 | ||
2006 | // 2. merging of two ranges (left and right respectively) | |
2007 | return __reductor(__value, {__i, __pivot, __j}); | |
2008 | }, | |
2009 | __reductor); | |
2010 | return __result.__pivot; | |
2011 | }); | |
2012 | } | |
2013 | ||
2014 | //------------------------------------------------------------------------ | |
2015 | // stable_partition | |
2016 | //------------------------------------------------------------------------ | |
2017 | ||
2018 | template <class _BidirectionalIterator, class _UnaryPredicate> | |
2019 | _BidirectionalIterator | |
2020 | __brick_stable_partition(_BidirectionalIterator __first, _BidirectionalIterator __last, _UnaryPredicate __pred, | |
2021 | /*__is_vector=*/std::false_type) noexcept | |
2022 | { | |
2023 | return std::stable_partition(__first, __last, __pred); | |
2024 | } | |
2025 | ||
2026 | template <class _RandomAccessIterator, class _UnaryPredicate> | |
2027 | _RandomAccessIterator | |
2028 | __brick_stable_partition(_RandomAccessIterator __first, _RandomAccessIterator __last, _UnaryPredicate __pred, | |
2029 | /*__is_vector=*/std::true_type) noexcept | |
2030 | { | |
2031 | _PSTL_PRAGMA_MESSAGE("Vectorized algorithm unimplemented, redirected to serial"); | |
2032 | return std::stable_partition(__first, __last, __pred); | |
2033 | } | |
2034 | ||
2035 | template <class _Tag, class _ExecutionPolicy, class _BidirectionalIterator, class _UnaryPredicate> | |
2036 | _BidirectionalIterator | |
2037 | __pattern_stable_partition(_Tag, _ExecutionPolicy&&, _BidirectionalIterator __first, _BidirectionalIterator __last, | |
2038 | _UnaryPredicate __pred) noexcept | |
2039 | { | |
2040 | return __internal::__brick_stable_partition(__first, __last, __pred, typename _Tag::__is_vector{}); | |
2041 | } | |
2042 | ||
2043 | template <class _IsVector, class _ExecutionPolicy, class _RandomAccessIterator, class _UnaryPredicate> | |
2044 | _RandomAccessIterator | |
2045 | __pattern_stable_partition(__parallel_tag<_IsVector> __tag, _ExecutionPolicy&& __exec, _RandomAccessIterator __first, | |
2046 | _RandomAccessIterator __last, _UnaryPredicate __pred) noexcept | |
2047 | { | |
2048 | using __backend_tag = typename decltype(__tag)::__backend_tag; | |
2049 | ||
2050 | // partitioned range: elements before pivot satisfy pred (true part), | |
2051 | // elements after pivot don't satisfy pred (false part) | |
2052 | struct _PartitionRange | |
2053 | { | |
2054 | _RandomAccessIterator __begin; | |
2055 | _RandomAccessIterator __pivot; | |
2056 | _RandomAccessIterator __end; | |
2057 | }; | |
2058 | ||
2059 | return __internal::__except_handler([&]() { | |
2060 | _PartitionRange __init{__last, __last, __last}; | |
2061 | ||
2062 | // lambda for merging two partitioned ranges to one partitioned range | |
2063 | auto __reductor = [](_PartitionRange __val1, _PartitionRange __val2) -> _PartitionRange | |
2064 | { | |
2065 | auto __size1 = __val1.__end - __val1.__pivot; | |
2066 | auto __new_begin = __val2.__begin - (__val1.__end - __val1.__begin); | |
2067 | ||
2068 | // if all elements in left range satisfy pred then we can move new pivot to pivot of right range | |
2069 | if (__val1.__end == __val1.__pivot) | |
2070 | { | |
2071 | return {__new_begin, __val2.__pivot, __val2.__end}; | |
2072 | } | |
2073 | // if true part of right range greater than false part of left range | |
2074 | // then we should swap the false part of left range and last part of true part of right range | |
2075 | else | |
2076 | { | |
2077 | __internal::__brick_rotate(__val1.__pivot, __val2.__begin, __val2.__pivot, _IsVector{}); | |
2078 | return {__new_begin, __val2.__pivot - __size1, __val2.__end}; | |
2079 | } | |
2080 | }; | |
2081 | ||
2082 | _PartitionRange __result = __par_backend::__parallel_reduce( | |
2083 | __backend_tag{}, std::forward<_ExecutionPolicy>(__exec), __first, __last, __init, | |
2084 | [&__pred, __reductor](_RandomAccessIterator __i, _RandomAccessIterator __j, | |
2085 | _PartitionRange __value) -> _PartitionRange | |
2086 | { | |
2087 | //1. serial stable_partition | |
2088 | _RandomAccessIterator __pivot = __internal::__brick_stable_partition(__i, __j, __pred, _IsVector{}); | |
2089 | ||
2090 | // 2. merging of two ranges (left and right respectively) | |
2091 | return __reductor(__value, {__i, __pivot, __j}); | |
2092 | }, | |
2093 | __reductor); | |
2094 | return __result.__pivot; | |
2095 | }); | |
2096 | } | |
2097 | ||
2098 | //------------------------------------------------------------------------ | |
2099 | // partition_copy | |
2100 | //------------------------------------------------------------------------ | |
2101 | ||
2102 | template <class _ForwardIterator, class _OutputIterator1, class _OutputIterator2, class _UnaryPredicate> | |
2103 | std::pair<_OutputIterator1, _OutputIterator2> | |
2104 | __brick_partition_copy(_ForwardIterator __first, _ForwardIterator __last, _OutputIterator1 __out_true, | |
2105 | _OutputIterator2 __out_false, _UnaryPredicate __pred, /*is_vector=*/std::false_type) noexcept | |
2106 | { | |
2107 | return std::partition_copy(__first, __last, __out_true, __out_false, __pred); | |
2108 | } | |
2109 | ||
2110 | template <class _RandomAccessIterator1, class _RandomAccessIterator2, class _RandomAccessIterator3, | |
2111 | class _UnaryPredicate> | |
2112 | std::pair<_RandomAccessIterator2, _RandomAccessIterator3> | |
2113 | __brick_partition_copy(_RandomAccessIterator1 __first, _RandomAccessIterator1 __last, _RandomAccessIterator2 __out_true, | |
2114 | _RandomAccessIterator3 __out_false, _UnaryPredicate __pred, | |
2115 | /*is_vector=*/std::true_type) noexcept | |
2116 | { | |
2117 | #if defined(_PSTL_MONOTONIC_PRESENT) | |
2118 | return __unseq_backend::__simd_partition_copy(__first, __last - __first, __out_true, __out_false, __pred); | |
2119 | #else | |
2120 | return std::partition_copy(__first, __last, __out_true, __out_false, __pred); | |
2121 | #endif | |
2122 | } | |
2123 | ||
2124 | template <class _Tag, class _ExecutionPolicy, class _ForwardIterator, class _OutputIterator1, class _OutputIterator2, | |
2125 | class _UnaryPredicate> | |
2126 | std::pair<_OutputIterator1, _OutputIterator2> | |
2127 | __pattern_partition_copy(_Tag, _ExecutionPolicy&&, _ForwardIterator __first, _ForwardIterator __last, | |
2128 | _OutputIterator1 __out_true, _OutputIterator2 __out_false, _UnaryPredicate __pred) noexcept | |
2129 | { | |
2130 | return __internal::__brick_partition_copy(__first, __last, __out_true, __out_false, __pred, | |
2131 | typename _Tag::__is_vector{}); | |
2132 | } | |
2133 | ||
2134 | template <class _IsVector, class _ExecutionPolicy, class _RandomAccessIterator1, class _RandomAccessIterator2, | |
2135 | class _RandomAccessIterator3, class _UnaryPredicate> | |
2136 | std::pair<_RandomAccessIterator2, _RandomAccessIterator3> | |
2137 | __pattern_partition_copy(__parallel_tag<_IsVector> __tag, _ExecutionPolicy&& __exec, _RandomAccessIterator1 __first, | |
2138 | _RandomAccessIterator1 __last, _RandomAccessIterator2 __out_true, | |
2139 | _RandomAccessIterator3 __out_false, _UnaryPredicate __pred) | |
2140 | { | |
2141 | using __backend_tag = typename decltype(__tag)::__backend_tag; | |
2142 | ||
2143 | typedef typename std::iterator_traits<_RandomAccessIterator1>::difference_type _DifferenceType; | |
2144 | typedef std::pair<_DifferenceType, _DifferenceType> _ReturnType; | |
2145 | const _DifferenceType __n = __last - __first; | |
2146 | if (_DifferenceType(1) < __n) | |
2147 | { | |
2148 | __par_backend::__buffer<bool> __mask_buf(__n); | |
2149 | return __internal::__except_handler( | |
2150 | [&__exec, __n, __first, __out_true, __out_false, __pred, &__mask_buf]() | |
2151 | { | |
2152 | bool* __mask = __mask_buf.get(); | |
2153 | _ReturnType __m{}; | |
2154 | __par_backend::__parallel_strict_scan( | |
2155 | __backend_tag{}, std::forward<_ExecutionPolicy>(__exec), __n, | |
2156 | std::make_pair(_DifferenceType(0), _DifferenceType(0)), | |
2157 | [=](_DifferenceType __i, _DifferenceType __len) { // Reduce | |
2158 | return __internal::__brick_calc_mask_1<_DifferenceType>(__first + __i, __first + (__i + __len), | |
2159 | __mask + __i, __pred, _IsVector{}); | |
2160 | }, | |
2161 | [](const _ReturnType& __x, const _ReturnType& __y) -> _ReturnType | |
2162 | { return std::make_pair(__x.first + __y.first, __x.second + __y.second); }, // Combine | |
2163 | [=](_DifferenceType __i, _DifferenceType __len, _ReturnType __initial) { // Scan | |
2164 | __internal::__brick_partition_by_mask( | |
2165 | __first + __i, __first + (__i + __len), __out_true + __initial.first, | |
2166 | __out_false + __initial.second, __mask + __i, _IsVector{}); | |
2167 | }, | |
2168 | [&__m](_ReturnType __total) { __m = __total; }); | |
2169 | return std::make_pair(__out_true + __m.first, __out_false + __m.second); | |
2170 | }); | |
2171 | } | |
2172 | // trivial sequence - use serial algorithm | |
2173 | return __internal::__brick_partition_copy(__first, __last, __out_true, __out_false, __pred, _IsVector{}); | |
2174 | } | |
2175 | ||
2176 | //------------------------------------------------------------------------ | |
2177 | // sort | |
2178 | //------------------------------------------------------------------------ | |
2179 | ||
2180 | template <class _Tag, class _ExecutionPolicy, class _RandomAccessIterator, class _Compare, class _IsMoveConstructible> | |
2181 | void | |
2182 | __pattern_sort(_Tag, _ExecutionPolicy&&, _RandomAccessIterator __first, _RandomAccessIterator __last, _Compare __comp, | |
2183 | _IsMoveConstructible) noexcept | |
2184 | { | |
2185 | std::sort(__first, __last, __comp); | |
2186 | } | |
2187 | ||
2188 | template <class _IsVector, class _ExecutionPolicy, class _RandomAccessIterator, class _Compare> | |
2189 | void | |
2190 | __pattern_sort(__parallel_tag<_IsVector> __tag, _ExecutionPolicy&& __exec, _RandomAccessIterator __first, | |
2191 | _RandomAccessIterator __last, _Compare __comp, /*is_move_constructible=*/std::true_type) | |
2192 | { | |
2193 | using __backend_tag = typename decltype(__tag)::__backend_tag; | |
2194 | ||
2195 | __internal::__except_handler( | |
2196 | [&]() | |
2197 | { | |
2198 | __par_backend::__parallel_stable_sort( | |
2199 | __backend_tag{}, std::forward<_ExecutionPolicy>(__exec), __first, __last, __comp, | |
2200 | [](_RandomAccessIterator __first, _RandomAccessIterator __last, _Compare __comp) | |
2201 | { std::sort(__first, __last, __comp); }); | |
2202 | }); | |
2203 | } | |
2204 | ||
2205 | //------------------------------------------------------------------------ | |
2206 | // stable_sort | |
2207 | //------------------------------------------------------------------------ | |
2208 | ||
2209 | template <class _Tag, class _ExecutionPolicy, class _RandomAccessIterator, class _Compare> | |
2210 | void | |
2211 | __pattern_stable_sort(_Tag, _ExecutionPolicy&&, _RandomAccessIterator __first, _RandomAccessIterator __last, | |
2212 | _Compare __comp) noexcept | |
2213 | { | |
2214 | std::stable_sort(__first, __last, __comp); | |
2215 | } | |
2216 | ||
2217 | template <class _IsVector, class _ExecutionPolicy, class _RandomAccessIterator, class _Compare> | |
2218 | void | |
2219 | __pattern_stable_sort(__parallel_tag<_IsVector> __tag, _ExecutionPolicy&& __exec, _RandomAccessIterator __first, | |
2220 | _RandomAccessIterator __last, _Compare __comp) | |
2221 | { | |
2222 | using __backend_tag = typename decltype(__tag)::__backend_tag; | |
2223 | ||
2224 | __internal::__except_handler( | |
2225 | [&]() | |
2226 | { | |
2227 | __par_backend::__parallel_stable_sort( | |
2228 | __backend_tag{}, std::forward<_ExecutionPolicy>(__exec), __first, __last, __comp, | |
2229 | [](_RandomAccessIterator __first, _RandomAccessIterator __last, _Compare __comp) | |
2230 | { std::stable_sort(__first, __last, __comp); }); | |
2231 | }); | |
2232 | } | |
2233 | ||
2234 | //------------------------------------------------------------------------ | |
2235 | // partial_sort | |
2236 | //------------------------------------------------------------------------ | |
2237 | ||
2238 | template <class _Tag, class _ExecutionPolicy, class _RandomAccessIterator, class _Compare> | |
2239 | void | |
2240 | __pattern_partial_sort(_Tag, _ExecutionPolicy&&, _RandomAccessIterator __first, _RandomAccessIterator __middle, | |
2241 | _RandomAccessIterator __last, _Compare __comp) noexcept | |
2242 | { | |
2243 | std::partial_sort(__first, __middle, __last, __comp); | |
2244 | } | |
2245 | ||
2246 | template <class _IsVector, class _ExecutionPolicy, class _RandomAccessIterator, class _Compare> | |
2247 | void | |
2248 | __pattern_partial_sort(__parallel_tag<_IsVector> __tag, _ExecutionPolicy&& __exec, _RandomAccessIterator __first, | |
2249 | _RandomAccessIterator __middle, _RandomAccessIterator __last, _Compare __comp) | |
2250 | { | |
2251 | using __backend_tag = typename decltype(__tag)::__backend_tag; | |
2252 | ||
2253 | const auto __n = __middle - __first; | |
2254 | if (__n == 0) | |
2255 | return; | |
2256 | ||
2257 | __internal::__except_handler( | |
2258 | [&]() | |
2259 | { | |
2260 | __par_backend::__parallel_stable_sort( | |
2261 | __backend_tag{}, std::forward<_ExecutionPolicy>(__exec), __first, __last, __comp, | |
2262 | [__n](_RandomAccessIterator __begin, _RandomAccessIterator __end, _Compare __comp) | |
2263 | { | |
2264 | if (__n < __end - __begin) | |
2265 | std::partial_sort(__begin, __begin + __n, __end, __comp); | |
2266 | else | |
2267 | std::sort(__begin, __end, __comp); | |
2268 | }, | |
2269 | __n); | |
2270 | }); | |
2271 | } | |
2272 | ||
2273 | //------------------------------------------------------------------------ | |
2274 | // partial_sort_copy | |
2275 | //------------------------------------------------------------------------ | |
2276 | ||
2277 | template <class _Tag, class _ExecutionPolicy, class _ForwardIterator, class _RandomAccessIterator, class _Compare> | |
2278 | _RandomAccessIterator | |
2279 | __pattern_partial_sort_copy(_Tag, _ExecutionPolicy&&, _ForwardIterator __first, _ForwardIterator __last, | |
2280 | _RandomAccessIterator __d_first, _RandomAccessIterator __d_last, _Compare __comp) noexcept | |
2281 | { | |
2282 | return std::partial_sort_copy(__first, __last, __d_first, __d_last, __comp); | |
2283 | } | |
2284 | ||
2285 | template <class _IsVector, class _ExecutionPolicy, class _RandomAccessIterator1, class _RandomAccessIterator2, | |
2286 | class _Compare> | |
2287 | _RandomAccessIterator2 | |
2288 | __pattern_partial_sort_copy(__parallel_tag<_IsVector> __tag, _ExecutionPolicy&& __exec, _RandomAccessIterator1 __first, | |
2289 | _RandomAccessIterator1 __last, _RandomAccessIterator2 __d_first, | |
2290 | _RandomAccessIterator2 __d_last, _Compare __comp) | |
2291 | { | |
2292 | using __backend_tag = typename decltype(__tag)::__backend_tag; | |
2293 | ||
2294 | if (__last == __first || __d_last == __d_first) | |
2295 | { | |
2296 | return __d_first; | |
2297 | } | |
2298 | auto __n1 = __last - __first; | |
2299 | auto __n2 = __d_last - __d_first; | |
2300 | return __internal::__except_handler([&]() { | |
2301 | if (__n2 >= __n1) | |
2302 | { | |
2303 | __par_backend::__parallel_stable_sort( | |
2304 | __backend_tag{}, std::forward<_ExecutionPolicy>(__exec), __d_first, __d_first + __n1, __comp, | |
2305 | [__first, __d_first](_RandomAccessIterator2 __i, _RandomAccessIterator2 __j, _Compare __comp) | |
2306 | { | |
2307 | _RandomAccessIterator1 __i1 = __first + (__i - __d_first); | |
2308 | _RandomAccessIterator1 __j1 = __first + (__j - __d_first); | |
2309 | ||
2310 | // 1. Copy elements from input to output | |
2311 | #if !defined(_PSTL_ICC_18_OMP_SIMD_BROKEN) | |
2312 | __internal::__brick_copy(__i1, __j1, __i, _IsVector{}); | |
2313 | #else | |
2314 | std::copy(__i1, __j1, __i); | |
2315 | #endif | |
2316 | // 2. Sort elements in output sequence | |
2317 | std::sort(__i, __j, __comp); | |
2318 | }, | |
2319 | __n1); | |
2320 | return __d_first + __n1; | |
2321 | } | |
2322 | else | |
2323 | { | |
2324 | typedef typename std::iterator_traits<_RandomAccessIterator1>::value_type _T1; | |
2325 | typedef typename std::iterator_traits<_RandomAccessIterator2>::value_type _T2; | |
2326 | __par_backend::__buffer<_T1> __buf(__n1); | |
2327 | _T1* __r = __buf.get(); | |
2328 | ||
2329 | __par_backend::__parallel_stable_sort( | |
2330 | __backend_tag{}, std::forward<_ExecutionPolicy>(__exec), __r, __r + __n1, __comp, | |
2331 | [__n2, __first, __r](_T1* __i, _T1* __j, _Compare __comp) | |
2332 | { | |
2333 | _RandomAccessIterator1 __it = __first + (__i - __r); | |
2334 | ||
2335 | // 1. Copy elements from input to raw memory | |
2336 | for (_T1* __k = __i; __k != __j; ++__k, ++__it) | |
2337 | { | |
2338 | ::new (__k) _T2(*__it); | |
2339 | } | |
2340 | ||
2341 | // 2. Sort elements in temporary __buffer | |
2342 | if (__n2 < __j - __i) | |
2343 | std::partial_sort(__i, __i + __n2, __j, __comp); | |
2344 | else | |
2345 | std::sort(__i, __j, __comp); | |
2346 | }, | |
2347 | __n2); | |
2348 | ||
2349 | // 3. Move elements from temporary __buffer to output | |
2350 | __par_backend::__parallel_for(__backend_tag{}, std::forward<_ExecutionPolicy>(__exec), __r, __r + __n2, | |
2351 | [__r, __d_first](_T1* __i, _T1* __j) | |
2352 | { __brick_move_destroy()(__i, __j, __d_first + (__i - __r), _IsVector{}); }); | |
2353 | __par_backend::__parallel_for(__backend_tag{}, std::forward<_ExecutionPolicy>(__exec), __r + __n2, | |
2354 | __r + __n1, | |
2355 | [](_T1* __i, _T1* __j) { __brick_destroy(__i, __j, _IsVector{}); }); | |
2356 | ||
2357 | return __d_first + __n2; | |
2358 | } | |
2359 | }); | |
2360 | } | |
2361 | ||
2362 | //------------------------------------------------------------------------ | |
2363 | // adjacent_find | |
2364 | //------------------------------------------------------------------------ | |
2365 | template <class _RandomAccessIterator, class _BinaryPredicate> | |
2366 | _RandomAccessIterator | |
2367 | __brick_adjacent_find(_RandomAccessIterator __first, _RandomAccessIterator __last, _BinaryPredicate __pred, | |
2368 | /* IsVector = */ std::true_type, bool __or_semantic) noexcept | |
2369 | { | |
2370 | return __unseq_backend::__simd_adjacent_find(__first, __last, __pred, __or_semantic); | |
2371 | } | |
2372 | ||
2373 | template <class _ForwardIterator, class _BinaryPredicate> | |
2374 | _ForwardIterator | |
2375 | __brick_adjacent_find(_ForwardIterator __first, _ForwardIterator __last, _BinaryPredicate __pred, | |
2376 | /* IsVector = */ std::false_type, bool) noexcept | |
2377 | { | |
2378 | return std::adjacent_find(__first, __last, __pred); | |
2379 | } | |
2380 | ||
2381 | template <class _Tag, class _ExecutionPolicy, class _ForwardIterator, class _BinaryPredicate> | |
2382 | _ForwardIterator | |
2383 | __pattern_adjacent_find(_Tag, _ExecutionPolicy&&, _ForwardIterator __first, _ForwardIterator __last, | |
2384 | _BinaryPredicate __pred, bool __or_semantic) noexcept | |
2385 | { | |
2386 | return __internal::__brick_adjacent_find(__first, __last, __pred, typename _Tag::__is_vector{}, __or_semantic); | |
2387 | } | |
2388 | ||
2389 | template <class _IsVector, class _ExecutionPolicy, class _RandomAccessIterator, class _BinaryPredicate> | |
2390 | _RandomAccessIterator | |
2391 | __pattern_adjacent_find(__parallel_tag<_IsVector> __tag, _ExecutionPolicy&& __exec, _RandomAccessIterator __first, | |
2392 | _RandomAccessIterator __last, _BinaryPredicate __pred, bool __or_semantic) | |
2393 | { | |
2394 | if (__last - __first < 2) | |
2395 | return __last; | |
2396 | ||
2397 | using __backend_tag = typename decltype(__tag)::__backend_tag; | |
2398 | ||
2399 | return __internal::__except_handler( | |
2400 | [&]() | |
2401 | { | |
2402 | return __par_backend::__parallel_reduce( | |
2403 | __backend_tag{}, std::forward<_ExecutionPolicy>(__exec), __first, __last, __last, | |
2404 | [__last, __pred, __or_semantic](_RandomAccessIterator __begin, _RandomAccessIterator __end, | |
2405 | _RandomAccessIterator __value) -> _RandomAccessIterator | |
2406 | { | |
2407 | // TODO: investigate performance benefits from the use of shared variable for the result, | |
2408 | // checking (compare_and_swap idiom) its __value at __first. | |
2409 | if (__or_semantic && __value < __last) | |
2410 | { //found | |
2411 | __par_backend::__cancel_execution(); | |
2412 | return __value; | |
2413 | } | |
2414 | ||
2415 | if (__value > __begin) | |
2416 | { | |
2417 | // modify __end to check the predicate on the boundary __values; | |
2418 | // TODO: to use a custom range with boundaries overlapping | |
2419 | // TODO: investigate what if we remove "if" below and run algorithm on range [__first, __last-1) | |
2420 | // then check the pair [__last-1, __last) | |
2421 | if (__end != __last) | |
2422 | ++__end; | |
2423 | ||
2424 | //correct the global result iterator if the "brick" returns a local "__last" | |
2425 | const _RandomAccessIterator __res = | |
2426 | __internal::__brick_adjacent_find(__begin, __end, __pred, _IsVector{}, __or_semantic); | |
2427 | if (__res < __end) | |
2428 | __value = __res; | |
2429 | } | |
2430 | return __value; | |
2431 | }, | |
2432 | [](_RandomAccessIterator __x, _RandomAccessIterator __y) -> _RandomAccessIterator | |
2433 | { return __x < __y ? __x : __y; } //reduce a __value | |
2434 | ); | |
2435 | }); | |
2436 | } | |
2437 | ||
2438 | //------------------------------------------------------------------------ | |
2439 | // nth_element | |
2440 | //------------------------------------------------------------------------ | |
2441 | ||
2442 | template <class _Tag, class _ExecutionPolicy, class _RandomAccessIterator, class _Compare> | |
2443 | void | |
2444 | __pattern_nth_element(_Tag, _ExecutionPolicy&&, _RandomAccessIterator __first, _RandomAccessIterator __nth, | |
2445 | _RandomAccessIterator __last, _Compare __comp) noexcept | |
2446 | { | |
2447 | std::nth_element(__first, __nth, __last, __comp); | |
2448 | } | |
2449 | ||
2450 | template <class _IsVector, class _ExecutionPolicy, class _RandomAccessIterator, class _Compare> | |
2451 | void | |
2452 | __pattern_nth_element(__parallel_tag<_IsVector> __tag, _ExecutionPolicy&& __exec, _RandomAccessIterator __first, | |
2453 | _RandomAccessIterator __nth, _RandomAccessIterator __last, _Compare __comp) noexcept | |
2454 | { | |
2455 | if (__first == __last || __nth == __last) | |
2456 | { | |
2457 | return; | |
2458 | } | |
2459 | ||
2460 | using std::iter_swap; | |
2461 | typedef typename std::iterator_traits<_RandomAccessIterator>::value_type _Tp; | |
2462 | _RandomAccessIterator __x; | |
2463 | do | |
2464 | { | |
2465 | __x = __internal::__pattern_partition(__tag, std::forward<_ExecutionPolicy>(__exec), __first + 1, __last, | |
2466 | [&__comp, __first](const _Tp& __x) { return __comp(__x, *__first); }); | |
2467 | --__x; | |
2468 | if (__x != __first) | |
2469 | { | |
2470 | iter_swap(__first, __x); | |
2471 | } | |
2472 | // if x > nth then our new range for partition is [first, x) | |
2473 | if (__x - __nth > 0) | |
2474 | { | |
2475 | __last = __x; | |
2476 | } | |
2477 | // if x < nth then our new range for partition is [x, last) | |
2478 | else if (__x - __nth < 0) | |
2479 | { | |
2480 | // if *x == *nth then we can start new partition with x+1 | |
2481 | if (!__comp(*__nth, *__x) && !__comp(*__x, *__nth)) | |
2482 | { | |
2483 | ++__x; | |
2484 | } | |
2485 | else | |
2486 | { | |
2487 | iter_swap(__nth, __x); | |
2488 | } | |
2489 | __first = __x; | |
2490 | } | |
2491 | } while (__x != __nth); | |
2492 | } | |
2493 | ||
2494 | //------------------------------------------------------------------------ | |
2495 | // fill, fill_n | |
2496 | //------------------------------------------------------------------------ | |
2497 | template <class _RandomAccessIterator, class _Tp> | |
2498 | void | |
2499 | __brick_fill(_RandomAccessIterator __first, _RandomAccessIterator __last, const _Tp& __value, | |
2500 | /* __is_vector = */ std::true_type) noexcept | |
2501 | { | |
2502 | __unseq_backend::__simd_fill_n(__first, __last - __first, __value); | |
2503 | } | |
2504 | ||
2505 | template <class _ForwardIterator, class _Tp> | |
2506 | void | |
2507 | __brick_fill(_ForwardIterator __first, _ForwardIterator __last, const _Tp& __value, | |
2508 | /* __is_vector = */ std::false_type) noexcept | |
2509 | { | |
2510 | std::fill(__first, __last, __value); | |
2511 | } | |
2512 | ||
2513 | template <class _Tag, class _ExecutionPolicy, class _ForwardIterator, class _Tp> | |
2514 | void | |
2515 | __pattern_fill(_Tag, _ExecutionPolicy&&, _ForwardIterator __first, _ForwardIterator __last, const _Tp& __value) noexcept | |
2516 | { | |
2517 | __internal::__brick_fill(__first, __last, __value, typename _Tag::__is_vector{}); | |
2518 | } | |
2519 | ||
2520 | template <class _IsVector, class _ExecutionPolicy, class _RandomAccessIterator, class _Tp> | |
2521 | _RandomAccessIterator | |
2522 | __pattern_fill(__parallel_tag<_IsVector> __tag, _ExecutionPolicy&& __exec, _RandomAccessIterator __first, | |
2523 | _RandomAccessIterator __last, const _Tp& __value) | |
2524 | { | |
2525 | using __backend_tag = typename decltype(__tag)::__backend_tag; | |
2526 | ||
2527 | return __internal::__except_handler( | |
2528 | [&__exec, __first, __last, &__value]() | |
2529 | { | |
2530 | __par_backend::__parallel_for(__backend_tag{}, std::forward<_ExecutionPolicy>(__exec), __first, __last, | |
2531 | [&__value](_RandomAccessIterator __begin, _RandomAccessIterator __end) | |
2532 | { __internal::__brick_fill(__begin, __end, __value, _IsVector{}); }); | |
2533 | return __last; | |
2534 | }); | |
2535 | } | |
2536 | ||
2537 | template <class _RandomAccessIterator, class _Size, class _Tp> | |
2538 | _RandomAccessIterator | |
2539 | __brick_fill_n(_RandomAccessIterator __first, _Size __count, const _Tp& __value, | |
2540 | /* __is_vector = */ std::true_type) noexcept | |
2541 | { | |
2542 | return __unseq_backend::__simd_fill_n(__first, __count, __value); | |
2543 | } | |
2544 | ||
2545 | template <class _OutputIterator, class _Size, class _Tp> | |
2546 | _OutputIterator | |
2547 | __brick_fill_n(_OutputIterator __first, _Size __count, const _Tp& __value, /* __is_vector = */ std::false_type) noexcept | |
2548 | { | |
2549 | return std::fill_n(__first, __count, __value); | |
2550 | } | |
2551 | ||
2552 | template <class _Tag, class _ExecutionPolicy, class _OutputIterator, class _Size, class _Tp> | |
2553 | _OutputIterator | |
2554 | __pattern_fill_n(_Tag, _ExecutionPolicy&&, _OutputIterator __first, _Size __count, const _Tp& __value) noexcept | |
2555 | { | |
2556 | return __internal::__brick_fill_n(__first, __count, __value, typename _Tag::__is_vector{}); | |
2557 | } | |
2558 | ||
2559 | template <class _IsVector, class _ExecutionPolicy, class _RandomAccessIterator, class _Size, class _Tp> | |
2560 | _RandomAccessIterator | |
2561 | __pattern_fill_n(__parallel_tag<_IsVector> __tag, _ExecutionPolicy&& __exec, _RandomAccessIterator __first, | |
2562 | _Size __count, const _Tp& __value) | |
2563 | { | |
2564 | return __internal::__pattern_fill(__tag, std::forward<_ExecutionPolicy>(__exec), __first, __first + __count, | |
2565 | __value); | |
2566 | } | |
2567 | ||
2568 | //------------------------------------------------------------------------ | |
2569 | // generate, generate_n | |
2570 | //------------------------------------------------------------------------ | |
2571 | template <class _RandomAccessIterator, class _Generator> | |
2572 | void | |
2573 | __brick_generate(_RandomAccessIterator __first, _RandomAccessIterator __last, _Generator __g, | |
2574 | /* is_vector = */ std::true_type) noexcept | |
2575 | { | |
2576 | __unseq_backend::__simd_generate_n(__first, __last - __first, __g); | |
2577 | } | |
2578 | ||
2579 | template <class _ForwardIterator, class _Generator> | |
2580 | void | |
2581 | __brick_generate(_ForwardIterator __first, _ForwardIterator __last, _Generator __g, | |
2582 | /* is_vector = */ std::false_type) noexcept | |
2583 | { | |
2584 | std::generate(__first, __last, __g); | |
2585 | } | |
2586 | ||
2587 | template <class _Tag, class _ExecutionPolicy, class _ForwardIterator, class _Generator> | |
2588 | void | |
2589 | __pattern_generate(_Tag, _ExecutionPolicy&&, _ForwardIterator __first, _ForwardIterator __last, _Generator __g) noexcept | |
2590 | { | |
2591 | __internal::__brick_generate(__first, __last, __g, typename _Tag::__is_vector{}); | |
2592 | } | |
2593 | ||
2594 | template <class _IsVector, class _ExecutionPolicy, class _RandomAccessIterator, class _Generator> | |
2595 | _RandomAccessIterator | |
2596 | __pattern_generate(__parallel_tag<_IsVector> __tag, _ExecutionPolicy&& __exec, _RandomAccessIterator __first, | |
2597 | _RandomAccessIterator __last, _Generator __g) | |
2598 | { | |
2599 | using __backend_tag = typename decltype(__tag)::__backend_tag; | |
2600 | ||
2601 | return __internal::__except_handler( | |
2602 | [&]() | |
2603 | { | |
2604 | __par_backend::__parallel_for(__backend_tag{}, std::forward<_ExecutionPolicy>(__exec), __first, __last, | |
2605 | [__g](_RandomAccessIterator __begin, _RandomAccessIterator __end) | |
2606 | { __internal::__brick_generate(__begin, __end, __g, _IsVector{}); }); | |
2607 | return __last; | |
2608 | }); | |
2609 | } | |
2610 | ||
2611 | template <class _RandomAccessIterator, class _Size, class _Generator> | |
2612 | _RandomAccessIterator | |
2613 | __brick_generate_n(_RandomAccessIterator __first, _Size __count, _Generator __g, | |
2614 | /* is_vector = */ std::true_type) noexcept | |
2615 | { | |
2616 | return __unseq_backend::__simd_generate_n(__first, __count, __g); | |
2617 | } | |
2618 | ||
2619 | template <class _OutputIterator, class _Size, class _Generator> | |
2620 | _OutputIterator | |
2621 | __brick_generate_n(_OutputIterator __first, _Size __count, _Generator __g, /* is_vector = */ std::false_type) noexcept | |
2622 | { | |
2623 | return std::generate_n(__first, __count, __g); | |
2624 | } | |
2625 | ||
2626 | template <class _Tag, class _ExecutionPolicy, class _OutputIterator, class _Size, class _Generator> | |
2627 | _OutputIterator | |
2628 | __pattern_generate_n(_Tag, _ExecutionPolicy&&, _OutputIterator __first, _Size __count, _Generator __g) noexcept | |
2629 | { | |
2630 | return __internal::__brick_generate_n(__first, __count, __g, typename _Tag::__is_vector{}); | |
2631 | } | |
2632 | ||
2633 | template <class _IsVector, class _ExecutionPolicy, class _RandomAccessIterator, class _Size, class _Generator> | |
2634 | _RandomAccessIterator | |
2635 | __pattern_generate_n(__parallel_tag<_IsVector> __tag, _ExecutionPolicy&& __exec, _RandomAccessIterator __first, | |
2636 | _Size __count, _Generator __g) | |
2637 | { | |
2638 | static_assert(__are_random_access_iterators<_RandomAccessIterator>::value, | |
2639 | "Pattern-brick error. Should be a random access iterator."); | |
2640 | return __internal::__pattern_generate(__tag, std::forward<_ExecutionPolicy>(__exec), __first, __first + __count, | |
2641 | __g); | |
2642 | } | |
2643 | ||
2644 | //------------------------------------------------------------------------ | |
2645 | // remove | |
2646 | //------------------------------------------------------------------------ | |
2647 | ||
2648 | template <class _ForwardIterator, class _UnaryPredicate> | |
2649 | _ForwardIterator | |
2650 | __brick_remove_if(_ForwardIterator __first, _ForwardIterator __last, _UnaryPredicate __pred, | |
2651 | /* __is_vector = */ std::false_type) noexcept | |
2652 | { | |
2653 | return std::remove_if(__first, __last, __pred); | |
2654 | } | |
2655 | ||
2656 | template <class _RandomAccessIterator, class _UnaryPredicate> | |
2657 | _RandomAccessIterator | |
2658 | __brick_remove_if(_RandomAccessIterator __first, _RandomAccessIterator __last, _UnaryPredicate __pred, | |
2659 | /* __is_vector = */ std::true_type) noexcept | |
2660 | { | |
2661 | #if defined(_PSTL_MONOTONIC_PRESENT) | |
2662 | return __unseq_backend::__simd_remove_if(__first, __last - __first, __pred); | |
2663 | #else | |
2664 | return std::remove_if(__first, __last, __pred); | |
2665 | #endif | |
2666 | } | |
2667 | ||
2668 | template <class _Tag, class _ExecutionPolicy, class _ForwardIterator, class _UnaryPredicate> | |
2669 | _ForwardIterator | |
2670 | __pattern_remove_if(_Tag, _ExecutionPolicy&&, _ForwardIterator __first, _ForwardIterator __last, | |
2671 | _UnaryPredicate __pred) noexcept | |
2672 | { | |
2673 | return __internal::__brick_remove_if(__first, __last, __pred, typename _Tag::__is_vector{}); | |
2674 | } | |
2675 | ||
2676 | template <class _IsVector, class _ExecutionPolicy, class _RandomAccessIterator, class _UnaryPredicate> | |
2677 | _RandomAccessIterator | |
2678 | __pattern_remove_if(__parallel_tag<_IsVector> __tag, _ExecutionPolicy&& __exec, _RandomAccessIterator __first, | |
2679 | _RandomAccessIterator __last, _UnaryPredicate __pred) noexcept | |
2680 | { | |
2681 | typedef typename std::iterator_traits<_RandomAccessIterator>::reference _ReferenceType; | |
2682 | ||
2683 | if (__first == __last || __first + 1 == __last) | |
2684 | { | |
2685 | // Trivial sequence - use serial algorithm | |
2686 | return __internal::__brick_remove_if(__first, __last, __pred, _IsVector{}); | |
2687 | } | |
2688 | ||
2689 | return __internal::__remove_elements( | |
2690 | __tag, std::forward<_ExecutionPolicy>(__exec), __first, __last, | |
2691 | [&__pred](bool* __b, bool* __e, _RandomAccessIterator __it) | |
2692 | { | |
2693 | __internal::__brick_walk2( | |
2694 | __b, __e, __it, [&__pred](bool& __x, _ReferenceType __y) { __x = !__pred(__y); }, _IsVector{}); | |
2695 | }); | |
2696 | } | |
2697 | ||
2698 | //------------------------------------------------------------------------ | |
2699 | // merge | |
2700 | //------------------------------------------------------------------------ | |
2701 | ||
2702 | template <class _ForwardIterator1, class _ForwardIterator2, class _OutputIterator, class _Compare> | |
2703 | _OutputIterator | |
2704 | __brick_merge(_ForwardIterator1 __first1, _ForwardIterator1 __last1, _ForwardIterator2 __first2, | |
2705 | _ForwardIterator2 __last2, _OutputIterator __d_first, _Compare __comp, | |
2706 | /* __is_vector = */ std::false_type) noexcept | |
2707 | { | |
2708 | return std::merge(__first1, __last1, __first2, __last2, __d_first, __comp); | |
2709 | } | |
2710 | ||
2711 | template <class _RandomAccessIterator1, class _RandomAccessIterator2, class _RandomAccessIterator3, class _Compare> | |
2712 | _RandomAccessIterator3 | |
2713 | __brick_merge(_RandomAccessIterator1 __first1, _RandomAccessIterator1 __last1, _RandomAccessIterator2 __first2, | |
2714 | _RandomAccessIterator2 __last2, _RandomAccessIterator3 __d_first, _Compare __comp, | |
2715 | /* __is_vector = */ std::true_type) noexcept | |
2716 | { | |
2717 | _PSTL_PRAGMA_MESSAGE("Vectorized algorithm unimplemented, redirected to serial"); | |
2718 | return std::merge(__first1, __last1, __first2, __last2, __d_first, __comp); | |
2719 | } | |
2720 | ||
2721 | template <class _Tag, class _ExecutionPolicy, class _ForwardIterator1, class _ForwardIterator2, class _OutputIterator, | |
2722 | class _Compare> | |
2723 | _OutputIterator | |
2724 | __pattern_merge(_Tag, _ExecutionPolicy&&, _ForwardIterator1 __first1, _ForwardIterator1 __last1, | |
2725 | _ForwardIterator2 __first2, _ForwardIterator2 __last2, _OutputIterator __d_first, | |
2726 | _Compare __comp) noexcept | |
2727 | { | |
2728 | return __internal::__brick_merge(__first1, __last1, __first2, __last2, __d_first, __comp, | |
2729 | typename _Tag::__is_vector{}); | |
2730 | } | |
2731 | ||
2732 | template <class _IsVector, class _ExecutionPolicy, class _RandomAccessIterator1, class _RandomAccessIterator2, | |
2733 | class _RandomAccessIterator3, class _Compare> | |
2734 | _RandomAccessIterator3 | |
2735 | __pattern_merge(__parallel_tag<_IsVector> __tag, _ExecutionPolicy&& __exec, _RandomAccessIterator1 __first1, | |
2736 | _RandomAccessIterator1 __last1, _RandomAccessIterator2 __first2, _RandomAccessIterator2 __last2, | |
2737 | _RandomAccessIterator3 __d_first, _Compare __comp) | |
2738 | { | |
2739 | using __backend_tag = typename decltype(__tag)::__backend_tag; | |
2740 | ||
2741 | __par_backend::__parallel_merge( | |
2742 | __backend_tag{}, std::forward<_ExecutionPolicy>(__exec), __first1, __last1, __first2, __last2, __d_first, | |
2743 | __comp, | |
2744 | [](_RandomAccessIterator1 __f1, _RandomAccessIterator1 __l1, _RandomAccessIterator2 __f2, | |
2745 | _RandomAccessIterator2 __l2, _RandomAccessIterator3 __f3, _Compare __comp) | |
2746 | { return __internal::__brick_merge(__f1, __l1, __f2, __l2, __f3, __comp, _IsVector{}); }); | |
2747 | return __d_first + (__last1 - __first1) + (__last2 - __first2); | |
2748 | } | |
2749 | ||
2750 | //------------------------------------------------------------------------ | |
2751 | // inplace_merge | |
2752 | //------------------------------------------------------------------------ | |
2753 | template <class _BidirectionalIterator, class _Compare> | |
2754 | void | |
2755 | __brick_inplace_merge(_BidirectionalIterator __first, _BidirectionalIterator __middle, _BidirectionalIterator __last, | |
2756 | _Compare __comp, /* __is_vector = */ std::false_type) noexcept | |
2757 | { | |
2758 | std::inplace_merge(__first, __middle, __last, __comp); | |
2759 | } | |
2760 | ||
2761 | template <class _RandomAccessIterator, class _Compare> | |
2762 | void | |
2763 | __brick_inplace_merge(_RandomAccessIterator __first, _RandomAccessIterator __middle, _RandomAccessIterator __last, | |
2764 | _Compare __comp, /* __is_vector = */ std::true_type) noexcept | |
2765 | { | |
2766 | _PSTL_PRAGMA_MESSAGE("Vectorized algorithm unimplemented, redirected to serial") | |
2767 | std::inplace_merge(__first, __middle, __last, __comp); | |
2768 | } | |
2769 | ||
2770 | template <class _Tag, class _ExecutionPolicy, class _BidirectionalIterator, class _Compare> | |
2771 | void | |
2772 | __pattern_inplace_merge(_Tag, _ExecutionPolicy&&, _BidirectionalIterator __first, _BidirectionalIterator __middle, | |
2773 | _BidirectionalIterator __last, _Compare __comp) noexcept | |
2774 | { | |
2775 | __internal::__brick_inplace_merge(__first, __middle, __last, __comp, typename _Tag::__is_vector{}); | |
2776 | } | |
2777 | ||
2778 | template <class _IsVector, class _ExecutionPolicy, class _RandomAccessIterator, class _Compare> | |
2779 | void | |
2780 | __pattern_inplace_merge(__parallel_tag<_IsVector> __tag, _ExecutionPolicy&& __exec, _RandomAccessIterator __first, | |
2781 | _RandomAccessIterator __middle, _RandomAccessIterator __last, _Compare __comp) | |
2782 | { | |
2783 | using __backend_tag = typename decltype(__tag)::__backend_tag; | |
2784 | ||
2785 | if (__first == __last || __first == __middle || __middle == __last) | |
2786 | { | |
2787 | return; | |
2788 | } | |
2789 | typedef typename std::iterator_traits<_RandomAccessIterator>::value_type _Tp; | |
2790 | auto __n = __last - __first; | |
2791 | __par_backend::__buffer<_Tp> __buf(__n); | |
2792 | _Tp* __r = __buf.get(); | |
2793 | __internal::__except_handler( | |
2794 | [&]() | |
2795 | { | |
2796 | auto __move_values = [](_RandomAccessIterator __x, _Tp* __z) | |
2797 | { | |
2798 | __internal::__invoke_if_else( | |
2799 | std::conjunction<std::is_trivially_copyable<_Tp>, std::is_trivially_default_constructible<_Tp>>(), | |
2800 | [&]() { *__z = std::move(*__x); }, | |
2801 | [&]() { ::new (std::addressof(*__z)) _Tp(std::move(*__x)); }); | |
2802 | }; | |
2803 | ||
2804 | auto __move_sequences = [](_RandomAccessIterator __first1, _RandomAccessIterator __last1, _Tp* __first2) | |
2805 | { return __internal::__brick_uninitialized_move(__first1, __last1, __first2, _IsVector()); }; | |
2806 | ||
2807 | __par_backend::__parallel_merge( | |
2808 | __backend_tag{}, std::forward<_ExecutionPolicy>(__exec), __first, __middle, __middle, __last, __r, | |
2809 | __comp, | |
2810 | [__n, __move_values, __move_sequences](_RandomAccessIterator __f1, _RandomAccessIterator __l1, | |
2811 | _RandomAccessIterator __f2, _RandomAccessIterator __l2, | |
2812 | _Tp* __f3, _Compare __comp) | |
2813 | { | |
2814 | (__utils::__serial_move_merge(__n))(__f1, __l1, __f2, __l2, __f3, __comp, __move_values, | |
2815 | __move_values, __move_sequences, __move_sequences); | |
2816 | return __f3 + (__l1 - __f1) + (__l2 - __f2); | |
2817 | }); | |
2818 | __par_backend::__parallel_for(__backend_tag{}, std::forward<_ExecutionPolicy>(__exec), __r, __r + __n, | |
2819 | [__r, __first](_Tp* __i, _Tp* __j) | |
2820 | { __brick_move_destroy()(__i, __j, __first + (__i - __r), _IsVector{}); }); | |
2821 | }); | |
2822 | } | |
2823 | ||
2824 | //------------------------------------------------------------------------ | |
2825 | // includes | |
2826 | //------------------------------------------------------------------------ | |
2827 | ||
2828 | template <class _Tag, class _ExecutionPolicy, class _ForwardIterator1, class _ForwardIterator2, class _Compare> | |
2829 | bool | |
2830 | __pattern_includes(_Tag, _ExecutionPolicy&&, _ForwardIterator1 __first1, _ForwardIterator1 __last1, | |
2831 | _ForwardIterator2 __first2, _ForwardIterator2 __last2, _Compare __comp) noexcept | |
2832 | { | |
2833 | return std::includes(__first1, __last1, __first2, __last2, __comp); | |
2834 | } | |
2835 | ||
2836 | template <class _IsVector, class _ExecutionPolicy, class _RandomAccessIterator1, class _RandomAccessIterator2, | |
2837 | class _Compare> | |
2838 | bool | |
2839 | __pattern_includes(__parallel_tag<_IsVector> __tag, _ExecutionPolicy&& __exec, _RandomAccessIterator1 __first1, | |
2840 | _RandomAccessIterator1 __last1, _RandomAccessIterator2 __first2, _RandomAccessIterator2 __last2, | |
2841 | _Compare __comp) | |
2842 | { | |
2843 | using __backend_tag = typename decltype(__tag)::__backend_tag; | |
2844 | ||
2845 | if (__first2 >= __last2) | |
2846 | return true; | |
2847 | ||
2848 | if (__first1 >= __last1 || __comp(*__first2, *__first1) || __comp(*(__last1 - 1), *(__last2 - 1))) | |
2849 | return false; | |
2850 | ||
2851 | __first1 = std::lower_bound(__first1, __last1, *__first2, __comp); | |
2852 | if (__first1 == __last1) | |
2853 | return false; | |
2854 | ||
2855 | if (__last2 - __first2 == 1) | |
2856 | return !__comp(*__first1, *__first2) && !__comp(*__first2, *__first1); | |
2857 | ||
2858 | return __internal::__except_handler( | |
2859 | [&]() | |
2860 | { | |
2861 | return !__internal::__parallel_or( | |
2862 | __backend_tag{}, std::forward<_ExecutionPolicy>(__exec), __first2, __last2, | |
2863 | [__first1, __last1, __first2, __last2, &__comp](_RandomAccessIterator2 __i, _RandomAccessIterator2 __j) | |
2864 | { | |
2865 | _PSTL_ASSERT(__j > __i); | |
2866 | //_PSTL_ASSERT(__j - __i > 1); | |
2867 | ||
2868 | //1. moving boundaries to "consume" subsequence of equal elements | |
2869 | auto __is_equal = [&__comp](_RandomAccessIterator2 __a, _RandomAccessIterator2 __b) -> bool | |
2870 | { return !__comp(*__a, *__b) && !__comp(*__b, *__a); }; | |
2871 | ||
2872 | //1.1 left bound, case "aaa[aaaxyz...]" - searching "x" | |
2873 | if (__i > __first2 && __is_equal(__i, __i - 1)) | |
2874 | { | |
2875 | //whole subrange continues to content equal elements - return "no op" | |
2876 | if (__is_equal(__i, __j - 1)) | |
2877 | return false; | |
2878 | ||
2879 | __i = std::upper_bound(__i, __last2, *__i, __comp); | |
2880 | } | |
2881 | ||
2882 | //1.2 right bound, case "[...aaa]aaaxyz" - searching "x" | |
2883 | if (__j < __last2 && __is_equal(__j - 1, __j)) | |
2884 | __j = std::upper_bound(__j, __last2, *__j, __comp); | |
2885 | ||
2886 | //2. testing is __a subsequence of the second range included into the first range | |
2887 | auto __b = std::lower_bound(__first1, __last1, *__i, __comp); | |
2888 | ||
2889 | _PSTL_ASSERT(!__comp(*(__last1 - 1), *__b)); | |
2890 | _PSTL_ASSERT(!__comp(*(__j - 1), *__i)); | |
2891 | return !std::includes(__b, __last1, __i, __j, __comp); | |
2892 | }); | |
2893 | }); | |
2894 | } | |
2895 | ||
2896 | inline constexpr auto __set_algo_cut_off = 1000; | |
2897 | ||
2898 | template <class _IsVector, class _ExecutionPolicy, class _ForwardIterator1, class _ForwardIterator2, | |
2899 | class _OutputIterator, class _Compare, class _SizeFunction, class _SetOP> | |
2900 | _OutputIterator | |
2901 | __parallel_set_op(__parallel_tag<_IsVector> __tag, _ExecutionPolicy&& __exec, _ForwardIterator1 __first1, | |
2902 | _ForwardIterator1 __last1, _ForwardIterator2 __first2, _ForwardIterator2 __last2, | |
2903 | _OutputIterator __result, _Compare __comp, _SizeFunction __size_func, _SetOP __set_op) | |
2904 | { | |
2905 | using __backend_tag = typename decltype(__tag)::__backend_tag; | |
2906 | ||
2907 | typedef typename std::iterator_traits<_ForwardIterator1>::difference_type _DifferenceType; | |
2908 | typedef typename std::iterator_traits<_OutputIterator>::value_type _Tp; | |
2909 | ||
2910 | struct _SetRange | |
2911 | { | |
2912 | _DifferenceType __pos, __len, __buf_pos; | |
2913 | bool | |
2914 | empty() const | |
2915 | { | |
2916 | return __len == 0; | |
2917 | } | |
2918 | }; | |
2919 | ||
2920 | const _DifferenceType __n1 = __last1 - __first1; | |
2921 | const _DifferenceType __n2 = __last2 - __first2; | |
2922 | ||
2923 | __par_backend::__buffer<_Tp> __buf(__size_func(__n1, __n2)); | |
2924 | ||
2925 | return __internal::__except_handler( | |
2926 | [&__exec, __n1, __first1, __last1, __first2, __last2, __result, __comp, __size_func, __set_op, &__buf]() | |
2927 | { | |
2928 | auto __buffer = __buf.get(); | |
2929 | _DifferenceType __m{}; | |
2930 | auto __scan = [=](_DifferenceType, _DifferenceType, const _SetRange& __s) { // Scan | |
2931 | if (!__s.empty()) | |
2932 | __brick_move_destroy()(__buffer + __s.__buf_pos, __buffer + (__s.__buf_pos + __s.__len), | |
2933 | __result + __s.__pos, _IsVector{}); | |
2934 | }; | |
2935 | __par_backend::__parallel_strict_scan( | |
2936 | __backend_tag{}, std::forward<_ExecutionPolicy>(__exec), __n1, _SetRange{0, 0, 0}, //-1, 0}, | |
2937 | [=](_DifferenceType __i, _DifferenceType __len) { // Reduce | |
2938 | //[__b; __e) - a subrange of the first sequence, to reduce | |
2939 | _ForwardIterator1 __b = __first1 + __i, __e = __first1 + (__i + __len); | |
2940 | ||
2941 | //try searching for the first element which not equal to *__b | |
2942 | if (__b != __first1) | |
2943 | __b = std::upper_bound(__b, __last1, *__b, __comp); | |
2944 | ||
2945 | //try searching for the first element which not equal to *__e | |
2946 | if (__e != __last1) | |
2947 | __e = std::upper_bound(__e, __last1, *__e, __comp); | |
2948 | ||
2949 | //check is [__b; __e) empty | |
2950 | if (__e - __b < 1) | |
2951 | { | |
2952 | _ForwardIterator2 __bb = __last2; | |
2953 | if (__b != __last1) | |
2954 | __bb = std::lower_bound(__first2, __last2, *__b, __comp); | |
2955 | ||
2956 | const _DifferenceType __buf_pos = __size_func((__b - __first1), (__bb - __first2)); | |
2957 | return _SetRange{0, 0, __buf_pos}; | |
2958 | } | |
2959 | ||
2960 | //try searching for "corresponding" subrange [__bb; __ee) in the second sequence | |
2961 | _ForwardIterator2 __bb = __first2; | |
2962 | if (__b != __first1) | |
2963 | __bb = std::lower_bound(__first2, __last2, *__b, __comp); | |
2964 | ||
2965 | _ForwardIterator2 __ee = __last2; | |
2966 | if (__e != __last1) | |
2967 | __ee = std::lower_bound(__bb, __last2, *__e, __comp); | |
2968 | ||
2969 | const _DifferenceType __buf_pos = __size_func((__b - __first1), (__bb - __first2)); | |
2970 | auto __buffer_b = __buffer + __buf_pos; | |
2971 | auto __res = __set_op(__b, __e, __bb, __ee, __buffer_b, __comp); | |
2972 | ||
2973 | return _SetRange{0, __res - __buffer_b, __buf_pos}; | |
2974 | }, | |
2975 | [](const _SetRange& __a, const _SetRange& __b) { // Combine | |
2976 | if (__b.__buf_pos > __a.__buf_pos || ((__b.__buf_pos == __a.__buf_pos) && !__b.empty())) | |
2977 | return _SetRange{__a.__pos + __a.__len + __b.__pos, __b.__len, __b.__buf_pos}; | |
2978 | return _SetRange{__b.__pos + __b.__len + __a.__pos, __a.__len, __a.__buf_pos}; | |
2979 | }, | |
2980 | __scan, // Scan | |
2981 | [&__m, &__scan](const _SetRange& __total) { // Apex | |
2982 | //final scan | |
2983 | __scan(0, 0, __total); | |
2984 | __m = __total.__pos + __total.__len; | |
2985 | }); | |
2986 | return __result + __m; | |
2987 | }); | |
2988 | } | |
2989 | ||
2990 | //a shared parallel pattern for '__pattern_set_union' and '__pattern_set_symmetric_difference' | |
2991 | template <class _Tag, class _ExecutionPolicy, class _ForwardIterator1, class _ForwardIterator2, class _OutputIterator, | |
2992 | class _Compare, class _SetUnionOp> | |
2993 | _OutputIterator | |
2994 | __parallel_set_union_op(_Tag __tag, _ExecutionPolicy&& __exec, _ForwardIterator1 __first1, _ForwardIterator1 __last1, | |
2995 | _ForwardIterator2 __first2, _ForwardIterator2 __last2, _OutputIterator __result, | |
2996 | _Compare __comp, _SetUnionOp __set_union_op) | |
2997 | { | |
2998 | using __backend_tag = typename decltype(__tag)::__backend_tag; | |
2999 | ||
3000 | typedef typename std::iterator_traits<_ForwardIterator1>::difference_type _DifferenceType; | |
3001 | ||
3002 | const auto __n1 = __last1 - __first1; | |
3003 | const auto __n2 = __last2 - __first2; | |
3004 | ||
3005 | auto copy_range1 = [](_ForwardIterator1 __begin, _ForwardIterator1 __end, _OutputIterator __res) | |
3006 | { return __internal::__brick_copy(__begin, __end, __res, typename _Tag::__is_vector{}); }; | |
3007 | auto copy_range2 = [](_ForwardIterator2 __begin, _ForwardIterator2 __end, _OutputIterator __res) | |
3008 | { return __internal::__brick_copy(__begin, __end, __res, typename _Tag::__is_vector{}); }; | |
3009 | ||
3010 | // {1} {}: parallel copying just first sequence | |
3011 | if (__n2 == 0) | |
3012 | return __internal::__pattern_walk2_brick(__tag, std::forward<_ExecutionPolicy>(__exec), __first1, __last1, | |
3013 | __result, copy_range1); | |
3014 | ||
3015 | // {} {2}: parallel copying justmake second sequence | |
3016 | if (__n1 == 0) | |
3017 | return __internal::__pattern_walk2_brick(__tag, std::forward<_ExecutionPolicy>(__exec), __first2, __last2, | |
3018 | __result, copy_range2); | |
3019 | ||
3020 | // testing whether the sequences are intersected | |
3021 | _ForwardIterator1 __left_bound_seq_1 = std::lower_bound(__first1, __last1, *__first2, __comp); | |
3022 | ||
3023 | if (__left_bound_seq_1 == __last1) | |
3024 | { | |
3025 | //{1} < {2}: seq2 is wholly greater than seq1, so, do parallel copying seq1 and seq2 | |
3026 | __par_backend::__parallel_invoke( | |
3027 | __backend_tag{}, std::forward<_ExecutionPolicy>(__exec), | |
3028 | [=] | |
3029 | { | |
3030 | __internal::__pattern_walk2_brick(__tag, std::forward<_ExecutionPolicy>(__exec), __first1, __last1, | |
3031 | __result, copy_range1); | |
3032 | }, | |
3033 | [=] | |
3034 | { | |
3035 | __internal::__pattern_walk2_brick(__tag, std::forward<_ExecutionPolicy>(__exec), __first2, __last2, | |
3036 | __result + __n1, copy_range2); | |
3037 | }); | |
3038 | return __result + __n1 + __n2; | |
3039 | } | |
3040 | ||
3041 | // testing whether the sequences are intersected | |
3042 | _ForwardIterator2 __left_bound_seq_2 = std::lower_bound(__first2, __last2, *__first1, __comp); | |
3043 | ||
3044 | if (__left_bound_seq_2 == __last2) | |
3045 | { | |
3046 | //{2} < {1}: seq2 is wholly greater than seq1, so, do parallel copying seq1 and seq2 | |
3047 | __par_backend::__parallel_invoke( | |
3048 | __backend_tag{}, std::forward<_ExecutionPolicy>(__exec), | |
3049 | [=] | |
3050 | { | |
3051 | __internal::__pattern_walk2_brick(__tag, std::forward<_ExecutionPolicy>(__exec), __first2, __last2, | |
3052 | __result, copy_range2); | |
3053 | }, | |
3054 | [=] | |
3055 | { | |
3056 | __internal::__pattern_walk2_brick(__tag, std::forward<_ExecutionPolicy>(__exec), __first1, __last1, | |
3057 | __result + __n2, copy_range1); | |
3058 | }); | |
3059 | return __result + __n1 + __n2; | |
3060 | } | |
3061 | ||
3062 | const auto __m1 = __left_bound_seq_1 - __first1; | |
3063 | if (__m1 > __set_algo_cut_off) | |
3064 | { | |
3065 | auto __res_or = __result; | |
3066 | __result += __m1; //we know proper offset due to [first1; left_bound_seq_1) < [first2; last2) | |
3067 | __par_backend::__parallel_invoke( | |
3068 | __backend_tag{}, std::forward<_ExecutionPolicy>(__exec), | |
3069 | //do parallel copying of [first1; left_bound_seq_1) | |
3070 | [=] | |
3071 | { | |
3072 | __internal::__pattern_walk2_brick(__tag, std::forward<_ExecutionPolicy>(__exec), __first1, | |
3073 | __left_bound_seq_1, __res_or, copy_range1); | |
3074 | }, | |
3075 | [=, &__result] | |
3076 | { | |
3077 | __result = __internal::__parallel_set_op( | |
3078 | __tag, std::forward<_ExecutionPolicy>(__exec), __left_bound_seq_1, __last1, __first2, __last2, | |
3079 | __result, __comp, [](_DifferenceType __n, _DifferenceType __m) { return __n + __m; }, | |
3080 | __set_union_op); | |
3081 | }); | |
3082 | return __result; | |
3083 | } | |
3084 | ||
3085 | const auto __m2 = __left_bound_seq_2 - __first2; | |
3086 | _PSTL_ASSERT(__m1 == 0 || __m2 == 0); | |
3087 | if (__m2 > __set_algo_cut_off) | |
3088 | { | |
3089 | auto __res_or = __result; | |
3090 | __result += __m2; //we know proper offset due to [first2; left_bound_seq_2) < [first1; last1) | |
3091 | __par_backend::__parallel_invoke( | |
3092 | __backend_tag{}, std::forward<_ExecutionPolicy>(__exec), | |
3093 | //do parallel copying of [first2; left_bound_seq_2) | |
3094 | [=] | |
3095 | { | |
3096 | __internal::__pattern_walk2_brick(__tag, std::forward<_ExecutionPolicy>(__exec), __first2, | |
3097 | __left_bound_seq_2, __res_or, copy_range2); | |
3098 | }, | |
3099 | [=, &__result] | |
3100 | { | |
3101 | __result = __internal::__parallel_set_op( | |
3102 | __tag, std::forward<_ExecutionPolicy>(__exec), __first1, __last1, __left_bound_seq_2, __last2, | |
3103 | __result, __comp, [](_DifferenceType __n, _DifferenceType __m) { return __n + __m; }, | |
3104 | __set_union_op); | |
3105 | }); | |
3106 | return __result; | |
3107 | } | |
3108 | ||
3109 | return __internal::__parallel_set_op( | |
3110 | __tag, std::forward<_ExecutionPolicy>(__exec), __first1, __last1, __first2, __last2, __result, __comp, | |
3111 | [](_DifferenceType __n, _DifferenceType __m) { return __n + __m; }, __set_union_op); | |
3112 | } | |
3113 | ||
3114 | //------------------------------------------------------------------------ | |
3115 | // set_union | |
3116 | //------------------------------------------------------------------------ | |
3117 | ||
3118 | template <class _ForwardIterator1, class _ForwardIterator2, class _OutputIterator, class _Compare> | |
3119 | _OutputIterator | |
3120 | __brick_set_union(_ForwardIterator1 __first1, _ForwardIterator1 __last1, _ForwardIterator2 __first2, | |
3121 | _ForwardIterator2 __last2, _OutputIterator __result, _Compare __comp, | |
3122 | /*__is_vector=*/std::false_type) noexcept | |
3123 | { | |
3124 | return std::set_union(__first1, __last1, __first2, __last2, __result, __comp); | |
3125 | } | |
3126 | ||
3127 | template <typename _IsVector> | |
3128 | struct __BrickCopyConstruct | |
3129 | { | |
3130 | template <typename _ForwardIterator, typename _OutputIterator> | |
3131 | _OutputIterator | |
3132 | operator()(_ForwardIterator __first, _ForwardIterator __last, _OutputIterator __result) | |
3133 | { | |
3134 | return __brick_uninitialized_copy(__first, __last, __result, _IsVector()); | |
3135 | } | |
3136 | }; | |
3137 | ||
3138 | template <class _RandomAccessIterator1, class _RandomAccessIterator2, class _OutputIterator, class _Compare> | |
3139 | _OutputIterator | |
3140 | __brick_set_union(_RandomAccessIterator1 __first1, _RandomAccessIterator1 __last1, _RandomAccessIterator2 __first2, | |
3141 | _RandomAccessIterator2 __last2, _OutputIterator __result, _Compare __comp, | |
3142 | /*__is_vector=*/std::true_type) noexcept | |
3143 | { | |
3144 | _PSTL_PRAGMA_MESSAGE("Vectorized algorithm unimplemented, redirected to serial"); | |
3145 | return std::set_union(__first1, __last1, __first2, __last2, __result, __comp); | |
3146 | } | |
3147 | ||
3148 | template <class _Tag, class _ExecutionPolicy, class _ForwardIterator1, class _ForwardIterator2, class _OutputIterator, | |
3149 | class _Compare> | |
3150 | _OutputIterator | |
3151 | __pattern_set_union(_Tag, _ExecutionPolicy&&, _ForwardIterator1 __first1, _ForwardIterator1 __last1, | |
3152 | _ForwardIterator2 __first2, _ForwardIterator2 __last2, _OutputIterator __result, | |
3153 | _Compare __comp) noexcept | |
3154 | { | |
3155 | return __internal::__brick_set_union(__first1, __last1, __first2, __last2, __result, __comp, | |
3156 | typename _Tag::__is_vector{}); | |
3157 | } | |
3158 | ||
3159 | template <class _IsVector, class _ExecutionPolicy, class _RandomAccessIterator1, class _RandomAccessIterator2, | |
3160 | class _OutputIterator, class _Compare> | |
3161 | _OutputIterator | |
3162 | __pattern_set_union(__parallel_tag<_IsVector> __tag, _ExecutionPolicy&& __exec, _RandomAccessIterator1 __first1, | |
3163 | _RandomAccessIterator1 __last1, _RandomAccessIterator2 __first2, _RandomAccessIterator2 __last2, | |
3164 | _OutputIterator __result, _Compare __comp) | |
3165 | { | |
3166 | ||
3167 | const auto __n1 = __last1 - __first1; | |
3168 | const auto __n2 = __last2 - __first2; | |
3169 | ||
3170 | // use serial algorithm | |
3171 | if (__n1 + __n2 <= __set_algo_cut_off) | |
3172 | return std::set_union(__first1, __last1, __first2, __last2, __result, __comp); | |
3173 | ||
3174 | typedef typename std::iterator_traits<_OutputIterator>::value_type _Tp; | |
3175 | return __parallel_set_union_op( | |
3176 | __tag, std::forward<_ExecutionPolicy>(__exec), __first1, __last1, __first2, __last2, __result, __comp, | |
3177 | [](_RandomAccessIterator1 __first1, _RandomAccessIterator1 __last1, _RandomAccessIterator2 __first2, | |
3178 | _RandomAccessIterator2 __last2, _Tp* __result, _Compare __comp) | |
3179 | { | |
3180 | return __pstl::__utils::__set_union_construct(__first1, __last1, __first2, __last2, __result, __comp, | |
3181 | __BrickCopyConstruct<_IsVector>()); | |
3182 | }); | |
3183 | } | |
3184 | ||
3185 | //------------------------------------------------------------------------ | |
3186 | // set_intersection | |
3187 | //------------------------------------------------------------------------ | |
3188 | ||
3189 | template <class _ForwardIterator1, class _ForwardIterator2, class _OutputIterator, class _Compare> | |
3190 | _OutputIterator | |
3191 | __brick_set_intersection(_ForwardIterator1 __first1, _ForwardIterator1 __last1, _ForwardIterator2 __first2, | |
3192 | _ForwardIterator2 __last2, _OutputIterator __result, _Compare __comp, | |
3193 | /*__is_vector=*/std::false_type) noexcept | |
3194 | { | |
3195 | return std::set_intersection(__first1, __last1, __first2, __last2, __result, __comp); | |
3196 | } | |
3197 | ||
3198 | template <class _RandomAccessIterator1, class _RandomAccessIterator2, class _RandomAccessIterator3, class _Compare> | |
3199 | _RandomAccessIterator3 | |
3200 | __brick_set_intersection(_RandomAccessIterator1 __first1, _RandomAccessIterator1 __last1, | |
3201 | _RandomAccessIterator2 __first2, _RandomAccessIterator2 __last2, | |
3202 | _RandomAccessIterator3 __result, _Compare __comp, | |
3203 | /*__is_vector=*/std::true_type) noexcept | |
3204 | { | |
3205 | _PSTL_PRAGMA_MESSAGE("Vectorized algorithm unimplemented, redirected to serial"); | |
3206 | return std::set_intersection(__first1, __last1, __first2, __last2, __result, __comp); | |
3207 | } | |
3208 | ||
3209 | template <class _Tag, class _ExecutionPolicy, class _ForwardIterator1, class _ForwardIterator2, class _OutputIterator, | |
3210 | class _Compare> | |
3211 | _OutputIterator | |
3212 | __pattern_set_intersection(_Tag, _ExecutionPolicy&&, _ForwardIterator1 __first1, _ForwardIterator1 __last1, | |
3213 | _ForwardIterator2 __first2, _ForwardIterator2 __last2, _OutputIterator __result, | |
3214 | _Compare __comp) noexcept | |
3215 | { | |
3216 | return __internal::__brick_set_intersection(__first1, __last1, __first2, __last2, __result, __comp, | |
3217 | typename _Tag::__is_vector{}); | |
3218 | } | |
3219 | ||
3220 | template <class _IsVector, class _ExecutionPolicy, class _RandomAccessIterator1, class _RandomAccessIterator2, | |
3221 | class _RandomAccessIterator3, class _Compare> | |
3222 | _RandomAccessIterator3 | |
3223 | __pattern_set_intersection(__parallel_tag<_IsVector> __tag, _ExecutionPolicy&& __exec, _RandomAccessIterator1 __first1, | |
3224 | _RandomAccessIterator1 __last1, _RandomAccessIterator2 __first2, | |
3225 | _RandomAccessIterator2 __last2, _RandomAccessIterator3 __result, _Compare __comp) | |
3226 | { | |
3227 | typedef typename std::iterator_traits<_RandomAccessIterator3>::value_type _Tp; | |
3228 | typedef typename std::iterator_traits<_RandomAccessIterator1>::difference_type _DifferenceType; | |
3229 | ||
3230 | const auto __n1 = __last1 - __first1; | |
3231 | const auto __n2 = __last2 - __first2; | |
3232 | ||
3233 | // intersection is empty | |
3234 | if (__n1 == 0 || __n2 == 0) | |
3235 | return __result; | |
3236 | ||
3237 | // testing whether the sequences are intersected | |
3238 | _RandomAccessIterator1 __left_bound_seq_1 = std::lower_bound(__first1, __last1, *__first2, __comp); | |
3239 | //{1} < {2}: seq 2 is wholly greater than seq 1, so, the intersection is empty | |
3240 | if (__left_bound_seq_1 == __last1) | |
3241 | return __result; | |
3242 | ||
3243 | // testing whether the sequences are intersected | |
3244 | _RandomAccessIterator2 __left_bound_seq_2 = std::lower_bound(__first2, __last2, *__first1, __comp); | |
3245 | //{2} < {1}: seq 1 is wholly greater than seq 2, so, the intersection is empty | |
3246 | if (__left_bound_seq_2 == __last2) | |
3247 | return __result; | |
3248 | ||
3249 | const auto __m1 = __last1 - __left_bound_seq_1 + __n2; | |
3250 | if (__m1 > __set_algo_cut_off) | |
3251 | { | |
3252 | //we know proper offset due to [first1; left_bound_seq_1) < [first2; last2) | |
3253 | return __internal::__parallel_set_op( | |
3254 | __tag, std::forward<_ExecutionPolicy>(__exec), __left_bound_seq_1, __last1, __first2, __last2, __result, | |
3255 | __comp, [](_DifferenceType __n, _DifferenceType __m) { return std::min(__n, __m); }, | |
3256 | [](_RandomAccessIterator1 __first1, _RandomAccessIterator1 __last1, _RandomAccessIterator2 __first2, | |
3257 | _RandomAccessIterator2 __last2, _Tp* __result, _Compare __comp) { | |
3258 | return __pstl::__utils::__set_intersection_construct(__first1, __last1, __first2, __last2, __result, | |
3259 | __comp); | |
3260 | }); | |
3261 | } | |
3262 | ||
3263 | const auto __m2 = __last2 - __left_bound_seq_2 + __n1; | |
3264 | if (__m2 > __set_algo_cut_off) | |
3265 | { | |
3266 | //we know proper offset due to [first2; left_bound_seq_2) < [first1; last1) | |
3267 | __result = __internal::__parallel_set_op( | |
3268 | __tag, std::forward<_ExecutionPolicy>(__exec), __first1, __last1, __left_bound_seq_2, __last2, __result, | |
3269 | __comp, [](_DifferenceType __n, _DifferenceType __m) { return std::min(__n, __m); }, | |
3270 | [](_RandomAccessIterator1 __first1, _RandomAccessIterator1 __last1, _RandomAccessIterator2 __first2, | |
3271 | _RandomAccessIterator2 __last2, _Tp* __result, _Compare __comp) { | |
3272 | return __pstl::__utils::__set_intersection_construct(__first2, __last2, __first1, __last1, __result, | |
3273 | __comp); | |
3274 | }); | |
3275 | return __result; | |
3276 | } | |
3277 | ||
3278 | // [left_bound_seq_1; last1) and [left_bound_seq_2; last2) - use serial algorithm | |
3279 | return std::set_intersection(__left_bound_seq_1, __last1, __left_bound_seq_2, __last2, __result, __comp); | |
3280 | } | |
3281 | ||
3282 | //------------------------------------------------------------------------ | |
3283 | // set_difference | |
3284 | //------------------------------------------------------------------------ | |
3285 | ||
3286 | template <class _ForwardIterator1, class _ForwardIterator2, class _OutputIterator, class _Compare> | |
3287 | _OutputIterator | |
3288 | __brick_set_difference(_ForwardIterator1 __first1, _ForwardIterator1 __last1, _ForwardIterator2 __first2, | |
3289 | _ForwardIterator2 __last2, _OutputIterator __result, _Compare __comp, | |
3290 | /*__is_vector=*/std::false_type) noexcept | |
3291 | { | |
3292 | return std::set_difference(__first1, __last1, __first2, __last2, __result, __comp); | |
3293 | } | |
3294 | ||
3295 | template <class _RandomAccessIterator1, class _RandomAccessIterator2, class _RandomAccessIterator3, class _Compare> | |
3296 | _RandomAccessIterator3 | |
3297 | __brick_set_difference(_RandomAccessIterator1 __first1, _RandomAccessIterator1 __last1, _RandomAccessIterator2 __first2, | |
3298 | _RandomAccessIterator2 __last2, _RandomAccessIterator3 __result, _Compare __comp, | |
3299 | /*__is_vector=*/std::true_type) noexcept | |
3300 | { | |
3301 | _PSTL_PRAGMA_MESSAGE("Vectorized algorithm unimplemented, redirected to serial"); | |
3302 | return std::set_difference(__first1, __last1, __first2, __last2, __result, __comp); | |
3303 | } | |
3304 | ||
3305 | template <class _Tag, class _ExecutionPolicy, class _ForwardIterator1, class _ForwardIterator2, class _OutputIterator, | |
3306 | class _Compare> | |
3307 | _OutputIterator | |
3308 | __pattern_set_difference(_Tag, _ExecutionPolicy&&, _ForwardIterator1 __first1, _ForwardIterator1 __last1, | |
3309 | _ForwardIterator2 __first2, _ForwardIterator2 __last2, _OutputIterator __result, | |
3310 | _Compare __comp) noexcept | |
3311 | { | |
3312 | return __internal::__brick_set_difference(__first1, __last1, __first2, __last2, __result, __comp, | |
3313 | typename _Tag::__is_vector{}); | |
3314 | } | |
3315 | ||
3316 | template <class _IsVector, class _ExecutionPolicy, class _RandomAccessIterator1, class _RandomAccessIterator2, | |
3317 | class _RandomAccessIterator3, class _Compare> | |
3318 | _RandomAccessIterator3 | |
3319 | __pattern_set_difference(__parallel_tag<_IsVector> __tag, _ExecutionPolicy&& __exec, _RandomAccessIterator1 __first1, | |
3320 | _RandomAccessIterator1 __last1, _RandomAccessIterator2 __first2, | |
3321 | _RandomAccessIterator2 __last2, _RandomAccessIterator3 __result, _Compare __comp) | |
3322 | { | |
3323 | typedef typename std::iterator_traits<_RandomAccessIterator3>::value_type _Tp; | |
3324 | typedef typename std::iterator_traits<_RandomAccessIterator1>::difference_type _DifferenceType; | |
3325 | ||
3326 | const auto __n1 = __last1 - __first1; | |
3327 | const auto __n2 = __last2 - __first2; | |
3328 | ||
3329 | // {} \ {2}: the difference is empty | |
3330 | if (__n1 == 0) | |
3331 | return __result; | |
3332 | ||
3333 | // {1} \ {}: parallel copying just first sequence | |
3334 | if (__n2 == 0) | |
3335 | return __internal::__pattern_walk2_brick( | |
3336 | __tag, std::forward<_ExecutionPolicy>(__exec), __first1, __last1, __result, | |
3337 | [](_RandomAccessIterator1 __begin, _RandomAccessIterator1 __end, _RandomAccessIterator3 __res) | |
3338 | { return __internal::__brick_copy(__begin, __end, __res, _IsVector{}); }); | |
3339 | ||
3340 | // testing whether the sequences are intersected | |
3341 | _RandomAccessIterator1 __left_bound_seq_1 = std::lower_bound(__first1, __last1, *__first2, __comp); | |
3342 | //{1} < {2}: seq 2 is wholly greater than seq 1, so, parallel copying just first sequence | |
3343 | if (__left_bound_seq_1 == __last1) | |
3344 | return __internal::__pattern_walk2_brick( | |
3345 | __tag, std::forward<_ExecutionPolicy>(__exec), __first1, __last1, __result, | |
3346 | [](_RandomAccessIterator1 __begin, _RandomAccessIterator1 __end, _RandomAccessIterator3 __res) | |
3347 | { return __internal::__brick_copy(__begin, __end, __res, _IsVector{}); }); | |
3348 | ||
3349 | // testing whether the sequences are intersected | |
3350 | _RandomAccessIterator2 __left_bound_seq_2 = std::lower_bound(__first2, __last2, *__first1, __comp); | |
3351 | //{2} < {1}: seq 1 is wholly greater than seq 2, so, parallel copying just first sequence | |
3352 | if (__left_bound_seq_2 == __last2) | |
3353 | return __internal::__pattern_walk2_brick( | |
3354 | __tag, std::forward<_ExecutionPolicy>(__exec), __first1, __last1, __result, | |
3355 | [](_RandomAccessIterator1 __begin, _RandomAccessIterator1 __end, _RandomAccessIterator3 __res) | |
3356 | { return __internal::__brick_copy(__begin, __end, __res, _IsVector{}); }); | |
3357 | ||
3358 | if (__n1 + __n2 > __set_algo_cut_off) | |
3359 | return __parallel_set_op( | |
3360 | __tag, std::forward<_ExecutionPolicy>(__exec), __first1, __last1, __first2, __last2, __result, __comp, | |
3361 | [](_DifferenceType __n, _DifferenceType) { return __n; }, | |
3362 | [](_RandomAccessIterator1 __first1, _RandomAccessIterator1 __last1, _RandomAccessIterator2 __first2, | |
3363 | _RandomAccessIterator2 __last2, _Tp* __result, _Compare __comp) | |
3364 | { | |
3365 | return __pstl::__utils::__set_difference_construct(__first1, __last1, __first2, __last2, __result, | |
3366 | __comp, __BrickCopyConstruct<_IsVector>()); | |
3367 | }); | |
3368 | ||
3369 | // use serial algorithm | |
3370 | return std::set_difference(__first1, __last1, __first2, __last2, __result, __comp); | |
3371 | } | |
3372 | ||
3373 | //------------------------------------------------------------------------ | |
3374 | // set_symmetric_difference | |
3375 | //------------------------------------------------------------------------ | |
3376 | ||
3377 | template <class _ForwardIterator1, class _ForwardIterator2, class _OutputIterator, class _Compare> | |
3378 | _OutputIterator | |
3379 | __brick_set_symmetric_difference(_ForwardIterator1 __first1, _ForwardIterator1 __last1, _ForwardIterator2 __first2, | |
3380 | _ForwardIterator2 __last2, _OutputIterator __result, _Compare __comp, | |
3381 | /*__is_vector=*/std::false_type) noexcept | |
3382 | { | |
3383 | return std::set_symmetric_difference(__first1, __last1, __first2, __last2, __result, __comp); | |
3384 | } | |
3385 | ||
3386 | template <class _RandomAccessIterator1, class _RandomAccessIterator2, class _RandomAccessIterator3, class _Compare> | |
3387 | _RandomAccessIterator3 | |
3388 | __brick_set_symmetric_difference(_RandomAccessIterator1 __first1, _RandomAccessIterator1 __last1, | |
3389 | _RandomAccessIterator2 __first2, _RandomAccessIterator2 __last2, | |
3390 | _RandomAccessIterator3 __result, _Compare __comp, | |
3391 | /*__is_vector=*/std::true_type) noexcept | |
3392 | { | |
3393 | _PSTL_PRAGMA_MESSAGE("Vectorized algorithm unimplemented, redirected to serial"); | |
3394 | return std::set_symmetric_difference(__first1, __last1, __first2, __last2, __result, __comp); | |
3395 | } | |
3396 | ||
3397 | template <class _Tag, class _ExecutionPolicy, class _ForwardIterator1, class _ForwardIterator2, class _OutputIterator, | |
3398 | class _Compare> | |
3399 | _OutputIterator | |
3400 | __pattern_set_symmetric_difference(_Tag, _ExecutionPolicy&&, _ForwardIterator1 __first1, _ForwardIterator1 __last1, | |
3401 | _ForwardIterator2 __first2, _ForwardIterator2 __last2, _OutputIterator __result, | |
3402 | _Compare __comp) noexcept | |
3403 | { | |
3404 | return __internal::__brick_set_symmetric_difference(__first1, __last1, __first2, __last2, __result, __comp, | |
3405 | typename _Tag::__is_vector{}); | |
3406 | } | |
3407 | ||
3408 | template <class _IsVector, class _ExecutionPolicy, class _RandomAccessIterator1, class _RandomAccessIterator2, | |
3409 | class _RandomAccessIterator3, class _Compare> | |
3410 | _RandomAccessIterator3 | |
3411 | __pattern_set_symmetric_difference(__parallel_tag<_IsVector> __tag, _ExecutionPolicy&& __exec, | |
3412 | _RandomAccessIterator1 __first1, _RandomAccessIterator1 __last1, | |
3413 | _RandomAccessIterator2 __first2, _RandomAccessIterator2 __last2, | |
3414 | _RandomAccessIterator3 __result, _Compare __comp) | |
3415 | { | |
3416 | ||
3417 | const auto __n1 = __last1 - __first1; | |
3418 | const auto __n2 = __last2 - __first2; | |
3419 | ||
3420 | // use serial algorithm | |
3421 | if (__n1 + __n2 <= __set_algo_cut_off) | |
3422 | return std::set_symmetric_difference(__first1, __last1, __first2, __last2, __result, __comp); | |
3423 | ||
3424 | typedef typename std::iterator_traits<_RandomAccessIterator3>::value_type _Tp; | |
3425 | return __internal::__parallel_set_union_op( | |
3426 | __tag, std::forward<_ExecutionPolicy>(__exec), __first1, __last1, __first2, __last2, __result, __comp, | |
3427 | [](_RandomAccessIterator1 __first1, _RandomAccessIterator1 __last1, _RandomAccessIterator2 __first2, | |
3428 | _RandomAccessIterator2 __last2, _Tp* __result, _Compare __comp) | |
3429 | { | |
3430 | return __pstl::__utils::__set_symmetric_difference_construct(__first1, __last1, __first2, __last2, __result, | |
3431 | __comp, __BrickCopyConstruct<_IsVector>()); | |
3432 | }); | |
3433 | } | |
3434 | ||
3435 | //------------------------------------------------------------------------ | |
3436 | // is_heap_until | |
3437 | //------------------------------------------------------------------------ | |
3438 | ||
3439 | template <class _RandomAccessIterator, class _Compare> | |
3440 | _RandomAccessIterator | |
3441 | __brick_is_heap_until(_RandomAccessIterator __first, _RandomAccessIterator __last, _Compare __comp, | |
3442 | /* __is_vector = */ std::false_type) noexcept | |
3443 | { | |
3444 | return std::is_heap_until(__first, __last, __comp); | |
3445 | } | |
3446 | ||
3447 | template <class _RandomAccessIterator, class _Compare> | |
3448 | _RandomAccessIterator | |
3449 | __brick_is_heap_until(_RandomAccessIterator __first, _RandomAccessIterator __last, _Compare __comp, | |
3450 | /* __is_vector = */ std::true_type) noexcept | |
3451 | { | |
3452 | if (__last - __first < 2) | |
3453 | return __last; | |
3454 | typedef typename std::iterator_traits<_RandomAccessIterator>::difference_type _SizeType; | |
3455 | return __unseq_backend::__simd_first( | |
3456 | __first, _SizeType(0), __last - __first, | |
3457 | [&__comp](_RandomAccessIterator __it, _SizeType __i) { return __comp(__it[(__i - 1) / 2], __it[__i]); }); | |
3458 | } | |
3459 | ||
3460 | template <class _Tag, class _ExecutionPolicy, class _RandomAccessIterator, class _Compare> | |
3461 | _RandomAccessIterator | |
3462 | __pattern_is_heap_until(_Tag, _ExecutionPolicy&&, _RandomAccessIterator __first, _RandomAccessIterator __last, | |
3463 | _Compare __comp) noexcept | |
3464 | { | |
3465 | return __internal::__brick_is_heap_until(__first, __last, __comp, typename _Tag::__is_vector{}); | |
3466 | } | |
3467 | ||
3468 | template <class _RandomAccessIterator, class _DifferenceType, class _Compare> | |
3469 | _RandomAccessIterator | |
3470 | __is_heap_until_local(_RandomAccessIterator __first, _DifferenceType __begin, _DifferenceType __end, _Compare __comp, | |
3471 | /* __is_vector = */ std::false_type) noexcept | |
3472 | { | |
3473 | _DifferenceType __i = __begin; | |
3474 | for (; __i < __end; ++__i) | |
3475 | { | |
3476 | if (__comp(__first[(__i - 1) / 2], __first[__i])) | |
3477 | { | |
3478 | break; | |
3479 | } | |
3480 | } | |
3481 | return __first + __i; | |
3482 | } | |
3483 | ||
3484 | template <class _RandomAccessIterator, class _DifferenceType, class _Compare> | |
3485 | _RandomAccessIterator | |
3486 | __is_heap_until_local(_RandomAccessIterator __first, _DifferenceType __begin, _DifferenceType __end, _Compare __comp, | |
3487 | /* __is_vector = */ std::true_type) noexcept | |
3488 | { | |
3489 | return __unseq_backend::__simd_first( | |
3490 | __first, __begin, __end, | |
3491 | [&__comp](_RandomAccessIterator __it, _DifferenceType __i) { return __comp(__it[(__i - 1) / 2], __it[__i]); }); | |
3492 | } | |
3493 | ||
3494 | template <class _IsVector, class _ExecutionPolicy, class _RandomAccessIterator, class _Compare> | |
3495 | _RandomAccessIterator | |
3496 | __pattern_is_heap_until(__parallel_tag<_IsVector> __tag, _ExecutionPolicy&& __exec, _RandomAccessIterator __first, | |
3497 | _RandomAccessIterator __last, _Compare __comp) noexcept | |
3498 | { | |
3499 | using __backend_tag = typename decltype(__tag)::__backend_tag; | |
3500 | ||
3501 | if (__last - __first < 2) | |
3502 | return __last; | |
3503 | ||
3504 | return __internal::__except_handler( | |
3505 | [&]() | |
3506 | { | |
3507 | return __parallel_find( | |
3508 | __backend_tag{}, std::forward<_ExecutionPolicy>(__exec), __first, __last, | |
3509 | [__first, __comp](_RandomAccessIterator __i, _RandomAccessIterator __j) { | |
3510 | return __internal::__is_heap_until_local(__first, __i - __first, __j - __first, __comp, | |
3511 | _IsVector{}); | |
3512 | }, | |
3513 | std::less<typename std::iterator_traits<_RandomAccessIterator>::difference_type>(), /*is_first=*/true); | |
3514 | }); | |
3515 | } | |
3516 | ||
3517 | //------------------------------------------------------------------------ | |
3518 | // min_element | |
3519 | //------------------------------------------------------------------------ | |
3520 | ||
3521 | template <typename _ForwardIterator, typename _Compare> | |
3522 | _ForwardIterator | |
3523 | __brick_min_element(_ForwardIterator __first, _ForwardIterator __last, _Compare __comp, | |
3524 | /* __is_vector = */ std::false_type) noexcept | |
3525 | { | |
3526 | return std::min_element(__first, __last, __comp); | |
3527 | } | |
3528 | ||
3529 | template <typename _RandomAccessIterator, typename _Compare> | |
3530 | _RandomAccessIterator | |
3531 | __brick_min_element(_RandomAccessIterator __first, _RandomAccessIterator __last, _Compare __comp, | |
3532 | /* __is_vector = */ std::true_type) noexcept | |
3533 | { | |
3534 | #if defined(_PSTL_UDR_PRESENT) | |
3535 | return __unseq_backend::__simd_min_element(__first, __last - __first, __comp); | |
3536 | #else | |
3537 | return std::min_element(__first, __last, __comp); | |
3538 | #endif | |
3539 | } | |
3540 | ||
3541 | template <typename _Tag, typename _ExecutionPolicy, typename _ForwardIterator, typename _Compare> | |
3542 | _ForwardIterator | |
3543 | __pattern_min_element(_Tag, _ExecutionPolicy&&, _ForwardIterator __first, _ForwardIterator __last, | |
3544 | _Compare __comp) noexcept | |
3545 | { | |
3546 | return __internal::__brick_min_element(__first, __last, __comp, typename _Tag::__is_vector{}); | |
3547 | } | |
3548 | ||
3549 | template <typename _IsVector, typename _ExecutionPolicy, typename _RandomAccessIterator, typename _Compare> | |
3550 | _RandomAccessIterator | |
3551 | __pattern_min_element(__parallel_tag<_IsVector> __tag, _ExecutionPolicy&& __exec, _RandomAccessIterator __first, | |
3552 | _RandomAccessIterator __last, _Compare __comp) | |
3553 | { | |
3554 | if (__first == __last) | |
3555 | return __last; | |
3556 | ||
3557 | using __backend_tag = typename decltype(__tag)::__backend_tag; | |
3558 | ||
3559 | return __internal::__except_handler( | |
3560 | [&]() | |
3561 | { | |
3562 | return __par_backend::__parallel_reduce( | |
3563 | __backend_tag{}, std::forward<_ExecutionPolicy>(__exec), __first + 1, __last, __first, | |
3564 | [=](_RandomAccessIterator __begin, _RandomAccessIterator __end, | |
3565 | _RandomAccessIterator __init) -> _RandomAccessIterator | |
3566 | { | |
3567 | const _RandomAccessIterator subresult = | |
3568 | __internal::__brick_min_element(__begin, __end, __comp, _IsVector{}); | |
3569 | return __internal::__cmp_iterators_by_values(__init, subresult, __comp); | |
3570 | }, | |
3571 | [=](_RandomAccessIterator __it1, _RandomAccessIterator __it2) -> _RandomAccessIterator | |
3572 | { return __internal::__cmp_iterators_by_values(__it1, __it2, __comp); }); | |
3573 | }); | |
3574 | } | |
3575 | ||
3576 | //------------------------------------------------------------------------ | |
3577 | // minmax_element | |
3578 | //------------------------------------------------------------------------ | |
3579 | ||
3580 | template <typename _ForwardIterator, typename _Compare> | |
3581 | std::pair<_ForwardIterator, _ForwardIterator> | |
3582 | __brick_minmax_element(_ForwardIterator __first, _ForwardIterator __last, _Compare __comp, | |
3583 | /* __is_vector = */ std::false_type) noexcept | |
3584 | { | |
3585 | return std::minmax_element(__first, __last, __comp); | |
3586 | } | |
3587 | ||
3588 | template <typename _RandomAccessIterator, typename _Compare> | |
3589 | std::pair<_RandomAccessIterator, _RandomAccessIterator> | |
3590 | __brick_minmax_element(_RandomAccessIterator __first, _RandomAccessIterator __last, _Compare __comp, | |
3591 | /* __is_vector = */ std::true_type) noexcept | |
3592 | { | |
3593 | #if defined(_PSTL_UDR_PRESENT) | |
3594 | return __unseq_backend::__simd_minmax_element(__first, __last - __first, __comp); | |
3595 | #else | |
3596 | return std::minmax_element(__first, __last, __comp); | |
3597 | #endif | |
3598 | } | |
3599 | ||
3600 | template <typename _Tag, typename _ExecutionPolicy, typename _ForwardIterator, typename _Compare> | |
3601 | std::pair<_ForwardIterator, _ForwardIterator> | |
3602 | __pattern_minmax_element(_Tag, _ExecutionPolicy&&, _ForwardIterator __first, _ForwardIterator __last, | |
3603 | _Compare __comp) noexcept | |
3604 | { | |
3605 | return __internal::__brick_minmax_element(__first, __last, __comp, typename _Tag::__is_vector{}); | |
3606 | } | |
3607 | ||
3608 | template <typename _IsVector, typename _ExecutionPolicy, typename _RandomAccessIterator, typename _Compare> | |
3609 | std::pair<_RandomAccessIterator, _RandomAccessIterator> | |
3610 | __pattern_minmax_element(__parallel_tag<_IsVector> __tag, _ExecutionPolicy&& __exec, _RandomAccessIterator __first, | |
3611 | _RandomAccessIterator __last, _Compare __comp) | |
3612 | { | |
3613 | if (__first == __last) | |
3614 | return std::make_pair(__first, __first); | |
3615 | ||
3616 | using __backend_tag = typename decltype(__tag)::__backend_tag; | |
3617 | ||
3618 | return __internal::__except_handler([&]() { | |
3619 | typedef std::pair<_RandomAccessIterator, _RandomAccessIterator> _Result; | |
3620 | ||
3621 | return __par_backend::__parallel_reduce( | |
3622 | __backend_tag{}, std::forward<_ExecutionPolicy>(__exec), __first + 1, __last, | |
3623 | std::make_pair(__first, __first), | |
3624 | [=](_RandomAccessIterator __begin, _RandomAccessIterator __end, _Result __init) -> _Result | |
3625 | { | |
3626 | const _Result __subresult = __internal::__brick_minmax_element(__begin, __end, __comp, _IsVector{}); | |
3627 | return std::make_pair( | |
3628 | __internal::__cmp_iterators_by_values(__subresult.first, __init.first, __comp), | |
3629 | __internal::__cmp_iterators_by_values(__init.second, __subresult.second, std::not_fn(__comp))); | |
3630 | }, | |
3631 | [=](_Result __p1, _Result __p2) -> _Result | |
3632 | { | |
3633 | return std::make_pair( | |
3634 | __internal::__cmp_iterators_by_values(__p1.first, __p2.first, __comp), | |
3635 | __internal::__cmp_iterators_by_values(__p2.second, __p1.second, std::not_fn(__comp))); | |
3636 | }); | |
3637 | }); | |
3638 | } | |
3639 | ||
3640 | //------------------------------------------------------------------------ | |
3641 | // mismatch | |
3642 | //------------------------------------------------------------------------ | |
3643 | template <class _ForwardIterator1, class _ForwardIterator2, class _BinaryPredicate> | |
3644 | std::pair<_ForwardIterator1, _ForwardIterator2> | |
3645 | __mismatch_serial(_ForwardIterator1 __first1, _ForwardIterator1 __last1, _ForwardIterator2 __first2, | |
3646 | _ForwardIterator2 __last2, _BinaryPredicate __pred) | |
3647 | { | |
3648 | #if defined(_PSTL_CPP14_2RANGE_MISMATCH_EQUAL_PRESENT) | |
3649 | return std::mismatch(__first1, __last1, __first2, __last2, __pred); | |
3650 | #else | |
3651 | for (; __first1 != __last1 && __first2 != __last2 && __pred(*__first1, *__first2); ++__first1, ++__first2) | |
3652 | { | |
3653 | } | |
3654 | return std::make_pair(__first1, __first2); | |
3655 | #endif | |
3656 | } | |
3657 | ||
3658 | template <class _ForwardIterator1, class _ForwardIterator2, class _Predicate> | |
3659 | std::pair<_ForwardIterator1, _ForwardIterator2> | |
3660 | __brick_mismatch(_ForwardIterator1 __first1, _ForwardIterator1 __last1, _ForwardIterator2 __first2, | |
3661 | _ForwardIterator2 __last2, _Predicate __pred, /* __is_vector = */ std::false_type) noexcept | |
3662 | { | |
3663 | return __mismatch_serial(__first1, __last1, __first2, __last2, __pred); | |
3664 | } | |
3665 | ||
3666 | template <class _RandomAccessIterator1, class _RandomAccessIterator2, class _Predicate> | |
3667 | std::pair<_RandomAccessIterator1, _RandomAccessIterator2> | |
3668 | __brick_mismatch(_RandomAccessIterator1 __first1, _RandomAccessIterator1 __last1, _RandomAccessIterator2 __first2, | |
3669 | _RandomAccessIterator2 __last2, _Predicate __pred, /* __is_vector = */ std::true_type) noexcept | |
3670 | { | |
3671 | auto __n = std::min(__last1 - __first1, __last2 - __first2); | |
3672 | return __unseq_backend::__simd_first(__first1, __n, __first2, std::not_fn(__pred)); | |
3673 | } | |
3674 | ||
3675 | template <class _Tag, class _ExecutionPolicy, class _ForwardIterator1, class _ForwardIterator2, class _Predicate> | |
3676 | std::pair<_ForwardIterator1, _ForwardIterator2> | |
3677 | __pattern_mismatch(_Tag, _ExecutionPolicy&&, _ForwardIterator1 __first1, _ForwardIterator1 __last1, | |
3678 | _ForwardIterator2 __first2, _ForwardIterator2 __last2, _Predicate __pred) noexcept | |
3679 | { | |
3680 | return __internal::__brick_mismatch(__first1, __last1, __first2, __last2, __pred, typename _Tag::__is_vector{}); | |
3681 | } | |
3682 | ||
3683 | template <class _IsVector, class _ExecutionPolicy, class _RandomAccessIterator1, class _RandomAccessIterator2, | |
3684 | class _Predicate> | |
3685 | std::pair<_RandomAccessIterator1, _RandomAccessIterator2> | |
3686 | __pattern_mismatch(__parallel_tag<_IsVector> __tag, _ExecutionPolicy&& __exec, _RandomAccessIterator1 __first1, | |
3687 | _RandomAccessIterator1 __last1, _RandomAccessIterator2 __first2, _RandomAccessIterator2 __last2, | |
3688 | _Predicate __pred) noexcept | |
3689 | { | |
3690 | using __backend_tag = typename decltype(__tag)::__backend_tag; | |
3691 | ||
3692 | return __internal::__except_handler([&]() { | |
3693 | auto __n = std::min(__last1 - __first1, __last2 - __first2); | |
3694 | auto __result = __internal::__parallel_find( | |
3695 | __backend_tag{}, std::forward<_ExecutionPolicy>(__exec), __first1, __first1 + __n, | |
3696 | [__first1, __first2, __pred](_RandomAccessIterator1 __i, _RandomAccessIterator1 __j) | |
3697 | { | |
3698 | return __internal::__brick_mismatch(__i, __j, __first2 + (__i - __first1), __first2 + (__j - __first1), | |
3699 | __pred, _IsVector{}) | |
3700 | .first; | |
3701 | }, | |
3702 | std::less<typename std::iterator_traits<_RandomAccessIterator1>::difference_type>(), /*is_first=*/true); | |
3703 | return std::make_pair(__result, __first2 + (__result - __first1)); | |
3704 | }); | |
3705 | } | |
3706 | ||
3707 | //------------------------------------------------------------------------ | |
3708 | // lexicographical_compare | |
3709 | //------------------------------------------------------------------------ | |
3710 | ||
3711 | template <class _ForwardIterator1, class _ForwardIterator2, class _Compare> | |
3712 | bool | |
3713 | __brick_lexicographical_compare(_ForwardIterator1 __first1, _ForwardIterator1 __last1, _ForwardIterator2 __first2, | |
3714 | _ForwardIterator2 __last2, _Compare __comp, | |
3715 | /* __is_vector = */ std::false_type) noexcept | |
3716 | { | |
3717 | return std::lexicographical_compare(__first1, __last1, __first2, __last2, __comp); | |
3718 | } | |
3719 | ||
3720 | template <class _RandomAccessIterator1, class _RandomAccessIterator2, class _Compare> | |
3721 | bool | |
3722 | __brick_lexicographical_compare(_RandomAccessIterator1 __first1, _RandomAccessIterator1 __last1, | |
3723 | _RandomAccessIterator2 __first2, _RandomAccessIterator2 __last2, _Compare __comp, | |
3724 | /* __is_vector = */ std::true_type) noexcept | |
3725 | { | |
3726 | if (__first2 == __last2) | |
3727 | { // if second sequence is empty | |
3728 | return false; | |
3729 | } | |
3730 | else if (__first1 == __last1) | |
3731 | { // if first sequence is empty | |
3732 | return true; | |
3733 | } | |
3734 | else | |
3735 | { | |
3736 | typedef typename std::iterator_traits<_RandomAccessIterator1>::reference ref_type1; | |
3737 | typedef typename std::iterator_traits<_RandomAccessIterator2>::reference ref_type2; | |
3738 | --__last1; | |
3739 | --__last2; | |
3740 | auto __n = std::min(__last1 - __first1, __last2 - __first2); | |
3741 | std::pair<_RandomAccessIterator1, _RandomAccessIterator2> __result = __unseq_backend::__simd_first( | |
3742 | __first1, __n, __first2, [__comp](const ref_type1 __x, const ref_type2 __y) mutable { | |
3743 | return __comp(__x, __y) || __comp(__y, __x); | |
3744 | }); | |
3745 | ||
3746 | if (__result.first == __last1 && __result.second != __last2) | |
3747 | { // if first sequence shorter than second | |
3748 | return !__comp(*__result.second, *__result.first); | |
3749 | } | |
3750 | else | |
3751 | { // if second sequence shorter than first or both have the same number of elements | |
3752 | return __comp(*__result.first, *__result.second); | |
3753 | } | |
3754 | } | |
3755 | } | |
3756 | ||
3757 | template <class _Tag, class _ExecutionPolicy, class _ForwardIterator1, class _ForwardIterator2, class _Compare> | |
3758 | bool | |
3759 | __pattern_lexicographical_compare(_Tag, _ExecutionPolicy&&, _ForwardIterator1 __first1, _ForwardIterator1 __last1, | |
3760 | _ForwardIterator2 __first2, _ForwardIterator2 __last2, _Compare __comp) noexcept | |
3761 | { | |
3762 | return __internal::__brick_lexicographical_compare(__first1, __last1, __first2, __last2, __comp, | |
3763 | typename _Tag::__is_vector{}); | |
3764 | } | |
3765 | ||
3766 | template <class _IsVector, class _ExecutionPolicy, class _RandomAccessIterator1, class _RandomAccessIterator2, | |
3767 | class _Compare> | |
3768 | bool | |
3769 | __pattern_lexicographical_compare(__parallel_tag<_IsVector> __tag, _ExecutionPolicy&& __exec, | |
3770 | _RandomAccessIterator1 __first1, _RandomAccessIterator1 __last1, | |
3771 | _RandomAccessIterator2 __first2, _RandomAccessIterator2 __last2, | |
3772 | _Compare __comp) noexcept | |
3773 | { | |
3774 | using __backend_tag = typename decltype(__tag)::__backend_tag; | |
3775 | ||
3776 | if (__first2 == __last2) | |
3777 | { // if second sequence is empty | |
3778 | return false; | |
3779 | } | |
3780 | else if (__first1 == __last1) | |
3781 | { // if first sequence is empty | |
3782 | return true; | |
3783 | } | |
3784 | else | |
3785 | { | |
3786 | typedef typename std::iterator_traits<_RandomAccessIterator1>::reference _RefType1; | |
3787 | typedef typename std::iterator_traits<_RandomAccessIterator2>::reference _RefType2; | |
3788 | --__last1; | |
3789 | --__last2; | |
3790 | auto __n = std::min(__last1 - __first1, __last2 - __first2); | |
3791 | auto __result = __internal::__parallel_find( | |
3792 | __backend_tag{}, std::forward<_ExecutionPolicy>(__exec), __first1, __first1 + __n, | |
3793 | [__first1, __first2, &__comp](_RandomAccessIterator1 __i, _RandomAccessIterator1 __j) | |
3794 | { | |
3795 | return __internal::__brick_mismatch( | |
3796 | __i, __j, __first2 + (__i - __first1), __first2 + (__j - __first1), | |
3797 | [&__comp](const _RefType1 __x, const _RefType2 __y) | |
3798 | { return !__comp(__x, __y) && !__comp(__y, __x); }, | |
3799 | _IsVector{}) | |
3800 | .first; | |
3801 | }, | |
3802 | std::less<typename std::iterator_traits<_RandomAccessIterator1>::difference_type>(), /*is_first=*/true); | |
3803 | ||
3804 | if (__result == __last1 && __first2 + (__result - __first1) != __last2) | |
3805 | { // if first sequence shorter than second | |
3806 | return !__comp(*(__first2 + (__result - __first1)), *__result); | |
3807 | } | |
3808 | else | |
3809 | { // if second sequence shorter than first or both have the same number of elements | |
3810 | return __comp(*__result, *(__first2 + (__result - __first1))); | |
3811 | } | |
3812 | } | |
3813 | } | |
3814 | ||
3815 | } // namespace __internal | |
3816 | } // namespace __pstl | |
3817 | ||
3818 | #endif /* _PSTL_ALGORITHM_IMPL_H */ |