11.2.0/parallel/partition.h

// -*- C++ -*-

// Copyright (C) 2007-2021 Free Software Foundation, Inc.
//
// This file is part of the GNU ISO C++ Library.  This library is free
// software; you can redistribute it and/or modify it under the terms
// of the GNU General Public License as published by the Free Software
// Foundation; either version 3, or (at your option) any later
// version.

// This library is distributed in the hope that it will be useful, but
// WITHOUT ANY WARRANTY; without even the implied warranty of
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
// General Public License for more details.

// Under Section 7 of GPL version 3, you are granted additional
// permissions described in the GCC Runtime Library Exception, version
// 3.1, as published by the Free Software Foundation.

// You should have received a copy of the GNU General Public License and
// a copy of the GCC Runtime Library Exception along with this program;
// see the files COPYING3 and COPYING.RUNTIME respectively.  If not, see
// <http://www.gnu.org/licenses/>.

/** @file parallel/partition.h
 *  @brief Parallel implementation of std::partition(),
 *  std::nth_element(), and std::partial_sort().
 *  This file is a GNU parallel extension to the Standard C++ Library.
 */

// Written by Johannes Singler and Felix Putze.

#ifndef _GLIBCXX_PARALLEL_PARTITION_H
#define _GLIBCXX_PARALLEL_PARTITION_H 1

#include <parallel/basic_iterator.h>
#include <parallel/sort.h>
#include <parallel/random_number.h>
#include <bits/stl_algo.h>
#include <parallel/parallel.h>

/** @brief Decide whether to declare certain variables volatile. */
#define _GLIBCXX_VOLATILE volatile

namespace __gnu_parallel
{
  /** @brief Parallel implementation of std::partition.
    *  @param __begin Begin iterator of input sequence to split.
    *  @param __end End iterator of input sequence to split.
    *  @param __pred Partition predicate, possibly including some kind
    *         of pivot.
    *  @param __num_threads Maximum number of threads to use for this task.
    *  @return Number of elements not fulfilling the predicate. */
  template<typename _RAIter, typename _Predicate>
    typename std::iterator_traits<_RAIter>::difference_type
    __parallel_partition(_RAIter __begin, _RAIter __end,
                         _Predicate __pred, _ThreadIndex __num_threads)
    {
      typedef std::iterator_traits<_RAIter> _TraitsType;
      typedef typename _TraitsType::value_type _ValueType;
      typedef typename _TraitsType::difference_type _DifferenceType;

      _DifferenceType __n = __end - __begin;

      _GLIBCXX_CALL(__n)

      const _Settings& __s = _Settings::get();

      // shared
      _GLIBCXX_VOLATILE _DifferenceType __left = 0, __right = __n - 1,
                                        __dist = __n,
                                        __leftover_left, __leftover_right,
                                        __leftnew, __rightnew;

      // just 0 or 1, but int to allow atomic operations
      int* __reserved_left = 0, * __reserved_right = 0;

      _DifferenceType __chunk_size = __s.partition_chunk_size;

      //at least two chunks per thread
      if (__dist >= 2 * __num_threads * __chunk_size)
#       pragma omp parallel num_threads(__num_threads)
        {
#         pragma omp single
          {
            __num_threads = omp_get_num_threads();
            __reserved_left = new int[__num_threads];
            __reserved_right = new int[__num_threads];

            if (__s.partition_chunk_share > 0.0)
              __chunk_size = std::max<_DifferenceType>
                (__s.partition_chunk_size, (double)__n 
                 * __s.partition_chunk_share / (double)__num_threads);
            else
              __chunk_size = __s.partition_chunk_size;
          }

          while (__dist >= 2 * __num_threads * __chunk_size)
            {
#             pragma omp single
              {
                _DifferenceType __num_chunks = __dist / __chunk_size;

                for (_ThreadIndex __r = 0; __r < __num_threads; ++__r)
                  {
                    __reserved_left [__r] = 0; // false
                    __reserved_right[__r] = 0; // false
                  }
                __leftover_left = 0;
                __leftover_right = 0;
              } //implicit barrier

              // Private.
              _DifferenceType __thread_left, __thread_left_border,
                              __thread_right, __thread_right_border;

              __thread_left = __left + 1;
              // Just to satisfy the condition below.
              __thread_left_border = __thread_left - 1;

              __thread_right = __n - 1;
             // Just to satisfy the condition below.
              __thread_right_border = __thread_right + 1;

              bool __iam_finished = false;
              while (!__iam_finished)
                {
                  if (__thread_left > __thread_left_border)
                    {
                      _DifferenceType __former_dist =
                              __fetch_and_add(&__dist, -__chunk_size);
                      if (__former_dist < __chunk_size)
                        {
                          __fetch_and_add(&__dist, __chunk_size);
                          __iam_finished = true;
                          break;
                        }
                      else
                        {
                          __thread_left =
                                  __fetch_and_add(&__left, __chunk_size);
                          __thread_left_border =
                                  __thread_left + (__chunk_size - 1);
                        }
                    }

                  if (__thread_right < __thread_right_border)
                    {
                      _DifferenceType __former_dist =
                              __fetch_and_add(&__dist, -__chunk_size);
                      if (__former_dist < __chunk_size)
                        {
                          __fetch_and_add(&__dist, __chunk_size);
                          __iam_finished = true;
                          break;
                        }
                      else
                        {
                          __thread_right =
                                  __fetch_and_add(&__right, -__chunk_size);
                          __thread_right_border =
                                  __thread_right - (__chunk_size - 1);
                        }
                    }

                  // Swap as usual.
                  while (__thread_left < __thread_right)
                    {
                      while (__pred(__begin[__thread_left])
                             && __thread_left <= __thread_left_border)
                        ++__thread_left;
                      while (!__pred(__begin[__thread_right])
                             && __thread_right >= __thread_right_border)
                        --__thread_right;

                      if (__thread_left > __thread_left_border
                          || __thread_right < __thread_right_border)
                        // Fetch new chunk(__s).
                        break;

                      std::iter_swap(__begin + __thread_left,
                             __begin + __thread_right);
                      ++__thread_left;
                      --__thread_right;
                    }
                }

              // Now swap the leftover chunks to the right places.
              if (__thread_left <= __thread_left_border)
#               pragma omp atomic
                ++__leftover_left;
              if (__thread_right >= __thread_right_border)
#               pragma omp atomic
                ++__leftover_right;

#             pragma omp barrier

              _DifferenceType
                    __leftold = __left,
                    __leftnew = __left - __leftover_left * __chunk_size,
                    __rightold = __right,
                    __rightnew = __right + __leftover_right * __chunk_size;

              // <=> __thread_left_border + (__chunk_size - 1) >= __leftnew
              if (__thread_left <= __thread_left_border
                  && __thread_left_border >= __leftnew)
                {
                  // Chunk already in place, reserve spot.
                __reserved_left[(__left - (__thread_left_border + 1))
                                / __chunk_size] = 1;
                }

              // <=> __thread_right_border - (__chunk_size - 1) <= __rightnew
              if (__thread_right >= __thread_right_border
                  && __thread_right_border <= __rightnew)
                {
                  // Chunk already in place, reserve spot.
                  __reserved_right[((__thread_right_border - 1) - __right)
                                   / __chunk_size] = 1;
                }

#             pragma omp barrier

              if (__thread_left <= __thread_left_border
                  && __thread_left_border < __leftnew)
                {
                  // Find spot and swap.
                  _DifferenceType __swapstart = -1;
                  for (int __r = 0; __r < __leftover_left; ++__r)
                    if (__reserved_left[__r] == 0
                        && __compare_and_swap(&(__reserved_left[__r]), 0, 1))
                      {
                        __swapstart = __leftold - (__r + 1) * __chunk_size;
                        break;
                      }

#if _GLIBCXX_PARALLEL_ASSERTIONS
                  _GLIBCXX_PARALLEL_ASSERT(__swapstart != -1);
#endif

                  std::swap_ranges(__begin + __thread_left_border
                                   - (__chunk_size - 1),
                                   __begin + __thread_left_border + 1,
                                   __begin + __swapstart);
                }

              if (__thread_right >= __thread_right_border
                  && __thread_right_border > __rightnew)
                {
                  // Find spot and swap
                  _DifferenceType __swapstart = -1;
                  for (int __r = 0; __r < __leftover_right; ++__r)
                    if (__reserved_right[__r] == 0
                        && __compare_and_swap(&(__reserved_right[__r]), 0, 1))
                      {
                        __swapstart = __rightold + __r * __chunk_size + 1;
                        break;
                      }

#if _GLIBCXX_PARALLEL_ASSERTIONS
                  _GLIBCXX_PARALLEL_ASSERT(__swapstart != -1);
#endif

                  std::swap_ranges(__begin + __thread_right_border,
                                   __begin + __thread_right_border
                                   + __chunk_size, __begin + __swapstart);
              }
#if _GLIBCXX_PARALLEL_ASSERTIONS
#             pragma omp barrier

#             pragma omp single
              {
                for (_DifferenceType __r = 0; __r < __leftover_left; ++__r)
                  _GLIBCXX_PARALLEL_ASSERT(__reserved_left[__r] == 1);
                for (_DifferenceType __r = 0; __r < __leftover_right; ++__r)
                  _GLIBCXX_PARALLEL_ASSERT(__reserved_right[__r] == 1);
              }
#endif

              __left = __leftnew;
              __right = __rightnew;
              __dist = __right - __left + 1;
            }

#           pragma omp flush(__left, __right)
        } // end "recursion" //parallel

        _DifferenceType __final_left = __left, __final_right = __right;

        while (__final_left < __final_right)
          {
            // Go right until key is geq than pivot.
            while (__pred(__begin[__final_left])
                   && __final_left < __final_right)
              ++__final_left;

            // Go left until key is less than pivot.
            while (!__pred(__begin[__final_right])
                   && __final_left < __final_right)
              --__final_right;

            if (__final_left == __final_right)
              break;
            std::iter_swap(__begin + __final_left, __begin + __final_right);
            ++__final_left;
            --__final_right;
          }

        // All elements on the left side are < piv, all elements on the
        // right are >= piv
        delete[] __reserved_left;
        delete[] __reserved_right;

        // Element "between" __final_left and __final_right might not have
        // been regarded yet
        if (__final_left < __n && !__pred(__begin[__final_left]))
          // Really swapped.
          return __final_left;
        else
          return __final_left + 1;
    }

  /**
    *  @brief Parallel implementation of std::nth_element().
    *  @param __begin Begin iterator of input sequence.
    *  @param __nth _Iterator of element that must be in position afterwards.
    *  @param __end End iterator of input sequence.
    *  @param __comp Comparator.
    */
  template<typename _RAIter, typename _Compare>
    void 
    __parallel_nth_element(_RAIter __begin, _RAIter __nth, 
                           _RAIter __end, _Compare __comp)
    {
      typedef std::iterator_traits<_RAIter> _TraitsType;
      typedef typename _TraitsType::value_type _ValueType;
      typedef typename _TraitsType::difference_type _DifferenceType;

      _GLIBCXX_CALL(__end - __begin)

      _RAIter __split;
      _RandomNumber __rng;

      const _Settings& __s = _Settings::get();
      _DifferenceType __minimum_length = std::max<_DifferenceType>(2,
        std::max(__s.nth_element_minimal_n, __s.partition_minimal_n));

      // Break if input range to small.
      while (static_cast<_SequenceIndex>(__end - __begin) >= __minimum_length)
        {
          _DifferenceType __n = __end - __begin;

          _RAIter __pivot_pos = __begin + __rng(__n);

          // Swap __pivot_pos value to end.
          if (__pivot_pos != (__end - 1))
            std::iter_swap(__pivot_pos, __end - 1);
          __pivot_pos = __end - 1;

          // _Compare must have first_value_type, second_value_type,
          // result_type
          // _Compare ==
          // __gnu_parallel::_Lexicographic<S, int,
          //                                __gnu_parallel::_Less<S, S> >
          // __pivot_pos == std::pair<S, int>*
          __gnu_parallel::__binder2nd<_Compare, _ValueType, _ValueType, bool>
            __pred(__comp, *__pivot_pos);

          // Divide, leave pivot unchanged in last place.
          _RAIter __split_pos1, __split_pos2;
          __split_pos1 = __begin + __parallel_partition(__begin, __end - 1,
                                                        __pred,
                                                        __get_max_threads());

          // Left side: < __pivot_pos; __right side: >= __pivot_pos

          // Swap pivot back to middle.
          if (__split_pos1 != __pivot_pos)
            std::iter_swap(__split_pos1, __pivot_pos);
          __pivot_pos = __split_pos1;

          // In case all elements are equal, __split_pos1 == 0
          if ((__split_pos1 + 1 - __begin) < (__n >> 7)
              || (__end - __split_pos1) < (__n >> 7))
            {
              // Very unequal split, one part smaller than one 128th
              // elements not strictly larger than the pivot.
              __gnu_parallel::__unary_negate<__gnu_parallel::
                __binder1st<_Compare, _ValueType,
                            _ValueType, bool>, _ValueType>
                __pred(__gnu_parallel::__binder1st<_Compare, _ValueType,
                       _ValueType, bool>(__comp, *__pivot_pos));

              // Find other end of pivot-equal range.
              __split_pos2 = __gnu_sequential::partition(__split_pos1 + 1,
                                                         __end, __pred);
            }
          else
            // Only skip the pivot.
            __split_pos2 = __split_pos1 + 1;

          // Compare iterators.
          if (__split_pos2 <= __nth)
            __begin = __split_pos2;
          else if (__nth < __split_pos1)
            __end = __split_pos1;
          else
            break;
        }

      // Only at most _Settings::partition_minimal_n __elements __left.
      __gnu_sequential::nth_element(__begin, __nth, __end, __comp);
    }

  /** @brief Parallel implementation of std::partial_sort().
  *
  *  Works in two steps: __parallel_nth_element() is run with
  *  @c __middle as the target position, then the range in front of
  *  @c __middle is sorted.
  *
  *  @param __begin Begin iterator of input sequence.
  *  @param __middle Sort until this position.
  *  @param __end End iterator of input sequence.
  *  @param __comp Comparator. */
  template<typename _RAIter, typename _Compare>
    void
    __parallel_partial_sort(_RAIter __begin, _RAIter __middle,
                            _RAIter __end, _Compare __comp)
    {
      // Step 1: selection over the whole input, with __middle as the
      // split position.
      __parallel_nth_element(__begin, __middle, __end, __comp);

      // Step 2: order the front part [__begin, __middle).
      std::sort(__begin, __middle, __comp);
    }

} //namespace __gnu_parallel

#undef _GLIBCXX_VOLATILE

#endif /* _GLIBCXX_PARALLEL_PARTITION_H */
Revision:	1166
Committed:	Tue Oct 26 14:22:36 2021 UTC (4 years ago) by rossy
Content type:	text/x-chdr
File size:	14961 byte(s)
Log Message:	Daodan: Replace MinGW build env with an up-to-date MSYS2 env
#	Content
1	// -- C++ --
2
3	// Copyright (C) 2007-2021 Free Software Foundation, Inc.
4	//
5	// This file is part of the GNU ISO C++ Library. This library is free
6	// software; you can redistribute it and/or modify it under the terms
7	// of the GNU General Public License as published by the Free Software
8	// Foundation; either version 3, or (at your option) any later
9	// version.
10
11	// This library is distributed in the hope that it will be useful, but
12	// WITHOUT ANY WARRANTY; without even the implied warranty of
13	// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14	// General Public License for more details.
15
16	// Under Section 7 of GPL version 3, you are granted additional
17	// permissions described in the GCC Runtime Library Exception, version
18	// 3.1, as published by the Free Software Foundation.
19
20	// You should have received a copy of the GNU General Public License and
21	// a copy of the GCC Runtime Library Exception along with this program;
22	// see the files COPYING3 and COPYING.RUNTIME respectively. If not, see
23	// <http://www.gnu.org/licenses/>.
24
25	/** @file parallel/partition.h
26	* @brief Parallel implementation of std::partition(),
27	* std::nth_element(), and std::partial_sort().
28	* This file is a GNU parallel extension to the Standard C++ Library.
29	*/
30
31	// Written by Johannes Singler and Felix Putze.
32
33	#ifndef _GLIBCXX_PARALLEL_PARTITION_H
34	#define _GLIBCXX_PARALLEL_PARTITION_H 1
35
36	#include <parallel/basic_iterator.h>
37	#include <parallel/sort.h>
38	#include <parallel/random_number.h>
39	#include <bits/stl_algo.h>
40	#include <parallel/parallel.h>
41
42	/** @brief Decide whether to declare certain variables volatile. */
43	#define _GLIBCXX_VOLATILE volatile
44
45	namespace __gnu_parallel
46	{
47	/** @brief Parallel implementation of std::partition.
48	* @param __begin Begin iterator of input sequence to split.
49	* @param __end End iterator of input sequence to split.
50	* @param __pred Partition predicate, possibly including some kind
51	* of pivot.
52	* @param __num_threads Maximum number of threads to use for this task.
53	* @return Number of elements not fulfilling the predicate. */
54	template<typename _RAIter, typename _Predicate>
55	typename std::iterator_traits<_RAIter>::difference_type
56	__parallel_partition(_RAIter __begin, _RAIter __end,
57	_Predicate __pred, _ThreadIndex __num_threads)
58	{
59	typedef std::iterator_traits<_RAIter> _TraitsType;
60	typedef typename _TraitsType::value_type _ValueType;
61	typedef typename _TraitsType::difference_type _DifferenceType;
62
63	_DifferenceType __n = __end - __begin;
64
65	_GLIBCXX_CALL(__n)
66
67	const _Settings& __s = _Settings::get();
68
69	// shared
70	_GLIBCXX_VOLATILE _DifferenceType __left = 0, __right = __n - 1,
71	__dist = __n,
72	__leftover_left, __leftover_right,
73	__leftnew, __rightnew;
74
75	// just 0 or 1, but int to allow atomic operations
76	int* __reserved_left = 0, * __reserved_right = 0;
77
78	_DifferenceType __chunk_size = __s.partition_chunk_size;
79
80	//at least two chunks per thread
81	if (__dist >= 2 * __num_threads * __chunk_size)
82	# pragma omp parallel num_threads(__num_threads)
83	{
84	# pragma omp single
85	{
86	__num_threads = omp_get_num_threads();
87	__reserved_left = new int[__num_threads];
88	__reserved_right = new int[__num_threads];
89
90	if (__s.partition_chunk_share > 0.0)
91	__chunk_size = std::max<_DifferenceType>
92	(__s.partition_chunk_size, (double)__n
93	* __s.partition_chunk_share / (double)__num_threads);
94	else
95	__chunk_size = __s.partition_chunk_size;
96	}
97
98	while (__dist >= 2 * __num_threads * __chunk_size)
99	{
100	# pragma omp single
101	{
102	_DifferenceType __num_chunks = __dist / __chunk_size;
103
104	for (_ThreadIndex __r = 0; __r < __num_threads; ++__r)
105	{
106	__reserved_left [__r] = 0; // false
107	__reserved_right[__r] = 0; // false
108	}
109	__leftover_left = 0;
110	__leftover_right = 0;
111	} //implicit barrier
112
113	// Private.
114	_DifferenceType __thread_left, __thread_left_border,
115	__thread_right, __thread_right_border;
116
117	__thread_left = __left + 1;
118	// Just to satisfy the condition below.
119	__thread_left_border = __thread_left - 1;
120
121	__thread_right = __n - 1;
122	// Just to satisfy the condition below.
123	__thread_right_border = __thread_right + 1;
124
125	bool __iam_finished = false;
126	while (!__iam_finished)
127	{
128	if (__thread_left > __thread_left_border)
129	{
130	_DifferenceType __former_dist =
131	__fetch_and_add(&__dist, -__chunk_size);
132	if (__former_dist < __chunk_size)
133	{
134	__fetch_and_add(&__dist, __chunk_size);
135	__iam_finished = true;
136	break;
137	}
138	else
139	{
140	__thread_left =
141	__fetch_and_add(&__left, __chunk_size);
142	__thread_left_border =
143	__thread_left + (__chunk_size - 1);
144	}
145	}
146
147	if (__thread_right < __thread_right_border)
148	{
149	_DifferenceType __former_dist =
150	__fetch_and_add(&__dist, -__chunk_size);
151	if (__former_dist < __chunk_size)
152	{
153	__fetch_and_add(&__dist, __chunk_size);
154	__iam_finished = true;
155	break;
156	}
157	else
158	{
159	__thread_right =
160	__fetch_and_add(&__right, -__chunk_size);
161	__thread_right_border =
162	__thread_right - (__chunk_size - 1);
163	}
164	}
165
166	// Swap as usual.
167	while (__thread_left < __thread_right)
168	{
169	while (__pred(__begin[__thread_left])
170	&& __thread_left <= __thread_left_border)
171	++__thread_left;
172	while (!__pred(__begin[__thread_right])
173	&& __thread_right >= __thread_right_border)
174	--__thread_right;
175
176	if (__thread_left > __thread_left_border
177	\|\| __thread_right < __thread_right_border)
178	// Fetch new chunk(__s).
179	break;
180
181	std::iter_swap(__begin + __thread_left,
182	__begin + __thread_right);
183	++__thread_left;
184	--__thread_right;
185	}
186	}
187
188	// Now swap the leftover chunks to the right places.
189	if (__thread_left <= __thread_left_border)
190	# pragma omp atomic
191	++__leftover_left;
192	if (__thread_right >= __thread_right_border)
193	# pragma omp atomic
194	++__leftover_right;
195
196	# pragma omp barrier
197
198	_DifferenceType
199	__leftold = __left,
200	__leftnew = __left - __leftover_left * __chunk_size,
201	__rightold = __right,
202	__rightnew = __right + __leftover_right * __chunk_size;
203
204	// <=> __thread_left_border + (__chunk_size - 1) >= __leftnew
205	if (__thread_left <= __thread_left_border
206	&& __thread_left_border >= __leftnew)
207	{
208	// Chunk already in place, reserve spot.
209	__reserved_left[(__left - (__thread_left_border + 1))
210	/ __chunk_size] = 1;
211	}
212
213	// <=> __thread_right_border - (__chunk_size - 1) <= __rightnew
214	if (__thread_right >= __thread_right_border
215	&& __thread_right_border <= __rightnew)
216	{
217	// Chunk already in place, reserve spot.
218	__reserved_right[((__thread_right_border - 1) - __right)
219	/ __chunk_size] = 1;
220	}
221
222	# pragma omp barrier
223
224	if (__thread_left <= __thread_left_border
225	&& __thread_left_border < __leftnew)
226	{
227	// Find spot and swap.
228	_DifferenceType __swapstart = -1;
229	for (int __r = 0; __r < __leftover_left; ++__r)
230	if (__reserved_left[__r] == 0
231	&& __compare_and_swap(&(__reserved_left[__r]), 0, 1))
232	{
233	__swapstart = __leftold - (__r + 1) * __chunk_size;
234	break;
235	}
236
237	#if _GLIBCXX_PARALLEL_ASSERTIONS
238	_GLIBCXX_PARALLEL_ASSERT(__swapstart != -1);
239	#endif
240
241	std::swap_ranges(__begin + __thread_left_border
242	- (__chunk_size - 1),
243	__begin + __thread_left_border + 1,
244	__begin + __swapstart);
245	}
246
247	if (__thread_right >= __thread_right_border
248	&& __thread_right_border > __rightnew)
249	{
250	// Find spot and swap
251	_DifferenceType __swapstart = -1;
252	for (int __r = 0; __r < __leftover_right; ++__r)
253	if (__reserved_right[__r] == 0
254	&& __compare_and_swap(&(__reserved_right[__r]), 0, 1))
255	{
256	__swapstart = __rightold + __r * __chunk_size + 1;
257	break;
258	}
259
260	#if _GLIBCXX_PARALLEL_ASSERTIONS
261	_GLIBCXX_PARALLEL_ASSERT(__swapstart != -1);
262	#endif
263
264	std::swap_ranges(__begin + __thread_right_border,
265	__begin + __thread_right_border
266	+ __chunk_size, __begin + __swapstart);
267	}
268	#if _GLIBCXX_PARALLEL_ASSERTIONS
269	# pragma omp barrier
270
271	# pragma omp single
272	{
273	for (_DifferenceType __r = 0; __r < __leftover_left; ++__r)
274	_GLIBCXX_PARALLEL_ASSERT(__reserved_left[__r] == 1);
275	for (_DifferenceType __r = 0; __r < __leftover_right; ++__r)
276	_GLIBCXX_PARALLEL_ASSERT(__reserved_right[__r] == 1);
277	}
278	#endif
279
280	__left = __leftnew;
281	__right = __rightnew;
282	__dist = __right - __left + 1;
283	}
284
285	# pragma omp flush(__left, __right)
286	} // end "recursion" //parallel
287
288	_DifferenceType __final_left = __left, __final_right = __right;
289
290	while (__final_left < __final_right)
291	{
292	// Go right until key is geq than pivot.
293	while (__pred(__begin[__final_left])
294	&& __final_left < __final_right)
295	++__final_left;
296
297	// Go left until key is less than pivot.
298	while (!__pred(__begin[__final_right])
299	&& __final_left < __final_right)
300	--__final_right;
301
302	if (__final_left == __final_right)
303	break;
304	std::iter_swap(__begin + __final_left, __begin + __final_right);
305	++__final_left;
306	--__final_right;
307	}
308
309	// All elements on the left side are < piv, all elements on the
310	// right are >= piv
311	delete[] __reserved_left;
312	delete[] __reserved_right;
313
314	// Element "between" __final_left and __final_right might not have
315	// been regarded yet
316	if (__final_left < __n && !__pred(__begin[__final_left]))
317	// Really swapped.
318	return __final_left;
319	else
320	return __final_left + 1;
321	}
322
323	/**
324	* @brief Parallel implementation of std::nth_element().
325	* @param __begin Begin iterator of input sequence.
326	* @param __nth _Iterator of element that must be in position afterwards.
327	* @param __end End iterator of input sequence.
328	* @param __comp Comparator.
329	*/
330	template<typename _RAIter, typename _Compare>
331	void
332	__parallel_nth_element(_RAIter __begin, _RAIter __nth,
333	_RAIter __end, _Compare __comp)
334	{
335	typedef std::iterator_traits<_RAIter> _TraitsType;
336	typedef typename _TraitsType::value_type _ValueType;
337	typedef typename _TraitsType::difference_type _DifferenceType;
338
339	_GLIBCXX_CALL(__end - __begin)
340
341	_RAIter __split;
342	_RandomNumber __rng;
343
344	const _Settings& __s = _Settings::get();
345	_DifferenceType __minimum_length = std::max<_DifferenceType>(2,
346	std::max(__s.nth_element_minimal_n, __s.partition_minimal_n));
347
348	// Break if input range to small.
349	while (static_cast<_SequenceIndex>(__end - __begin) >= __minimum_length)
350	{
351	_DifferenceType __n = __end - __begin;
352
353	_RAIter __pivot_pos = __begin + __rng(__n);
354
355	// Swap __pivot_pos value to end.
356	if (__pivot_pos != (__end - 1))
357	std::iter_swap(__pivot_pos, __end - 1);
358	__pivot_pos = __end - 1;
359
360	// _Compare must have first_value_type, second_value_type,
361	// result_type
362	// _Compare ==
363	// __gnu_parallel::_Lexicographic<S, int,
364	// __gnu_parallel::_Less<S, S> >
365	// __pivot_pos == std::pair<S, int>*
366	__gnu_parallel::__binder2nd<_Compare, _ValueType, _ValueType, bool>
367	__pred(__comp, *__pivot_pos);
368
369	// Divide, leave pivot unchanged in last place.
370	_RAIter __split_pos1, __split_pos2;
371	__split_pos1 = __begin + __parallel_partition(__begin, __end - 1,
372	__pred,
373	__get_max_threads());
374
375	// Left side: < __pivot_pos; __right side: >= __pivot_pos
376
377	// Swap pivot back to middle.
378	if (__split_pos1 != __pivot_pos)
379	std::iter_swap(__split_pos1, __pivot_pos);
380	__pivot_pos = __split_pos1;
381
382	// In case all elements are equal, __split_pos1 == 0
383	if ((__split_pos1 + 1 - __begin) < (__n >> 7)
384	\|\| (__end - __split_pos1) < (__n >> 7))
385	{
386	// Very unequal split, one part smaller than one 128th
387	// elements not strictly larger than the pivot.
388	__gnu_parallel::__unary_negate<__gnu_parallel::
389	__binder1st<_Compare, _ValueType,
390	_ValueType, bool>, _ValueType>
391	__pred(__gnu_parallel::__binder1st<_Compare, _ValueType,
392	_ValueType, bool>(__comp, *__pivot_pos));
393
394	// Find other end of pivot-equal range.
395	__split_pos2 = __gnu_sequential::partition(__split_pos1 + 1,
396	__end, __pred);
397	}
398	else
399	// Only skip the pivot.
400	__split_pos2 = __split_pos1 + 1;
401
402	// Compare iterators.
403	if (__split_pos2 <= __nth)
404	__begin = __split_pos2;
405	else if (__nth < __split_pos1)
406	__end = __split_pos1;
407	else
408	break;
409	}
410
411	// Only at most _Settings::partition_minimal_n __elements __left.
412	__gnu_sequential::nth_element(__begin, __nth, __end, __comp);
413	}
414
415	/** @brief Parallel implementation of std::partial_sort().
416	* @param __begin Begin iterator of input sequence.
417	* @param __middle Sort until this position.
418	* @param __end End iterator of input sequence.
419	* @param __comp Comparator. */
420	template<typename _RAIter, typename _Compare>
421	void
422	__parallel_partial_sort(_RAIter __begin,
423	_RAIter __middle,
424	_RAIter __end, _Compare __comp)
425	{
426	__parallel_nth_element(__begin, __middle, __end, __comp);
427	std::sort(__begin, __middle, __comp);
428	}
429
430	} //namespace __gnu_parallel
431
432	#undef _GLIBCXX_VOLATILE
433
434	#endif /* _GLIBCXX_PARALLEL_PARTITION_H */