xref: /dflybsd-src/contrib/gcc-4.7/libstdc++-v3/include/parallel/quicksort.h (revision 04febcfb30580676d3e95f58a16c5137ee478b32)
1*e4b17023SJohn Marino // -*- C++ -*-
2*e4b17023SJohn Marino 
3*e4b17023SJohn Marino // Copyright (C) 2007, 2008, 2009, 2010, 2011 Free Software Foundation, Inc.
4*e4b17023SJohn Marino //
5*e4b17023SJohn Marino // This file is part of the GNU ISO C++ Library.  This library is free
6*e4b17023SJohn Marino // software; you can redistribute it and/or modify it under the terms
7*e4b17023SJohn Marino // of the GNU General Public License as published by the Free Software
8*e4b17023SJohn Marino // Foundation; either version 3, or (at your option) any later
9*e4b17023SJohn Marino // version.
10*e4b17023SJohn Marino 
11*e4b17023SJohn Marino // This library is distributed in the hope that it will be useful, but
12*e4b17023SJohn Marino // WITHOUT ANY WARRANTY; without even the implied warranty of
13*e4b17023SJohn Marino // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
14*e4b17023SJohn Marino // General Public License for more details.
15*e4b17023SJohn Marino 
16*e4b17023SJohn Marino // Under Section 7 of GPL version 3, you are granted additional
17*e4b17023SJohn Marino // permissions described in the GCC Runtime Library Exception, version
18*e4b17023SJohn Marino // 3.1, as published by the Free Software Foundation.
19*e4b17023SJohn Marino 
20*e4b17023SJohn Marino // You should have received a copy of the GNU General Public License and
21*e4b17023SJohn Marino // a copy of the GCC Runtime Library Exception along with this program;
22*e4b17023SJohn Marino // see the files COPYING3 and COPYING.RUNTIME respectively.  If not, see
23*e4b17023SJohn Marino // <http://www.gnu.org/licenses/>.
24*e4b17023SJohn Marino 
25*e4b17023SJohn Marino /** @file parallel/quicksort.h
26*e4b17023SJohn Marino  *  @brief Implementation of a unbalanced parallel quicksort (in-place).
27*e4b17023SJohn Marino  *  This file is a GNU parallel extension to the Standard C++ Library.
28*e4b17023SJohn Marino  */
29*e4b17023SJohn Marino 
30*e4b17023SJohn Marino // Written by Johannes Singler.
31*e4b17023SJohn Marino 
32*e4b17023SJohn Marino #ifndef _GLIBCXX_PARALLEL_QUICKSORT_H
33*e4b17023SJohn Marino #define _GLIBCXX_PARALLEL_QUICKSORT_H 1
34*e4b17023SJohn Marino 
35*e4b17023SJohn Marino #include <parallel/parallel.h>
36*e4b17023SJohn Marino #include <parallel/partition.h>
37*e4b17023SJohn Marino 
38*e4b17023SJohn Marino namespace __gnu_parallel
39*e4b17023SJohn Marino {
40*e4b17023SJohn Marino   /** @brief Unbalanced quicksort divide step.
41*e4b17023SJohn Marino    *  @param __begin Begin iterator of subsequence.
42*e4b17023SJohn Marino    *  @param __end End iterator of subsequence.
43*e4b17023SJohn Marino    *  @param __comp Comparator.
44*e4b17023SJohn Marino    *  @param __pivot_rank Desired __rank of the pivot.
45*e4b17023SJohn Marino    *  @param __num_samples Choose pivot from that many samples.
46*e4b17023SJohn Marino    *  @param __num_threads Number of threads that are allowed to work on
47*e4b17023SJohn Marino    *  this part.
48*e4b17023SJohn Marino    */
49*e4b17023SJohn Marino   template<typename _RAIter, typename _Compare>
50*e4b17023SJohn Marino     typename std::iterator_traits<_RAIter>::difference_type
__parallel_sort_qs_divide(_RAIter __begin,_RAIter __end,_Compare __comp,typename std::iterator_traits<_RAIter>::difference_type __pivot_rank,typename std::iterator_traits<_RAIter>::difference_type __num_samples,_ThreadIndex __num_threads)51*e4b17023SJohn Marino     __parallel_sort_qs_divide(_RAIter __begin, _RAIter __end,
52*e4b17023SJohn Marino 			      _Compare __comp, typename std::iterator_traits
53*e4b17023SJohn Marino 			      <_RAIter>::difference_type __pivot_rank,
54*e4b17023SJohn Marino 			      typename std::iterator_traits
55*e4b17023SJohn Marino 			      <_RAIter>::difference_type
56*e4b17023SJohn Marino 			      __num_samples, _ThreadIndex __num_threads)
57*e4b17023SJohn Marino     {
58*e4b17023SJohn Marino       typedef std::iterator_traits<_RAIter> _TraitsType;
59*e4b17023SJohn Marino       typedef typename _TraitsType::value_type _ValueType;
60*e4b17023SJohn Marino       typedef typename _TraitsType::difference_type _DifferenceType;
61*e4b17023SJohn Marino 
62*e4b17023SJohn Marino       _DifferenceType __n = __end - __begin;
63*e4b17023SJohn Marino       __num_samples = std::min(__num_samples, __n);
64*e4b17023SJohn Marino 
65*e4b17023SJohn Marino       // Allocate uninitialized, to avoid default constructor.
66*e4b17023SJohn Marino       _ValueType* __samples = static_cast<_ValueType*>
67*e4b17023SJohn Marino 	(::operator new(__num_samples * sizeof(_ValueType)));
68*e4b17023SJohn Marino 
69*e4b17023SJohn Marino       for (_DifferenceType __s = 0; __s < __num_samples; ++__s)
70*e4b17023SJohn Marino         {
71*e4b17023SJohn Marino           const unsigned long long __index = static_cast<unsigned long long>
72*e4b17023SJohn Marino 	    (__s) * __n / __num_samples;
73*e4b17023SJohn Marino           ::new(&(__samples[__s])) _ValueType(__begin[__index]);
74*e4b17023SJohn Marino         }
75*e4b17023SJohn Marino 
76*e4b17023SJohn Marino       __gnu_sequential::sort(__samples, __samples + __num_samples, __comp);
77*e4b17023SJohn Marino 
78*e4b17023SJohn Marino       _ValueType& __pivot = __samples[__pivot_rank * __num_samples / __n];
79*e4b17023SJohn Marino 
80*e4b17023SJohn Marino       __gnu_parallel::__binder2nd<_Compare, _ValueType, _ValueType, bool>
81*e4b17023SJohn Marino         __pred(__comp, __pivot);
82*e4b17023SJohn Marino       _DifferenceType __split = __parallel_partition(__begin, __end,
83*e4b17023SJohn Marino 						     __pred, __num_threads);
84*e4b17023SJohn Marino 
85*e4b17023SJohn Marino       for (_DifferenceType __s = 0; __s < __num_samples; ++__s)
86*e4b17023SJohn Marino 	__samples[__s].~_ValueType();
87*e4b17023SJohn Marino       ::operator delete(__samples);
88*e4b17023SJohn Marino 
89*e4b17023SJohn Marino       return __split;
90*e4b17023SJohn Marino     }
91*e4b17023SJohn Marino 
92*e4b17023SJohn Marino   /** @brief Unbalanced quicksort conquer step.
93*e4b17023SJohn Marino    *  @param __begin Begin iterator of subsequence.
94*e4b17023SJohn Marino    *  @param __end End iterator of subsequence.
95*e4b17023SJohn Marino    *  @param __comp Comparator.
96*e4b17023SJohn Marino    *  @param __num_threads Number of threads that are allowed to work on
97*e4b17023SJohn Marino    *  this part.
98*e4b17023SJohn Marino    */
99*e4b17023SJohn Marino   template<typename _RAIter, typename _Compare>
100*e4b17023SJohn Marino     void
__parallel_sort_qs_conquer(_RAIter __begin,_RAIter __end,_Compare __comp,_ThreadIndex __num_threads)101*e4b17023SJohn Marino     __parallel_sort_qs_conquer(_RAIter __begin, _RAIter __end,
102*e4b17023SJohn Marino 			       _Compare __comp,
103*e4b17023SJohn Marino 			       _ThreadIndex __num_threads)
104*e4b17023SJohn Marino     {
105*e4b17023SJohn Marino       typedef std::iterator_traits<_RAIter> _TraitsType;
106*e4b17023SJohn Marino       typedef typename _TraitsType::value_type _ValueType;
107*e4b17023SJohn Marino       typedef typename _TraitsType::difference_type _DifferenceType;
108*e4b17023SJohn Marino 
109*e4b17023SJohn Marino       if (__num_threads <= 1)
110*e4b17023SJohn Marino         {
111*e4b17023SJohn Marino           __gnu_sequential::sort(__begin, __end, __comp);
112*e4b17023SJohn Marino           return;
113*e4b17023SJohn Marino         }
114*e4b17023SJohn Marino 
115*e4b17023SJohn Marino       _DifferenceType __n = __end - __begin, __pivot_rank;
116*e4b17023SJohn Marino 
117*e4b17023SJohn Marino       if (__n <= 1)
118*e4b17023SJohn Marino         return;
119*e4b17023SJohn Marino 
120*e4b17023SJohn Marino       _ThreadIndex __num_threads_left;
121*e4b17023SJohn Marino 
122*e4b17023SJohn Marino       if ((__num_threads % 2) == 1)
123*e4b17023SJohn Marino         __num_threads_left = __num_threads / 2 + 1;
124*e4b17023SJohn Marino       else
125*e4b17023SJohn Marino         __num_threads_left = __num_threads / 2;
126*e4b17023SJohn Marino 
127*e4b17023SJohn Marino       __pivot_rank = __n * __num_threads_left / __num_threads;
128*e4b17023SJohn Marino 
129*e4b17023SJohn Marino       _DifferenceType __split = __parallel_sort_qs_divide
130*e4b17023SJohn Marino 	(__begin, __end, __comp, __pivot_rank,
131*e4b17023SJohn Marino 	 _Settings::get().sort_qs_num_samples_preset, __num_threads);
132*e4b17023SJohn Marino 
133*e4b17023SJohn Marino #pragma omp parallel sections num_threads(2)
134*e4b17023SJohn Marino       {
135*e4b17023SJohn Marino #pragma omp section
136*e4b17023SJohn Marino         __parallel_sort_qs_conquer(__begin, __begin + __split,
137*e4b17023SJohn Marino 				   __comp, __num_threads_left);
138*e4b17023SJohn Marino #pragma omp section
139*e4b17023SJohn Marino         __parallel_sort_qs_conquer(__begin + __split, __end,
140*e4b17023SJohn Marino 				   __comp, __num_threads - __num_threads_left);
141*e4b17023SJohn Marino       }
142*e4b17023SJohn Marino     }
143*e4b17023SJohn Marino 
144*e4b17023SJohn Marino 
145*e4b17023SJohn Marino   /** @brief Unbalanced quicksort main call.
146*e4b17023SJohn Marino    *  @param __begin Begin iterator of input sequence.
147*e4b17023SJohn Marino    *  @param __end End iterator input sequence, ignored.
148*e4b17023SJohn Marino    *  @param __comp Comparator.
149*e4b17023SJohn Marino    *  @param __num_threads Number of threads that are allowed to work on
150*e4b17023SJohn Marino    *  this part.
151*e4b17023SJohn Marino    */
152*e4b17023SJohn Marino   template<typename _RAIter, typename _Compare>
153*e4b17023SJohn Marino     void
__parallel_sort_qs(_RAIter __begin,_RAIter __end,_Compare __comp,_ThreadIndex __num_threads)154*e4b17023SJohn Marino     __parallel_sort_qs(_RAIter __begin, _RAIter __end,
155*e4b17023SJohn Marino 		       _Compare __comp,
156*e4b17023SJohn Marino 		       _ThreadIndex __num_threads)
157*e4b17023SJohn Marino     {
158*e4b17023SJohn Marino       _GLIBCXX_CALL(__n)
159*e4b17023SJohn Marino 
160*e4b17023SJohn Marino       typedef std::iterator_traits<_RAIter> _TraitsType;
161*e4b17023SJohn Marino       typedef typename _TraitsType::value_type _ValueType;
162*e4b17023SJohn Marino       typedef typename _TraitsType::difference_type _DifferenceType;
163*e4b17023SJohn Marino 
164*e4b17023SJohn Marino       _DifferenceType __n = __end - __begin;
165*e4b17023SJohn Marino 
166*e4b17023SJohn Marino       // At least one element per processor.
167*e4b17023SJohn Marino       if (__num_threads > __n)
168*e4b17023SJohn Marino         __num_threads = static_cast<_ThreadIndex>(__n);
169*e4b17023SJohn Marino 
170*e4b17023SJohn Marino       __parallel_sort_qs_conquer(
171*e4b17023SJohn Marino         __begin, __begin + __n, __comp, __num_threads);
172*e4b17023SJohn Marino     }
173*e4b17023SJohn Marino 
174*e4b17023SJohn Marino } //namespace __gnu_parallel
175*e4b17023SJohn Marino 
176*e4b17023SJohn Marino #endif /* _GLIBCXX_PARALLEL_QUICKSORT_H */
177