1*e4b17023SJohn Marino // -*- C++ -*- 2*e4b17023SJohn Marino 3*e4b17023SJohn Marino // Copyright (C) 2007, 2008, 2009, 2010, 2011 Free Software Foundation, Inc. 4*e4b17023SJohn Marino // 5*e4b17023SJohn Marino // This file is part of the GNU ISO C++ Library. This library is free 6*e4b17023SJohn Marino // software; you can redistribute it and/or modify it under the terms 7*e4b17023SJohn Marino // of the GNU General Public License as published by the Free Software 8*e4b17023SJohn Marino // Foundation; either version 3, or (at your option) any later 9*e4b17023SJohn Marino // version. 10*e4b17023SJohn Marino 11*e4b17023SJohn Marino // This library is distributed in the hope that it will be useful, but 12*e4b17023SJohn Marino // WITHOUT ANY WARRANTY; without even the implied warranty of 13*e4b17023SJohn Marino // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU 14*e4b17023SJohn Marino // General Public License for more details. 15*e4b17023SJohn Marino 16*e4b17023SJohn Marino // Under Section 7 of GPL version 3, you are granted additional 17*e4b17023SJohn Marino // permissions described in the GCC Runtime Library Exception, version 18*e4b17023SJohn Marino // 3.1, as published by the Free Software Foundation. 19*e4b17023SJohn Marino 20*e4b17023SJohn Marino // You should have received a copy of the GNU General Public License and 21*e4b17023SJohn Marino // a copy of the GCC Runtime Library Exception along with this program; 22*e4b17023SJohn Marino // see the files COPYING3 and COPYING.RUNTIME respectively. If not, see 23*e4b17023SJohn Marino // <http://www.gnu.org/licenses/>. 24*e4b17023SJohn Marino 25*e4b17023SJohn Marino /** @file parallel/quicksort.h 26*e4b17023SJohn Marino * @brief Implementation of a unbalanced parallel quicksort (in-place). 27*e4b17023SJohn Marino * This file is a GNU parallel extension to the Standard C++ Library. 28*e4b17023SJohn Marino */ 29*e4b17023SJohn Marino 30*e4b17023SJohn Marino // Written by Johannes Singler. 31*e4b17023SJohn Marino 32*e4b17023SJohn Marino #ifndef _GLIBCXX_PARALLEL_QUICKSORT_H 33*e4b17023SJohn Marino #define _GLIBCXX_PARALLEL_QUICKSORT_H 1 34*e4b17023SJohn Marino 35*e4b17023SJohn Marino #include <parallel/parallel.h> 36*e4b17023SJohn Marino #include <parallel/partition.h> 37*e4b17023SJohn Marino 38*e4b17023SJohn Marino namespace __gnu_parallel 39*e4b17023SJohn Marino { 40*e4b17023SJohn Marino /** @brief Unbalanced quicksort divide step. 41*e4b17023SJohn Marino * @param __begin Begin iterator of subsequence. 42*e4b17023SJohn Marino * @param __end End iterator of subsequence. 43*e4b17023SJohn Marino * @param __comp Comparator. 44*e4b17023SJohn Marino * @param __pivot_rank Desired __rank of the pivot. 45*e4b17023SJohn Marino * @param __num_samples Choose pivot from that many samples. 46*e4b17023SJohn Marino * @param __num_threads Number of threads that are allowed to work on 47*e4b17023SJohn Marino * this part. 48*e4b17023SJohn Marino */ 49*e4b17023SJohn Marino template<typename _RAIter, typename _Compare> 50*e4b17023SJohn Marino typename std::iterator_traits<_RAIter>::difference_type __parallel_sort_qs_divide(_RAIter __begin,_RAIter __end,_Compare __comp,typename std::iterator_traits<_RAIter>::difference_type __pivot_rank,typename std::iterator_traits<_RAIter>::difference_type __num_samples,_ThreadIndex __num_threads)51*e4b17023SJohn Marino __parallel_sort_qs_divide(_RAIter __begin, _RAIter __end, 52*e4b17023SJohn Marino _Compare __comp, typename std::iterator_traits 53*e4b17023SJohn Marino <_RAIter>::difference_type __pivot_rank, 54*e4b17023SJohn Marino typename std::iterator_traits 55*e4b17023SJohn Marino <_RAIter>::difference_type 56*e4b17023SJohn Marino __num_samples, _ThreadIndex __num_threads) 57*e4b17023SJohn Marino { 58*e4b17023SJohn Marino typedef std::iterator_traits<_RAIter> _TraitsType; 59*e4b17023SJohn Marino typedef typename _TraitsType::value_type _ValueType; 60*e4b17023SJohn Marino typedef typename _TraitsType::difference_type _DifferenceType; 61*e4b17023SJohn Marino 62*e4b17023SJohn Marino _DifferenceType __n = __end - __begin; 63*e4b17023SJohn Marino __num_samples = std::min(__num_samples, __n); 64*e4b17023SJohn Marino 65*e4b17023SJohn Marino // Allocate uninitialized, to avoid default constructor. 66*e4b17023SJohn Marino _ValueType* __samples = static_cast<_ValueType*> 67*e4b17023SJohn Marino (::operator new(__num_samples * sizeof(_ValueType))); 68*e4b17023SJohn Marino 69*e4b17023SJohn Marino for (_DifferenceType __s = 0; __s < __num_samples; ++__s) 70*e4b17023SJohn Marino { 71*e4b17023SJohn Marino const unsigned long long __index = static_cast<unsigned long long> 72*e4b17023SJohn Marino (__s) * __n / __num_samples; 73*e4b17023SJohn Marino ::new(&(__samples[__s])) _ValueType(__begin[__index]); 74*e4b17023SJohn Marino } 75*e4b17023SJohn Marino 76*e4b17023SJohn Marino __gnu_sequential::sort(__samples, __samples + __num_samples, __comp); 77*e4b17023SJohn Marino 78*e4b17023SJohn Marino _ValueType& __pivot = __samples[__pivot_rank * __num_samples / __n]; 79*e4b17023SJohn Marino 80*e4b17023SJohn Marino __gnu_parallel::__binder2nd<_Compare, _ValueType, _ValueType, bool> 81*e4b17023SJohn Marino __pred(__comp, __pivot); 82*e4b17023SJohn Marino _DifferenceType __split = __parallel_partition(__begin, __end, 83*e4b17023SJohn Marino __pred, __num_threads); 84*e4b17023SJohn Marino 85*e4b17023SJohn Marino for (_DifferenceType __s = 0; __s < __num_samples; ++__s) 86*e4b17023SJohn Marino __samples[__s].~_ValueType(); 87*e4b17023SJohn Marino ::operator delete(__samples); 88*e4b17023SJohn Marino 89*e4b17023SJohn Marino return __split; 90*e4b17023SJohn Marino } 91*e4b17023SJohn Marino 92*e4b17023SJohn Marino /** @brief Unbalanced quicksort conquer step. 93*e4b17023SJohn Marino * @param __begin Begin iterator of subsequence. 94*e4b17023SJohn Marino * @param __end End iterator of subsequence. 95*e4b17023SJohn Marino * @param __comp Comparator. 96*e4b17023SJohn Marino * @param __num_threads Number of threads that are allowed to work on 97*e4b17023SJohn Marino * this part. 98*e4b17023SJohn Marino */ 99*e4b17023SJohn Marino template<typename _RAIter, typename _Compare> 100*e4b17023SJohn Marino void __parallel_sort_qs_conquer(_RAIter __begin,_RAIter __end,_Compare __comp,_ThreadIndex __num_threads)101*e4b17023SJohn Marino __parallel_sort_qs_conquer(_RAIter __begin, _RAIter __end, 102*e4b17023SJohn Marino _Compare __comp, 103*e4b17023SJohn Marino _ThreadIndex __num_threads) 104*e4b17023SJohn Marino { 105*e4b17023SJohn Marino typedef std::iterator_traits<_RAIter> _TraitsType; 106*e4b17023SJohn Marino typedef typename _TraitsType::value_type _ValueType; 107*e4b17023SJohn Marino typedef typename _TraitsType::difference_type _DifferenceType; 108*e4b17023SJohn Marino 109*e4b17023SJohn Marino if (__num_threads <= 1) 110*e4b17023SJohn Marino { 111*e4b17023SJohn Marino __gnu_sequential::sort(__begin, __end, __comp); 112*e4b17023SJohn Marino return; 113*e4b17023SJohn Marino } 114*e4b17023SJohn Marino 115*e4b17023SJohn Marino _DifferenceType __n = __end - __begin, __pivot_rank; 116*e4b17023SJohn Marino 117*e4b17023SJohn Marino if (__n <= 1) 118*e4b17023SJohn Marino return; 119*e4b17023SJohn Marino 120*e4b17023SJohn Marino _ThreadIndex __num_threads_left; 121*e4b17023SJohn Marino 122*e4b17023SJohn Marino if ((__num_threads % 2) == 1) 123*e4b17023SJohn Marino __num_threads_left = __num_threads / 2 + 1; 124*e4b17023SJohn Marino else 125*e4b17023SJohn Marino __num_threads_left = __num_threads / 2; 126*e4b17023SJohn Marino 127*e4b17023SJohn Marino __pivot_rank = __n * __num_threads_left / __num_threads; 128*e4b17023SJohn Marino 129*e4b17023SJohn Marino _DifferenceType __split = __parallel_sort_qs_divide 130*e4b17023SJohn Marino (__begin, __end, __comp, __pivot_rank, 131*e4b17023SJohn Marino _Settings::get().sort_qs_num_samples_preset, __num_threads); 132*e4b17023SJohn Marino 133*e4b17023SJohn Marino #pragma omp parallel sections num_threads(2) 134*e4b17023SJohn Marino { 135*e4b17023SJohn Marino #pragma omp section 136*e4b17023SJohn Marino __parallel_sort_qs_conquer(__begin, __begin + __split, 137*e4b17023SJohn Marino __comp, __num_threads_left); 138*e4b17023SJohn Marino #pragma omp section 139*e4b17023SJohn Marino __parallel_sort_qs_conquer(__begin + __split, __end, 140*e4b17023SJohn Marino __comp, __num_threads - __num_threads_left); 141*e4b17023SJohn Marino } 142*e4b17023SJohn Marino } 143*e4b17023SJohn Marino 144*e4b17023SJohn Marino 145*e4b17023SJohn Marino /** @brief Unbalanced quicksort main call. 146*e4b17023SJohn Marino * @param __begin Begin iterator of input sequence. 147*e4b17023SJohn Marino * @param __end End iterator input sequence, ignored. 148*e4b17023SJohn Marino * @param __comp Comparator. 149*e4b17023SJohn Marino * @param __num_threads Number of threads that are allowed to work on 150*e4b17023SJohn Marino * this part. 151*e4b17023SJohn Marino */ 152*e4b17023SJohn Marino template<typename _RAIter, typename _Compare> 153*e4b17023SJohn Marino void __parallel_sort_qs(_RAIter __begin,_RAIter __end,_Compare __comp,_ThreadIndex __num_threads)154*e4b17023SJohn Marino __parallel_sort_qs(_RAIter __begin, _RAIter __end, 155*e4b17023SJohn Marino _Compare __comp, 156*e4b17023SJohn Marino _ThreadIndex __num_threads) 157*e4b17023SJohn Marino { 158*e4b17023SJohn Marino _GLIBCXX_CALL(__n) 159*e4b17023SJohn Marino 160*e4b17023SJohn Marino typedef std::iterator_traits<_RAIter> _TraitsType; 161*e4b17023SJohn Marino typedef typename _TraitsType::value_type _ValueType; 162*e4b17023SJohn Marino typedef typename _TraitsType::difference_type _DifferenceType; 163*e4b17023SJohn Marino 164*e4b17023SJohn Marino _DifferenceType __n = __end - __begin; 165*e4b17023SJohn Marino 166*e4b17023SJohn Marino // At least one element per processor. 167*e4b17023SJohn Marino if (__num_threads > __n) 168*e4b17023SJohn Marino __num_threads = static_cast<_ThreadIndex>(__n); 169*e4b17023SJohn Marino 170*e4b17023SJohn Marino __parallel_sort_qs_conquer( 171*e4b17023SJohn Marino __begin, __begin + __n, __comp, __num_threads); 172*e4b17023SJohn Marino } 173*e4b17023SJohn Marino 174*e4b17023SJohn Marino } //namespace __gnu_parallel 175*e4b17023SJohn Marino 176*e4b17023SJohn Marino #endif /* _GLIBCXX_PARALLEL_QUICKSORT_H */ 177