2007-09-12 00:32:51 +02:00
|
|
|
// -*- C++ -*-
|
|
|
|
|
2009-04-09 17:00:19 +02:00
|
|
|
// Copyright (C) 2007, 2008, 2009 Free Software Foundation, Inc.
|
2007-09-12 00:32:51 +02:00
|
|
|
//
|
|
|
|
// This file is part of the GNU ISO C++ Library. This library is free
|
|
|
|
// software; you can redistribute it and/or modify it under the terms
|
|
|
|
// of the GNU General Public License as published by the Free Software
|
2009-04-09 17:00:19 +02:00
|
|
|
// Foundation; either version 3, or (at your option) any later
|
2007-09-12 00:32:51 +02:00
|
|
|
// version.
|
|
|
|
|
|
|
|
// This library is distributed in the hope that it will be useful, but
|
|
|
|
// WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
|
|
// General Public License for more details.
|
|
|
|
|
2009-04-09 17:00:19 +02:00
|
|
|
// Under Section 7 of GPL version 3, you are granted additional
|
|
|
|
// permissions described in the GCC Runtime Library Exception, version
|
|
|
|
// 3.1, as published by the Free Software Foundation.
|
2007-09-12 00:32:51 +02:00
|
|
|
|
2009-04-09 17:00:19 +02:00
|
|
|
// You should have received a copy of the GNU General Public License and
|
|
|
|
// a copy of the GCC Runtime Library Exception along with this program;
|
|
|
|
// see the files COPYING3 and COPYING.RUNTIME respectively. If not, see
|
|
|
|
// <http://www.gnu.org/licenses/>.
|
2007-09-12 00:32:51 +02:00
|
|
|
|
|
|
|
/** @file parallel/multiway_mergesort.h
|
|
|
|
* @brief Parallel multiway merge sort.
|
|
|
|
* This file is a GNU parallel extension to the Standard C++ Library.
|
|
|
|
*/
|
|
|
|
|
|
|
|
// Written by Johannes Singler.
|
|
|
|
|
2008-07-15 12:06:58 +02:00
|
|
|
#ifndef _GLIBCXX_PARALLEL_MULTIWAY_MERGESORT_H
|
|
|
|
#define _GLIBCXX_PARALLEL_MULTIWAY_MERGESORT_H 1
|
2007-09-12 00:32:51 +02:00
|
|
|
|
|
|
|
#include <vector>
|
|
|
|
|
|
|
|
#include <parallel/basic_iterator.h>
|
|
|
|
#include <bits/stl_algo.h>
|
|
|
|
#include <parallel/parallel.h>
|
|
|
|
#include <parallel/multiway_merge.h>
|
|
|
|
|
|
|
|
namespace __gnu_parallel
|
|
|
|
{
|
|
|
|
|
2007-11-22 11:13:08 +01:00
|
|
|
/** @brief Subsequence description. */
|
|
|
|
template<typename _DifferenceTp>
|
2009-09-16 11:47:25 +02:00
|
|
|
struct _Piece
|
2007-09-12 00:32:51 +02:00
|
|
|
{
|
2009-09-16 11:47:25 +02:00
|
|
|
typedef _DifferenceTp _DifferenceType;
|
2007-09-12 00:32:51 +02:00
|
|
|
|
|
|
|
/** @brief Begin of subsequence. */
|
2009-09-16 11:47:25 +02:00
|
|
|
_DifferenceType __begin;
|
2007-09-12 00:32:51 +02:00
|
|
|
|
|
|
|
/** @brief End of subsequence. */
|
2009-09-16 11:47:25 +02:00
|
|
|
_DifferenceType __end;
|
2007-09-12 00:32:51 +02:00
|
|
|
};
|
|
|
|
|
2007-11-22 11:13:08 +01:00
|
|
|
/** @brief Data accessed by all threads.
|
|
|
|
*
|
|
|
|
* PMWMS = parallel multiway mergesort */
|
2009-09-16 11:47:25 +02:00
|
|
|
template<typename _RAIter>
|
|
|
|
struct _PMWMSSortingData
|
2007-09-12 00:32:51 +02:00
|
|
|
{
|
2009-09-16 11:47:25 +02:00
|
|
|
typedef std::iterator_traits<_RAIter> _TraitsType;
|
|
|
|
typedef typename _TraitsType::value_type _ValueType;
|
|
|
|
typedef typename _TraitsType::difference_type _DifferenceType;
|
2007-09-12 00:32:51 +02:00
|
|
|
|
2007-11-22 11:13:08 +01:00
|
|
|
/** @brief Number of threads involved. */
|
2009-09-16 11:47:25 +02:00
|
|
|
_ThreadIndex __num_threads;
|
2007-11-22 11:13:08 +01:00
|
|
|
|
2009-09-16 11:47:25 +02:00
|
|
|
/** @brief Input __begin. */
|
|
|
|
_RAIter _M_source;
|
2007-09-12 00:32:51 +02:00
|
|
|
|
|
|
|
/** @brief Start indices, per thread. */
|
2009-09-16 11:47:25 +02:00
|
|
|
_DifferenceType* _M_starts;
|
2007-09-12 00:32:51 +02:00
|
|
|
|
|
|
|
/** @brief Storage in which to sort. */
|
2009-09-16 11:47:25 +02:00
|
|
|
_ValueType** _M_temporary;
|
2007-09-12 00:32:51 +02:00
|
|
|
|
|
|
|
/** @brief Samples. */
|
2009-09-16 11:47:25 +02:00
|
|
|
_ValueType* _M_samples;
|
2007-09-12 00:32:51 +02:00
|
|
|
|
|
|
|
/** @brief Offsets to add to the found positions. */
|
2009-09-16 11:47:25 +02:00
|
|
|
_DifferenceType* _M_offsets;
|
2007-09-12 00:32:51 +02:00
|
|
|
|
2009-09-16 11:47:25 +02:00
|
|
|
/** @brief Pieces of data to merge @__c [thread][__sequence] */
|
|
|
|
std::vector<_Piece<_DifferenceType> >* _M_pieces;
|
2007-11-22 11:13:08 +01:00
|
|
|
};
|
|
|
|
|
|
|
|
/**
|
2009-09-16 11:47:25 +02:00
|
|
|
* @brief Select _M_samples from a sequence.
|
|
|
|
* @param __sd Pointer to algorithm data. _Result will be placed in
|
|
|
|
* @__c __sd->_M_samples.
|
|
|
|
* @param __num_samples Number of _M_samples to select.
|
2007-11-22 11:13:08 +01:00
|
|
|
*/
|
2009-09-16 11:47:25 +02:00
|
|
|
template<typename _RAIter, typename _DifferenceTp>
|
2008-01-10 03:07:41 +01:00
|
|
|
void
|
2009-09-16 11:47:25 +02:00
|
|
|
__determine_samples(_PMWMSSortingData<_RAIter>* __sd,
|
|
|
|
_DifferenceTp __num_samples)
|
2007-09-12 00:32:51 +02:00
|
|
|
{
|
2009-09-16 11:47:25 +02:00
|
|
|
typedef std::iterator_traits<_RAIter> _TraitsType;
|
|
|
|
typedef typename _TraitsType::value_type _ValueType;
|
|
|
|
typedef _DifferenceTp _DifferenceType;
|
2007-09-12 00:32:51 +02:00
|
|
|
|
2009-09-16 11:47:25 +02:00
|
|
|
_ThreadIndex __iam = omp_get_thread_num();
|
2007-09-12 00:32:51 +02:00
|
|
|
|
2009-09-16 11:47:25 +02:00
|
|
|
_DifferenceType* __es = new _DifferenceType[__num_samples + 2];
|
2007-10-09 23:51:06 +02:00
|
|
|
|
2009-09-16 11:47:25 +02:00
|
|
|
equally_split(__sd->_M_starts[__iam + 1] - __sd->_M_starts[__iam],
|
|
|
|
__num_samples + 1, __es);
|
2007-09-12 00:32:51 +02:00
|
|
|
|
2009-09-16 11:47:25 +02:00
|
|
|
for (_DifferenceType __i = 0; __i < __num_samples; ++__i)
|
|
|
|
::new(&(__sd->_M_samples[__iam * __num_samples + __i]))
|
|
|
|
_ValueType(__sd->_M_source[__sd->_M_starts[__iam] + __es[__i + 1]]);
|
2007-11-22 11:13:08 +01:00
|
|
|
|
2009-09-16 11:47:25 +02:00
|
|
|
delete[] __es;
|
2007-09-12 00:32:51 +02:00
|
|
|
}
|
|
|
|
|
2008-04-07 10:27:34 +02:00
|
|
|
/** @brief Split consistently. */
|
2009-09-16 11:47:25 +02:00
|
|
|
template<bool __exact, typename _RAIter,
|
|
|
|
typename _Compare, typename _SortingPlacesIterator>
|
|
|
|
struct _SplitConsistently
|
2008-04-07 10:27:34 +02:00
|
|
|
{
|
|
|
|
};
|
|
|
|
|
|
|
|
/** @brief Split by exact splitting. */
|
2009-09-16 11:47:25 +02:00
|
|
|
template<typename _RAIter, typename _Compare,
|
|
|
|
typename _SortingPlacesIterator>
|
|
|
|
struct _SplitConsistently
|
|
|
|
<true, _RAIter, _Compare, _SortingPlacesIterator>
|
2008-04-07 10:27:34 +02:00
|
|
|
{
|
|
|
|
void operator()(
|
2009-09-16 11:47:25 +02:00
|
|
|
const _ThreadIndex __iam,
|
|
|
|
_PMWMSSortingData<_RAIter>* __sd,
|
|
|
|
_Compare& __comp,
|
2008-04-07 10:27:34 +02:00
|
|
|
const typename
|
2009-09-16 11:47:25 +02:00
|
|
|
std::iterator_traits<_RAIter>::difference_type
|
|
|
|
__num_samples)
|
2008-04-07 10:27:34 +02:00
|
|
|
const
|
|
|
|
{
|
|
|
|
# pragma omp barrier
|
|
|
|
|
2009-09-16 11:47:25 +02:00
|
|
|
std::vector<std::pair<_SortingPlacesIterator, _SortingPlacesIterator> >
|
|
|
|
seqs(__sd->__num_threads);
|
|
|
|
for (_ThreadIndex __s = 0; __s < __sd->__num_threads; __s++)
|
|
|
|
seqs[__s] = std::make_pair(__sd->_M_temporary[__s],
|
|
|
|
__sd->_M_temporary[__s]
|
|
|
|
+ (__sd->_M_starts[__s + 1] - __sd->_M_starts[__s]));
|
2008-04-07 10:27:34 +02:00
|
|
|
|
2009-09-16 11:47:25 +02:00
|
|
|
std::vector<_SortingPlacesIterator> _M_offsets(__sd->__num_threads);
|
2008-04-07 10:27:34 +02:00
|
|
|
|
|
|
|
// if not last thread
|
2009-09-16 11:47:25 +02:00
|
|
|
if (__iam < __sd->__num_threads - 1)
|
2008-04-07 10:27:34 +02:00
|
|
|
multiseq_partition(seqs.begin(), seqs.end(),
|
2009-09-16 11:47:25 +02:00
|
|
|
__sd->_M_starts[__iam + 1], _M_offsets.begin(), __comp);
|
2008-04-07 10:27:34 +02:00
|
|
|
|
2009-09-16 11:47:25 +02:00
|
|
|
for (int __seq = 0; __seq < __sd->__num_threads; __seq++)
|
2008-04-07 10:27:34 +02:00
|
|
|
{
|
|
|
|
// for each sequence
|
2009-09-16 11:47:25 +02:00
|
|
|
if (__iam < (__sd->__num_threads - 1))
|
|
|
|
__sd->_M_pieces[__iam][__seq].__end = _M_offsets[__seq] - seqs[__seq].first;
|
2008-04-07 10:27:34 +02:00
|
|
|
else
|
|
|
|
// very end of this sequence
|
2009-09-16 11:47:25 +02:00
|
|
|
__sd->_M_pieces[__iam][__seq].__end =
|
|
|
|
__sd->_M_starts[__seq + 1] - __sd->_M_starts[__seq];
|
2008-04-07 10:27:34 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
# pragma omp barrier
|
|
|
|
|
2009-09-16 11:47:25 +02:00
|
|
|
for (_ThreadIndex __seq = 0; __seq < __sd->__num_threads; __seq++)
|
2008-04-07 10:27:34 +02:00
|
|
|
{
|
|
|
|
// For each sequence.
|
2009-09-16 11:47:25 +02:00
|
|
|
if (__iam > 0)
|
|
|
|
__sd->_M_pieces[__iam][__seq].__begin = __sd->_M_pieces[__iam - 1][__seq].__end;
|
2008-04-07 10:27:34 +02:00
|
|
|
else
|
|
|
|
// Absolute beginning.
|
2009-09-16 11:47:25 +02:00
|
|
|
__sd->_M_pieces[__iam][__seq].__begin = 0;
|
2008-04-07 10:27:34 +02:00
|
|
|
}
|
|
|
|
}
|
|
|
|
};
|
|
|
|
|
|
|
|
/** @brief Split by sampling. */
|
2009-09-16 11:47:25 +02:00
|
|
|
template<typename _RAIter, typename _Compare,
|
|
|
|
typename _SortingPlacesIterator>
|
|
|
|
struct _SplitConsistently<false, _RAIter, _Compare,
|
|
|
|
_SortingPlacesIterator>
|
2008-04-07 10:27:34 +02:00
|
|
|
{
|
|
|
|
void operator()(
|
2009-09-16 11:47:25 +02:00
|
|
|
const _ThreadIndex __iam,
|
|
|
|
_PMWMSSortingData<_RAIter>* __sd,
|
|
|
|
_Compare& __comp,
|
2008-04-07 10:27:34 +02:00
|
|
|
const typename
|
2009-09-16 11:47:25 +02:00
|
|
|
std::iterator_traits<_RAIter>::difference_type
|
|
|
|
__num_samples)
|
2008-04-07 10:27:34 +02:00
|
|
|
const
|
|
|
|
{
|
2009-09-16 11:47:25 +02:00
|
|
|
typedef std::iterator_traits<_RAIter> _TraitsType;
|
|
|
|
typedef typename _TraitsType::value_type _ValueType;
|
|
|
|
typedef typename _TraitsType::difference_type _DifferenceType;
|
2008-04-07 10:27:34 +02:00
|
|
|
|
2009-09-16 11:47:25 +02:00
|
|
|
__determine_samples(__sd, __num_samples);
|
2008-04-07 10:27:34 +02:00
|
|
|
|
|
|
|
# pragma omp barrier
|
|
|
|
|
|
|
|
# pragma omp single
|
2009-09-16 11:47:25 +02:00
|
|
|
__gnu_sequential::sort(__sd->_M_samples,
|
|
|
|
__sd->_M_samples + (__num_samples * __sd->__num_threads),
|
|
|
|
__comp);
|
2008-04-07 10:27:34 +02:00
|
|
|
|
|
|
|
# pragma omp barrier
|
|
|
|
|
2009-09-16 11:47:25 +02:00
|
|
|
for (_ThreadIndex __s = 0; __s < __sd->__num_threads; ++__s)
|
2008-04-07 10:27:34 +02:00
|
|
|
{
|
|
|
|
// For each sequence.
|
2009-09-16 11:47:25 +02:00
|
|
|
if (__num_samples * __iam > 0)
|
|
|
|
__sd->_M_pieces[__iam][__s].__begin =
|
|
|
|
std::lower_bound(__sd->_M_temporary[__s],
|
|
|
|
__sd->_M_temporary[__s]
|
|
|
|
+ (__sd->_M_starts[__s + 1] - __sd->_M_starts[__s]),
|
|
|
|
__sd->_M_samples[__num_samples * __iam],
|
|
|
|
__comp)
|
|
|
|
- __sd->_M_temporary[__s];
|
2008-04-07 10:27:34 +02:00
|
|
|
else
|
|
|
|
// Absolute beginning.
|
2009-09-16 11:47:25 +02:00
|
|
|
__sd->_M_pieces[__iam][__s].__begin = 0;
|
|
|
|
|
|
|
|
if ((__num_samples * (__iam + 1)) < (__num_samples * __sd->__num_threads))
|
|
|
|
__sd->_M_pieces[__iam][__s].__end =
|
|
|
|
std::lower_bound(__sd->_M_temporary[__s],
|
|
|
|
__sd->_M_temporary[__s]
|
|
|
|
+ (__sd->_M_starts[__s + 1] - __sd->_M_starts[__s]),
|
|
|
|
__sd->_M_samples[__num_samples * (__iam + 1)],
|
|
|
|
__comp)
|
|
|
|
- __sd->_M_temporary[__s];
|
2008-04-07 10:27:34 +02:00
|
|
|
else
|
2009-09-16 11:47:25 +02:00
|
|
|
// Absolute __end.
|
|
|
|
__sd->_M_pieces[__iam][__s].__end = __sd->_M_starts[__s + 1] - __sd->_M_starts[__s];
|
2008-04-07 10:27:34 +02:00
|
|
|
}
|
|
|
|
}
|
|
|
|
};
|
|
|
|
|
2009-09-16 11:47:25 +02:00
|
|
|
template<bool __stable, typename _RAIter, typename _Compare>
|
|
|
|
struct __possibly_stable_sort
|
2008-04-07 10:27:34 +02:00
|
|
|
{
|
|
|
|
};
|
|
|
|
|
2009-09-16 11:47:25 +02:00
|
|
|
template<typename _RAIter, typename _Compare>
|
|
|
|
struct __possibly_stable_sort<true, _RAIter, _Compare>
|
2008-04-07 10:27:34 +02:00
|
|
|
{
|
2009-09-16 11:47:25 +02:00
|
|
|
void operator()(const _RAIter& __begin,
|
|
|
|
const _RAIter& __end, _Compare& __comp) const
|
2008-04-07 10:27:34 +02:00
|
|
|
{
|
2009-09-16 11:47:25 +02:00
|
|
|
__gnu_sequential::stable_sort(__begin, __end, __comp);
|
2008-04-07 10:27:34 +02:00
|
|
|
}
|
|
|
|
};
|
|
|
|
|
2009-09-16 11:47:25 +02:00
|
|
|
template<typename _RAIter, typename _Compare>
|
|
|
|
struct __possibly_stable_sort<false, _RAIter, _Compare>
|
2008-04-07 10:27:34 +02:00
|
|
|
{
|
2009-09-16 11:47:25 +02:00
|
|
|
void operator()(const _RAIter __begin,
|
|
|
|
const _RAIter __end, _Compare& __comp) const
|
2008-04-07 10:27:34 +02:00
|
|
|
{
|
2009-09-16 11:47:25 +02:00
|
|
|
__gnu_sequential::sort(__begin, __end, __comp);
|
2008-04-07 10:27:34 +02:00
|
|
|
}
|
|
|
|
};
|
|
|
|
|
2009-09-16 11:47:25 +02:00
|
|
|
template<bool __stable, typename Seq_RAIter,
|
|
|
|
typename _RAIter, typename _Compare,
|
2008-04-07 10:27:34 +02:00
|
|
|
typename DiffType>
|
2009-09-16 11:47:25 +02:00
|
|
|
struct __possibly_stable_multiway_merge
|
2008-04-07 10:27:34 +02:00
|
|
|
{
|
|
|
|
};
|
|
|
|
|
2009-09-16 11:47:25 +02:00
|
|
|
template<typename Seq_RAIter, typename _RAIter,
|
|
|
|
typename _Compare, typename DiffType>
|
|
|
|
struct __possibly_stable_multiway_merge
|
|
|
|
<true, Seq_RAIter, _RAIter, _Compare,
|
2008-04-07 10:27:34 +02:00
|
|
|
DiffType>
|
|
|
|
{
|
2009-09-16 11:47:25 +02:00
|
|
|
void operator()(const Seq_RAIter& __seqs_begin,
|
|
|
|
const Seq_RAIter& __seqs_end,
|
|
|
|
const _RAIter& __target,
|
|
|
|
_Compare& __comp,
|
|
|
|
DiffType __length_am) const
|
2008-04-07 10:27:34 +02:00
|
|
|
{
|
2009-09-16 11:47:25 +02:00
|
|
|
stable_multiway_merge(__seqs_begin, __seqs_end, __target, __length_am, __comp,
|
2008-05-16 09:10:26 +02:00
|
|
|
sequential_tag());
|
2008-04-07 10:27:34 +02:00
|
|
|
}
|
|
|
|
};
|
|
|
|
|
2009-09-16 11:47:25 +02:00
|
|
|
template<typename Seq_RAIter, typename _RAIter,
|
|
|
|
typename _Compare, typename DiffType>
|
|
|
|
struct __possibly_stable_multiway_merge
|
|
|
|
<false, Seq_RAIter, _RAIter, _Compare,
|
2008-04-07 10:27:34 +02:00
|
|
|
DiffType>
|
|
|
|
{
|
2009-09-16 11:47:25 +02:00
|
|
|
void operator()(const Seq_RAIter& __seqs_begin,
|
|
|
|
const Seq_RAIter& __seqs_end,
|
|
|
|
const _RAIter& __target,
|
|
|
|
_Compare& __comp,
|
|
|
|
DiffType __length_am) const
|
2008-04-07 10:27:34 +02:00
|
|
|
{
|
2009-09-16 11:47:25 +02:00
|
|
|
multiway_merge(__seqs_begin, __seqs_end, __target, __length_am, __comp,
|
2008-05-16 09:10:26 +02:00
|
|
|
sequential_tag());
|
2008-04-07 10:27:34 +02:00
|
|
|
}
|
|
|
|
};
|
|
|
|
|
2007-11-22 11:13:08 +01:00
|
|
|
/** @brief PMWMS code executed by each thread.
|
2009-09-16 11:47:25 +02:00
|
|
|
* @param __sd Pointer to algorithm data.
|
|
|
|
* @param __comp Comparator.
|
2007-11-22 11:13:08 +01:00
|
|
|
*/
|
2009-09-16 11:47:25 +02:00
|
|
|
template<bool __stable, bool __exact, typename _RAIter,
|
|
|
|
typename _Compare>
|
2008-01-10 03:07:41 +01:00
|
|
|
void
|
2009-09-16 11:47:25 +02:00
|
|
|
parallel_sort_mwms_pu(_PMWMSSortingData<_RAIter>* __sd,
|
|
|
|
_Compare& __comp)
|
2007-09-12 00:32:51 +02:00
|
|
|
{
|
2009-09-16 11:47:25 +02:00
|
|
|
typedef std::iterator_traits<_RAIter> _TraitsType;
|
|
|
|
typedef typename _TraitsType::value_type _ValueType;
|
|
|
|
typedef typename _TraitsType::difference_type _DifferenceType;
|
2007-09-12 00:32:51 +02:00
|
|
|
|
2009-09-16 11:47:25 +02:00
|
|
|
_ThreadIndex __iam = omp_get_thread_num();
|
2007-09-12 00:32:51 +02:00
|
|
|
|
|
|
|
// Length of this thread's chunk, before merging.
|
2009-09-16 11:47:25 +02:00
|
|
|
_DifferenceType __length_local = __sd->_M_starts[__iam + 1] - __sd->_M_starts[__iam];
|
2007-09-12 00:32:51 +02:00
|
|
|
|
2008-04-07 10:27:34 +02:00
|
|
|
// Sort in temporary storage, leave space for sentinel.
|
2007-09-12 00:32:51 +02:00
|
|
|
|
2009-09-16 11:47:25 +02:00
|
|
|
typedef _ValueType* _SortingPlacesIterator;
|
2007-09-12 00:32:51 +02:00
|
|
|
|
2009-09-16 11:47:25 +02:00
|
|
|
__sd->_M_temporary[__iam] =
|
|
|
|
static_cast<_ValueType*>(
|
|
|
|
::operator new(sizeof(_ValueType) * (__length_local + 1)));
|
2007-09-12 00:32:51 +02:00
|
|
|
|
|
|
|
// Copy there.
|
2009-09-16 11:47:25 +02:00
|
|
|
std::uninitialized_copy(__sd->_M_source + __sd->_M_starts[__iam],
|
|
|
|
__sd->_M_source + __sd->_M_starts[__iam] + __length_local,
|
|
|
|
__sd->_M_temporary[__iam]);
|
2007-11-22 11:13:08 +01:00
|
|
|
|
2009-09-16 11:47:25 +02:00
|
|
|
__possibly_stable_sort<__stable, _SortingPlacesIterator, _Compare>()
|
|
|
|
(__sd->_M_temporary[__iam], __sd->_M_temporary[__iam] + __length_local, __comp);
|
2007-11-22 11:13:08 +01:00
|
|
|
|
2009-09-16 11:47:25 +02:00
|
|
|
// Invariant: locally sorted subsequence in sd->_M_temporary[__iam],
|
|
|
|
// __sd->_M_temporary[__iam] + __length_local.
|
2007-11-22 11:13:08 +01:00
|
|
|
|
2008-04-07 10:27:34 +02:00
|
|
|
// No barrier here: Synchronization is done by the splitting routine.
|
2007-11-22 11:13:08 +01:00
|
|
|
|
2009-09-16 11:47:25 +02:00
|
|
|
_DifferenceType __num_samples =
|
|
|
|
_Settings::get().sort_mwms_oversampling * __sd->__num_threads - 1;
|
|
|
|
_SplitConsistently
|
|
|
|
<__exact, _RAIter, _Compare, _SortingPlacesIterator>()
|
|
|
|
(__iam, __sd, __comp, __num_samples);
|
2007-09-12 00:32:51 +02:00
|
|
|
|
2009-09-16 11:47:25 +02:00
|
|
|
// Offset from __target __begin, __length after merging.
|
|
|
|
_DifferenceType __offset = 0, __length_am = 0;
|
|
|
|
for (_ThreadIndex __s = 0; __s < __sd->__num_threads; __s++)
|
2007-09-12 00:32:51 +02:00
|
|
|
{
|
2009-09-16 11:47:25 +02:00
|
|
|
__length_am += __sd->_M_pieces[__iam][__s].__end - __sd->_M_pieces[__iam][__s].__begin;
|
|
|
|
__offset += __sd->_M_pieces[__iam][__s].__begin;
|
2007-09-12 00:32:51 +02:00
|
|
|
}
|
|
|
|
|
2008-04-07 10:27:34 +02:00
|
|
|
typedef std::vector<
|
2009-09-16 11:47:25 +02:00
|
|
|
std::pair<_SortingPlacesIterator, _SortingPlacesIterator> >
|
2008-04-07 10:27:34 +02:00
|
|
|
seq_vector_type;
|
2009-09-16 11:47:25 +02:00
|
|
|
seq_vector_type seqs(__sd->__num_threads);
|
2007-09-12 00:32:51 +02:00
|
|
|
|
2009-09-16 11:47:25 +02:00
|
|
|
for (int __s = 0; __s < __sd->__num_threads; ++__s)
|
2007-09-12 00:32:51 +02:00
|
|
|
{
|
2009-09-16 11:47:25 +02:00
|
|
|
seqs[__s] =
|
|
|
|
std::make_pair(__sd->_M_temporary[__s] + __sd->_M_pieces[__iam][__s].__begin,
|
|
|
|
__sd->_M_temporary[__s] + __sd->_M_pieces[__iam][__s].__end);
|
2007-09-12 00:32:51 +02:00
|
|
|
}
|
|
|
|
|
2009-09-16 11:47:25 +02:00
|
|
|
__possibly_stable_multiway_merge<
|
|
|
|
__stable,
|
2008-04-07 10:27:34 +02:00
|
|
|
typename seq_vector_type::iterator,
|
2009-09-16 11:47:25 +02:00
|
|
|
_RAIter,
|
|
|
|
_Compare, _DifferenceType>()
|
2008-04-07 10:27:34 +02:00
|
|
|
(seqs.begin(), seqs.end(),
|
2009-09-16 11:47:25 +02:00
|
|
|
__sd->_M_source + __offset, __comp,
|
|
|
|
__length_am);
|
2007-09-12 00:32:51 +02:00
|
|
|
|
2007-11-22 11:13:08 +01:00
|
|
|
# pragma omp barrier
|
2007-09-12 00:32:51 +02:00
|
|
|
|
2009-09-16 11:47:25 +02:00
|
|
|
::operator delete(__sd->_M_temporary[__iam]);
|
2007-09-12 00:32:51 +02:00
|
|
|
}
|
|
|
|
|
2007-11-22 11:13:08 +01:00
|
|
|
/** @brief PMWMS main call.
|
2009-09-16 11:47:25 +02:00
|
|
|
* @param __begin Begin iterator of sequence.
|
|
|
|
* @param __end End iterator of sequence.
|
|
|
|
* @param __comp Comparator.
|
|
|
|
* @param __n Length of sequence.
|
|
|
|
* @param __num_threads Number of threads to use.
|
2007-11-22 11:13:08 +01:00
|
|
|
*/
|
2009-09-16 11:47:25 +02:00
|
|
|
template<bool __stable, bool __exact, typename _RAIter,
|
|
|
|
typename _Compare>
|
2008-01-10 03:07:41 +01:00
|
|
|
void
|
2009-09-16 11:47:25 +02:00
|
|
|
parallel_sort_mwms(_RAIter __begin, _RAIter __end,
|
|
|
|
_Compare __comp,
|
|
|
|
_ThreadIndex __num_threads)
|
2007-09-12 00:32:51 +02:00
|
|
|
{
|
2009-09-16 11:47:25 +02:00
|
|
|
_GLIBCXX_CALL(__end - __begin)
|
2007-11-22 11:13:08 +01:00
|
|
|
|
2009-09-16 11:47:25 +02:00
|
|
|
typedef std::iterator_traits<_RAIter> _TraitsType;
|
|
|
|
typedef typename _TraitsType::value_type _ValueType;
|
|
|
|
typedef typename _TraitsType::difference_type _DifferenceType;
|
2007-09-12 00:32:51 +02:00
|
|
|
|
2009-09-16 11:47:25 +02:00
|
|
|
_DifferenceType __n = __end - __begin;
|
2008-04-07 10:27:34 +02:00
|
|
|
|
2009-09-16 11:47:25 +02:00
|
|
|
if (__n <= 1)
|
2007-09-12 00:32:51 +02:00
|
|
|
return;
|
|
|
|
|
2007-11-22 11:13:08 +01:00
|
|
|
// at least one element per thread
|
2009-09-16 11:47:25 +02:00
|
|
|
if (__num_threads > __n)
|
|
|
|
__num_threads = static_cast<_ThreadIndex>(__n);
|
2007-09-12 00:32:51 +02:00
|
|
|
|
2007-11-22 11:13:08 +01:00
|
|
|
// shared variables
|
2009-09-16 11:47:25 +02:00
|
|
|
_PMWMSSortingData<_RAIter> __sd;
|
|
|
|
_DifferenceType* _M_starts;
|
2007-09-12 00:32:51 +02:00
|
|
|
|
2009-09-16 11:47:25 +02:00
|
|
|
# pragma omp parallel num_threads(__num_threads)
|
2007-11-22 11:13:08 +01:00
|
|
|
{
|
2009-09-16 11:47:25 +02:00
|
|
|
__num_threads = omp_get_num_threads(); //no more threads than requested
|
2007-11-22 11:13:08 +01:00
|
|
|
|
|
|
|
# pragma omp single
|
|
|
|
{
|
2009-09-16 11:47:25 +02:00
|
|
|
__sd.__num_threads = __num_threads;
|
|
|
|
__sd._M_source = __begin;
|
2007-09-12 00:32:51 +02:00
|
|
|
|
2009-09-16 11:47:25 +02:00
|
|
|
__sd._M_temporary = new _ValueType*[__num_threads];
|
2008-04-07 10:27:34 +02:00
|
|
|
|
2009-09-16 11:47:25 +02:00
|
|
|
if (!__exact)
|
2007-11-22 11:13:08 +01:00
|
|
|
{
|
2009-09-16 11:47:25 +02:00
|
|
|
_DifferenceType size =
|
|
|
|
(_Settings::get().sort_mwms_oversampling * __num_threads - 1)
|
|
|
|
* __num_threads;
|
|
|
|
__sd._M_samples = static_cast<_ValueType*>(
|
|
|
|
::operator new(size * sizeof(_ValueType)));
|
2007-11-22 11:13:08 +01:00
|
|
|
}
|
|
|
|
else
|
2009-09-16 11:47:25 +02:00
|
|
|
__sd._M_samples = NULL;
|
|
|
|
|
|
|
|
__sd._M_offsets = new _DifferenceType[__num_threads - 1];
|
|
|
|
__sd._M_pieces = new std::vector<_Piece<_DifferenceType> >[__num_threads];
|
|
|
|
for (int __s = 0; __s < __num_threads; ++__s)
|
|
|
|
__sd._M_pieces[__s].resize(__num_threads);
|
|
|
|
_M_starts = __sd._M_starts = new _DifferenceType[__num_threads + 1];
|
|
|
|
|
|
|
|
_DifferenceType __chunk_length = __n / __num_threads;
|
|
|
|
_DifferenceType __split = __n % __num_threads;
|
|
|
|
_DifferenceType __pos = 0;
|
|
|
|
for (int __i = 0; __i < __num_threads; ++__i)
|
2007-11-22 11:13:08 +01:00
|
|
|
{
|
2009-09-16 11:47:25 +02:00
|
|
|
_M_starts[__i] = __pos;
|
|
|
|
__pos += (__i < __split) ? (__chunk_length + 1) : __chunk_length;
|
2007-11-22 11:13:08 +01:00
|
|
|
}
|
2009-09-16 11:47:25 +02:00
|
|
|
_M_starts[__num_threads] = __pos;
|
2008-04-07 10:27:34 +02:00
|
|
|
} //single
|
2007-11-22 11:13:08 +01:00
|
|
|
|
|
|
|
// Now sort in parallel.
|
2009-09-16 11:47:25 +02:00
|
|
|
parallel_sort_mwms_pu<__stable, __exact>(&__sd, __comp);
|
2007-11-22 11:13:08 +01:00
|
|
|
} //parallel
|
2007-09-12 00:32:51 +02:00
|
|
|
|
2009-09-16 11:47:25 +02:00
|
|
|
delete[] _M_starts;
|
|
|
|
delete[] __sd._M_temporary;
|
2007-09-12 00:32:51 +02:00
|
|
|
|
2009-09-16 11:47:25 +02:00
|
|
|
if (!__exact)
|
|
|
|
::operator delete(__sd._M_samples);
|
2007-09-12 00:32:51 +02:00
|
|
|
|
2009-09-16 11:47:25 +02:00
|
|
|
delete[] __sd._M_offsets;
|
|
|
|
delete[] __sd._M_pieces;
|
2007-09-12 00:32:51 +02:00
|
|
|
}
|
2007-11-22 11:13:08 +01:00
|
|
|
} //namespace __gnu_parallel
|
2007-09-12 00:32:51 +02:00
|
|
|
|
2008-07-15 12:06:58 +02:00
|
|
|
#endif /* _GLIBCXX_PARALLEL_MULTIWAY_MERGESORT_H */
|