172 lines
5.2 KiB
Plaintext
172 lines
5.2 KiB
Plaintext
|
/*
 [auto_generated]
 boost/numeric/odeint/external/openmp/openmp_state.hpp

 [begin_description]
 Wrappers for OpenMP.
 [end_description]

 Copyright 2013 Karsten Ahnert
 Copyright 2013 Mario Mulansky
 Copyright 2013 Pascal Germroth

 Distributed under the Boost Software License, Version 1.0.
 (See accompanying file LICENSE_1_0.txt or
 copy at http://www.boost.org/LICENSE_1_0.txt)
 */
|
||
|
|
||
|
|
||
|
#ifndef BOOST_NUMERIC_ODEINT_EXTERNAL_OPENMP_OPENMP_STATE_HPP_INCLUDED
|
||
|
#define BOOST_NUMERIC_ODEINT_EXTERNAL_OPENMP_OPENMP_STATE_HPP_INCLUDED
|
||
|
|
||
|
#include <omp.h>
|
||
|
#include <vector>
|
||
|
#include <algorithm>
|
||
|
#include <boost/range/adaptor/sliced.hpp>
|
||
|
#include <boost/numeric/odeint/util/copy.hpp>
|
||
|
#include <boost/numeric/odeint/util/split.hpp>
|
||
|
#include <boost/numeric/odeint/util/resize.hpp>
|
||
|
#include <boost/numeric/odeint/external/openmp/openmp_nested_algebra.hpp>
|
||
|
|
||
|
namespace boost {
|
||
|
namespace numeric {
|
||
|
namespace odeint {
|
||
|
|
||
|
/** \brief State type that keeps its data in several separate chunks, for threading.
 *
 * Behaves like a `std::vector< std::vector< T > >`: every outer element is
 * one chunk. The type adds no members of its own; its constructors only
 * forward to the underlying vector. The `split_impl` / `unsplit_impl`
 * specializations in this header move data between a flat container and
 * this chunked layout.
 */
template< class T >
struct openmp_state : public std::vector< std::vector< T > >
{
private:
    typedef std::vector< T > chunk_type;
    typedef std::vector< chunk_type > base_type;

public:
    /** Creates a state without any chunks. */
    openmp_state() : base_type() {}

    /** Creates `n` chunks, each one a copy of `val` (an empty chunk by default). */
    openmp_state(size_t n, const chunk_type& val = chunk_type())
        : base_type(n, val) {}

    /** Creates the chunks from the iterator range [first, last). */
    template<class InputIterator>
    openmp_state(InputIterator first, InputIterator last)
        : base_type(first, last) {}

    /** Copies the chunks of an existing vector of vectors. */
    openmp_state(const base_type &orig)
        : base_type(orig) {}
};
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
template< class T >
|
||
|
struct is_resizeable< openmp_state< T > > : boost::true_type { };
|
||
|
|
||
|
|
||
|
template< class T >
|
||
|
struct same_size_impl< openmp_state< T > , openmp_state< T > >
|
||
|
{
|
||
|
static bool same_size( const openmp_state< T > &x , const openmp_state< T > &y )
|
||
|
{
|
||
|
if( x.size() != y.size() ) return false;
|
||
|
for( size_t i = 0 ; i != x.size() ; i++ )
|
||
|
if( x[i].size() != y[i].size() ) return false;
|
||
|
return true;
|
||
|
}
|
||
|
};
|
||
|
|
||
|
|
||
|
template< class T >
|
||
|
struct resize_impl< openmp_state< T > , openmp_state< T > >
|
||
|
{
|
||
|
static void resize( openmp_state< T > &x , const openmp_state< T > &y )
|
||
|
{
|
||
|
x.resize( y.size() );
|
||
|
# pragma omp parallel for schedule(dynamic)
|
||
|
for(size_t i = 0 ; i < x.size() ; i++)
|
||
|
x[i].resize( y[i].size() );
|
||
|
}
|
||
|
};
|
||
|
|
||
|
|
||
|
/** \brief Copy data between openmp_states of same size. */
|
||
|
template< class T >
|
||
|
struct copy_impl< openmp_state< T >, openmp_state< T > >
|
||
|
{
|
||
|
static void copy( const openmp_state< T > &from, openmp_state< T > &to )
|
||
|
{
|
||
|
# pragma omp parallel for schedule(dynamic)
|
||
|
for(size_t i = 0 ; i < from.size() ; i++)
|
||
|
std::copy( from[i].begin() , from[i].end() , to.begin() );
|
||
|
}
|
||
|
};
|
||
|
|
||
|
|
||
|
|
||
|
/** \brief Copy data from some container to an openmp_state and resize it.
|
||
|
* Target container size will determine number of blocks to split into.
|
||
|
* If it is empty, it will be resized to the maximum number of OpenMP threads.
|
||
|
* SourceContainer must support `s::value_type`, `s::const_iterator`, `s.begin()`, `s.end()` and `s.size()`,
|
||
|
* with Random Access Iterators; i.e. it must be a Random Access Container. */
|
||
|
template< class SourceContainer >
|
||
|
struct split_impl< SourceContainer, openmp_state< typename SourceContainer::value_type > >
|
||
|
{
|
||
|
static void split( const SourceContainer &from, openmp_state< typename SourceContainer::value_type > &to )
|
||
|
{
|
||
|
if(to.size() == 0) to.resize( omp_get_max_threads() );
|
||
|
const size_t part = from.size() / to.size();
|
||
|
# pragma omp parallel for schedule(dynamic)
|
||
|
for(size_t i = 0 ; i < to.size() ; i++) {
|
||
|
typedef typename SourceContainer::const_iterator it_t;
|
||
|
const it_t begin = from.begin() + i * part;
|
||
|
it_t end = begin + part;
|
||
|
// for cases where from.size() % to.size() > 0
|
||
|
if(i + 1 == to.size() || end > from.end()) end = from.end();
|
||
|
to[i].resize(end - begin);
|
||
|
std::copy(begin, end, to[i].begin());
|
||
|
}
|
||
|
}
|
||
|
};
|
||
|
|
||
|
/** \brief Copy data from an openmp_state to some container and resize it.
|
||
|
* TargetContainer must support `s::value_type`, `s::iterator`, `s.begin()` and `s.resize(n)`,
|
||
|
* i.e. it must be a `std::vector`. */
|
||
|
template< class TargetContainer >
|
||
|
struct unsplit_impl< openmp_state< typename TargetContainer::value_type >, TargetContainer >
|
||
|
{
|
||
|
static void unsplit( const openmp_state< typename TargetContainer::value_type > &from , TargetContainer &to )
|
||
|
{
|
||
|
// resize target
|
||
|
size_t total_size = 0;
|
||
|
for(size_t i = 0 ; i < from.size() ; i++)
|
||
|
total_size += from[i].size();
|
||
|
to.resize( total_size );
|
||
|
// copy parts
|
||
|
typename TargetContainer::iterator out = to.begin();
|
||
|
for(size_t i = 0 ; i < from.size() ; i++)
|
||
|
out = std::copy(from[i].begin(), from[i].end(), out);
|
||
|
}
|
||
|
};
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
/** \brief OpenMP-parallelized algebra.
|
||
|
* For use with openmp_state.
|
||
|
*/
|
||
|
// Alias for openmp_nested_algebra instantiated with range_algebra.
// NOTE(review): presumably range_algebra is the algebra applied within each
// chunk — confirm against openmp_nested_algebra.hpp.
typedef openmp_nested_algebra< range_algebra > openmp_algebra;
|
||
|
|
||
|
|
||
|
|
||
|
/** \brief Use `openmp_algebra` for `openmp_state`. */
|
||
|
template< class T >
|
||
|
struct algebra_dispatcher< openmp_state< T > >
|
||
|
{
|
||
|
typedef openmp_algebra algebra_type;
|
||
|
};
|
||
|
|
||
|
|
||
|
}
|
||
|
}
|
||
|
}
|
||
|
|
||
|
|
||
|
#endif
|
||
|
|