Chris@102
|
1 /*
|
Chris@102
|
2 [auto_generated]
|
Chris@102
|
3 boost/numeric/odeint/external/openmp/openmp_state.hpp
|
Chris@102
|
4
|
Chris@102
|
5 [begin_description]
|
Chris@102
|
6 Wrappers for OpenMP.
|
Chris@102
|
7 [end_description]
|
Chris@102
|
8
|
Chris@102
|
9 Copyright 2013 Karsten Ahnert
|
Chris@102
|
10 Copyright 2013 Mario Mulansky
|
Chris@102
|
11 Copyright 2013 Pascal Germroth
|
Chris@102
|
12
|
Chris@102
|
13 Distributed under the Boost Software License, Version 1.0.
|
Chris@102
|
14 (See accompanying file LICENSE_1_0.txt or
|
Chris@102
|
15 copy at http://www.boost.org/LICENSE_1_0.txt)
|
Chris@102
|
16 */
|
Chris@102
|
17
|
Chris@102
|
18
|
Chris@102
|
19 #ifndef BOOST_NUMERIC_ODEINT_EXTERNAL_OPENMP_OPENMP_STATE_HPP_INCLUDED
|
Chris@102
|
20 #define BOOST_NUMERIC_ODEINT_EXTERNAL_OPENMP_OPENMP_STATE_HPP_INCLUDED
|
Chris@102
|
21
|
Chris@102
|
22 #include <omp.h>
|
Chris@102
|
23 #include <vector>
|
Chris@102
|
24 #include <algorithm>
|
Chris@102
|
25 #include <boost/range/adaptor/sliced.hpp>
|
Chris@102
|
26 #include <boost/numeric/odeint/util/copy.hpp>
|
Chris@102
|
27 #include <boost/numeric/odeint/util/split.hpp>
|
Chris@102
|
28 #include <boost/numeric/odeint/util/resize.hpp>
|
Chris@102
|
29 #include <boost/numeric/odeint/external/openmp/openmp_nested_algebra.hpp>
|
Chris@102
|
30
|
Chris@102
|
31 namespace boost {
|
Chris@102
|
32 namespace numeric {
|
Chris@102
|
33 namespace odeint {
|
Chris@102
|
34
|
Chris@102
|
/** \brief State container partitioned into separate chunks, for threading.
 *
 * This is nothing more than a `std::vector< std::vector< T > >` with
 * forwarding constructors: the outer vector holds the chunks, each inner
 * vector holds the elements of one chunk.  Data is distributed into and
 * collected from the chunks by the `split_impl` / `unsplit_impl`
 * specializations in this header.
 */
template< class T >
struct openmp_state : public std::vector< std::vector< T > >
{
private:
    // shorthand for the wrapped container type, used by the constructors only
    typedef std::vector< std::vector< T > > base_type;

public:
    /** \brief Create a state without any chunks. */
    openmp_state()
        : base_type()
    {}

    /** \brief Create a state of `n` chunks, each one a copy of `val`. */
    openmp_state(size_t n, const std::vector<T>& val = std::vector<T>())
        : base_type(n, val)
    {}

    /** \brief Create a state from the chunks in the range [first, last). */
    template<class InputIterator>
    openmp_state(InputIterator first, InputIterator last)
        : base_type(first, last)
    {}

    /** \brief Create a state as a copy of an existing vector of chunks. */
    openmp_state(const std::vector< std::vector< T > > &orig)
        : base_type(orig)
    {}
};
|
Chris@102
|
54
|
Chris@102
|
55
|
Chris@102
|
56
|
Chris@102
|
57
|
Chris@102
|
58 template< class T >
|
Chris@102
|
59 struct is_resizeable< openmp_state< T > > : boost::true_type { };
|
Chris@102
|
60
|
Chris@102
|
61
|
Chris@102
|
62 template< class T >
|
Chris@102
|
63 struct same_size_impl< openmp_state< T > , openmp_state< T > >
|
Chris@102
|
64 {
|
Chris@102
|
65 static bool same_size( const openmp_state< T > &x , const openmp_state< T > &y )
|
Chris@102
|
66 {
|
Chris@102
|
67 if( x.size() != y.size() ) return false;
|
Chris@102
|
68 for( size_t i = 0 ; i != x.size() ; i++ )
|
Chris@102
|
69 if( x[i].size() != y[i].size() ) return false;
|
Chris@102
|
70 return true;
|
Chris@102
|
71 }
|
Chris@102
|
72 };
|
Chris@102
|
73
|
Chris@102
|
74
|
Chris@102
|
75 template< class T >
|
Chris@102
|
76 struct resize_impl< openmp_state< T > , openmp_state< T > >
|
Chris@102
|
77 {
|
Chris@102
|
78 static void resize( openmp_state< T > &x , const openmp_state< T > &y )
|
Chris@102
|
79 {
|
Chris@102
|
80 x.resize( y.size() );
|
Chris@102
|
81 # pragma omp parallel for schedule(dynamic)
|
Chris@102
|
82 for(size_t i = 0 ; i < x.size() ; i++)
|
Chris@102
|
83 x[i].resize( y[i].size() );
|
Chris@102
|
84 }
|
Chris@102
|
85 };
|
Chris@102
|
86
|
Chris@102
|
87
|
Chris@102
|
88 /** \brief Copy data between openmp_states of same size. */
|
Chris@102
|
89 template< class T >
|
Chris@102
|
90 struct copy_impl< openmp_state< T >, openmp_state< T > >
|
Chris@102
|
91 {
|
Chris@102
|
92 static void copy( const openmp_state< T > &from, openmp_state< T > &to )
|
Chris@102
|
93 {
|
Chris@102
|
94 # pragma omp parallel for schedule(dynamic)
|
Chris@102
|
95 for(size_t i = 0 ; i < from.size() ; i++)
|
Chris@102
|
96 std::copy( from[i].begin() , from[i].end() , to.begin() );
|
Chris@102
|
97 }
|
Chris@102
|
98 };
|
Chris@102
|
99
|
Chris@102
|
100
|
Chris@102
|
101
|
Chris@102
|
102 /** \brief Copy data from some container to an openmp_state and resize it.
|
Chris@102
|
103 * Target container size will determine number of blocks to split into.
|
Chris@102
|
104 * If it is empty, it will be resized to the maximum number of OpenMP threads.
|
Chris@102
|
105 * SourceContainer must support `s::value_type`, `s::const_iterator`, `s.begin()`, `s.end()` and `s.size()`,
|
Chris@102
|
106 * with Random Access Iterators; i.e. it must be a Random Access Container. */
|
Chris@102
|
107 template< class SourceContainer >
|
Chris@102
|
108 struct split_impl< SourceContainer, openmp_state< typename SourceContainer::value_type > >
|
Chris@102
|
109 {
|
Chris@102
|
110 static void split( const SourceContainer &from, openmp_state< typename SourceContainer::value_type > &to )
|
Chris@102
|
111 {
|
Chris@102
|
112 if(to.size() == 0) to.resize( omp_get_max_threads() );
|
Chris@102
|
113 const size_t part = from.size() / to.size();
|
Chris@102
|
114 # pragma omp parallel for schedule(dynamic)
|
Chris@102
|
115 for(size_t i = 0 ; i < to.size() ; i++) {
|
Chris@102
|
116 typedef typename SourceContainer::const_iterator it_t;
|
Chris@102
|
117 const it_t begin = from.begin() + i * part;
|
Chris@102
|
118 it_t end = begin + part;
|
Chris@102
|
119 // for cases where from.size() % to.size() > 0
|
Chris@102
|
120 if(i + 1 == to.size() || end > from.end()) end = from.end();
|
Chris@102
|
121 to[i].resize(end - begin);
|
Chris@102
|
122 std::copy(begin, end, to[i].begin());
|
Chris@102
|
123 }
|
Chris@102
|
124 }
|
Chris@102
|
125 };
|
Chris@102
|
126
|
Chris@102
|
127 /** \brief Copy data from an openmp_state to some container and resize it.
|
Chris@102
|
128 * TargetContainer must support `s::value_type`, `s::iterator`, `s.begin()` and `s.resize(n)`,
|
Chris@102
|
129 * i.e. it must be a `std::vector`. */
|
Chris@102
|
130 template< class TargetContainer >
|
Chris@102
|
131 struct unsplit_impl< openmp_state< typename TargetContainer::value_type >, TargetContainer >
|
Chris@102
|
132 {
|
Chris@102
|
133 static void unsplit( const openmp_state< typename TargetContainer::value_type > &from , TargetContainer &to )
|
Chris@102
|
134 {
|
Chris@102
|
135 // resize target
|
Chris@102
|
136 size_t total_size = 0;
|
Chris@102
|
137 for(size_t i = 0 ; i < from.size() ; i++)
|
Chris@102
|
138 total_size += from[i].size();
|
Chris@102
|
139 to.resize( total_size );
|
Chris@102
|
140 // copy parts
|
Chris@102
|
141 typename TargetContainer::iterator out = to.begin();
|
Chris@102
|
142 for(size_t i = 0 ; i < from.size() ; i++)
|
Chris@102
|
143 out = std::copy(from[i].begin(), from[i].end(), out);
|
Chris@102
|
144 }
|
Chris@102
|
145 };
|
Chris@102
|
146
|
Chris@102
|
147
|
Chris@102
|
148
|
Chris@102
|
149
|
Chris@102
|
150 /** \brief OpenMP-parallelized algebra.
|
Chris@102
|
151 * For use with openmp_state.
|
Chris@102
|
152 */
|
Chris@102
|
153 typedef openmp_nested_algebra< range_algebra > openmp_algebra;
|
Chris@102
|
154
|
Chris@102
|
155
|
Chris@102
|
156
|
Chris@102
|
157 /** \brief Use `openmp_algebra` for `openmp_state`. */
|
Chris@102
|
158 template< class T >
|
Chris@102
|
159 struct algebra_dispatcher< openmp_state< T > >
|
Chris@102
|
160 {
|
Chris@102
|
161 typedef openmp_algebra algebra_type;
|
Chris@102
|
162 };
|
Chris@102
|
163
|
Chris@102
|
164
|
Chris@102
|
165 }
|
Chris@102
|
166 }
|
Chris@102
|
167 }
|
Chris@102
|
168
|
Chris@102
|
169
|
Chris@102
|
170 #endif
|
Chris@102
|
171
|