Chris@16
|
1 /*
|
Chris@16
|
2 [auto_generated]
|
Chris@16
|
3 boost/numeric/odeint/external/mkl/mkl_operations.hpp
|
Chris@16
|
4
|
Chris@16
|
5 [begin_description]
|
Chris@16
|
6 Wrapper classes for intel math kernel library types.
|
Chris@16
|
7 Get a free, non-commercial download of MKL at
|
Chris@16
|
8 http://software.intel.com/en-us/articles/non-commercial-software-download/
|
Chris@16
|
9 [end_description]
|
Chris@16
|
10
|
Chris@101
|
11 Copyright 2010-2011 Mario Mulansky
|
Chris@101
|
12 Copyright 2011-2013 Karsten Ahnert
|
Chris@16
|
13
|
Chris@16
|
14 Distributed under the Boost Software License, Version 1.0.
|
Chris@16
|
15 (See accompanying file LICENSE_1_0.txt or
|
Chris@16
|
16 copy at http://www.boost.org/LICENSE_1_0.txt)
|
Chris@16
|
17 */
|
Chris@16
|
18
|
Chris@16
|
19
|
Chris@16
|
20 #ifndef BOOST_NUMERIC_ODEINT_EXTERNAL_MKL_MKL_OPERATIONS_HPP_INCLUDED
|
Chris@16
|
21 #define BOOST_NUMERIC_ODEINT_EXTERNAL_MKL_MKL_OPERATIONS_HPP_INCLUDED
|
Chris@16
|
22
|
Chris@16
|
23 #include <iostream>
|
Chris@16
|
24
|
Chris@16
|
25 #include <mkl_cblas.h>
|
Chris@16
|
26 #include <boost/numeric/odeint/algebra/default_operations.hpp>
|
Chris@16
|
27
|
Chris@16
|
28 /* Example of how to write bindings to the Intel MKL library
|
Chris@16
|
29 * see test/mkl for how to use mkl with odeint
|
Chris@16
|
30 * this is a quick and dirty implementation showing the general possibility.
|
Chris@16
|
31 * It works only with containers based on double and sequential memory allocation.
|
Chris@16
|
32 */
|
Chris@16
|
33
|
Chris@16
|
34 namespace boost {
|
Chris@16
|
35 namespace numeric {
|
Chris@16
|
36 namespace odeint {
|
Chris@16
|
37
|
Chris@16
|
38 /* only defined for doubles */
|
Chris@16
|
/*
 * Operations policy whose scale_sumN functors evaluate
 *
 *     t1 = alpha1 * t2 + alpha2 * t3 + ... + alphaN * t(N+1)
 *
 * with the CBLAS level-1 routines cblas_dcopy / cblas_dscal / cblas_daxpy.
 *
 * Requirements on the container types T1, T2, ...:
 *   - size() and operator[] are available,
 *   - &(t[0]) is the start of a unit-stride sequence of doubles.
 *
 * The template parameters F1, F2, ... are accepted only so that the functors
 * can be named like scale_sumN< F1 , ... >; every factor is stored as double.
 *
 * Aliasing: an input that starts at the same address as t1 is treated as
 * "the current content of t1".  The factors of all such inputs are added up
 * and applied with a single cblas_dscal, so the result equals the element-wise
 * formula above no matter which operand shares storage with the output.
 * Partially overlapping buffers are not detected.
 * NOTE(review): odeint steppers presumably pass the output again as a later
 * operand in some updates (e.g. extrapolation tables) -- confirm against the
 * callers.
 */
struct mkl_operations
{
    /* t1 = alpha1 * t2 + alpha2 * t3 */
    template< class F1 = double , class F2 = F1 >
    struct scale_sum2
    {
        typedef double Fac1;
        typedef double Fac2;
        const Fac1 m_alpha1;
        const Fac2 m_alpha2;

        scale_sum2( const Fac1 alpha1 , const Fac2 alpha2 ) : m_alpha1( alpha1 ) , m_alpha2( alpha2 ) { }

        template< class T1 , class T2 , class T3 >
        void operator()( T1 &t1 , const T2 &t2 , const T3 &t3 ) const
        {
            const int n = static_cast< int >( t1.size() );
            // nothing to do, and &(t1[0]) must not be formed for an empty container
            if( n <= 0 ) return;

            // doneK == true: the contribution of tK is already contained in t1
            bool done2 = ( &(t2[0]) == &(t1[0]) );
            const bool done3 = ( &(t3[0]) == &(t1[0]) );

            if( done2 || done3 )
            {
                // t1 itself is an operand: scale it by the sum of its factors
                double self = 0.0;
                if( done2 ) self += m_alpha1;
                if( done3 ) self += m_alpha2;
                cblas_dscal( n , self , &(t1[0]) , 1 );
            }
            else
            {
                // t1 is a pure output: start from alpha1 * t2
                cblas_dcopy( n , &(t2[0]) , 1 , &(t1[0]) , 1 );
                cblas_dscal( n , m_alpha1 , &(t1[0]) , 1 );
                done2 = true;
            }

            // accumulate the operands that do not share storage with t1
            if( !done2 ) cblas_daxpy( n , m_alpha1 , &(t2[0]) , 1 , &(t1[0]) , 1 );
            if( !done3 ) cblas_daxpy( n , m_alpha2 , &(t3[0]) , 1 , &(t1[0]) , 1 );
        }
    };

    /* t1 = alpha1 * t2 + alpha2 * t3 + alpha3 * t4 */
    template< class F1 = double , class F2 = F1 , class F3 = F2 >
    struct scale_sum3
    {
        typedef double Fac1;
        typedef double Fac2;
        typedef double Fac3;
        const Fac1 m_alpha1;
        const Fac2 m_alpha2;
        const Fac3 m_alpha3;

        scale_sum3( const Fac1 alpha1 , const Fac2 alpha2 , const Fac3 alpha3 )
            : m_alpha1( alpha1 ) , m_alpha2( alpha2 ) , m_alpha3( alpha3 ) { }

        template< class T1 , class T2 , class T3 , class T4 >
        void operator()( T1 &t1 , const T2 &t2 , const T3 &t3 , const T4 &t4 ) const
        {
            const int n = static_cast< int >( t1.size() );
            // nothing to do, and &(t1[0]) must not be formed for an empty container
            if( n <= 0 ) return;

            // doneK == true: the contribution of tK is already contained in t1
            bool done2 = ( &(t2[0]) == &(t1[0]) );
            const bool done3 = ( &(t3[0]) == &(t1[0]) );
            const bool done4 = ( &(t4[0]) == &(t1[0]) );

            if( done2 || done3 || done4 )
            {
                // t1 itself is an operand: scale it by the sum of its factors
                double self = 0.0;
                if( done2 ) self += m_alpha1;
                if( done3 ) self += m_alpha2;
                if( done4 ) self += m_alpha3;
                cblas_dscal( n , self , &(t1[0]) , 1 );
            }
            else
            {
                // t1 is a pure output: start from alpha1 * t2
                cblas_dcopy( n , &(t2[0]) , 1 , &(t1[0]) , 1 );
                cblas_dscal( n , m_alpha1 , &(t1[0]) , 1 );
                done2 = true;
            }

            // accumulate the operands that do not share storage with t1
            if( !done2 ) cblas_daxpy( n , m_alpha1 , &(t2[0]) , 1 , &(t1[0]) , 1 );
            if( !done3 ) cblas_daxpy( n , m_alpha2 , &(t3[0]) , 1 , &(t1[0]) , 1 );
            if( !done4 ) cblas_daxpy( n , m_alpha3 , &(t4[0]) , 1 , &(t1[0]) , 1 );
        }
    };

    /* t1 = alpha1 * t2 + alpha2 * t3 + alpha3 * t4 + alpha4 * t5 */
    template< class F1 = double , class F2 = F1 , class F3 = F2 , class F4 = F3 >
    struct scale_sum4
    {
        typedef double Fac1;
        typedef double Fac2;
        typedef double Fac3;
        typedef double Fac4;
        const Fac1 m_alpha1;
        const Fac2 m_alpha2;
        const Fac3 m_alpha3;
        const Fac4 m_alpha4;

        scale_sum4( const Fac1 alpha1 , const Fac2 alpha2 , const Fac3 alpha3 , const Fac4 alpha4 )
            : m_alpha1( alpha1 ) , m_alpha2( alpha2 ) , m_alpha3( alpha3 ) , m_alpha4( alpha4 ) { }

        template< class T1 , class T2 , class T3 , class T4 , class T5 >
        void operator()( T1 &t1 , const T2 &t2 , const T3 &t3 , const T4 &t4 , const T5 &t5 ) const
        {
            const int n = static_cast< int >( t1.size() );
            // nothing to do, and &(t1[0]) must not be formed for an empty container
            if( n <= 0 ) return;

            // doneK == true: the contribution of tK is already contained in t1
            bool done2 = ( &(t2[0]) == &(t1[0]) );
            const bool done3 = ( &(t3[0]) == &(t1[0]) );
            const bool done4 = ( &(t4[0]) == &(t1[0]) );
            const bool done5 = ( &(t5[0]) == &(t1[0]) );

            if( done2 || done3 || done4 || done5 )
            {
                // t1 itself is an operand: scale it by the sum of its factors
                double self = 0.0;
                if( done2 ) self += m_alpha1;
                if( done3 ) self += m_alpha2;
                if( done4 ) self += m_alpha3;
                if( done5 ) self += m_alpha4;
                cblas_dscal( n , self , &(t1[0]) , 1 );
            }
            else
            {
                // t1 is a pure output: start from alpha1 * t2
                cblas_dcopy( n , &(t2[0]) , 1 , &(t1[0]) , 1 );
                cblas_dscal( n , m_alpha1 , &(t1[0]) , 1 );
                done2 = true;
            }

            // accumulate the operands that do not share storage with t1
            if( !done2 ) cblas_daxpy( n , m_alpha1 , &(t2[0]) , 1 , &(t1[0]) , 1 );
            if( !done3 ) cblas_daxpy( n , m_alpha2 , &(t3[0]) , 1 , &(t1[0]) , 1 );
            if( !done4 ) cblas_daxpy( n , m_alpha3 , &(t4[0]) , 1 , &(t1[0]) , 1 );
            if( !done5 ) cblas_daxpy( n , m_alpha4 , &(t5[0]) , 1 , &(t1[0]) , 1 );
        }
    };

    /* t1 = alpha1 * t2 + alpha2 * t3 + alpha3 * t4 + alpha4 * t5 + alpha5 * t6 */
    template< class F1 = double , class F2 = F1 , class F3 = F2 , class F4 = F3 , class F5 = F4 >
    struct scale_sum5
    {
        typedef double Fac1;
        typedef double Fac2;
        typedef double Fac3;
        typedef double Fac4;
        typedef double Fac5;
        const Fac1 m_alpha1;
        const Fac2 m_alpha2;
        const Fac3 m_alpha3;
        const Fac4 m_alpha4;
        const Fac5 m_alpha5;

        scale_sum5( const Fac1 alpha1 , const Fac2 alpha2 , const Fac3 alpha3 , const Fac4 alpha4 , const Fac5 alpha5 )
            : m_alpha1( alpha1 ) , m_alpha2( alpha2 ) , m_alpha3( alpha3 ) , m_alpha4( alpha4 ) , m_alpha5( alpha5 ) { }

        template< class T1 , class T2 , class T3 , class T4 , class T5 , class T6 >
        void operator()( T1 &t1 , const T2 &t2 , const T3 &t3 , const T4 &t4 , const T5 &t5 , const T6 &t6 ) const
        {
            const int n = static_cast< int >( t1.size() );
            // nothing to do, and &(t1[0]) must not be formed for an empty container
            if( n <= 0 ) return;

            // doneK == true: the contribution of tK is already contained in t1
            bool done2 = ( &(t2[0]) == &(t1[0]) );
            const bool done3 = ( &(t3[0]) == &(t1[0]) );
            const bool done4 = ( &(t4[0]) == &(t1[0]) );
            const bool done5 = ( &(t5[0]) == &(t1[0]) );
            const bool done6 = ( &(t6[0]) == &(t1[0]) );

            if( done2 || done3 || done4 || done5 || done6 )
            {
                // t1 itself is an operand: scale it by the sum of its factors
                double self = 0.0;
                if( done2 ) self += m_alpha1;
                if( done3 ) self += m_alpha2;
                if( done4 ) self += m_alpha3;
                if( done5 ) self += m_alpha4;
                if( done6 ) self += m_alpha5;
                cblas_dscal( n , self , &(t1[0]) , 1 );
            }
            else
            {
                // t1 is a pure output: start from alpha1 * t2
                cblas_dcopy( n , &(t2[0]) , 1 , &(t1[0]) , 1 );
                cblas_dscal( n , m_alpha1 , &(t1[0]) , 1 );
                done2 = true;
            }

            // accumulate the operands that do not share storage with t1
            if( !done2 ) cblas_daxpy( n , m_alpha1 , &(t2[0]) , 1 , &(t1[0]) , 1 );
            if( !done3 ) cblas_daxpy( n , m_alpha2 , &(t3[0]) , 1 , &(t1[0]) , 1 );
            if( !done4 ) cblas_daxpy( n , m_alpha3 , &(t4[0]) , 1 , &(t1[0]) , 1 );
            if( !done5 ) cblas_daxpy( n , m_alpha4 , &(t5[0]) , 1 , &(t1[0]) , 1 );
            if( !done6 ) cblas_daxpy( n , m_alpha5 , &(t6[0]) , 1 , &(t1[0]) , 1 );
        }
    };

};
|
Chris@16
|
176
|
Chris@16
|
177 } // odeint
|
Chris@16
|
178 } // numeric
|
Chris@16
|
179 } // boost
|
Chris@16
|
180
|
Chris@16
|
181 #endif // BOOST_NUMERIC_ODEINT_EXTERNAL_MKL_MKL_OPERATIONS_HPP_INCLUDED
|