Chris@16: // Chris@16: // Copyright (c) 2000-2002 Chris@16: // Joerg Walter, Mathias Koch Chris@16: // Chris@16: // Distributed under the Boost Software License, Version 1.0. (See Chris@16: // accompanying file LICENSE_1_0.txt or copy at Chris@16: // http://www.boost.org/LICENSE_1_0.txt) Chris@16: // Chris@16: // The authors gratefully acknowledge the support of Chris@16: // GeNeSys mbH & Co. KG in producing this work. Chris@16: // Chris@16: Chris@16: #ifndef _BOOST_UBLAS_OPERATION_BLOCKED_ Chris@16: #define _BOOST_UBLAS_OPERATION_BLOCKED_ Chris@16: Chris@16: #include Chris@16: #include // indexing_vector_assign Chris@16: #include // indexing_matrix_assign Chris@16: Chris@16: Chris@16: namespace boost { namespace numeric { namespace ublas { Chris@16: Chris@16: template Chris@16: BOOST_UBLAS_INLINE Chris@16: V Chris@16: block_prod (const matrix_expression &e1, Chris@16: const vector_expression &e2) { Chris@16: typedef V vector_type; Chris@16: typedef const E1 expression1_type; Chris@16: typedef const E2 expression2_type; Chris@16: typedef typename V::size_type size_type; Chris@16: typedef typename V::value_type value_type; Chris@16: const size_type block_size = BS; Chris@16: Chris@16: V v (e1 ().size1 ()); Chris@16: #if BOOST_UBLAS_TYPE_CHECK Chris@16: vector cv (v.size ()); Chris@16: typedef typename type_traits::real_type real_type; Chris@16: real_type verrorbound (norm_1 (v) + norm_1 (e1) * norm_1 (e2)); Chris@16: indexing_vector_assign (cv, prod (e1, e2)); Chris@16: #endif Chris@16: size_type i_size = e1 ().size1 (); Chris@16: size_type j_size = BOOST_UBLAS_SAME (e1 ().size2 (), e2 ().size ()); Chris@16: for (size_type i_begin = 0; i_begin < i_size; i_begin += block_size) { Chris@16: size_type i_end = i_begin + (std::min) (i_size - i_begin, block_size); Chris@16: // FIX: never ignore Martin Weiser's advice ;-( Chris@16: #ifdef BOOST_UBLAS_NO_CACHE Chris@16: vector_range v_range (v, range (i_begin, i_end)); Chris@16: #else Chris@16: // vector > v_range (i_end - i_begin); Chris@16: vector v_range (i_end - i_begin); Chris@16: #endif Chris@16: v_range.assign (zero_vector (i_end - i_begin)); Chris@16: for (size_type j_begin = 0; j_begin < j_size; j_begin += block_size) { Chris@16: size_type j_end = j_begin + (std::min) (j_size - j_begin, block_size); Chris@16: #ifdef BOOST_UBLAS_NO_CACHE Chris@16: const matrix_range e1_range (e1 (), range (i_begin, i_end), range (j_begin, j_end)); Chris@16: const vector_range e2_range (e2 (), range (j_begin, j_end)); Chris@16: v_range.plus_assign (prod (e1_range, e2_range)); Chris@16: #else Chris@16: // const matrix > e1_range (project (e1 (), range (i_begin, i_end), range (j_begin, j_end))); Chris@16: // const vector > e2_range (project (e2 (), range (j_begin, j_end))); Chris@16: const matrix e1_range (project (e1 (), range (i_begin, i_end), range (j_begin, j_end))); Chris@16: const vector e2_range (project (e2 (), range (j_begin, j_end))); Chris@16: v_range.plus_assign (prod (e1_range, e2_range)); Chris@16: #endif Chris@16: } Chris@16: #ifndef BOOST_UBLAS_NO_CACHE Chris@16: project (v, range (i_begin, i_end)).assign (v_range); Chris@16: #endif Chris@16: } Chris@16: #if BOOST_UBLAS_TYPE_CHECK Chris@16: BOOST_UBLAS_CHECK (norm_1 (v - cv) <= 2 * std::numeric_limits::epsilon () * verrorbound, internal_logic ()); Chris@16: #endif Chris@16: return v; Chris@16: } Chris@16: Chris@16: template Chris@16: BOOST_UBLAS_INLINE Chris@16: V Chris@16: block_prod (const vector_expression &e1, Chris@16: const matrix_expression &e2) { Chris@16: typedef V vector_type; Chris@16: typedef const E1 expression1_type; Chris@16: typedef const E2 expression2_type; Chris@16: typedef typename V::size_type size_type; Chris@16: typedef typename V::value_type value_type; Chris@16: const size_type block_size = BS; Chris@16: Chris@16: V v (e2 ().size2 ()); Chris@16: #if BOOST_UBLAS_TYPE_CHECK Chris@16: vector cv (v.size ()); Chris@16: typedef typename type_traits::real_type real_type; Chris@16: real_type verrorbound (norm_1 (v) + norm_1 (e1) * norm_1 (e2)); Chris@16: indexing_vector_assign (cv, prod (e1, e2)); Chris@16: #endif Chris@16: size_type i_size = BOOST_UBLAS_SAME (e1 ().size (), e2 ().size1 ()); Chris@16: size_type j_size = e2 ().size2 (); Chris@16: for (size_type j_begin = 0; j_begin < j_size; j_begin += block_size) { Chris@16: size_type j_end = j_begin + (std::min) (j_size - j_begin, block_size); Chris@16: // FIX: never ignore Martin Weiser's advice ;-( Chris@16: #ifdef BOOST_UBLAS_NO_CACHE Chris@16: vector_range v_range (v, range (j_begin, j_end)); Chris@16: #else Chris@16: // vector > v_range (j_end - j_begin); Chris@16: vector v_range (j_end - j_begin); Chris@16: #endif Chris@16: v_range.assign (zero_vector (j_end - j_begin)); Chris@16: for (size_type i_begin = 0; i_begin < i_size; i_begin += block_size) { Chris@16: size_type i_end = i_begin + (std::min) (i_size - i_begin, block_size); Chris@16: #ifdef BOOST_UBLAS_NO_CACHE Chris@16: const vector_range e1_range (e1 (), range (i_begin, i_end)); Chris@16: const matrix_range e2_range (e2 (), range (i_begin, i_end), range (j_begin, j_end)); Chris@16: #else Chris@16: // const vector > e1_range (project (e1 (), range (i_begin, i_end))); Chris@16: // const matrix > e2_range (project (e2 (), range (i_begin, i_end), range (j_begin, j_end))); Chris@16: const vector e1_range (project (e1 (), range (i_begin, i_end))); Chris@16: const matrix e2_range (project (e2 (), range (i_begin, i_end), range (j_begin, j_end))); Chris@16: #endif Chris@16: v_range.plus_assign (prod (e1_range, e2_range)); Chris@16: } Chris@16: #ifndef BOOST_UBLAS_NO_CACHE Chris@16: project (v, range (j_begin, j_end)).assign (v_range); Chris@16: #endif Chris@16: } Chris@16: #if BOOST_UBLAS_TYPE_CHECK Chris@16: BOOST_UBLAS_CHECK (norm_1 (v - cv) <= 2 * std::numeric_limits::epsilon () * verrorbound, internal_logic ()); Chris@16: #endif Chris@16: return v; Chris@16: } Chris@16: Chris@16: template Chris@16: BOOST_UBLAS_INLINE Chris@16: M Chris@16: block_prod (const matrix_expression &e1, Chris@16: const matrix_expression &e2, Chris@16: row_major_tag) { Chris@16: typedef M matrix_type; Chris@16: typedef const E1 expression1_type; Chris@16: typedef const E2 expression2_type; Chris@16: typedef typename M::size_type size_type; Chris@16: typedef typename M::value_type value_type; Chris@16: const size_type block_size = BS; Chris@16: Chris@16: M m (e1 ().size1 (), e2 ().size2 ()); Chris@16: #if BOOST_UBLAS_TYPE_CHECK Chris@16: matrix cm (m.size1 (), m.size2 ()); Chris@16: typedef typename type_traits::real_type real_type; Chris@16: real_type merrorbound (norm_1 (m) + norm_1 (e1) * norm_1 (e2)); Chris@16: indexing_matrix_assign (cm, prod (e1, e2), row_major_tag ()); Chris@16: disable_type_check::value = true; Chris@16: #endif Chris@16: size_type i_size = e1 ().size1 (); Chris@16: size_type j_size = e2 ().size2 (); Chris@16: size_type k_size = BOOST_UBLAS_SAME (e1 ().size2 (), e2 ().size1 ()); Chris@16: for (size_type i_begin = 0; i_begin < i_size; i_begin += block_size) { Chris@16: size_type i_end = i_begin + (std::min) (i_size - i_begin, block_size); Chris@16: for (size_type j_begin = 0; j_begin < j_size; j_begin += block_size) { Chris@16: size_type j_end = j_begin + (std::min) (j_size - j_begin, block_size); Chris@16: // FIX: never ignore Martin Weiser's advice ;-( Chris@16: #ifdef BOOST_UBLAS_NO_CACHE Chris@16: matrix_range m_range (m, range (i_begin, i_end), range (j_begin, j_end)); Chris@16: #else Chris@16: // matrix > m_range (i_end - i_begin, j_end - j_begin); Chris@16: matrix m_range (i_end - i_begin, j_end - j_begin); Chris@16: #endif Chris@16: m_range.assign (zero_matrix (i_end - i_begin, j_end - j_begin)); Chris@16: for (size_type k_begin = 0; k_begin < k_size; k_begin += block_size) { Chris@16: size_type k_end = k_begin + (std::min) (k_size - k_begin, block_size); Chris@16: #ifdef BOOST_UBLAS_NO_CACHE Chris@16: const matrix_range e1_range (e1 (), range (i_begin, i_end), range (k_begin, k_end)); Chris@16: const matrix_range e2_range (e2 (), range (k_begin, k_end), range (j_begin, j_end)); Chris@16: #else Chris@16: // const matrix > e1_range (project (e1 (), range (i_begin, i_end), range (k_begin, k_end))); Chris@16: // const matrix > e2_range (project (e2 (), range (k_begin, k_end), range (j_begin, j_end))); Chris@16: const matrix e1_range (project (e1 (), range (i_begin, i_end), range (k_begin, k_end))); Chris@16: const matrix e2_range (project (e2 (), range (k_begin, k_end), range (j_begin, j_end))); Chris@16: #endif Chris@16: m_range.plus_assign (prod (e1_range, e2_range)); Chris@16: } Chris@16: #ifndef BOOST_UBLAS_NO_CACHE Chris@16: project (m, range (i_begin, i_end), range (j_begin, j_end)).assign (m_range); Chris@16: #endif Chris@16: } Chris@16: } Chris@16: #if BOOST_UBLAS_TYPE_CHECK Chris@16: disable_type_check::value = false; Chris@16: BOOST_UBLAS_CHECK (norm_1 (m - cm) <= 2 * std::numeric_limits::epsilon () * merrorbound, internal_logic ()); Chris@16: #endif Chris@16: return m; Chris@16: } Chris@16: Chris@16: template Chris@16: BOOST_UBLAS_INLINE Chris@16: M Chris@16: block_prod (const matrix_expression &e1, Chris@16: const matrix_expression &e2, Chris@16: column_major_tag) { Chris@16: typedef M matrix_type; Chris@16: typedef const E1 expression1_type; Chris@16: typedef const E2 expression2_type; Chris@16: typedef typename M::size_type size_type; Chris@16: typedef typename M::value_type value_type; Chris@16: const size_type block_size = BS; Chris@16: Chris@16: M m (e1 ().size1 (), e2 ().size2 ()); Chris@16: #if BOOST_UBLAS_TYPE_CHECK Chris@16: matrix cm (m.size1 (), m.size2 ()); Chris@16: typedef typename type_traits::real_type real_type; Chris@16: real_type merrorbound (norm_1 (m) + norm_1 (e1) * norm_1 (e2)); Chris@16: indexing_matrix_assign (cm, prod (e1, e2), column_major_tag ()); Chris@16: disable_type_check::value = true; Chris@16: #endif Chris@16: size_type i_size = e1 ().size1 (); Chris@16: size_type j_size = e2 ().size2 (); Chris@16: size_type k_size = BOOST_UBLAS_SAME (e1 ().size2 (), e2 ().size1 ()); Chris@16: for (size_type j_begin = 0; j_begin < j_size; j_begin += block_size) { Chris@16: size_type j_end = j_begin + (std::min) (j_size - j_begin, block_size); Chris@16: for (size_type i_begin = 0; i_begin < i_size; i_begin += block_size) { Chris@16: size_type i_end = i_begin + (std::min) (i_size - i_begin, block_size); Chris@16: // FIX: never ignore Martin Weiser's advice ;-( Chris@16: #ifdef BOOST_UBLAS_NO_CACHE Chris@16: matrix_range m_range (m, range (i_begin, i_end), range (j_begin, j_end)); Chris@16: #else Chris@16: // matrix > m_range (i_end - i_begin, j_end - j_begin); Chris@16: matrix m_range (i_end - i_begin, j_end - j_begin); Chris@16: #endif Chris@16: m_range.assign (zero_matrix (i_end - i_begin, j_end - j_begin)); Chris@16: for (size_type k_begin = 0; k_begin < k_size; k_begin += block_size) { Chris@16: size_type k_end = k_begin + (std::min) (k_size - k_begin, block_size); Chris@16: #ifdef BOOST_UBLAS_NO_CACHE Chris@16: const matrix_range e1_range (e1 (), range (i_begin, i_end), range (k_begin, k_end)); Chris@16: const matrix_range e2_range (e2 (), range (k_begin, k_end), range (j_begin, j_end)); Chris@16: #else Chris@16: // const matrix > e1_range (project (e1 (), range (i_begin, i_end), range (k_begin, k_end))); Chris@16: // const matrix > e2_range (project (e2 (), range (k_begin, k_end), range (j_begin, j_end))); Chris@16: const matrix e1_range (project (e1 (), range (i_begin, i_end), range (k_begin, k_end))); Chris@16: const matrix e2_range (project (e2 (), range (k_begin, k_end), range (j_begin, j_end))); Chris@16: #endif Chris@16: m_range.plus_assign (prod (e1_range, e2_range)); Chris@16: } Chris@16: #ifndef BOOST_UBLAS_NO_CACHE Chris@16: project (m, range (i_begin, i_end), range (j_begin, j_end)).assign (m_range); Chris@16: #endif Chris@16: } Chris@16: } Chris@16: #if BOOST_UBLAS_TYPE_CHECK Chris@16: disable_type_check::value = false; Chris@16: BOOST_UBLAS_CHECK (norm_1 (m - cm) <= 2 * std::numeric_limits::epsilon () * merrorbound, internal_logic ()); Chris@16: #endif Chris@16: return m; Chris@16: } Chris@16: Chris@16: // Dispatcher Chris@16: template Chris@16: BOOST_UBLAS_INLINE Chris@16: M Chris@16: block_prod (const matrix_expression &e1, Chris@16: const matrix_expression &e2) { Chris@16: typedef typename M::orientation_category orientation_category; Chris@16: return block_prod (e1, e2, orientation_category ()); Chris@16: } Chris@16: Chris@16: }}} Chris@16: Chris@16: #endif