#ifndef VIENNACL_LINALG_DETAIL_SPAI_FSPAI_HPP #define VIENNACL_LINALG_DETAIL_SPAI_FSPAI_HPP /* ========================================================================= Copyright (c) 2010-2011, Institute for Microelectronics, Institute for Analysis and Scientific Computing, TU Wien. ----------------- ViennaCL - The Vienna Computing Library ----------------- Project Head: Karl Rupp rupp@iue.tuwien.ac.at (A list of authors and contributors can be found in the PDF manual) License: MIT (X11), see file LICENSE in the base directory ============================================================================= */ #include #include #include #include #include #include #include #include //boost includes #include "boost/numeric/ublas/vector.hpp" #include "boost/numeric/ublas/matrix.hpp" #include "boost/numeric/ublas/matrix_proxy.hpp" #include "boost/numeric/ublas/vector_proxy.hpp" #include "boost/numeric/ublas/storage.hpp" #include "boost/numeric/ublas/io.hpp" #include "boost/numeric/ublas/lu.hpp" #include "boost/numeric/ublas/triangular.hpp" #include "boost/numeric/ublas/matrix_expression.hpp" // ViennaCL includes #include "viennacl/linalg/prod.hpp" #include "viennacl/matrix.hpp" #include "viennacl/compressed_matrix.hpp" #include "viennacl/linalg/compressed_matrix_operations.hpp" #include "viennacl/linalg/matrix_operations.hpp" #include "viennacl/scalar.hpp" #include "viennacl/linalg/cg.hpp" #include "viennacl/linalg/inner_prod.hpp" #include "viennacl/linalg/ilu.hpp" //#include /** @file viennacl/linalg/detail/spai/fspai.hpp @brief Implementation of FSPAI. Experimental. */ namespace viennacl { namespace linalg { namespace detail { namespace spai { /** @brief A tag for FSPAI. Experimental. * Contains values for the algorithm. 
// Must be passed to spai_precond constructor */
class fspai_tag
{
public:
  /** @brief Constructor
  *
  * The arguments are stored as given. Unlike the setters below, the
  * constructor performs no positivity check on the threshold or the
  * iteration limit.
  *
  * @param residual_norm_threshold Calculate until the norm of the residual falls below this threshold
  * @param iteration_limit         maximum number of iterations
  * @param is_static               determines if static version of SPAI should be used
  * @param is_right                determines if left or right preconditioner should be used
  */
  fspai_tag(double residual_norm_threshold = 1e-3,
            unsigned int iteration_limit = 5,
            bool is_static = false,
            bool is_right = false)
    : _residual_norm_threshold(residual_norm_threshold),
      _iteration_limit(iteration_limit),
      _is_static(is_static),
      _is_right(is_right)
  {}

  // Getters return plain values: a top-level const on a by-value return type
  // is ignored by the compiler and only produces -Wignored-qualifiers noise.

  /** @brief Returns the stored residual norm threshold. */
  double getResidualNormThreshold() const { return _residual_norm_threshold; }

  /** @brief Returns the stored iteration limit. */
  unsigned long getIterationLimit() const { return _iteration_limit; }

  /** @brief Returns the stored 'static' flag. */
  bool getIsStatic() const { return _is_static; }

  /** @brief Returns the stored 'right preconditioner' flag. */
  bool getIsRight() const { return _is_right; }

  /** @brief Sets the residual norm threshold.
  *
  * Values that are not strictly positive are ignored and the current
  * threshold is kept.
  */
  void setResidualNormThreshold(double residual_norm_threshold)
  {
    if (residual_norm_threshold > 0)
      _residual_norm_threshold = residual_norm_threshold;
  }

  /** @brief Sets the iteration limit.
  *
  * A limit of zero is ignored and the current limit is kept.
  */
  void setIterationLimit(unsigned long iteration_limit)
  {
    if (iteration_limit > 0)
      _iteration_limit = iteration_limit;
  }

  /** @brief Sets the 'right preconditioner' flag. */
  void setIsRight(bool is_right) { _is_right = is_right; }

  /** @brief Sets the 'static' flag. */
  void setIsStatic(bool is_static) { _is_static = is_static; }

private:
  double        _residual_norm_threshold;
  unsigned long _iteration_limit;
  bool          _is_static;
  bool          _is_right;
};

//
// Helper: Store A in an STL container of type, exploiting symmetry
// Reason: ublas interface does not allow to iterate over nonzeros of a particular row without starting an iterator1 from the very beginning of the matrix...
// template void sym_sparse_matrix_to_stl(MatrixType const & A, std::vector > & STL_A) { STL_A.resize(A.size1()); for (typename MatrixType::const_iterator1 row_it = A.begin1(); row_it != A.end1(); ++row_it) { for (typename MatrixType::const_iterator2 col_it = row_it.begin(); col_it != row_it.end(); ++col_it) { if (col_it.index1() >= col_it.index2()) STL_A[col_it.index1()][col_it.index2()] = *col_it; else break; //go to next row } } } // // Generate index sets J_k, k=0,...,N-1 // template void generateJ(MatrixType const & A, std::vector > & J) { for (typename MatrixType::const_iterator1 row_it = A.begin1(); row_it != A.end1(); ++row_it) { for (typename MatrixType::const_iterator2 col_it = row_it.begin(); col_it != row_it.end(); ++col_it) { if (col_it.index1() > col_it.index2()) //Matrix is symmetric, thus only work on lower triangular part { J[col_it.index2()].push_back(col_it.index1()); J[col_it.index1()].push_back(col_it.index2()); } else break; //go to next row } } } // // Extracts the blocks A(\tilde{J}_k, \tilde{J}_k) from A // Sets up y_k = A(\tilde{J}_k, k) for the inplace-solution after Cholesky-factoriation // template void fill_blocks(std::vector< std::map > & A, std::vector & blocks, std::vector > const & J, std::vector & Y) { for (size_t k=0; k const & Jk = J[k]; VectorType & yk = Y[k]; MatrixType & block_k = blocks[k]; yk.resize(Jk.size()); block_k.resize(Jk.size(), Jk.size()); block_k.clear(); for (size_t i=0; i & A_row = A[row_index]; //fill y_k: yk[i] = A_row[k]; for (size_t j=0; j void cholesky_decompose(MatrixType & A) { for (size_t k=0; k 0); A(k,k) = std::sqrt(A(k,k)); for (size_t i=k+1; i void cholesky_solve(MatrixType const & L, VectorType & b) { typedef typename VectorType::value_type ScalarType; // inplace forward solve L x = b for (size_t i=0; i void computeL(MatrixType const & A, MatrixType & L, MatrixType & L_trans, std::vector & Y, std::vector > & J) { typedef typename VectorType1::value_type ScalarType; typedef std::vector > 
STLSparseMatrixType; STLSparseMatrixType L_temp(A.size1()); for (size_t k=0; k const & Jk = J[k]; VectorType1 const & yk = Y[k]; //compute L(k,k): ScalarType Lkk = A(k,k); for (size_t i=0; i::const_iterator it = L_temp[i].begin(); it != L_temp[i].end(); ++it) L(i, it->first) = it->second; } // // Top level FSPAI function // template void computeFSPAI(MatrixType const & A, MatrixType const & PatternA, MatrixType & L, MatrixType & L_trans, fspai_tag const & tag) { typedef typename MatrixType::value_type ScalarType; typedef boost::numeric::ublas::matrix DenseMatrixType; typedef std::vector > SparseMatrixType; // // preprocessing: Store A in a STL container: // //std::cout << "Transferring to STL container:" << std::endl; std::vector > y_k(A.size1()); SparseMatrixType STL_A(A.size1()); sym_sparse_matrix_to_stl(A, STL_A); // // Step 1: Generate pattern indices // //std::cout << "computeFSPAI(): Generating pattern..." << std::endl; std::vector > J(A.size1()); generateJ(PatternA, J); // // Step 2: Set up matrix blocks // //std::cout << "computeFSPAI(): Setting up matrix blocks..." << std::endl; std::vector subblocks_A(A.size1()); fill_blocks(STL_A, subblocks_A, J, y_k); STL_A.clear(); //not needed anymore // // Step 3: Cholesky-factor blocks // //std::cout << "computeFSPAI(): Cholesky-factorization..." << std::endl; for (size_t i=0; i 0) //block might be empty... { //y_k[i].resize(subblocks_A[i].size1()); //std::cout << "y_k[" << i << "]: "; //for (size_t j=0; j