doc/ilut_8hpp_source.html

 #ifndef VIENNACL_LINALG_DETAIL_ILUT_HPP_

 #define VIENNACL_LINALG_DETAIL_ILUT_HPP_


 /* =========================================================================

    Copyright (c) 2010-2016, Institute for Microelectronics,

                             Institute for Analysis and Scientific Computing,

                             TU Wien.

    Portions of this software are copyright by UChicago Argonne, LLC.


                             -----------------

                   ViennaCL - The Vienna Computing Library

                             -----------------


    Project Head:    Karl Rupp                   rupp@iue.tuwien.ac.at


    (A list of authors and contributors can be found in the manual)


    License:         MIT (X11), see file LICENSE in the base directory

 ============================================================================= */


 #include <vector>

 #include <cmath>

 #include <iostream>

 #include "viennacl/forwards.h"

 #include "viennacl/tools/tools.hpp"


 #include "viennacl/linalg/detail/ilu/common.hpp"

 #include "viennacl/compressed_matrix.hpp"


 #include "viennacl/linalg/host_based/common.hpp"


 #include <map>


 namespace viennacl

 {

 namespace linalg

 {


 /** @brief Configuration tag for the incomplete LU factorization with threshold (ILUT).
  *
  * Bundles the three knobs read by precondition() and ilut_precond:
  *  - the maximum number of off-diagonal entries kept per row of L and of U,
  *  - the drop tolerance, which precondition() scales by the 2-norm of the current row,
  *  - whether the compressed_matrix specialization of ilut_precond uses level scheduling.
  *
  * Note that the constructor stores its arguments unchecked, whereas the setters
  * silently ignore non-positive values.
  */
 class ilut_tag
 {
   public:
     /** @brief The constructor.
      *
      * @param entries_per_row        Maximum number of entries kept per row in each of L and U
      * @param drop_tolerance         Relative threshold below which entries are dropped
      * @param with_level_scheduling  Enables level scheduling in the preconditioner application
      */
     ilut_tag(unsigned int entries_per_row = 20,
              double       drop_tolerance = 1e-4,
              bool         with_level_scheduling = false)
       : entries_per_row_(entries_per_row),
         drop_tolerance_(drop_tolerance),
         use_level_scheduling_(with_level_scheduling)
     {}

     /** @brief Returns the current drop tolerance. */
     double get_drop_tolerance() const { return drop_tolerance_; }

     /** @brief Sets a new drop tolerance. Values which are not strictly positive are ignored. */
     void set_drop_tolerance(double tol)
     {
       if (!(tol > 0))
         return;

       drop_tolerance_ = tol;
     }

     /** @brief Returns the maximum number of entries kept per row. */
     unsigned int get_entries_per_row() const { return entries_per_row_; }

     /** @brief Sets the maximum number of entries kept per row. A value of zero is ignored. */
     void set_entries_per_row(unsigned int e)
     {
       if (e == 0)
         return;

       entries_per_row_ = e;
     }

     /** @brief Returns whether level scheduling is requested. */
     bool use_level_scheduling() const { return use_level_scheduling_; }

     /** @brief Enables or disables level scheduling. */
     void use_level_scheduling(bool b) { use_level_scheduling_ = b; }

   private:
     unsigned int entries_per_row_;
     double       drop_tolerance_;
     bool         use_level_scheduling_;
 };


 namespace detail

 {

   /** @brief Helper struct holding a sparse vector as two parallel arrays (column indices and values).
    *
    * The arrays only ever grow; size_ tracks how many leading entries are currently in use.
    * For internal use only.
    */
   template<typename NumericT>
   struct ilut_sparse_vector
   {
     /** @brief Allocates storage for alloc_size entries. The vector starts out logically empty (size_ == 0). */
     ilut_sparse_vector(vcl_size_t alloc_size = 0)
       : size_(0),
         col_indices_(alloc_size),
         elements_(alloc_size)
     {}

     /** @brief Sets the logical size to s, enlarging both arrays first if they are too small.
      *
      * Storage is never shrunk, so a smaller s only changes size_.
      */
     void resize_if_bigger(vcl_size_t s)
     {
       bool const needs_growth = elements_.size() < s;
       if (needs_growth)
       {
         col_indices_.resize(s);
         elements_.resize(s);
       }

       size_ = s;
     }

     vcl_size_t                size_;         ///< Number of entries currently in use
     std::vector<unsigned int> col_indices_;  ///< Column index of each entry
     std::vector<NumericT>     elements_;     ///< Value of each entry
   };


   /** @brief Computes z = w - alpha * u for two sparse vectors given as (index, value) arrays.
    *
    * Both inputs are walked front to back in a single merge pass, so the output indices are
    * ascending provided both inputs are ascending. Indices present in only one input are
    * carried over (negated and scaled for u). No entry is dropped, even if it evaluates to zero.
    *
    * @param w_coords    Indices of w
    * @param w_elements  Values of w
    * @param w_size      Number of entries in w
    * @param u_coords    Indices of u
    * @param u_elements  Values of u
    * @param u_size      Number of entries in u
    * @param alpha       Scaling factor applied to u
    * @param z_coords    Output indices; must provide room for up to w_size + u_size entries
    * @param z_elements  Output values; must provide room for up to w_size + u_size entries
    * @return Number of entries written to z
    */
   template<typename IndexT, typename NumericT>
   IndexT merge_subtract_sparse_rows(IndexT const * w_coords, NumericT const * w_elements, IndexT w_size,
                                     IndexT const * u_coords, NumericT const * u_elements, IndexT u_size, NumericT alpha,
                                     IndexT       * z_coords, NumericT       * z_elements)
   {
     IndexT pos_w = 0;
     IndexT pos_u = 0;
     IndexT pos_z = 0;

     // Phase 1: both inputs still have entries, emit the smaller index (or combine on a match).
     while (pos_w < w_size && pos_u < u_size)
     {
       IndexT const col_w = w_coords[pos_w];
       IndexT const col_u = u_coords[pos_u];

       if (col_w == col_u)
       {
         z_coords[pos_z]   = col_w;
         z_elements[pos_z] = w_elements[pos_w] - alpha * u_elements[pos_u];
         ++pos_w;
         ++pos_u;
       }
       else if (col_w < col_u)
       {
         z_coords[pos_z]   = col_w;
         z_elements[pos_z] = w_elements[pos_w];
         ++pos_w;
       }
       else
       {
         z_coords[pos_z]   = col_u;
         z_elements[pos_z] = - alpha * u_elements[pos_u];
         ++pos_u;
       }
       ++pos_z;
     }

     // Phase 2: exactly one input may have a tail left over.
     if (pos_w == w_size)
     {
       for (; pos_u < u_size; ++pos_u, ++pos_z)
       {
         z_coords[pos_z]   = u_coords[pos_u];
         z_elements[pos_z] = - alpha * u_elements[pos_u];
       }
     }
     else if (pos_u == u_size)
     {
       for (; pos_w < w_size; ++pos_w, ++pos_z)
       {
         z_coords[pos_z]   = w_coords[pos_w];
         z_elements[pos_z] = w_elements[pos_w];
       }
     }

     return pos_z;
   }


   /** @brief Inserts (index, value) into a fixed-length list of the largest-magnitude entries.
    *
    * 'map' is expected to be ordered by decreasing absolute value of the second pair member.
    * The new entry is placed in front of the first entry whose magnitude is not larger than
    * its own; all following entries move one slot towards the end and the last one falls off.
    * The length of 'map' never changes.
    *
    * Nothing happens if the value has zero magnitude, or if every entry in 'map' already has
    * a strictly larger magnitude.
    *
    * @param map    Fixed-size list of (index, value) pairs, ordered by decreasing |value|
    * @param index  Index of the candidate entry
    * @param value  Value of the candidate entry
    */
   template<typename SizeT, typename NumericT>
   void insert_with_value_sort(std::vector<std::pair<SizeT, NumericT> > & map,
                               SizeT index, NumericT value)
   {
     NumericT const magnitude = std::fabs(value);
     if (!(magnitude > 0))
       return;

     // locate the first slot holding an entry that is not larger in magnitude:
     std::size_t const num_slots = map.size();
     std::size_t slot = 0;
     while (slot < num_slots && std::fabs(map[slot].second) > magnitude)
       ++slot;

     if (slot >= num_slots)
       return; // candidate is smaller than everything kept so far

     // shift the tail by one (discarding the last entry) and store the candidate:
     for (std::size_t j = num_slots - 1; j > slot; --j)
       map[j] = map[j - 1];

     map[slot] = std::pair<SizeT, NumericT>(index, value);
   }


 }


 /** @brief Computes an incomplete LU factorization with threshold (ILUT) of a CSR matrix.
  *
  * The factors are written row by row directly into the CSR arrays of L and U:
  *  - L receives, per row, up to tag.get_entries_per_row() entries with column < row.
  *  - U receives, per row, the diagonal entry first, followed by up to
  *    tag.get_entries_per_row() entries with column > row.
  * Within each of these groups, the entries of largest magnitude are kept and then stored in
  * ascending column order.
  *
  * The raw arrays of A, L and U are accessed via host_based::detail::extract_raw_pointer(),
  * hence all three matrices are presumably required to reside in main memory (callers in this
  * file switch the memory context accordingly before calling).
  * The elimination reads the leading entries of each row of A as its lower-triangular part, so
  * the column indices within each row of A are assumed to be sorted in ascending order.
  *
  * @param A    Input matrix in CSR format
  * @param L    Output: lower triangular factor (entries with column < row only); same number of rows as A
  * @param U    Output: upper triangular factor including the diagonal; same number of rows as A
  * @param tag  ILUT parameters (entries per row, drop tolerance)
  *
  * @throws zero_on_diagonal_exception if the diagonal entry of a row of U is zero, either because
  *         it was computed to zero or because the row carries no diagonal entry at all.
  */
 template<typename NumericT>
 void precondition(viennacl::compressed_matrix<NumericT> const & A,
                   viennacl::compressed_matrix<NumericT>       & L,
                   viennacl::compressed_matrix<NumericT>       & U,
                   ilut_tag const & tag)
 {
   assert(A.size1() == L.size1() && bool("Output matrix size mismatch") );
   assert(A.size1() == U.size1() && bool("Output matrix size mismatch") );

   // Nothing to factorize for a matrix without rows.
   // Returning here also avoids the division by A.size1() below.
   if (A.size1() == 0)
     return;

   // Each row of L holds at most 'entries_per_row' entries, each row of U one more (the diagonal):
   L.reserve( tag.get_entries_per_row()      * A.size1());
   U.reserve((tag.get_entries_per_row() + 1) * A.size1());

   // Two work vectors used in ping-pong fashion: each elimination step reads w_in and writes w_out.
   // The initial allocation is only a guess, resize_if_bigger() enlarges them on demand.
   vcl_size_t avg_nnz_per_row = static_cast<vcl_size_t>(A.nnz() / A.size1());
   detail::ilut_sparse_vector<NumericT> w1(tag.get_entries_per_row() * (avg_nnz_per_row + 10));
   detail::ilut_sparse_vector<NumericT> w2(tag.get_entries_per_row() * (avg_nnz_per_row + 10));
   detail::ilut_sparse_vector<NumericT> * w_in  = &w1;
   detail::ilut_sparse_vector<NumericT> * w_out = &w2;
   std::vector<NumericT> diagonal_U(A.size1());   // value-initialized, i.e. all zeros

   NumericT     const * elements_A   = viennacl::linalg::host_based::detail::extract_raw_pointer<NumericT>(A.handle());
   unsigned int const * row_buffer_A = viennacl::linalg::host_based::detail::extract_raw_pointer<unsigned int>(A.handle1());
   unsigned int const * col_buffer_A = viennacl::linalg::host_based::detail::extract_raw_pointer<unsigned int>(A.handle2());

   NumericT           * elements_L   = viennacl::linalg::host_based::detail::extract_raw_pointer<NumericT>(L.handle());
   unsigned int       * row_buffer_L = viennacl::linalg::host_based::detail::extract_raw_pointer<unsigned int>(L.handle1()); row_buffer_L[0] = 0;
   unsigned int       * col_buffer_L = viennacl::linalg::host_based::detail::extract_raw_pointer<unsigned int>(L.handle2());

   NumericT           * elements_U   = viennacl::linalg::host_based::detail::extract_raw_pointer<NumericT>(U.handle());
   unsigned int       * row_buffer_U = viennacl::linalg::host_based::detail::extract_raw_pointer<unsigned int>(U.handle1()); row_buffer_U[0] = 0;
   unsigned int       * col_buffer_U = viennacl::linalg::host_based::detail::extract_raw_pointer<unsigned int>(U.handle2());

   // Fixed-size lists collecting the largest entries of the current row for L and U, respectively:
   std::vector<std::pair<unsigned int, NumericT> > sorted_entries_L(tag.get_entries_per_row());
   std::vector<std::pair<unsigned int, NumericT> > sorted_entries_U(tag.get_entries_per_row());

   for (vcl_size_t i=0; i<viennacl::traits::size1(A); ++i)  // Line 1
   {
     // reset to (0, 0) pairs; zero values mark unused slots and are skipped when writing L and U
     std::fill(sorted_entries_L.begin(), sorted_entries_L.end(), std::pair<unsigned int, NumericT>(0, NumericT(0)));
     std::fill(sorted_entries_U.begin(), sorted_entries_U.end(), std::pair<unsigned int, NumericT>(0, NumericT(0)));

     //line 2: set up w as a copy of row i of A and compute the 2-norm of that row
     w_in->resize_if_bigger(row_buffer_A[i+1] - row_buffer_A[i]);
     NumericT row_norm = 0;
     unsigned int k = 0;
     for (unsigned int j = row_buffer_A[i]; j < row_buffer_A[i+1]; ++j, ++k)
     {
       w_in->col_indices_[k] = col_buffer_A[j];
       NumericT entry = elements_A[j];
       w_in->elements_[k] = entry;
       row_norm += entry * entry;
     }
     row_norm = std::sqrt(row_norm);
     NumericT tau_i = static_cast<NumericT>(tag.get_drop_tolerance()) * row_norm;   // row-relative drop threshold

     //line 3: Iterate over lower diagonal parts of A:
     k = 0;
     unsigned int current_col = (row_buffer_A[i+1] > row_buffer_A[i]) ? w_in->col_indices_[k] : static_cast<unsigned int>(i); // mind empty rows here!
     while (current_col < i)
     {
       //line 4: scale by the pivot of the row to be eliminated
       NumericT a_kk = diagonal_U[current_col];

       NumericT w_k_entry = w_in->elements_[k] / a_kk;
       w_in->elements_[k] = w_k_entry;

       //lines 5,6: (dropping rule to w_k)
       if ( std::fabs(w_k_entry) > tau_i)
       {
         //line 7: w <- w - w_k * u_k, where u_k is row 'current_col' of U without its diagonal
         unsigned int row_U_begin = row_buffer_U[current_col];
         unsigned int row_U_end   = row_buffer_U[current_col + 1];

         // Every row of U written so far starts with its diagonal entry, hence the '+ 1' / '- 1' offsets below.
         if (row_U_end > row_U_begin)
         {
           w_out->resize_if_bigger(w_in->size_ + (row_U_end - row_U_begin) - 1);
           w_out->size_ = detail::merge_subtract_sparse_rows(&(w_in->col_indices_[0]), &(w_in->elements_[0]), static_cast<unsigned int>(w_in->size_),
                                                             col_buffer_U + row_U_begin + 1, elements_U + row_U_begin + 1, (row_U_end - row_U_begin) - 1, w_k_entry,
                                                             &(w_out->col_indices_[0]), &(w_out->elements_[0])
                                                            );
           ++k;
         }
       }
       else // drop element
       {
         // copy w_in to w_out, leaving out entry k
         w_out->resize_if_bigger(w_in->size_ - 1);
         for (unsigned int r = 0; r < k; ++r)
         {
           w_out->col_indices_[r] = w_in->col_indices_[r];
           w_out->elements_[r]    = w_in->elements_[r];
         }
         for (unsigned int r = k+1; r < w_in->size_; ++r)
         {
           w_out->col_indices_[r-1] = w_in->col_indices_[r];
           w_out->elements_[r-1]    = w_in->elements_[r];
         }

         // Note: No increment to k here, element was dropped!
       }

       // swap pointers to w1 and w2
       std::swap(w_in, w_out);

       // process next entry:
       current_col = (k < w_in->size_) ? w_in->col_indices_[k] : static_cast<unsigned int>(i);
     } // while()

     // Line 10: Apply a dropping rule to w
     // To do so, we write values to a temporary array
     for (unsigned int r = 0; r < w_in->size_; ++r)
     {
       unsigned int col   = w_in->col_indices_[r];
       NumericT     value = w_in->elements_[r];

       if (col < i) // entry for L:
         detail::insert_with_value_sort(sorted_entries_L, col, value);
       else if (col == i) // do not drop diagonal element
         diagonal_U[i] = value;
       else // entry for U:
         detail::insert_with_value_sort(sorted_entries_U, col, value);
     }

     // The diagonal of U is used as a divisor in later rows and in the triangular solve, so it must be nonzero.
     // This check runs after the scan above (rather than only when a diagonal entry is encountered) so that
     // rows without any diagonal entry, for which diagonal_U[i] still holds its initial zero, are caught as well.
     NumericT const diagonal_value = diagonal_U[i];
     if (diagonal_value <= 0 && diagonal_value >= 0)
     {
       std::cerr << "ViennaCL: FATAL ERROR in ILUT(): Diagonal entry computed to zero (" << diagonal_value << ") in row " << i << "!" << std::endl;
       throw zero_on_diagonal_exception("ILUT zero diagonal!");
     }

     //Lines 10-12: Apply a dropping rule to w, write the largest p values to L and U
     unsigned int offset_L = row_buffer_L[i];
     std::sort(sorted_entries_L.begin(), sorted_entries_L.end());   // reorder kept entries by column index
     for (unsigned int j=0; j<tag.get_entries_per_row(); ++j)
       if (std::fabs(sorted_entries_L[j].second) > 0)
       {
         col_buffer_L[offset_L] = sorted_entries_L[j].first;
         elements_L[offset_L]   = sorted_entries_L[j].second;
         ++offset_L;
       }
     row_buffer_L[i+1] = offset_L;

     // U: diagonal entry first, then the kept entries right of the diagonal
     unsigned int offset_U = row_buffer_U[i];
     col_buffer_U[offset_U] = static_cast<unsigned int>(i);
     elements_U[offset_U]   = diagonal_U[i];
     ++offset_U;
     std::sort(sorted_entries_U.begin(), sorted_entries_U.end());   // reorder kept entries by column index
     for (unsigned int j=0; j<tag.get_entries_per_row(); ++j)
       if (std::fabs(sorted_entries_U[j].second) > 0)
       {
         col_buffer_U[offset_U] = sorted_entries_U[j].first;
         elements_U[offset_U]   = sorted_entries_U[j].second;
         ++offset_U;
       }
     row_buffer_U[i+1] = offset_U;

   } //for i
 }


 template<typename MatrixT>

 class ilut_precond

 {

   typedef typename MatrixT::value_type      NumericType;


 public:

   ilut_precond(MatrixT const & mat, ilut_tag const & tag) : tag_(tag), L_(mat.size1(), mat.size2()), U_(mat.size1(), mat.size2())

   {

     //initialize preconditioner:

     //std::cout << "Start CPU precond" << std::endl;

     init(mat);

     //std::cout << "End CPU precond" << std::endl;

   }


   template<typename VectorT>

   void apply(VectorT & vec) const

   {

     //Note: Since vec can be a rather arbitrary vector type, we call the more generic version in the backend manually:

     {

       unsigned int const * row_buffer = viennacl::linalg::host_based::detail::extract_raw_pointer<unsigned int>(L_.handle1());

       unsigned int const * col_buffer = viennacl::linalg::host_based::detail::extract_raw_pointer<unsigned int>(L_.handle2());

       NumericType  const * elements   = viennacl::linalg::host_based::detail::extract_raw_pointer<NumericType>(L_.handle());


       viennacl::linalg::host_based::detail::csr_inplace_solve<NumericType>(row_buffer, col_buffer, elements, vec, L_.size2(), unit_lower_tag());

     }

     {

       unsigned int const * row_buffer = viennacl::linalg::host_based::detail::extract_raw_pointer<unsigned int>(U_.handle1());

       unsigned int const * col_buffer = viennacl::linalg::host_based::detail::extract_raw_pointer<unsigned int>(U_.handle2());

       NumericType  const * elements   = viennacl::linalg::host_based::detail::extract_raw_pointer<NumericType>(U_.handle());


       viennacl::linalg::host_based::detail::csr_inplace_solve<NumericType>(row_buffer, col_buffer, elements, vec, U_.size2(), upper_tag());

     }

   }


 private:

   void init(MatrixT const & mat)

   {

     viennacl::context host_context(viennacl::MAIN_MEMORY);

     viennacl::compressed_matrix<NumericType> temp;

     viennacl::switch_memory_context(temp, host_context);

     viennacl::switch_memory_context(L_, host_context);

     viennacl::switch_memory_context(U_, host_context);


     viennacl::copy(mat, temp);


     viennacl::linalg::precondition(temp, L_, U_, tag_);

   }


   ilut_tag tag_;

   viennacl::compressed_matrix<NumericType> L_;

   viennacl::compressed_matrix<NumericType> U_;

 };


 template<typename NumericT, unsigned int AlignmentV>

 class ilut_precond< viennacl::compressed_matrix<NumericT, AlignmentV> >

 {

 typedef viennacl::compressed_matrix<NumericT, AlignmentV>   MatrixType;


 public:

   ilut_precond(MatrixType const & mat, ilut_tag const & tag)

     : tag_(tag),

       L_(mat.size1(), mat.size2(), viennacl::traits::context(mat)),

       U_(mat.size1(), mat.size2(), viennacl::traits::context(mat))

   {

     //initialize preconditioner:

     //std::cout << "Start GPU precond" << std::endl;

     init(mat);

     //std::cout << "End GPU precond" << std::endl;

   }


   void apply(viennacl::vector<NumericT> & vec) const

   {

     if (vec.handle().get_active_handle_id() != viennacl::MAIN_MEMORY)

     {

       if (tag_.use_level_scheduling())

       {

         //std::cout << "Using multifrontal on GPU..." << std::endl;

         detail::level_scheduling_substitute(vec,

                                             multifrontal_L_row_index_arrays_,

                                             multifrontal_L_row_buffers_,

                                             multifrontal_L_col_buffers_,

                                             multifrontal_L_element_buffers_,

                                             multifrontal_L_row_elimination_num_list_);


         vec = viennacl::linalg::element_div(vec, multifrontal_U_diagonal_);


         detail::level_scheduling_substitute(vec,

                                             multifrontal_U_row_index_arrays_,

                                             multifrontal_U_row_buffers_,

                                             multifrontal_U_col_buffers_,

                                             multifrontal_U_element_buffers_,

                                             multifrontal_U_row_elimination_num_list_);


       }

       else

       {

         viennacl::context host_context(viennacl::MAIN_MEMORY);

         viennacl::context old_context = viennacl::traits::context(vec);

         viennacl::switch_memory_context(vec, host_context);

         viennacl::linalg::inplace_solve(L_, vec, unit_lower_tag());

         viennacl::linalg::inplace_solve(U_, vec, upper_tag());

         viennacl::switch_memory_context(vec, old_context);

       }

     }

     else //apply ILUT directly:

     {

       viennacl::linalg::inplace_solve(L_, vec, unit_lower_tag());

       viennacl::linalg::inplace_solve(U_, vec, upper_tag());

     }

   }


 private:

   void init(MatrixType const & mat)

   {

     viennacl::context host_context(viennacl::MAIN_MEMORY);

     viennacl::switch_memory_context(L_, host_context);

     viennacl::switch_memory_context(U_, host_context);


     if (viennacl::traits::context(mat).memory_type() == viennacl::MAIN_MEMORY)

     {

       viennacl::linalg::precondition(mat, L_, U_, tag_);

     }

     else //we need to copy to CPU

     {

       viennacl::compressed_matrix<NumericT> cpu_mat(mat.size1(), mat.size2(), viennacl::traits::context(mat));

       viennacl::switch_memory_context(cpu_mat, host_context);


       cpu_mat = mat;


       viennacl::linalg::precondition(cpu_mat, L_, U_, tag_);

     }


     if (!tag_.use_level_scheduling())

       return;


     //

     // multifrontal part:

     //


     viennacl::switch_memory_context(multifrontal_U_diagonal_, host_context);

     multifrontal_U_diagonal_.resize(U_.size1(), false);

     host_based::detail::row_info(U_, multifrontal_U_diagonal_, viennacl::linalg::detail::SPARSE_ROW_DIAGONAL);


     detail::level_scheduling_setup_L(L_,

                                      multifrontal_U_diagonal_, //dummy

                                      multifrontal_L_row_index_arrays_,

                                      multifrontal_L_row_buffers_,

                                      multifrontal_L_col_buffers_,

                                      multifrontal_L_element_buffers_,

                                      multifrontal_L_row_elimination_num_list_);


     detail::level_scheduling_setup_U(U_,

                                      multifrontal_U_diagonal_,

                                      multifrontal_U_row_index_arrays_,

                                      multifrontal_U_row_buffers_,

                                      multifrontal_U_col_buffers_,

                                      multifrontal_U_element_buffers_,

                                      multifrontal_U_row_elimination_num_list_);


     //

     // Bring to device if necessary:

     //


     // L:


     for (typename std::list< viennacl::backend::mem_handle >::iterator it  = multifrontal_L_row_index_arrays_.begin();

                                                                        it != multifrontal_L_row_index_arrays_.end();

                                                                      ++it)

       viennacl::backend::switch_memory_context<unsigned int>(*it, viennacl::traits::context(mat));


     for (typename std::list< viennacl::backend::mem_handle >::iterator it  = multifrontal_L_row_buffers_.begin();

                                                                        it != multifrontal_L_row_buffers_.end();

                                                                      ++it)

       viennacl::backend::switch_memory_context<unsigned int>(*it, viennacl::traits::context(mat));


     for (typename std::list< viennacl::backend::mem_handle >::iterator it  = multifrontal_L_col_buffers_.begin();

                                                                        it != multifrontal_L_col_buffers_.end();

                                                                      ++it)

       viennacl::backend::switch_memory_context<unsigned int>(*it, viennacl::traits::context(mat));


     for (typename std::list< viennacl::backend::mem_handle >::iterator it  = multifrontal_L_element_buffers_.begin();

                                                                        it != multifrontal_L_element_buffers_.end();

                                                                      ++it)

       viennacl::backend::switch_memory_context<NumericT>(*it, viennacl::traits::context(mat));


     // U:


     viennacl::switch_memory_context(multifrontal_U_diagonal_, viennacl::traits::context(mat));


     for (typename std::list< viennacl::backend::mem_handle >::iterator it  = multifrontal_U_row_index_arrays_.begin();

                                                                        it != multifrontal_U_row_index_arrays_.end();

                                                                      ++it)

       viennacl::backend::switch_memory_context<unsigned int>(*it, viennacl::traits::context(mat));


     for (typename std::list< viennacl::backend::mem_handle >::iterator it  = multifrontal_U_row_buffers_.begin();

                                                                        it != multifrontal_U_row_buffers_.end();

                                                                      ++it)

       viennacl::backend::switch_memory_context<unsigned int>(*it, viennacl::traits::context(mat));


     for (typename std::list< viennacl::backend::mem_handle >::iterator it  = multifrontal_U_col_buffers_.begin();

                                                                        it != multifrontal_U_col_buffers_.end();

                                                                      ++it)

       viennacl::backend::switch_memory_context<unsigned int>(*it, viennacl::traits::context(mat));


     for (typename std::list< viennacl::backend::mem_handle >::iterator it  = multifrontal_U_element_buffers_.begin();

                                                                        it != multifrontal_U_element_buffers_.end();

                                                                      ++it)

       viennacl::backend::switch_memory_context<NumericT>(*it, viennacl::traits::context(mat));


   }


   ilut_tag tag_;

   viennacl::compressed_matrix<NumericT> L_;

   viennacl::compressed_matrix<NumericT> U_;


   std::list<viennacl::backend::mem_handle> multifrontal_L_row_index_arrays_;

   std::list<viennacl::backend::mem_handle> multifrontal_L_row_buffers_;

   std::list<viennacl::backend::mem_handle> multifrontal_L_col_buffers_;

   std::list<viennacl::backend::mem_handle> multifrontal_L_element_buffers_;

   std::list<vcl_size_t > multifrontal_L_row_elimination_num_list_;


   viennacl::vector<NumericT> multifrontal_U_diagonal_;

   std::list<viennacl::backend::mem_handle> multifrontal_U_row_index_arrays_;

   std::list<viennacl::backend::mem_handle> multifrontal_U_row_buffers_;

   std::list<viennacl::backend::mem_handle> multifrontal_U_col_buffers_;

   std::list<viennacl::backend::mem_handle> multifrontal_U_element_buffers_;

   std::list<vcl_size_t > multifrontal_U_row_elimination_num_list_;

 };


 } // namespace linalg

 } // namespace viennacl


 #endif


viennacl::compressed_matrix::size2
const vcl_size_t & size2() const
Returns the number of columns.
Definition: compressed_matrix.hpp:929

viennacl::traits::fill
void fill(MatrixType &matrix, vcl_size_t row_index, vcl_size_t col_index, NumericT value)
Generic filler routine for setting an entry of a matrix to a particular value.
Definition: fill.hpp:46

viennacl::linalg::element_div
viennacl::vector_expression< const vector_base< T >, const vector_base< T >, op_element_binary< op_div > > element_div(vector_base< T > const &v1, vector_base< T > const &v2)

viennacl::zero_on_diagonal_exception
Definition: forwards.h:597

viennacl::linalg::inplace_solve
void inplace_solve(const matrix_base< NumericT > &A, matrix_base< NumericT > &B, SolverTagT)
Direct inplace solver for triangular systems with multiple right hand sides, i.e. A \ B (MATLAB notation).
Definition: direct_solve.hpp:217

viennacl::linalg::detail::merge_subtract_sparse_rows
IndexT merge_subtract_sparse_rows(IndexT const *w_coords, NumericT const *w_elements, IndexT w_size, IndexT const *u_coords, NumericT const *u_elements, IndexT u_size, NumericT alpha, IndexT *z_coords, NumericT *z_elements)
Subtracts a scaled sparse vector u from a sparse vector w and writes the output to z: z = w - alpha * u.
Definition: ilut.hpp:120

viennacl::linalg::ilut_precond::ilut_precond
ilut_precond(MatrixT const &mat, ilut_tag const &tag)
Definition: ilut.hpp:357

viennacl::compressed_matrix::size1
const vcl_size_t & size1() const
Returns the number of rows.
Definition: compressed_matrix.hpp:927

tools.hpp
Various little tools used here and there in ViennaCL.

viennacl::traits::size1
vcl_size_t size1(MatrixType const &mat)
Generic routine for obtaining the number of rows of a matrix (ViennaCL, uBLAS, etc.)
Definition: size.hpp:163

viennacl::linalg::detail::ilut_sparse_vector::size_
vcl_size_t size_
Definition: ilut.hpp:108

viennacl::linalg::detail::ilut_sparse_vector::col_indices_
std::vector< unsigned int > col_indices_
Definition: ilut.hpp:109

viennacl::linalg::ilut_tag::set_entries_per_row
void set_entries_per_row(unsigned int e)
Definition: ilut.hpp:68

viennacl::linalg::precondition
void precondition(viennacl::compressed_matrix< NumericT > &A, ilu0_tag const &)
Implementation of a ILU-preconditioner with static pattern. Optimized version for CSR matrices...
Definition: ilu0.hpp:78

forwards.h
This file provides the forward declarations for the main types used within ViennaCL.

viennacl::linalg::ilut_tag::use_level_scheduling
bool use_level_scheduling() const
Definition: ilut.hpp:76

viennacl::linalg::detail::level_scheduling_setup_U
void level_scheduling_setup_U(viennacl::compressed_matrix< NumericT, AlignmentV > const &LU, viennacl::vector< NumericT > const &diagonal_LU, std::list< viennacl::backend::mem_handle > &row_index_arrays, std::list< viennacl::backend::mem_handle > &row_buffers, std::list< viennacl::backend::mem_handle > &col_buffers, std::list< viennacl::backend::mem_handle > &element_buffers, std::list< vcl_size_t > &row_elimination_num_list)
Definition: common.hpp:208

viennacl::traits::size2
result_of::size_type< MatrixType >::type size2(MatrixType const &mat)
Generic routine for obtaining the number of columns of a matrix (ViennaCL, uBLAS, etc.)
Definition: size.hpp:201

viennacl::linalg::detail::level_scheduling_substitute
void level_scheduling_substitute(viennacl::vector< NumericT > &vec, std::list< viennacl::backend::mem_handle > const &row_index_arrays, std::list< viennacl::backend::mem_handle > const &row_buffers, std::list< viennacl::backend::mem_handle > const &col_buffers, std::list< viennacl::backend::mem_handle > const &element_buffers, std::list< vcl_size_t > const &row_elimination_num_list)
Definition: common.hpp:224

viennacl::compressed_matrix::handle
const handle_type & handle() const
Returns the OpenCL handle to the matrix entry array.
Definition: compressed_matrix.hpp:942

viennacl::compressed_matrix::handle1
const handle_type & handle1() const
Returns the OpenCL handle to the row index array.
Definition: compressed_matrix.hpp:936

viennacl::compressed_matrix::nnz
const vcl_size_t & nnz() const
Returns the number of nonzero entries.
Definition: compressed_matrix.hpp:931

NumericT
float NumericT
Definition: bisect.cpp:40

viennacl::context
Represents a generic 'context' similar to an OpenCL context, but is backend-agnostic and thus also su...
Definition: context.hpp:39

viennacl::linalg::ilut_precond::apply
void apply(VectorT &vec) const
Definition: ilut.hpp:366

viennacl::linalg::detail::ilut_sparse_vector::resize_if_bigger
void resize_if_bigger(vcl_size_t s)
Definition: ilut.hpp:98

viennacl::linalg::upper_tag
A tag class representing an upper triangular matrix.
Definition: forwards.h:854

viennacl::linalg::ilut_tag
A tag for incomplete LU factorization with threshold (ILUT)
Definition: ilut.hpp:45

compressed_matrix.hpp
Implementation of the compressed_matrix class.

viennacl::linalg::ilut_precond< viennacl::compressed_matrix< NumericT, AlignmentV > >::ilut_precond
ilut_precond(MatrixType const &mat, ilut_tag const &tag)
Definition: ilut.hpp:415

viennacl::linalg::ilut_tag::get_entries_per_row
unsigned int get_entries_per_row() const
Definition: ilut.hpp:74

viennacl::compressed_matrix::handle2
const handle_type & handle2() const
Returns the OpenCL handle to the column index array.
Definition: compressed_matrix.hpp:938

viennacl::linalg::ilut_precond
ILUT preconditioner class, can be supplied to solve()-routines.
Definition: ilut.hpp:352

viennacl::linalg::detail::insert_with_value_sort
void insert_with_value_sort(std::vector< std::pair< SizeT, NumericT > > &map, SizeT index, NumericT value)
Definition: ilut.hpp:164

viennacl::vcl_size_t
std::size_t vcl_size_t
Definition: forwards.h:75

common.hpp
Common routines for single-threaded or OpenMP-enabled execution on CPU.

viennacl::vector< NumericT >

viennacl::linalg::cuda::swap
viennacl::enable_if< viennacl::is_scalar< ScalarT1 >::value &&viennacl::is_scalar< ScalarT2 >::value >::type swap(ScalarT1 &s1, ScalarT2 &s2)
Swaps the contents of two scalars, data is copied.
Definition: scalar_operations.hpp:361

viennacl::linalg::detail::ilut_sparse_vector::ilut_sparse_vector
ilut_sparse_vector(vcl_size_t alloc_size=0)
Definition: ilut.hpp:96

viennacl::MAIN_MEMORY
Definition: forwards.h:348

viennacl::compressed_matrix::reserve
void reserve(vcl_size_t new_nonzeros, bool preserve=true)
Allocate memory for the supplied number of nonzeros in the matrix. Old values are preserved...
Definition: compressed_matrix.hpp:794

viennacl::linalg::ilut_precond< viennacl::compressed_matrix< NumericT, AlignmentV > >::apply
void apply(viennacl::vector< NumericT > &vec) const
Definition: ilut.hpp:426

viennacl::linalg::ilut_tag::set_drop_tolerance
void set_drop_tolerance(double tol)
Definition: ilut.hpp:61

viennacl::traits::context
viennacl::context context(T const &t)
Returns an ID for the currently active memory domain of an object.
Definition: context.hpp:40

viennacl::linalg::detail::SPARSE_ROW_DIAGONAL
Definition: forwards.h:842

viennacl::copy
void copy(std::vector< NumericT > &cpu_vec, circulant_matrix< NumericT, AlignmentV > &gpu_mat)
Copies a circulant matrix from the std::vector to the OpenCL device (either GPU or multi-core CPU) ...
Definition: circulant_matrix.hpp:150

viennacl::linalg::ilut_tag::use_level_scheduling
void use_level_scheduling(bool b)
Definition: ilut.hpp:77

viennacl::linalg::detail::ilut_sparse_vector::elements_
std::vector< NumericT > elements_
Definition: ilut.hpp:110

viennacl::linalg::unit_lower_tag
A tag class representing a lower triangular matrix with unit diagonal.
Definition: forwards.h:859

viennacl::linalg::detail::ilut_sparse_vector
Helper struct for holding a sparse vector in linear memory. For internal use only.
Definition: ilut.hpp:94

viennacl::linalg::host_based::detail::row_info
void row_info(compressed_matrix< NumericT, AlignmentV > const &mat, vector_base< NumericT > &vec, viennacl::linalg::detail::row_info_types info_selector)
Definition: sparse_matrix_operations.hpp:53

viennacl::linalg::detail::level_scheduling_setup_L
void level_scheduling_setup_L(viennacl::compressed_matrix< NumericT, AlignmentV > const &LU, viennacl::vector< NumericT > const &diagonal_LU, std::list< viennacl::backend::mem_handle > &row_index_arrays, std::list< viennacl::backend::mem_handle > &row_buffers, std::list< viennacl::backend::mem_handle > &col_buffers, std::list< viennacl::backend::mem_handle > &element_buffers, std::list< vcl_size_t > &row_elimination_num_list)
Definition: common.hpp:191

viennacl::compressed_matrix< NumericT >

common.hpp
Common routines used within ILU-type preconditioners.

viennacl::vector_base::handle
const handle_type & handle() const
Returns the memory handle.
Definition: vector_def.hpp:128

viennacl::linalg::ilut_tag::ilut_tag
ilut_tag(unsigned int entries_per_row=20, double drop_tolerance=1e-4, bool with_level_scheduling=false)
The constructor.
Definition: ilut.hpp:54

viennacl::backend::mem_handle::get_active_handle_id
memory_types get_active_handle_id() const
Returns an ID for the currently active memory buffer. Other memory buffers might contain old or no data.
Definition: mem_handle.hpp:118

viennacl::linalg::ilut_tag::get_drop_tolerance
double get_drop_tolerance() const
Definition: ilut.hpp:66

viennacl::switch_memory_context
void switch_memory_context(T &obj, viennacl::context new_ctx)
Generic convenience routine for migrating data of an object to a new memory domain.
Definition: memory.hpp:622