doc/host__based_2amg__operations_8hpp_source.html

 #ifndef VIENNACL_LINALG_HOST_BASED_AMG_OPERATIONS_HPP

 #define VIENNACL_LINALG_HOST_BASED_AMG_OPERATIONS_HPP


 /* =========================================================================

    Copyright (c) 2010-2016, Institute for Microelectronics,

                             Institute for Analysis and Scientific Computing,

                             TU Wien.

    Portions of this software are copyright by UChicago Argonne, LLC.


                             -----------------

                   ViennaCL - The Vienna Computing Library

                             -----------------


    Project Head:    Karl Rupp                   rupp@iue.tuwien.ac.at


    (A list of authors and contributors can be found in the PDF manual)


    License:         MIT (X11), see file LICENSE in the base directory

 ============================================================================= */


 #include <cstdlib>

 #include <cmath>

 #include "viennacl/linalg/detail/amg/amg_base.hpp"


 #include <map>

 #include <set>

 #include <functional>

 #ifdef VIENNACL_WITH_OPENMP

 #include <omp.h>

 #endif


 namespace viennacl

 {

 namespace linalg

 {

 namespace host_based

 {

 namespace amg

 {


 template<typename NumericT>

 void amg_influence_trivial(compressed_matrix<NumericT> const & A,

                            viennacl::linalg::detail::amg::amg_level_context & amg_context,

                            viennacl::linalg::amg_tag & tag)

 {

   (void)tag;


   unsigned int const * A_row_buffer = viennacl::linalg::host_based::detail::extract_raw_pointer<unsigned int>(A.handle1());

   unsigned int const * A_col_buffer = viennacl::linalg::host_based::detail::extract_raw_pointer<unsigned int>(A.handle2());


   unsigned int *influences_row_ptr = viennacl::linalg::host_based::detail::extract_raw_pointer<unsigned int>(amg_context.influence_jumper_.handle());

   unsigned int *influences_id_ptr  = viennacl::linalg::host_based::detail::extract_raw_pointer<unsigned int>(amg_context.influence_ids_.handle());

   unsigned int *influences_values_ptr  = viennacl::linalg::host_based::detail::extract_raw_pointer<unsigned int>(amg_context.influence_values_.handle());


 #ifdef VIENNACL_WITH_OPENMP

   #pragma omp parallel for

 #endif

   for (long i2=0; i2<static_cast<long>(A.size1()); ++i2)

   {

     vcl_size_t i = vcl_size_t(i2);

     influences_row_ptr[i] = A_row_buffer[i];

     influences_values_ptr[i] = A_row_buffer[i+1] - A_row_buffer[i];

   }

   influences_row_ptr[A.size1()] = A_row_buffer[A.size1()];


 #ifdef VIENNACL_WITH_OPENMP

   #pragma omp parallel for

 #endif

   for (long i=0; i<long(A.nnz()); ++i)

     influences_id_ptr[i] = A_col_buffer[i];

 }


 template<typename NumericT>

 void amg_influence_advanced(compressed_matrix<NumericT> const & A,

                             viennacl::linalg::detail::amg::amg_level_context & amg_context,

                             viennacl::linalg::amg_tag & tag)

 {

   NumericT     const * A_elements   = viennacl::linalg::host_based::detail::extract_raw_pointer<NumericT>(A.handle());

   unsigned int const * A_row_buffer = viennacl::linalg::host_based::detail::extract_raw_pointer<unsigned int>(A.handle1());

   unsigned int const * A_col_buffer = viennacl::linalg::host_based::detail::extract_raw_pointer<unsigned int>(A.handle2());


   unsigned int *influences_row_ptr = viennacl::linalg::host_based::detail::extract_raw_pointer<unsigned int>(amg_context.influence_jumper_.handle());

   unsigned int *influences_id_ptr  = viennacl::linalg::host_based::detail::extract_raw_pointer<unsigned int>(amg_context.influence_ids_.handle());


   //

   // Step 1: Scan influences in order to allocate the necessary memory

   //

 #ifdef VIENNACL_WITH_OPENMP

   #pragma omp parallel for

 #endif

   for (long i2=0; i2<static_cast<long>(A.size1()); ++i2)

   {

     vcl_size_t i = vcl_size_t(i2);

     unsigned int row_start = A_row_buffer[i];

     unsigned int row_stop  = A_row_buffer[i+1];

     NumericT diag = 0;

     NumericT largest_positive = 0;

     NumericT largest_negative = 0;

     unsigned int num_influences = 0;


     // obtain diagonal element as well as maximum positive and negative off-diagonal entries

     for (unsigned int nnz_index = row_start; nnz_index < row_stop; ++nnz_index)

     {

       unsigned int col = A_col_buffer[nnz_index];

       NumericT value   = A_elements[nnz_index];


       if (col == i)

         diag = value;

       else if (value > largest_positive)

         largest_positive = value;

       else if (value < largest_negative)

         largest_negative = value;

     }


     if (largest_positive <= 0 && largest_negative >= 0) // no offdiagonal entries

     {

       influences_row_ptr[i] = 0;

       continue;

     }


     // Find all points that strongly influence current point (Yang, p.5)

     //std::cout << "Looking for strongly influencing points for point " << i << std::endl;

     for (unsigned int nnz_index = row_start; nnz_index < row_stop; ++nnz_index)

     {

       unsigned int col = A_col_buffer[nnz_index];


       if (i == col)

         continue;


       NumericT value   = A_elements[nnz_index];


       if (   (diag > 0 && diag * value <= tag.get_strong_connection_threshold() * diag * largest_negative)

           || (diag < 0 && diag * value <= tag.get_strong_connection_threshold() * diag * largest_positive))

       {

         ++num_influences;

       }

     }


     influences_row_ptr[i] = num_influences;

   }


   //

   // Step 2: Exclusive scan on number of influences to obtain CSR-like datastructure

   //

   unsigned int current_entry = 0;

   for (std::size_t i=0; i<A.size1(); ++i)

   {

     unsigned int tmp = influences_row_ptr[i];

     influences_row_ptr[i] = current_entry;

     current_entry += tmp;

   }

   influences_row_ptr[A.size1()] = current_entry;


   //

   // Step 3: Write actual influences

   //

 #ifdef VIENNACL_WITH_OPENMP

   #pragma omp parallel for

 #endif

   for (long i2=0; i2<static_cast<long>(A.size1()); ++i2)

   {

     unsigned int i = static_cast<unsigned int>(i2);

     unsigned int row_start = A_row_buffer[i];

     unsigned int row_stop  = A_row_buffer[i+1];

     NumericT diag = 0;

     NumericT largest_positive = 0;

     NumericT largest_negative = 0;


     // obtain diagonal element as well as maximum positive and negative off-diagonal entries

     for (unsigned int nnz_index = row_start; nnz_index < row_stop; ++nnz_index)

     {

       unsigned int col = A_col_buffer[nnz_index];

       NumericT value   = A_elements[nnz_index];


       if (col == i)

         diag = value;

       else if (value > largest_positive)

         largest_positive = value;

       else if (value < largest_negative)

         largest_negative = value;

     }


     if (largest_positive <= 0 && largest_negative >= 0) // no offdiagonal entries

       continue;


     // Find all points that strongly influence current point (Yang, p.5)

     //std::cout << "Looking for strongly influencing points for point " << i << std::endl;

     unsigned int *influences_id_write_ptr = influences_id_ptr + influences_row_ptr[i];

     for (unsigned int nnz_index = row_start; nnz_index < row_stop; ++nnz_index)

     {

       unsigned int col = A_col_buffer[nnz_index];


       if (i == col)

         continue;


       NumericT value   = A_elements[nnz_index];


       if (   (diag > 0 && diag * value <= tag.get_strong_connection_threshold() * diag * largest_negative)

           || (diag < 0 && diag * value <= tag.get_strong_connection_threshold() * diag * largest_positive))

       {

         //std::cout << " - Adding influence from point " << col << std::endl;

         *influences_id_write_ptr = col;

         ++influences_id_write_ptr;

       }

     }

   }


 }


 template<typename NumericT>

 void amg_influence(compressed_matrix<NumericT> const & A,

                    viennacl::linalg::detail::amg::amg_level_context & amg_context,

                    viennacl::linalg::amg_tag & tag)

 {

   // TODO: dispatch based on influence tolerance provided

   amg_influence_trivial(A, amg_context, tag);

 }


 inline void enumerate_coarse_points(viennacl::linalg::detail::amg::amg_level_context & amg_context)

 {

   unsigned int *point_types_ptr  = viennacl::linalg::host_based::detail::extract_raw_pointer<unsigned int>(amg_context.point_types_.handle());

   unsigned int *coarse_id_ptr    = viennacl::linalg::host_based::detail::extract_raw_pointer<unsigned int>(amg_context.coarse_id_.handle());


   unsigned int coarse_id = 0;

   for (vcl_size_t i=0; i<amg_context.coarse_id_.size(); ++i)

   {

     //assert(point_types_ptr[i] != viennacl::linalg::detail::amg::amg_level_context::POINT_TYPE_UNDECIDED && bool("Logic error in enumerate_coarse_points(): Undecided points detected!"));


     if (point_types_ptr[i] == viennacl::linalg::detail::amg::amg_level_context::POINT_TYPE_COARSE)

       coarse_id_ptr[i] = coarse_id++;

   }


   //std::cout << "Coarse nodes after enumerate_coarse_points(): " << coarse_id << std::endl;

   amg_context.num_coarse_ = coarse_id;

 }


 struct amg_id_influence

 {

   amg_id_influence(std::size_t id2, std::size_t influences2) : id(static_cast<unsigned int>(id2)), influences(static_cast<unsigned int>(influences2)) {}


   unsigned int  id;

   unsigned int  influences;

 };


 inline bool operator>(amg_id_influence const & a, amg_id_influence const & b)

 {

   if (a.influences > b.influences)

     return true;

   if (a.influences == b.influences)

     return a.id > b.id;

   return false;

 }


 template<typename NumericT>

 void amg_coarse_classic_onepass(compressed_matrix<NumericT> const & A,

                                 viennacl::linalg::detail::amg::amg_level_context & amg_context,

                                 viennacl::linalg::amg_tag & tag)

 {

   unsigned int *point_types_ptr       = viennacl::linalg::host_based::detail::extract_raw_pointer<unsigned int>(amg_context.point_types_.handle());

   unsigned int *influences_row_ptr    = viennacl::linalg::host_based::detail::extract_raw_pointer<unsigned int>(amg_context.influence_jumper_.handle());

   unsigned int *influences_id_ptr     = viennacl::linalg::host_based::detail::extract_raw_pointer<unsigned int>(amg_context.influence_ids_.handle());

   unsigned int *influences_values_ptr = viennacl::linalg::host_based::detail::extract_raw_pointer<unsigned int>(amg_context.influence_values_.handle());


   std::set<amg_id_influence, std::greater<amg_id_influence> > points_by_influences;


   amg_influence_advanced(A, amg_context, tag);


   for (std::size_t i=0; i<A.size1(); ++i)

     points_by_influences.insert(amg_id_influence(i, influences_values_ptr[i]));


   //std::cout << "Starting coarsening process..." << std::endl;


   while (!points_by_influences.empty())

   {

     amg_id_influence point = *(points_by_influences.begin());


     // remove point from queue:

     points_by_influences.erase(points_by_influences.begin());


     //std::cout << "Working on point " << point.id << std::endl;


     // point is already coarse or fine point, continue;

     if (point_types_ptr[point.id] != viennacl::linalg::detail::amg::amg_level_context::POINT_TYPE_UNDECIDED)

       continue;


     //std::cout << " Setting point " << point.id << " to a coarse point." << std::endl;

     // make this a coarse point:

     point_types_ptr[point.id] = viennacl::linalg::detail::amg::amg_level_context::POINT_TYPE_COARSE;


     // Set strongly influenced points to fine points:

     unsigned int j_stop = influences_row_ptr[point.id + 1];

     for (unsigned int j = influences_row_ptr[point.id]; j < j_stop; ++j)

     {

       unsigned int influenced_point_id = influences_id_ptr[j];


       //std::cout << "Checking point " << influenced_point_id << std::endl;

       if (point_types_ptr[influenced_point_id] != viennacl::linalg::detail::amg::amg_level_context::POINT_TYPE_UNDECIDED)

         continue;


       //std::cout << " Setting point " << influenced_point_id << " to a fine point." << std::endl;

       point_types_ptr[influenced_point_id] = viennacl::linalg::detail::amg::amg_level_context::POINT_TYPE_FINE;


       // add one to influence measure for all undecided points strongly influencing this fine point.

       unsigned int k_stop = influences_row_ptr[influenced_point_id + 1];

       for (unsigned int k = influences_row_ptr[influenced_point_id]; k < k_stop; ++k)

       {

         unsigned int influenced_influenced_point_id = influences_id_ptr[k];

         if (point_types_ptr[influenced_influenced_point_id] == viennacl::linalg::detail::amg::amg_level_context::POINT_TYPE_UNDECIDED)

         {

           // grab and remove from set, increase influence counter, store back:

           amg_id_influence point_to_find(influenced_influenced_point_id, influences_values_ptr[influenced_influenced_point_id]);

           points_by_influences.erase(point_to_find);


           point_to_find.influences += 1;

           influences_values_ptr[influenced_influenced_point_id] += 1; // for consistency


           points_by_influences.insert(point_to_find);

         }

       } //for

     } // for


   } // while


   viennacl::linalg::host_based::amg::enumerate_coarse_points(amg_context);

 }


 template<typename NumericT>

 void amg_coarse_ag_stage1_sequential(compressed_matrix<NumericT> const & A,

                                      viennacl::linalg::detail::amg::amg_level_context & amg_context,

                                      viennacl::linalg::amg_tag & tag)

 {

   (void)tag;

   unsigned int *point_types_ptr       = viennacl::linalg::host_based::detail::extract_raw_pointer<unsigned int>(amg_context.point_types_.handle());

   unsigned int *influences_row_ptr    = viennacl::linalg::host_based::detail::extract_raw_pointer<unsigned int>(amg_context.influence_jumper_.handle());

   unsigned int *influences_id_ptr     = viennacl::linalg::host_based::detail::extract_raw_pointer<unsigned int>(amg_context.influence_ids_.handle());


   for (unsigned int i=0; i<static_cast<unsigned int>(A.size1()); ++i)

   {

     // check if node has no aggregates next to it (MIS-2)

     bool is_new_coarse_node = true;


     // Set strongly influenced points to fine points:

     unsigned int j_stop = influences_row_ptr[i + 1];

     for (unsigned int j = influences_row_ptr[i]; j < j_stop; ++j)

     {

       unsigned int influenced_point_id = influences_id_ptr[j];

       if (point_types_ptr[influenced_point_id] != viennacl::linalg::detail::amg::amg_level_context::POINT_TYPE_UNDECIDED) // either coarse or fine point

       {

         is_new_coarse_node = false;

         break;

       }

     }


     if (is_new_coarse_node)

     {

       // make all strongly influenced neighbors fine points:

       for (unsigned int j = influences_row_ptr[i]; j < j_stop; ++j)

       {

         unsigned int influenced_point_id = influences_id_ptr[j];

         point_types_ptr[influenced_point_id] = viennacl::linalg::detail::amg::amg_level_context::POINT_TYPE_FINE;

       }


       //std::cout << "Setting new coarse node: " << i << std::endl;

       // Note: influences may include diagonal element, so it's important to *first* set fine points above before setting the coarse information here

       point_types_ptr[i] = viennacl::linalg::detail::amg::amg_level_context::POINT_TYPE_COARSE;

     }

   }

 }


 template<typename NumericT>

 void amg_coarse_ag_stage1_mis2(compressed_matrix<NumericT> const & A,

                                viennacl::linalg::detail::amg::amg_level_context & amg_context,

                                viennacl::linalg::amg_tag & tag)

 {

   (void)tag;

   unsigned int  *point_types_ptr       = viennacl::linalg::host_based::detail::extract_raw_pointer<unsigned int>(amg_context.point_types_.handle());

   unsigned int *influences_row_ptr    = viennacl::linalg::host_based::detail::extract_raw_pointer<unsigned int>(amg_context.influence_jumper_.handle());

   unsigned int *influences_id_ptr     = viennacl::linalg::host_based::detail::extract_raw_pointer<unsigned int>(amg_context.influence_ids_.handle());


   std::vector<unsigned int> random_weights(A.size1());

   for (std::size_t i=0; i<random_weights.size(); ++i)

     random_weights[i] = static_cast<unsigned int>(rand()) % static_cast<unsigned int>(A.size1());


   std::size_t num_threads = 1;

 #ifdef VIENNACL_WITH_OPENMP

   num_threads = omp_get_max_threads();

 #endif


   viennacl::vector<unsigned int> work_state(A.size1(), viennacl::traits::context(A));

   viennacl::vector<unsigned int> work_random(A.size1(), viennacl::traits::context(A));

   viennacl::vector<unsigned int> work_index(A.size1(), viennacl::traits::context(A));


   unsigned int *work_state_ptr     = viennacl::linalg::host_based::detail::extract_raw_pointer<unsigned int>(work_state.handle());

   unsigned int *work_random_ptr    = viennacl::linalg::host_based::detail::extract_raw_pointer<unsigned int>(work_random.handle());

   unsigned int *work_index_ptr     = viennacl::linalg::host_based::detail::extract_raw_pointer<unsigned int>(work_index.handle());


   viennacl::vector<unsigned int> work_state2(A.size1(), viennacl::traits::context(A));

   viennacl::vector<unsigned int> work_random2(A.size1(), viennacl::traits::context(A));

   viennacl::vector<unsigned int> work_index2(A.size1(), viennacl::traits::context(A));


   unsigned int *work_state2_ptr     = viennacl::linalg::host_based::detail::extract_raw_pointer<unsigned int>(work_state2.handle());

   unsigned int *work_random2_ptr    = viennacl::linalg::host_based::detail::extract_raw_pointer<unsigned int>(work_random2.handle());

   unsigned int *work_index2_ptr     = viennacl::linalg::host_based::detail::extract_raw_pointer<unsigned int>(work_index2.handle());


   unsigned int num_undecided = static_cast<unsigned int>(A.size1());

   unsigned int pmis_iters = 0;

   while (num_undecided > 0)

   {

     ++pmis_iters;


     //

     // init temporary work data:

     //

 #ifdef VIENNACL_WITH_OPENMP

   #pragma omp parallel for

 #endif

     for (long i2=0; i2<static_cast<long>(A.size1()); ++i2)

     {

       unsigned int i = static_cast<unsigned int>(i2);

       switch (point_types_ptr[i])

       {

       case viennacl::linalg::detail::amg::amg_level_context::POINT_TYPE_UNDECIDED: work_state_ptr[i] = 1; break;

       case viennacl::linalg::detail::amg::amg_level_context::POINT_TYPE_FINE:      work_state_ptr[i] = 0; break;

       case viennacl::linalg::detail::amg::amg_level_context::POINT_TYPE_COARSE:    work_state_ptr[i] = 2; break;

       default:

         throw std::runtime_error("Unexpected state encountered in MIS2 setup for AMG.");

       }


       work_random_ptr[i] = random_weights[i];

       work_index_ptr[i]  = i;

     }


     //

     // Propagate maximum tuple twice

     //

     for (unsigned int r = 0; r < 2; ++r)

     {

       // max operation

 #ifdef VIENNACL_WITH_OPENMP

       #pragma omp parallel for

 #endif

       for (long i2=0; i2<static_cast<long>(A.size1()); ++i2)

       {

         unsigned int i = static_cast<unsigned int>(i2);

         // load

         unsigned int state  = work_state_ptr[i];

         unsigned int random = work_random_ptr[i];

         unsigned int index  = work_index_ptr[i];


         // max

         unsigned int j_stop = influences_row_ptr[i + 1];

         for (unsigned int j = influences_row_ptr[i]; j < j_stop; ++j)

         {

           unsigned int influenced_point_id = influences_id_ptr[j];


           // lexigraphical triple-max (not particularly pretty, but does the job):

           if (state < work_state_ptr[influenced_point_id])

           {

             state  = work_state_ptr[influenced_point_id];

             random = work_random_ptr[influenced_point_id];

             index  = work_index_ptr[influenced_point_id];

           }

           else if (state == work_state_ptr[influenced_point_id])

           {

             if (random < work_random_ptr[influenced_point_id])

             {

               state  = work_state_ptr[influenced_point_id];

               random = work_random_ptr[influenced_point_id];

               index  = work_index_ptr[influenced_point_id];

             }

             else if (random == work_random_ptr[influenced_point_id])

             {

               if (index < work_index_ptr[influenced_point_id])

               {

                 state  = work_state_ptr[influenced_point_id];

                 random = work_random_ptr[influenced_point_id];

                 index  = work_index_ptr[influenced_point_id];

               }

             } // max(random)

           } // max(state)

         } // for


         // store

         work_state2_ptr[i]  = state;

         work_random2_ptr[i] = random;

         work_index2_ptr[i]  = index;

       }


       // copy work array

 #ifdef VIENNACL_WITH_OPENMP

       #pragma omp parallel for

 #endif

       for (long i2=0; i2<static_cast<long>(A.size1()); ++i2)

       {

         unsigned int i = static_cast<unsigned int>(i2);

         work_state_ptr[i]  = work_state2_ptr[i];

         work_random_ptr[i] = work_random2_ptr[i];

         work_index_ptr[i]  = work_index2_ptr[i];

       }

     }


     //

     // mark MIS and non-MIS nodes:

     //

     std::vector<unsigned int> thread_buffer(num_threads);


 #ifdef VIENNACL_WITH_OPENMP

     #pragma omp parallel for

 #endif

     for (long i2=0; i2<static_cast<long>(A.size1()); ++i2)

     {

       unsigned int i = static_cast<unsigned int>(i2);

       unsigned int max_state  = work_state_ptr[i];

       unsigned int max_index  = work_index_ptr[i];


       if (point_types_ptr[i] == viennacl::linalg::detail::amg::amg_level_context::POINT_TYPE_UNDECIDED)

       {

         if (i == max_index) // make this a MIS node

           point_types_ptr[i] = viennacl::linalg::detail::amg::amg_level_context::POINT_TYPE_COARSE;

         else if (max_state == 2) // mind the mapping of viennacl::linalg::detail::amg::amg_level_context::POINT_TYPE_COARSE above!

           point_types_ptr[i] = viennacl::linalg::detail::amg::amg_level_context::POINT_TYPE_FINE;

         else

 #ifdef VIENNACL_WITH_OPENMP

           thread_buffer[omp_get_thread_num()] += 1;

 #else

           thread_buffer[0] += 1;

 #endif

       }

     }


     num_undecided = 0;

     for (std::size_t i=0; i<thread_buffer.size(); ++i)

       num_undecided += thread_buffer[i];

   } // while


   // consistency with sequential MIS: reset state for non-coarse points, so that coarse indices are correctly picked up later

 #ifdef VIENNACL_WITH_OPENMP

   #pragma omp parallel for

 #endif

   for (long i=0; i<static_cast<long>(A.size1()); ++i)

     if (point_types_ptr[i] != viennacl::linalg::detail::amg::amg_level_context::POINT_TYPE_COARSE)

       point_types_ptr[i] = viennacl::linalg::detail::amg::amg_level_context::POINT_TYPE_UNDECIDED;


 }


 template<typename NumericT>

 void amg_coarse_ag(compressed_matrix<NumericT> const & A,

                    viennacl::linalg::detail::amg::amg_level_context & amg_context,

                    viennacl::linalg::amg_tag & tag)

 {

   unsigned int *point_types_ptr       = viennacl::linalg::host_based::detail::extract_raw_pointer<unsigned int>(amg_context.point_types_.handle());

   unsigned int *influences_row_ptr    = viennacl::linalg::host_based::detail::extract_raw_pointer<unsigned int>(amg_context.influence_jumper_.handle());

   unsigned int *influences_id_ptr     = viennacl::linalg::host_based::detail::extract_raw_pointer<unsigned int>(amg_context.influence_ids_.handle());

   unsigned int *coarse_id_ptr         = viennacl::linalg::host_based::detail::extract_raw_pointer<unsigned int>(amg_context.coarse_id_.handle());


   amg_influence_trivial(A, amg_context, tag);


   //

   // Stage 1: Build aggregates:

   //

   if (tag.get_coarsening_method() == viennacl::linalg::AMG_COARSENING_METHOD_AGGREGATION)      amg_coarse_ag_stage1_sequential(A, amg_context, tag);

   if (tag.get_coarsening_method() == viennacl::linalg::AMG_COARSENING_METHOD_MIS2_AGGREGATION) amg_coarse_ag_stage1_mis2(A, amg_context, tag);


   viennacl::linalg::host_based::amg::enumerate_coarse_points(amg_context);


   //

   // Stage 2: Propagate coarse aggregate indices to neighbors:

   //

 #ifdef VIENNACL_WITH_OPENMP

   #pragma omp parallel for

 #endif

   for (long i2=0; i2<static_cast<long>(A.size1()); ++i2)

   {

     unsigned int i = static_cast<unsigned int>(i2);

     if (point_types_ptr[i] == viennacl::linalg::detail::amg::amg_level_context::POINT_TYPE_COARSE)

     {

       unsigned int coarse_index = coarse_id_ptr[i];


       unsigned int j_stop = influences_row_ptr[i + 1];

       for (unsigned int j = influences_row_ptr[i]; j < j_stop; ++j)

       {

         unsigned int influenced_point_id = influences_id_ptr[j];

         coarse_id_ptr[influenced_point_id] = coarse_index; // Set aggregate index for fine point


         if (influenced_point_id != i) // Note: Any write races between threads are harmless here

           point_types_ptr[influenced_point_id] = viennacl::linalg::detail::amg::amg_level_context::POINT_TYPE_FINE;

       }

     }

   }


   //

   // Stage 3: Merge remaining undecided points (merging to first aggregate found when cycling over the hierarchy

   //

 #ifdef VIENNACL_WITH_OPENMP

   #pragma omp parallel for

 #endif

   for (long i2=0; i2<static_cast<long>(A.size1()); ++i2)

   {

     unsigned int i = static_cast<unsigned int>(i2);

     if (point_types_ptr[i] == viennacl::linalg::detail::amg::amg_level_context::POINT_TYPE_UNDECIDED)

     {

       unsigned int j_stop = influences_row_ptr[i + 1];

       for (unsigned int j = influences_row_ptr[i]; j < j_stop; ++j)

       {

         unsigned int influenced_point_id = influences_id_ptr[j];

         if (point_types_ptr[influenced_point_id] != viennacl::linalg::detail::amg::amg_level_context::POINT_TYPE_UNDECIDED) // either coarse or fine point

         {

           //std::cout << "Setting fine node " << i << " to be aggregated with node " << *influence_iter << "/" << pointvector.get_coarse_index(*influence_iter) << std::endl;

           coarse_id_ptr[i] = coarse_id_ptr[influenced_point_id];

           break;

         }

       }

     }

   }


   //

   // Stage 4: Set undecided points to fine points (coarse ID already set in Stage 3)

   //          Note: Stage 3 and Stage 4 were initially fused, but are now split in order to avoid race conditions (or a fallback to sequential execution).

   //

 #ifdef VIENNACL_WITH_OPENMP

   #pragma omp parallel for

 #endif

   for (long i=0; i<static_cast<long>(A.size1()); ++i)

     if (point_types_ptr[i] == viennacl::linalg::detail::amg::amg_level_context::POINT_TYPE_UNDECIDED)

       point_types_ptr[i] = viennacl::linalg::detail::amg::amg_level_context::POINT_TYPE_FINE;


 }


 template<typename MatrixT>

 void amg_coarse(MatrixT & A,

                 viennacl::linalg::detail::amg::amg_level_context & amg_context,

                 viennacl::linalg::amg_tag & tag)

 {

   switch (tag.get_coarsening_method())

   {

   case viennacl::linalg::AMG_COARSENING_METHOD_ONEPASS: amg_coarse_classic_onepass(A, amg_context, tag); break;

   case viennacl::linalg::AMG_COARSENING_METHOD_AGGREGATION:

   case viennacl::linalg::AMG_COARSENING_METHOD_MIS2_AGGREGATION: amg_coarse_ag(A, amg_context, tag); break;

   //default: throw std::runtime_error("not implemented yet");

   }

 }


 template<typename NumericT>

 void amg_interpol_direct(compressed_matrix<NumericT> const & A,

                          compressed_matrix<NumericT> & P,

                          viennacl::linalg::detail::amg::amg_level_context & amg_context,

                          viennacl::linalg::amg_tag & tag)

 {

   NumericT     const * A_elements   = viennacl::linalg::host_based::detail::extract_raw_pointer<NumericT>(A.handle());

   unsigned int const * A_row_buffer = viennacl::linalg::host_based::detail::extract_raw_pointer<unsigned int>(A.handle1());

   unsigned int const * A_col_buffer = viennacl::linalg::host_based::detail::extract_raw_pointer<unsigned int>(A.handle2());


   unsigned int *point_types_ptr       = viennacl::linalg::host_based::detail::extract_raw_pointer<unsigned int>(amg_context.point_types_.handle());

   unsigned int *influences_row_ptr    = viennacl::linalg::host_based::detail::extract_raw_pointer<unsigned int>(amg_context.influence_jumper_.handle());

   unsigned int *influences_id_ptr     = viennacl::linalg::host_based::detail::extract_raw_pointer<unsigned int>(amg_context.influence_ids_.handle());

   unsigned int *coarse_id_ptr         = viennacl::linalg::host_based::detail::extract_raw_pointer<unsigned int>(amg_context.coarse_id_.handle());


   P.resize(A.size1(), amg_context.num_coarse_, false);


   std::vector<std::map<unsigned int, NumericT> > P_setup(A.size1());


   // Iterate over all points to build the interpolation matrix row-by-row

   // Interpolation for coarse points is immediate using '1'.

   // Interpolation for fine points is set up via corresponding row weights (cf. Yang paper, p. 14)

 #ifdef VIENNACL_WITH_OPENMP

   #pragma omp parallel for

 #endif

   for (long row2=0; row2<static_cast<long>(A.size1()); ++row2)

   {

     unsigned int row = static_cast<unsigned int>(row2);

     std::map<unsigned int, NumericT> & P_setup_row = P_setup[row];

     //std::cout << "Row " << row << ": " << std::endl;

     if (point_types_ptr[row] == viennacl::linalg::detail::amg::amg_level_context::POINT_TYPE_COARSE)

     {

       //std::cout << "  Setting value 1.0 at " << coarse_id_ptr[row] << std::endl;

       P_setup_row[coarse_id_ptr[row]] = NumericT(1);

     }

     else if (point_types_ptr[row] == viennacl::linalg::detail::amg::amg_level_context::POINT_TYPE_FINE)

     {

       //std::cout << "Building interpolant for fine point " << row << std::endl;


       NumericT row_sum = 0;

       NumericT row_coarse_sum = 0;

       NumericT diag = 0;


       // Row sum of coefficients (without diagonal) and sum of influencing coarse point coefficients has to be computed

       unsigned int row_A_start = A_row_buffer[row];

       unsigned int row_A_end   = A_row_buffer[row + 1];

       unsigned int const *influence_iter = influences_id_ptr + influences_row_ptr[row];

       unsigned int const *influence_end  = influences_id_ptr + influences_row_ptr[row + 1];

       for (unsigned int index = row_A_start; index < row_A_end; ++index)

       {

         unsigned int col = A_col_buffer[index];

         NumericT value = A_elements[index];


         if (col == row)

         {

           diag = value;

           continue;

         }

         else if (point_types_ptr[col] == viennacl::linalg::detail::amg::amg_level_context::POINT_TYPE_COARSE)

         {

           // Note: One increment is sufficient, because influence_iter traverses an ordered subset of the column indices in this row

           while (influence_iter != influence_end && *influence_iter < col)

             ++influence_iter;


           if (influence_iter != influence_end && *influence_iter == col)

             row_coarse_sum += value;

         }


         row_sum += value;

       }


       NumericT temp_res = -row_sum/(row_coarse_sum*diag);

       //std::cout << "row_sum: " << row_sum << ", row_coarse_sum: " << row_coarse_sum << ", diag: " << diag << std::endl;


       if (std::fabs(temp_res) > 1e-2 * std::fabs(diag))

       {

         // Iterate over all strongly influencing points to build the interpolant

         influence_iter = influences_id_ptr + influences_row_ptr[row];

         for (unsigned int index = row_A_start; index < row_A_end; ++index)

         {

           unsigned int col = A_col_buffer[index];

           if (point_types_ptr[col] != viennacl::linalg::detail::amg::amg_level_context::POINT_TYPE_COARSE)

             continue;

           NumericT value = A_elements[index];


           // Advance to correct influence metric:

           while (influence_iter != influence_end && *influence_iter < col)

             ++influence_iter;


           if (influence_iter != influence_end && *influence_iter == col)

           {

             //std::cout << " Setting entry "  << temp_res * value << " at " << coarse_id_ptr[col] << " for point " << col << std::endl;

             P_setup_row[coarse_id_ptr[col]] = temp_res * value;

           }

         }

       }


       // TODO truncate interpolation if specified by the user.

       (void)tag;

     }

     else

       throw std::runtime_error("Logic error in direct interpolation: Point is neither coarse-point nor fine-point!");

   }


   // TODO: P_setup can be avoided without sacrificing parallelism.

   viennacl::tools::sparse_matrix_adapter<NumericT> P_adapter(P_setup, P.size1(), P.size2());

   viennacl::copy(P_adapter, P);

 }


 template<typename NumericT>

 void amg_interpol_ag(compressed_matrix<NumericT> const & A,

                      compressed_matrix<NumericT> & P,

                      viennacl::linalg::detail::amg::amg_level_context & amg_context,

                      viennacl::linalg::amg_tag & tag)

 {

   (void)tag;

   P = compressed_matrix<NumericT>(A.size1(), amg_context.num_coarse_, A.size1(), viennacl::traits::context(A));


   NumericT     * P_elements   = viennacl::linalg::host_based::detail::extract_raw_pointer<NumericT>(P.handle());

   unsigned int * P_row_buffer = viennacl::linalg::host_based::detail::extract_raw_pointer<unsigned int>(P.handle1());

   unsigned int * P_col_buffer = viennacl::linalg::host_based::detail::extract_raw_pointer<unsigned int>(P.handle2());


   unsigned int *coarse_id_ptr = viennacl::linalg::host_based::detail::extract_raw_pointer<unsigned int>(amg_context.coarse_id_.handle());


   // Build interpolation matrix:

 #ifdef VIENNACL_WITH_OPENMP

   #pragma omp parallel for

 #endif

   for (long row2 = 0; row2 < long(A.size1()); ++row2)

   {

     unsigned int row = static_cast<unsigned int>(row2);

     P_elements[row]   = NumericT(1);

     P_row_buffer[row] = row;

     P_col_buffer[row] = coarse_id_ptr[row];

   }

   P_row_buffer[A.size1()] = static_cast<unsigned int>(A.size1()); // don't forget finalizer


   P.generate_row_block_information();

 }


 template<typename NumericT>

 void amg_interpol_sa(compressed_matrix<NumericT> const & A,

                      compressed_matrix<NumericT> & P,

                      viennacl::linalg::detail::amg::amg_level_context & amg_context,

                      viennacl::linalg::amg_tag & tag)

 {

   (void)tag;

   viennacl::compressed_matrix<NumericT> P_tentative(A.size1(), amg_context.num_coarse_, A.size1(), viennacl::traits::context(A));


   // form tentative operator:

   amg_interpol_ag(A, P_tentative, amg_context, tag);


   unsigned int const * A_row_buffer = viennacl::linalg::host_based::detail::extract_raw_pointer<unsigned int>(A.handle1());

   unsigned int const * A_col_buffer = viennacl::linalg::host_based::detail::extract_raw_pointer<unsigned int>(A.handle2());

   NumericT     const * A_elements   = viennacl::linalg::host_based::detail::extract_raw_pointer<NumericT>(A.handle());


   viennacl::compressed_matrix<NumericT> Jacobi(A.size1(), A.size1(), A.nnz(), viennacl::traits::context(A));

   unsigned int * Jacobi_row_buffer = viennacl::linalg::host_based::detail::extract_raw_pointer<unsigned int>(Jacobi.handle1());

   unsigned int * Jacobi_col_buffer = viennacl::linalg::host_based::detail::extract_raw_pointer<unsigned int>(Jacobi.handle2());

   NumericT     * Jacobi_elements   = viennacl::linalg::host_based::detail::extract_raw_pointer<NumericT>(Jacobi.handle());


   // Build Jacobi matrix:

 #ifdef VIENNACL_WITH_OPENMP

   #pragma omp parallel for

 #endif

   for (long row2=0; row2<static_cast<long>(A.size1()); ++row2)

   {

     unsigned int row = static_cast<unsigned int>(row2);

     unsigned int row_begin = A_row_buffer[row];

     unsigned int row_end   = A_row_buffer[row+1];


     Jacobi_row_buffer[row] = row_begin;


     // Step 1: Extract diagonal:

     NumericT diag = 0;

     for (unsigned int j = row_begin; j < row_end; ++j)

     {

       if (A_col_buffer[j] == row)

       {

         diag = A_elements[j];

         break;

       }

     }


     // Step 2: Write entries:

     for (unsigned int j = row_begin; j < row_end; ++j)

     {

       unsigned int col_index = A_col_buffer[j];

       Jacobi_col_buffer[j] = col_index;


       if (col_index == row)

         Jacobi_elements[j] = NumericT(1) - NumericT(tag.get_jacobi_weight());

       else

         Jacobi_elements[j] = - NumericT(tag.get_jacobi_weight()) * A_elements[j] / diag;

     }

   }

   Jacobi_row_buffer[A.size1()] = static_cast<unsigned int>(Jacobi.nnz()); // don't forget finalizer


   P = viennacl::linalg::prod(Jacobi, P_tentative);


   P.generate_row_block_information();

 }


 template<typename MatrixT>

 void amg_interpol(MatrixT const & A,

                   MatrixT & P,

                   viennacl::linalg::detail::amg::amg_level_context & amg_context,

                   viennacl::linalg::amg_tag & tag)

 {

   switch (tag.get_interpolation_method())

   {

   case viennacl::linalg::AMG_INTERPOLATION_METHOD_DIRECT:               amg_interpol_direct (A, P, amg_context, tag); break;

   case viennacl::linalg::AMG_INTERPOLATION_METHOD_AGGREGATION:          amg_interpol_ag     (A, P, amg_context, tag); break;

   case viennacl::linalg::AMG_INTERPOLATION_METHOD_SMOOTHED_AGGREGATION: amg_interpol_sa     (A, P, amg_context, tag); break;

   default: throw std::runtime_error("Not implemented yet!");

   }

 }


 template<typename NumericT>

 void amg_transpose(compressed_matrix<NumericT> const & A,

                    compressed_matrix<NumericT> & B)

 {

   NumericT     const * A_elements   = viennacl::linalg::host_based::detail::extract_raw_pointer<NumericT>(A.handle());

   unsigned int const * A_row_buffer = viennacl::linalg::host_based::detail::extract_raw_pointer<unsigned int>(A.handle1());

   unsigned int const * A_col_buffer = viennacl::linalg::host_based::detail::extract_raw_pointer<unsigned int>(A.handle2());


   // initialize datastructures for B:

   B = compressed_matrix<NumericT>(A.size2(), A.size1(), A.nnz(), viennacl::traits::context(A));


   NumericT     * B_elements   = viennacl::linalg::host_based::detail::extract_raw_pointer<NumericT>(B.handle());

   unsigned int * B_row_buffer = viennacl::linalg::host_based::detail::extract_raw_pointer<unsigned int>(B.handle1());

   unsigned int * B_col_buffer = viennacl::linalg::host_based::detail::extract_raw_pointer<unsigned int>(B.handle2());


   // prepare uninitialized B_row_buffer:

   for (std::size_t i = 0; i < B.size1(); ++i)

     B_row_buffer[i] = 0;


   //

   // Stage 1: Compute pattern for B

   //

   for (std::size_t row = 0; row < A.size1(); ++row)

   {

     unsigned int row_start = A_row_buffer[row];

     unsigned int row_stop  = A_row_buffer[row+1];


     for (unsigned int nnz_index = row_start; nnz_index < row_stop; ++nnz_index)

       B_row_buffer[A_col_buffer[nnz_index]] += 1;

   }


   // Bring row-start array in place using inclusive-scan:

   unsigned int offset = B_row_buffer[0];

   B_row_buffer[0] = 0;

   for (std::size_t row = 1; row < B.size1(); ++row)

   {

     unsigned int tmp = B_row_buffer[row];

     B_row_buffer[row] = offset;

     offset += tmp;

   }

   B_row_buffer[B.size1()] = offset;


   //

   // Stage 2: Fill with data

   //


   std::vector<unsigned int> B_row_offsets(B.size1()); //number of elements already written per row


   for (std::size_t row = 0; row < A.size1(); ++row)

   {

     //std::cout << "Row " << row << ": ";

     unsigned int row_start = A_row_buffer[row];

     unsigned int row_stop  = A_row_buffer[row+1];


     for (unsigned int nnz_index = row_start; nnz_index < row_stop; ++nnz_index)

     {

       unsigned int col_in_A = A_col_buffer[nnz_index];

       unsigned int B_nnz_index = B_row_buffer[col_in_A] + B_row_offsets[col_in_A];

       B_col_buffer[B_nnz_index] = static_cast<unsigned int>(row);

       B_elements[B_nnz_index] = A_elements[nnz_index];

       ++B_row_offsets[col_in_A];

       //B_temp.at(A_col_buffer[nnz_index])[row] = A_elements[nnz_index];

     }

   }


   // Step 3: Make datastructure consistent (row blocks!)

   B.generate_row_block_information();

 }


 template<typename NumericT, unsigned int AlignmentV>

 void assign_to_dense(viennacl::compressed_matrix<NumericT, AlignmentV> const & A,

                      viennacl::matrix_base<NumericT> & B)

 {

   NumericT     const * A_elements   = detail::extract_raw_pointer<NumericT>(A.handle());

   unsigned int const * A_row_buffer = detail::extract_raw_pointer<unsigned int>(A.handle1());

   unsigned int const * A_col_buffer = detail::extract_raw_pointer<unsigned int>(A.handle2());


   NumericT           * B_elements   = detail::extract_raw_pointer<NumericT>(B.handle());


 #ifdef VIENNACL_WITH_OPENMP

   #pragma omp parallel for

 #endif

   for (long row = 0; row < static_cast<long>(A.size1()); ++row)

   {

     unsigned int row_stop  = A_row_buffer[row+1];


     for (unsigned int nnz_index = A_row_buffer[row]; nnz_index < row_stop; ++nnz_index)

       B_elements[static_cast<unsigned int>(row) * static_cast<unsigned int>(B.internal_size2()) + A_col_buffer[nnz_index]] = A_elements[nnz_index];

   }


 }


 template<typename NumericT>

 void smooth_jacobi(unsigned int iterations,

                    compressed_matrix<NumericT> const & A,

                    vector<NumericT> & x,

                    vector<NumericT> & x_backup,

                    vector<NumericT> const & rhs_smooth,

                    NumericT weight)

 {


   NumericT     const * A_elements   = viennacl::linalg::host_based::detail::extract_raw_pointer<NumericT>(A.handle());

   unsigned int const * A_row_buffer = viennacl::linalg::host_based::detail::extract_raw_pointer<unsigned int>(A.handle1());

   unsigned int const * A_col_buffer = viennacl::linalg::host_based::detail::extract_raw_pointer<unsigned int>(A.handle2());

   NumericT     const * rhs_elements = viennacl::linalg::host_based::detail::extract_raw_pointer<NumericT>(rhs_smooth.handle());


   NumericT           * x_elements     = viennacl::linalg::host_based::detail::extract_raw_pointer<NumericT>(x.handle());

   NumericT     const * x_old_elements = viennacl::linalg::host_based::detail::extract_raw_pointer<NumericT>(x_backup.handle());


   for (unsigned int i=0; i<iterations; ++i)

   {

     x_backup = x;


     #ifdef VIENNACL_WITH_OPENMP

     #pragma omp parallel for

     #endif

     for (long row2 = 0; row2 < static_cast<long>(A.size1()); ++row2)

     {

       unsigned int row = static_cast<unsigned int>(row2);

       unsigned int col_end   = A_row_buffer[row+1];


       NumericT sum  = NumericT(0);

       NumericT diag = NumericT(1);

       for (unsigned int index = A_row_buffer[row]; index != col_end; ++index)

       {

         unsigned int col = A_col_buffer[index];

         if (col == row)

           diag = A_elements[index];

         else

           sum += A_elements[index] * x_old_elements[col];

       }


       x_elements[row] = weight * (rhs_elements[row] - sum) / diag + (NumericT(1) - weight) * x_old_elements[row];

     }

   }

 }


 } //namespace amg

 } //namespace host_based

 } //namespace linalg

 } //namespace viennacl


 #endif

viennacl::compressed_matrix::size2
const vcl_size_t & size2() const
Returns the number of columns.
Definition: compressed_matrix.hpp:929

viennacl::linalg::host_based::amg::amg_id_influence
Helper struct for sequential classical one-pass coarsening.
Definition: amg_operations.hpp:260

viennacl::linalg::amg_tag::get_coarsening_method
amg_coarsening_method get_coarsening_method() const
Returns the current coarsening strategy.
Definition: amg_base.hpp:88

viennacl::linalg::sum
viennacl::scalar_expression< const viennacl::vector_base< NumericT >, const viennacl::vector_base< NumericT >, viennacl::op_sum > sum(viennacl::vector_base< NumericT > const &x)
User interface function for computing the sum of all elements of a vector.
Definition: sum.hpp:45

viennacl::linalg::detail::amg::amg_level_context
Definition: amg_base.hpp:167

viennacl::compressed_matrix::size1
const vcl_size_t & size1() const
Returns the number of rows.
Definition: compressed_matrix.hpp:927

viennacl::linalg::row_sum
viennacl::vector_expression< const viennacl::matrix_base< NumericT >, const viennacl::matrix_base< NumericT >, viennacl::op_row_sum > row_sum(viennacl::matrix_base< NumericT > const &A)
User interface function for computing the sum of all elements of each row of a matrix.
Definition: sum.hpp:77

viennacl::linalg::host_based::amg::amg_coarse_ag
void amg_coarse_ag(compressed_matrix< NumericT > const &A, viennacl::linalg::detail::amg::amg_level_context &amg_context, viennacl::linalg::amg_tag &tag)
AG (aggregation based) coarsening. Partially single-threaded version (VIENNACL_AMG_COARSE_AG) ...
Definition: amg_operations.hpp:604

viennacl::linalg::amg_tag::get_jacobi_weight
double get_jacobi_weight() const
Returns the Jacobi smoother weight (damping).
Definition: amg_base.hpp:113

viennacl::matrix_base< NumericT >

viennacl::linalg::host_based::amg::amg_interpol_ag
void amg_interpol_ag(compressed_matrix< NumericT > const &A, compressed_matrix< NumericT > &P, viennacl::linalg::detail::amg::amg_level_context &amg_context, viennacl::linalg::amg_tag &tag)
AG (aggregation based) interpolation. Multi-Threaded! (VIENNACL_INTERPOL_AG)
Definition: amg_operations.hpp:841

viennacl::linalg::AMG_INTERPOLATION_METHOD_AGGREGATION
Definition: amg_base.hpp:57

viennacl::linalg::host_based::amg::amg_influence_advanced
void amg_influence_advanced(compressed_matrix< NumericT > const &A, viennacl::linalg::detail::amg::amg_level_context &amg_context, viennacl::linalg::amg_tag &tag)
Routine for extracting strongly connected points considering a user-provided threshold value...
Definition: amg_operations.hpp:84

viennacl::linalg::AMG_INTERPOLATION_METHOD_DIRECT
Definition: amg_base.hpp:56

viennacl::linalg::host_based::amg::amg_coarse_classic_onepass
void amg_coarse_classic_onepass(compressed_matrix< NumericT > const &A, viennacl::linalg::detail::amg::amg_level_context &amg_context, viennacl::linalg::amg_tag &tag)
Classical (RS) one-pass coarsening. Single-Threaded! (VIENNACL_AMG_COARSE_CLASSIC_ONEPASS) ...
Definition: amg_operations.hpp:284

viennacl::linalg::host_based::amg::amg_id_influence::amg_id_influence
amg_id_influence(std::size_t id2, std::size_t influences2)
Definition: amg_operations.hpp:262

viennacl::compressed_matrix::handle
const handle_type & handle() const
Returns the OpenCL handle to the matrix entry array.
Definition: compressed_matrix.hpp:942

viennacl::compressed_matrix::handle1
const handle_type & handle1() const
Returns the OpenCL handle to the row index array.
Definition: compressed_matrix.hpp:936

viennacl::linalg::AMG_COARSENING_METHOD_MIS2_AGGREGATION
Definition: amg_base.hpp:50

viennacl::compressed_matrix::nnz
const vcl_size_t & nnz() const
Returns the number of nonzero entries.
Definition: compressed_matrix.hpp:931

NumericT
float NumericT
Definition: bisect.cpp:40

viennacl::linalg::host_based::amg::amg_coarse_ag_stage1_sequential
void amg_coarse_ag_stage1_sequential(compressed_matrix< NumericT > const &A, viennacl::linalg::detail::amg::amg_level_context &amg_context, viennacl::linalg::amg_tag &tag)
AG (aggregation based) coarsening, single-threaded version of stage 1.
Definition: amg_operations.hpp:367

viennacl::linalg::prod
VectorT prod(std::vector< std::vector< T, A1 >, A2 > const &matrix, VectorT const &vector)
Definition: prod.hpp:102

viennacl::compressed_matrix::generate_row_block_information
void generate_row_block_information()
Builds the row block information needed for fast sparse matrix-vector multiplications.
Definition: compressed_matrix.hpp:999

viennacl::linalg::host_based::amg::amg_transpose
void amg_transpose(compressed_matrix< NumericT > const &A, compressed_matrix< NumericT > &B)
Computes B = trans(A).
Definition: amg_operations.hpp:972

viennacl::linalg::AMG_COARSENING_METHOD_AGGREGATION
Definition: amg_base.hpp:49

viennacl::linalg::host_based::amg::operator>
bool operator>(amg_id_influence const &a, amg_id_influence const &b)
Definition: amg_operations.hpp:268

viennacl::linalg::AMG_INTERPOLATION_METHOD_SMOOTHED_AGGREGATION
Definition: amg_base.hpp:58

viennacl::linalg::host_based::amg::assign_to_dense
void assign_to_dense(viennacl::compressed_matrix< NumericT, AlignmentV > const &A, viennacl::matrix_base< NumericT > &B)
Definition: amg_operations.hpp:1042

viennacl::linalg::amg_tag::get_strong_connection_threshold
double get_strong_connection_threshold() const
Returns the strong connection threshold parameter.
Definition: amg_base.hpp:105

viennacl::linalg::detail::amg::amg_level_context::num_coarse_
unsigned int num_coarse_
Definition: amg_base.hpp:199

viennacl::compressed_matrix::handle2
const handle_type & handle2() const
Returns the OpenCL handle to the column index array.
Definition: compressed_matrix.hpp:938

viennacl::vcl_size_t
std::size_t vcl_size_t
Definition: forwards.h:75

viennacl::linalg::host_based::amg::enumerate_coarse_points
void enumerate_coarse_points(viennacl::linalg::detail::amg::amg_level_context &amg_context)
Assign IDs to coarse points.
Definition: amg_operations.hpp:235

viennacl::matrix_base::handle
handle_type & handle()
Returns the OpenCL handle, non-const-version.
Definition: matrix_def.hpp:244

viennacl::linalg::detail::amg::amg_level_context::POINT_TYPE_UNDECIDED
Definition: amg_base.hpp:189

viennacl::vector< unsigned int >

viennacl::diag
vector_expression< const matrix_base< NumericT >, const int, op_matrix_diag > diag(const matrix_base< NumericT > &A, int k=0)
Definition: matrix.hpp:895

viennacl::linalg::host_based::amg::smooth_jacobi
void smooth_jacobi(unsigned int iterations, compressed_matrix< NumericT > const &A, vector< NumericT > &x, vector< NumericT > &x_backup, vector< NumericT > const &rhs_smooth, NumericT weight)
Damped Jacobi Smoother (CUDA version)
Definition: amg_operations.hpp:1074

viennacl::row
vector_expression< const matrix_base< NumericT, F >, const unsigned int, op_row > row(const matrix_base< NumericT, F > &A, unsigned int i)
Definition: matrix.hpp:910

viennacl::linalg::host_based::amg::amg_coarse_ag_stage1_mis2
void amg_coarse_ag_stage1_mis2(compressed_matrix< NumericT > const &A, viennacl::linalg::detail::amg::amg_level_context &amg_context, viennacl::linalg::amg_tag &tag)
AG (aggregation based) coarsening, multi-threaded version of stage 1 using parallel maximum independe...
Definition: amg_operations.hpp:418

viennacl::linalg::host_based::amg::amg_interpol_sa
void amg_interpol_sa(compressed_matrix< NumericT > const &A, compressed_matrix< NumericT > &P, viennacl::linalg::detail::amg::amg_level_context &amg_context, viennacl::linalg::amg_tag &tag)
Smoothed aggregation interpolation. Multi-Threaded! (VIENNACL_INTERPOL_SA)
Definition: amg_operations.hpp:880

viennacl::linalg::detail::amg::amg_level_context::POINT_TYPE_FINE
Definition: amg_base.hpp:191

viennacl::linalg::amg_tag
A tag for algebraic multigrid (AMG). Used to transport information from the user to the implementatio...
Definition: amg_base.hpp:64

viennacl::linalg::host_based::amg::amg_influence
void amg_influence(compressed_matrix< NumericT > const &A, viennacl::linalg::detail::amg::amg_level_context &amg_context, viennacl::linalg::amg_tag &tag)
Dispatcher for influence processing.
Definition: amg_operations.hpp:224

viennacl::traits::context
viennacl::context context(T const &t)
Returns an ID for the currently active memory domain of an object.
Definition: context.hpp:40

viennacl::linalg::host_based::amg::amg_influence_trivial
void amg_influence_trivial(compressed_matrix< NumericT > const &A, viennacl::linalg::detail::amg::amg_level_context &amg_context, viennacl::linalg::amg_tag &tag)
Routine for taking all connections in the matrix as strong.
Definition: amg_operations.hpp:50

viennacl::copy
void copy(std::vector< NumericT > &cpu_vec, circulant_matrix< NumericT, AlignmentV > &gpu_mat)
Copies a circulant matrix from the std::vector to the OpenCL device (either GPU or multi-core CPU) ...
Definition: circulant_matrix.hpp:150

viennacl::linalg::host_based::amg::amg_coarse
void amg_coarse(MatrixT &A, viennacl::linalg::detail::amg::amg_level_context &amg_context, viennacl::linalg::amg_tag &tag)
Entry point and dispatcher for coarsening procedures.
Definition: amg_operations.hpp:697

viennacl::vector_base::size
size_type size() const
Returns the length of the vector (cf. std::vector)
Definition: vector_def.hpp:118

viennacl::linalg::detail::amg::amg_level_context::point_types_
viennacl::vector< unsigned int > point_types_
Definition: amg_base.hpp:197

viennacl::linalg::amg_tag::get_interpolation_method
amg_interpolation_method get_interpolation_method() const
Returns the current interpolation method.
Definition: amg_base.hpp:93

viennacl::tools::sparse_matrix_adapter
Adapts a non-const sparse matrix type made up from std::vector > to basic u...
Definition: adapter.hpp:357

viennacl::compressed_matrix< NumericT >

viennacl::matrix_base::internal_size2
size_type internal_size2() const
Returns the internal number of columns. Usually required for launching OpenCL kernels only...
Definition: matrix_def.hpp:240

amg_base.hpp
Helper classes and functions for the AMG preconditioner. Experimental.

viennacl::linalg::detail::amg::amg_level_context::POINT_TYPE_COARSE
Definition: amg_base.hpp:190

viennacl::linalg::host_based::amg::amg_interpol
void amg_interpol(MatrixT const &A, MatrixT &P, viennacl::linalg::detail::amg::amg_level_context &amg_context, viennacl::linalg::amg_tag &tag)
Dispatcher for building the interpolation matrix.
Definition: amg_operations.hpp:952

viennacl::linalg::host_based::amg::amg_id_influence::id
unsigned int id
Definition: amg_operations.hpp:264

viennacl::linalg::host_based::amg::amg_interpol_direct
void amg_interpol_direct(compressed_matrix< NumericT > const &A, compressed_matrix< NumericT > &P, viennacl::linalg::detail::amg::amg_level_context &amg_context, viennacl::linalg::amg_tag &tag)
Direct interpolation. Multi-threaded! (VIENNACL_AMG_INTERPOL_DIRECT)
Definition: amg_operations.hpp:724

viennacl::linalg::detail::amg::amg_level_context::coarse_id_
viennacl::vector< unsigned int > coarse_id_
Definition: amg_base.hpp:198

viennacl::linalg::AMG_COARSENING_METHOD_ONEPASS
Definition: amg_base.hpp:48

viennacl::compressed_matrix::resize
void resize(vcl_size_t new_size1, vcl_size_t new_size2, bool preserve=true)
Resize the matrix.
Definition: compressed_matrix.hpp:829

viennacl::linalg::host_based::amg::amg_id_influence::influences
unsigned int influences
Definition: amg_operations.hpp:265

viennacl::vector_base::handle
const handle_type & handle() const
Returns the memory handle.
Definition: vector_def.hpp:128

viennacl::linalg::detail::amg::amg_level_context::influence_values_
viennacl::vector< unsigned int > influence_values_
Definition: amg_base.hpp:196

viennacl::linalg::detail::amg::amg_level_context::influence_ids_
viennacl::vector< unsigned int > influence_ids_
Definition: amg_base.hpp:195

viennacl::linalg::detail::amg::amg_level_context::influence_jumper_
viennacl::vector< unsigned int > influence_jumper_
Definition: amg_base.hpp:194