ViennaCL - The Vienna Computing Library  1.7.1
Free open-source GPU-accelerated linear algebra and solver library.
compressed_matrix.hpp
1 #ifndef VIENNACL_COMPRESSED_MATRIX_HPP_
2 #define VIENNACL_COMPRESSED_MATRIX_HPP_
3 
4 /* =========================================================================
5  Copyright (c) 2010-2016, Institute for Microelectronics,
6  Institute for Analysis and Scientific Computing,
7  TU Wien.
8  Portions of this software are copyright by UChicago Argonne, LLC.
9 
10  -----------------
11  ViennaCL - The Vienna Computing Library
12  -----------------
13 
14  Project Head: Karl Rupp rupp@iue.tuwien.ac.at
15 
16  (A list of authors and contributors can be found in the manual)
17 
18  License: MIT (X11), see file LICENSE in the base directory
19 ============================================================================= */
20 
25 #include <vector>
26 #include <list>
27 #include <map>
28 #include "viennacl/forwards.h"
29 #include "viennacl/vector.hpp"
30 
31 #include "viennacl/linalg/sparse_matrix_operations.hpp"
32 
33 #include "viennacl/tools/tools.hpp"
34 #include "viennacl/tools/entry_proxy.hpp"
35 
36 #ifdef VIENNACL_WITH_UBLAS
37 #include <boost/numeric/ublas/matrix_sparse.hpp>
38 #endif
39 
40 namespace viennacl
41 {
42 namespace detail
43 {
44 
49  template<typename CPUMatrixT, typename NumericT, unsigned int AlignmentV>
50  void copy_impl(const CPUMatrixT & cpu_matrix,
51  compressed_matrix<NumericT, AlignmentV> & gpu_matrix,
52  vcl_size_t nonzeros)
53  {
54  assert( (gpu_matrix.size1() == 0 || viennacl::traits::size1(cpu_matrix) == gpu_matrix.size1()) && bool("Size mismatch") );
55  assert( (gpu_matrix.size2() == 0 || viennacl::traits::size2(cpu_matrix) == gpu_matrix.size2()) && bool("Size mismatch") );
56 
57  viennacl::backend::typesafe_host_array<unsigned int> row_buffer(gpu_matrix.handle1(), cpu_matrix.size1() + 1);
58  viennacl::backend::typesafe_host_array<unsigned int> col_buffer(gpu_matrix.handle2(), nonzeros);
59  std::vector<NumericT> elements(nonzeros);
60 
61  vcl_size_t row_index = 0;
62  vcl_size_t data_index = 0;
63 
64  for (typename CPUMatrixT::const_iterator1 row_it = cpu_matrix.begin1();
65  row_it != cpu_matrix.end1();
66  ++row_it)
67  {
68  row_buffer.set(row_index, data_index);
69  ++row_index;
70 
71  for (typename CPUMatrixT::const_iterator2 col_it = row_it.begin();
72  col_it != row_it.end();
73  ++col_it)
74  {
75  col_buffer.set(data_index, col_it.index2());
76  elements[data_index] = *col_it;
77  ++data_index;
78  }
79  data_index = viennacl::tools::align_to_multiple<vcl_size_t>(data_index, AlignmentV); //take care of alignment
80  }
81  row_buffer.set(row_index, data_index);
82 
83  gpu_matrix.set(row_buffer.get(),
84  col_buffer.get(),
85  &elements[0],
86  cpu_matrix.size1(),
87  cpu_matrix.size2(),
88  nonzeros);
89  }
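// Editorial illustration (not part of the original header): for AlignmentV == 1 and the 3x3 matrix
//
//   [1 0 2]
//   [0 0 3]
//   [4 5 0]
//
// copy_impl() assembles the CSR arrays
//
//   row_buffer = {0, 2, 3, 5}   (start offset of each row, plus the total number of entries)
//   col_buffer = {0, 2, 2, 0, 1}
//   elements   = {1, 2, 3, 4, 5}
//
// For AlignmentV > 1, each row is padded so that its length becomes a multiple of AlignmentV.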
90 }
91 
92 //
93 // host to device:
94 //
95 
96 //provide copy-operation:
111 template<typename CPUMatrixT, typename NumericT, unsigned int AlignmentV>
112 void copy(const CPUMatrixT & cpu_matrix,
113  compressed_matrix<NumericT, AlignmentV> & gpu_matrix )
114 {
115  if ( cpu_matrix.size1() > 0 && cpu_matrix.size2() > 0 )
116  {
117  //determine nonzeros:
118  vcl_size_t num_entries = 0;
119  for (typename CPUMatrixT::const_iterator1 row_it = cpu_matrix.begin1();
120  row_it != cpu_matrix.end1();
121  ++row_it)
122  {
123  vcl_size_t entries_per_row = 0;
124  for (typename CPUMatrixT::const_iterator2 col_it = row_it.begin();
125  col_it != row_it.end();
126  ++col_it)
127  {
128  ++entries_per_row;
129  }
130  num_entries += viennacl::tools::align_to_multiple<vcl_size_t>(entries_per_row, AlignmentV);
131  }
132 
133  if (num_entries == 0) //we copy an empty matrix
134  num_entries = 1;
135 
136  //set up matrix entries:
137  viennacl::detail::copy_impl(cpu_matrix, gpu_matrix, num_entries);
138  }
139 }
140 
141 
142 //adapted for std::vector< std::map < > > argument:
148 template<typename SizeT, typename NumericT, unsigned int AlignmentV>
149 void copy(const std::vector< std::map<SizeT, NumericT> > & cpu_matrix,
150  compressed_matrix<NumericT, AlignmentV> & gpu_matrix )
151 {
152  vcl_size_t nonzeros = 0;
153  vcl_size_t max_col = 0;
154  for (vcl_size_t i=0; i<cpu_matrix.size(); ++i)
155  {
156  if (cpu_matrix[i].size() > 0)
157  nonzeros += ((cpu_matrix[i].size() - 1) / AlignmentV + 1) * AlignmentV;
158  if (cpu_matrix[i].size() > 0)
159  max_col = std::max<vcl_size_t>(max_col, (cpu_matrix[i].rbegin())->first);
160  }
161 
162  viennacl::detail::copy_impl(tools::const_sparse_matrix_adapter<NumericT, SizeT>(cpu_matrix, cpu_matrix.size(), max_col + 1),
163  gpu_matrix,
164  nonzeros);
165 }
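// Editorial usage sketch (hypothetical variable names, assuming double precision and the default
// alignment): fill a host-side std::vector<std::map<>> and transfer it with the overload above.
//
//   std::vector< std::map<unsigned int, double> > host_A(3);
//   host_A[0][0] = 1.0; host_A[0][2] = 2.0;
//   host_A[1][2] = 3.0;
//   host_A[2][0] = 4.0; host_A[2][1] = 5.0;
//
//   viennacl::compressed_matrix<double> device_A(3, 3);
//   viennacl::copy(host_A, device_A);   // host -> device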
166 
167 #ifdef VIENNACL_WITH_UBLAS
168 
172 template<typename ScalarType, typename F, vcl_size_t IB, typename IA, typename TA>
173 void copy(const boost::numeric::ublas::compressed_matrix<ScalarType, F, IB, IA, TA> & ublas_matrix,
174  viennacl::compressed_matrix<ScalarType, 1> & gpu_matrix )
175 {
176  assert( (gpu_matrix.size1() == 0 || viennacl::traits::size1(ublas_matrix) == gpu_matrix.size1()) && bool("Size mismatch") );
177  assert( (gpu_matrix.size2() == 0 || viennacl::traits::size2(ublas_matrix) == gpu_matrix.size2()) && bool("Size mismatch") );
178 
179  //we just need to copy the CSR arrays:
180  viennacl::backend::typesafe_host_array<unsigned int> row_buffer(gpu_matrix.handle1(), ublas_matrix.size1() + 1);
181  for (vcl_size_t i=0; i<=ublas_matrix.size1(); ++i)
182  row_buffer.set(i, ublas_matrix.index1_data()[i]);
183 
184  viennacl::backend::typesafe_host_array<unsigned int> col_buffer(gpu_matrix.handle2(), ublas_matrix.nnz());
185  for (vcl_size_t i=0; i<ublas_matrix.nnz(); ++i)
186  col_buffer.set(i, ublas_matrix.index2_data()[i]);
187 
188  gpu_matrix.set(row_buffer.get(),
189  col_buffer.get(),
190  &(ublas_matrix.value_data()[0]),
191  ublas_matrix.size1(),
192  ublas_matrix.size2(),
193  ublas_matrix.nnz());
194 
195 }
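// Editorial usage sketch (hypothetical names; requires VIENNACL_WITH_UBLAS): since uBLAS already
// stores CSR data, the overload above copies the three arrays directly.
//
//   boost::numeric::ublas::compressed_matrix<double> ublas_A(1000, 1000);
//   // ... fill ublas_A ...
//   viennacl::compressed_matrix<double> vcl_A(1000, 1000);
//   viennacl::copy(ublas_A, vcl_A);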
196 #endif
197 
198 #ifdef VIENNACL_WITH_ARMADILLO
199 
204 template<typename NumericT, unsigned int AlignmentV>
205 void copy(arma::SpMat<NumericT> const & arma_matrix,
206  viennacl::compressed_matrix<NumericT, AlignmentV> & vcl_matrix)
207 {
208  assert( (vcl_matrix.size1() == 0 || static_cast<vcl_size_t>(arma_matrix.n_rows) == vcl_matrix.size1()) && bool("Size mismatch") );
209  assert( (vcl_matrix.size2() == 0 || static_cast<vcl_size_t>(arma_matrix.n_cols) == vcl_matrix.size2()) && bool("Size mismatch") );
210 
211  viennacl::backend::typesafe_host_array<unsigned int> row_buffer(vcl_matrix.handle1(), arma_matrix.n_rows + 1);
212  viennacl::backend::typesafe_host_array<unsigned int> col_buffer(vcl_matrix.handle2(), arma_matrix.n_nonzero);
213  viennacl::backend::typesafe_host_array<NumericT > value_buffer(vcl_matrix.handle(), arma_matrix.n_nonzero);
214 
215  // Step 1: Count number of nonzeros in each row
216  for (vcl_size_t col=0; col < static_cast<vcl_size_t>(arma_matrix.n_cols); ++col)
217  {
218  vcl_size_t col_begin = static_cast<vcl_size_t>(arma_matrix.col_ptrs[col]);
219  vcl_size_t col_end = static_cast<vcl_size_t>(arma_matrix.col_ptrs[col+1]);
220  for (vcl_size_t i = col_begin; i < col_end; ++i)
221  {
222  unsigned int row = arma_matrix.row_indices[i];
223  row_buffer.set(row, row_buffer[row] + 1);
224  }
225  }
226 
227  // Step 2: Exclusive scan on row_buffer to obtain offsets
228  unsigned int offset = 0;
229  for (vcl_size_t i=0; i<row_buffer.size(); ++i)
230  {
231  unsigned int tmp = row_buffer[i];
232  row_buffer.set(i, offset);
233  offset += tmp;
234  }
235 
236  // Step 3: Fill data
237  std::vector<unsigned int> row_offsets(arma_matrix.n_rows);
238  for (vcl_size_t col=0; col < static_cast<vcl_size_t>(arma_matrix.n_cols); ++col)
239  {
240  vcl_size_t col_begin = static_cast<vcl_size_t>(arma_matrix.col_ptrs[col]);
241  vcl_size_t col_end = static_cast<vcl_size_t>(arma_matrix.col_ptrs[col+1]);
242  for (vcl_size_t i = col_begin; i < col_end; ++i)
243  {
244  unsigned int row = arma_matrix.row_indices[i];
245  col_buffer.set(row_buffer[row] + row_offsets[row], col);
246  value_buffer.set(row_buffer[row] + row_offsets[row], arma_matrix.values[i]);
247  row_offsets[row] += 1;
248  }
249  }
250 
251  vcl_matrix.set(row_buffer.get(), col_buffer.get(), reinterpret_cast<NumericT*>(value_buffer.get()),
252  arma_matrix.n_rows, arma_matrix.n_cols, arma_matrix.n_nonzero);
253 }
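// Editorial note: arma::SpMat stores compressed sparse columns (CSC), so the three steps above
// transpose the storage into CSR. As a small worked example of Step 2, per-row counts {2, 1, 2}
// become the exclusive-scan offsets {0, 2, 3}, and the running total 5 ends up as the final
// row_buffer entry once Step 3 has placed all entries.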
254 #endif
255 
256 #ifdef VIENNACL_WITH_EIGEN
257 
261 template<typename NumericT, int flags, unsigned int AlignmentV>
262 void copy(const Eigen::SparseMatrix<NumericT, flags> & eigen_matrix,
263  compressed_matrix<NumericT, AlignmentV> & gpu_matrix)
264 {
265  assert( (gpu_matrix.size1() == 0 || static_cast<vcl_size_t>(eigen_matrix.rows()) == gpu_matrix.size1()) && bool("Size mismatch") );
266  assert( (gpu_matrix.size2() == 0 || static_cast<vcl_size_t>(eigen_matrix.cols()) == gpu_matrix.size2()) && bool("Size mismatch") );
267 
268  std::vector< std::map<unsigned int, NumericT> > stl_matrix(eigen_matrix.rows());
269 
270  for (int k=0; k < eigen_matrix.outerSize(); ++k)
271  for (typename Eigen::SparseMatrix<NumericT, flags>::InnerIterator it(eigen_matrix, k); it; ++it)
272  stl_matrix[it.row()][it.col()] = it.value();
273 
274  copy(tools::const_sparse_matrix_adapter<NumericT>(stl_matrix, eigen_matrix.rows(), eigen_matrix.cols()), gpu_matrix);
275 }
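// Editorial usage sketch (hypothetical names; requires VIENNACL_WITH_EIGEN):
//
//   Eigen::SparseMatrix<double> eigen_A(1000, 1000);
//   // ... fill eigen_A, e.g. via setFromTriplets() ...
//   viennacl::compressed_matrix<double> vcl_A(1000, 1000);
//   viennacl::copy(eigen_A, vcl_A);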
276 #endif
277 
278 
279 #ifdef VIENNACL_WITH_MTL4
280 
284 template<typename NumericT, unsigned int AlignmentV>
285 void copy(const mtl::compressed2D<NumericT> & cpu_matrix,
286  compressed_matrix<NumericT, AlignmentV> & gpu_matrix)
287 {
288  assert( (gpu_matrix.size1() == 0 || static_cast<vcl_size_t>(cpu_matrix.num_rows()) == gpu_matrix.size1()) && bool("Size mismatch") );
289  assert( (gpu_matrix.size2() == 0 || static_cast<vcl_size_t>(cpu_matrix.num_cols()) == gpu_matrix.size2()) && bool("Size mismatch") );
290 
291  typedef mtl::compressed2D<NumericT> MatrixType;
292 
293  std::vector< std::map<unsigned int, NumericT> > stl_matrix(cpu_matrix.num_rows());
294 
295  using mtl::traits::range_generator;
296  using mtl::traits::range::min;
297 
298  // Choose between row and column traversal
299  typedef typename min<range_generator<mtl::tag::row, MatrixType>,
300  range_generator<mtl::tag::col, MatrixType> >::type range_type;
301  range_type my_range;
302 
303  // Type of outer cursor
304  typedef typename range_type::type c_type;
305  // Type of inner cursor
306  typedef typename mtl::traits::range_generator<mtl::tag::nz, c_type>::type ic_type;
307 
308  // Define the property maps
309  typename mtl::traits::row<MatrixType>::type row(cpu_matrix);
310  typename mtl::traits::col<MatrixType>::type col(cpu_matrix);
311  typename mtl::traits::const_value<MatrixType>::type value(cpu_matrix);
312 
313  // Now iterate over the matrix
314  for (c_type cursor(my_range.begin(cpu_matrix)), cend(my_range.end(cpu_matrix)); cursor != cend; ++cursor)
315  for (ic_type icursor(mtl::begin<mtl::tag::nz>(cursor)), icend(mtl::end<mtl::tag::nz>(cursor)); icursor != icend; ++icursor)
316  stl_matrix[row(*icursor)][col(*icursor)] = value(*icursor);
317 
318  copy(tools::const_sparse_matrix_adapter<NumericT>(stl_matrix, cpu_matrix.num_rows(), cpu_matrix.num_cols()), gpu_matrix);
319 }
320 #endif
321 
322 
323 
324 
325 
326 
327 
328 //
329 // device to host:
330 //
340 template<typename CPUMatrixT, typename NumericT, unsigned int AlignmentV>
341 void copy(const compressed_matrix<NumericT, AlignmentV> & gpu_matrix,
342  CPUMatrixT & cpu_matrix )
343 {
344  assert( (viennacl::traits::size1(cpu_matrix) == gpu_matrix.size1()) && bool("Size mismatch") );
345  assert( (viennacl::traits::size2(cpu_matrix) == gpu_matrix.size2()) && bool("Size mismatch") );
346 
347  if ( gpu_matrix.size1() > 0 && gpu_matrix.size2() > 0 )
348  {
349  //get raw data from memory:
350  viennacl::backend::typesafe_host_array<unsigned int> row_buffer(gpu_matrix.handle1(), cpu_matrix.size1() + 1);
351  viennacl::backend::typesafe_host_array<unsigned int> col_buffer(gpu_matrix.handle2(), gpu_matrix.nnz());
352  std::vector<NumericT> elements(gpu_matrix.nnz());
353 
354  //std::cout << "GPU->CPU, nonzeros: " << gpu_matrix.nnz() << std::endl;
355 
356  viennacl::backend::memory_read(gpu_matrix.handle1(), 0, row_buffer.raw_size(), row_buffer.get());
357  viennacl::backend::memory_read(gpu_matrix.handle2(), 0, col_buffer.raw_size(), col_buffer.get());
358  viennacl::backend::memory_read(gpu_matrix.handle(), 0, sizeof(NumericT)* gpu_matrix.nnz(), &(elements[0]));
359 
360  //fill the cpu_matrix:
361  vcl_size_t data_index = 0;
362  for (vcl_size_t row = 1; row <= gpu_matrix.size1(); ++row)
363  {
364  while (data_index < row_buffer[row])
365  {
366  if (col_buffer[data_index] >= gpu_matrix.size2())
367  {
368  std::cerr << "ViennaCL encountered invalid data at colbuffer[" << data_index << "]: " << col_buffer[data_index] << std::endl;
369  return;
370  }
371 
372  if (std::fabs(elements[data_index]) > static_cast<NumericT>(0))
373  cpu_matrix(row-1, static_cast<vcl_size_t>(col_buffer[data_index])) = elements[data_index];
374  ++data_index;
375  }
376  }
377  }
378 }
379 
380 
386 template<typename NumericT, unsigned int AlignmentV>
387 void copy(const compressed_matrix<NumericT, AlignmentV> & gpu_matrix,
388  std::vector< std::map<unsigned int, NumericT> > & cpu_matrix)
389 {
390  assert( (cpu_matrix.size() == gpu_matrix.size1()) && bool("Size mismatch") );
391 
392  tools::sparse_matrix_adapter<NumericT> temp(cpu_matrix, gpu_matrix.size1(), gpu_matrix.size2());
393  copy(gpu_matrix, temp);
394 }
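// Editorial usage sketch (hypothetical names): copying results back from the device with the
// overloads above.
//
//   std::vector< std::map<unsigned int, double> > host_result(vcl_A.size1());
//   viennacl::copy(vcl_A, host_result);   // device -> host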
395 
396 #ifdef VIENNACL_WITH_UBLAS
397 
401 template<typename ScalarType, unsigned int AlignmentV, typename F, vcl_size_t IB, typename IA, typename TA>
402 void copy(viennacl::compressed_matrix<ScalarType, AlignmentV> const & gpu_matrix,
403  boost::numeric::ublas::compressed_matrix<ScalarType> & ublas_matrix)
404 {
405  assert( (viennacl::traits::size1(ublas_matrix) == gpu_matrix.size1()) && bool("Size mismatch") );
406  assert( (viennacl::traits::size2(ublas_matrix) == gpu_matrix.size2()) && bool("Size mismatch") );
407 
408  viennacl::backend::typesafe_host_array<unsigned int> row_buffer(gpu_matrix.handle1(), gpu_matrix.size1() + 1);
409  viennacl::backend::typesafe_host_array<unsigned int> col_buffer(gpu_matrix.handle2(), gpu_matrix.nnz());
410 
411  viennacl::backend::memory_read(gpu_matrix.handle1(), 0, row_buffer.raw_size(), row_buffer.get());
412  viennacl::backend::memory_read(gpu_matrix.handle2(), 0, col_buffer.raw_size(), col_buffer.get());
413 
414  ublas_matrix.clear();
415  ublas_matrix.reserve(gpu_matrix.nnz());
416 
417  ublas_matrix.set_filled(gpu_matrix.size1() + 1, gpu_matrix.nnz());
418 
419  for (vcl_size_t i=0; i<ublas_matrix.size1() + 1; ++i)
420  ublas_matrix.index1_data()[i] = row_buffer[i];
421 
422  for (vcl_size_t i=0; i<ublas_matrix.nnz(); ++i)
423  ublas_matrix.index2_data()[i] = col_buffer[i];
424 
425  viennacl::backend::memory_read(gpu_matrix.handle(), 0, sizeof(ScalarType) * gpu_matrix.nnz(), &(ublas_matrix.value_data()[0]));
426 
427 }
428 #endif
429 
430 #ifdef VIENNACL_WITH_ARMADILLO
431 
436 template<typename NumericT, unsigned int AlignmentV>
437 void copy(viennacl::compressed_matrix<NumericT, AlignmentV> const & vcl_matrix,
438  arma::SpMat<NumericT> & arma_matrix)
439 {
440  assert( (static_cast<vcl_size_t>(arma_matrix.n_rows) == vcl_matrix.size1()) && bool("Size mismatch") );
441  assert( (static_cast<vcl_size_t>(arma_matrix.n_cols) == vcl_matrix.size2()) && bool("Size mismatch") );
442 
443  if ( vcl_matrix.size1() > 0 && vcl_matrix.size2() > 0 )
444  {
445  //get raw data from memory:
446  viennacl::backend::typesafe_host_array<unsigned int> row_buffer(vcl_matrix.handle1(), vcl_matrix.size1() + 1);
447  viennacl::backend::typesafe_host_array<unsigned int> col_buffer(vcl_matrix.handle2(), vcl_matrix.nnz());
448  viennacl::backend::typesafe_host_array<NumericT> elements (vcl_matrix.handle(), vcl_matrix.nnz());
449 
450  viennacl::backend::memory_read(vcl_matrix.handle1(), 0, row_buffer.raw_size(), row_buffer.get());
451  viennacl::backend::memory_read(vcl_matrix.handle2(), 0, col_buffer.raw_size(), col_buffer.get());
452  viennacl::backend::memory_read(vcl_matrix.handle(), 0, elements.raw_size(), elements.get());
453 
454  arma_matrix.zeros();
455  vcl_size_t data_index = 0;
456  for (vcl_size_t row = 1; row <= vcl_matrix.size1(); ++row)
457  {
458  while (data_index < row_buffer[row])
459  {
460  assert(col_buffer[data_index] < vcl_matrix.size2() && bool("ViennaCL encountered invalid data at col_buffer"));
461  if (elements[data_index] != static_cast<NumericT>(0.0))
462  arma_matrix(row-1, col_buffer[data_index]) = elements[data_index];
463  ++data_index;
464  }
465  }
466  }
467 }
468 #endif
469 
470 #ifdef VIENNACL_WITH_EIGEN
471 
472 template<typename NumericT, int flags, unsigned int AlignmentV>
473 void copy(compressed_matrix<NumericT, AlignmentV> & gpu_matrix,
474  Eigen::SparseMatrix<NumericT, flags> & eigen_matrix)
475 {
476  assert( (static_cast<vcl_size_t>(eigen_matrix.rows()) == gpu_matrix.size1()) && bool("Size mismatch") );
477  assert( (static_cast<vcl_size_t>(eigen_matrix.cols()) == gpu_matrix.size2()) && bool("Size mismatch") );
478 
479  if ( gpu_matrix.size1() > 0 && gpu_matrix.size2() > 0 )
480  {
481  //get raw data from memory:
482  viennacl::backend::typesafe_host_array<unsigned int> row_buffer(gpu_matrix.handle1(), gpu_matrix.size1() + 1);
483  viennacl::backend::typesafe_host_array<unsigned int> col_buffer(gpu_matrix.handle2(), gpu_matrix.nnz());
484  std::vector<NumericT> elements(gpu_matrix.nnz());
485 
486  viennacl::backend::memory_read(gpu_matrix.handle1(), 0, row_buffer.raw_size(), row_buffer.get());
487  viennacl::backend::memory_read(gpu_matrix.handle2(), 0, col_buffer.raw_size(), col_buffer.get());
488  viennacl::backend::memory_read(gpu_matrix.handle(), 0, sizeof(NumericT)* gpu_matrix.nnz(), &(elements[0]));
489 
490  eigen_matrix.setZero();
491  vcl_size_t data_index = 0;
492  for (vcl_size_t row = 1; row <= gpu_matrix.size1(); ++row)
493  {
494  while (data_index < row_buffer[row])
495  {
496  assert(col_buffer[data_index] < gpu_matrix.size2() && bool("ViennaCL encountered invalid data at col_buffer"));
497  if (elements[data_index] != static_cast<NumericT>(0.0))
498  eigen_matrix.insert(row-1, col_buffer[data_index]) = elements[data_index];
499  ++data_index;
500  }
501  }
502  }
503 }
504 #endif
505 
506 
507 
508 #ifdef VIENNACL_WITH_MTL4
509 
510 template<typename NumericT, unsigned int AlignmentV>
511 void copy(compressed_matrix<NumericT, AlignmentV> & gpu_matrix,
512  mtl::compressed2D<NumericT> & mtl4_matrix)
513 {
514  assert( (static_cast<vcl_size_t>(mtl4_matrix.num_rows()) == gpu_matrix.size1()) && bool("Size mismatch") );
515  assert( (static_cast<vcl_size_t>(mtl4_matrix.num_cols()) == gpu_matrix.size2()) && bool("Size mismatch") );
516 
517  if ( gpu_matrix.size1() > 0 && gpu_matrix.size2() > 0 )
518  {
519 
520  //get raw data from memory:
521  viennacl::backend::typesafe_host_array<unsigned int> row_buffer(gpu_matrix.handle1(), gpu_matrix.size1() + 1);
522  viennacl::backend::typesafe_host_array<unsigned int> col_buffer(gpu_matrix.handle2(), gpu_matrix.nnz());
523  std::vector<NumericT> elements(gpu_matrix.nnz());
524 
525  viennacl::backend::memory_read(gpu_matrix.handle1(), 0, row_buffer.raw_size(), row_buffer.get());
526  viennacl::backend::memory_read(gpu_matrix.handle2(), 0, col_buffer.raw_size(), col_buffer.get());
527  viennacl::backend::memory_read(gpu_matrix.handle(), 0, sizeof(NumericT)* gpu_matrix.nnz(), &(elements[0]));
528 
529  //set_to_zero(mtl4_matrix);
530  //mtl4_matrix.change_dim(gpu_matrix.size1(), gpu_matrix.size2());
531 
532  mtl::matrix::inserter< mtl::compressed2D<NumericT> > ins(mtl4_matrix);
533  vcl_size_t data_index = 0;
534  for (vcl_size_t row = 1; row <= gpu_matrix.size1(); ++row)
535  {
536  while (data_index < row_buffer[row])
537  {
538  assert(col_buffer[data_index] < gpu_matrix.size2() && bool("ViennaCL encountered invalid data at col_buffer"));
539  if (elements[data_index] != static_cast<NumericT>(0.0))
540  ins(row-1, col_buffer[data_index]) << typename mtl::Collection< mtl::compressed2D<NumericT> >::value_type(elements[data_index]);
541  ++data_index;
542  }
543  }
544  }
545 }
546 #endif
547 
548 
549 
550 
551 
553 
558 template<class NumericT, unsigned int AlignmentV /* see VCLForwards.h */>
559 class compressed_matrix
560 {
561 public:
562  typedef viennacl::backend::mem_handle                                                            handle_type;
563  typedef scalar<typename viennacl::tools::CHECK_SCALAR_TEMPLATE_ARGUMENT<NumericT>::ResultType>   value_type;
564  typedef vcl_size_t                                                                               size_type;
565 
567  compressed_matrix() : rows_(0), cols_(0), nonzeros_(0), row_block_num_(0) {}
568 
576  explicit compressed_matrix(vcl_size_t rows, vcl_size_t cols, vcl_size_t nonzeros = 0, viennacl::context ctx = viennacl::context())
577  : rows_(rows), cols_(cols), nonzeros_(nonzeros), row_block_num_(0)
578  {
579  row_buffer_.switch_active_handle_id(ctx.memory_type());
580  col_buffer_.switch_active_handle_id(ctx.memory_type());
581  elements_.switch_active_handle_id(ctx.memory_type());
582  row_blocks_.switch_active_handle_id(ctx.memory_type());
583 
584 #ifdef VIENNACL_WITH_OPENCL
585  if (ctx.memory_type() == OPENCL_MEMORY)
586  {
587  row_buffer_.opencl_handle().context(ctx.opencl_context());
588  col_buffer_.opencl_handle().context(ctx.opencl_context());
589  elements_.opencl_handle().context(ctx.opencl_context());
590  row_blocks_.opencl_handle().context(ctx.opencl_context());
591  }
592 #endif
593  if (rows > 0)
594  {
595  viennacl::backend::memory_create(row_buffer_, viennacl::backend::typesafe_host_array<unsigned int>(row_buffer_).element_size() * (rows + 1), ctx);
596  viennacl::vector_base<unsigned int> init_temporary(row_buffer_, size_type(rows+1), 0, 1);
597  init_temporary = viennacl::zero_vector<unsigned int>(size_type(rows+1), ctx);
598  }
599  if (nonzeros > 0)
600  {
601  viennacl::backend::memory_create(col_buffer_, viennacl::backend::typesafe_host_array<unsigned int>(col_buffer_).element_size() * nonzeros, ctx);
602  viennacl::backend::memory_create(elements_, sizeof(NumericT) * nonzeros, ctx);
603  }
604  }
605 
612  explicit compressed_matrix(vcl_size_t rows, vcl_size_t cols, viennacl::context ctx)
613  : rows_(rows), cols_(cols), nonzeros_(0), row_block_num_(0)
614  {
615  row_buffer_.switch_active_handle_id(ctx.memory_type());
616  col_buffer_.switch_active_handle_id(ctx.memory_type());
617  elements_.switch_active_handle_id(ctx.memory_type());
618  row_blocks_.switch_active_handle_id(ctx.memory_type());
619 
620 #ifdef VIENNACL_WITH_OPENCL
621  if (ctx.memory_type() == OPENCL_MEMORY)
622  {
623  row_buffer_.opencl_handle().context(ctx.opencl_context());
624  col_buffer_.opencl_handle().context(ctx.opencl_context());
625  elements_.opencl_handle().context(ctx.opencl_context());
626  row_blocks_.opencl_handle().context(ctx.opencl_context());
627  }
628 #endif
629  if (rows > 0)
630  {
631  viennacl::backend::memory_create(row_buffer_, viennacl::backend::typesafe_host_array<unsigned int>(row_buffer_).element_size() * (rows + 1), ctx);
632  viennacl::vector_base<unsigned int> init_temporary(row_buffer_, size_type(rows+1), 0, 1);
633  init_temporary = viennacl::zero_vector<unsigned int>(size_type(rows+1), ctx);
634  }
635  }
636 
641  explicit compressed_matrix(viennacl::context ctx) : rows_(0), cols_(0), nonzeros_(0), row_block_num_(0)
642  {
643  row_buffer_.switch_active_handle_id(ctx.memory_type());
644  col_buffer_.switch_active_handle_id(ctx.memory_type());
645  elements_.switch_active_handle_id(ctx.memory_type());
646  row_blocks_.switch_active_handle_id(ctx.memory_type());
647 
648 #ifdef VIENNACL_WITH_OPENCL
649  if (ctx.memory_type() == OPENCL_MEMORY)
650  {
651  row_buffer_.opencl_handle().context(ctx.opencl_context());
652  col_buffer_.opencl_handle().context(ctx.opencl_context());
653  elements_.opencl_handle().context(ctx.opencl_context());
654  row_blocks_.opencl_handle().context(ctx.opencl_context());
655  }
656 #endif
657  }
658 
659 
660 #ifdef VIENNACL_WITH_OPENCL
661 
670  explicit compressed_matrix(cl_mem mem_row_buffer, cl_mem mem_col_buffer, cl_mem mem_elements,
671  vcl_size_t rows, vcl_size_t cols, vcl_size_t nonzeros) :
672  rows_(rows), cols_(cols), nonzeros_(nonzeros), row_block_num_(0)
673  {
675  row_buffer_.opencl_handle() = mem_row_buffer;
676  row_buffer_.opencl_handle().inc(); //prevents the user-provided memory from being deleted once the matrix object is destroyed.
677  row_buffer_.raw_size(sizeof(cl_uint) * (rows + 1));
678 
680  col_buffer_.opencl_handle() = mem_col_buffer;
681  col_buffer_.opencl_handle().inc(); //prevents the user-provided memory from being deleted once the matrix object is destroyed.
682  col_buffer_.raw_size(sizeof(cl_uint) * nonzeros);
683 
685  elements_.opencl_handle() = mem_elements;
686  elements_.opencl_handle().inc(); //prevents the user-provided memory from being deleted once the matrix object is destroyed.
687  elements_.raw_size(sizeof(NumericT) * nonzeros);
688 
689  //generate block information for CSR-adaptive:
690  generate_row_block_information();
691  }
692 #endif
693 
695  explicit compressed_matrix(matrix_expression<const compressed_matrix, const compressed_matrix, op_prod> const & proxy)
696  : rows_(0), cols_(0), nonzeros_(0), row_block_num_(0)
697  {
698  viennacl::context ctx = viennacl::traits::context(proxy.lhs());
699 
700  row_buffer_.switch_active_handle_id(ctx.memory_type());
701  col_buffer_.switch_active_handle_id(ctx.memory_type());
702  elements_.switch_active_handle_id(ctx.memory_type());
703  row_blocks_.switch_active_handle_id(ctx.memory_type());
704 
705 #ifdef VIENNACL_WITH_OPENCL
706  if (ctx.memory_type() == OPENCL_MEMORY)
707  {
708  row_buffer_.opencl_handle().context(ctx.opencl_context());
709  col_buffer_.opencl_handle().context(ctx.opencl_context());
710  elements_.opencl_handle().context(ctx.opencl_context());
711  row_blocks_.opencl_handle().context(ctx.opencl_context());
712  }
713 #endif
714 
715  viennacl::linalg::prod_impl(proxy.lhs(), proxy.rhs(), *this);
716  generate_row_block_information();
717  }
718 
720  compressed_matrix & operator=(compressed_matrix const & other)
721  {
722  assert( (rows_ == 0 || rows_ == other.size1()) && bool("Size mismatch") );
723  assert( (cols_ == 0 || cols_ == other.size2()) && bool("Size mismatch") );
724 
725  rows_ = other.size1();
726  cols_ = other.size2();
727  nonzeros_ = other.nnz();
728  row_block_num_ = other.row_block_num_;
729 
730  viennacl::backend::typesafe_memory_copy<unsigned int>(other.row_buffer_, row_buffer_);
731  viennacl::backend::typesafe_memory_copy<unsigned int>(other.col_buffer_, col_buffer_);
732  viennacl::backend::typesafe_memory_copy<unsigned int>(other.row_blocks_, row_blocks_);
733  viennacl::backend::typesafe_memory_copy<NumericT>(other.elements_, elements_);
734 
735  return *this;
736  }
737 
739  compressed_matrix & operator=(matrix_expression<const compressed_matrix, const compressed_matrix, op_prod> const & proxy)
740  {
741  assert( (rows_ == 0 || rows_ == proxy.lhs().size1()) && bool("Size mismatch") );
742  assert( (cols_ == 0 || cols_ == proxy.rhs().size2()) && bool("Size mismatch") );
743 
744  viennacl::linalg::prod_impl(proxy.lhs(), proxy.rhs(), *this);
745  generate_row_block_information();
746 
747  return *this;
748  }
749 
750 
764  void set(const void * row_jumper,
765  const void * col_buffer,
766  const NumericT * elements,
767  vcl_size_t rows,
768  vcl_size_t cols,
769  vcl_size_t nonzeros)
770  {
771  assert( (rows > 0) && bool("Error in compressed_matrix::set(): Number of rows must be larger than zero!"));
772  assert( (cols > 0) && bool("Error in compressed_matrix::set(): Number of columns must be larger than zero!"));
773  assert( (nonzeros > 0) && bool("Error in compressed_matrix::set(): Number of nonzeros must be larger than zero!"));
774  //std::cout << "Setting memory: " << cols + 1 << ", " << nonzeros << std::endl;
775 
776  //row_buffer_.switch_active_handle_id(viennacl::backend::OPENCL_MEMORY);
777  viennacl::backend::memory_create(row_buffer_, viennacl::backend::typesafe_host_array<unsigned int>(row_buffer_).element_size() * (rows + 1), viennacl::traits::context(row_buffer_), row_jumper);
778 
779  //col_buffer_.switch_active_handle_id(viennacl::backend::OPENCL_MEMORY);
780  viennacl::backend::memory_create(col_buffer_, viennacl::backend::typesafe_host_array<unsigned int>(col_buffer_).element_size() * nonzeros, viennacl::traits::context(col_buffer_), col_buffer);
781 
782  //elements_.switch_active_handle_id(viennacl::backend::OPENCL_MEMORY);
783  viennacl::backend::memory_create(elements_, sizeof(NumericT) * nonzeros, viennacl::traits::context(elements_), elements);
784 
785  nonzeros_ = nonzeros;
786  rows_ = rows;
787  cols_ = cols;
788 
789  //generate block information for CSR-adaptive:
790  generate_row_block_information();
791  }
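// Editorial usage sketch (hypothetical names): set() consumes ready-made CSR arrays. For the 3x3
// example from the beginning of this file one might write (the index arrays must use the unsigned
// integer type expected by the active backend, typically unsigned int):
//
//   unsigned int row_jumper[4]  = {0, 2, 3, 5};
//   unsigned int col_indices[5] = {0, 2, 2, 0, 1};
//   double       values[5]      = {1, 2, 3, 4, 5};
//   A.set(row_jumper, col_indices, values, 3, 3, 5);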
792 
794  void reserve(vcl_size_t new_nonzeros, bool preserve = true)
795  {
796  if (new_nonzeros > nonzeros_)
797  {
798  if (preserve)
799  {
800  handle_type col_buffer_old;
801  handle_type elements_old;
802  viennacl::backend::memory_shallow_copy(col_buffer_, col_buffer_old);
803  viennacl::backend::memory_shallow_copy(elements_, elements_old);
804 
805  viennacl::backend::typesafe_host_array<unsigned int> size_deducer(col_buffer_);
806  viennacl::backend::memory_create(col_buffer_, size_deducer.element_size() * new_nonzeros, viennacl::traits::context(col_buffer_));
807  viennacl::backend::memory_create(elements_, sizeof(NumericT) * new_nonzeros, viennacl::traits::context(elements_));
808 
809  viennacl::backend::memory_copy(col_buffer_old, col_buffer_, 0, 0, size_deducer.element_size() * nonzeros_);
810  viennacl::backend::memory_copy(elements_old, elements_, 0, 0, sizeof(NumericT)* nonzeros_);
811  }
812  else
813  {
814  viennacl::backend::typesafe_host_array<unsigned int> size_deducer(col_buffer_);
815  viennacl::backend::memory_create(col_buffer_, size_deducer.element_size() * new_nonzeros, viennacl::traits::context(col_buffer_));
816  viennacl::backend::memory_create(elements_, sizeof(NumericT) * new_nonzeros, viennacl::traits::context(elements_));
817  }
818 
819  nonzeros_ = new_nonzeros;
820  }
821  }
822 
829  void resize(vcl_size_t new_size1, vcl_size_t new_size2, bool preserve = true)
830  {
831  assert(new_size1 > 0 && new_size2 > 0 && bool("Cannot resize to zero size!"));
832 
833  if (new_size1 != rows_ || new_size2 != cols_)
834  {
835  if (!preserve)
836  {
837  viennacl::backend::typesafe_host_array<unsigned int> host_row_buffer(row_buffer_, new_size1 + 1);
838  viennacl::backend::memory_create(row_buffer_, host_row_buffer.element_size() * (new_size1 + 1), viennacl::traits::context(row_buffer_), host_row_buffer.get());
839  // faster version without initializing memory:
840  //viennacl::backend::memory_create(row_buffer_, viennacl::backend::typesafe_host_array<unsigned int>().element_size() * (new_size1 + 1), viennacl::traits::context(row_buffer_));
841  nonzeros_ = 0;
842  }
843  else
844  {
845  std::vector<std::map<unsigned int, NumericT> > stl_sparse_matrix;
846  if (rows_ > 0)
847  {
848  stl_sparse_matrix.resize(rows_);
849  viennacl::copy(*this, stl_sparse_matrix);
850  } else {
851  stl_sparse_matrix.resize(new_size1);
852  stl_sparse_matrix[0][0] = 0; //enforces nonzero array sizes if matrix was initially empty
853  }
854 
855  stl_sparse_matrix.resize(new_size1);
856 
857  //discard entries with column index larger than new_size2
858  if (new_size2 < cols_ && rows_ > 0)
859  {
860  for (vcl_size_t i=0; i<stl_sparse_matrix.size(); ++i)
861  {
862  std::list<unsigned int> to_delete;
863  for (typename std::map<unsigned int, NumericT>::iterator it = stl_sparse_matrix[i].begin();
864  it != stl_sparse_matrix[i].end();
865  ++it)
866  {
867  if (it->first >= new_size2)
868  to_delete.push_back(it->first);
869  }
870 
871  for (std::list<unsigned int>::iterator it = to_delete.begin(); it != to_delete.end(); ++it)
872  stl_sparse_matrix[i].erase(*it);
873  }
874  }
875 
876  viennacl::tools::sparse_matrix_adapter<NumericT> adapted_matrix(stl_sparse_matrix, new_size1, new_size2);
877  rows_ = new_size1;
878  cols_ = new_size2;
879  viennacl::copy(adapted_matrix, *this);
880  }
881 
882  rows_ = new_size1;
883  cols_ = new_size2;
884  }
885  }
886 
888  void clear()
889  {
890  viennacl::backend::typesafe_host_array<unsigned int> host_row_buffer(row_buffer_, rows_ + 1);
891  viennacl::backend::typesafe_host_array<unsigned int> host_col_buffer(col_buffer_, 1);
892  std::vector<NumericT> host_elements(1);
893 
894  viennacl::backend::memory_create(row_buffer_, host_row_buffer.element_size() * (rows_ + 1), viennacl::traits::context(row_buffer_), host_row_buffer.get());
895  viennacl::backend::memory_create(col_buffer_, host_col_buffer.element_size() * 1, viennacl::traits::context(col_buffer_), host_col_buffer.get());
896  viennacl::backend::memory_create(elements_, sizeof(NumericT) * 1, viennacl::traits::context(elements_), &(host_elements[0]));
897 
898  nonzeros_ = 0;
899  }
900 
902  entry_proxy<NumericT> operator()(vcl_size_t i, vcl_size_t j)
903  {
904  assert( (i < rows_) && (j < cols_) && bool("compressed_matrix access out of bounds!"));
905 
906  vcl_size_t index = element_index(i, j);
907 
908  // check for element in sparsity pattern
909  if (index < nonzeros_)
910  return entry_proxy<NumericT>(index, elements_);
911 
912  // Element not found. Copying required. Very slow, but direct entry manipulation is painful anyway...
913  std::vector< std::map<unsigned int, NumericT> > cpu_backup(rows_);
914  tools::sparse_matrix_adapter<NumericT> adapted_cpu_backup(cpu_backup, rows_, cols_);
915  viennacl::copy(*this, adapted_cpu_backup);
916  cpu_backup[i][static_cast<unsigned int>(j)] = 0.0;
917  viennacl::copy(adapted_cpu_backup, *this);
918 
919  index = element_index(i, j);
920 
921  assert(index < nonzeros_);
922 
923  return entry_proxy<NumericT>(index, elements_);
924  }
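// Editorial note: writing through the returned proxy is cheap only if (i,j) is already part of the
// sparsity pattern; otherwise the whole matrix is copied to the host, extended, and copied back.
//
//   A(2, 1) = 5.0;   // fast if (2,1) is a stored entry, full host round-trip otherwise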
925 
927  const vcl_size_t & size1() const { return rows_; }
929  const vcl_size_t & size2() const { return cols_; }
931  const vcl_size_t & nnz() const { return nonzeros_; }
933  const vcl_size_t & blocks1() const { return row_block_num_; }
934 
936  const handle_type & handle1() const { return row_buffer_; }
938  const handle_type & handle2() const { return col_buffer_; }
940  const handle_type & handle3() const { return row_blocks_; }
942  const handle_type & handle() const { return elements_; }
943 
945  handle_type & handle1() { return row_buffer_; }
947  handle_type & handle2() { return col_buffer_; }
949  handle_type & handle3() { return row_blocks_; }
951  handle_type & handle() { return elements_; }
952 
957  void switch_memory_context(viennacl::context new_ctx)
958  {
959  viennacl::backend::switch_memory_context<unsigned int>(row_buffer_, new_ctx);
960  viennacl::backend::switch_memory_context<unsigned int>(col_buffer_, new_ctx);
961  viennacl::backend::switch_memory_context<unsigned int>(row_blocks_, new_ctx);
962  viennacl::backend::switch_memory_context<NumericT>(elements_, new_ctx);
963  }
964 
966  viennacl::memory_types memory_context() const
967  {
968  return row_buffer_.get_active_handle_id();
969  }
970 
971 private:
972 
974  vcl_size_t element_index(vcl_size_t i, vcl_size_t j)
975  {
976  //read row indices
977  viennacl::backend::typesafe_host_array<unsigned int> row_indices(row_buffer_, 2);
978  viennacl::backend::memory_read(row_buffer_, row_indices.element_size()*i, row_indices.element_size()*2, row_indices.get());
979 
980  //get column indices for row i:
981  viennacl::backend::typesafe_host_array<unsigned int> col_indices(col_buffer_, row_indices[1] - row_indices[0]);
982  viennacl::backend::memory_read(col_buffer_, col_indices.element_size()*row_indices[0], row_indices.element_size()*col_indices.size(), col_indices.get());
983 
984  for (vcl_size_t k=0; k<col_indices.size(); ++k)
985  {
986  if (col_indices[k] == j)
987  return row_indices[0] + k;
988  }
989 
990  // if not found, return index past the end of the matrix (cf. matrix.end() in the spirit of the STL)
991  return nonzeros_;
992  }
993 
994 public:
999  void generate_row_block_information()
1000  {
1001  viennacl::backend::typesafe_host_array<unsigned int> row_buffer(row_buffer_, rows_ + 1);
1002  viennacl::backend::memory_read(row_buffer_, 0, row_buffer.raw_size(), row_buffer.get());
1003 
1004  viennacl::backend::typesafe_host_array<unsigned int> row_blocks(row_buffer_, rows_ + 1);
1005 
1006  vcl_size_t num_entries_in_current_batch = 0;
1007 
1008  const vcl_size_t shared_mem_size = 1024; // number of column indices loaded to shared memory, number of floating point values loaded to shared memory
1009 
1010  row_block_num_ = 0;
1011  row_blocks.set(0, 0);
1012  for (vcl_size_t i=0; i<rows_; ++i)
1013  {
1014  vcl_size_t entries_in_row = vcl_size_t(row_buffer[i+1]) - vcl_size_t(row_buffer[i]);
1015  num_entries_in_current_batch += entries_in_row;
1016 
1017  if (num_entries_in_current_batch > shared_mem_size)
1018  {
1019  vcl_size_t rows_in_batch = i - row_blocks[row_block_num_];
1020  if (rows_in_batch > 0) // at least one full row is in the batch. Use current row in next batch.
1021  row_blocks.set(++row_block_num_, i--);
1022  else // row is larger than buffer in shared memory
1023  row_blocks.set(++row_block_num_, i+1);
1024  num_entries_in_current_batch = 0;
1025  }
1026  }
1027  if (num_entries_in_current_batch > 0)
1028  row_blocks.set(++row_block_num_, rows_);
1029 
1030  if (row_block_num_ > 0) //matrix might be empty...
1031  viennacl::backend::memory_create(row_blocks_,
1032  row_blocks.element_size() * (row_block_num_ + 1),
1033  viennacl::traits::context(row_buffer_), row_blocks.get());
1034 
1035  }
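// Editorial worked example: with shared_mem_size == 1024 and row lengths {600, 600, 2000, 10},
// the loop above produces row_blocks = {0, 1, 2, 3, 4}; rows 0 and 1 each form their own block
// (adding a second row would exceed 1024 entries), the long row 2 gets a block of its own, and the
// trailing short row 3 forms the last block.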
1036 
1037 private:
1038  // /** @brief Copy constructor is by now not available. */
1039  //compressed_matrix(compressed_matrix const &);
1040 
1041 private:
1042 
1043  vcl_size_t rows_;
1044  vcl_size_t cols_;
1045  vcl_size_t nonzeros_;
1046  vcl_size_t row_block_num_;
1047  handle_type row_buffer_;
1048  handle_type row_blocks_;
1049  handle_type col_buffer_;
1050  handle_type elements_;
1051 };
1052 
1058 template<typename NumericT, unsigned int AlignmentV>
1059 std::ostream & operator<<(std::ostream & os, compressed_matrix<NumericT, AlignmentV> const & A)
1060 {
1061  std::vector<std::map<unsigned int, NumericT> > tmp(A.size1());
1062  viennacl::copy(A, tmp);
1063  os << "compressed_matrix of size (" << A.size1() << ", " << A.size2() << ") with " << A.nnz() << " nonzeros:" << std::endl;
1064 
1065  for (vcl_size_t i=0; i<A.size1(); ++i)
1066  {
1067  for (typename std::map<unsigned int, NumericT>::const_iterator it = tmp[i].begin(); it != tmp[i].end(); ++it)
1068  os << " (" << i << ", " << it->first << ")\t" << it->second << std::endl;
1069  }
1070  return os;
1071 }
1072 
1073 //
1074 // Specify available operations:
1075 //
1076 
1079 namespace linalg
1080 {
1081 namespace detail
1082 {
1083  // x = A * y
1084  template<typename T, unsigned int A>
1085  struct op_executor<vector_base<T>, op_assign, vector_expression<const compressed_matrix<T, A>, const vector_base<T>, op_prod> >
1086  {
1087  static void apply(vector_base<T> & lhs, vector_expression<const compressed_matrix<T, A>, const vector_base<T>, op_prod> const & rhs)
1088  {
1089  // check for the special case x = A * x
1090  if (viennacl::traits::handle(lhs) == viennacl::traits::handle(rhs.rhs()))
1091  {
1092  viennacl::vector<T> temp(lhs);
1093  viennacl::linalg::prod_impl(rhs.lhs(), rhs.rhs(), T(1), temp, T(0));
1094  lhs = temp;
1095  }
1096  else
1097  viennacl::linalg::prod_impl(rhs.lhs(), rhs.rhs(), T(1), lhs, T(0));
1098  }
1099  };
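// Editorial note (hypothetical variable names): this executor backs user-level expressions such as
//
//   viennacl::compressed_matrix<double> A(n, n);
//   viennacl::vector<double> x(n), y(n);
//   y = viennacl::linalg::prod(A, x);   // forwards to prod_impl(A, x, 1, y, 0)
//   x = viennacl::linalg::prod(A, x);   // aliasing case, handled via the temporary above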
1100 
1101  template<typename T, unsigned int A>
1102  struct op_executor<vector_base<T>, op_inplace_add, vector_expression<const compressed_matrix<T, A>, const vector_base<T>, op_prod> >
1103  {
1104  static void apply(vector_base<T> & lhs, vector_expression<const compressed_matrix<T, A>, const vector_base<T>, op_prod> const & rhs)
1105  {
1106  // check for the special case x += A * x
1107  if (viennacl::traits::handle(lhs) == viennacl::traits::handle(rhs.rhs()))
1108  {
1109  viennacl::vector<T> temp(lhs);
1110  viennacl::linalg::prod_impl(rhs.lhs(), rhs.rhs(), T(1), temp, T(0));
1111  lhs += temp;
1112  }
1113  else
1114  viennacl::linalg::prod_impl(rhs.lhs(), rhs.rhs(), T(1), lhs, T(1));
1115  }
1116  };
1117 
1118  template<typename T, unsigned int A>
1119  struct op_executor<vector_base<T>, op_inplace_sub, vector_expression<const compressed_matrix<T, A>, const vector_base<T>, op_prod> >
1120  {
1121  static void apply(vector_base<T> & lhs, vector_expression<const compressed_matrix<T, A>, const vector_base<T>, op_prod> const & rhs)
1122  {
1123  // check for the special case x -= A * x
1124  if (viennacl::traits::handle(lhs) == viennacl::traits::handle(rhs.rhs()))
1125  {
1126  viennacl::vector<T> temp(lhs);
1127  viennacl::linalg::prod_impl(rhs.lhs(), rhs.rhs(), T(1), temp, T(0));
1128  lhs -= temp;
1129  }
1130  else
1131  viennacl::linalg::prod_impl(rhs.lhs(), rhs.rhs(), T(-1), lhs, T(1));
1132  }
1133  };
1134 
1135 
1136  // x = A * vec_op
1137  template<typename T, unsigned int A, typename LHS, typename RHS, typename OP>
1138  struct op_executor<vector_base<T>, op_assign, vector_expression<const compressed_matrix<T, A>, const vector_expression<const LHS, const RHS, OP>, op_prod> >
1139  {
1140  static void apply(vector_base<T> & lhs, vector_expression<const compressed_matrix<T, A>, const vector_expression<const LHS, const RHS, OP>, op_prod> const & rhs)
1141  {
1142  viennacl::vector<T> temp(rhs.rhs(), viennacl::traits::context(rhs));
1143  viennacl::linalg::prod_impl(rhs.lhs(), temp, lhs);
1144  }
1145  };
1146 
1147  // x += A * vec_op
1148  template<typename T, unsigned int A, typename LHS, typename RHS, typename OP>
1149  struct op_executor<vector_base<T>, op_inplace_add, vector_expression<const compressed_matrix<T, A>, vector_expression<const LHS, const RHS, OP>, op_prod> >
1150  {
1151  static void apply(vector_base<T> & lhs, vector_expression<const compressed_matrix<T, A>, vector_expression<const LHS, const RHS, OP>, op_prod> const & rhs)
1152  {
1153  viennacl::vector<T> temp(rhs.rhs(), viennacl::traits::context(rhs));
1154  viennacl::vector<T> temp_result(lhs);
1155  viennacl::linalg::prod_impl(rhs.lhs(), temp, temp_result);
1156  lhs += temp_result;
1157  }
1158  };
1159 
1160  // x -= A * vec_op
1161  template<typename T, unsigned int A, typename LHS, typename RHS, typename OP>
1162  struct op_executor<vector_base<T>, op_inplace_sub, vector_expression<const compressed_matrix<T, A>, const vector_expression<const LHS, const RHS, OP>, op_prod> >
1163  {
1164  static void apply(vector_base<T> & lhs, vector_expression<const compressed_matrix<T, A>, const vector_expression<const LHS, const RHS, OP>, op_prod> const & rhs)
1165  {
1166  viennacl::vector<T> temp(rhs.rhs(), viennacl::traits::context(rhs));
1167  viennacl::vector<T> temp_result(lhs);
1168  viennacl::linalg::prod_impl(rhs.lhs(), temp, temp_result);
1169  lhs -= temp_result;
1170  }
1171  };
1172 
1173 } // namespace detail
1174 } // namespace linalg
1176 }
1177 
1178 #endif