doc/html/spai_8cpp_source.html

 /* =========================================================================

    Copyright (c) 2010-2015, Institute for Microelectronics,

                             Institute for Analysis and Scientific Computing,

                             TU Wien.

    Portions of this software are copyright by UChicago Argonne, LLC.


                             -----------------

                   ViennaCL - The Vienna Computing Library

                             -----------------


    Project Head:    Karl Rupp                   rupp@iue.tuwien.ac.at


    (A list of authors and contributors can be found in the PDF manual)


    License:         MIT (X11), see file LICENSE in the base directory

 ============================================================================= */


 // enable Boost.uBLAS support

 #define VIENNACL_WITH_UBLAS


 #ifndef NDEBUG

  #define BOOST_UBLAS_NDEBUG

 #endif


 // System headers:

 #include <utility>

 #include <iostream>

 #include <fstream>

 #include <string>

 #include <cmath>

 #include <algorithm>

 #include <stdio.h>


 // ViennaCL headers:

 #include "viennacl/scalar.hpp"

 #include "viennacl/matrix.hpp"

 #include "viennacl/compressed_matrix.hpp"

 #include "viennacl/linalg/cg.hpp"

 #include "viennacl/linalg/bicgstab.hpp"

 #include "viennacl/linalg/prod.hpp"

 #include "viennacl/linalg/inner_prod.hpp"

 #include "viennacl/linalg/ilu.hpp"

 #include "viennacl/linalg/norm_2.hpp"

 #include "viennacl/io/matrix_market.hpp"

 #include "viennacl/linalg/spai.hpp"


 // Boost headers:

 #include "boost/numeric/ublas/vector.hpp"

 #include "boost/numeric/ublas/matrix.hpp"

 #include "boost/numeric/ublas/io.hpp"


 // auxiliary functionality:

 #include "vector-io.hpp"


 /**
 *  Solves A * x = b with the supplied solver tag and preconditioner, then
 *  reports the iteration count and the relative residual on std::cout.
 *
 *  @param A           System matrix passed to viennacl::linalg::solve() and prod()
 *  @param b           Right hand side vector
 *  @param solver_tag  Solver configuration; its iters() value is printed after the solve
 *  @param precond     Preconditioner object forwarded to the solver
 */
 template<typename MatrixT, typename VectorT, typename SolverTagT, typename PreconditionerT>
 void run_solver(MatrixT const & A, VectorT const & b, SolverTagT const & solver_tag, PreconditionerT const & precond)
 {
   // Run the preconditioned solver and report how many iterations the tag recorded:
   VectorT x = viennacl::linalg::solve(A, b, solver_tag, precond);
   std::cout << " * Solver iterations: " << solver_tag.iters() << std::endl;

   // Form A*x - b in two steps (product first, then in-place subtraction):
   VectorT defect = viennacl::linalg::prod(A, x);
   defect -= b;

   // Relative residual: ||A*x - b|| / ||b||
   std::cout << " * Rel. Residual: " << viennacl::linalg::norm_2(defect) / viennacl::linalg::norm_2(b) << std::endl;
 }


 /**
 *  Tutorial entry point: compares BiCGStab without preconditioner, with ILUT,
 *  and with the SPAI / FSPAI preconditioners on both uBLAS (host) and ViennaCL types.
 *
 *  Steps:
 *   - optionally set up two OpenCL contexts (only if VIENNACL_WITH_OPENCL is defined)
 *   - read the system matrix from a MatrixMarket file
 *   - build a right hand side of all ones and copy matrix and vector to ViennaCL objects
 *   - run the reference solvers and the four preconditioner tests
 *
 *  @return EXIT_SUCCESS on completion, EXIT_FAILURE if the matrix file cannot be read.
 */
 int main (int, const char **)
 {
   typedef float               ScalarType;
   typedef boost::numeric::ublas::compressed_matrix<ScalarType>        MatrixType;
   typedef boost::numeric::ublas::vector<ScalarType>                   VectorType;
   typedef viennacl::compressed_matrix<ScalarType>                     GPUMatrixType;
   typedef viennacl::vector<ScalarType>                                GPUVectorType;

 #ifdef VIENNACL_WITH_OPENCL
   // Optional: Customize OpenCL backend
   viennacl::ocl::platform pf = viennacl::ocl::get_platforms()[0];
   std::vector<viennacl::ocl::device> const & devices = pf.devices();

   // Optional: Set first device to first context:
   viennacl::ocl::setup_context(0, devices[0]);

   // Optional: Set second device for second context (use the same device for the second context if only one device available):
   if (devices.size() > 1)
     viennacl::ocl::setup_context(1, devices[1]);
   else
     viennacl::ocl::setup_context(1, devices[0]);

   std::cout << viennacl::ocl::current_device().info() << std::endl;
   viennacl::context ctx(viennacl::ocl::get_context(1));
 #else
   viennacl::context ctx;
 #endif

   // Keep the path in one place so that the error message can name the file:
   const char * matrix_file = "../examples/testdata/mat65k.mtx";

   MatrixType M;

   if (!viennacl::io::read_matrix_market_file(M, matrix_file))
   {
     std::cerr << "ERROR: Could not read matrix file " << matrix_file << std::endl;
     // Return instead of exit() so that the objects created above are destroyed properly:
     return EXIT_FAILURE;
   }

   std::cout << "Size of matrix: " << M.size1() << std::endl;
   std::cout << "Avg. Entries per row: " << double(M.nnz()) / static_cast<double>(M.size1()) << std::endl;

   // Right hand side of all ones. It has one entry per matrix row (size1()),
   // matching gpu_rhs below and the residual computation prod(M, x) - rhs.
   VectorType rhs(M.size1());
   for (std::size_t i=0; i<rhs.size(); ++i)
     rhs(i) = ScalarType(1);

   // Create the ViennaCL counterparts in the selected context and copy the data over:
   GPUMatrixType  gpu_M(M.size1(), M.size2(), ctx);
   GPUVectorType  gpu_rhs(M.size1(), ctx);
   viennacl::copy(M, gpu_M);
   viennacl::copy(rhs, gpu_rhs);

   viennacl::linalg::bicgstab_tag solver_tag(1e-10, 50); //for simplicity and reasonably short execution times we use only 50 iterations here

   std::cout << "--- Reference 1: Pure BiCGStab on CPU ---" << std::endl;
   VectorType result = viennacl::linalg::solve(M, rhs, solver_tag);
   std::cout << " * Solver iterations: " << solver_tag.iters() << std::endl;
   VectorType residual = viennacl::linalg::prod(M, result) - rhs;
   std::cout << " * Rel. Residual: " << viennacl::linalg::norm_2(residual) / viennacl::linalg::norm_2(rhs) << std::endl;

   std::cout << "--- Reference 2: Pure BiCGStab on GPU ---" << std::endl;
   GPUVectorType gpu_result = viennacl::linalg::solve(gpu_M, gpu_rhs, solver_tag);
   std::cout << " * Solver iterations: " << solver_tag.iters() << std::endl;
   GPUVectorType gpu_residual = viennacl::linalg::prod(gpu_M, gpu_result);
   gpu_residual -= gpu_rhs;
   std::cout << " * Rel. Residual: " << viennacl::linalg::norm_2(gpu_residual) / viennacl::linalg::norm_2(gpu_rhs) << std::endl;

   // Third reference run (the label previously repeated "Reference 2"):
   std::cout << "--- Reference 3: BiCGStab with ILUT on CPU ---" << std::endl;
   std::cout << " * Preconditioner setup..." << std::endl;
   viennacl::linalg::ilut_precond<MatrixType> ilut(M, viennacl::linalg::ilut_tag());
   std::cout << " * Iterative solver run..." << std::endl;
   run_solver(M, rhs, solver_tag, ilut);

   std::cout << "--- Test 1: CPU-based SPAI ---" << std::endl;
   std::cout << " * Preconditioner setup..." << std::endl;
   viennacl::linalg::spai_precond<MatrixType> spai_cpu(M, viennacl::linalg::spai_tag(1e-3, 3, 5e-2));
   std::cout << " * Iterative solver run..." << std::endl;
   run_solver(M, rhs, solver_tag, spai_cpu);

   std::cout << "--- Test 2: CPU-based FSPAI ---" << std::endl;
   std::cout << " * Preconditioner setup..." << std::endl;
   viennacl::linalg::fspai_precond<MatrixType> fspai_cpu(M, viennacl::linalg::fspai_tag());
   std::cout << " * Iterative solver run..." << std::endl;
   run_solver(M, rhs, solver_tag, fspai_cpu);

   std::cout << "--- Test 3: GPU-based SPAI ---" << std::endl;
   std::cout << " * Preconditioner setup..." << std::endl;
   viennacl::linalg::spai_precond<GPUMatrixType> spai_gpu(gpu_M, viennacl::linalg::spai_tag(1e-3, 3, 5e-2));
   std::cout << " * Iterative solver run..." << std::endl;
   run_solver(gpu_M, gpu_rhs, solver_tag, spai_gpu);

   std::cout << "--- Test 4: GPU-based FSPAI ---" << std::endl;
   std::cout << " * Preconditioner setup..." << std::endl;
   viennacl::linalg::fspai_precond<GPUMatrixType> fspai_gpu(gpu_M, viennacl::linalg::fspai_tag());
   std::cout << " * Iterative solver run..." << std::endl;
   run_solver(gpu_M, gpu_rhs, solver_tag, fspai_gpu);

   std::cout << "!!!! TUTORIAL COMPLETED SUCCESSFULLY !!!!" << std::endl;

   return EXIT_SUCCESS;
 }


viennacl::linalg::norm_2
T norm_2(std::vector< T, A > const &v1)
Definition: norm_2.hpp:96

matrix_market.hpp
A reader and writer for the matrix market format is implemented here.

viennacl::ocl::get_platforms
std::vector< platform > get_platforms()
Definition: platform.hpp:124

norm_2.hpp
Generic interface for the l^2-norm. See viennacl/linalg/vector_operations.hpp for implementations...

viennacl::ocl::platform
Wrapper class for an OpenCL platform.
Definition: platform.hpp:45

prod.hpp
Generic interface for matrix-vector and matrix-matrix products. See viennacl/linalg/vector_operations...

matrix.hpp
Implementation of the dense matrix class.

main
int main()
Definition: bisect.cpp:91

viennacl::ocl::platform::devices
std::vector< device > devices(cl_device_type dtype=CL_DEVICE_TYPE_DEFAULT)
Returns the available devices of the supplied device type.
Definition: platform.hpp:91

bicgstab.hpp
The stabilized bi-conjugate gradient method is implemented here.

vector-io.hpp

viennacl::linalg::detail::spai::spai_tag
A tag for SPAI.
Definition: spai_tag.hpp:64

viennacl::ocl::current_device
viennacl::ocl::device const & current_device()
Convenience function for returning the active device in the current context.
Definition: backend.hpp:351

inner_prod.hpp
Generic interface for the computation of inner products. See viennacl/linalg/vector_operations.hpp for implementations.

viennacl::linalg::solve
VectorT solve(MatrixT const &matrix, VectorT const &rhs, bicgstab_tag const &tag, PreconditionerT const &precond)
Definition: bicgstab.hpp:496

viennacl::ocl::device::info
std::string info(vcl_size_t indent=0, char indent_char= ' ') const
Returns an info string with a few properties of the device. Use full_info() to get all details...
Definition: device.hpp:995

viennacl::context
Represents a generic 'context' similar to an OpenCL context, but is backend-agnostic and thus also su...
Definition: context.hpp:39

viennacl::linalg::prod
VectorT prod(std::vector< std::vector< T, A1 >, A2 > const &matrix, VectorT const &vector)
Definition: prod.hpp:102

viennacl::linalg::detail::spai::fspai_tag
A tag for FSPAI. Experimental.
Definition: fspai.hpp:71

ilu.hpp
Implementations of incomplete factorization preconditioners. Convenience header file.

viennacl::linalg::fspai_precond
Implementation of the Factored SParse Approximate Inverse Algorithm for a generic, uBLAS-compatible matrix type.
Definition: spai.hpp:189

viennacl::linalg::ilut_tag
A tag for incomplete LU factorization with threshold (ILUT)
Definition: ilut.hpp:45

compressed_matrix.hpp
Implementation of the compressed_matrix class.

viennacl::linalg::spai_precond
Implementation of the SParse Approximate Inverse Algorithm for a generic, uBLAS-compatible matrix typ...
Definition: spai.hpp:75

run_solver
void run_solver(MatrixType const &matrix, VectorType const &rhs, VectorType const &ref_result, SolverTag const &solver, PrecondTag const &precond, long ops)
Definition: solver.cpp:101

viennacl::linalg::ilut_precond
ILUT preconditioner class, can be supplied to solve()-routines.
Definition: ilut.hpp:352

cg.hpp
The conjugate gradient method is implemented here.

viennacl::vector< ScalarType >

viennacl::copy
void copy(std::vector< NumericT > &cpu_vec, circulant_matrix< NumericT, AlignmentV > &gpu_mat)
Copies a circulant matrix from the std::vector to the OpenCL device (either GPU or multi-core CPU) ...
Definition: circulant_matrix.hpp:150

ScalarType
float ScalarType
Definition: fft_1d.cpp:42

spai.hpp
Main include file for the sparse approximate inverse preconditioner family (SPAI and FSPAI)...

viennacl::compressed_matrix
A sparse square matrix in compressed sparse rows format.
Definition: compressed_matrix.hpp:559

viennacl::linalg::bicgstab_tag
A tag for the stabilized Bi-conjugate gradient solver. Used for supplying solver parameters and for d...
Definition: bicgstab.hpp:47

viennacl::io::read_matrix_market_file
long read_matrix_market_file(MatrixT &mat, const char *file, long index_base=1)
Reads a sparse matrix from a file (MatrixMarket format)
Definition: matrix_market.hpp:339

viennacl::ocl::get_context
viennacl::ocl::context & get_context(long i)
Convenience function for returning the current context.
Definition: backend.hpp:225

scalar.hpp
Implementation of the ViennaCL scalar class.

viennacl::ocl::setup_context
void setup_context(long i, std::vector< cl_device_id > const &devices)
Convenience function for setting devices for a context.
Definition: backend.hpp:231