doc/html/opencl_2matrix__operations_8hpp_source.html

 #ifndef VIENNACL_LINALG_OPENCL_MATRIX_OPERATIONS_HPP_

 #define VIENNACL_LINALG_OPENCL_MATRIX_OPERATIONS_HPP_


 /* =========================================================================

    Copyright (c) 2010-2015, Institute for Microelectronics,

                             Institute for Analysis and Scientific Computing,

                             TU Wien.

    Portions of this software are copyright by UChicago Argonne, LLC.


                             -----------------

                   ViennaCL - The Vienna Computing Library

                             -----------------


    Project Head:    Karl Rupp                   rupp@iue.tuwien.ac.at


    (A list of authors and contributors can be found in the manual)


    License:         MIT (X11), see file LICENSE in the base directory

 ============================================================================= */


 #include "viennacl/forwards.h"


 #include "viennacl/ocl/device.hpp"

 #include "viennacl/ocl/handle.hpp"

 #include "viennacl/ocl/kernel.hpp"

 #include "viennacl/scalar.hpp"

 #include "viennacl/vector.hpp"

 #include "viennacl/vector_proxy.hpp"

 #include "viennacl/tools/tools.hpp"

 #include "viennacl/meta/enable_if.hpp"

 #include "viennacl/meta/predicate.hpp"

 #include "viennacl/meta/result_of.hpp"


 #include "viennacl/scheduler/forwards.h"


 #include "viennacl/traits/size.hpp"

 #include "viennacl/traits/start.hpp"

 #include "viennacl/traits/handle.hpp"

 #include "viennacl/traits/stride.hpp"


 #include "viennacl/linalg/opencl/common.hpp"

 #include "viennacl/linalg/opencl/kernels/svd.hpp"


 #include "viennacl/linalg/opencl/kernels/matrix.hpp"


 namespace viennacl

 {

 namespace linalg

 {

 namespace opencl

 {


 namespace detail

 {


   /** @brief Returns the kernel called kernel_name from the legacy matrix program that matches the memory layout of M.
   *
   * The matrix_legacy kernel class for the layout of M is initialized for the OpenCL context of M before the lookup.
   *
   * @param M            Matrix whose OpenCL context and layout (row-/column-major) select the program
   * @param kernel_name  Name of the kernel inside that program
   */
   template<typename NumericT>
   viennacl::ocl::kernel & legacy_kernel_for_matrix(matrix_base<NumericT> const & M, std::string const & kernel_name)
   {
     typedef viennacl::linalg::opencl::kernels::matrix_legacy<NumericT, row_major>     RowMajorKernels;
     typedef viennacl::linalg::opencl::kernels::matrix_legacy<NumericT, column_major>  ColumnMajorKernels;

     viennacl::ocl::context & ctx = traits::opencl_context(M);

     if (M.row_major())
     {
       RowMajorKernels::init(ctx);
       return ctx.get_program(RowMajorKernels::program_name()).get_kernel(kernel_name);
     }

     ColumnMajorKernels::init(ctx);
     return ctx.get_program(ColumnMajorKernels::program_name()).get_kernel(kernel_name);
   }


 }


 //

 // Introductory note: By convention, all dimensions are already checked in the dispatcher frontend, so there is no need to check them again in here.

 //


 // Names of the kernels that the SVD-related routines in this file look up in the SVD OpenCL program.
 const std::string SVD_BIDIAG_PACK_KERNEL("bidiag_pack");
 const std::string SVD_HOUSEHOLDER_UPDATE_A_LEFT_KERNEL("house_update_A_left");
 const std::string SVD_HOUSEHOLDER_UPDATE_A_RIGHT_KERNEL("house_update_A_right");
 const std::string SVD_HOUSEHOLDER_UPDATE_QL_KERNEL("house_update_QL");
 const std::string SVD_GIVENS_NEXT_KERNEL("givens_next");
 const std::string SVD_COPY_COL_KERNEL("copy_col");
 const std::string SVD_COPY_ROW_KERNEL("copy_row");


 /** @brief Launches the OpenCL type-conversion kernel for the matrix pair (dest, src).
 *
 * The kernel name is assembled as "convert_<row|col>_<dest type>_<src type>", where the type strings
 * come from viennacl::ocl::type_to_string. Both matrices must use the same memory layout and reside in
 * the same OpenCL context; this is checked by assert only.
 *
 * @param dest  Destination matrix (numeric type DestNumericT)
 * @param src   Source matrix (numeric type SrcNumericT)
 */
 template<typename DestNumericT, typename SrcNumericT>
 void convert(matrix_base<DestNumericT> & dest, matrix_base<SrcNumericT> const & src)
 {
   typedef viennacl::linalg::opencl::kernels::matrix_convert  KernelClass;

   // The message names the operation actually performed here (a conversion, not an addition/subtraction).
   assert(dest.row_major() == src.row_major() && bool("Conversion between mixed matrix layouts not supported yet!"));

   assert(viennacl::traits::opencl_handle(dest).context() == viennacl::traits::opencl_handle(src).context() && bool("Matrices do not reside in the same OpenCL context. Automatic migration not yet supported!"));

   std::string kernel_name("convert_");
   kernel_name += dest.row_major() ? "row_" : "col_";
   kernel_name += viennacl::ocl::type_to_string<DestNumericT>::apply();
   kernel_name += "_";
   kernel_name += viennacl::ocl::type_to_string<SrcNumericT>::apply();

   // The handle only exposes a const context; kernel initialization and lookup need a mutable one.
   viennacl::ocl::context & ctx = const_cast<viennacl::ocl::context &>(viennacl::traits::opencl_handle(dest).context());
   KernelClass::init(ctx);
   viennacl::ocl::kernel& k = ctx.get_kernel(KernelClass::program_name(), kernel_name);

   viennacl::ocl::enqueue(k( dest, cl_uint(dest.start1()), cl_uint(dest.stride1()), cl_uint(dest.size1()), cl_uint(dest.internal_size1()), cl_uint(dest.start2()), cl_uint(dest.stride2()), cl_uint(dest.size2()), cl_uint(dest.internal_size2()),
                             src,  cl_uint( src.start1()), cl_uint( src.stride1()), cl_uint( src.size1()), cl_uint( src.internal_size1()), cl_uint( src.start2()), cl_uint( src.stride2()), cl_uint( src.size2()), cl_uint( src.internal_size2())
                         ) );
 }


 /** @brief Executes the 'assign' kernel for one scaled matrix operand.
 *
 * The statement is built by scheduler::preset::av() with OPERATION_BINARY_ASSIGN_TYPE from A, B and alpha.
 * The kernel name is "assign_<h|d>m_<f><r>00": 'h' if ScalarT1 is a CPU scalar and 'd' otherwise,
 * followed by the sign-flip digit and the reciprocal digit for alpha.
 *
 * @param A                 Result matrix
 * @param B                 Matrix operand (must have the same layout as A)
 * @param alpha             Scalar applied to B
 * @param reciprocal_alpha  Forwarded to the scheduler preset; encoded in the kernel name
 * @param flip_sign_alpha   Forwarded to the scheduler preset; encoded in the kernel name
 */
 template<typename NumericT,
          typename ScalarT1>
 void am(matrix_base<NumericT> & A,
         matrix_base<NumericT> const & B, ScalarT1 const & alpha, vcl_size_t /* len_alpha */, bool reciprocal_alpha, bool flip_sign_alpha)
 {
   typedef kernels::matrix<NumericT>  KernelClass;

   assert(A.row_major() == B.row_major() && bool("Addition/subtraction on mixed matrix layouts not supported yet!"));

   std::string kernel_name("assign_");
   kernel_name += is_cpu_scalar<ScalarT1>::value ? 'h' : 'd';
   kernel_name += "m_";
   kernel_name += flip_sign_alpha  ? '1' : '0';
   kernel_name += reciprocal_alpha ? '1' : '0';
   kernel_name += "00";

   scheduler::statement stmt = scheduler::preset::av(scheduler::OPERATION_BINARY_ASSIGN_TYPE, &A, &B, &alpha, flip_sign_alpha, reciprocal_alpha);
   KernelClass::execution_handler(A.row_major(), viennacl::traits::opencl_context(A)).execute(kernel_name, stmt);
 }


 /** @brief Executes the 'assign' kernel for two scaled matrix operands.
 *
 * The statement is built by scheduler::preset::avbv() with OPERATION_BINARY_ASSIGN_TYPE.
 * The kernel name is "assign_<h|d>m<h|d>m_<fa><ra><fb><rb>": one host/device letter per scalar,
 * followed by the sign-flip and reciprocal digits for alpha and then for beta.
 *
 * @param A      Result matrix
 * @param B      First matrix operand, scaled by alpha
 * @param C      Second matrix operand, scaled by beta
 */
 template<typename NumericT,
           typename ScalarT1, typename ScalarT2>
 void ambm(matrix_base<NumericT> & A,
           matrix_base<NumericT> const & B, ScalarT1 const & alpha, vcl_size_t /* len_alpha */, bool reciprocal_alpha, bool flip_sign_alpha,
           matrix_base<NumericT> const & C, ScalarT2 const & beta,  vcl_size_t /* len_beta */,  bool reciprocal_beta,  bool flip_sign_beta)
 {
   typedef kernels::matrix<NumericT>  KernelClass;

   assert(A.row_major() == B.row_major() && A.row_major() == C.row_major() && bool("Addition/subtraction on mixed matrix layouts not supported yet!"));

   std::string kernel_name("assign_");
   kernel_name += is_cpu_scalar<ScalarT1>::value ? 'h' : 'd';
   kernel_name += 'm';
   kernel_name += is_cpu_scalar<ScalarT2>::value ? 'h' : 'd';
   kernel_name += "m_";
   kernel_name += flip_sign_alpha  ? '1' : '0';
   kernel_name += reciprocal_alpha ? '1' : '0';
   kernel_name += flip_sign_beta   ? '1' : '0';
   kernel_name += reciprocal_beta  ? '1' : '0';

   scheduler::statement stmt = scheduler::preset::avbv(scheduler::OPERATION_BINARY_ASSIGN_TYPE, &A, &B, &alpha, flip_sign_alpha, reciprocal_alpha, &C, &beta, flip_sign_beta, reciprocal_beta);
   KernelClass::execution_handler(A.row_major(), viennacl::traits::opencl_context(A)).execute(kernel_name, stmt);
 }


 /** @brief Executes the in-place-add kernel for two scaled matrix operands.
 *
 * The statement is built by scheduler::preset::avbv() with OPERATION_BINARY_INPLACE_ADD_TYPE.
 * The kernel name is "ip_add_<h|d>v<h|d>v_<fa><ra><fb><rb>": one host/device letter per scalar,
 * followed by the sign-flip and reciprocal digits for alpha and then for beta.
 *
 * @param A      Matrix that is updated in place
 * @param B      First matrix operand, scaled by alpha
 * @param C      Second matrix operand, scaled by beta
 */
 template<typename NumericT,
           typename ScalarT1, typename ScalarT2>
 void ambm_m(matrix_base<NumericT> & A,
             matrix_base<NumericT> const & B, ScalarT1 const & alpha, vcl_size_t /* len_alpha */, bool reciprocal_alpha, bool flip_sign_alpha,
             matrix_base<NumericT> const & C, ScalarT2 const & beta,  vcl_size_t /* len_beta */,  bool reciprocal_beta,  bool flip_sign_beta)
 {
   typedef kernels::matrix<NumericT>  KernelClass;

   assert(A.row_major() == B.row_major() && A.row_major() == C.row_major() && bool("Addition/subtraction on mixed matrix layouts not supported yet!"));

   std::string kernel_name("ip_add_");
   kernel_name += is_cpu_scalar<ScalarT1>::value ? 'h' : 'd';
   kernel_name += 'v';
   kernel_name += is_cpu_scalar<ScalarT2>::value ? 'h' : 'd';
   kernel_name += "v_";
   kernel_name += flip_sign_alpha  ? '1' : '0';
   kernel_name += reciprocal_alpha ? '1' : '0';
   kernel_name += flip_sign_beta   ? '1' : '0';
   kernel_name += reciprocal_beta  ? '1' : '0';

   scheduler::statement stmt = scheduler::preset::avbv(scheduler::OPERATION_BINARY_INPLACE_ADD_TYPE, &A, &B, &alpha, flip_sign_alpha, reciprocal_alpha, &C, &beta, flip_sign_beta, reciprocal_beta);
   KernelClass::execution_handler(A.row_major(), viennacl::traits::opencl_context(A)).execute(kernel_name, stmt);
 }


 template<typename NumericT,

           typename SizeT, typename DistanceT>

 void trans(const matrix_expression<const matrix_base<NumericT, SizeT, DistanceT>,const matrix_base<NumericT, SizeT, DistanceT>, op_trans> & proxy,

            matrix_base<NumericT> & temp_trans)

 {

   std::string kernel_name("trans_kernel");

   viennacl::ocl::kernel& kernel = detail::legacy_kernel_for_matrix(proxy.lhs(),kernel_name);

   viennacl::ocl::enqueue(kernel(proxy.lhs(),

                                 static_cast<cl_uint>(proxy.lhs().start1()),         static_cast<cl_uint>(proxy.lhs().start2()),

                                 static_cast<cl_uint>(proxy.lhs().internal_size1()), static_cast<cl_uint>(proxy.lhs().internal_size2()),

                                 static_cast<cl_uint>(proxy.lhs().size1()),          static_cast<cl_uint>(proxy.lhs().size2()),

                                 static_cast<cl_uint>(proxy.lhs().stride1()),        static_cast<cl_uint>(proxy.lhs().stride2()),


                                 temp_trans,

                                 static_cast<cl_uint>(temp_trans.start1()),         static_cast<cl_uint>(temp_trans.start2()),

                                 static_cast<cl_uint>(temp_trans.internal_size1()), static_cast<cl_uint>(temp_trans.internal_size2()),

                                 static_cast<cl_uint>(temp_trans.stride1()),        static_cast<cl_uint>(temp_trans.stride2())));

 }


 /** @brief Assigns the scalar s to the matrix A via the "assign_cpu" kernel template.
 *
 * A scalar_matrix with the dimensions and context of A is used as right-hand side of the statement.
 *
 * @param A                    Matrix to be written
 * @param s                    Value to assign
 * @param up_to_internal_size  Forwarded to the matrix_axpy_template of "assign_cpu" before execution
 */
 template<typename NumericT>
 void matrix_assign(matrix_base<NumericT> & A, NumericT s, bool up_to_internal_size = false)
 {
   scalar_matrix<NumericT> B(viennacl::traits::size1(A),viennacl::traits::size2(A),s,viennacl::traits::context(A));
   scheduler::statement statement = scheduler::preset::assign_cpu(&A, &B);

   // dynamic_cast yields a null pointer if the registered template has a different type; catch that before dereferencing.
   device_specific::matrix_axpy_template * assign_template =
     dynamic_cast<device_specific::matrix_axpy_template*>(kernels::matrix<NumericT>::execution_handler(A.row_major(), viennacl::traits::opencl_context(A)).template_of("assign_cpu"));
   assert(assign_template && bool("Kernel template 'assign_cpu' is not a matrix_axpy_template!"));
   assign_template->up_to_internal_size(up_to_internal_size);

   kernels::matrix<NumericT>::execution_handler(A.row_major(), viennacl::traits::opencl_context(A)).execute("assign_cpu", statement);
 }


 /** @brief Executes the "diagonal_assign_cpu" kernel for A with a scalar vector holding the value s.
 *
 * The scalar vector has min(size1(A), size2(A)) entries.
 *
 * @param A  Matrix to be written
 * @param s  Value used to build the scalar vector
 */
 template<typename NumericT>
 void matrix_diagonal_assign(matrix_base<NumericT> & A, NumericT s)
 {
   typedef kernels::matrix<NumericT>  KernelClass;

   viennacl::scalar_vector<NumericT> diag_values(std::min(viennacl::traits::size1(A), viennacl::traits::size2(A)), s);

   scheduler::statement stmt = scheduler::preset::diagonal_assign_cpu(&A, &diag_values);
   KernelClass::execution_handler(A.row_major(), viennacl::traits::opencl_context(A)).execute("diagonal_assign_cpu", stmt);
 }


 template<typename NumericT>

 void matrix_diag_from_vector(const vector_base<NumericT> & vec, int k, matrix_base<NumericT> & A)

 {

   scheduler::statement statement = scheduler::preset::matrix_diag_from_vector(&vec, &A, k);

   kernels::matrix<NumericT>::execution_handler(A.row_major(), viennacl::traits::opencl_context(A)).execute("matrix_diag_from_vector", statement);

 }


 template<typename NumericT>

 void matrix_diag_to_vector(const matrix_base<NumericT> & A, int k, vector_base<NumericT> & vec)

 {

   scheduler::statement statement = scheduler::preset::matrix_diag_to_vector(&vec, &A, k);

   kernels::matrix<NumericT>::execution_handler(A.row_major(), viennacl::traits::opencl_context(A)).execute("matrix_diag_to_vector", statement);

 }


 template<typename NumericT>

 void matrix_row(const matrix_base<NumericT> & A, unsigned int i, vector_base<NumericT> & vec)

 {

   scheduler::statement statement = scheduler::preset::matrix_row(&vec, &A, i);

   kernels::matrix<NumericT>::execution_handler(A.row_major(), viennacl::traits::opencl_context(A)).execute("matrix_row", statement);

 }


 template<typename NumericT>

 void matrix_column(const matrix_base<NumericT> & A, unsigned int j, vector_base<NumericT> & vec)

 {

   scheduler::statement statement = scheduler::preset::matrix_column(&vec, &A, j);

   kernels::matrix<NumericT>::execution_handler(A.row_major(), viennacl::traits::opencl_context(A)).execute("matrix_column", statement);

 }


 //

 //


 // Binary operations A = B .* C and A = B ./ C

 /** @brief Executes an element-wise binary operation on two matrices and stores the result in A.
 *
 * The operation is identified by the scheduler node type of op_element_binary<OpT>; the kernel is
 * looked up under the operator string of that node type. All three matrices must share the same
 * layout and OpenCL context (checked by assert only).
 *
 * @param A      Result matrix
 * @param proxy  Expression holding the two operands (lhs and rhs)
 */
 template<typename NumericT, typename OpT>
 void element_op(matrix_base<NumericT> & A,
                 matrix_expression<const matrix_base<NumericT>, const matrix_base<NumericT>, op_element_binary<OpT> > const & proxy)
 {
   typedef kernels::matrix_element<NumericT>  KernelClass;

   assert(A.row_major() == proxy.lhs().row_major() && bool("Elementwise operations on mixed matrix layouts not supported yet!"));
   assert(A.row_major() == proxy.rhs().row_major() && bool("Elementwise operations on mixed matrix layouts not supported yet!"));
   assert(viennacl::traits::opencl_handle(A).context() == viennacl::traits::opencl_handle(proxy.lhs()).context() && bool("Matrices do not reside in the same OpenCL context. Automatic migration not yet supported!"));
   assert(viennacl::traits::opencl_handle(A).context() == viennacl::traits::opencl_handle(proxy.rhs()).context() && bool("Matrices do not reside in the same OpenCL context. Automatic migration not yet supported!"));

   scheduler::operation_node_type op_type = static_cast<scheduler::operation_node_type>(scheduler::result_of::op_type_info<op_element_binary<OpT> >::id);

   scheduler::statement stmt = scheduler::preset::binary_element_op(&A, &proxy.lhs(), &proxy.rhs(), op_type);
   KernelClass::execution_handler(A.row_major(), viennacl::traits::opencl_context(A))
              .execute(device_specific::tree_parsing::operator_string(op_type), stmt);
 }


 // Unary operations


 /** @brief Executes an element-wise unary operation on a matrix and stores the result in A.
 *
 * The operation is identified by the scheduler node type of op_element_unary<OpT>; the kernel is
 * looked up under the operator string of that node type. Only proxy.lhs() enters the statement,
 * but layout and context of both proxy.lhs() and proxy.rhs() are checked by assert.
 *
 * @param A      Result matrix
 * @param proxy  Expression holding the operand
 */
 template<typename NumericT, typename OpT>
 void element_op(matrix_base<NumericT> & A,
                 matrix_expression<const matrix_base<NumericT>, const matrix_base<NumericT>, op_element_unary<OpT> > const & proxy)
 {
   typedef kernels::matrix_element<NumericT>  KernelClass;

   assert(A.row_major() == proxy.lhs().row_major() && bool("Elementwise operations on mixed matrix layouts not supported yet!"));
   assert(A.row_major() == proxy.rhs().row_major() && bool("Elementwise operations on mixed matrix layouts not supported yet!"));

   assert(viennacl::traits::opencl_handle(A).context() == viennacl::traits::opencl_handle(proxy.lhs()).context() && bool("Matrices do not reside in the same OpenCL context. Automatic migration not yet supported!"));
   assert(viennacl::traits::opencl_handle(A).context() == viennacl::traits::opencl_handle(proxy.rhs()).context() && bool("Matrices do not reside in the same OpenCL context. Automatic migration not yet supported!"));

   scheduler::operation_node_type op_type = static_cast<scheduler::operation_node_type>(scheduler::result_of::op_type_info<op_element_unary<OpT> >::id);

   scheduler::statement stmt = scheduler::preset::unary_element_op(&A, &proxy.lhs(), op_type);
   KernelClass::execution_handler(A.row_major(), viennacl::traits::opencl_context(A))
              .execute(device_specific::tree_parsing::operator_string(op_type), stmt);
 }


 template<typename NumericT>

 void prod_impl(const matrix_base<NumericT> & A, bool trans_A,

                const vector_base<NumericT> & vec,

                      vector_base<NumericT> & result)

 {

   // Inplace matrix-vector products like x = prod(A, x) are currently illegal: Introduce a temporary like y = prod(A, x); x = y; instead

   assert(viennacl::traits::handle(vec) != viennacl::traits::handle(result) && bool("No direct inplace matrix-vector product possible. Introduce a temporary!"));


   std::string kernel_name = std::string("mat_vec_") + (trans_A ^ A.row_major()?"T":"N");

   scheduler::statement statement = scheduler::preset::mat_vec_prod(&A, trans_A, &vec, &result);

   kernels::row_wise_reduction<NumericT>::execution_handler(viennacl::traits::opencl_context(A)).execute(kernel_name, statement);

 }


 //


 /** @brief Executes the matrix-matrix product kernel for A and B with result C.
 *
 * For each operand the requested transposition is combined (XOR) with its row-major flag; the resulting
 * flags select the kernel "prod_<N|T><N|T>" and are also what is passed to scheduler::preset::mat_mat_prod().
 * The kernel is taken from the handler matching the layout and OpenCL context of C.
 *
 * @param A        First factor
 * @param A_trans  Whether A is to be transposed
 * @param B        Second factor
 * @param B_trans  Whether B is to be transposed
 * @param C        Result matrix
 * @param alpha    Scalar forwarded to the preset (presumably scales the product)
 * @param beta     Scalar forwarded to the preset (presumably scales the previous content of C)
 */
 template<typename NumericT, typename ScalarType >
 void prod_impl(matrix_base<NumericT> const & A, bool A_trans,
                matrix_base<NumericT> const & B, bool B_trans,
                matrix_base<NumericT>       & C,
                ScalarType alpha,
                ScalarType beta)
 {
     typedef kernels::matrix_prod<NumericT>  KernelClass;

     bool const effective_A_trans = A_trans ^ A.row_major();
     bool const effective_B_trans = B_trans ^ B.row_major();

     // Start from the non-transposed name and flip the letter for each effectively transposed operand.
     std::string kernel_prefix("prod_NN");
     if (effective_A_trans)
       kernel_prefix[5] = 'T';
     if (effective_B_trans)
       kernel_prefix[6] = 'T';

     scheduler::statement stmt = scheduler::preset::mat_mat_prod(alpha, &A, effective_A_trans, &B, effective_B_trans, beta, &C);
     KernelClass::execution_handler(C.row_major(), viennacl::traits::opencl_context(C)).execute(kernel_prefix, stmt);
 }


 //

 //


 /** @brief Launches the legacy scaled rank-1 update kernel for A with the scalar alpha and the vectors vec1, vec2.
 *
 * The kernel "scaled_rank1_update_cpu" is used if ScalarT1 is a CPU scalar, "scaled_rank1_update_gpu" otherwise.
 * size1(A) must equal size(vec1) and size2(A) must equal size(vec2) (checked by assert only).
 *
 * @param A                 Matrix to be updated
 * @param alpha             Scaling factor (host or device scalar)
 * @param len_alpha         Packed into the options word via detail::make_options()
 * @param reciprocal_alpha  Packed into the options word via detail::make_options()
 * @param flip_sign_alpha   Packed into the options word via detail::make_options()
 * @param vec1              First vector
 * @param vec2              Second vector
 */
 template<typename NumericT, typename ScalarT1>
 void scaled_rank_1_update(matrix_base<NumericT> & A,
                           ScalarT1 const & alpha, vcl_size_t len_alpha, bool reciprocal_alpha, bool flip_sign_alpha,
                           const vector_base<NumericT> & vec1,
                           const vector_base<NumericT> & vec2)
 {
   assert( (viennacl::traits::size1(A) == viennacl::traits::size(vec1)) && bool("Size mismatch in scaled_rank_1_update: size1(A) != size(v1)"));
   assert( (viennacl::traits::size2(A) == viennacl::traits::size(vec2)) && bool("Size mismatch in scaled_rank_1_update: size2(A) != size(v2)"));

   cl_uint options_alpha = detail::make_options(len_alpha, reciprocal_alpha, flip_sign_alpha);

   std::string const kernel_name(viennacl::is_cpu_scalar<ScalarT1>::value ? "scaled_rank1_update_cpu" : "scaled_rank1_update_gpu");
   viennacl::ocl::kernel & update_kernel = detail::legacy_kernel_for_matrix(A, kernel_name);

   viennacl::ocl::enqueue(update_kernel(viennacl::traits::opencl_handle(A),
                                        cl_uint(viennacl::traits::start1(A)),           cl_uint(viennacl::traits::start2(A)),
                                        cl_uint(viennacl::traits::stride1(A)),          cl_uint(viennacl::traits::stride2(A)),
                                        cl_uint(viennacl::traits::size1(A)),            cl_uint(viennacl::traits::size2(A)),
                                        cl_uint(viennacl::traits::internal_size1(A)),   cl_uint(viennacl::traits::internal_size2(A)),

                                        viennacl::traits::opencl_handle(viennacl::tools::promote_if_host_scalar<NumericT>(alpha)),
                                        options_alpha,

                                        viennacl::traits::opencl_handle(vec1),
                                        cl_uint(viennacl::traits::start(vec1)),
                                        cl_uint(viennacl::traits::stride(vec1)),
                                        cl_uint(viennacl::traits::size(vec1)),

                                        viennacl::traits::opencl_handle(vec2),
                                        cl_uint(viennacl::traits::start(vec2)),
                                        cl_uint(viennacl::traits::stride(vec2)),
                                        cl_uint(viennacl::traits::size(vec2))
                                       )
                         );
 }


 //

 /** @brief Runs the "bidiag_pack" SVD kernel on A and copies the two resulting device vectors to dh and sh.
 *
 * Two temporary device vectors with the sizes of dh and sh are handed to the kernel and afterwards
 * transferred to dh and sh with fast_copy().
 *
 * @param A   Input matrix
 * @param dh  Receives the first kernel output vector (presumably the diagonal)
 * @param sh  Receives the second kernel output vector (presumably the superdiagonal)
 */
 template <typename SCALARTYPE, typename VectorType>
 void bidiag_pack_svd(viennacl::matrix<SCALARTYPE>& A,
                  VectorType & dh,
                  VectorType & sh
                 )
 {
   typedef viennacl::linalg::opencl::kernels::svd<SCALARTYPE>  KernelClass;

   viennacl::vector<SCALARTYPE> D(dh.size());
   viennacl::vector<SCALARTYPE> S(sh.size());

   viennacl::ocl::context & ctx = const_cast<viennacl::ocl::context &>(viennacl::traits::opencl_handle(A).context());

   // Make sure the SVD program is available in this context before looking up the kernel,
   // as all other SVD routines in this file do.
   KernelClass::init(ctx);
   viennacl::ocl::kernel& kernel = ctx.get_kernel(KernelClass::program_name(), SVD_BIDIAG_PACK_KERNEL);

   viennacl::ocl::enqueue(kernel(
                                 A,
                                 D,
                                 S,
                                 static_cast<cl_uint>(A.size1()),
                                 static_cast<cl_uint>(A.size2()),
                                 static_cast<cl_uint>(A.internal_size2())
                               ));

   fast_copy(D, dh);
   fast_copy(S, sh);
 }


 /** @brief Runs the "bidiag_pack" SVD kernel on A with the device vectors dh and sh.
 *
 * The SVD program matching the layout of A (row- or column-major) is initialized and used.
 *
 * @param A   Input matrix
 * @param dh  First vector handed to the kernel (presumably receives the diagonal)
 * @param sh  Second vector handed to the kernel (presumably receives the superdiagonal)
 */
 template <typename NumericT>
 void bidiag_pack(matrix_base<NumericT> & A,
                  viennacl::vector<NumericT> & dh,
                  viennacl::vector<NumericT> & sh
                 )
 {
   typedef viennacl::linalg::opencl::kernels::svd<NumericT, row_major>     RowMajorKernels;
   typedef viennacl::linalg::opencl::kernels::svd<NumericT, column_major>  ColumnMajorKernels;

   viennacl::ocl::context & ctx = const_cast<viennacl::ocl::context &>(viennacl::traits::opencl_handle(A).context());

   // Select the kernel for the layout of A; the launch itself is identical for both layouts.
   viennacl::ocl::kernel * pack_kernel = 0;
   if (A.row_major())
   {
     RowMajorKernels::init(ctx);
     pack_kernel = &ctx.get_kernel(RowMajorKernels::program_name(), SVD_BIDIAG_PACK_KERNEL);
   }
   else
   {
     ColumnMajorKernels::init(ctx);
     pack_kernel = &ctx.get_kernel(ColumnMajorKernels::program_name(), SVD_BIDIAG_PACK_KERNEL);
   }

   viennacl::ocl::enqueue((*pack_kernel)(A,
                                         dh,
                                         sh,
                                         cl_uint(viennacl::traits::size1(A)),
                                         cl_uint(viennacl::traits::size2(A)),
                                         cl_uint(viennacl::traits::internal_size2(A))
                                        ));
 }


 /** @brief Launches the "house_update_A_left" SVD kernel on A with the vector D.
 *
 * The SVD program matching the layout of A (row- or column-major) is initialized and used.
 * The kernel receives (start + 1) and start as offsets, followed by size1(A), size2(A),
 * internal_size2(A) and a local memory buffer of 128 entries of type NumericT.
 *
 * @param A      Matrix to be updated
 * @param D      Vector handed to the kernel (presumably the Householder vector)
 * @param start  Offset; passed to the kernel as (start + 1) and start
 */
 template <typename NumericT>
 void house_update_A_left(matrix_base<NumericT> & A,
                          vector_base<NumericT> & D,
                          vcl_size_t start)
 {
     typedef viennacl::linalg::opencl::kernels::svd<NumericT, row_major>     RowMajorKernels;
     typedef viennacl::linalg::opencl::kernels::svd<NumericT, column_major>  ColumnMajorKernels;

     viennacl::ocl::context & ctx = const_cast<viennacl::ocl::context &>(viennacl::traits::opencl_handle(A).context());

     // Select the kernel for the layout of A; the launch itself is identical for both layouts.
     viennacl::ocl::kernel * kernel = 0;
     if (A.row_major())
     {
         RowMajorKernels::init(ctx);
         kernel = &ctx.get_kernel(RowMajorKernels::program_name(), SVD_HOUSEHOLDER_UPDATE_A_LEFT_KERNEL);
     }
     else
     {
         ColumnMajorKernels::init(ctx);
         kernel = &ctx.get_kernel(ColumnMajorKernels::program_name(), SVD_HOUSEHOLDER_UPDATE_A_LEFT_KERNEL);
     }

     // Size the local buffer by the element type (as house_update_A_right and house_update_QL do)
     // rather than assuming 4-byte elements, which is too small for double precision.
     viennacl::ocl::enqueue((*kernel)(
                                      A,
                                      D,
                                      static_cast<cl_uint>(start + 1),
                                      static_cast<cl_uint>(start),
                                      cl_uint(viennacl::traits::size1(A)),
                                      cl_uint(viennacl::traits::size2(A)),
                                      cl_uint(viennacl::traits::internal_size2(A)),
                                      viennacl::ocl::local_mem(static_cast<cl_uint>(128 * sizeof(NumericT)))
                              ));
 }


 /** @brief Launches the "house_update_A_right" SVD kernel on A with the vector D.
 *
 * The SVD program matching the layout of A (row- or column-major) is initialized and used.
 * Both offsets passed to the kernel are zero; the local memory buffer holds 128 entries of type NumericT.
 *
 * @param A  Matrix to be updated
 * @param D  Vector handed to the kernel (presumably the Householder vector)
 */
 template <typename NumericT>
 void house_update_A_right(matrix_base<NumericT> & A,
                           vector_base<NumericT> & D)
 {
     typedef viennacl::linalg::opencl::kernels::svd<NumericT, row_major>     RowMajorKernels;
     typedef viennacl::linalg::opencl::kernels::svd<NumericT, column_major>  ColumnMajorKernels;

     viennacl::ocl::context & ctx = const_cast<viennacl::ocl::context &>(viennacl::traits::opencl_handle(A).context());

     // Select the kernel for the layout of A; the launch itself is identical for both layouts.
     viennacl::ocl::kernel * update_kernel = 0;
     if (A.row_major())
     {
         RowMajorKernels::init(ctx);
         update_kernel = &ctx.get_kernel(RowMajorKernels::program_name(), SVD_HOUSEHOLDER_UPDATE_A_RIGHT_KERNEL);
     }
     else
     {
         ColumnMajorKernels::init(ctx);
         update_kernel = &ctx.get_kernel(ColumnMajorKernels::program_name(), SVD_HOUSEHOLDER_UPDATE_A_RIGHT_KERNEL);
     }

     viennacl::ocl::enqueue((*update_kernel)(
                                             A,
                                             D,
                                             static_cast<cl_uint>(0),
                                             static_cast<cl_uint>(0),
                                             cl_uint(viennacl::traits::size1(A)),
                                             cl_uint(viennacl::traits::size2(A)),
                                             cl_uint(viennacl::traits::internal_size2(A)),
                                             viennacl::ocl::local_mem(static_cast<cl_uint>(128 * sizeof(NumericT)))
                                     ));
 }


 /** @brief Launches the "house_update_QL" SVD kernel on Q with the vector D.
 *
 * The SVD program matching the layout of Q (row- or column-major) is initialized and used.
 * The kernel receives A_size1, internal_size2(Q) and a local memory buffer of 128 entries of type NumericT.
 *
 * @param Q        Matrix to be updated
 * @param D        Vector handed to the kernel (presumably the Householder vector)
 * @param A_size1  Size value forwarded to the kernel
 */
 template <typename NumericT>
 void house_update_QL(matrix_base<NumericT> & Q,
                      vector_base<NumericT> & D,
                      vcl_size_t A_size1)
 {
     typedef viennacl::linalg::opencl::kernels::svd<NumericT, row_major>     RowMajorKernels;
     typedef viennacl::linalg::opencl::kernels::svd<NumericT, column_major>  ColumnMajorKernels;

     viennacl::ocl::context & ctx = const_cast<viennacl::ocl::context &>(viennacl::traits::opencl_handle(Q).context());

     // Select the kernel for the layout of Q; the launch itself is identical for both layouts.
     viennacl::ocl::kernel * update_kernel = 0;
     if (Q.row_major())
     {
         RowMajorKernels::init(ctx);
         update_kernel = &ctx.get_kernel(RowMajorKernels::program_name(), SVD_HOUSEHOLDER_UPDATE_QL_KERNEL);
     }
     else
     {
         ColumnMajorKernels::init(ctx);
         update_kernel = &ctx.get_kernel(ColumnMajorKernels::program_name(), SVD_HOUSEHOLDER_UPDATE_QL_KERNEL);
     }

     viennacl::ocl::enqueue((*update_kernel)(
                                             Q,
                                             D,
                                             cl_uint(A_size1),
                                             cl_uint(viennacl::traits::internal_size2(Q)),
                                             viennacl::ocl::local_mem(static_cast<cl_uint>(128 * sizeof(NumericT)))
                                         ));
 }


 /** @brief Launches the "givens_next" SVD kernel on matrix with the vectors tmp1 and tmp2.
 *
 * The SVD program matching the layout of matrix (row- or column-major) is initialized and used.
 * The kernel runs with a local work size of 256 and a global work size of size1(matrix) aligned
 * to a multiple of 256. It receives l and (m - 1) as index arguments.
 *
 * @param matrix  Matrix handed to the kernel
 * @param tmp1    First vector handed to the kernel
 * @param tmp2    Second vector handed to the kernel
 * @param l       Index passed to the kernel as-is
 * @param m       Index passed to the kernel as (m - 1)
 */
 template<typename NumericT>
   void givens_next(matrix_base<NumericT> & matrix,
                   vector_base<NumericT>& tmp1,
                   vector_base<NumericT>& tmp2,
                   int l,
                   int m
                 )
   {
     typedef viennacl::linalg::opencl::kernels::svd<NumericT, row_major>     RowMajorKernels;
     typedef viennacl::linalg::opencl::kernels::svd<NumericT, column_major>  ColumnMajorKernels;

     viennacl::ocl::context & ctx = const_cast<viennacl::ocl::context &>(viennacl::traits::opencl_handle(matrix).context());

     // Select the kernel for the layout of the matrix; configuration and launch are identical for both layouts.
     viennacl::ocl::kernel * givens_kernel = 0;
     if (matrix.row_major())
     {
         RowMajorKernels::init(ctx);
         givens_kernel = &ctx.get_kernel(RowMajorKernels::program_name(), SVD_GIVENS_NEXT_KERNEL);
     }
     else
     {
         ColumnMajorKernels::init(ctx);
         givens_kernel = &ctx.get_kernel(ColumnMajorKernels::program_name(), SVD_GIVENS_NEXT_KERNEL);
     }

     givens_kernel->global_work_size(0, viennacl::tools::align_to_multiple<cl_uint>(cl_uint(viennacl::traits::size1(matrix)), 256));
     givens_kernel->local_work_size(0, 256);

     viennacl::ocl::enqueue((*givens_kernel)(
                                             matrix,
                                             tmp1,
                                             tmp2,
                                             cl_uint(viennacl::traits::size1(matrix)),
                                             cl_uint(viennacl::traits::internal_size2(matrix)),
                                             static_cast<cl_uint>(l),
                                             static_cast<cl_uint>(m - 1)
                                     ));
   }


   /** @brief Launches the "copy_col" or "copy_row" SVD kernel on A and V.
   *
   * The SVD program matching the layout of A (row- or column-major) is initialized and used.
   * If copy_col is true, the "copy_col" kernel is launched and receives size1(A) as extent;
   * otherwise the "copy_row" kernel is launched and receives size2(A).
   *
   * @param A          Matrix handed to the kernel
   * @param V          Vector handed to the kernel
   * @param row_start  Row offset forwarded to the kernel
   * @param col_start  Column offset forwarded to the kernel
   * @param copy_col   Selects the column kernel (true) or the row kernel (false)
   */
   template <typename NumericT>
   void copy_vec(matrix_base<NumericT>& A,
                 vector_base<NumericT> & V,
                 vcl_size_t row_start,
                 vcl_size_t col_start,
                 bool copy_col
   )
   {
     typedef viennacl::linalg::opencl::kernels::svd<NumericT, row_major>     RowMajorKernels;
     typedef viennacl::linalg::opencl::kernels::svd<NumericT, column_major>  ColumnMajorKernels;

     std::string const kernel_name(copy_col ? SVD_COPY_COL_KERNEL : SVD_COPY_ROW_KERNEL);
     viennacl::ocl::context & ctx = const_cast<viennacl::ocl::context &>(viennacl::traits::opencl_handle(A).context());

     // Select the kernel for the layout of A; the launch itself is identical for both layouts.
     viennacl::ocl::kernel * copy_kernel = 0;
     if (A.row_major())
     {
         RowMajorKernels::init(ctx);
         copy_kernel = &ctx.get_kernel(RowMajorKernels::program_name(), kernel_name);
     }
     else
     {
         ColumnMajorKernels::init(ctx);
         copy_kernel = &ctx.get_kernel(ColumnMajorKernels::program_name(), kernel_name);
     }

     viennacl::ocl::enqueue((*copy_kernel)(
                                           A,
                                           V,
                                           static_cast<cl_uint>(row_start),
                                           static_cast<cl_uint>(col_start),
                                           copy_col ? cl_uint(viennacl::traits::size1(A))
                                                    : cl_uint(viennacl::traits::size2(A)),
                                           static_cast<cl_uint>(A.internal_size2())
                                   ));
   }


 } // namespace opencl

 } //namespace linalg

 } //namespace viennacl


 #endif

viennacl::linalg::opencl::matrix_diag_from_vector
void matrix_diag_from_vector(const vector_base< NumericT > &vec, int k, matrix_base< NumericT > &A)
Definition: matrix_operations.hpp:218

viennacl::linalg::opencl::trans
void trans(const matrix_expression< const matrix_base< NumericT, SizeT, DistanceT >, const matrix_base< NumericT, SizeT, DistanceT >, op_trans > &proxy, matrix_base< NumericT > &temp_trans)
Definition: matrix_operations.hpp:182

viennacl::linalg::opencl::am
void am(matrix_base< NumericT > &A, matrix_base< NumericT > const &B, ScalarT1 const &alpha, vcl_size_t, bool reciprocal_alpha, bool flip_sign_alpha)
Definition: matrix_operations.hpp:118

viennacl::linalg::opencl::matrix_column
void matrix_column(const matrix_base< NumericT > &A, unsigned int j, vector_base< NumericT > &vec)
Definition: matrix_operations.hpp:239

device.hpp
Represents an OpenCL device within ViennaCL.

viennacl::traits::stride1
result_of::size_type< matrix_base< NumericT > >::type stride1(matrix_base< NumericT > const &s)
Definition: stride.hpp:55

viennacl::linalg::opencl::SVD_HOUSEHOLDER_UPDATE_A_LEFT_KERNEL
const std::string SVD_HOUSEHOLDER_UPDATE_A_LEFT_KERNEL
Definition: matrix_operations.hpp:87

viennacl::scheduler::preset::matrix_diag_from_vector
statement matrix_diag_from_vector(viennacl::vector_base< NumericT > const *x, viennacl::matrix_base< NumericT > const *A, int id)
Definition: preset.hpp:363

size.hpp
Generic size and resize functionality for different vector and matrix types.

viennacl::ocl::kernel
Represents an OpenCL kernel within ViennaCL.
Definition: kernel.hpp:58

viennacl::ocl::context::get_program
viennacl::ocl::program & get_program(std::string const &name)
Returns the program with the provided name.
Definition: context.hpp:532

start.hpp
Extracts the underlying OpenCL start index handle from a vector, a matrix, an expression etc...

tools.hpp
Various little tools used here and there in ViennaCL.

viennacl::traits::internal_size1
vcl_size_t internal_size1(matrix_base< NumericT > const &mat)
Helper routine for obtaining the internal number of entries per row of a ViennaCL matrix...
Definition: size.hpp:382

viennacl::ocl::kernel::local_work_size
size_type local_work_size(int index=0) const
Returns the local work size at the respective dimension.
Definition: kernel.hpp:742

viennacl::traits::size1
vcl_size_t size1(MatrixType const &mat)
Generic routine for obtaining the number of rows of a matrix (ViennaCL, uBLAS, etc.)
Definition: size.hpp:163

viennacl::linalg::opencl::SVD_BIDIAG_PACK_KERNEL
const std::string SVD_BIDIAG_PACK_KERNEL
Definition: matrix_operations.hpp:86

viennacl::ocl::context
Manages an OpenCL context and provides the respective convenience functions for creating buffers...
Definition: context.hpp:55

viennacl::traits::internal_size2
vcl_size_t internal_size2(matrix_base< NumericT > const &mat)
Helper routine for obtaining the internal number of entries per column of a ViennaCL matrix...
Definition: size.hpp:390

viennacl::matrix_base< NumericT >

viennacl::matrix_expression
Expression template class for representing a tree of expressions which ultimately result in a matrix...
Definition: forwards.h:341

viennacl::matrix_base::stride2
size_type stride2() const
Returns the column increment (stride in the second dimension).
Definition: matrix_def.hpp:234

viennacl::linalg::opencl::SVD_GIVENS_NEXT_KERNEL
const std::string SVD_GIVENS_NEXT_KERNEL
Definition: matrix_operations.hpp:90

viennacl::linalg::opencl::SVD_HOUSEHOLDER_UPDATE_A_RIGHT_KERNEL
const std::string SVD_HOUSEHOLDER_UPDATE_A_RIGHT_KERNEL
Definition: matrix_operations.hpp:88

viennacl::traits::stride
result_of::size_type< viennacl::vector_base< T > >::type stride(viennacl::vector_base< T > const &s)
Definition: stride.hpp:45

forwards.h
This file provides the forward declarations for the main types used within ViennaCL.

viennacl::traits::start1
result_of::size_type< T >::type start1(T const &obj)
Definition: start.hpp:65

viennacl::linalg::opencl::kernels::row_wise_reduction::execution_handler
static device_specific::execution_handler & execution_handler(viennacl::ocl::context &ctx)
Definition: matrix.hpp:696

viennacl::matrix
A dense matrix class.
Definition: forwards.h:375

viennacl::linalg::opencl::kernels::svd::init
static void init(viennacl::ocl::context &ctx)
Definition: svd.hpp:652

stride.hpp
Determines row and column increments for matrices and matrix proxies.

viennacl::scheduler::OPERATION_BINARY_ASSIGN_TYPE
Definition: forwards.h:115

viennacl::linalg::opencl::bidiag_pack
void bidiag_pack(matrix_base< NumericT > &A, viennacl::vector< NumericT > &dh, viennacl::vector< NumericT > &sh)
Definition: matrix_operations.hpp:426

viennacl::scheduler::preset::avbv
scheduler::statement avbv(scheduler::operation_node_type ASSIGN_OP, NumericT const *x, NumericT const *y, ScalarT1 const *a, bool flip_a, bool reciprocal_a, NumericT const *z, ScalarT2 const *b, bool flip_b, bool reciprocal_b)
Definition: preset.hpp:33

viennacl::traits::size2
result_of::size_type< MatrixType >::type size2(MatrixType const &mat)
Generic routine for obtaining the number of columns of a matrix (ViennaCL, uBLAS, etc...
Definition: size.hpp:201

viennacl::linalg::opencl::scaled_rank_1_update
void scaled_rank_1_update(matrix_base< NumericT > &A, ScalarT1 const &alpha, vcl_size_t len_alpha, bool reciprocal_alpha, bool flip_sign_alpha, const vector_base< NumericT > &vec1, const vector_base< NumericT > &vec2)
The implementation of the operation mat += alpha * vec1 * vec2^T, i.e. a scaled rank 1 update...
Definition: matrix_operations.hpp:364

svd.hpp
OpenCL kernel file for singular value decomposition.

viennacl::linalg::opencl::SVD_COPY_ROW_KERNEL
const std::string SVD_COPY_ROW_KERNEL
Definition: matrix_operations.hpp:92

common.hpp
Common implementations shared by OpenCL-based operations.

NumericT
float NumericT
Definition: bisect.cpp:40

viennacl::linalg::opencl::copy_vec
void copy_vec(matrix_base< NumericT > &A, vector_base< NumericT > &V, vcl_size_t row_start, vcl_size_t col_start, bool copy_col)
Definition: matrix_operations.hpp:638

viennacl::linalg::opencl::house_update_A_right
void house_update_A_right(matrix_base< NumericT > &A, vector_base< NumericT > &D)
Definition: matrix_operations.hpp:508

viennacl::linalg::opencl::element_op
void element_op(matrix_base< NumericT > &A, matrix_expression< const matrix_base< NumericT >, const matrix_base< NumericT >, op_element_binary< OpT > > const &proxy)
Implementation of binary element-wise operations A = OP(B,C)
Definition: matrix_operations.hpp:257

viennacl
Main namespace in ViennaCL. Holds all the basic types such as vector, matrix, etc. and defines operations upon them.
Definition: cpu_ram.hpp:34

viennacl::linalg::opencl::ambm
void ambm(matrix_base< NumericT > &A, matrix_base< NumericT > const &B, ScalarT1 const &alpha, vcl_size_t, bool reciprocal_alpha, bool flip_sign_alpha, matrix_base< NumericT > const &C, ScalarT2 const &beta, vcl_size_t, bool reciprocal_beta, bool flip_sign_beta)
Definition: matrix_operations.hpp:136

viennacl::linalg::opencl::house_update_QL
void house_update_QL(matrix_base< NumericT > &Q, vector_base< NumericT > &D, vcl_size_t A_size1)
Definition: matrix_operations.hpp:552

viennacl::linalg::opencl::kernels::matrix_prod::execution_handler
static device_specific::execution_handler & execution_handler(bool is_row_major, viennacl::ocl::context &ctx)
Definition: matrix.hpp:726

viennacl::scheduler::preset::binary_element_op
statement binary_element_op(NumericT const *x, NumericT const *y, NumericT const *z, scheduler::operation_node_type TYPE)
Definition: preset.hpp:284

viennacl::traits::size
vcl_size_t size(VectorType const &vec)
Generic routine for obtaining the size of a vector (ViennaCL, uBLAS, etc.)
Definition: size.hpp:235

viennacl::traits::start2
result_of::size_type< T >::type start2(T const &obj)
Definition: start.hpp:84

viennacl::ocl::local_mem
A class representing local (shared) OpenCL memory. Typically used as kernel argument.
Definition: local_mem.hpp:33

viennacl::is_cpu_scalar
Helper struct for checking whether a type is a host scalar type (e.g. float, double) ...
Definition: forwards.h:448

viennacl::linalg::opencl::kernels::svd
Main kernel class for generating OpenCL kernels for singular value decomposition of dense matrices...
Definition: svd.hpp:644

detail
Definition: blas3.hpp:36

viennacl::ocl::context::get_kernel
viennacl::ocl::kernel & get_kernel(std::string const &program_name, std::string const &kernel_name)
Convenience function for retrieving the kernel of a program directly from the context.
Definition: context.hpp:605

viennacl::scheduler::preset::mat_vec_prod
statement mat_vec_prod(viennacl::matrix_base< NumericT > const *A, bool A_trans, viennacl::vector_base< NumericT > const *x, viennacl::vector_base< NumericT > const *y)
Definition: preset.hpp:410

viennacl::scheduler::OPERATION_BINARY_INPLACE_ADD_TYPE
Definition: forwards.h:116

handle.hpp
Implementation of a smart-pointer-like class for handling OpenCL handles.

viennacl::traits::start
result_of::size_type< T >::type start(T const &obj)
Definition: start.hpp:44

viennacl::linalg::opencl::detail::make_options
cl_uint make_options(vcl_size_t length, bool reciprocal, bool flip_sign)
Definition: common.hpp:42

viennacl::linalg::opencl::kernels::matrix_legacy
Main kernel class for generating OpenCL kernels for operations on/with dense matrix objects of type v...
Definition: matrix.hpp:772

viennacl::scheduler::result_of::op_type_info
Metafunction for querying type information.
Definition: forwards.h:156

viennacl::linalg::opencl::SVD_HOUSEHOLDER_UPDATE_QL_KERNEL
const std::string SVD_HOUSEHOLDER_UPDATE_QL_KERNEL
Definition: matrix_operations.hpp:89

viennacl::scalar_matrix
Represents a matrix consisting of scalars 's' only, i.e. A(i,j) = s for all i, j. To be used as an initial...
Definition: matrix_def.hpp:93

viennacl::matrix_base::stride1
size_type stride1() const
Returns the row increment (stride in the first dimension).
Definition: matrix_def.hpp:232

viennacl::vector_base< NumericT >

viennacl::scheduler::preset::unary_element_op
statement unary_element_op(NumericT const *x, NumericT const *y, scheduler::operation_node_type TYPE)
Definition: preset.hpp:305

viennacl::scheduler::preset::av
scheduler::statement av(scheduler::operation_node_type ASSIGN_OP, NumericT const *x, NumericT const *y, ScalarT1 const *a, bool flip_a, bool reciprocal_a)
Definition: preset.hpp:88

viennacl::vcl_size_t
std::size_t vcl_size_t
Definition: forwards.h:75

viennacl::matrix_base::size2
size_type size2() const
Returns the number of columns.
Definition: matrix_def.hpp:226

viennacl::linalg::opencl::bidiag_pack_svd
void bidiag_pack_svd(viennacl::matrix< SCALARTYPE > &A, VectorType &dh, VectorType &sh)
Definition: matrix_operations.hpp:400

viennacl::vector
Definition: forwards.h:266

viennacl::ocl::program
Wrapper class for an OpenCL program.
Definition: program.hpp:42

forwards.h
Provides the data structures for dealing with a single statement such as 'x = y + z;'.

viennacl::device_specific::execute
void execute(template_base const &T, statements_container const &statements, viennacl::ocl::context &ctx=viennacl::ocl::current_context(), bool force_compilation=false)
Definition: execute.hpp:44

viennacl::linalg::opencl::house_update_A_left
void house_update_A_left(matrix_base< NumericT > &A, vector_base< NumericT > &D, vcl_size_t start)
Definition: matrix_operations.hpp:465

viennacl::matrix_base::size1
size_type size1() const
Returns the number of rows.
Definition: matrix_def.hpp:224

vector_proxy.hpp
Proxy classes for vectors.

viennacl::traits::stride2
result_of::size_type< matrix_base< NumericT > >::type stride2(matrix_base< NumericT > const &s)
Definition: stride.hpp:65

viennacl::scheduler::operation_node_type
operation_node_type
Enumeration for identifying the possible operations.
Definition: forwards.h:68

predicate.hpp
All the predicates used within ViennaCL. Checks for expressions to be vectors, etc.

viennacl::linalg::opencl::convert
void convert(matrix_base< DestNumericT > &dest, matrix_base< SrcNumericT > const &src)
Definition: matrix_operations.hpp:95

viennacl::scheduler::preset::mat_mat_prod
statement mat_mat_prod(NumericT alpha, viennacl::matrix_base< NumericT > const *A, bool A_trans, viennacl::matrix_base< NumericT > const *B, bool B_trans, NumericT beta, viennacl::matrix_base< NumericT > const *C)
Definition: preset.hpp:416

viennacl::scheduler::preset::matrix_diag_to_vector
statement matrix_diag_to_vector(viennacl::vector_base< NumericT > const *x, viennacl::matrix_base< NumericT > const *A, int id)
Definition: preset.hpp:357

viennacl::linalg::opencl::matrix_diag_to_vector
void matrix_diag_to_vector(const matrix_base< NumericT > &A, int k, vector_base< NumericT > &vec)
Definition: matrix_operations.hpp:225

viennacl::traits::context
viennacl::context context(T const &t)
Returns an ID for the currently active memory domain of an object.
Definition: context.hpp:40

viennacl::linalg::opencl::kernels::matrix::execution_handler
static device_specific::execution_handler & execution_handler(bool is_row_major, viennacl::ocl::context &ctx)
Definition: matrix.hpp:541

viennacl::linalg::opencl::detail::legacy_kernel_for_matrix
viennacl::ocl::kernel & legacy_kernel_for_matrix(matrix_base< NumericT > const &M, std::string const &kernel_name)
Definition: matrix_operations.hpp:61

viennacl::ocl::enqueue
void enqueue(KernelType &k, viennacl::ocl::command_queue const &queue)
Enqueues a kernel in the provided queue.
Definition: enqueue.hpp:50

kernel.hpp
Representation of an OpenCL kernel in ViennaCL.

vector.hpp
The vector type with operator-overloads and proxy classes is defined here. Linear algebra operations ...

viennacl::matrix_base::row_major
bool row_major() const
Definition: matrix_def.hpp:248

viennacl::scalar_vector
Represents a vector consisting of scalars 's' only, i.e. v[i] = s for all i. To be used as an initial...
Definition: vector_def.hpp:87

viennacl::linalg::opencl::matrix_assign
void matrix_assign(matrix_base< NumericT > &A, NumericT s, bool up_to_internal_size=false)
Definition: matrix_operations.hpp:200

viennacl::scheduler::preset::diagonal_assign_cpu
scheduler::statement diagonal_assign_cpu(matrix_base< NumericT > const *x, implicit_vector_base< NumericT > const *y)
Definition: preset.hpp:147

ScalarType
float ScalarType
Definition: fft_1d.cpp:42

viennacl::ocl::kernel::global_work_size
size_type global_work_size(int index=0) const
Returns the global work size at the respective dimension.
Definition: kernel.hpp:751

viennacl::scheduler::preset::matrix_row
statement matrix_row(viennacl::vector_base< NumericT > const *x, viennacl::matrix_base< NumericT > const *A, unsigned int id)
Definition: preset.hpp:344

viennacl::linalg::opencl::kernels::matrix_element::execution_handler
static device_specific::execution_handler & execution_handler(bool is_row_major, viennacl::ocl::context &ctx)
Definition: matrix.hpp:609

viennacl::linalg::opencl::givens_next
void givens_next(matrix_base< NumericT > &matrix, vector_base< NumericT > &tmp1, vector_base< NumericT > &tmp2, int l, int m)
Definition: matrix_operations.hpp:590

viennacl::op_trans
A tag class representing transposed matrices.
Definition: forwards.h:220

viennacl::scheduler::preset::matrix_column
statement matrix_column(viennacl::vector_base< NumericT > const *x, viennacl::matrix_base< NumericT > const *A, unsigned int id)
Definition: preset.hpp:350

viennacl::matrix_base::start2
size_type start2() const
Returns the column start index (offset in the second dimension).
Definition: matrix_def.hpp:230

viennacl::device_specific::execution_handler::execute
void execute(container_type::key_type const &key, statements_container const &statements)
Definition: execution_handler.hpp:86

viennacl::op_element_binary
A tag class representing element-wise binary operations (like multiplication) on vectors or matrices...
Definition: forwards.h:130

viennacl::matrix_base::internal_size2
size_type internal_size2() const
Returns the internal number of columns. Usually required for launching OpenCL kernels only...
Definition: matrix_def.hpp:240

viennacl::scheduler::statement
The main class for representing a statement such as x = inner_prod(y,z); at runtime.
Definition: forwards.h:502

viennacl::linalg::opencl::SVD_COPY_COL_KERNEL
const std::string SVD_COPY_COL_KERNEL
Definition: matrix_operations.hpp:91

viennacl::device_specific::matrix_axpy_template
Definition: matrix_axpy_template.hpp:57

viennacl::matrix_base::internal_size1
size_type internal_size1() const
Returns the internal number of rows. Usually required for launching OpenCL kernels only...
Definition: matrix_def.hpp:238

viennacl::linalg::opencl::matrix_row
void matrix_row(const matrix_base< NumericT > &A, unsigned int i, vector_base< NumericT > &vec)
Definition: matrix_operations.hpp:232

viennacl::linalg::detail::min
T min(const T &lhs, const T &rhs)
Minimum.
Definition: util.hpp:45

handle.hpp
Extracts the underlying OpenCL handle from a vector, a matrix, an expression etc. ...

viennacl::scheduler::preset::assign_cpu
scheduler::statement assign_cpu(vector_base< NumericT > const *x, implicit_vector_base< NumericT > const *y)
Definition: preset.hpp:123

viennacl::ocl::program::get_kernel
viennacl::ocl::kernel & get_kernel(std::string const &name)
Returns the kernel with the provided name.
Definition: context.hpp:773

viennacl::traits::handle
viennacl::backend::mem_handle & handle(T &obj)
Returns the generic memory handle of an object. Non-const version.
Definition: handle.hpp:41

viennacl::device_specific::tree_parsing::operator_string
const char * operator_string(scheduler::operation_node_type type)
Definition: tree_parsing.hpp:205

viennacl::linalg::opencl::kernels::matrix_convert::init
static void init(viennacl::ocl::context &ctx)
Definition: matrix.hpp:869

viennacl::ocl::type_to_string
Helper class for converting a type to its string representation.
Definition: utils.hpp:57

viennacl::op_element_unary
A tag class representing element-wise unary operations (like sin()) on vectors or matrices...
Definition: forwards.h:134

scalar.hpp
Implementation of the ViennaCL scalar class.

result_of.hpp
A collection of compile time type deductions.

viennacl::linalg::opencl::kernels::matrix_convert::program_name
static std::string program_name()
Definition: matrix.hpp:864

viennacl::linalg::opencl::prod_impl
void prod_impl(const matrix_base< NumericT > &A, bool trans_A, const vector_base< NumericT > &vec, vector_base< NumericT > &result)
Carries out matrix-vector multiplication.
Definition: matrix_operations.hpp:305

viennacl::linalg::opencl::ambm_m
void ambm_m(matrix_base< NumericT > &A, matrix_base< NumericT > const &B, ScalarT1 const &alpha, vcl_size_t, bool reciprocal_alpha, bool flip_sign_alpha, matrix_base< NumericT > const &C, ScalarT2 const &beta, vcl_size_t, bool reciprocal_beta, bool flip_sign_beta)
Definition: matrix_operations.hpp:159

viennacl::linalg::opencl::matrix_diagonal_assign
void matrix_diagonal_assign(matrix_base< NumericT > &A, NumericT s)
Definition: matrix_operations.hpp:210

enable_if.hpp
Simple enable-if variant that uses the SFINAE pattern.

viennacl::matrix_base::start1
size_type start1() const
Returns the row start index (offset in the first dimension).
Definition: matrix_def.hpp:228

matrix.hpp
Runtime generation of OpenCL kernels for matrix operations.

viennacl::fast_copy
void fast_copy(const const_vector_iterator< SCALARTYPE, ALIGNMENT > &gpu_begin, const const_vector_iterator< SCALARTYPE, ALIGNMENT > &gpu_end, CPU_ITERATOR cpu_begin)