doc/html/enqueue_8hpp_source.html

 #ifndef VIENNACL_OCL_ENQUEUE_HPP_

 #define VIENNACL_OCL_ENQUEUE_HPP_


 /* =========================================================================

    Copyright (c) 2010-2015, Institute for Microelectronics,

                             Institute for Analysis and Scientific Computing,

                             TU Wien.

    Portions of this software are copyright by UChicago Argonne, LLC.


                             -----------------

                   ViennaCL - The Vienna Computing Library

                             -----------------


    Project Head:    Karl Rupp                   rupp@iue.tuwien.ac.at


    (A list of authors and contributors can be found in the manual)


    License:         MIT (X11), see file LICENSE in the base directory

 ============================================================================= */


 #ifdef __APPLE__

 #include <OpenCL/cl.h>

 #else

 #include <CL/cl.h>

 #endif


 #include "viennacl/ocl/backend.hpp"

 #include "viennacl/ocl/kernel.hpp"

 #include "viennacl/ocl/command_queue.hpp"

 #include "viennacl/ocl/context.hpp"


 namespace viennacl

 {


 namespace device_specific

 {

   class custom_operation;

   void enqueue_custom_op(viennacl::device_specific::custom_operation & op, viennacl::ocl::command_queue const & queue);

 }


 namespace ocl

 {


 template<typename KernelType>

 void enqueue(KernelType & k, viennacl::ocl::command_queue const & queue)

 {

 #if defined(VIENNACL_DEBUG_ALL) || defined(VIENNACL_DEBUG_KERNEL)

   cl_event event;

 #endif


   // 1D kernel:

   if (k.local_work_size(1) == 0)

   {

 #if defined(VIENNACL_DEBUG_ALL) || defined(VIENNACL_DEBUG_KERNEL)

     std::cout << "ViennaCL: Starting 1D-kernel '" << k.name() << "'..." << std::endl;

     std::cout << "ViennaCL: Global work size: '"  << k.global_work_size() << "'..." << std::endl;

     std::cout << "ViennaCL: Local work size: '"   << k.local_work_size() << "'..." << std::endl;

 #endif


     vcl_size_t tmp_global = k.global_work_size();

     vcl_size_t tmp_local = k.local_work_size();


     cl_int err;

     if (tmp_global == 1 && tmp_local == 1)

 #if defined(VIENNACL_DEBUG_ALL) || defined(VIENNACL_DEBUG_KERNEL)

       err = clEnqueueTask(queue.handle().get(), k.handle().get(), 0, NULL, &event);

 #else

       err = clEnqueueTask(queue.handle().get(), k.handle().get(), 0, NULL, NULL);

 #endif

     else

 #if defined(VIENNACL_DEBUG_ALL) || defined(VIENNACL_DEBUG_KERNEL)

       err = clEnqueueNDRangeKernel(queue.handle().get(), k.handle().get(), 1, NULL, &tmp_global, &tmp_local, 0, NULL, &event);

 #else

       err = clEnqueueNDRangeKernel(queue.handle().get(), k.handle().get(), 1, NULL, &tmp_global, &tmp_local, 0, NULL, NULL);

 #endif


     if (err != CL_SUCCESS)

     {

       std::cerr << "ViennaCL: FATAL ERROR: Kernel start failed for '" << k.name() << "'." << std::endl;

       std::cerr << "ViennaCL: Smaller work sizes could not solve the problem. " << std::endl;

       VIENNACL_ERR_CHECK(err);

     }

   }

   else //2D or 3D kernel

   {

 #if defined(VIENNACL_DEBUG_ALL) || defined(VIENNACL_DEBUG_KERNEL)

     std::cout << "ViennaCL: Starting 2D/3D-kernel '" << k.name() << "'..." << std::endl;

     std::cout << "ViennaCL: Global work size: '"  << k.global_work_size(0) << ", " << k.global_work_size(1) << ", " << k.global_work_size(2) << "'..." << std::endl;

     std::cout << "ViennaCL: Local work size: '"   << k.local_work_size(0) << ", " << k.local_work_size(1) << ", " << k.local_work_size(2) << "'..." << std::endl;

 #endif


     vcl_size_t tmp_global[3];

     tmp_global[0] = k.global_work_size(0);

     tmp_global[1] = k.global_work_size(1);

     tmp_global[2] = k.global_work_size(2);


     vcl_size_t tmp_local[3];

     tmp_local[0] = k.local_work_size(0);

     tmp_local[1] = k.local_work_size(1);

     tmp_local[2] = k.local_work_size(2);


 #if defined(VIENNACL_DEBUG_ALL) || defined(VIENNACL_DEBUG_KERNEL)

     cl_int err = clEnqueueNDRangeKernel(queue.handle().get(), k.handle().get(), (tmp_global[2] == 0) ? 2 : 3, NULL, tmp_global, tmp_local, 0, NULL, &event);

 #else

     cl_int err = clEnqueueNDRangeKernel(queue.handle().get(), k.handle().get(), (tmp_global[2] == 0) ? 2 : 3, NULL, tmp_global, tmp_local, 0, NULL, NULL);

 #endif

     if (err != CL_SUCCESS)

     {

       //could not start kernel with any parameters

       std::cerr << "ViennaCL: FATAL ERROR: Kernel start failed for '" << k.name() << "'." << std::endl;

       VIENNACL_ERR_CHECK(err);

     }

   }


 #if defined(VIENNACL_DEBUG_ALL) || defined(VIENNACL_DEBUG_KERNEL)

   queue.finish();

   cl_int execution_status;

   clGetEventInfo(event, CL_EVENT_COMMAND_EXECUTION_STATUS, sizeof(cl_int), &execution_status, NULL);

   std::cout << "ViennaCL: Kernel " << k.name() << " finished with status " << execution_status << "!" << std::endl;

 #endif

 } //enqueue()


 /** @brief Convenience overload: enqueues a kernel in the queue returned by k.context().get_queue().
  *
  * Forwards to a two-argument enqueue() overload. The call is deliberately left
  * unqualified, so the overload is selected when the template is instantiated.
  *
  * @tparam KernelType  Kernel type providing context(), whose result provides get_queue()
  * @param k            The kernel to be launched
  */
 template<typename KernelType>

 void enqueue(KernelType & k)

 {

   enqueue(k, k.context().get_queue());

 }


 /** @brief Enqueues a custom operation in the provided queue.
  *
  * Thin adapter that hands both arguments unchanged to
  * viennacl::device_specific::enqueue_custom_op().
  *
  * @param op     The custom operation to enqueue
  * @param queue  The command queue the operation is submitted to
  */
 inline void enqueue(viennacl::device_specific::custom_operation & op, viennacl::ocl::command_queue const & queue)
 {
   viennacl::device_specific::enqueue_custom_op(op, queue);
 }


 /** @brief Convenience overload: enqueues a custom operation in the queue returned by
  *         viennacl::ocl::current_context().get_queue().
  *
  * @param op  The custom operation to enqueue
  */
 inline void enqueue(viennacl::device_specific::custom_operation & op)
 {
   // Delegate to the (operation, queue) overload defined in this namespace.
   viennacl::ocl::enqueue(op, viennacl::ocl::current_context().get_queue());
 }


 } // namespace ocl

 } // namespace viennacl

 #endif

viennacl::ocl::command_queue::finish
void finish() const
Waits until all kernels in the queue have finished their execution.
Definition: command_queue.hpp:70

viennacl::ocl::current_context
viennacl::ocl::context & current_context()
Convenience function for returning the current context.
Definition: backend.hpp:213

viennacl::ocl::command_queue
A class representing a command queue.
Definition: command_queue.hpp:45

viennacl::ocl::command_queue::handle
viennacl::ocl::handle< cl_command_queue > const & handle() const
Definition: command_queue.hpp:81

command_queue.hpp
Implementations of command queue representations.

VIENNACL_ERR_CHECK
#define VIENNACL_ERR_CHECK(err)
Definition: error.hpp:681

viennacl
Main namespace in ViennaCL. Holds all the basic types such as vector, matrix, etc. and defines operations upon them.
Definition: cpu_ram.hpp:34

viennacl::ocl::handle::get
const OCL_TYPE & get() const
Definition: handle.hpp:189

viennacl::ocl::get_queue
viennacl::ocl::command_queue & get_queue()
Convenience function for getting the default queue for the currently active device in the active context.
Definition: backend.hpp:320

viennacl::device_specific::enqueue_custom_op
void enqueue_custom_op(viennacl::device_specific::custom_operation &op, viennacl::ocl::command_queue const &queue)

viennacl::vcl_size_t
std::size_t vcl_size_t
Definition: forwards.h:75

context.hpp
Represents an OpenCL context within ViennaCL.

backend.hpp
Implementations of the OpenCL backend, where all contexts are stored in.

viennacl::ocl::enqueue
void enqueue(KernelType &k, viennacl::ocl::command_queue const &queue)
Enqueues a kernel in the provided queue.
Definition: enqueue.hpp:50

kernel.hpp
Representation of an OpenCL kernel in ViennaCL.