math/indexing__rev_8hpp_source.html

#ifndef STAN_MATH_OPENCL_INDEXING_REV_HPP

#define STAN_MATH_OPENCL_INDEXING_REV_HPP

#ifdef STAN_OPENCL


#include <stan/math/opencl/matrix_cl.hpp>

#include <stan/math/opencl/kernel_generator.hpp>

#include <stan/math/opencl/kernels/indexing_rev.hpp>

#include <stan/math/opencl/kernels/add.hpp>


namespace stan {

namespace math {


/**
 * Performs the reverse pass for an indexing operation on the OpenCL device.
 *
 * One of three kernels is launched. The choice is made by comparing the local
 * memory size reported by the first device of `opencl_context` with the number
 * of bytes needed to store `adj` as doubles (`adj_bytes`):
 *  - `indexing_rev_local_independent` if local memory is larger than
 *    `2 * local_size * adj_bytes`,
 *  - `indexing_rev_local_atomic` if local memory is larger than `adj_bytes`,
 *  - `indexing_rev_global_atomic` otherwise.
 *
 * The function is `inline` because it is defined in a header; without it,
 * including this header from more than one translation unit results in
 * multiple definitions of the same symbol.
 *
 * @param[in,out] adj matrix passed to the kernel as an in/out buffer
 *   (presumably the adjoint of the indexed argument - confirm against the
 *   kernel sources)
 * @param idx integer matrix passed to the kernel as an input buffer
 *   (presumably the indices used in the forward pass)
 * @param res matrix passed to the kernel as an input buffer (presumably the
 *   adjoint of the indexing result); its size is passed as the element count
 * @throw any exception raised by `check_opencl_error` when the OpenCL runtime
 *   reports a `cl::Error`
 */
inline void indexing_rev(matrix_cl<double>& adj, const matrix_cl<int>& idx,
                         const matrix_cl<double>& res) {
  const auto& device = opencl_context.device()[0];
  // Keep the queried value in the unsigned type returned by the OpenCL
  // binding instead of narrowing it to int before the size comparisons below.
  const auto local_mem_size = device.getInfo<CL_DEVICE_LOCAL_MEM_SIZE>();
  const int preferred_work_groups
      = device.getInfo<CL_DEVICE_MAX_COMPUTE_UNITS>();
  const int local_size = 64;
  const int n_threads = preferred_work_groups * 16 * local_size;
  // Bytes needed to hold one copy of `adj` in local memory.
  const auto adj_bytes = sizeof(double) * adj.size();

  try {
    if (local_mem_size > adj_bytes * local_size * 2) {
      // Local buffer holds `local_size` copies of `adj`.
      stan::math::opencl_kernels::indexing_rev_local_independent(
          cl::NDRange(n_threads), cl::NDRange(local_size), adj, idx, res,
          cl::Local(adj_bytes * local_size), res.size(), adj.size());
    } else if (local_mem_size > adj_bytes) {
      // Local buffer holds a single copy of `adj`.
      stan::math::opencl_kernels::indexing_rev_local_atomic(
          cl::NDRange(n_threads), cl::NDRange(local_size), adj, idx, res,
          cl::Local(adj_bytes), res.size(), adj.size());
    } else {
      // `adj` does not fit in local memory; no local buffer is requested.
      stan::math::opencl_kernels::indexing_rev_global_atomic(
          cl::NDRange(n_threads), cl::NDRange(local_size), adj, idx, res,
          res.size());
    }
  } catch (const cl::Error& e) {
    check_opencl_error("indexing reverse pass", e);
  }
}


}  // namespace math

}  // namespace stan


#endif

#endif

stan::math::matrix_cl::size
int size() const
Definition matrix_cl.hpp:68

stan::math::matrix_cl
Represents an arithmetic matrix on the OpenCL device.
Definition matrix_cl.hpp:47

stan::math::opencl_context
The API to access the methods and values in opencl_context_base.
Definition opencl_context.hpp:210

stan::math::check_opencl_error
void check_opencl_error(const char *function, const cl::Error &e)
Throws a domain error specifying the OpenCL error that occurred.
Definition check_opencl.hpp:23

stan::math::opencl_context::device
std::vector< cl::Device > & device() noexcept
Returns a vector containing the OpenCL device used to create the context.
Definition opencl_context.hpp:393

stan::math::opencl_kernels::indexing_rev_local_independent
const kernel_cl< in_out_buffer, in_buffer, in_buffer, cl::LocalSpaceArg, int, int > indexing_rev_local_independent("indexing_rev", {atomic_add_double_device_function, indexing_rev_local_independent_kernel_code})
See the docs for add_batch().

stan::math::opencl_kernels::indexing_rev_local_atomic
const kernel_cl< in_out_buffer, in_buffer, in_buffer, cl::LocalSpaceArg, int, int > indexing_rev_local_atomic("indexing_rev", {atomic_add_double_device_function, indexing_rev_local_atomic_kernel_code})
See the docs for add_batch().

stan::math::opencl_kernels::indexing_rev_global_atomic
const kernel_cl< in_out_buffer, in_buffer, in_buffer, int > indexing_rev_global_atomic("indexing_rev", {atomic_add_double_device_function, indexing_rev_global_atomic_kernel_code})
See the docs for add_batch().

kernel_generator.hpp

indexing_rev.hpp

matrix_cl.hpp

stan::math::e
static constexpr double e()
Return the base of the natural logarithm.
Definition constants.hpp:20

stan::math::indexing_rev
void indexing_rev(matrix_cl< double > &adj, const matrix_cl< int > &idx, const matrix_cl< double > &res)
Performs reverse pass for indexing operation on the OpenCL device.
Definition indexing_rev.hpp:22

stan
The lgamma implementation in stan-math is based on either the reentrant safe lgamma_r implementation ...
Definition unit_vector_constrain.hpp:15

add.hpp