math/opencl_2prim_2neg__binomial__2__log__glm__lpmf_8hpp_source.html

#ifndef STAN_MATH_OPENCL_PRIM_NEG_BINOMIAL_2_LOG_GLM_LPMF_HPP

#define STAN_MATH_OPENCL_PRIM_NEG_BINOMIAL_2_LOG_GLM_LPMF_HPP

#ifdef STAN_OPENCL


#include <stan/math/opencl/prim/size.hpp>

#include <stan/math/opencl/rev/operands_and_partials.hpp>

#include <stan/math/opencl/copy.hpp>

#include <stan/math/opencl/prim/multiply.hpp>

#include <stan/math/opencl/plain_type.hpp>

#include <stan/math/opencl/kernel_generator.hpp>

#include <stan/math/opencl/kernels/neg_binomial_2_log_glm_lpmf.hpp>

#include <stan/math/prim/meta.hpp>

#include <stan/math/prim/err.hpp>

#include <stan/math/prim/fun/constants.hpp>

#include <stan/math/prim/fun/eval.hpp>

#include <stan/math/prim/fun/digamma.hpp>

#include <stan/math/prim/fun/lgamma.hpp>

#include <stan/math/prim/fun/multiply_log.hpp>

#include <stan/math/prim/fun/size.hpp>

#include <stan/math/prim/fun/sum.hpp>

#include <stan/math/prim/fun/to_ref.hpp>

#include <stan/math/prim/fun/value_of_rec.hpp>

#include <vector>

#include <cmath>


namespace stan {

namespace math {


/**
 * Returns the log PMF of the Generalized Linear Model (GLM) with
 * Negative-Binomial-2 distribution, evaluated with the
 * `neg_binomial_2_log_glm` OpenCL kernel.
 *
 * The log density and the per-row derivative terms are produced by a single
 * kernel launch; the remaining partials are assembled on the host side with
 * kernel generator expressions and `matrix_cl` products.
 *
 * @tparam propto if true, summands that do not depend on any non-constant
 * argument are dropped (decided through `include_summand`)
 * @tparam T_y_cl type of the dependent variable; scalar or kernel expression
 * @tparam T_x_cl type of the design matrix
 * @tparam T_alpha_cl type of the intercept; scalar or kernel expression
 * @tparam T_beta_cl type of the weight vector
 * @tparam T_phi_cl type of the precision parameter; scalar or kernel
 * expression
 *
 * @param y dependent variable(s); when not a scalar its size must equal the
 * number of rows of `x`
 * @param x design matrix (N rows, M columns)
 * @param alpha intercept; when not a scalar its size must equal N
 * @param beta weight vector; its size must equal M
 * @param phi precision parameter; when not a scalar its size must equal N
 * @return the log probability (with the computed partials attached through
 * the partials propagator), or 0 when `x` has no rows or no summand is
 * required
 *
 * Size mismatches are reported through `check_size_match`, invalid values
 * through `check_cl`, and OpenCL failures through `check_opencl_error`.
 */
template <bool propto, typename T_y_cl, typename T_x_cl, typename T_alpha_cl,
          typename T_beta_cl, typename T_phi_cl,
          require_all_prim_or_rev_kernel_expression_t<
              T_x_cl, T_y_cl, T_alpha_cl, T_beta_cl, T_phi_cl>* = nullptr>
return_type_t<T_x_cl, T_alpha_cl, T_beta_cl, T_phi_cl>
neg_binomial_2_log_glm_lpmf(const T_y_cl& y, const T_x_cl& x,
                            const T_alpha_cl& alpha, const T_beta_cl& beta,
                            const T_phi_cl& phi) {
  static constexpr const char* function = "neg_binomial_2_log_glm_lpmf(OpenCL)";
  using T_partials_return
      = partials_return_t<T_x_cl, T_alpha_cl, T_beta_cl, T_phi_cl>;
  constexpr bool is_y_vector = !is_stan_scalar<T_y_cl>::value;
  constexpr bool is_phi_vector = !is_stan_scalar<T_phi_cl>::value;
  constexpr bool is_alpha_vector = !is_stan_scalar<T_alpha_cl>::value;
  // Needed so that unqualified isfinite() also resolves for scalar arguments.
  using std::isfinite;

  const size_t N = x.rows();
  const size_t M = x.cols();

  // Scalar arguments are broadcast, so only vector arguments are size-checked.
  if (is_y_vector) {
    check_size_match(function, "Rows of ", "x", N, "rows of ", "y",
                     math::size(y));
  }
  check_size_match(function, "Columns of ", "x", M, "size of ", "beta",
                   math::size(beta));
  if (is_phi_vector) {
    check_size_match(function, "Rows of ", "x", N, "size of ", "phi",
                     math::size(phi));
  }
  if (is_alpha_vector) {
    check_size_match(function, "Rows of ", "x", N, "size of ", "alpha",
                     math::size(alpha));
  }
  if (N == 0) {
    return 0;
  }
  if (!include_summand<propto, T_x_cl, T_alpha_cl, T_beta_cl,
                       T_phi_cl>::value) {
    return 0;
  }

  const auto& y_val = eval(value_of(y));
  const auto& x_val = eval(value_of(x));
  const auto& alpha_val = eval(value_of(alpha));
  const auto& beta_val = eval(value_of(beta));
  const auto& phi_val = eval(value_of(phi));

  // copy any scalars to device, as this is expected by the kernel
  const auto& y_val_cl = to_matrix_cl(y_val);
  const auto& alpha_val_cl = to_matrix_cl(alpha_val);
  const auto& phi_val_cl = to_matrix_cl(phi_val);

  const int local_size
      = opencl_kernels::neg_binomial_2_log_glm.get_option("LOCAL_SIZE_");
  // Number of work groups: ceil(N / local_size).
  const int wgs = (N + local_size - 1) / local_size;

  const bool need_theta_derivative
      = !is_constant_all<T_x_cl, T_beta_cl, T_alpha_cl>::value;
  matrix_cl<double> theta_derivative_cl(need_theta_derivative ? N : 0, 1);
  const bool need_theta_derivative_sum
      = need_theta_derivative && !is_alpha_vector;
  matrix_cl<double> theta_derivative_sum_cl(wgs, 1);

  // The phi flags must depend on phi, not on alpha. A vector phi needs one
  // derivative per row (the buffer is moved into partials<3> below), while a
  // scalar phi only needs per-work-group sums that are added up on the host.
  // NOTE(review): assumes the kernel writes N per-row values when
  // need_phi_derivative_sum is false and wgs partial sums when it is true --
  // confirm against the kernel source.
  const bool need_phi_derivative = !is_constant_all<T_phi_cl>::value;
  const bool need_phi_derivative_sum = need_phi_derivative && !is_phi_vector;
  matrix_cl<double> phi_derivative_cl(
      need_phi_derivative ? (need_phi_derivative_sum ? wgs : N) : 0, 1);

  // Which summands of the log density the kernel has to accumulate. Terms
  // that only involve scalar phi (and scalar y) are added on the host below.
  const bool need_logp1 = include_summand<propto>::value;
  const bool need_logp2
      = include_summand<propto, T_phi_cl>::value && is_phi_vector;
  const bool need_logp3
      = include_summand<propto, T_x_cl, T_alpha_cl, T_beta_cl>::value;
  const bool need_logp4 = include_summand<propto, T_phi_cl>::value
                          && (is_y_vector || is_phi_vector);
  matrix_cl<double> logp_cl(wgs, 1);

  try {
    opencl_kernels::neg_binomial_2_log_glm(
        cl::NDRange(local_size * wgs), cl::NDRange(local_size), logp_cl,
        theta_derivative_cl, theta_derivative_sum_cl, phi_derivative_cl,
        y_val_cl, x_val, alpha_val_cl, beta_val, phi_val_cl, N, M, is_y_vector,
        is_alpha_vector, is_phi_vector, need_theta_derivative,
        need_theta_derivative_sum, need_phi_derivative, need_phi_derivative_sum,
        need_logp1, need_logp2, need_logp3, need_logp4);
  } catch (const cl::Error& e) {
    check_opencl_error(function, e);
  }

  // logp_cl holds one partial result per work group.
  T_partials_return logp = sum(from_matrix_cl(logp_cl));

  // Full input validation is only performed when the result is not finite;
  // otherwise only the precision parameter is checked.
  if (!std::isfinite(logp)) {
    results(
        check_cl(function, "Vector of dependent variables", y_val,
                 "nonnegative"),
        check_cl(function, "Intercept", alpha_val, "finite"),
        check_cl(function, "Precision parameter", phi_val, "positive finite"))
        = expressions(y_val >= 0, isfinite(alpha_val),
                      isfinite(phi_val) && phi_val > 0);
    check_cl(function, "Design matrix", x_val, "finite") = isfinite(x_val);
    check_cl(function, "Weight vector", beta_val, "finite")
        = isfinite(beta_val);
  } else {
    check_cl(function, "Precision parameter", phi_val, "positive finite")
        = isfinite(phi_val) && phi_val > 0;
  }

  // Host-side contributions that are identical for all N rows (the kernel
  // skips them via need_logp2 / need_logp4 in these cases).
  if (include_summand<propto, T_phi_cl>::value && !is_phi_vector) {
    logp += N
            * (multiply_log(forward_as<double>(phi_val),
                            forward_as<double>(phi_val))
               - lgamma(forward_as<double>(phi_val)));
  }
  if (include_summand<propto, T_phi_cl>::value && !is_y_vector
      && !is_phi_vector) {
    logp += forward_as<double>(lgamma(y_val + phi_val)) * N;
  }

  auto ops_partials = make_partials_propagator(x, alpha, beta, phi);
  // Compute the necessary derivatives.
  if (!is_constant<T_x_cl>::value) {
    partials<0>(ops_partials)
        = transpose(beta_val * transpose(theta_derivative_cl));
  }
  if (!is_constant_all<T_beta_cl>::value) {
    // transposition of a vector can be done without copying
    const matrix_cl<double> theta_derivative_transpose_cl(
        theta_derivative_cl.buffer(), 1, theta_derivative_cl.rows());
    matrix_cl<double> edge3_partials_transpose_cl
        = theta_derivative_transpose_cl * x_val;
    // Same trick in the other direction: reinterpret the row vector result
    // as a column vector that shares the buffer.
    partials<2>(ops_partials)
        = matrix_cl<double>(edge3_partials_transpose_cl.buffer(),
                            edge3_partials_transpose_cl.cols(), 1);
    if (beta_val.rows() != 0) {
      // The aliasing matrix was built from a raw buffer, so the pending write
      // event of the product is attached to it explicitly.
      edge<2>(ops_partials)
          .partials_.add_write_event(
              edge3_partials_transpose_cl.write_events().back());
    }
  }
  if (!is_constant_all<T_alpha_cl>::value) {
    if (is_alpha_vector) {
      partials<1>(ops_partials) = std::move(theta_derivative_cl);
    } else {
      forward_as<internal::broadcast_array<double>>(
          partials<1>(ops_partials))[0]
          = sum(from_matrix_cl(theta_derivative_sum_cl));
    }
  }
  if (!is_constant_all<T_phi_cl>::value) {
    if (is_phi_vector) {
      partials<3>(ops_partials) = std::move(phi_derivative_cl);
    } else {
      forward_as<internal::broadcast_array<double>>(
          partials<3>(ops_partials))[0]
          = sum(from_matrix_cl(phi_derivative_cl));
    }
  }
  return ops_partials.build(logp);
}


}  // namespace math

}  // namespace stan


#endif

#endif

stan::math::matrix_cl::buffer
const cl::Buffer & buffer() const
Definition matrix_cl.hpp:177

stan::math::matrix_cl::cols
int cols() const
Definition matrix_cl.hpp:66

stan::math::matrix_cl::rows
int rows() const
Definition matrix_cl.hpp:64

stan::math::matrix_cl::write_events
const tbb::concurrent_vector< cl::Event > & write_events() const
Get the events from the event stacks.
Definition matrix_cl.hpp:103

stan::math::matrix_cl
Represents an arithmetic matrix on the OpenCL device.
Definition matrix_cl.hpp:47

constants.hpp

copy.hpp

eval.hpp

stan::math::check_opencl_error
void check_opencl_error(const char *function, const cl::Error &e)
Throws a domain error specifying the OpenCL error that occurred.
Definition check_opencl.hpp:23

stan::math::isfinite
isfinite_< as_operation_cl_t< T > > isfinite(T &&a)
Definition elt_function_cl.hpp:332

stan::math::check_cl
auto check_cl(const char *function, const char *var_name, T &&y, const char *must_be)
Constructs a check on opencl matrix or expression.
Definition check_cl.hpp:219

stan::math::results
results_cl< T_results... > results(T_results &&... results)
Deduces types for constructing results_cl object.
Definition multi_result_kernel.hpp:668

stan::math::transpose
auto transpose(Arg &&a)
Transposes a kernel generator expression.
Definition transpose.hpp:139

stan::math::expressions
expressions_cl< T_expressions... > expressions(T_expressions &&... expressions)
Deduces types for constructing expressions_cl object.
Definition multi_result_kernel.hpp:289

stan::math::opencl_kernels::neg_binomial_2_log_glm
const kernel_cl< out_buffer, out_buffer, out_buffer, out_buffer, in_buffer, in_buffer, in_buffer, in_buffer, in_buffer, int, int, int, int, int, int, int, int, int, int, int, int, int > neg_binomial_2_log_glm("neg_binomial_2_log_glm", {digamma_device_function, log1p_exp_device_function, neg_binomial_2_log_glm_kernel_code}, {{"REDUCTION_STEP_SIZE", 4}, {"LOCAL_SIZE_", 64}})
See the docs for neg_binomial_2_log_glm_lpmf() .

stan::math::to_matrix_cl
matrix_cl< scalar_type_t< T > > to_matrix_cl(T &&src)
Copies the source Eigen matrix, std::vector or scalar to the destination matrix that is stored on the...
Definition copy.hpp:45

stan::math::neg_binomial_2_log_glm_lpmf
return_type_t< T_x_cl, T_alpha_cl, T_beta_cl, T_phi_cl > neg_binomial_2_log_glm_lpmf(const T_y_cl &y, const T_x_cl &x, const T_alpha_cl &alpha, const T_beta_cl &beta, const T_phi_cl &phi)
Returns the log PMF of the Generalized Linear Model (GLM) with Negative-Binomial-2 distribution and l...
Definition neg_binomial_2_log_glm_lpmf.hpp:69

stan::math::from_matrix_cl
auto from_matrix_cl(const T &src)
Copies the source matrix that is stored on the OpenCL device to the destination Eigen matrix.
Definition copy.hpp:61

stan::require_all_prim_or_rev_kernel_expression_t
require_all_t< is_prim_or_rev_kernel_expression< std::decay_t< Types > >... > require_all_prim_or_rev_kernel_expression_t
Require type satisfies is_prim_or_rev_kernel_expression.
Definition is_kernel_expression.hpp:148

stan::math::size
int64_t size(const T &m)
Returns the size (number of the elements) of a matrix_cl or var_value<matrix_cl<T>>.
Definition size.hpp:19

kernel_generator.hpp

stan::math::multiply_log
fvar< T > multiply_log(const fvar< T > &x1, const fvar< T > &x2)
Definition multiply_log.hpp:14

stan::math::e
static constexpr double e()
Return the base of the natural logarithm.
Definition constants.hpp:20

stan::math::eval
T eval(T &&arg)
Inputs which have a plain_type equal to their own type are forwarded unmodified (for Eigen expressions ...
Definition eval.hpp:20

stan::math::value_of
T value_of(const fvar< T > &v)
Return the value of the specified variable.
Definition value_of.hpp:18

stan::math::lgamma
fvar< T > lgamma(const fvar< T > &x)
Return the natural logarithm of the gamma function applied to the specified argument.
Definition lgamma.hpp:21

stan::math::sum
auto sum(const std::vector< T > &m)
Return the sum of the entries of the specified standard vector.
Definition sum.hpp:23

stan::math::check_size_match
void check_size_match(const char *function, const char *name_i, T_size1 i, const char *name_j, T_size2 j)
Check if the provided sizes match.
Definition check_size_match.hpp:24

stan::math::beta
fvar< T > beta(const fvar< T > &x1, const fvar< T > &x2)
Return fvar with the beta function applied to the specified arguments and its gradient.
Definition beta.hpp:51

stan::math::make_partials_propagator
auto make_partials_propagator(Ops &&... ops)
Construct a partials_propagator.
Definition partials_propagator.hpp:119

stan::partials_return_t
typename partials_return_type< Args... >::type partials_return_t
Definition partials_return_type.hpp:44

stan
The lgamma implementation in stan-math is based on either the reentrant safe lgamma_r implementation ...
Definition unit_vector_constrain.hpp:15

neg_binomial_2_log_glm_lpmf.hpp

plain_type.hpp

multiply.hpp

size.hpp

operands_and_partials.hpp

err.hpp

digamma.hpp

lgamma.hpp

multiply_log.hpp

size.hpp

sum.hpp

value_of_rec.hpp

meta.hpp

stan::is_constant
Metaprogramming struct to detect whether a given type is constant in the mathematical sense (not the ...
Definition is_constant.hpp:30

stan::is_stan_scalar
Checks if decayed type is a var, fvar, or arithmetic.
Definition is_stan_scalar.hpp:29

stan::math::conjunction
Extends std::true_type when instantiated with zero or more template parameters, all of which extend t...
Definition conjunction.hpp:14

stan::math::include_summand
Template metaprogram to calculate whether a summand needs to be included in a proportional (log) prob...
Definition include_summand.hpp:39

to_ref.hpp