math/opencl_2prim_2ordered__logistic__lpmf_8hpp_source.html

#ifndef STAN_MATH_OPENCL_PRIM_ORDERED_LOGISTIC_LPMF_HPP

#define STAN_MATH_OPENCL_PRIM_ORDERED_LOGISTIC_LPMF_HPP

#ifdef STAN_OPENCL


#include <stan/math/opencl/kernel_generator.hpp>

#include <stan/math/opencl/kernels/add.hpp>

#include <stan/math/opencl/kernels/ordered_logistic_lpmf.hpp>

#include <stan/math/prim/meta.hpp>

#include <stan/math/prim/err.hpp>

#include <stan/math/prim/fun/constants.hpp>

#include <stan/math/prim/fun/elt_divide.hpp>

#include <stan/math/prim/fun/elt_multiply.hpp>

#include <stan/math/prim/functor/partials_propagator.hpp>

#include <stan/math/prim/err/constraint_tolerance.hpp>


namespace stan {

namespace math {


/** \ingroup opencl
 * OpenCL overload of the ordered logistic log probability mass function.
 *
 * The per-work-group partial log probabilities (and, when required, the
 * partial derivatives with respect to `lambda` and `cuts`) are computed by
 * the `opencl_kernels::ordered_logistic` kernel and then reduced here.
 *
 * Size conventions used by this function:
 *  - `cuts` has one column per cutpoint set and `N_classes - 1` rows.
 *  - If `cuts` has more than one column, the number of columns must equal
 *    the number of instances (`max_size(y, lambda)`).
 *  - If `cuts` has a single column and there is more than one instance, the
 *    same cutpoints are used for every instance.
 *
 * @tparam propto used with `include_summand`; when no summand needs to be
 *   included for `T_loc_cl` and `T_cuts_cl` the function returns 0
 * @tparam T_y_cl type of the outcome(s); scalar or kernel expression
 * @tparam T_loc_cl type of the location(s)
 * @tparam T_cuts_cl type of the cutpoints
 * @param y outcome(s); validated to lie in `[1, N_classes]` only when the
 *   resulting log probability is not finite
 * @param lambda location(s); validated to be finite only when the resulting
 *   log probability is not finite
 * @param cuts cutpoints; each column must be finite and strictly increasing
 * @return log probability (with partials attached when any input is not
 *   constant), or 0 if there are no instances, no cutpoints, or no summand
 *   needs to be included
 * @throw reports an error through `check_size_match` if sizes are
 *   inconsistent, through `check_cl` if the cutpoints, `y` or `lambda` are
 *   invalid, and through `check_opencl_error` if the kernel launch fails
 */
template <bool propto, typename T_y_cl, typename T_loc_cl, typename T_cuts_cl,
          require_all_prim_or_rev_kernel_expression_t<T_y_cl, T_loc_cl,
                                                      T_cuts_cl>* = nullptr>
inline return_type_t<T_y_cl, T_loc_cl, T_cuts_cl> ordered_logistic_lpmf(
    const T_y_cl& y, const T_loc_cl& lambda, const T_cuts_cl& cuts) {
  constexpr bool is_y_vector = !is_stan_scalar<T_y_cl>::value;
  static constexpr const char* function = "ordered_logistic_lpmf(OpenCL)";

  // A single outcome is allowed to pair with any number of locations.
  if (size(y) != 1) {
    check_size_match(function, "Size of ", "y", math::size(y), "Size of",
                     "lambda", math::size(lambda));
  }

  int N_instances = max_size(y, lambda);
  int N_classes = cuts.rows() + 1;
  int N_cut_sets = cuts.cols();

  // Several cutpoint sets are only meaningful as one set per instance.
  if (N_cut_sets > 1) {
    check_size_match(function, "Length of lambda variables ", N_instances,
                     "Number of cutpoint vectors ", N_cut_sets);
  }
  if (N_instances == 0 || N_classes == 1) {
    return 0.0;
  }

  // From here on there is at least one cutpoint per set (N_classes >= 2).
  const auto& cuts_val = eval(value_of(cuts));
  if (N_classes > 2) {
    // Two or more cutpoints: compare every cutpoint with its successor.
    // Together the head and tail blocks cover every row, so checking both
    // for finiteness covers all cutpoints.
    auto cuts_head
        = block_zero_based(cuts_val, 0, 0, cuts.rows() - 1, N_cut_sets);
    auto cuts_tail
        = block_zero_based(cuts_val, 1, 0, cuts.rows() - 1, N_cut_sets);
    check_cl(function, "Cuts", cuts_head, "ordered and finite")
        = cuts_head < cuts_tail && isfinite(cuts_head) && isfinite(cuts_tail);
  } else {
    // Exactly one cutpoint per set: there is nothing to order, and the
    // head/tail blocks above would be empty, so check finiteness directly.
    check_cl(function, "Cuts", cuts_val, "finite") = isfinite(cuts_val);
  }

  if (!include_summand<propto, T_loc_cl, T_cuts_cl>::value) {
    return 0.0;
  }

  const auto& y_val = eval(value_of(y));
  const auto& lambda_val = eval(value_of(lambda));

  const auto& y_val_cl = to_matrix_cl(y_val);

  const int local_size
      = opencl_kernels::ordered_logistic.get_option("LOCAL_SIZE_");
  // Number of work groups needed to cover all instances (ceiling division).
  const int wgs = (N_instances + local_size - 1) / local_size;

  const bool need_lambda_derivative = !is_constant_all<T_loc_cl>::value;
  const bool need_cuts_derivative = !is_constant_all<T_cuts_cl>::value;
  // One shared cutpoint set used by several instances.
  const bool need_broadcasting = N_cut_sets == 1 && N_instances != 1;

  // Output buffers; derivative buffers get zero columns when not needed.
  // When broadcasting, the cutpoint derivative has one column per work group
  // and is summed row-wise after the kernel has run.
  matrix_cl<double> logp_cl(wgs, 1);
  matrix_cl<double> lambda_derivative_cl(N_instances,
                                         need_lambda_derivative ? 1 : 0);
  matrix_cl<double> cuts_derivative_cl(
      N_classes - 1,
      need_cuts_derivative ? (need_broadcasting ? wgs : N_cut_sets) : 0);

  try {
    opencl_kernels::ordered_logistic(
        cl::NDRange(local_size * wgs), cl::NDRange(local_size), logp_cl,
        lambda_derivative_cl, cuts_derivative_cl, y_val_cl, lambda_val,
        cuts_val, N_instances, N_classes, is_y_vector, !need_broadcasting,
        need_lambda_derivative, need_cuts_derivative);
  } catch (const cl::Error& e) {
    check_opencl_error(function, e);
  }

  double logp = sum(from_matrix_cl(logp_cl));

  // The inputs y and lambda are only validated when the result is not
  // finite, so the common (valid) path avoids the extra checks.
  // NOTE(review): the message says "between 0 and number of classes" while
  // the condition requires y >= 1 -- confirm which one is intended.
  if (!std::isfinite(logp)) {
    results(check_cl(function, "Vector of dependent variables", y_val,
                     "between 0 and number of classes"),
            check_cl(function, "lambda vector", lambda_val, "finite"))
        = expressions(y_val >= 1 && y_val <= static_cast<int>(N_classes),
                      isfinite(lambda_val));
  }

  auto ops_partials = make_partials_propagator(lambda, cuts);

  if (!is_constant_all<T_loc_cl>::value) {
    partials<0>(ops_partials) = lambda_derivative_cl;
  }
  if (!is_constant_all<T_cuts_cl>::value) {
    if (need_broadcasting) {
      // Collapse the per-work-group columns into a single derivative column.
      partials<1>(ops_partials) = rowwise_sum(cuts_derivative_cl);
    } else {
      partials<1>(ops_partials) = std::move(cuts_derivative_cl);
    }
  }
  return ops_partials.build(logp);
}


}  // namespace math

}  // namespace stan

#endif

#endif

stan::math::matrix_cl
Represents an arithmetic matrix on the OpenCL device.
Definition matrix_cl.hpp:47

constants.hpp

constraint_tolerance.hpp

stan::math::check_opencl_error
void check_opencl_error(const char *function, const cl::Error &e)
Throws a domain error specifying the OpenCL error that occurred.
Definition check_opencl.hpp:23

stan::math::isfinite
isfinite_< as_operation_cl_t< T > > isfinite(T &&a)
Definition elt_function_cl.hpp:332

stan::math::check_cl
auto check_cl(const char *function, const char *var_name, T &&y, const char *must_be)
Constructs a check on opencl matrix or expression.
Definition check_cl.hpp:219

stan::math::block_zero_based
auto block_zero_based(T &&a, int start_row, int start_col, int rows, int cols)
Block of a kernel generator expression.
Definition block_zero_based.hpp:340

stan::math::results
results_cl< T_results... > results(T_results &&... results)
Deduces types for constructing results_cl object.
Definition multi_result_kernel.hpp:668

stan::math::rowwise_sum
auto rowwise_sum(T &&a)
Rowwise sum reduction of a kernel generator expression.
Definition rowwise_reduction.hpp:330

stan::math::expressions
expressions_cl< T_expressions... > expressions(T_expressions &&... expressions)
Deduces types for constructing expressions_cl object.
Definition multi_result_kernel.hpp:289

stan::math::opencl_kernels::ordered_logistic
const kernel_cl< out_buffer, out_buffer, out_buffer, in_buffer, in_buffer, in_buffer, int, int, int, int, int, int > ordered_logistic("ordered_logistic", {log1p_exp_device_function, log1m_exp_device_function, inv_logit_device_function, ordered_logistic_kernel_code}, {{"REDUCTION_STEP_SIZE", 4}, {"LOCAL_SIZE_", 64}})
See the docs for ordered_logistic() .

stan::math::to_matrix_cl
matrix_cl< scalar_type_t< T > > to_matrix_cl(T &&src)
Copies the source Eigen matrix, std::vector or scalar to the destination matrix that is stored on the...
Definition copy.hpp:45

stan::math::ordered_logistic_lpmf
return_type_t< T_y_cl, T_loc_cl, T_cuts_cl > ordered_logistic_lpmf(const T_y_cl &y, const T_loc_cl &lambda, const T_cuts_cl &cuts)
Returns the (natural) log probability of the specified array of integers given the vector of continuo...
Definition ordered_logistic_lpmf.hpp:70

stan::math::from_matrix_cl
auto from_matrix_cl(const T &src)
Copies the source matrix that is stored on the OpenCL device to the destination Eigen matrix.
Definition copy.hpp:61

stan::require_all_prim_or_rev_kernel_expression_t
require_all_t< is_prim_or_rev_kernel_expression< std::decay_t< Types > >... > require_all_prim_or_rev_kernel_expression_t
Require type satisfies is_prim_or_rev_kernel_expression.
Definition is_kernel_expression.hpp:148

stan::return_type_t
typename return_type< Ts... >::type return_type_t
Convenience type for the return type of the specified template parameters.
Definition return_type.hpp:218

stan::math::size
int64_t size(const T &m)
Returns the size (number of the elements) of a matrix_cl or var_value<matrix_cl<T>>.
Definition size.hpp:19

kernel_generator.hpp

stan::math::e
static constexpr double e()
Return the base of the natural logarithm.
Definition constants.hpp:20

stan::math::eval
T eval(T &&arg)
Inputs which have a plain_type equal to their own type are forwarded unmodified (for Eigen expressions ...
Definition eval.hpp:20

stan::math::value_of
T value_of(const fvar< T > &v)
Return the value of the specified variable.
Definition value_of.hpp:18

stan::math::sum
auto sum(const std::vector< T > &m)
Return the sum of the entries of the specified standard vector.
Definition sum.hpp:23

stan::math::check_size_match
void check_size_match(const char *function, const char *name_i, T_size1 i, const char *name_j, T_size2 j)
Check if the provided sizes match.
Definition check_size_match.hpp:24

stan::math::max_size
int64_t max_size(const T1 &x1, const Ts &... xs)
Calculate the size of the largest input.
Definition max_size.hpp:20

stan::math::make_partials_propagator
auto make_partials_propagator(Ops &&... ops)
Construct a partials_propagator.
Definition partials_propagator.hpp:119

stan
The lgamma implementation in stan-math is based on either the reentrant safe lgamma_r implementation ...
Definition unit_vector_constrain.hpp:15

add.hpp

ordered_logistic_lpmf.hpp

err.hpp

elt_divide.hpp

elt_multiply.hpp

partials_propagator.hpp

meta.hpp

stan::is_stan_scalar
Checks if decayed type is a var, fvar, or arithmetic.
Definition is_stan_scalar.hpp:29

stan::math::conjunction
Extends std::true_type when instantiated with zero or more template parameters, all of which extend t...
Definition conjunction.hpp:14

stan::math::include_summand
Template metaprogram to calculate whether a summand needs to be included in a proportional (log) prob...
Definition include_summand.hpp:39