math/multi__student__t__cholesky__lpdf_8hpp_source.html

#ifndef STAN_MATH_PRIM_PROB_MULTI_STUDENT_T_CHOLESKY_LPDF_HPP

#define STAN_MATH_PRIM_PROB_MULTI_STUDENT_T_CHOLESKY_LPDF_HPP


#include <stan/math/prim/meta.hpp>

#include <stan/math/prim/err.hpp>

#include <stan/math/prim/fun/as_column_vector_or_scalar.hpp>

#include <stan/math/prim/fun/columns_dot_self.hpp>

#include <stan/math/prim/fun/constants.hpp>

#include <stan/math/prim/fun/digamma.hpp>

#include <stan/math/prim/fun/dot_product.hpp>

#include <stan/math/prim/fun/dot_self.hpp>

#include <stan/math/prim/fun/inv.hpp>

#include <stan/math/prim/fun/is_inf.hpp>

#include <stan/math/prim/fun/log.hpp>

#include <stan/math/prim/fun/log1p.hpp>

#include <stan/math/prim/fun/lgamma.hpp>

#include <stan/math/prim/fun/max_size_mvt.hpp>

#include <stan/math/prim/fun/mdivide_left_tri.hpp>

#include <stan/math/prim/fun/mdivide_right_tri.hpp>

#include <stan/math/prim/fun/size_mvt.hpp>

#include <stan/math/prim/fun/to_ref.hpp>

#include <stan/math/prim/fun/vector_seq_view.hpp>

#include <stan/math/prim/prob/multi_normal_cholesky_lpdf.hpp>

#include <stan/math/prim/functor/partials_propagator.hpp>

#include <cmath>

#include <cstdlib>

#include <iostream>


namespace stan {

namespace math {

/**
 * The log of the multivariate Student-t density for the given y, mu, nu and
 * a Cholesky factor L of the scale matrix, evaluated over a sequence of
 * (y, mu) pairs and summed.
 *
 * This overload is selected when not all of `T_y`, `T_dof`, `T_loc` satisfy
 * the vector-of-scalars requirement, i.e. it handles inputs that are
 * traversed through `vector_seq_view`.
 *
 * @tparam propto when true, summands that do not depend on any autodiff
 *   argument are dropped (decided through `include_summand`)
 * @tparam T_y type of the random variable(s)
 * @tparam T_dof type of the degrees of freedom
 * @tparam T_loc type of the location(s)
 * @tparam T_covar type of the Cholesky factor of the scale matrix
 * @param y random variable, one vector or a sequence of vectors
 * @param nu degrees of freedom; must be positive, finite and not NaN
 * @param mu location, one vector or a sequence of vectors; must be finite
 * @param L Cholesky factor of the scale matrix; must pass
 *   `check_cholesky_factor` and have as many rows and columns as y has
 *   elements
 * @return the summed log density (0 if y, mu or L is empty)
 * @throw whatever the `check_*` helpers throw when an argument is invalid
 *   or the sizes are inconsistent (exception types are not visible here)
 */
template <
    bool propto, typename T_y, typename T_dof, typename T_loc, typename T_covar,
    require_any_not_vector_vt<is_stan_scalar, T_y, T_dof, T_loc>* = nullptr,
    require_all_not_nonscalar_prim_or_rev_kernel_expression_t<
        T_y, T_loc, T_covar>* = nullptr>
inline return_type_t<T_y, T_dof, T_loc, T_covar> multi_student_t_cholesky_lpdf(
    const T_y& y, const T_dof& nu, const T_loc& mu, const T_covar& L) {
  static constexpr const char* function = "multi_student_t_cholesky";
  using T_covar_elem = typename scalar_type<T_covar>::type;
  using T_return = return_type_t<T_y, T_dof, T_loc, T_covar>;
  using T_partials_return = partials_return_t<T_y, T_dof, T_loc, T_covar>;
  using matrix_partials_t
      = Eigen::Matrix<T_partials_return, Eigen::Dynamic, Eigen::Dynamic>;
  using vector_partials_t = Eigen::Matrix<T_partials_return, Eigen::Dynamic, 1>;
  using row_vector_partials_t
      = Eigen::Matrix<T_partials_return, 1, Eigen::Dynamic>;
  using T_y_ref = ref_type_t<T_y>;
  using T_nu_ref = ref_type_t<T_dof>;
  using T_mu_ref = ref_type_t<T_loc>;
  using T_L_ref = ref_type_t<T_covar>;

  check_consistent_sizes_mvt(function, "y", y, "mu", mu);
  size_t num_y = size_mvt(y);
  size_t num_mu = size_mvt(mu);

  // Nothing to evaluate when either sequence is empty.
  if (num_y == 0 || num_mu == 0) {
    return 0;
  }

  T_y_ref y_ref = y;
  T_nu_ref nu_ref = nu;
  T_mu_ref mu_ref = mu;
  T_L_ref L_ref = L;
  vector_seq_view<T_y_ref> y_vec(y_ref);
  vector_seq_view<T_mu_ref> mu_vec(mu_ref);
  const size_t size_vec = max_size_mvt(y_ref, mu_ref);

  check_not_nan(function, "Degrees of freedom parameter", nu_ref);
  check_positive(function, "Degrees of freedom parameter", nu_ref);
  check_finite(function, "Degrees of freedom parameter", nu_ref);
  check_cholesky_factor(function, "scale parameter", L_ref);

  const int size_y = y_vec[0].size();
  const int size_mu = mu_vec[0].size();
  const int num_dims = L.rows();

  if (unlikely(num_dims == 0)) {
    return T_return(0);
  }

  // Every vector inside a sequence must have the same length as its
  // predecessor.
  for (size_t i = 1, size_mvt_y = num_y; i < size_mvt_y; i++) {
    check_size_match(
        function, "Size of one of the vectors of the random variable",
        y_vec[i].size(), "Size of another vector of the random variable",
        y_vec[i - 1].size());
  }

  for (size_t i = 1, size_mvt_mu = num_mu; i < size_mvt_mu; i++) {
    check_size_match(function,
                     "Size of one of the vectors "
                     "of the location variable",
                     mu_vec[i].size(),
                     "Size of another vector of "
                     "the location variable",
                     mu_vec[i - 1].size());
  }

  // This check compares the *location* size against L, so it is labelled as
  // such (it was previously reported as the random variable).
  check_size_match(function, "Size of location parameter", size_mu,
                   "rows of scale parameter", L.rows());
  check_size_match(function, "Size of random variable", size_y,
                   "size of location parameter", size_mu);
  check_size_match(function, "Size of random variable", size_y,
                   "rows of scale parameter", L.rows());
  check_size_match(function, "Size of random variable", size_y,
                   "columns of scale parameter", L.cols());

  for (size_t i = 0; i < size_vec; i++) {
    check_finite(function, "Location parameter", mu_vec[i]);
    check_not_nan(function, "Random variable", y_vec[i]);
  }

  auto ops_partials = make_partials_propagator(y_ref, nu_ref, mu_ref, L_ref);

  T_partials_return lp(0);

  // Constant term, one contribution per evaluated (y, mu) pair.
  if constexpr (include_summand<propto>::value) {
    lp += -0.5 * num_dims * LOG_PI * size_vec;
  }

  if constexpr (include_summand<propto, T_y, T_dof, T_loc,
                                T_covar_elem>::value) {
    T_partials_return nu_val = value_of(nu_ref);
    T_partials_return inv_nu = inv(nu_val);
    T_partials_return nu_plus_dims = nu_val + num_dims;
    matrix_partials_t L_val = value_of(L_ref);
    matrix_partials_t L_deriv;

    // The digamma difference is loop invariant and only enters the partial
    // with respect to nu, so it is evaluated only when nu is an autodiff
    // type (matching the single-vector overload).
    [[maybe_unused]] T_partials_return digamma_vals(0);
    if constexpr (is_autodiff_v<T_dof>) {
      const T_partials_return half_nu = 0.5 * nu_val;
      digamma_vals = digamma(half_nu + 0.5 * num_dims) - digamma(half_nu);
    }

    if constexpr (include_summand<propto, T_dof>::value) {
      lp += lgamma(0.5 * nu_plus_dims) * size_vec;
      lp += -lgamma(0.5 * nu_val) * size_vec;
      lp += -(0.5 * num_dims) * log(nu_val) * size_vec;
    }

    if constexpr (include_summand<propto, T_covar_elem>::value) {
      lp += -sum(log(L_val.diagonal())) * size_vec;
    }

    T_partials_return sum_lp_vec(0.0);
    row_vector_partials_t half(size_y);
    vector_partials_t y_val_minus_mu_val(size_y);
    vector_partials_t scaled_diff(size_y);

    for (size_t i = 0; i < size_vec; i++) {
      decltype(auto) y_val = as_value_column_vector_or_scalar(y_vec[i]);
      decltype(auto) mu_val = as_value_column_vector_or_scalar(mu_vec[i]);
      y_val_minus_mu_val = eval(y_val - mu_val);

      // half: residual divided on the left by lower-triangular L, stored as
      // a row vector.
      half = mdivide_left_tri<Eigen::Lower>(L_val, y_val_minus_mu_val)
                 .transpose();

      // scaled_diff: half divided on the right by L, stored as a column.
      scaled_diff = mdivide_right_tri<Eigen::Lower>(half, L_val).transpose();

      // Quadratic form of the residual.
      T_partials_return dot_half = dot_self(half);

      if constexpr (is_autodiff_v<T_dof>) {
        // Must be computed before scaled_diff is rescaled below.
        T_partials_return G = dot_product(scaled_diff, y_val_minus_mu_val);
        partials<1>(ops_partials)[i] += 0.5
                                        * (digamma_vals - log1p(G * inv_nu)
                                           + (G - num_dims) / (G + nu_val));
      }

      // From here on scaled_diff carries the factor (nu + d) / (nu + Q) that
      // is shared by the y, mu and L partials.
      scaled_diff *= nu_plus_dims / (dot_half + nu_val);

      if constexpr (is_autodiff_v<T_y>) {
        partials_vec<0>(ops_partials)[i] += -scaled_diff;
      }

      if constexpr (is_autodiff_v<T_loc>) {
        partials_vec<2>(ops_partials)[i] += scaled_diff;
      }

      if constexpr (is_autodiff_v<T_covar_elem>) {
        // L_deriv starts unsized, so the first iteration assigns and the
        // following ones accumulate.
        if (i == 0) {
          L_deriv
              = (scaled_diff * half).template triangularView<Eigen::Lower>();
        } else {
          L_deriv
              += (scaled_diff * half).template triangularView<Eigen::Lower>();
        }
      }

      sum_lp_vec += log1p(dot_half * inv_nu);
    }

    if constexpr (is_autodiff_v<T_covar_elem>) {
      // Derivative of the -sum(log(diag(L))) term, once per evaluated pair.
      L_deriv.diagonal().array() -= size_vec / L_val.diagonal().array();
      partials<3>(ops_partials) += L_deriv;
    }
    lp += -0.5 * nu_plus_dims * sum_lp_vec;
  }
  return ops_partials.build(lp);
}


/**
 * The log of the multivariate Student-t density for the given y, mu, nu and
 * a Cholesky factor L of the scale matrix, for a single random vector.
 *
 * This overload is selected when `T_y`, `T_dof` and `T_loc` all satisfy the
 * vector-of-scalars requirement.
 *
 * @tparam propto when true, summands that do not depend on any autodiff
 *   argument are dropped (decided through `include_summand`)
 * @tparam T_y type of the random variable
 * @tparam T_dof type of the degrees of freedom
 * @tparam T_loc type of the location
 * @tparam T_covar type of the Cholesky factor of the scale matrix
 * @param y random variable; must not contain NaN
 * @param nu degrees of freedom; must be positive, finite and not NaN
 * @param mu location; must be finite and have the same size as y
 * @param L Cholesky factor of the scale matrix; must pass
 *   `check_cholesky_factor` and be size(y) by size(y)
 * @return the log density (0 if y is empty)
 * @throw whatever the `check_*` helpers throw when an argument is invalid
 *   or the sizes are inconsistent (exception types are not visible here)
 */
template <bool propto, typename T_y, typename T_dof, typename T_loc,
          typename T_covar,
          require_all_vector_vt<is_stan_scalar, T_y, T_dof, T_loc>* = nullptr,
          require_all_not_nonscalar_prim_or_rev_kernel_expression_t<
              T_y, T_dof, T_loc, T_covar>* = nullptr>
inline return_type_t<T_y, T_dof, T_loc, T_covar> multi_student_t_cholesky_lpdf(
    const T_y& y, const T_dof& nu, const T_loc& mu, const T_covar& L) {
  static constexpr const char* function = "multi_student_t_cholesky";
  using T_covar_elem = typename scalar_type<T_covar>::type;
  using T_return = return_type_t<T_y, T_dof, T_loc, T_covar>;
  using T_partials_return = partials_return_t<T_y, T_dof, T_loc, T_covar>;
  using matrix_partials_t
      = Eigen::Matrix<T_partials_return, Eigen::Dynamic, Eigen::Dynamic>;
  using vector_partials_t = Eigen::Matrix<T_partials_return, Eigen::Dynamic, 1>;
  using row_vector_partials_t
      = Eigen::Matrix<T_partials_return, 1, Eigen::Dynamic>;
  using T_y_ref = ref_type_t<T_y>;
  using T_nu_ref = ref_type_t<T_dof>;
  using T_mu_ref = ref_type_t<T_loc>;
  using T_L_ref = ref_type_t<T_covar>;

  T_y_ref y_ref = y;
  T_nu_ref nu_ref = nu;
  T_mu_ref mu_ref = mu;
  T_L_ref L_ref = L;
  vector_partials_t y_val = as_value_column_vector_or_scalar(y_ref);
  vector_partials_t mu_val = as_value_column_vector_or_scalar(mu_ref);

  const int size_y = y_ref.size();
  const int size_mu = mu_ref.size();

  if (unlikely(size_y == 0)) {
    return T_return(0);
  }

  check_not_nan(function, "Degrees of freedom parameter", nu_ref);
  check_positive(function, "Degrees of freedom parameter", nu_ref);
  check_finite(function, "Degrees of freedom parameter", nu_ref);

  // This check compares the *location* size against L, so it is labelled as
  // such (it was previously reported as the random variable).
  check_size_match(function, "Size of location parameter", size_mu,
                   "rows of scale parameter", L.rows());
  check_size_match(function, "Size of random variable", size_y,
                   "size of location parameter", size_mu);
  check_size_match(function, "Size of random variable", size_y,
                   "rows of scale parameter", L.rows());
  check_size_match(function, "Size of random variable", size_y,
                   "columns of scale parameter", L.cols());

  check_finite(function, "Location parameter", mu_val);
  check_not_nan(function, "Random variable", y_val);

  check_cholesky_factor(function, "scale parameter", L_ref);

  T_partials_return lp(0);

  auto ops_partials = make_partials_propagator(y_ref, nu_ref, mu_ref, L_ref);

  // Constant term.
  if constexpr (include_summand<propto>::value) {
    lp += -0.5 * size_y * LOG_PI;
  }

  if constexpr (include_summand<propto, T_y, T_dof, T_loc,
                                T_covar_elem>::value) {
    T_partials_return nu_val = value_of(nu_ref);
    T_partials_return inv_nu = inv(nu_val);
    T_partials_return nu_plus_dims = nu_val + size_y;
    vector_partials_t y_val_minus_mu_val = eval(y_val - mu_val);

    matrix_partials_t L_val = value_of(L_ref);
    // half: residual divided on the left by lower-triangular L (row vector).
    row_vector_partials_t half
        = mdivide_left_tri<Eigen::Lower>(L_val, y_val_minus_mu_val).transpose();
    // scaled_diff: half divided on the right by L (column vector).
    vector_partials_t scaled_diff
        = mdivide_right_tri<Eigen::Lower>(half, L_val).transpose();
    // Quadratic form Q of the residual.
    T_partials_return dot_half = dot_self(half);

    if constexpr (is_autodiff_v<T_dof>) {
      T_partials_return half_nu = 0.5 * nu_val;
      T_partials_return digamma_vals
          = digamma(half_nu + 0.5 * size_y) - digamma(half_nu);
      T_partials_return G = dot_product(scaled_diff, y_val_minus_mu_val);

      partials<1>(ops_partials)
          += 0.5
             * (digamma_vals - log1p(G * inv_nu) + (G - size_y) / (G + nu_val));
    }

    if constexpr (include_summand<propto, T_dof>::value) {
      lp += lgamma(0.5 * (nu_val + size_y));
      lp += -lgamma(0.5 * nu_val);
      lp += -0.5 * size_y * log(nu_val);
    }

    if constexpr (include_summand<propto, T_covar_elem>::value) {
      lp += -sum(log(L_val.diagonal()));
    }

    if constexpr (is_any_autodiff_v<T_y, T_loc, T_covar_elem>) {
      // Common factor (nu + d) / (nu + Q) from differentiating
      // -0.5 * (nu + d) * log1p(Q / nu) with respect to Q.
      T_partials_return scale_val = nu_plus_dims / (dot_half + nu_val);

      if constexpr (is_autodiff_v<T_y>) {
        partials<0>(ops_partials) += -scaled_diff * scale_val;
      }
      if constexpr (is_autodiff_v<T_loc>) {
        partials<2>(ops_partials) += scaled_diff * scale_val;
      }
      if constexpr (is_autodiff_v<T_covar_elem>) {
        matrix_partials_t L_deriv
            = (scaled_diff * half).template triangularView<Eigen::Lower>();
        // The outer product is dQ/dL up to a constant, so it needs the same
        // scale_val factor as the y and mu partials; without it the gradient
        // with respect to L is that of a multivariate normal. The diagonal
        // correction below comes from -sum(log(diag(L))) and is not scaled.
        L_deriv *= scale_val;
        L_deriv.diagonal().array() -= 1 / L_val.diagonal().array();
        edge<3>(ops_partials).partials_ += L_deriv;
      }
    }

    lp += -0.5 * nu_plus_dims * log1p(dot_half * inv_nu);
  }

  return ops_partials.build(lp);
}


/**
 * Convenience overload that forwards to
 * `multi_student_t_cholesky_lpdf<false>`, i.e. with `propto` fixed to false.
 *
 * @param y random variable
 * @param nu degrees of freedom
 * @param mu location
 * @param L Cholesky factor of the scale matrix
 * @return whatever the `propto = false` overload returns for these arguments
 */
template <typename T_y, typename T_dof, typename T_loc, typename T_covar>
inline return_type_t<T_y, T_dof, T_loc, T_covar> multi_student_t_cholesky_lpdf(
    const T_y& y, const T_dof& nu, const T_loc& mu, const T_covar& L) {
  constexpr bool propto_flag = false;
  return multi_student_t_cholesky_lpdf<propto_flag>(y, nu, mu, L);
}


}  // namespace math

}  // namespace stan

#endif

stan::vector_seq_view
This class provides a low-cost wrapper for situations where you either need an Eigen Vector or RowVec...
Definition vector_seq_view.hpp:32

unlikely
#define unlikely(x)
Definition compiler_attributes.hpp:40

constants.hpp

stan::math::multi_student_t_cholesky_lpdf
return_type_t< T_y, T_dof, T_loc, T_covar > multi_student_t_cholesky_lpdf(const T_y &y, const T_dof &nu, const T_loc &mu, const T_covar &L)
The log of the multivariate student t density for the given y, mu, nu, and a Cholesky factor L of the...
Definition multi_student_t_cholesky_lpdf.hpp:57

stan::require_all_not_nonscalar_prim_or_rev_kernel_expression_t
require_all_not_t< is_nonscalar_prim_or_rev_kernel_expression< std::decay_t< Types > >... > require_all_not_nonscalar_prim_or_rev_kernel_expression_t
Require none of the types satisfy is_nonscalar_prim_or_rev_kernel_expression.
Definition is_kernel_expression.hpp:191

stan::math::size_mvt
int64_t size_mvt(const ScalarT &)
Provides the size of a multivariate argument.
Definition size_mvt.hpp:25

stan::return_type_t
typename return_type< Ts... >::type return_type_t
Convenience type for the return type of the specified template parameters.
Definition return_type.hpp:218

stan::math::size
int64_t size(const T &m)
Returns the size (number of the elements) of a matrix_cl or var_value<matrix_cl<T>>.
Definition size.hpp:19

stan::require_all_vector_vt
require_all_t< container_type_check_base< is_vector, value_type_t, TypeCheck, Check >... > require_all_vector_vt
Require all of the types satisfy is_vector.
Definition is_vector.hpp:512

max_size_mvt.hpp

mdivide_right_tri.hpp

stan::math::check_consistent_sizes_mvt
void check_consistent_sizes_mvt(const char *)
Trivial no input case, this function is a no-op.
Definition check_consistent_sizes_mvt.hpp:15

stan::math::eval
T eval(T &&arg)
Inputs which have a plain_type equal to their own type are forwarded unmodified (for Eigen expressions ...
Definition eval.hpp:20

stan::math::value_of
T value_of(const fvar< T > &v)
Return the value of the specified variable.
Definition value_of.hpp:18

stan::math::log
fvar< T > log(const fvar< T > &x)
Definition log.hpp:18

stan::math::max_size_mvt
int64_t max_size_mvt(const T1 &x1, const Ts &... xs)
Calculate the size of the largest multivariate input.
Definition max_size_mvt.hpp:25

stan::math::LOG_PI
static constexpr double LOG_PI
The natural logarithm of \( \pi \), \( \log \pi \).
Definition constants.hpp:86

stan::math::log1p
fvar< T > log1p(const fvar< T > &x)
Definition log1p.hpp:12

stan::math::check_finite
void check_finite(const char *function, const char *name, const T_y &y)
Return true if all values in y are finite.
Definition check_finite.hpp:28

stan::math::lgamma
fvar< T > lgamma(const fvar< T > &x)
Return the natural logarithm of the gamma function applied to the specified argument.
Definition lgamma.hpp:21

stan::math::check_not_nan
void check_not_nan(const char *function, const char *name, const T_y &y)
Check if y is not NaN.
Definition check_not_nan.hpp:26

stan::math::sum
auto sum(const std::vector< T > &m)
Return the sum of the entries of the specified standard vector.
Definition sum.hpp:23

stan::math::check_cholesky_factor
void check_cholesky_factor(const char *function, const char *name, const Mat &y)
Throw an exception if the specified matrix is not a valid Cholesky factor.
Definition check_cholesky_factor.hpp:33

stan::math::check_positive
void check_positive(const char *function, const char *name, const T_y &y)
Check if y is positive.
Definition check_positive.hpp:27

stan::math::dot_self
auto dot_self(const T &a)
Returns squared norm of a vector or matrix.
Definition dot_self.hpp:21

stan::math::check_size_match
void check_size_match(const char *function, const char *name_i, T_size1 i, const char *name_j, T_size2 j)
Check if the provided sizes match.
Definition check_size_match.hpp:24

stan::math::dot_product
auto dot_product(const T_a &a, const T_b &b)
Returns the dot product of the specified vectors.
Definition dot_product.hpp:26

stan::math::as_value_column_vector_or_scalar
auto as_value_column_vector_or_scalar(T &&a)
Extract values from input argument and transform to a column vector.
Definition as_value_column_vector_or_scalar.hpp:23

stan::math::inv
fvar< T > inv(const fvar< T > &x)
Definition inv.hpp:13

stan::math::make_partials_propagator
auto make_partials_propagator(Ops &&... ops)
Construct a partials_propagator.
Definition partials_propagator.hpp:118

stan::math::digamma
fvar< T > digamma(const fvar< T > &x)
Return the derivative of the log gamma function at the specified argument.
Definition digamma.hpp:23

stan::ref_type_t
typename ref_type_if< true, T >::type ref_type_t
Definition ref_type.hpp:56

stan::partials_return_t
typename partials_return_type< Args... >::type partials_return_t
Definition partials_return_type.hpp:44

stan
The lgamma implementation in stan-math is based on either the reentrant safe lgamma_r implementation ...
Definition unit_vector_constrain.hpp:15

err.hpp

as_column_vector_or_scalar.hpp

columns_dot_self.hpp

digamma.hpp

dot_product.hpp

dot_self.hpp

inv.hpp

is_inf.hpp

lgamma.hpp

log1p.hpp

log.hpp

mdivide_left_tri.hpp

partials_propagator.hpp

meta.hpp

multi_normal_cholesky_lpdf.hpp

size_mvt.hpp

stan::math::include_summand
Template metaprogram to calculate whether a summand needs to be included in a proportional (log) prob...
Definition include_summand.hpp:39

stan::scalar_type::type
std::decay_t< T > type
Definition scalar_type.hpp:21

to_ref.hpp

vector_seq_view.hpp