math/rev_2constraint_2stochastic__column__constrain_8hpp_source.html

#ifndef STAN_MATH_REV_CONSTRAINT_STOCHASTIC_COLUMN_CONSTRAIN_HPP

#define STAN_MATH_REV_CONSTRAINT_STOCHASTIC_COLUMN_CONSTRAIN_HPP


#include <stan/math/prim/fun/Eigen.hpp>

#include <stan/math/rev/meta.hpp>

#include <stan/math/rev/core/reverse_pass_callback.hpp>

#include <stan/math/rev/core/arena_matrix.hpp>

#include <stan/math/rev/fun/value_of.hpp>

#include <stan/math/prim/constraint/stochastic_column_constrain.hpp>

#include <stan/math/rev/constraint/sum_to_zero_constrain.hpp>

#include <cmath>


namespace stan {

namespace math {


/**
 * Return a column stochastic matrix for a reverse-mode autodiff matrix.
 *
 * The constrained values are obtained by calling the value-only overload of
 * `stochastic_column_constrain` on the values of `y`. When the input is
 * non-empty, one reverse-pass callback is registered that walks the columns
 * and, for each of them, first backpropagates through the softmax and then
 * hands the result to `internal::sum_to_zero_vector_backprop`, which updates
 * the adjoints of the matching column of `y`.
 *
 * @tparam T matrix type accepted by `require_rev_matrix_t`
 * @param y unconstrained input matrix
 * @return the constrained matrix, as `plain_type_t<T>`
 */
template <typename T, require_rev_matrix_t<T>* = nullptr>
inline plain_type_t<T> stochastic_column_constrain(const T& y) {
  using ret_type = plain_type_t<T>;

  const auto n_rows = y.rows();
  const auto n_cols = y.cols();
  arena_t<T> arena_y = y;

  arena_t<ret_type> arena_x = stochastic_column_constrain(arena_y.val_op());

  // Nothing to differentiate for an empty input: skip the callback.
  if (unlikely(n_rows == 0 || n_cols == 0)) {
    return arena_x;
  }

  reverse_pass_callback([arena_y, arena_x]() mutable {
    const auto col_count = arena_y.cols();

    auto&& vals = arena_x.val_op();
    auto&& adjs = arena_x.adj_op();

    // Scratch buffer reused for every column.
    Eigen::VectorXd softmax_input_adj(vals.rows());
    for (Eigen::Index j = 0; j < col_count; ++j) {
      // backprop for softmax: x .* x_adj - x * <x_adj, x>
      const double adj_dot_val = adjs.col(j).dot(vals.col(j));
      softmax_input_adj.noalias()
          = -vals.col(j) * adj_dot_val
            + vals.col(j).cwiseProduct(adjs.col(j));

      // backprop for sum_to_zero_constrain
      internal::sum_to_zero_vector_backprop(arena_y.col(j).adj(),
                                            softmax_input_adj);
    }
  });

  return arena_x;
}


/**
 * Return a column stochastic matrix for a reverse-mode autodiff matrix and
 * increment `lp`.
 *
 * The constrained values and the increment for `lp` both come from the
 * value-only overload of `stochastic_column_constrain`, called with a local
 * `double` accumulator that is then added to `lp` (presumably the log
 * Jacobian determinant of the transform -- confirm against the value-only
 * overload). When the input is non-empty, one reverse-pass callback is
 * registered; for every column it backpropagates through the softmax,
 * including the contribution of the adjoint of `lp`, and then calls
 * `internal::sum_to_zero_vector_backprop` to update the adjoints of the
 * matching column of `y`.
 *
 * @tparam T matrix type accepted by `require_rev_matrix_t`
 * @param y unconstrained input matrix
 * @param[in,out] lp accumulator that is incremented by this call
 * @return the constrained matrix, as `plain_type_t<T>`
 */
template <typename T, require_rev_matrix_t<T>* = nullptr>
inline plain_type_t<T> stochastic_column_constrain(const T& y,
                                                   scalar_type_t<T>& lp) {
  using ret_type = plain_type_t<T>;

  const auto n_rows = y.rows();
  const auto n_cols = y.cols();
  arena_t<T> arena_y = y;

  double lp_increment = 0;
  arena_t<ret_type> arena_x
      = stochastic_column_constrain(arena_y.val_op(), lp_increment);
  lp += lp_increment;

  // Nothing to differentiate for an empty input: skip the callback.
  if (unlikely(n_rows == 0 || n_cols == 0)) {
    return arena_x;
  }

  reverse_pass_callback([arena_y, arena_x, lp]() mutable {
    const auto col_count = arena_y.cols();

    auto&& vals = arena_x.val_op();
    auto&& adjs = arena_x.adj_op();

    const auto row_count = vals.rows();

    // Scratch buffer reused for every column.
    Eigen::VectorXd softmax_input_adj(vals.rows());
    for (Eigen::Index j = 0; j < col_count; ++j) {
      // backprop for softmax; the adjoint of lp is read once per column,
      // before this column's adjoints of y are updated
      const double lp_adj = lp.adj();
      const double scale = adjs.col(j).dot(vals.col(j)) + lp_adj * row_count;
      softmax_input_adj.noalias()
          = -vals.col(j) * scale
            + (vals.col(j).cwiseProduct(adjs.col(j)).array() + lp_adj)
                  .matrix();

      // backprop for sum_to_zero_constrain
      internal::sum_to_zero_vector_backprop(arena_y.col(j).adj(),
                                            softmax_input_adj);
    }
  });

  return arena_x;
}


}  // namespace math

}  // namespace stan

#endif

Eigen.hpp

arena_matrix.hpp

unlikely
#define unlikely(x)
Definition compiler_attributes.hpp:31

stan::math::internal::sum_to_zero_vector_backprop
void sum_to_zero_vector_backprop(T &&y_adj, const Eigen::VectorXd &z_adj)
The reverse pass backprop for the sum_to_zero_constrain on vectors.
Definition sum_to_zero_constrain.hpp:28

stan::math::reverse_pass_callback
void reverse_pass_callback(F &&functor)
Puts a callback on the autodiff stack to be called in reverse pass.
Definition reverse_pass_callback.hpp:38

stan::math::stochastic_column_constrain
plain_type_t< Mat > stochastic_column_constrain(const Mat &y)
Return a column stochastic matrix.
Definition stochastic_column_constrain.hpp:24

stan::plain_type_t
typename plain_type< std::decay_t< T > >::type plain_type_t
Definition plain_type.hpp:23

stan::scalar_type_t
typename scalar_type< T >::type scalar_type_t
Definition scalar_type.hpp:25

stan::arena_t
typename internal::arena_type_impl< std::decay_t< T > >::type arena_t
Determines a type that can be used in place of T that does any dynamic allocations on the AD stack.
Definition arena_type.hpp:60

stan
The lgamma implementation in stan-math is based on either the reentrant safe lgamma_r implementation ...
Definition unit_vector_constrain.hpp:15

stochastic_column_constrain.hpp

sum_to_zero_constrain.hpp

value_of.hpp

meta.hpp

reverse_pass_callback.hpp