math/rev_2fun_2log__softmax_8hpp_source.html

#ifndef STAN_MATH_REV_FUN_LOG_SOFTMAX_HPP

#define STAN_MATH_REV_FUN_LOG_SOFTMAX_HPP


#include <stan/math/prim/fun/Eigen.hpp>

#include <stan/math/rev/core.hpp>

#include <stan/math/rev/core/typedefs.hpp>

#include <stan/math/rev/fun/softmax.hpp>

#include <stan/math/prim/meta.hpp>

#include <stan/math/prim/err.hpp>

#include <stan/math/prim/fun/to_ref.hpp>

#include <stan/math/prim/fun/typedefs.hpp>

#include <stan/math/prim/fun/log_softmax.hpp>

#include <cmath>

#include <vector>


namespace stan {

namespace math {


namespace internal {


class log_softmax_elt_vari : public vari {

 private:

  vari** alpha_;

  const double* softmax_alpha_;

  const int size_;  // array sizes

  const int idx_;   // in in softmax output


 public:

  log_softmax_elt_vari(double val, vari** alpha, const double* softmax_alpha,

                       int size, int idx)

      : vari(val),

        alpha_(alpha),

        softmax_alpha_(softmax_alpha),

        size_(size),

        idx_(idx) {}

  void chain() {

    for (int m = 0; m < size_; ++m) {

      if (m == idx_) {

        alpha_[m]->adj_ += adj_ * (1 - softmax_alpha_[m]);

      } else {

        alpha_[m]->adj_ -= adj_ * softmax_alpha_[m];

      }

    }

  }

};

}  // namespace internal


template <typename T, require_eigen_st<is_var, T>* = nullptr>

auto log_softmax(const T& x) {

  const int a_size = x.size();


  check_nonzero_size("log_softmax", "x", x);


  const auto& x_ref = to_ref(x);


  vari** x_vi_array

      = ChainableStack::instance_->memalloc_.alloc_array<vari*>(a_size);

  Eigen::Map<vector_vi>(x_vi_array, a_size) = x_ref.vi();


  vector_d x_d = x_ref.val();


  // fold logic of math::softmax() and math::log_softmax()

  // to save computations


  vector_d diff = (x_d.array() - x_d.maxCoeff());

  vector_d softmax_x_d = diff.array().exp();

  double sum = softmax_x_d.sum();

  vector_d log_softmax_x_d = diff.array() - std::log(sum);


  // end fold

  double* softmax_x_d_array

      = ChainableStack::instance_->memalloc_.alloc_array<double>(a_size);

  Eigen::Map<vector_d>(softmax_x_d_array, a_size) = softmax_x_d.array() / sum;


  plain_type_t<T> log_softmax_x(a_size);

  for (int k = 0; k < a_size; ++k) {

    log_softmax_x(k) = var(new internal::log_softmax_elt_vari(

        log_softmax_x_d[k], x_vi_array, softmax_x_d_array, a_size, k));

  }

  return log_softmax_x;

}


/**
 * Log softmax of a `var` that wraps a whole matrix/vector.
 *
 * The input is validated with `check_nonzero_size`. The result is produced
 * by `make_callback_var`; its reverse-pass callback adds
 * `res.adj() - sum(res.adj()) * exp(res.val())` to the adjoint of `x`.
 *
 * @tparam T type satisfying `require_var_matrix_t`
 * @param x input
 * @return the value returned by `make_callback_var` for the log softmax of
 *   `x`
 */
template <typename T, require_var_matrix_t<T>* = nullptr>
inline auto log_softmax(const T& x) {
  check_nonzero_size("log_softmax", "x", x);

  // Values shifted by their maximum, evaluated once into a plain array.
  const auto& shifted = (x.val().array() - x.val().maxCoeff()).eval();
  const auto log_sum_exp = log(shifted.exp().sum());

  return make_callback_var(
      (shifted.array() - log_sum_exp).matrix(),
      // x is captured by value; `mutable` lets the callback write its adjoint
      [x](const auto& res) mutable {
        const auto adj_total = res.adj().sum();
        x.adj().noalias()
            += res.adj() - (adj_total * res.val().array().exp()).matrix();
      });
}


/**
 * Log softmax for a `std::vector` whose scalar type is `var`.
 *
 * Delegates to `apply_vector_unary<T>::apply`, handing it a functor that
 * calls `log_softmax` on whatever argument it is given.
 *
 * @tparam T `std::vector` type with `var` scalar
 * @param x input container
 * @return whatever `apply_vector_unary<T>::apply` returns for `x`
 */
template <typename T, require_std_vector_st<is_var, T>* = nullptr>
inline auto log_softmax(const T& x) {
  const auto per_element = [](const auto& alpha) { return log_softmax(alpha); };
  return apply_vector_unary<T>::apply(x, per_element);
}


}  // namespace math

}  // namespace stan

#endif

Eigen.hpp

stan::math::internal::log_softmax_elt_vari::chain
void chain()
Definition log_softmax.hpp:36

stan::math::internal::log_softmax_elt_vari::idx_
const int idx_
Definition log_softmax.hpp:26

stan::math::internal::log_softmax_elt_vari::softmax_alpha_
const double * softmax_alpha_
Definition log_softmax.hpp:24

stan::math::internal::log_softmax_elt_vari::size_
const int size_
Definition log_softmax.hpp:25

stan::math::internal::log_softmax_elt_vari::alpha_
vari ** alpha_
Definition log_softmax.hpp:23

stan::math::internal::log_softmax_elt_vari::log_softmax_elt_vari
log_softmax_elt_vari(double val, vari **alpha, const double *softmax_alpha, int size, int idx)
Definition log_softmax.hpp:29

stan::math::internal::log_softmax_elt_vari
Definition log_softmax.hpp:21

stan::math::stack_alloc::alloc_array
T * alloc_array(size_t n)
Allocate an array on the arena of the specified size to hold values of the specified template paramet...
Definition stack_alloc.hpp:193

stan::math::vari_value
Definition vari.hpp:17

stan::math::size
int64_t size(const T &m)
Returns the size (number of the elements) of a matrix_cl or var_value<matrix_cl<T>>.
Definition size.hpp:19

stan::math::vector_d
Eigen::Matrix< double, Eigen::Dynamic, 1 > vector_d
Type for (column) vector of double values.
Definition typedefs.hpp:24

stan::math::make_callback_var
var_value< plain_type_t< T > > make_callback_var(T &&value, F &&functor)
Creates a new var initialized with a callback_vari with a given value and reverse-pass callback funct...
Definition callback_vari.hpp:61

stan::math::eval
T eval(T &&arg)
Inputs which have a plain_type equal to their own type are forwarded unmodified (for Eigen expressions ...
Definition eval.hpp:20

stan::math::log
fvar< T > log(const fvar< T > &x)
Definition log.hpp:18

stan::math::vari
vari_value< double > vari
Definition vari.hpp:197

stan::math::sum
auto sum(const std::vector< T > &m)
Return the sum of the entries of the specified standard vector.
Definition sum.hpp:23

stan::math::var
var_value< double > var
Definition var.hpp:1187

stan::math::check_nonzero_size
void check_nonzero_size(const char *function, const char *name, const T_y &y)
Check if the specified matrix/vector is of non-zero size.
Definition check_nonzero_size.hpp:22

stan::math::log_softmax
auto log_softmax(const T &x)
Return the log softmax of the specified vector or container of vectors.
Definition log_softmax.hpp:22

stan::math::to_ref
ref_type_t< T && > to_ref(T &&a)
This evaluates expensive Eigen expressions.
Definition to_ref.hpp:18

stan::plain_type_t
typename plain_type< std::decay_t< T > >::type plain_type_t
Definition plain_type.hpp:23

stan
The lgamma implementation in stan-math is based on either the reentrant safe lgamma_r implementation ...
Definition unit_vector_constrain.hpp:15

err.hpp

log_softmax.hpp

typedefs.hpp

meta.hpp

typedefs.hpp

core.hpp

softmax.hpp

stan::math::AutodiffStackSingleton::AutodiffStackStorage::memalloc_
stack_alloc memalloc_
Definition autodiffstackstorage.hpp:107

stan::math::AutodiffStackSingleton::instance_
static thread_local AutodiffStackStorage * instance_
Definition autodiffstackstorage.hpp:118

to_ref.hpp