docs/cpp/hessian_8hpp_source.html

// Copyright (c) Sleipnir contributors


#pragma once


#include <utility>


#include <Eigen/SparseCore>

#include <gch/small_vector.hpp>


#include "sleipnir/autodiff/adjoint_expression_graph.hpp"

#include "sleipnir/autodiff/variable.hpp"

#include "sleipnir/autodiff/variable_matrix.hpp"

#include "sleipnir/util/concepts.hpp"

#include "sleipnir/util/symbol_exports.hpp"


namespace slp {


template <int UpLo>

  requires(UpLo == Eigen::Lower) || (UpLo == (Eigen::Lower | Eigen::Upper))


class SLEIPNIR_DLLEXPORT Hessian {

 public:


  Hessian(Variable variable, Variable wrt) noexcept

      : Hessian{std::move(variable), VariableMatrix{std::move(wrt)}} {}


  Hessian(Variable variable, SleipnirMatrixLike auto wrt) noexcept

      : m_variables{detail::AdjointExpressionGraph{variable}

                        .generate_gradient_tree(wrt)},

        m_wrt{wrt} {

    // Initialize column each expression's adjoint occupies in the Jacobian

    for (size_t col = 0; col < m_wrt.size(); ++col) {

      m_wrt[col].expr->col = col;

    }


    for (auto& variable : m_variables) {

      m_graphs.emplace_back(variable);

    }


    // Reset col to -1

    for (auto& node : m_wrt) {

      node.expr->col = -1;

    }


    for (int row = 0; row < m_variables.rows(); ++row) {

      if (m_variables[row].expr == nullptr) {

        continue;

      }


      if (m_variables[row].type() == ExpressionType::LINEAR) {

        // If the row is linear, compute its gradient once here and cache its

        // triplets. Constant rows are ignored because their gradients have no

        // nonzero triplets.

        m_graphs[row].append_adjoint_triplets(m_cached_triplets, row, m_wrt);

      } else if (m_variables[row].type() > ExpressionType::LINEAR) {

        // If the row is quadratic or nonlinear, add it to the list of nonlinear

        // rows to be recomputed in Value().

        m_nonlinear_rows.emplace_back(row);

      }

    }


    if (m_nonlinear_rows.empty()) {

      m_H.setFromTriplets(m_cached_triplets.begin(), m_cached_triplets.end());

      if constexpr (UpLo == Eigen::Lower) {

        m_H = m_H.triangularView<Eigen::Lower>();

      }

    }

  }


  VariableMatrix get() const {

    VariableMatrix result{VariableMatrix::empty, m_variables.rows(),

                          m_wrt.rows()};


    for (int row = 0; row < m_variables.rows(); ++row) {

      auto grad = m_graphs[row].generate_gradient_tree(m_wrt);

      for (int col = 0; col < m_wrt.rows(); ++col) {

        if (grad[col].expr != nullptr) {

          result[row, col] = std::move(grad[col]);

        } else {

          result[row, col] = Variable{0.0};

        }

      }

    }


    return result;

  }


  const Eigen::SparseMatrix<double>& value() {

    if (m_nonlinear_rows.empty()) {

      return m_H;

    }


    for (auto& graph : m_graphs) {

      graph.update_values();

    }


    // Copy the cached triplets so triplets added for the nonlinear rows are

    // thrown away at the end of the function

    auto triplets = m_cached_triplets;


    // Compute each nonlinear row of the Hessian

    for (int row : m_nonlinear_rows) {

      m_graphs[row].append_adjoint_triplets(triplets, row, m_wrt);

    }


    if (!triplets.empty()) {

      m_H.setFromTriplets(triplets.begin(), triplets.end());

      if constexpr (UpLo == Eigen::Lower) {

        m_H = m_H.triangularView<Eigen::Lower>();

      }

    } else {

      // setFromTriplets() is a no-op on empty triplets, so explicitly zero out

      // the storage

      m_H.setZero();

    }


    return m_H;

  }


 private:

  VariableMatrix m_variables;

  VariableMatrix m_wrt;


  gch::small_vector<detail::AdjointExpressionGraph> m_graphs;


  Eigen::SparseMatrix<double> m_H{m_variables.rows(), m_wrt.rows()};


  // Cached triplets for gradients of linear rows

  gch::small_vector<Eigen::Triplet<double>> m_cached_triplets;


  // List of row indices for nonlinear rows whose graients will be computed in

  // Value()

  gch::small_vector<int> m_nonlinear_rows;

};


}  // namespace slp

slp::Hessian
Definition hessian.hpp:29

slp::Hessian::Hessian
Hessian(Variable variable, SleipnirMatrixLike auto wrt) noexcept
Definition hessian.hpp:47

slp::Hessian::Hessian
Hessian(Variable variable, Variable wrt) noexcept
Definition hessian.hpp:37

slp::Hessian::get
VariableMatrix get() const
Definition hessian.hpp:98

slp::Hessian::value
const Eigen::SparseMatrix< double > & value()
Definition hessian.hpp:121

slp::VariableMatrix
Definition variable_matrix.hpp:29

slp::VariableMatrix::rows
int rows() const
Definition variable_matrix.hpp:951

slp::VariableMatrix::col
VariableBlock< VariableMatrix > col(int col)
Definition variable_matrix.hpp:546

slp::VariableMatrix::empty
static constexpr empty_t empty
Definition variable_matrix.hpp:39

slp::Variable
Definition variable.hpp:40

slp::detail::AdjointExpressionGraph
Definition adjoint_expression_graph.hpp:21

slp::detail::AdjointExpressionGraph::generate_gradient_tree
VariableMatrix generate_gradient_tree(const VariableMatrix &wrt) const
Definition adjoint_expression_graph.hpp:52

slp::SleipnirMatrixLike
Definition concepts.hpp:30