doc/html/GNRiccatiSolver-impl_8hpp_source.html

 /**********************************************************************************************************************
 This file is part of the Control Toolbox (https://github.com/ethz-adrl/control-toolbox), copyright by ETH Zurich.
 Licensed under the BSD-2 license (see LICENSE file in main directory)
  **********************************************************************************************************************/

 #pragma once

 namespace ct {
 namespace optcon {


 /**
  * @brief Construct the solver from an LQ optimal control problem.
  *
  * The problem pointer is forwarded to the LQOCSolver base class and the stage count N_ is set to -1.
  * Eigen's parallel support is initialised and its thread count is taken from
  * settings_.nThreadsEigen.
  *
  * @param lqocProblem shared pointer to the LQ problem, handed on to the base class
  */
 template <size_t STATE_DIM, size_t CONTROL_DIM, typename SCALAR>
 GNRiccatiSolver<STATE_DIM, CONTROL_DIM, SCALAR>::GNRiccatiSolver(const std::shared_ptr<LQOCProblem_t>& lqocProblem)
     : LQOCSolver<STATE_DIM, CONTROL_DIM, SCALAR>(lqocProblem), N_(-1)
 {
     Eigen::initParallel();

     // number of threads Eigen may use, as configured in the solver settings
     const auto numEigenThreads = settings_.nThreadsEigen;
     Eigen::setNbThreads(numEigenThreads);
 }


 /**
  * @brief Construct the solver and size its internal arrays for N stages.
  *
  * N_ is initialised to -1 (the same sentinel the problem-based constructor uses) before
  * changeNumberOfStages() is called. That function compares N against N_, so without the
  * initialisation it would read an indeterminate value, and for N <= 0 it returns early and would
  * leave N_ indeterminate.
  * NOTE(review): assumes N_ has no default member initializer in the class declaration; the
  * explicit initialisation is harmless if it has one.
  *
  * @param N number of stages; values <= 0 leave the arrays untouched
  */
 template <size_t STATE_DIM, size_t CONTROL_DIM, typename SCALAR>
 GNRiccatiSolver<STATE_DIM, CONTROL_DIM, SCALAR>::GNRiccatiSolver(int N) : N_(-1)
 {
     changeNumberOfStages(N);
 }

 /**
  * @brief Run the complete backward pass.
  *
  * Calls solveSingleStage() for every stage index, starting at the last stage
  * (getNumberOfStages() - 1) and counting down to stage 0.
  */
 template <size_t STATE_DIM, size_t CONTROL_DIM, typename SCALAR>
 void GNRiccatiSolver<STATE_DIM, CONTROL_DIM, SCALAR>::solve()
 {
     int stage = this->lqocProblem_->getNumberOfStages();

     // walk backwards in time: N-1, N-2, ..., 0
     while (stage > 0)
     {
         --stage;
         solveSingleStage(stage);
     }
 }


 /**
  * @brief Perform the backward-pass step for a single stage.
  *
  * When called for the last stage, the cost-to-go is initialised first. The controller for the
  * stage is then designed, and for every stage except stage 0 the cost-to-go is propagated to
  * that stage.
  *
  * @param N index of the stage to process
  */
 template <size_t STATE_DIM, size_t CONTROL_DIM, typename SCALAR>
 void GNRiccatiSolver<STATE_DIM, CONTROL_DIM, SCALAR>::solveSingleStage(int N)
 {
     const int lastStage = this->lqocProblem_->getNumberOfStages() - 1;
     if (N == lastStage)
     {
         initializeCostToGo();
     }

     designController(N);

     // the cost-to-go at stage 0 is not computed
     if (N <= 0)
         return;

     computeCostToGo(N);
 }


 /**
  * @brief Store the solver settings and rebuild the fixed Hessian correction term.
  *
  * @param settings settings to copy into settings_; H_corrFix_ is set to epsilon times identity
  */
 template <size_t STATE_DIM, size_t CONTROL_DIM, typename SCALAR>
 void GNRiccatiSolver<STATE_DIM, CONTROL_DIM, SCALAR>::configure(const NLOptConSettings& settings)
 {
     settings_ = settings;

     // read epsilon from the stored copy, not from the argument
     const auto& regularization = settings_.epsilon;
     H_corrFix_ = regularization * ControlMatrix::Identity();
 }

 /**
  * @brief Forward rollout producing the state and control solution.
  *
  * Starting from a zero initial state, each stage k computes
  *   u_sol_[k]     = lv_[k] + L_[k] * x_sol_[k]
  *   x_sol_[k + 1] = A_[k] * x_sol_[k] + B_[k] * u_sol_[k] + b_[k]
  * using the feedforward terms and feedback gains stored in lv_ and L_.
  */
 template <size_t STATE_DIM, size_t CONTROL_DIM, typename SCALAR>
 void GNRiccatiSolver<STATE_DIM, CONTROL_DIM, SCALAR>::computeStatesAndControls()
 {
     LQOCProblem_t& problem = *this->lqocProblem_;

     // the first state is pinned to zero (fixed initial state)
     this->x_sol_[0].setZero();

     for (int stage = 0; stage < problem.getNumberOfStages(); ++stage)
     {
         const auto& x = this->x_sol_[stage];

         // affine control law
         this->u_sol_[stage] = this->lv_[stage] + this->L_[stage] * x;

         // propagate through the affine dynamics
         this->x_sol_[stage + 1] =
             problem.A_[stage] * x + problem.B_[stage] * (this->u_sol_[stage]) + problem.b_[stage];
     }
 }

 /**
  * @brief Intentionally empty.
  *
  * The feedback gains L_ are written by designController(), so there is nothing left to compute
  * when this function is called.
  */
 template <size_t STATE_DIM, size_t CONTROL_DIM, typename SCALAR>
 void GNRiccatiSolver<STATE_DIM, CONTROL_DIM, SCALAR>::computeFeedbackMatrices()
 { /* no action required, feedback gains were already computed in the backward pass */
 }

 /**
  * @brief Intentionally empty.
  *
  * The feedforward terms lv_ are written by designController(), so there is nothing left to
  * compute when this function is called.
  */
 template <size_t STATE_DIM, size_t CONTROL_DIM, typename SCALAR>
 void GNRiccatiSolver<STATE_DIM, CONTROL_DIM, SCALAR>::compute_lv()
 { /* no action required, feedforward terms were already computed in the backward pass */
 }

 /**
  * @brief Return the stored smallest-eigenvalue record.
  *
  * The value is reset to +infinity by initializeCostToGo() and lowered by designController()
  * when settings_.recordSmallestEigenvalue is enabled.
  *
  * @return current value of smallestEigenvalue_
  */
 template <size_t STATE_DIM, size_t CONTROL_DIM, typename SCALAR>
 SCALAR GNRiccatiSolver<STATE_DIM, CONTROL_DIM, SCALAR>::getSmallestEigenvalue()
 {
     return this->smallestEigenvalue_;
 }

 /**
  * @brief Solver-specific part of setting a new LQ problem.
  *
  * Rejects constrained problems and adapts the internal array sizes to the problem's number of
  * stages.
  *
  * @param lqocProblem the LQ problem that is about to be solved
  * @throws std::runtime_error if the problem reports that it is constrained
  */
 template <size_t STATE_DIM, size_t CONTROL_DIM, typename SCALAR>
 void GNRiccatiSolver<STATE_DIM, CONTROL_DIM, SCALAR>::setProblemImpl(std::shared_ptr<LQOCProblem_t> lqocProblem)
 {
     const bool constrained = lqocProblem->isConstrained();
     if (constrained)
         throw std::runtime_error(
             "Selected wrong solver - GNRiccatiSolver cannot handle constrained problems. Use a different solver");

     changeNumberOfStages(lqocProblem->getNumberOfStages());
 }


 /**
  * @brief Resize all internal arrays to match a new number of stages.
  *
  * Does nothing when N is not positive or equals the stored stage count N_. Otherwise the
  * stage-wise arrays get N entries, the arrays that also hold a terminal entry (x_sol_, sv_, S_)
  * get N + 1 entries, and N_ is updated.
  *
  * @param N new number of stages
  */
 template <size_t STATE_DIM, size_t CONTROL_DIM, typename SCALAR>
 void GNRiccatiSolver<STATE_DIM, CONTROL_DIM, SCALAR>::changeNumberOfStages(int N)
 {
     // N <= 0 is tested first so that N_ is only read for a valid request
     if (N <= 0 || N_ == N)
         return;

     const int numStages = N;
     const int numNodes = N + 1;  // stages plus the terminal node

     gv_.resize(numStages);
     G_.resize(numStages);

     H_.resize(numStages);
     Hi_.resize(numStages);
     Hi_inverse_.resize(numStages);

     this->lv_.resize(numStages);
     this->L_.resize(numStages);

     this->x_sol_.resize(numNodes);
     this->u_sol_.resize(numStages);

     sv_.resize(numNodes);
     S_.resize(numNodes);

     N_ = numStages;
 }


 /**
  * @brief Start a new backward pass.
  *
  * Resets the smallest-eigenvalue record to +infinity and seeds the quadratic cost-to-go at the
  * terminal index with the problem's terminal cost terms Q_[N] and qv_[N].
  */
 template <size_t STATE_DIM, size_t CONTROL_DIM, typename SCALAR>
 void GNRiccatiSolver<STATE_DIM, CONTROL_DIM, SCALAR>::initializeCostToGo()
 {
     smallestEigenvalue_ = std::numeric_limits<SCALAR>::infinity();

     LQOCProblem_t& problem = *this->lqocProblem_;
     const int terminal = problem.getNumberOfStages();

     // quadratic approximation of the cost-to-go at the terminal node
     S_[terminal] = problem.Q_[terminal];
     sv_[terminal] = problem.qv_[terminal];
 }


 /**
  * @brief Propagate the quadratic cost-to-go from stage k + 1 to stage k.
  *
  * Second-order term:
  *   S_[k] = Q_[k] + A_[k]' S_[k+1] A_[k] - L_[k]' Hi_[k] L_[k], symmetrised afterwards.
  * First-order term:
  *   sv_[k] = qv_[k] + A_[k]' sv_[k+1] + A_[k]' S_[k+1] b_[k]
  *            + L_[k]' Hi_[k] lv_[k] + L_[k]' gv_[k] + G_[k]' lv_[k].
  * Reads L_[k], lv_[k], Hi_[k], G_[k] and gv_[k], which designController() writes for stage k.
  *
  * @param k stage index for which the cost-to-go is computed
  */
 template <size_t STATE_DIM, size_t CONTROL_DIM, typename SCALAR>
 void GNRiccatiSolver<STATE_DIM, CONTROL_DIM, SCALAR>::computeCostToGo(size_t k)
 {
     LQOCProblem_t& p = *this->lqocProblem_;

     const size_t next = k + 1;
     const auto& A = p.A_[k];
     const auto& L = this->L_[k];
     const auto& S_next = S_[next];

     // second-order part
     auto& S = S_[k];
     S = p.Q_[k];
     S.noalias() += A.transpose() * S_next * A;
     S.noalias() -= L.transpose() * Hi_[k] * L;

     // remove asymmetry introduced by the products above
     S = 0.5 * (S + S.transpose()).eval();

     // first-order part, accumulated term by term
     auto& s = sv_[k];
     s = p.qv_[k];
     s.noalias() += A.transpose() * sv_[next];
     s.noalias() += A.transpose() * S_next * p.b_[k];
     s.noalias() += L.transpose() * Hi_[k] * this->lv_[k];
     s.noalias() += L.transpose() * gv_[k];
     s.noalias() += G_[k].transpose() * this->lv_[k];
 }


 /**
  * @brief Compute the feedback gain and feedforward term for stage k.
  *
  * Builds, from the cost-to-go at k + 1,
  *   gv_[k] = rv_[k] + B_[k]' sv_[k+1] + B_[k]' S_[k+1] b_[k]
  *   G_[k]  = P_[k]  + B_[k]' S_[k+1] A_[k]
  *   H_[k]  = R_[k]  + B_[k]' S_[k+1] B_[k]
  * then regularises H_[k] into Hi_[k], stores the NEGATED inverse of Hi_[k] in Hi_inverse_[k] and
  * sets L_[k] = Hi_inverse_[k] * G_[k] and lv_[k] = Hi_inverse_[k] * gv_[k].
  *
  * Two regularisation modes exist, selected by settings_.fixedHessianCorrection:
  *  - fixed correction: Hi_ = H_ + epsilon * I (only if epsilon > 1e-10), inverted via LLT;
  *  - eigenvalue correction: eigenvalues of H_ are clamped from below at epsilon and the inverse
  *    is assembled from the eigen-decomposition.
  *
  * When settings_.recordSmallestEigenvalue is set, smallestEigenvalue_ is lowered to the smallest
  * eigenvalue seen. In the fixed-correction mode this additionally cross-checks the LLT inverse
  * against the eigenvalue-based inverse and prints a warning on mismatch.
  *
  * @param k stage index; S_[k + 1] and sv_[k + 1] must already hold the cost-to-go of the next stage
  */
 template <size_t STATE_DIM, size_t CONTROL_DIM, typename SCALAR>
 void GNRiccatiSolver<STATE_DIM, CONTROL_DIM, SCALAR>::designController(size_t k)
 {
     LQOCProblem_t& p = *this->lqocProblem_;

     gv_[k] = p.rv_[k];
     gv_[k].noalias() += p.B_[k].transpose() * sv_[k + 1];
     gv_[k].noalias() += p.B_[k].transpose() * S_[k + 1].template selfadjointView<Eigen::Lower>() * p.b_[k];

     G_[k] = p.P_[k];
     //G_[k].noalias() += B_[k].transpose() * S_[k+1] * A_[k];
     G_[k].noalias() += p.B_[k].transpose() * S_[k + 1].template selfadjointView<Eigen::Lower>() * p.A_[k];

     H_[k] = p.R_[k];
     //H_[k].noalias() += B_[k].transpose() * S_[k+1] * B_[k];
     H_[k].noalias() += p.B_[k].transpose() * S_[k + 1].template selfadjointView<Eigen::Lower>() * p.B_[k];

     if (settings_.fixedHessianCorrection)
     {
         if (settings_.epsilon > 1e-10)
             Hi_[k] = H_[k] + settings_.epsilon * ControlMatrix::Identity();
         else
             Hi_[k] = H_[k];

         // Negated inverse via Cholesky. This is computed BEFORE the optional diagnostic below,
         // which compares against it; otherwise the check would look at a stale matrix.
         Hi_inverse_[k] = -Hi_[k].template selfadjointView<Eigen::Lower>().llt().solve(ControlMatrix::Identity());

         if (settings_.recordSmallestEigenvalue)
         {
             // compute eigenvalues with eigenvectors enabled
             eigenvalueSolver_.compute(Hi_[k], Eigen::ComputeEigenvectors);
             const ControlMatrix& V = eigenvalueSolver_.eigenvectors().real();
             const ControlVector& lambda = eigenvalueSolver_.eigenvalues();

             smallestEigenvalue_ = std::min(smallestEigenvalue_, lambda.minCoeff());

             // Corrected Eigenvalue Matrix
             ControlMatrix D = ControlMatrix::Zero();
             // make D positive semi-definite (as described in IV. B.)
             D.diagonal() = lambda.cwiseMax(settings_.epsilon);

             // invert D
             ControlMatrix D_inverse = ControlMatrix::Zero();
             // eigenvalue-wise inversion (negated, matching the sign convention of Hi_inverse_)
             D_inverse.diagonal() = -1.0 * D.diagonal().cwiseInverse();
             ControlMatrix Hi_inverse_regular = V * D_inverse * V.transpose();

             // diagnostic only: the Cholesky-based and the eigenvalue-based inverse should agree
             if (!Hi_inverse_[k].isApprox(Hi_inverse_regular, 1e-4))
             {
                 std::cout << "warning, inverses not identical at " << k << std::endl;
                 std::cout << "Hi_inverse_fixed - Hi_inverse_regular: " << std::endl
                           << Hi_inverse_[k] - Hi_inverse_regular << std::endl
                           << std::endl;
             }
         }

         // calculate FB gain update
         this->L_[k].noalias() = Hi_inverse_[k].template selfadjointView<Eigen::Lower>() * G_[k];

         // calculate FF update
         this->lv_[k].noalias() = Hi_inverse_[k].template selfadjointView<Eigen::Lower>() * gv_[k];
     }
     else
     {
         // compute eigenvalues with eigenvectors enabled
         eigenvalueSolver_.compute(H_[k], Eigen::ComputeEigenvectors);
         const ControlMatrix& V = eigenvalueSolver_.eigenvectors().real();
         const ControlVector& lambda = eigenvalueSolver_.eigenvalues();

         if (settings_.recordSmallestEigenvalue)
         {
             smallestEigenvalue_ = std::min(smallestEigenvalue_, lambda.minCoeff());
         }

         // Corrected Eigenvalue Matrix
         ControlMatrix D = ControlMatrix::Zero();
         // make D positive semi-definite (as described in IV. B.)
         D.diagonal() = lambda.cwiseMax(settings_.epsilon);

         // reconstruct H
         Hi_[k].noalias() = V * D * V.transpose();

         // invert D
         ControlMatrix D_inverse = ControlMatrix::Zero();
         // eigenvalue-wise inversion (negated, so Hi_inverse_ holds -Hi_^{-1})
         D_inverse.diagonal() = -1.0 * D.diagonal().cwiseInverse();
         Hi_inverse_[k].noalias() = V * D_inverse * V.transpose();

         // calculate FB gain update
         this->L_[k].noalias() = Hi_inverse_[k] * G_[k];

         // calculate FF update
         this->lv_[k].noalias() = Hi_inverse_[k] * gv_[k];
     }
 }


 /**
  * @brief Dump the internal backward-pass quantities to a MAT file.
  *
  * Only active when MATLAB_FULL_LOG is defined at compile time; otherwise the function body is
  * empty. When active, it opens "GNRiccatiSolver.mat", writes sv_, S_, L_, H_, Hi_, Hi_inverse_,
  * G_ and gv_ under the variable names given below, and closes the file again.
  */
 template <size_t STATE_DIM, size_t CONTROL_DIM, typename SCALAR>
 void GNRiccatiSolver<STATE_DIM, CONTROL_DIM, SCALAR>::logToMatlab()
 {
 #ifdef MATLAB_FULL_LOG

     matFile_.open("GNRiccatiSolver.mat");

     // cost-to-go terms
     matFile_.put("sv", sv_.toImplementation());
     matFile_.put("S", S_.toImplementation());
     // feedback gains
     matFile_.put("L", this->L_.toImplementation());
     // control Hessian: raw, regularised, and the stored (negated) inverse
     matFile_.put("H", H_.toImplementation());
     matFile_.put("Hi_", Hi_.toImplementation());
     matFile_.put("Hi_inverse", Hi_inverse_.toImplementation());
     // cross term and gradient used in the controller design
     matFile_.put("G", G_.toImplementation());
     matFile_.put("gv", gv_.toImplementation());

     matFile_.close();
 #endif
 }

 /**
  * @brief Intentionally empty for this solver.
  *
  * The internal arrays are sized in changeNumberOfStages(), so nothing is allocated here.
  */
 template <size_t STATE_DIM, size_t CONTROL_DIM, typename SCALAR>
 void GNRiccatiSolver<STATE_DIM, CONTROL_DIM, SCALAR>::initializeAndAllocate()
 {
     // do nothing
 }


 }  // namespace optcon
 }  // namespace ct
ct::optcon::LQOCProblem::B_
ct::core::StateControlMatrixArray< STATE_DIM, CONTROL_DIM, SCALAR > B_
Definition: LQOCProblem.hpp:207

ct::optcon::LQOCProblem::A_
ct::core::StateMatrixArray< STATE_DIM, SCALAR > A_
affine, time-varying system dynamics in discrete time
Definition: LQOCProblem.hpp:206

ct::optcon::GNRiccatiSolver::changeNumberOfStages
void changeNumberOfStages(int N)
Definition: GNRiccatiSolver-impl.hpp:103

ct::optcon::LQOCProblem::R_
ct::core::ControlMatrixArray< CONTROL_DIM, SCALAR > R_
Definition: LQOCProblem.hpp:219

ct::optcon::LQOCProblem::P_
ct::core::FeedbackArray< STATE_DIM, CONTROL_DIM, SCALAR > P_
LQ approximation of the cross terms of the cost function.
Definition: LQOCProblem.hpp:222

ct::optcon::GNRiccatiSolver::compute_lv
virtual void compute_lv() override
compute iLQR-style lv
Definition: GNRiccatiSolver-impl.hpp:78

ct::optcon::NLOptConSettings::nThreadsEigen
size_t nThreadsEigen
number of threads, for MP version
Definition: NLOptConSettings.hpp:274

ct::optcon::GNRiccatiSolver::H_corrFix_
ControlMatrix H_corrFix_
Definition: GNRiccatiSolver.hpp:88

ct::optcon::GNRiccatiSolver::setProblemImpl
virtual void setProblemImpl(std::shared_ptr< LQOCProblem_t > lqocProblem) override
Definition: GNRiccatiSolver-impl.hpp:89

ct::optcon::GNRiccatiSolver::smallestEigenvalue_
SCALAR smallestEigenvalue_
Definition: GNRiccatiSolver.hpp:95

ct::optcon::LQOCSolver::L_
ct::core::FeedbackArray< STATE_DIM, CONTROL_DIM, SCALAR > L_
Definition: LQOCSolver.hpp:111

ct::optcon::LQOCProblem::b_
ct::core::StateVectorArray< STATE_DIM, SCALAR > b_
Definition: LQOCProblem.hpp:208

ct::optcon::GNRiccatiSolver::solve
virtual void solve() override
solve the LQOC problem
Definition: GNRiccatiSolver-impl.hpp:28

ct::optcon::GNRiccatiSolver::getSmallestEigenvalue
virtual SCALAR getSmallestEigenvalue() override
return the smallest eigenvalue
Definition: GNRiccatiSolver-impl.hpp:83

ct::optcon::GNRiccatiSolver::configure
virtual void configure(const NLOptConSettings &settings) override
Definition: GNRiccatiSolver-impl.hpp:49

ct::optcon::NLOptConSettings::epsilon
double epsilon
regularization constant for the control Hessian: added to its diagonal (fixed correction) or used as the lower bound on its eigenvalues
Definition: NLOptConSettings.hpp:261

ct::optcon::LQOCProblem::Q_
ct::core::StateMatrixArray< STATE_DIM, SCALAR > Q_
Definition: LQOCProblem.hpp:215

ct::core::ControlVector

ct::optcon::NLOptConSettings
Settings for the NLOptCon algorithm.
Definition: NLOptConSettings.hpp:198

SCALAR
CppAD::AD< CppAD::cg::CG< double > > SCALAR

ct::optcon::LQOCSolver::lqocProblem_
std::shared_ptr< LQOCProblem_t > lqocProblem_
Definition: LQOCSolver.hpp:107

ct::optcon::GNRiccatiSolver::initializeCostToGo
void initializeCostToGo()
Definition: GNRiccatiSolver-impl.hpp:132

ct::optcon::GNRiccatiSolver::designController
void designController(size_t k)
Definition: GNRiccatiSolver-impl.hpp:167

ct::optcon::LQOCProblem
Defines a Linear-Quadratic Optimal Control Problem, which is optionally constrained.
Definition: LQOCProblem.hpp:57

ct::optcon::GNRiccatiSolver::logToMatlab
void logToMatlab()
Definition: GNRiccatiSolver-impl.hpp:266

ct::optcon::GNRiccatiSolver::GNRiccatiSolver
GNRiccatiSolver(const std::shared_ptr< LQOCProblem_t > &lqocProblem=nullptr)
Definition: GNRiccatiSolver-impl.hpp:13

i
for i
Definition: mpc_unittest_plotting.m:14

ct::optcon::NLOptConSettings::fixedHessianCorrection
bool fixedHessianCorrection
perform Hessian regularization by adding epsilon times identity instead of correcting individual eigenvalues
Definition: NLOptConSettings.hpp:270

ct::optcon::GNRiccatiSolver::H_
ControlMatrixArray H_
Definition: GNRiccatiSolver.hpp:85

ct::optcon::GNRiccatiSolver::S_
StateMatrixArray S_
Definition: GNRiccatiSolver.hpp:91

ct::optcon::GNRiccatiSolver::Hi_inverse_
ControlMatrixArray Hi_inverse_
Definition: GNRiccatiSolver.hpp:87

ct::optcon::LQOCSolver::u_sol_
core::ControlVectorArray< CONTROL_DIM, SCALAR > u_sol_
Definition: LQOCSolver.hpp:110

ct::optcon::GNRiccatiSolver::computeCostToGo
void computeCostToGo(size_t k)
Definition: GNRiccatiSolver-impl.hpp:147

ct::optcon::GNRiccatiSolver::computeStatesAndControls
virtual void computeStatesAndControls() override
extract the solution (can be overridden if additional extraction steps required in specific solver) ...
Definition: GNRiccatiSolver-impl.hpp:56

ct::core::DiscreteArray::toImplementation
Base & toImplementation()

ct::optcon::GNRiccatiSolver::computeFeedbackMatrices
virtual void computeFeedbackMatrices() override
return TVLQR feedback matrices
Definition: GNRiccatiSolver-impl.hpp:73

ct::optcon::LQOCSolver::lv_
ct::core::ControlVectorArray< CONTROL_DIM, SCALAR > lv_
Definition: LQOCSolver.hpp:112

ct::optcon::GNRiccatiSolver::Hi_
ControlMatrixArray Hi_
Definition: GNRiccatiSolver.hpp:86

ct::optcon::LQOCProblem::rv_
ct::core::ControlVectorArray< CONTROL_DIM, SCALAR > rv_
LQ approximation of the pure control penalty.
Definition: LQOCProblem.hpp:218

ct::optcon::LQOCProblem::qv_
ct::core::StateVectorArray< STATE_DIM, SCALAR > qv_
LQ approximation of the pure state penalty, including terminal state penalty.
Definition: LQOCProblem.hpp:214

ct::optcon::GNRiccatiSolver::G_
FeedbackArray G_
Definition: GNRiccatiSolver.hpp:83

ct::optcon::NLOptConSettings::recordSmallestEigenvalue
bool recordSmallestEigenvalue
record the smallest eigenvalue of the control Hessian encountered during the backward pass
Definition: NLOptConSettings.hpp:271

ct::optcon::GNRiccatiSolver::gv_
ControlVectorArray gv_
Definition: GNRiccatiSolver.hpp:82

ct::optcon::GNRiccatiSolver::initializeAndAllocate
virtual void initializeAndAllocate() override
a method reserved for memory allocation (e.g. required for HPIPM)
Definition: GNRiccatiSolver-impl.hpp:286

ct

ct::optcon::GNRiccatiSolver::N_
int N_
Definition: GNRiccatiSolver.hpp:93

ct::core::ControlMatrix

ct::optcon::GNRiccatiSolver::eigenvalueSolver_
Eigen::SelfAdjointEigenSolver< Eigen::Matrix< SCALAR, CONTROL_DIM, CONTROL_DIM > > eigenvalueSolver_
Eigenvalue solver, used for inverting the Hessian and for regularization.
Definition: GNRiccatiSolver.hpp:98

ct::optcon::LQOCSolver::x_sol_
core::StateVectorArray< STATE_DIM, SCALAR > x_sol_
Definition: LQOCSolver.hpp:109

ct::optcon::GNRiccatiSolver::settings_
NLOptConSettings settings_
Definition: GNRiccatiSolver.hpp:80

ct::optcon::GNRiccatiSolver::solveSingleStage
virtual void solveSingleStage(int N) override
Definition: GNRiccatiSolver-impl.hpp:36

ct::optcon::GNRiccatiSolver::sv_
StateVectorArray sv_
Definition: GNRiccatiSolver.hpp:90

ct::optcon::LQOCSolver
Definition: LQOCSolver.hpp:22