MUQ  0.4.3
NewtonTrust.cpp
Go to the documentation of this file.
2 
#include <stdio.h>

#include <algorithm>
#include <cmath>
#include <iostream>
#include <limits>
#include <string>
#include <utility>
4 
5 using namespace muq::Optimization;
6 
8 
9 NewtonTrust::NewtonTrust(std::shared_ptr<muq::Modeling::ModPiece> const& cost,
10  boost::property_tree::ptree const& pt) : Optimizer(cost, pt),
11  maxRadius(pt.get("MaxRadius", std::numeric_limits<double>::infinity())),
12  initialRadius(pt.get("InitialRadius", std::min(1.0,maxRadius))),
13  acceptRatio(pt.get("AcceptRatio", 0.05)),
14  shrinkRatio(pt.get("ShrinkRatio", 0.25)),
15  growRatio(pt.get("GrowRatio", 0.75)),
16  shrinkRate(pt.get("ShrinkRate",0.25)),
17  growRate(pt.get("GrowRate", 2.0)),
18  trustTol(pt.get("TrustTol", std::min(1e-4,xtol_abs))),
19  printLevel(pt.get("PrintLevel", 0)){
20 }
21 
22 
23 
24 std::pair<Eigen::VectorXd, double> NewtonTrust::Solve(std::vector<Eigen::VectorXd> const& inputs) {
25 
26  // Trust region approach with a double dogleg step
28 
29  Eigen::VectorXd const& x0 = inputs.at(0);
30  Eigen::VectorXd x = x0;
31  Eigen::VectorXd step;
32 
33  if(printLevel>0){
34  std::cout << "Using NewtonTrust optimizer..." << std::endl;
35  std::cout << " Iteration, TrustRadius, fval, ||g||" << std::endl;
36  }
37 
38  double fval;
39 
40  for(int it=0; it<maxEvals; ++it) {
41 
42  opt->SetPoint(x);
43  fval = opt->Cost();
44  Eigen::VectorXd const& grad = opt->Gradient();
45 
46  if(printLevel>0){
47  char buf[1024];
48  std::sprintf(buf, " %9d, %11.3f, %4.3e, %5.3e\n", it, trustRadius, fval, grad.norm()); // create string and then cout so pybind11 can capture output
49  std::cout << std::string(buf);
50  }//std::printf(" %9d, %11.3f, %4.3e, %5.3e\n", it, trustRadius, fval, grad.norm());
51 
52  if(grad.norm() < xtol_abs)
53  return std::make_pair(x,fval);
54 
55  step = SolveSub(fval, x, grad);
56 
57  double modDelta = grad.dot(step)+0.5*step.dot(opt->ApplyHessian(step));
58  Eigen::VectorXd newX = x+step;
59 
60  double newf = opt->Cost(newX);
61  double rho = (newf-fval)/modDelta;
62 
63  // Update the position. If the model is really bad, we'll just stay put
64  if(rho>acceptRatio){
65 
66  if(step.norm() < xtol_abs)
67  return std::make_pair(newX,newf);
68 
69  if((fval-newf)<ftol_abs)
70  return std::make_pair(newX,newf);
71 
72  x = newX;
73  fval = newf;
74  }
75 
76  // Update the trust region size
77  if(rho<shrinkRatio){
78  trustRadius = shrinkRate*trustRadius; // shrink trust region
79  }else if((rho>growRatio)&&(std::abs(step.norm()-trustRadius)<1e-10)) {
81  }
82 
83  }
84 
85  return std::make_pair(x,fval);
86 }
87 
88 
89 Eigen::VectorXd NewtonTrust::SolveSub(double fval,
90  Eigen::VectorXd const& x0,
91  Eigen::VectorXd const& grad) {
92  const unsigned int dim = x0.size();
93 
94  // Current estimate of the subproblem minimum
95  Eigen::VectorXd z = Eigen::VectorXd::Zero(dim);
96 
97  // Related to the step direction
98  Eigen::VectorXd r = grad;
99  Eigen::VectorXd d = -r;
100 
101  // If the gradient is small enough where we're starting, then we're done
102  if(r.norm()<trustTol)
103  return z;
104 
105  Eigen::VectorXd Bd; // the Hessian (B) applied to a vector d
106 
107  double alpha, beta, gradd, dBd, rr;
108 
109  for(int i=0; i<dim; ++i){
110  Bd = opt->ApplyHessian(d);
111  gradd = grad.dot(d);
112  dBd = d.dot(Bd);
113  rr = r.squaredNorm();
114 
115  // If the Hessian isn't positive definite in this direction, we can go all
116  // the way to the trust region boundary
117  if(dBd<=0){
118  // do something
119 
120  double dz = d.dot(z);
121  double dd = d.squaredNorm();
122  double zz = z.squaredNorm();
123  double r2 = trustRadius*trustRadius;
124 
125  double tau1 = (-dz + sqrt(dz*dz - dd*(zz-r2)))/dd;
126  double tau2 = (-dz - sqrt(dz*dz - dd*(zz-r2)))/dd;
127 
128  double zBd = z.dot(Bd);
129  double mval1 = tau1*gradd + tau1*zBd + tau1*tau1*dBd;
130  double mval2 = tau2*gradd + tau2*zBd + tau2*tau2*dBd;
131 
132  return (mval1<mval2) ? (z+tau1*d) : (z+tau2*d);
133  }
134 
135  alpha = rr / dBd;
136  Eigen::VectorXd newZ = z + alpha * d;
137 
138  if(newZ.norm()>trustRadius){
139 
140  double dz = d.dot(z);
141  double dd = d.squaredNorm();
142  double zz = z.squaredNorm();
143  double r2 = trustRadius*trustRadius;
144 
145  double tau = (-dz + sqrt(dz*dz - dd*(zz-r2)))/dd;
146  return z + tau*d;
147  }
148 
149  z = newZ;
150 
151  r += alpha*Bd;
152 
153  if(r.norm()<trustTol)
154  return z;
155 
156  beta = r.squaredNorm() / rr;
157  d = (-r + beta*d).eval();
158  }
159 
160  return z;
161 }
REGISTER_OPTIMIZER(NewtonTrust, NewtonTrust)

NewtonTrust
Definition: NewtonTrust.cpp:7
Newton optimizer with trust region to ensure global convergence.
Definition: NewtonTrust.h:19
Eigen::VectorXd SolveSub(double fval, Eigen::VectorXd const &x0, Eigen::VectorXd const &grad)
Definition: NewtonTrust.cpp:89
NewtonTrust(std::shared_ptr< muq::Modeling::ModPiece > const &cost, boost::property_tree::ptree const &pt)
const unsigned int printLevel
Definition: NewtonTrust.h:81
Solve an optimization problem.
Definition: Optimizer.h:21
std::shared_ptr< CostFunction > opt
The cost function that we are trying to minimize.
Definition: Optimizer.h:105
const unsigned int maxEvals
Maximum number of cost function evaluations.
Definition: Optimizer.h:123
auto get(const nlohmann::detail::iteration_proxy_value< IteratorType > &i) -> decltype(i.key())
Definition: json.h:3956