ROL_TypeB_NewtonKrylovAlgorithm_Def.hpp
// @HEADER
// ************************************************************************
//
//               Rapid Optimization Library (ROL) Package
//                 Copyright (2014) Sandia Corporation
//
// Under terms of Contract DE-AC04-94AL85000, there is a non-exclusive
// license for use of this work by or on behalf of the U.S. Government.
//
// Redistribution and use in source and binary forms, with or without
// modification, are permitted provided that the following conditions are
// met:
//
// 1. Redistributions of source code must retain the above copyright
// notice, this list of conditions and the following disclaimer.
//
// 2. Redistributions in binary form must reproduce the above copyright
// notice, this list of conditions and the following disclaimer in the
// documentation and/or other materials provided with the distribution.
//
// 3. Neither the name of the Corporation nor the names of the
// contributors may be used to endorse or promote products derived from
// this software without specific prior written permission.
//
// THIS SOFTWARE IS PROVIDED BY SANDIA CORPORATION "AS IS" AND ANY
// EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
// IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
// PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL SANDIA CORPORATION OR THE
// CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
// EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
// PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
// PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
// LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
// NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
// SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
//
// Questions? Contact lead developers:
//              Drew Kouri   (dpkouri@sandia.gov) and
//              Denis Ridzal (dridzal@sandia.gov)
//
// ************************************************************************
// @HEADER

#ifndef ROL_TYPEB_NEWTONKRYLOVALGORITHM_DEF_HPP
#define ROL_TYPEB_NEWTONKRYLOVALGORITHM_DEF_HPP

namespace ROL {
namespace TypeB {

template<typename Real>
NewtonKrylovAlgorithm<Real>::NewtonKrylovAlgorithm(ParameterList &list,
                                                   const Ptr<Secant<Real>> &secant)
  : secant_(secant), esec_(SECANT_USERDEFINED) {
  parseParameterList(list);

  if ( secant_ == nullPtr ) {
    secantName_ = list.sublist("General").sublist("Secant").get("Type","Limited-Memory BFGS");
    esec_       = StringToESecant(secantName_);
    secant_     = SecantFactory<Real>(list);
  }
  else {
    secantName_ = list.sublist("General").sublist("Secant").get("User Defined Secant Name",
                                                                "Unspecified User Defined Secant Method");
  }

  krylovName_ = list.sublist("General").sublist("Krylov").get("Type","Conjugate Gradients");
  ekv_        = StringToEKrylov(krylovName_);
  krylov_     = KrylovFactory<Real>(list);
}

template<typename Real>
NewtonKrylovAlgorithm<Real>::NewtonKrylovAlgorithm(ParameterList &list,
                                                   const Ptr<Krylov<Real>> &krylov,
                                                   const Ptr<Secant<Real>> &secant)
  : secant_(secant), esec_(SECANT_USERDEFINED), krylov_(krylov), ekv_(KRYLOV_USERDEFINED) {
  parseParameterList(list);

  if ( secant_ == nullPtr ) {
    secantName_ = list.sublist("General").sublist("Secant").get("Type","Limited-Memory BFGS");
    esec_       = StringToESecant(secantName_);
    secant_     = SecantFactory<Real>(list);
  }
  else {
    secantName_ = list.sublist("General").sublist("Secant").get("User Defined Secant Name",
                                                                "Unspecified User Defined Secant Method");
  }

  krylovName_ = list.sublist("General").sublist("Krylov").get("User Defined Krylov Name",
                                                              "Unspecified User Defined Krylov Method");
}

template<typename Real>
void NewtonKrylovAlgorithm<Real>::parseParameterList(ParameterList &list) {
  // Set status test
  status_->reset();
  status_->add(makePtr<StatusTest<Real>>(list));

  // Parse parameter list
  ParameterList &lslist = list.sublist("Step").sublist("Line Search");
  maxit_        = lslist.get("Function Evaluation Limit",                 20);
  alpha0_       = lslist.get("Initial Step Size",                         1.0);
  useralpha_    = lslist.get("User Defined Initial Step Size",            false);
  usePrevAlpha_ = lslist.get("Use Previous Step Length as Initial Guess", false);
  c1_           = lslist.get("Sufficient Decrease Tolerance",             1e-4);
  rhodec_       = lslist.sublist("Line-Search Method").get("Backtracking Rate", 0.5);

  useSecantHessVec_ = list.sublist("General").sublist("Secant").get("Use as Hessian",        false);
  useSecantPrecond_ = list.sublist("General").sublist("Secant").get("Use as Preconditioner", false);

  verbosity_   = list.sublist("General").get("Output Level", 0);
  writeHeader_ = verbosity_ > 2;
}

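For orientation, the sketch below builds a ParameterList that exercises only the keys read by parseParameterList above, using the same defaults; it is an illustrative configuration, not part of this file. The "Status Test" entries are an assumption about the keys consumed separately by StatusTest and may differ between ROL versions.

```cpp
// Illustrative configuration sketch (assumes the Teuchos-style
// ROL::ParameterList API used throughout ROL).
ROL::ParameterList parlist;

ROL::ParameterList &lslist = parlist.sublist("Step").sublist("Line Search");
lslist.set("Function Evaluation Limit",                 20);     // maxit_
lslist.set("Initial Step Size",                         1.0);    // alpha0_
lslist.set("User Defined Initial Step Size",            false);  // useralpha_
lslist.set("Use Previous Step Length as Initial Guess", false);  // usePrevAlpha_
lslist.set("Sufficient Decrease Tolerance",             1e-4);   // c1_
lslist.sublist("Line-Search Method").set("Backtracking Rate", 0.5); // rhodec_

ROL::ParameterList &gen = parlist.sublist("General");
gen.set("Output Level", 1);                                      // verbosity_
gen.sublist("Secant").set("Type", "Limited-Memory BFGS");
gen.sublist("Secant").set("Use as Hessian",        false);
gen.sublist("Secant").set("Use as Preconditioner", false);
gen.sublist("Krylov").set("Type", "Conjugate Gradients");

// Assumed StatusTest keys (hypothetical; check your ROL version):
parlist.sublist("Status Test").set("Gradient Tolerance", 1e-8);
parlist.sublist("Status Test").set("Step Tolerance",     1e-12);
parlist.sublist("Status Test").set("Iteration Limit",    100);
```
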
template<typename Real>
void NewtonKrylovAlgorithm<Real>::initialize(Vector<Real>          &x,
                                             const Vector<Real>    &g,
                                             Objective<Real>       &obj,
                                             BoundConstraint<Real> &bnd,
                                             std::ostream          &outStream) {
  const Real one(1);
  if (proj_ == nullPtr) {
    proj_ = makePtr<PolyhedralProjection<Real>>(makePtrFromRef(bnd));
  }
  // Initialize data
  TypeB::Algorithm<Real>::initialize(x,g);
  // Update approximate gradient and approximate objective function.
  Real ftol = std::sqrt(ROL_EPSILON<Real>());
  proj_->project(x,outStream);
  state_->iterateVec->set(x);
  obj.update(x,UpdateType::Initial,state_->iter);
  state_->value = obj.value(x,ftol); state_->nfval++;
  obj.gradient(*state_->gradientVec,x,ftol); state_->ngrad++;
  state_->stepVec->set(x);
  state_->stepVec->axpy(-one,state_->gradientVec->dual());
  proj_->project(*state_->stepVec,outStream);
  state_->stepVec->axpy(-one,x);
  state_->gnorm = state_->stepVec->norm();
  state_->snorm = ROL_INF<Real>();
  if (!useralpha_) alpha0_ = one;
  state_->searchSize = alpha0_;
}

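In the code above, the convergence measure stored in state_->gnorm is the norm of the projected-gradient step. With \(P\) denoting the polyhedral projection onto the feasible set and \(\nabla f(x)\) the primal representation obtained from gradientVec->dual(),
\[
  \texttt{gnorm} \;=\; \bigl\| P\bigl(x - \nabla f(x)\bigr) - x \bigr\|,
\]
which is zero precisely at stationary points of the bound-constrained problem; the same quantity is recomputed at the end of every iteration of run below.
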
template<typename Real>
void NewtonKrylovAlgorithm<Real>::run( Vector<Real>          &x,
                                       const Vector<Real>    &g,
                                       Objective<Real>       &obj,
                                       BoundConstraint<Real> &bnd,
                                       std::ostream          &outStream ) {
  const Real one(1);
  // Initialize line-search data
  initialize(x,g,obj,bnd,outStream);
  Ptr<Vector<Real>> s = x.clone(), gp = x.clone(), gold = g.clone();
  Ptr<Vector<Real>> pwa = x.clone(), pwa1 = x.clone();
  Real ftrial(0), gs(0), tol(std::sqrt(ROL_EPSILON<Real>()));

  Ptr<LinearOperator<Real>> hessian, precond;

  // Output
  if (verbosity_ > 0) writeOutput(outStream,true);

  // Compute steepest descent step
  gp->set(state_->gradientVec->dual());
  while (status_->check(*state_)) {
    // Compute step
    hessian = makePtr<HessianPNK>(makePtrFromRef(obj),makePtrFromRef(bnd),
                                  state_->iterateVec,state_->gradientVec,state_->gnorm,
                                  secant_,useSecantHessVec_,pwa);
    precond = makePtr<PrecondPNK>(makePtrFromRef(obj),makePtrFromRef(bnd),
                                  state_->iterateVec,state_->gradientVec,state_->gnorm,
                                  secant_,useSecantPrecond_,pwa1);
    flagKrylov_ = 0;
    krylov_->run(*s,*hessian,*state_->gradientVec,*precond,iterKrylov_,flagKrylov_);
    if (flagKrylov_ == 2 && iterKrylov_ <= 1) {
      s->set(*gp);
    }
    // Perform backtracking line search
    if (!usePrevAlpha_) state_->searchSize = alpha0_;
    x.set(*state_->iterateVec);
    x.axpy(-state_->searchSize,*s);
    proj_->project(x,outStream);
    obj.update(x,UpdateType::Trial);
    ftrial = obj.value(x,tol); ls_nfval_ = 1;
    state_->stepVec->set(x);
    state_->stepVec->axpy(-one,*state_->iterateVec);
    gs = state_->stepVec->dot(*gp);
    if (verbosity_ > 1) {
      outStream << " In TypeB::NewtonKrylovAlgorithm: Line Search" << std::endl;
      outStream << " Step size: " << state_->searchSize << std::endl;
      outStream << " Trial objective value: " << ftrial << std::endl;
      outStream << " Computed reduction: " << state_->value-ftrial << std::endl;
      outStream << " Dot product of gradient and step: " << gs << std::endl;
      outStream << " Sufficient decrease bound: " << -gs*c1_ << std::endl;
      outStream << " Number of function evaluations: " << ls_nfval_ << std::endl;
    }
    while ( state_->value - ftrial < -c1_*gs && ls_nfval_ < maxit_ ) {
      state_->searchSize *= rhodec_;
      x.set(*state_->iterateVec);
      x.axpy(-state_->searchSize,*s);
      proj_->project(x,outStream);
      obj.update(x,UpdateType::Trial);
      ftrial = obj.value(x,tol); ls_nfval_++;
      state_->stepVec->set(x);
      state_->stepVec->axpy(-one,*state_->iterateVec);
      gs = state_->stepVec->dot(*gp);
      if (verbosity_ > 1) {
        outStream << std::endl;
        outStream << " Step size: " << state_->searchSize << std::endl;
        outStream << " Trial objective value: " << ftrial << std::endl;
        outStream << " Computed reduction: " << state_->value-ftrial << std::endl;
        outStream << " Dot product of gradient and step: " << gs << std::endl;
        outStream << " Sufficient decrease bound: " << -gs*c1_ << std::endl;
        outStream << " Number of function evaluations: " << ls_nfval_ << std::endl;
      }
    }
    state_->nfval += ls_nfval_;

    // Compute norm of step
    state_->snorm = state_->stepVec->norm();

    // Update iterate
    state_->iterateVec->set(x);

    // Compute new value and gradient
    state_->iter++;
    state_->value = ftrial;
    obj.update(x,UpdateType::Accept,state_->iter);
    gold->set(*state_->gradientVec);
    obj.gradient(*state_->gradientVec,x,tol); state_->ngrad++;
    gp->set(state_->gradientVec->dual());

    // Compute projected gradient norm
    s->set(x); s->axpy(-one,*gp);
    proj_->project(*s,outStream);
    s->axpy(-one,x);
    state_->gnorm = s->norm();

    // Update secant
    secant_->updateStorage(x,*state_->gradientVec,*gold,*state_->stepVec,state_->snorm,state_->iter);

    // Update Output
    if (verbosity_ > 0) writeOutput(outStream,writeHeader_);
  }
  if (verbosity_ > 0) TypeB::Algorithm<Real>::writeExitStatus(outStream);
}

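For clarity, the backtracking loop above enforces a projected Armijo-type sufficient decrease condition. Writing the trial point as \(x_k(\alpha) = P(x_k - \alpha s_k)\), where \(s_k\) is the direction returned by the Krylov solve (or the cached steepest descent direction if the solver exits abnormally on its first iteration), the step size is multiplied by rhodec_ until
\[
  f(x_k) - f\bigl(x_k(\alpha)\bigr) \;\ge\; -c_1\,\bigl\langle \nabla f(x_k),\, x_k(\alpha) - x_k \bigr\rangle
\]
or the function-evaluation limit maxit_ is reached; the "Computed reduction" and "Sufficient decrease bound" printed at Output Level > 1 are exactly the two sides of this inequality.
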
template<typename Real>
void NewtonKrylovAlgorithm<Real>::run( Problem<Real> &problem,
                                       std::ostream  &outStream ) {
  if (problem.getPolyhedralProjection() == nullPtr) {
    return TypeB::Algorithm<Real>::run(problem,outStream);
  }
  else {
    throw Exception::NotImplemented(">>> TypeB::NewtonKrylovAlgorithm::run : This algorithm cannot solve problems with linear equality constraints!");
  }
}

template<typename Real>
void NewtonKrylovAlgorithm<Real>::run( Vector<Real>          &x,
                                       const Vector<Real>    &g,
                                       Objective<Real>       &obj,
                                       BoundConstraint<Real> &bnd,
                                       Constraint<Real>      &linear_econ,
                                       Vector<Real>          &linear_emul,
                                       const Vector<Real>    &linear_eres,
                                       std::ostream          &outStream ) {
  throw Exception::NotImplemented(">>> TypeB::NewtonKrylovAlgorithm::run : This algorithm cannot solve problems with linear equality constraints!");
}

template<typename Real>
void NewtonKrylovAlgorithm<Real>::writeHeader( std::ostream& os ) const {
  std::ios_base::fmtflags osFlags(os.flags());
  if (verbosity_ > 1) {
    os << std::string(114,'-') << std::endl;
    if (!useSecantHessVec_) {
      os << "Line-Search Projected Newton";
    }
    else {
      os << "Line-Search Projected Quasi-Newton with " << secantName_ << " Hessian approximation";
    }
    os << " status output definitions" << std::endl << std::endl;
    os << " iter - Number of iterates (steps taken)" << std::endl;
    os << " value - Objective function value" << std::endl;
    os << " gnorm - Norm of the gradient" << std::endl;
    os << " snorm - Norm of the step (update to optimization vector)" << std::endl;
    os << " alpha - Line search step length" << std::endl;
    os << " #fval - Cumulative number of times the objective function was evaluated" << std::endl;
    os << " #grad - Cumulative number of times the gradient was computed" << std::endl;
    os << " #ls_fval - Number of times the objective function was evaluated during the line search" << std::endl;
    os << " iterCG - Number of Krylov iterations" << std::endl << std::endl;
    os << " flagCG - Krylov flag" << std::endl;
    for( int flag = CG_FLAG_SUCCESS; flag != CG_FLAG_UNDEFINED; ++flag ) {
      os << " " << NumberToString(flag) << " - "
         << ECGFlagToString(static_cast<ECGFlag>(flag)) << std::endl;
    }
    os << std::string(114,'-') << std::endl;
  }

  os << " ";
  os << std::setw(6)  << std::left << "iter";
  os << std::setw(15) << std::left << "value";
  os << std::setw(15) << std::left << "gnorm";
  os << std::setw(15) << std::left << "snorm";
  os << std::setw(15) << std::left << "alpha";
  os << std::setw(10) << std::left << "#fval";
  os << std::setw(10) << std::left << "#grad";
  os << std::setw(10) << std::left << "#ls_fval";
  os << std::setw(10) << std::left << "iterCG";
  os << std::setw(10) << std::left << "flagCG";
  os << std::endl;
  os.flags(osFlags);
}

template<typename Real>
void NewtonKrylovAlgorithm<Real>::writeName( std::ostream& os ) const {
  std::ios_base::fmtflags osFlags(os.flags());
  if (!useSecantHessVec_) {
    os << std::endl << "Line-Search Projected Newton (Type B, Bound Constraints)" << std::endl;
  }
  else {
    os << std::endl << "Line-Search Projected Quasi-Newton with "
       << secantName_ << " Hessian approximation" << std::endl;
  }
  os.flags(osFlags);
}

template<typename Real>
void NewtonKrylovAlgorithm<Real>::writeOutput( std::ostream& os, bool write_header ) const {
  std::ios_base::fmtflags osFlags(os.flags());
  os << std::scientific << std::setprecision(6);
  if ( state_->iter == 0 ) writeName(os);
  if ( write_header )      writeHeader(os);
  if ( state_->iter == 0 ) {
    os << " ";
    os << std::setw(6)  << std::left << state_->iter;
    os << std::setw(15) << std::left << state_->value;
    os << std::setw(15) << std::left << state_->gnorm;
    os << std::setw(15) << std::left << "---";
    os << std::setw(15) << std::left << "---";
    os << std::setw(10) << std::left << state_->nfval;
    os << std::setw(10) << std::left << state_->ngrad;
    os << std::setw(10) << std::left << "---";
    os << std::setw(10) << std::left << "---";
    os << std::setw(10) << std::left << "---";
    os << std::endl;
  }
  else {
    os << " ";
    os << std::setw(6)  << std::left << state_->iter;
    os << std::setw(15) << std::left << state_->value;
    os << std::setw(15) << std::left << state_->gnorm;
    os << std::setw(15) << std::left << state_->snorm;
    os << std::setw(15) << std::left << state_->searchSize;
    os << std::setw(10) << std::left << state_->nfval;
    os << std::setw(10) << std::left << state_->ngrad;
    os << std::setw(10) << std::left << ls_nfval_;
    os << std::setw(10) << std::left << iterKrylov_;
    os << std::setw(10) << std::left << flagKrylov_;
    os << std::endl;
  }
  os.flags(osFlags);
}

} // namespace TypeB
} // namespace ROL

#endif
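
As a usage illustration (not part of this file), the sketch below solves a small bound-constrained quadratic with this algorithm. It assumes the standard ROL types named in the includes (StdVector, Bounds) and the base-class run overload that supplies the gradient prototype automatically; QuadObjective and the "Status Test" key are hypothetical pieces written for this sketch, so adjust to your ROL version as needed.

```cpp
// Hedged usage sketch: minimize 0.5*||x - 2||^2 subject to -1 <= x <= 1.
#include <iostream>
#include <vector>
#include "ROL_StdVector.hpp"
#include "ROL_Bounds.hpp"
#include "ROL_Objective.hpp"
#include "ROL_TypeB_NewtonKrylovAlgorithm.hpp"

// Hypothetical example objective, not part of ROL.
template<typename Real>
class QuadObjective : public ROL::Objective<Real> {
public:
  Real value(const ROL::Vector<Real> &x, Real &tol) override {
    const std::vector<Real> &xd = *dynamic_cast<const ROL::StdVector<Real>&>(x).getVector();
    Real val(0);
    for (Real xi : xd) val += static_cast<Real>(0.5)*(xi - 2)*(xi - 2);
    return val;
  }
  void gradient(ROL::Vector<Real> &g, const ROL::Vector<Real> &x, Real &tol) override {
    const std::vector<Real> &xd = *dynamic_cast<const ROL::StdVector<Real>&>(x).getVector();
    std::vector<Real>       &gd = *dynamic_cast<ROL::StdVector<Real>&>(g).getVector();
    for (std::size_t i = 0; i < xd.size(); ++i) gd[i] = xd[i] - 2;
  }
};

int main() {
  using RealT = double;
  const int dim = 10;

  // Optimization vector and bound constraint.
  ROL::StdVector<RealT> x(ROL::makePtr<std::vector<RealT>>(dim, 0.0));
  auto lo = ROL::makePtr<ROL::StdVector<RealT>>(ROL::makePtr<std::vector<RealT>>(dim, -1.0));
  auto up = ROL::makePtr<ROL::StdVector<RealT>>(ROL::makePtr<std::vector<RealT>>(dim,  1.0));
  ROL::Bounds<RealT> bnd(lo, up);

  QuadObjective<RealT> obj;

  // Parameter list configured as sketched after parseParameterList above.
  ROL::ParameterList parlist;
  parlist.sublist("General").set("Output Level", 1);
  parlist.sublist("Status Test").set("Gradient Tolerance", 1e-8);  // assumed key

  ROL::TypeB::NewtonKrylovAlgorithm<RealT> algo(parlist);
  algo.run(x, obj, bnd, std::cout);  // base-class overload; gradient prototype defaults to x.dual()
  return 0;
}
```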