queso-0.55.0
GslOptimizer.C
Go to the documentation of this file.
1 //-----------------------------------------------------------------------bl-
2 //--------------------------------------------------------------------------
3 //
4 // QUESO - a library to support the Quantification of Uncertainty
5 // for Estimation, Simulation and Optimization
6 //
7 // Copyright (C) 2008-2015 The PECOS Development Team
8 //
9 // This library is free software; you can redistribute it and/or
10 // modify it under the terms of the Version 2.1 GNU Lesser General
11 // Public License as published by the Free Software Foundation.
12 //
13 // This library is distributed in the hope that it will be useful,
14 // but WITHOUT ANY WARRANTY; without even the implied warranty of
15 // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
16 // Lesser General Public License for more details.
17 //
18 // You should have received a copy of the GNU Lesser General Public
19 // License along with this library; if not, write to the Free Software
20 // Foundation, Inc. 51 Franklin Street, Fifth Floor,
21 // Boston, MA 02110-1301 USA
22 //
23 //-----------------------------------------------------------------------el-
24 
25 #include <iostream>
26 
27 #include <queso/Defines.h>
28 #include <queso/GslVector.h>
29 #include <queso/VectorSpace.h>
30 #include <queso/ScalarFunction.h>
31 #include <queso/GslOptimizer.h>
32 #include <queso/OptimizerMonitor.h>
33 
34 #include <gsl/gsl_multimin.h>
35 #include <gsl/gsl_blas.h>
36 
37 namespace QUESO {
38 
39 // We need to extern "C" because gsl needs a pointer to a C function to
40 // minimize
41 extern "C" {
42  // This evaluate -log posterior
43  double c_evaluate(const gsl_vector * x, void * context) {
44 
45  GslOptimizer * optimizer = static_cast<GslOptimizer * >(context);
46 
47  GslVector state(
48  optimizer->objectiveFunction().domainSet().vectorSpace().zeroVector());
49 
50  // DM: Doing this copy sucks, but whatever. It'll do for now.
51  for (unsigned int i = 0; i < state.sizeLocal(); i++) {
52  state[i] = gsl_vector_get(x, i);
53  }
54 
55  // Bail early if GSL tries to evaluate outside of the domain
56  if (!optimizer->objectiveFunction().domainSet().contains(state)) {
57  return GSL_NAN;
58  }
59 
60  // Should cache derivative here so we don't a) segfault in the user's code
61  // and b) so we don't recompute stuff
62  double result = -optimizer->objectiveFunction().lnValue(state, NULL, NULL,
63  NULL, NULL);
64 
65  return result;
66  }
67 
 // This evaluates the derivative of -log posterior at the point x.
 // If the user's lnValue fills the gradient vector, that (negated) gradient
 // is used directly; otherwise a forward finite difference is computed.
 // The result is written into `derivative` (GSL_NAN components on failure).
 void c_evaluate_derivative(const gsl_vector * x, void * context,
 gsl_vector * derivative) {
 GslOptimizer * optimizer = static_cast<GslOptimizer * >(context);

 GslVector state(
 optimizer->objectiveFunction().domainSet().vectorSpace().zeroVector());
 GslVector deriv(
 optimizer->objectiveFunction().domainSet().vectorSpace().zeroVector());

 // DM: Doing this copy sucks, but whatever. It'll do for now.
 for (unsigned int i = 0; i < state.sizeLocal(); i++) {
 state[i] = gsl_vector_get(x, i);

 // We fill with GSL_NAN and use it as a flag to check later that the user
 // actually fills the derivative vector with stuff
 deriv[i] = GSL_NAN;
 }

 if (!optimizer->objectiveFunction().domainSet().contains(state)) {
 // Fill derivative with error codes if the point is outside of the
 // domain
 for (unsigned int i = 0; i < deriv.sizeLocal(); i++) {
 gsl_vector_set(derivative, i, GSL_NAN);
 }
 }
 else {
 // We should cache the return value here so we don't recompute stuff
 double fx = -optimizer->objectiveFunction().lnValue(state, NULL, &deriv,
 NULL, NULL);

 // Decide whether or not we need to do a finite difference based on
 // whether the user actually filled deriv with values that are not
 // GSL_NAN
 //
 // We're currently doing this check every time this function gets called.
 // We could probably pull this logic out of here and put it somewhere
 // where it only happens once
 bool userComputedDerivative = true;
 for (unsigned int i = 0; i < deriv.sizeLocal(); i++) {
 // If the user missed out a derivative in any direction, fall back to
 // a finite difference
 if (gsl_isnan(deriv[i])) {
 userComputedDerivative = false;
 break;
 }
 }

 if (userComputedDerivative) {
 // lnValue gave us d(log posterior); GSL minimizes -log posterior,
 // hence the sign flip below.
 for (unsigned int i = 0; i < deriv.sizeLocal(); i++) {
 gsl_vector_set(derivative, i, -deriv[i]); // We need the minus sign
 }
 }
 else {
 // Finite difference step-size
 double h = optimizer->getFiniteDifferenceStepSize();

 // User did not provide a derivative, so do a finite difference
 // (one-sided forward difference, one extra lnValue call per dimension)
 for (unsigned int i = 0; i < deriv.sizeLocal(); i++) {
 double tempState = state[i];
 state[i] += h;

 // User didn't provide a derivative, so we don't bother passing in
 // the derivative vector again
 double fxph = -optimizer->objectiveFunction().lnValue(state, NULL,
 NULL, NULL, NULL);

 // Reset the state back to what it was before
 state[i] = tempState;

 // Make sure we didn't do anything dumb and tell gsl if we did
 if (!gsl_isnan(fx) && !gsl_isnan(fxph)) {
 gsl_vector_set(derivative, i, (fxph - fx) / h);
 }
 else {
 gsl_vector_set(derivative, i, GSL_NAN);
 }
 }
 }
 }
 }
149 
150  // This evaluates -log posterior and the derivative of -log posterior
151  void c_evaluate_with_derivative(const gsl_vector * x, void * context,
152  double * f, gsl_vector * derivative) {
153  // We don't need to call both of these
154  *f = c_evaluate(x, context);
155  c_evaluate_derivative(x, context, derivative);
156  }
157 } // End extern "C"
158 
160  const BaseScalarFunction<GslVector, GslMatrix> & objectiveFunction)
161  : BaseOptimizer(),
162  m_objectiveFunction(objectiveFunction),
163  m_initialPoint(new GslVector(objectiveFunction.domainSet().
164  vectorSpace().zeroVector())),
165  m_minimizer(new GslVector(this->m_objectiveFunction.domainSet().
166  vectorSpace().zeroVector())),
167  m_solver_type(BFGS2),
168  m_fstep_size(this->m_objectiveFunction.domainSet().vectorSpace().zeroVector()),
169  m_fdfstep_size(1.0),
170  m_line_tol(0.1)
171 {
172  // We initialize the minimizer to GSL_NAN just in case the optimization fails
173  m_minimizer->cwSet(GSL_NAN);
174 
175  // Set to documented default value.
176  m_fstep_size.cwSet(0.1);
177 }
178 
180 {
181  delete this->m_initialPoint;
182 }
183 
185 
186  // First check that initial guess is reasonable
187  if (!this->m_objectiveFunction.domainSet().contains(*(this->m_initialPoint)))
188  {
189  if( m_objectiveFunction.domainSet().env().fullRank() == 0 )
190  {
191  std::cerr << "Minimization was given initial point outside of domain"
192  << std::endl;
193  }
194  queso_error();
195  }
196 
197  unsigned int dim = this->m_objectiveFunction.domainSet().vectorSpace().
198  zeroVector().sizeLocal();
199 
201  {
202  this->minimize_with_gradient( dim, monitor );
203  }
204  else
205  {
206  this->minimize_no_gradient( dim, monitor );
207  }
208 
209  return;
210 }
211 
214 {
215  return this->m_objectiveFunction;
216 }
217 
218 void
220 {
221  for (unsigned int i = 0; i < initialPoint.sizeLocal(); i++) {
222  (*(this->m_initialPoint))[i] = initialPoint[i];
223  }
224 }
225 
226 const GslVector &
228 {
229  return *(this->m_minimizer);
230 }
231 
233  {
234  m_solver_type = solver;
235  }
236 
238  {
239  bool gradient_needed = false;
240 
241  switch(solver)
242  {
243  case(FLETCHER_REEVES_CG):
244  case(POLAK_RIBIERE_CG):
245  case(BFGS):
246  case(BFGS2):
247  case(STEEPEST_DESCENT):
248  {
249  gradient_needed = true;
250  break;
251  }
252  case(NELDER_MEAD):
253  case(NELDER_MEAD2):
254  case(NELDER_MEAD2_RAND):
255  {
256  break;
257  }
258  default:
259  {
260  // Wat?!
261  queso_error();
262  }
263  } // switch(solver)
264 
265  return gradient_needed;
266  }
267 
269  {
270  // Set initial point
271  gsl_vector * x = gsl_vector_alloc(dim);
272  for (unsigned int i = 0; i < dim; i++) {
273  gsl_vector_set(x, i, (*m_initialPoint)[i]);
274  }
275 
276  // Tell GSL which solver we're using
277  const gsl_multimin_fdfminimizer_type* type = NULL;
278 
279  switch(m_solver_type)
280  {
281  case(FLETCHER_REEVES_CG):
282  type = gsl_multimin_fdfminimizer_conjugate_fr;
283  break;
284  case(POLAK_RIBIERE_CG):
285  type = gsl_multimin_fdfminimizer_conjugate_pr;
286  break;
287  case(BFGS):
288  type = gsl_multimin_fdfminimizer_vector_bfgs;
289  break;
290  case(BFGS2):
291  type = gsl_multimin_fdfminimizer_vector_bfgs2;
292  break;
293  case(STEEPEST_DESCENT):
294  type = gsl_multimin_fdfminimizer_steepest_descent;
295  break;
296  case(NELDER_MEAD):
297  case(NELDER_MEAD2):
298  case(NELDER_MEAD2_RAND):
299  default:
300  // Wat?!
301  queso_error();
302  }
303 
304  // Init solver
305  gsl_multimin_fdfminimizer * solver =
306  gsl_multimin_fdfminimizer_alloc(type, dim);
307 
308  // Point GSL to the right functions
309  gsl_multimin_function_fdf minusLogPosterior;
310  minusLogPosterior.n = dim;
311  minusLogPosterior.f = &c_evaluate;
312  minusLogPosterior.df = &c_evaluate_derivative;
313  minusLogPosterior.fdf = &c_evaluate_with_derivative;
314  minusLogPosterior.params = (void *)(this);
315 
316  gsl_multimin_fdfminimizer_set(solver, &minusLogPosterior, x, m_fdfstep_size, m_line_tol);
317 
318  int status;
319  size_t iter = 0;
320 
321  do {
322  iter++;
323  status = gsl_multimin_fdfminimizer_iterate(solver);
324 
325  if (status) {
326  if( m_objectiveFunction.domainSet().env().fullRank() == 0 )
327  {
328  std::cerr << "Error while GSL does optimisation. "
329  << "See below for GSL error type." << std::endl;
330  std::cerr << "Gsl error: " << gsl_strerror(status) << std::endl;
331  }
332  break;
333  }
334 
335  status = gsl_multimin_test_gradient(solver->gradient, this->getTolerance());
336 
337  if(monitor)
338  {
339  gsl_vector* x = gsl_multimin_fdfminimizer_x(solver);
340  std::vector<double> x_min(dim);
341  for( unsigned int i = 0; i < dim; i++)
342  x_min[i] = gsl_vector_get(x,i);
343 
344  double f = gsl_multimin_fdfminimizer_minimum(solver);
345 
346  gsl_vector* grad = gsl_multimin_fdfminimizer_gradient(solver);
347  double grad_norm = gsl_blas_dnrm2(grad);
348 
349  monitor->append( x_min, f, grad_norm );
350  }
351 
352  } while ((status == GSL_CONTINUE) && (iter < this->getMaxIterations()));
353 
354  for (unsigned int i = 0; i < dim; i++) {
355  (*m_minimizer)[i] = gsl_vector_get(solver->x, i);
356  }
357 
358  // We're being good human beings and cleaning up the memory we allocated
359  gsl_multimin_fdfminimizer_free(solver);
360  gsl_vector_free(x);
361 
362  return;
363  }
364 
366  {
367  // Set initial point
368  gsl_vector* x = gsl_vector_alloc(dim);
369  for (unsigned int i = 0; i < dim; i++) {
370  gsl_vector_set(x, i, (*m_initialPoint)[i]);
371  }
372 
373  // Tell GSL which solver we're using
374  const gsl_multimin_fminimizer_type* type = NULL;
375 
376  switch(m_solver_type)
377  {
378  case(NELDER_MEAD):
379  type = gsl_multimin_fminimizer_nmsimplex;
380  break;
381  case(NELDER_MEAD2):
382  type = gsl_multimin_fminimizer_nmsimplex2;
383  break;
384  case(NELDER_MEAD2_RAND):
385  type = gsl_multimin_fminimizer_nmsimplex2rand;
386  break;
387  case(FLETCHER_REEVES_CG):
388  case(POLAK_RIBIERE_CG):
389  case(BFGS):
390  case(BFGS2):
391  case(STEEPEST_DESCENT):
392  default:
393  // Wat?!
394  queso_error();
395  }
396 
397  // Init solver
398  gsl_multimin_fminimizer* solver =
399  gsl_multimin_fminimizer_alloc(type, dim);
400 
401  // Point GSL at the right functions
402  gsl_multimin_function minusLogPosterior;
403  minusLogPosterior.n = dim;
404  minusLogPosterior.f = &c_evaluate;
405  minusLogPosterior.params = (void *)(this);
406 
407  // Needed for these gradient free algorithms.
408  gsl_vector* step_size = gsl_vector_alloc(dim);
409 
410  for(unsigned int i = 0; i < dim; i++) {
411  gsl_vector_set(step_size, i, m_fstep_size[i]);
412  }
413 
414  gsl_multimin_fminimizer_set(solver, &minusLogPosterior, x, step_size);
415 
416  int status;
417  size_t iter = 0;
418  double size = 0.0;
419 
420  do
421  {
422  iter++;
423  status = gsl_multimin_fminimizer_iterate(solver);
424 
425  if (status) {
426  if( m_objectiveFunction.domainSet().env().fullRank() == 0 )
427  {
428  std::cerr << "Error while GSL does optimisation. "
429  << "See below for GSL error type." << std::endl;
430  std::cerr << "Gsl error: " << gsl_strerror(status) << std::endl;
431  }
432  break;
433  }
434 
435  size = gsl_multimin_fminimizer_size(solver);
436 
437  status = gsl_multimin_test_size (size, this->getTolerance());
438 
439  if(monitor)
440  {
441  gsl_vector* x = gsl_multimin_fminimizer_x(solver);
442  std::vector<double> x_min(dim);
443  for( unsigned int i = 0; i < dim; i++)
444  x_min[i] = gsl_vector_get(x,i);
445 
446  double f = gsl_multimin_fminimizer_minimum(solver);
447 
448  monitor->append( x_min, f, size );
449  }
450 
451  }
452 
453  while ((status == GSL_CONTINUE) && (iter < this->getMaxIterations()));
454 
455  for (unsigned int i = 0; i < dim; i++) {
456  (*m_minimizer)[i] = gsl_vector_get(solver->x, i);
457  }
458 
459  // We're being good human beings and cleaning up the memory we allocated
460  gsl_vector_free(step_size);
461  gsl_multimin_fminimizer_free(solver);
462  gsl_vector_free(x);
463 
464  return;
465  }
466 
467  void GslOptimizer::set_step_size( const GslVector& step_size )
468  {
469  m_fstep_size = step_size;
470  }
471 
472  void GslOptimizer::set_step_size( double step_size )
473  {
474  m_fdfstep_size = step_size;
475  }
476 
478  {
479  SolverType solver_type;
480 
481  if( solver == std::string("fletcher_reeves_cg") )
482  solver_type = FLETCHER_REEVES_CG;
483  else if( solver == std::string("polak_ribiere_cg") )
484  solver_type = POLAK_RIBIERE_CG;
485  else if( solver == std::string("bfgs") )
486  solver_type = BFGS;
487  else if( solver == std::string("bfgs2") )
488  solver_type = BFGS2;
489  else if( solver == std::string("steepest_decent") )
490  solver_type = STEEPEST_DESCENT;
491  else if( solver == std::string("nelder_mead") )
492  solver_type = NELDER_MEAD;
493  else if( solver == std::string("nelder_mead2") )
494  solver_type = NELDER_MEAD2;
495  else if( solver == std::string("nelder_mead2_rand") )
496  solver_type = NELDER_MEAD2_RAND;
497  else
498  {
499  if( m_objectiveFunction.domainSet().env().fullRank() == 0 )
500  {
501  std::cerr << "Error: Invalid GslOptimizer solver name: " << solver << std::endl
502  << " Valids choices are: fletcher_reeves_cg" << std::endl
503  << " polak_ribiere_cg" << std::endl
504  << " bfgs" << std::endl
505  << " bfgs2" << std::endl
506  << " steepest_decent" << std::endl
507  << " nelder_mead" << std::endl
508  << " nelder_mead2" << std::endl
509  << " nelder_mead2_rand" << std::endl;
510  }
511  queso_error();
512  }
513 
514  return solver_type;
515  }
516 
517  void GslOptimizer::set_solver_type( std::string& solver )
518  {
519  this->set_solver_type( this->string_to_enum(solver) );
520  }
521 
522 } // End namespace QUESO
GslOptimizer(const BaseScalarFunction< GslVector, GslMatrix > &objectiveFunction)
Constructs an object that will maximize a scalar function.
Definition: GslOptimizer.C:159
void append(std::vector< double > &x_min, double objective, double norm)
Add current value of minimizer, objective, and error norm.
double m_line_tol
Line minimization tolerance in gradient-based algorithms.
Definition: GslOptimizer.h:134
void set_step_size(const GslVector &step_size)
Sets step size used in gradient-free solvers.
Definition: GslOptimizer.C:467
virtual ~GslOptimizer()
Destructor.
Definition: GslOptimizer.C:179
SolverType m_solver_type
Definition: GslOptimizer.h:125
A base class for handling optimisation of scalar functions.
Definition: GslOptimizer.h:50
int dim
Definition: ann2fig.cpp:81
void setInitialPoint(const GslVector &initialPoint)
Set the point at which the optimization starts.
Definition: GslOptimizer.C:219
const BaseScalarFunction< GslVector, GslMatrix > & m_objectiveFunction
Definition: GslOptimizer.h:120
const BaseScalarFunction< GslVector, GslMatrix > & objectiveFunction() const
Returns the objective function.
Definition: GslOptimizer.C:213
A templated (base) class for handling scalar functions.
virtual void minimize(OptimizerMonitor *monitor=NULL)
Minimize the objective function, starting at m_initialPoint.
Definition: GslOptimizer.C:184
bool solver_needs_gradient(SolverType solver)
Helper function.
Definition: GslOptimizer.C:237
void minimize_with_gradient(unsigned int dim, OptimizerMonitor *monitor)
Definition: GslOptimizer.C:268
void cwSet(double value)
Component-wise sets all values to this with value.
Definition: GslVector.C:326
A base class for handling optimisation of scalar functions.
Definition: Optimizer.h:44
double m_fdfstep_size
For use in gradient-based algorithms.
Definition: GslOptimizer.h:131
GslVector * m_initialPoint
Definition: GslOptimizer.h:122
unsigned int getMaxIterations() const
Returns the maximum number of iterations the optimizer will do.
Definition: Optimizer.C:41
GslVector * m_minimizer
Definition: GslOptimizer.h:123
#define queso_error()
Definition: asserts.h:53
double getTolerance() const
Returns the tolerance used to test for an extremum in the optimizer.
Definition: Optimizer.C:47
void set_solver_type(SolverType solver)
Definition: GslOptimizer.C:232
unsigned int sizeLocal() const
Returns the length of this vector.
Definition: GslVector.C:240
void minimize_no_gradient(unsigned int dim, OptimizerMonitor *monitor)
Definition: GslOptimizer.C:365
const GslVector & minimizer() const
Return the point that minimizes the objective function.
Definition: GslOptimizer.C:227
void c_evaluate_derivative(const gsl_vector *x, void *context, gsl_vector *derivative)
Definition: GslOptimizer.C:69
void c_evaluate_with_derivative(const gsl_vector *x, void *context, double *f, gsl_vector *derivative)
Definition: GslOptimizer.C:151
double getFiniteDifferenceStepSize() const
Returns the step size used in the finite difference formula.
Definition: Optimizer.C:53
Class for vector operations using GSL library.
Definition: GslVector.h:49
GslVector m_fstep_size
For use in gradient-free algorithms.
Definition: GslOptimizer.h:128
Object to monitor convergence of optimizers.
double c_evaluate(const gsl_vector *x, void *context)
Definition: GslOptimizer.C:43
SolverType string_to_enum(std::string &solver)
Definition: GslOptimizer.C:477

Generated on Fri Jun 17 2016 14:17:40 for queso-0.55.0 by  doxygen 1.8.5