MADNESS version 0.9
solvers.h
/*
  This file is part of MADNESS.

  Copyright (C) 2007,2010 Oak Ridge National Laboratory

  This program is free software; you can redistribute it and/or modify
  it under the terms of the GNU General Public License as published by
  the Free Software Foundation; either version 2 of the License, or
  (at your option) any later version.

  This program is distributed in the hope that it will be useful,
  but WITHOUT ANY WARRANTY; without even the implied warranty of
  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  GNU General Public License for more details.

  You should have received a copy of the GNU General Public License
  along with this program; if not, write to the Free Software
  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA

  For more information please contact:

  Robert J. Harrison
  Oak Ridge National Laboratory
  One Bethel Valley Road
  P.O. Box 2008, MS-6367

  email: harrisonrj@ornl.gov
  tel:   865-241-3937
  fax:   865-572-0680

  $Id$
*/
#ifndef MADNESS_LINALG_SOLVERS_H__INCLUDED
#define MADNESS_LINALG_SOLVERS_H__INCLUDED

#include <madness/tensor/tensor.h>
#include <madness/world/print.h>
#include <iostream>
#include <madness/tensor/tensor_lapack.h>  // declares gelss(), used by KAIN() below

namespace madness {

    /// Solves non-linear equation using KAIN (returns coefficients to compute next vector)
    template <typename T>
    Tensor<T> KAIN(const Tensor<T>& Q, double rcond=1e-12) {
        const int nvec = Q.dim(0);
        const int m = nvec-1;

        // With a single vector there is nothing to mix
        if (nvec == 1) {
            Tensor<T> c(1);
            c(0L) = 1.0;
            return c;
        }

        // Reduced m x m system for the first m coefficients; the last
        // coefficient is fixed below by requiring the coefficients to sum to one
        Tensor<T> A(m,m);
        Tensor<T> b(m);
        for (long i=0; i<m; ++i) {
            b(i) = Q(m,m) - Q(i,m);
            for (long j=0; j<m; ++j) {
                A(i,j) = Q(i,j) - Q(m,j) - Q(i,m) + Q(m,m);
            }
        }

        // print("Q");
        // print(Q);
        // print("A");
        // print(A);
        // print("b");
        // print(b);

        // Solve A x = b by SVD-based least squares (rcond controls the singular-value cutoff)
        Tensor<T> x;
        Tensor<double> s, sumsq;
        long rank;
        gelss(A, b, rcond, x, s, rank, sumsq);
        // print("singular values", s);
        // print("rank", rank);
        // print("solution", x);

        Tensor<T> c(nvec);
        T sumC = 0.0;
        for (long i=0; i<m; ++i) sumC += x(i);
        c(Slice(0,m-1)) = x;
        // print("SUMC", nvec, m, sumC);
        c(m) = 1.0 - sumC;

        // print("returned C", c);

        return c;
    }
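
    // Typical use of KAIN (illustrative sketch; the names xlist/rlist, the
    // inner-product convention, and the final update step are assumptions,
    // not part of this header): keep a history of trial vectors x_i and
    // residuals r_i = F(x_i), build Q(i,j) = <x_i | r_j>, and let KAIN return
    // mixing coefficients that sum to one.
    //
    //     long nvec = xlist.size();                   // number of stored trials
    //     Tensor<double> Q(nvec, nvec);
    //     for (long i=0; i<nvec; ++i)
    //         for (long j=0; j<nvec; ++j)
    //             Q(i,j) = xlist[i].trace(rlist[j]);  // inner product <x_i | r_j>
    //     Tensor<double> c = KAIN(Q);                 // c(nvec-1) = 1 - sum of the others
    //
    // The coefficients are then used to combine the stored trial vectors and
    // residuals into the next trial vector.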

    /// The interface to be provided by targets for non-linear equation solver
    struct SolverTargetInterface {
        /// Should return the residual (vector F(x))
        virtual Tensor<double> residual(const Tensor<double>& x) = 0;

        /// Override this to return true if the Jacobian is implemented
        virtual bool provides_jacobian() const {return false;}

        /// Some solvers require the Jacobian or are faster if an analytic form is available
        virtual Tensor<double> jacobian(const Tensor<double>& x) {
            throw "not implemented";
        }

        /// Implement this if advantageous to compute residual and Jacobian simultaneously
        virtual void residual_and_jacobian(const Tensor<double>& x,
                                           Tensor<double>& residual, Tensor<double>& jacobian) {
            residual = this->residual(x);
            jacobian = this->jacobian(x);
        }

        virtual ~SolverTargetInterface() {}
    };
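
    // Minimal SolverTargetInterface implementation (illustrative sketch; the
    // struct name SqrtTwoTarget is hypothetical): the residual of the scalar
    // equation x*x - 2 = 0.
    //
    //     struct SqrtTwoTarget : public SolverTargetInterface {
    //         Tensor<double> residual(const Tensor<double>& x) {
    //             Tensor<double> r(1);
    //             r(0L) = x(0L)*x(0L) - 2.0;   // F(x) = x^2 - 2
    //             return r;
    //         }
    //     };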

    /// The interface to be provided by functions to be optimized
    struct OptimizationTargetInterface {

        /// Should return the value of the objective function
        virtual double value(const Tensor<double>& x) = 0;

        /// Override this to return true if the derivative is implemented
        virtual bool provides_gradient() const {return false;}

        /// Should return the derivative of the function
        virtual Tensor<double> gradient(const Tensor<double>& x) {
            throw "not implemented";
        }

        /// Reimplement if more efficient to evaluate both value and gradient in one call
        virtual void value_and_gradient(const Tensor<double>& x,
                                        double& value,
                                        Tensor<double>& gradient) {
            value = this->value(x);
            gradient = this->gradient(x);
        }

        /// Numerical test of the derivative ... optionally prints to stdout, returns max abs error
        double test_gradient(Tensor<double>& x, double value_precision, bool doprint=true);

        virtual ~OptimizationTargetInterface() {}
    };
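
    // Minimal OptimizationTargetInterface implementation (illustrative sketch;
    // the struct name Quadratic is hypothetical): a shifted quadratic
    // f(x) = sum_i (x_i - 1)^2 with its analytic gradient.
    //
    //     struct Quadratic : public OptimizationTargetInterface {
    //         double value(const Tensor<double>& x) {
    //             double sum = 0.0;
    //             for (long i=0; i<x.dim(0); ++i) sum += (x(i)-1.0)*(x(i)-1.0);
    //             return sum;                           // f(x) = sum_i (x_i-1)^2
    //         }
    //         bool provides_gradient() const {return true;}
    //         Tensor<double> gradient(const Tensor<double>& x) {
    //             Tensor<double> g(x.dim(0));
    //             for (long i=0; i<x.dim(0); ++i) g(i) = 2.0*(x(i)-1.0);
    //             return g;                             // df/dx_i = 2 (x_i - 1)
    //         }
    //     };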

    /// The interface to be provided by solvers ... NOT USED ANYWHERE?
    struct SolverInterface {
        virtual bool solve(Tensor<double>& x) = 0;
        virtual bool converged() const = 0;
        virtual double residual_norm() const = 0;
        virtual ~SolverInterface() {}
    };

    /// The interface to be provided by optimizers
    struct OptimizerInterface {
        virtual bool optimize(Tensor<double>& x) = 0;
        virtual bool converged() const = 0;
        virtual double value() const = 0;
        virtual double gradient_norm() const = 0;
        virtual ~OptimizerInterface() {}
    };


    /// Unconstrained minimization via steepest descent
    class SteepestDescent : public OptimizerInterface {
        std::shared_ptr<OptimizationTargetInterface> target;
        const double tol;
        const double value_precision;    // Numerical precision of value
        const double gradient_precision; // Numerical precision of each element of residual
        double f;
        double gnorm;

    public:
        SteepestDescent(const std::shared_ptr<OptimizationTargetInterface>& tar,
                        double tol = 1e-6,
                        double value_precision = 1e-12,
                        double gradient_precision = 1e-12);

        bool optimize(Tensor<double>& x);

        bool converged() const;

        double gradient_norm() const;

        double value() const;

        virtual ~SteepestDescent() { }
    };


    /// Optimization via quasi-Newton (BFGS or SR1 update)
    class QuasiNewton : public OptimizerInterface {
    private:
        std::string update;              // One of BFGS or SR1
        std::shared_ptr<OptimizationTargetInterface> target;
        const int maxiter;
        const double tol;
        const double value_precision;    // Numerical precision of value
        const double gradient_precision; // Numerical precision of each element of residual
        double f;
        double gnorm;
        Tensor<double> h;
        int n;
        bool printtest;

        double line_search(double a1, double f0, double dxgrad, const Tensor<double>& x, const Tensor<double>& dx);

        void hessian_update_sr1(const Tensor<double>& s, const Tensor<double>& y);

        void hessian_update_bfgs(const Tensor<double>& dx,
                                 const Tensor<double>& dg);

        Tensor<double> new_search_direction(const Tensor<double>& g);

    public:
        QuasiNewton(const std::shared_ptr<OptimizationTargetInterface>& tar,
                    int maxiter = 20,
                    double tol = 1e-6,
                    double value_precision = 1e-12,
                    double gradient_precision = 1e-12);

        /// Choose update method (currently only "BFGS" or "SR1")
        void set_update(const std::string& method);

        /// Choose whether to run (and print) the numerical gradient test before optimizing
        void set_test(const bool& test_level);

        /// Runs the optimizer
        bool optimize(Tensor<double>& x);

        /// After running the optimizer returns true if converged
        bool converged() const;

        /// Value of the objective function
        double value() const;

        /// Resets Hessian to default guess
        void reset_hessian() {h = Tensor<double>();}

        /// Sets Hessian to given matrix
        void set_hessian(const Tensor<double>& matrix) {h = madness::copy(matrix);}

        /// Value of the gradient norm
        double gradient_norm() const;

        virtual ~QuasiNewton() {}
    };
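
    // Illustrative sketch of driving the optimizer; the Quadratic target is the
    // hypothetical example sketched above, everything else uses only this header.
    //
    //     std::shared_ptr<OptimizationTargetInterface> target(new Quadratic());
    //     QuasiNewton qn(target);          // defaults: maxiter=20, tol=1e-6
    //     qn.set_update("BFGS");           // or "SR1"
    //     Tensor<double> x(3);             // starting guess, here x = 0
    //     bool ok = qn.optimize(x);        // x is updated in place
    //     if (ok) print("minimum", qn.value(), "gradient norm", qn.gradient_norm());
    //
    // SteepestDescent follows the same pattern, minus the choice of update.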
}

#endif // MADNESS_LINALG_SOLVERS_H__INCLUDED