doc/doxygen/diff__optim_8h_source.html

 /* =========================================================================== *

    |

    |  Copyright (c) 1994-2011 by Kobus Barnard (author)

    |

    |  Personal and educational use of this code is granted, provided that this

    |  header is kept intact, and that the authorship is not misrepresented, that

    |  its use is acknowledged in publications, and relevant papers are cited.

    |

    |  For other use contact the author (kobus AT cs DOT arizona DOT edu).

    |

    |  Please note that the code in this file has not necessarily been adequately

    |  tested. Naturally, there is no guarantee of performance, support, or fitness

    |  for any particular task. Nonetheless, I am interested in hearing about

    |  problems that you encounter.

    |

    |  Author:  Ernesto Brau

  * =========================================================================== */


 /* $Id$ */


 #ifndef DIFF_OPTIM_H

 #define DIFF_OPTIM_H


 #include <l/l_verbose.h>

 #include <l_cpp/l_exception.h>

 #include <m_cpp/m_vector.h>

 #include <diff_cpp/diff_util.h>

 #include <vector>

 #include <utility>

 #include <limits>

 #include <algorithm>

 #include <functional>


 namespace kjb {


 /**
  * @brief   Maximizes a function by evaluating it at all points in a grid.
  *
  * Each point produced by next_point() is passed to fcn. Whenever the value
  * is strictly greater than the best one seen so far, that point is copied
  * into mxm.
  *
  * @param   fcn     Callable invoked as fcn(x), with x of type M; its result
  *                  is stored in a double.
  * @param   bounds  One (first, second) pair per dimension; the bin width of
  *                  dimension i is (second - first) / nbins.
  * @param   nbins   Divisor used to compute the bin widths; also forwarded
  *                  to next_point().
  *                  NOTE(review): nbins == 0 is not guarded against and
  *                  yields non-finite bin widths.
  * @param   adapter Forwarded to next_point() together with the working
  *                  point.
  * @param   mxm     In: value used to initialise the working point.
  *                  Out: the best point found. Left untouched if no
  *                  evaluated value exceeds the initial best.
  *
  * @return  The largest value of fcn found, or
  *          -std::numeric_limits<double>::max() if no evaluated value
  *          exceeded it.
  *
  * @throws  Illegal_argument (via IFT) if bounds is empty.
  */
 template<class F, class M, class A>
 double grid_maximize
 (
     const F& fcn,
     const std::vector<std::pair<double, double> >& bounds,
     size_t nbins,
     const A& adapter,
     M& mxm
 )
 {
     const size_t D = bounds.size();
     IFT(D != 0, Illegal_argument, "Cannot optimize 0-dimensional function");

     if(D > 8)
     {
         // "%d" consumes an int from the variadic argument list, but D is a
         // size_t; convert explicitly so the argument type matches the
         // conversion specifier.
         kjb_c::warn_pso("The dimensionality of this function is %d; this "
                         "approximation might take a really long time.",
                         static_cast<int>(D));
     }

     // width of one bin along each dimension
     std::vector<double> bin_widths(D);
     for(size_t i = 0; i < D; i++)
     {
         bin_widths[i] = (bounds[i].second - bounds[i].first)/nbins;
     }

     // indices starts out empty; it is owned and advanced by next_point()
     std::vector<size_t> indices;
     M x = mxm;
     double mx = -std::numeric_limits<double>::max();
     while(next_point(bounds, bin_widths, nbins, indices, x, adapter))
     {
         double fx = fcn(x);
         if(fx > mx)
         {
             mx = fx;
             mxm = x;
         }
     }

     return mx;
 }


 template<class F, class V>

 inline

 double grid_maximize

 (

     const F& fcn,

     const std::vector<std::pair<double, double> >& bounds,

     size_t nbins,

     V& mxm

 )

 {

     const size_t D = bounds.size();

     if(mxm.size() != D)

     {

         mxm.resize(D);

     }


     return grid_maximize(fcn, bounds, nbins, Vector_adapter<V>(), mxm);

 }


 /**
  * @brief   Maximizes a function using a simple gradient ascent method.
  *
  * All parameters are moved at once: on each iteration the gradient is
  * scaled element-wise by steps and applied to x with move_params(). The
  * iteration stops at the first move that does not strictly increase
  * fcn(x); that last move is then undone by applying its negation.
  *
  * @param   fcn     Callable invoked as fcn(x); its result is stored in a
  *                  double.
  * @param   x       Model to optimize; modified in place.
  * @param   steps   Per-parameter step sizes; must have adapter.size(&x)
  *                  elements.
  * @param   grad    Callable invoked as grad(x); its result is assigned to
  *                  a Vector.
  * @param   adapter Supplies size(&x) and is forwarded to move_params().
  *
  * @throws  Illegal_argument (via IFT) if steps has the wrong length.
  */
 template<class F, class M, class G, class A>
 void gradient_ascent
 (
     const F& fcn,
     M& x,
     const std::vector<double>& steps,
     const G& grad,
     const A& adapter
 )
 {
     const size_t D = adapter.size(&x);
     IFT(D == steps.size(), Illegal_argument,
         "cannot perform gradient ascent: wrong number of step sizes.");

     Vector g(D);
     std::vector<double> exg(D);

     // simultaneous optimization of every parameter
     double best_f = fcn(x);
     for(;;)
     {
         // displacement for this iteration: step size times gradient
         g = grad(x);
         std::transform(steps.begin(), steps.end(), g.begin(), exg.begin(),
                        std::multiplies<double>());

         // apply it and re-evaluate
         move_params(x, exg, adapter);
         const double moved_f = fcn(x);

         // stop as soon as the move fails to strictly improve the value
         if(!(moved_f > best_f))
         {
             break;
         }

         best_f = moved_f;
     }

     // the final move did not help: reverse it
     for(size_t k = 0; k < exg.size(); ++k)
     {
         exg[k] = -exg[k];
     }

     move_params(x, exg, adapter);
 }


 template<class F, class V, class G>

 inline

 void gradient_ascent

 (

     const F& fcn,

     V& x,

     const std::vector<double>& steps,

     const G& grad

 )

 {

     gradient_ascent(fcn, x, steps, grad, Vector_adapter<V>());

 }


 template<class F, class M, class A>

 void refine_max

 (

     const F& fcn,

     M& x,

     const std::vector<double>& steps,

     const A& adapter

 )

 {

     double cur_pt = fcn(x);

     bool at_max = false;

     while(!at_max)

     {

         at_max = true;

         for(size_t i = 0; i < adapter.size(&x); i++)

         {

             double xi = adapter.get(&x, i);

             // move right

             move_param(x, i, steps[i], adapter);

             double right_pt = fcn(x);


             // move left

             move_param(x, i, -2.0*steps[i], adapter);

             double left_pt = fcn(x);


             // move back

             adapter.set(&x, i, xi);

             if(cur_pt >= left_pt && cur_pt >= right_pt) continue;


             at_max = false;

             if(left_pt > right_pt)

             {

                 move_param(x, i, -steps[i], adapter);

                 cur_pt = left_pt;

             }

             else

             {

                 move_param(x, i, steps[i], adapter);

                 cur_pt = right_pt;

             }

         }

     }

 }


 } //namespace kjb


 #endif /*DIFF_OPTIM_H */


kjb::max
Int_matrix::Value_type max(const Int_matrix &mat)
Return the maximum value in this matrix.
Definition: l_int_matrix.h:1397

kjb::gradient_ascent
void gradient_ascent(const F &fcn, M &x, const std::vector< double > &steps, const G &grad, const A &adapter)
Maximizes a function using a simple gradient ascent method.
Definition: diff_optim.h:148

kjb::move_param
void move_param(Model &x, size_t i, double dv, const Adapter &aptr)
Helper function that moves a parameter by an amount.
Definition: diff_util.h:102

kjb::Vector
This class implements vectors, in the linear-algebra sense, with real-valued elements.
Definition: m_vector.h:87

IFT
#define IFT(a, ex, msg)
Definition: l_exception.h:101

kjb::next_point
bool next_point(const std::vector< std::pair< double, double > > &bounds, const std::vector< double > &widths, size_t nbins, std::vector< size_t > &indices, M &x, const A &adapter)
Gets the next point in a N-dimensional grid.
Definition: diff_util.h:145

kjb::move_params
void move_params(Model &x, size_t i, size_t j, double dv, double dw, const Adapter &aptr)
Helper function that moves a pair of parameters by an amount.
Definition: diff_util.h:111

x
x
Definition: APPgetLargeConnectedEdges.m:100

diff_util.h

kjb::Vector_adapter
Default adapter for the hessian function.
Definition: diff_util.h:42

kjb::Illegal_argument
Object thrown when an argument to a function is not acceptable.
Definition: l_exception.h:377

i
get the indices of edges in each direction for i
Definition: APPgetLargeConnectedEdges.m:48

D
D
Definition: APPgetLargeConnectedEdges.m:106

l_exception.h
Support for error handling exception classes in libKJB.

kjb::grid_maximize
double grid_maximize(const F &fcn, const std::vector< std::pair< double, double > > &bounds, size_t nbins, const A &adapter, M &mxm)
Maximizes a function by evaluating at all points in a grid.
Definition: diff_optim.h:56

kjb::refine_max
void refine_max(const F &fcn, M &x, const std::vector< double > &steps, const A &adapter)
Refine the maximum of a function.
Definition: diff_optim.h:236

m_vector.h
Definition for the Vector class, a thin wrapper on the KJB Vector struct and its related functionality.