abacus-develop/opt__TN_8hpp_source.html

#ifndef OPT_TN_H

#define OPT_TN_H


#include "opt_CG.h"

#include <cmath>
#include <limits>
#include <memory>


namespace ModuleBase

{


/**
 * @brief Truncated-Newton (TN) optimizer front end.
 *
 * The class owns an Opt_CG instance that is used as the inner linear solver;
 * Hessian-vector products are obtained in next_direct() by finite differences
 * of a user-supplied gradient function.
 */
class Opt_TN
{
  public:
    /// Store the machine epsilon of double, used later to size the finite-difference step.
    Opt_TN() : mach_prec_(std::numeric_limits<double>::epsilon())
    {
    }

    ~Opt_TN()
    {
    }

    /**
     * @brief Record the problem size and forward it to the inner CG solver.
     * @param nx length of the solution array x
     */
    void allocate(int nx)
    {
        this->nx_ = nx;
        this->cg_.allocate(nx);
    }

    /**
     * @brief Set the weight applied to inner products, here and in the inner CG solver.
     * @param dV factor multiplied onto every dot product
     */
    void set_para(double dV)
    {
        this->dV_ = dV;
        this->cg_.set_para(dV);
    }

    /**
     * @brief Reset the iteration counter and refresh the inner CG solver.
     * @param nx_new new length of x; 0 keeps the current length
     */
    void refresh(int nx_new = 0)
    {
        this->iter_ = 0;
        if (nx_new != 0)
        {
            this->nx_ = nx_new;
        }
        // nx_new is forwarded unchanged, so cg_ sees the same "0 means keep" convention.
        this->cg_.refresh(nx_new);
    }

    /**
     * @brief Compute the next TN optimization direction (defined below the class).
     *
     * @param px            current x
     * @param pgradient     df(x)/dx at px
     * @param flag          on return, tells why the inner CG loop stopped:
     *                      0 residual dropped below the relative threshold,
     *                      1 CG iteration limit exceeded,
     *                      2 residual stagnated,
     *                      -1 / -2 the inner solver reported a non-positive-definite Hessian
     * @param rdirect       on return, the next optimization direction
     * @param t             object of class T that provides the gradient function
     * @param p_calGradient member function of T that evaluates the gradient at a given x
     */
    template <class T>
    void next_direct(double* px,
                     double* pgradient,
                     int& flag,
                     double* rdirect,
                     T* t,
                     void (T::*p_calGradient)(double* ptemp_x, double* rtemp_gradient));

    /// @return number of next_direct() calls completed since the last refresh()
    int get_iter()
    {
        return this->iter_;
    }

  private:
    Opt_CG cg_;      // inner CG solver
    double dV_ = 1.; // weight multiplied onto inner products

    int nx_ = 0;            // length of the solution array x
    int iter_ = 0;          // number of the iteration
    double mach_prec_ = 0.; // machine precision

    /// Local weighted dot product: dV_ * sum_i pa[i] * pb[i] over `length` entries.
    double inner_product(double* pa, double* pb, int length)
    {
        return BlasConnector::dot(length, pa, 1, pb, 1) * this->dV_;
    }

    /**
     * @brief Finite-difference step length used to approximate Hessian * direction.
     *
     * epsilon = 2 * sqrt(mach_prec_) * (1 + |x|) / |d|, where both squared norms
     * are passed through Parallel_Reduce::reduce_all before the square root is taken.
     *
     * @param px            current x
     * @param pcg_direction current CG direction d
     */
    double get_epsilon(double* px, double* pcg_direction)
    {
        double x_norm2 = this->inner_product(px, px, this->nx_);
        Parallel_Reduce::reduce_all(x_norm2);

        double d_norm2 = this->inner_product(pcg_direction, pcg_direction, this->nx_);
        Parallel_Reduce::reduce_all(d_norm2);

        const double scaled_x = 2 * sqrt(this->mach_prec_) * (1 + sqrt(x_norm2));
        return scaled_x / sqrt(d_norm2);
    }
};


/**
 * @brief Compute the next Truncated-Newton optimization direction.
 *
 * An inner CG loop (cg_) is run with right-hand side b = -gradient. The
 * Hessian-vector product needed by CG is approximated by a forward difference
 * of the user-supplied gradient:
 *     H * d ~= (g(x + epsilon * d) - g(x)) / epsilon.
 * The accumulated CG steps are written to rdirect.
 *
 * @param px            current x (length nx_)
 * @param pgradient     df(x)/dx at px (length nx_)
 * @param flag          on return, the reason the inner loop stopped:
 *                       0  current residual < 0.1 * initial residual
 *                       1  more than 50 CG iterations
 *                       2  relative residual change < 0.01 after more than 9 iterations
 *                      -1  cg_.step_length reported ifPD == -1 (non-positive-definite
 *                          Hessian at the first CG iteration); the step is still applied
 *                      -2  cg_.step_length reported ifPD == -2 (non-positive-definite
 *                          Hessian at a later CG iteration); the step is discarded
 * @param rdirect       output, next optimization direction (length nx_); zeroed on entry
 * @param t             object whose member function evaluates the gradient
 * @param p_calGradient member function of T: (x, out_gradient)
 */
template <class T>
void Opt_TN::next_direct(double* px,
                         double* pgradient,
                         int& flag,
                         double* rdirect,
                         T* t,
                         void (T::*p_calGradient)(double* px, double* rgradient))
{
    // Truncation thresholds of the inner CG loop.
    const double residual_drop_ratio = 0.1; // cond. 0: curr < ratio * init
    const int max_cg_iter = 50;             // cond. 1: cg_iter > max
    const double stagnation_ratio = 0.01;   // cond. 2: |curr - last| / curr < ratio ...
    const int min_stagnation_iter = 9;      //          ... and cg_iter > min

    // rdirect accumulates the CG steps, so it has to start from zero.
    ModuleBase::GlobalFunc::ZEROS(rdirect, this->nx_);

    // Scratch buffers are owned by unique_ptr so that they are released on every
    // exit path, including an exception escaping the gradient callback.
    // The trailing () value-initializes (zeroes) the arrays.
    const std::unique_ptr<double[]> minus_gradient(new double[this->nx_]);  // b = -g, right-hand side of CG
    const std::unique_ptr<double[]> temp_x(new double[this->nx_]());        // x + epsilon * cg_direct
    const std::unique_ptr<double[]> temp_gradient(new double[this->nx_]()); // df(temp_x)/dx
    const std::unique_ptr<double[]> cg_direct(new double[this->nx_]());     // current CG direction
    const std::unique_ptr<double[]> temp_Hcgd(new double[this->nx_]());     // Hessian * cg_direct

    for (int i = 0; i < this->nx_; ++i)
    {
        minus_gradient[i] = -pgradient[i];
    }

    cg_.refresh(0, minus_gradient.get());
    int cg_iter = 0;
    int cg_ifPD = 0;

    double epsilon = 0.;       // step length in interpolation
    double cg_alpha = 0.;      // step length got by CG
    double init_residual = 0.; // initial residual of CG
    double last_residual = 0.; // last residual of CG
    double curr_residual = 0.; // current residual of CG

    while (true)
    {
        // temp_Hcgd holds H * d of the previous iteration (all zeros on the first pass).
        cg_.next_direct(temp_Hcgd.get(), 0, cg_direct.get());

        // Approximate H * cg_direct by a forward difference of the gradient.
        epsilon = this->get_epsilon(px, cg_direct.get());
        for (int i = 0; i < this->nx_; ++i)
        {
            temp_x[i] = px[i] + epsilon * cg_direct[i];
        }
        (t->*p_calGradient)(temp_x.get(), temp_gradient.get());
        for (int i = 0; i < this->nx_; ++i)
        {
            temp_Hcgd[i] = (temp_gradient[i] - pgradient[i]) / epsilon;
        }

        // Get the CG step length; cg_ifPD reports loss of positive definiteness.
        cg_alpha = cg_.step_length(temp_Hcgd.get(), cg_direct.get(), cg_ifPD);
        if (cg_ifPD == -2)
        {
            // Not positive definite after the first CG iteration:
            // keep the direction accumulated so far and drop this step.
            flag = -2;
            break;
        }

        for (int i = 0; i < this->nx_; ++i)
        {
            rdirect[i] += cg_alpha * cg_direct[i];
        }

        if (cg_ifPD == -1)
        {
            // Not positive definite at the first CG iteration:
            // the step just applied is the whole direction.
            flag = -1;
            break;
        }

        // Store residuals used in the truncation conditions.
        last_residual = curr_residual;
        curr_residual = cg_.get_residual();
        cg_iter = cg_.get_iter();
        if (cg_iter == 1)
        {
            init_residual = curr_residual;
        }

        // Check the truncation conditions.
        if (curr_residual < residual_drop_ratio * init_residual)
        {
            flag = 0;
            break;
        }
        else if (cg_iter > max_cg_iter)
        {
            flag = 1;
            break;
        }
        else if (cg_iter > min_stagnation_iter
                 && (std::fabs(curr_residual - last_residual) / curr_residual) < stagnation_ratio)
        {
            flag = 2;
            break;
        }
    }

    this->iter_++;
}


} // namespace ModuleBase

#endif

BlasConnector::dot
static float dot(const int n, const float *const X, const int incX, const float *const Y, const int incY, base_device::AbacusDevice_t device_type=base_device::AbacusDevice_t::CpuDevice)
Definition blas_connector_vector.cpp:142

ModuleBase::Opt_CG
A class designed to deal with optimization problems with CG method. Three forms of CG methods have be...
Definition opt_CG.h:25

ModuleBase::Opt_CG::allocate
void allocate(int nx)
Allocate the space for pdirect_old and pgradient_old.
Definition opt_CG.cpp:36

ModuleBase::Opt_CG::get_residual
double get_residual()
Definition opt_CG.h:48

ModuleBase::Opt_CG::get_iter
int get_iter()
Definition opt_CG.h:52

ModuleBase::Opt_CG::next_direct
void next_direct(double *pgradient, int label, double *rdirect)
Get the next optimization direction.
Definition opt_CG.cpp:85

ModuleBase::Opt_CG::refresh
void refresh(int nx_new=0, double *pinp_b=nullptr)
Refresh the class. If nx changes, reallocate space. If b is provided, initialize it.
Definition opt_CG.cpp:59

ModuleBase::Opt_CG::set_para
void set_para(double dV)
Definition opt_CG.cpp:47

ModuleBase::Opt_CG::step_length
double step_length(double *pAd, double *pdirect, int &ifPD)
Get the step length, only work for standard CG.
Definition opt_CG.cpp:131

ModuleBase::Opt_TN
A class designed to deal with optimization problems with Truncated-Newton (TN) method....
Definition opt_TN.hpp:22

ModuleBase::Opt_TN::cg_
Opt_CG cg_
Definition opt_TN.hpp:81

ModuleBase::Opt_TN::get_epsilon
double get_epsilon(double *px, double *pcg_direction)
Get epsilon used in interpolation. epsilon = 2*sqrt(mach_prec_) * (1+|x|) / |d|, where |v| denotes the modulus (norm) of v.
Definition opt_TN.hpp:103

ModuleBase::Opt_TN::next_direct
void next_direct(double *px, double *pgradient, int &flag, double *rdirect, T *t, void(T::*p_calGradient)(double *ptemp_x, double *rtemp_gradient))

ModuleBase::Opt_TN::dV_
double dV_
Definition opt_TN.hpp:82

ModuleBase::Opt_TN::inner_product
double inner_product(double *pa, double *pb, int length)
Definition opt_TN.hpp:88

ModuleBase::Opt_TN::nx_
int nx_
Definition opt_TN.hpp:84

ModuleBase::Opt_TN::~Opt_TN
~Opt_TN()
Definition opt_TN.hpp:28

ModuleBase::Opt_TN::refresh
void refresh(int nx_new=0)
Refresh the class. If nx changes, reallocate space in cg_.
Definition opt_TN.hpp:53

ModuleBase::Opt_TN::Opt_TN
Opt_TN()
Definition opt_TN.hpp:24

ModuleBase::Opt_TN::get_iter
int get_iter()
Definition opt_TN.hpp:75

ModuleBase::Opt_TN::mach_prec_
double mach_prec_
Definition opt_TN.hpp:86

ModuleBase::Opt_TN::allocate
void allocate(int nx)
Allocate the space for the arrays in cg_.
Definition opt_TN.hpp:35

ModuleBase::Opt_TN::set_para
void set_para(double dV)
Definition opt_TN.hpp:41

ModuleBase::Opt_TN::iter_
int iter_
Definition opt_TN.hpp:85

T
#define T
Definition exp.cpp:237

ModuleBase::GlobalFunc::ZEROS
void ZEROS(std::complex< T > *u, const TI n)
Definition global_function.h:109

ModuleBase
Definition array_pool.h:6

Parallel_Reduce::reduce_all
void reduce_all(T &object)
reduce in all process
Definition depend_mock.cpp:14

opt_CG.h