abacus-develop/diago__bpcg_8h_source.html

#ifndef DIAGO_BPCG_H_

#define DIAGO_BPCG_H_


#include "source_base/kernels/math_kernel_op.h"

#include "source_base/module_device/memory_op.h"

#include "source_base/module_device/types.h"

#include "source_base/para_gemm.h"

#include "source_hamilt/hamilt.h"

#include "source_pw/module_pwdft/structure_factor.h"

#include "source_hsolver/kernels/hegvd_op.h"

#include "source_hsolver/para_linear_transform.h"


#include <ATen/core/tensor.h>

#include <ATen/core/tensor_map.h>

#include <source_base/macros.h>


namespace hsolver {


/// @brief A class for diagonalization using the Blocked-PCG (BPCG) method.
///
/// psi is stored column-major throughout this class.
///
/// @tparam T      element type of the wavefunctions (defaults to std::complex<double>)
/// @tparam Device device tag (defaults to base_device::DEVICE_CPU)
template <typename T = std::complex<double>, typename Device = base_device::DEVICE_CPU>
class DiagoBPCG
{
  private:
    // GetTypeReal<T>::type yields T itself when T is a real type (float, double)
    // and the underlying real type when T is complex
    // (std::complex<float>, std::complex<double>).
    using Real = typename GetTypeReal<T>::type;

  public:
    /// @brief Construct the solver from a preconditioner array.
    /// @param precondition pointer to the preconditioner values
    ///        (NOTE(review): length and ownership are not visible in this header — confirm in diago_bpcg.cpp)
    explicit DiagoBPCG(const Real* precondition);

    /// @brief Destructor for DiagoBPCG class.
    ~DiagoBPCG();

    /// @brief Initialize the class before diagonalization.
    /// @param nband   the number of bands of all processes
    /// @param nband_l the number of bands of current process
    /// @param nbasis  the number of cols of the input psi
    /// @param ndim    valid dimension of psi
    void init_iter(const int nband, const int nband_l, const int nbasis, const int ndim);

    /// @brief Callback that applies the Hamiltonian to a block of wavefunctions.
    /// NOTE(review): the meaning of the two pointer and two int arguments is not
    /// visible in this header — presumably (psi_in, hpsi_out, leading dimension,
    /// number of vectors); confirm against the callers.
    using HPsiFunc = std::function<void(T*, T*, const int, const int)>;

    /// @brief Diagonalize the Hamiltonian using the BPCG method.
    /// @param hpsi_func     callback applying the Hamiltonian operator to psi
    /// @param psi_in        wavefunction buffer
    /// @param eigenvalue_in eigenvalue buffer
    /// @param ethr_band     thresholds used by the convergence test
    ///        (presumably one entry per band — TODO confirm)
    void diag(const HPsiFunc& hpsi_func, T* psi_in, Real* eigenvalue_in, const std::vector<double>& ethr_band);

  private:
    /// the number of bands of all processes
    int n_band = 0;
    /// the number of bands of current process
    int n_band_l = 0;
    /// the number of cols of the input psi
    int n_basis = 0;
    /// valid dimension of psi
    int n_dim = 0;
    /// max iter steps for all-band cg loop
    int nline = 4;
    /// parallel matrix multiplication
    ModuleBase::PGemmCN<T, Device> pmmcn;
    /// parallel linear transform helper
    PLinearTransform<T, Device> plintrans;

    // Data types of Real / T and the device type, as seen by the tensor container;
    // all start out as invalid/unknown.
    ct::DataType r_type = ct::DataType::DT_INVALID;
    ct::DataType t_type = ct::DataType::DT_INVALID;
    ct::DeviceType device_type = ct::DeviceType::UnKnown;

    // Preconditioner tensors
    // (NOTE(review): h_prec is presumably the host-side copy — confirm).
    ct::Tensor prec = {};
    ct::Tensor h_prec = {};

    /// The coefficient for mixing the current and previous step gradients,
    /// used in iterative methods.
    ct::Tensor beta = {};
    /// Error state value; if it is smaller than the given threshold, the iteration exits.
    ct::Tensor err_st = {};
    /// Calculated eigenvalues.
    ct::Tensor eigen = {};

    // Wavefunctions and the result of applying the Hamiltonian to them.
    ct::Tensor psi = {};
    ct::Tensor hpsi = {};

    // Subspace matrix.
    ct::Tensor hsub = {};

    // Current gradient, the Hamiltonian applied to it, and the previous-step gradient.
    ct::Tensor grad = {};
    ct::Tensor hgrad = {};
    ct::Tensor grad_old = {};

    /// Workspace for some calculations within this class, including the rotate_wf call.
    ct::Tensor work = {};

    // These are for hsolver gemm_op use.
    /// ctx is nothing but the device used in gemm_op.
    Device* ctx = nullptr;
    // Pointers to the constants 1, 0 and -1 for gemm.
    const T* one = nullptr;
    const T* zero = nullptr;
    const T* neg_one = nullptr;
    // Value storage for the constants 1, 0 and -1.
    const T one_ = static_cast<T>(1.0);
    const T zero_ = static_cast<T>(0.0);
    const T neg_one_ = static_cast<T>(-1.0);

    /// @brief Update the precondition array.
    void calc_prec();

    /// @brief Apply the H operator to psi and obtain the hpsi matrix.
    /// @param hpsi_func callback applying the Hamiltonian operator
    /// @param psi_in    input wavefunctions
    /// @param hpsi_out  receives H|psi>
    void calc_hpsi_with_block(const HPsiFunc& hpsi_func, T* psi_in, ct::Tensor& hpsi_out);

    /// @brief Diagonalization of the subspace matrix.
    /// @param psi_in         wavefunctions
    /// @param hpsi_in        H|psi>
    /// @param hsub_out       subspace matrix
    /// @param eigenvalue_out eigenvalues
    void diag_hsub(const ct::Tensor& psi_in,
                   const ct::Tensor& hpsi_in,
                   ct::Tensor& hsub_out,
                   ct::Tensor& eigenvalue_out);

    /// @brief Inplace matrix multiplication to obtain the initial guessed wavefunction.
    /// @param hsub_in      subspace matrix
    /// @param psi_out      wavefunctions, updated in place
    /// @param workspace_in scratch tensor
    void rotate_wf(const ct::Tensor& hsub_in, ct::Tensor& psi_out, ct::Tensor& workspace_in);

    /// @brief Calculate the gradient for all bands used in CG method.
    /// @param prec_in      preconditioner
    /// @param err_out      error values
    /// @param beta_out     mixing coefficients
    /// @param psi_in       wavefunctions
    /// @param hpsi_in      H|psi>
    /// @param grad_out     gradient
    /// @param grad_old_out previous-step gradient
    void calc_grad_with_block(const ct::Tensor& prec_in,
                              ct::Tensor& err_out,
                              ct::Tensor& beta_out,
                              ct::Tensor& psi_in,
                              ct::Tensor& hpsi_in,
                              ct::Tensor& grad_out,
                              ct::Tensor& grad_old_out);

    /// @brief Apply the Hamiltonian operator to psi and obtain the hpsi matrix.
    /// @param hpsi_func      callback applying the Hamiltonian operator
    /// @param psi_in         input wavefunctions
    /// @param psi_out        wavefunction tensor
    /// @param hpsi_out       H|psi>
    /// @param hsub_out       subspace matrix
    /// @param workspace_in   scratch tensor
    /// @param eigenvalue_out eigenvalues
    void calc_hsub_with_block(const HPsiFunc& hpsi_func,
                              T* psi_in,
                              ct::Tensor& psi_out,
                              ct::Tensor& hpsi_out,
                              ct::Tensor& hsub_out,
                              ct::Tensor& workspace_in,
                              ct::Tensor& eigenvalue_out);

    /// @brief Overload-like variant of calc_hsub_with_block that takes no
    ///        hpsi_func / psi_in.
    /// NOTE(review): presumably used on the exit path of the iteration — confirm
    /// in diago_bpcg.cpp.
    void calc_hsub_with_block_exit(ct::Tensor& psi_out,
                                   ct::Tensor& hpsi_out,
                                   ct::Tensor& hsub_out,
                                   ct::Tensor& workspace_in,
                                   ct::Tensor& eigenvalue_out);

    /// @brief Orthogonalize column vectors in grad to column vectors in psi.
    /// @param psi_in   wavefunctions
    /// @param hsub_in  subspace matrix (non-const: may be used as scratch — TODO confirm)
    /// @param grad_out gradient, orthogonalized against psi
    void orth_projection(const ct::Tensor& psi_in, ct::Tensor& hsub_in, ct::Tensor& grad_out);

    /// @brief Optimize psi as well as the hpsi.
    /// @param grad_in  gradient
    /// @param hgrad_in Hamiltonian applied to the gradient
    /// @param psi_out  wavefunctions
    /// @param hpsi_out H|psi>
    void line_minimize(ct::Tensor& grad_in, ct::Tensor& hgrad_in, ct::Tensor& psi_out, ct::Tensor& hpsi_out);

    /// @brief Orthogonalize and normalize the column vectors in psi_out using
    ///        Cholesky decomposition.
    /// @param workspace_in scratch tensor
    /// @param psi_out      wavefunctions
    /// @param hpsi_out     H|psi>
    /// @param hsub_out     subspace matrix
    void orth_cholesky(ct::Tensor& workspace_in, ct::Tensor& psi_out, ct::Tensor& hpsi_out, ct::Tensor& hsub_out);

    /// @brief Checks if the error satisfies the given threshold.
    /// @param err_in    error values
    /// @param ethr_band thresholds to compare against
    /// @return result of the threshold check
    ///         (NOTE(review): which outcome maps to true is defined in diago_bpcg.cpp — confirm)
    bool test_error(const ct::Tensor& err_in, const std::vector<double>& ethr_band);

    // Container-side device tag corresponding to Device.
    using ct_Device = typename ct::PsiToContainer<Device>::type;

    // Memory operators for Real-valued buffers.
    using setmem_var_op = ct::kernels::set_memory<Real, ct_Device>;
    using resmem_var_op = ct::kernels::resize_memory<Real, ct_Device>;
    using delmem_var_op = ct::kernels::delete_memory<Real, ct_Device>;
    using syncmem_var_h2d_op = ct::kernels::synchronize_memory<Real, ct_Device, ct::DEVICE_CPU>;
    using syncmem_var_d2h_op = ct::kernels::synchronize_memory<Real, ct::DEVICE_CPU, ct_Device>;

    // Memory operators for T-valued buffers.
    using setmem_complex_op = ct::kernels::set_memory<T, ct_Device>;
    using delmem_complex_op = ct::kernels::delete_memory<T, ct_Device>;
    using resmem_complex_op = ct::kernels::resize_memory<T, ct_Device>;
    using syncmem_complex_op = ct::kernels::synchronize_memory<T, ct_Device, ct_Device>;

    // Note: this operator uses the template parameter base_device::Device_*
    // defined in source_base/module_device/types.h, which is different from ct_Device!
    using gemm_op = ModuleBase::gemm_op<T, Device>;
};


} // namespace hsolver

#endif // DIAGO_BPCG_H_

ModuleBase::PGemmCN
This class is used to perform the parallel matrix multiplication C = alpha * A^H * B + beta * C. Here,...
Definition para_gemm.h:25

container::Tensor
A multi-dimensional array of elements of a single data type.
Definition tensor.h:32

hsolver::DiagoBPCG
A class for diagonalization using the Blocked-PCG method.
Definition diago_bpcg.h:27

hsolver::DiagoBPCG::hpsi
ct::Tensor hpsi
Definition diago_bpcg.h:109

hsolver::DiagoBPCG::n_dim
int n_dim
valid dimension of psi
Definition diago_bpcg.h:85

hsolver::DiagoBPCG::h_prec
ct::Tensor h_prec
Definition diago_bpcg.h:97

hsolver::DiagoBPCG::init_iter
void init_iter(const int nband, const int nband_l, const int nbasis, const int ndim)
Initialize the class before diagonalization.
Definition diago_bpcg.cpp:37

hsolver::DiagoBPCG::calc_hsub_with_block_exit
void calc_hsub_with_block_exit(ct::Tensor &psi_out, ct::Tensor &hpsi_out, ct::Tensor &hsub_out, ct::Tensor &workspace_in, ct::Tensor &eigenvalue_out)
Apply the Hamiltonian operator to psi and obtain the hpsi matrix.
Definition diago_bpcg.cpp:244

hsolver::DiagoBPCG::prec
ct::Tensor prec
Definition diago_bpcg.h:97

hsolver::DiagoBPCG::calc_grad_with_block
void calc_grad_with_block(const ct::Tensor &prec_in, ct::Tensor &err_out, ct::Tensor &beta_out, ct::Tensor &psi_in, ct::Tensor &hpsi_in, ct::Tensor &grad_out, ct::Tensor &grad_old_out)
Calculate the gradient for all bands used in CG method.
Definition diago_bpcg.cpp:137

hsolver::DiagoBPCG::n_basis
int n_basis
the number of cols of the input psi
Definition diago_bpcg.h:83

hsolver::DiagoBPCG::rotate_wf
void rotate_wf(const ct::Tensor &hsub_in, ct::Tensor &psi_out, ct::Tensor &workspace_in)
Inplace matrix multiplication to obtain the initial guessed wavefunction.
Definition diago_bpcg.cpp:180

hsolver::DiagoBPCG::orth_projection
void orth_projection(const ct::Tensor &psi_in, ct::Tensor &hsub_in, ct::Tensor &grad_out)
Orthogonalize column vectors in grad to column vectors in psi.
Definition diago_bpcg.cpp:165

hsolver::DiagoBPCG::zero_
const T zero_
Definition diago_bpcg.h:125

hsolver::DiagoBPCG::setmem_var_op
ct::kernels::set_memory< Real, ct_Device > setmem_var_op
Definition diago_bpcg.h:338

hsolver::DiagoBPCG::~DiagoBPCG
~DiagoBPCG()
Destructor for DiagoBPCG class.
Definition diago_bpcg.cpp:32

hsolver::DiagoBPCG::syncmem_var_d2h_op
ct::kernels::synchronize_memory< Real, ct::DEVICE_CPU, ct_Device > syncmem_var_d2h_op
Definition diago_bpcg.h:342

hsolver::DiagoBPCG::diag_hsub
void diag_hsub(const ct::Tensor &psi_in, const ct::Tensor &hpsi_in, ct::Tensor &hsub_out, ct::Tensor &eigenvalue_out)
Diagonalization of the subspace matrix.
Definition diago_bpcg.cpp:203

hsolver::DiagoBPCG::syncmem_complex_op
ct::kernels::synchronize_memory< T, ct_Device, ct_Device > syncmem_complex_op
Definition diago_bpcg.h:347

hsolver::DiagoBPCG::nline
int nline
max iter steps for all-band cg loop
Definition diago_bpcg.h:87

hsolver::DiagoBPCG::calc_hsub_with_block
void calc_hsub_with_block(const HPsiFunc &hpsi_func, T *psi_in, ct::Tensor &psi_out, ct::Tensor &hpsi_out, ct::Tensor &hsub_out, ct::Tensor &workspace_in, ct::Tensor &eigenvalue_out)
Apply the Hamiltonian operator to psi and obtain the hpsi matrix.
Definition diago_bpcg.cpp:219

hsolver::DiagoBPCG::zero
const T * zero
Definition diago_bpcg.h:124

hsolver::DiagoBPCG::one
const T * one
Definition diago_bpcg.h:124

hsolver::DiagoBPCG::grad
ct::Tensor grad
Definition diago_bpcg.h:115

hsolver::DiagoBPCG::n_band
int n_band
the number of bands of all processes
Definition diago_bpcg.h:79

hsolver::DiagoBPCG::t_type
ct::DataType t_type
Definition diago_bpcg.h:94

hsolver::DiagoBPCG::HPsiFunc
std::function< void(T *, T *, const int, const int)> HPsiFunc
Definition diago_bpcg.h:60

hsolver::DiagoBPCG::resmem_var_op
ct::kernels::resize_memory< Real, ct_Device > resmem_var_op
Definition diago_bpcg.h:339

hsolver::DiagoBPCG::hgrad
ct::Tensor hgrad
Definition diago_bpcg.h:115

hsolver::DiagoBPCG::one_
const T one_
Definition diago_bpcg.h:125

hsolver::DiagoBPCG::n_band_l
int n_band_l
the number of bands of current process
Definition diago_bpcg.h:81

hsolver::DiagoBPCG::ctx
Device * ctx
ctx is nothing but the devices used in gemm_op (Device * ctx = nullptr;),
Definition diago_bpcg.h:122

hsolver::DiagoBPCG::setmem_complex_op
ct::kernels::set_memory< T, ct_Device > setmem_complex_op
Definition diago_bpcg.h:344

hsolver::DiagoBPCG::pmmcn
ModuleBase::PGemmCN< T, Device > pmmcn
parallel matrix multiplication
Definition diago_bpcg.h:89

hsolver::DiagoBPCG::ct_Device
typename ct::PsiToContainer< Device >::type ct_Device
Definition diago_bpcg.h:337

hsolver::DiagoBPCG::diag
void diag(const HPsiFunc &hpsi_func, T *psi_in, Real *eigenvalue_in, const std::vector< double > &ethr_band)
Diagonalize the Hamiltonian using the BPCG method.
Definition diago_bpcg.cpp:262

hsolver::DiagoBPCG::beta
ct::Tensor beta
The coefficient for mixing the current and previous step gradients, used in iterative methods.
Definition diago_bpcg.h:100

hsolver::DiagoBPCG::neg_one_
const T neg_one_
Definition diago_bpcg.h:125

hsolver::DiagoBPCG::calc_hpsi_with_block
void calc_hpsi_with_block(const HPsiFunc &hpsi_func, T *psi_in, ct::Tensor &hpsi_out)
Apply the H operator to psi and obtain the hpsi matrix.
Definition diago_bpcg.cpp:193

hsolver::DiagoBPCG::syncmem_var_h2d_op
ct::kernels::synchronize_memory< Real, ct_Device, ct::DEVICE_CPU > syncmem_var_h2d_op
Definition diago_bpcg.h:341

hsolver::DiagoBPCG::orth_cholesky
void orth_cholesky(ct::Tensor &workspace_in, ct::Tensor &psi_out, ct::Tensor &hpsi_out, ct::Tensor &hsub_out)
Orthogonalize and normalize the column vectors in psi_out using Cholesky decomposition.
Definition diago_bpcg.cpp:114

hsolver::DiagoBPCG::line_minimize
void line_minimize(ct::Tensor &grad_in, ct::Tensor &hgrad_in, ct::Tensor &psi_out, ct::Tensor &hpsi_out)
Optimize psi as well as the hpsi.
Definition diago_bpcg.cpp:96

hsolver::DiagoBPCG::err_st
ct::Tensor err_st
Error state value, if it is smaller than the given threshold, then exit the iteration.
Definition diago_bpcg.h:102

hsolver::DiagoBPCG::delmem_complex_op
ct::kernels::delete_memory< T, ct_Device > delmem_complex_op
Definition diago_bpcg.h:345

hsolver::DiagoBPCG::plintrans
PLinearTransform< T, Device > plintrans
Definition diago_bpcg.h:90

hsolver::DiagoBPCG::eigen
ct::Tensor eigen
Calculated eigenvalues.
Definition diago_bpcg.h:104

hsolver::DiagoBPCG::grad_old
ct::Tensor grad_old
Definition diago_bpcg.h:115

hsolver::DiagoBPCG::r_type
ct::DataType r_type
Definition diago_bpcg.h:93

hsolver::DiagoBPCG::hsub
ct::Tensor hsub
Definition diago_bpcg.h:111

hsolver::DiagoBPCG::test_error
bool test_error(const ct::Tensor &err_in, const std::vector< double > &ethr_band)
Checks if the error satisfies the given threshold.
Definition diago_bpcg.cpp:70

hsolver::DiagoBPCG::neg_one
const T * neg_one
Definition diago_bpcg.h:124

hsolver::DiagoBPCG::resmem_complex_op
ct::kernels::resize_memory< T, ct_Device > resmem_complex_op
Definition diago_bpcg.h:346

hsolver::DiagoBPCG::calc_prec
void calc_prec()
Update the precondition array.
Definition diago_bpcg.cpp:159

hsolver::DiagoBPCG::Real
typename GetTypeReal< T >::type Real
Definition diago_bpcg.h:32

hsolver::DiagoBPCG::delmem_var_op
ct::kernels::delete_memory< Real, ct_Device > delmem_var_op
Definition diago_bpcg.h:340

hsolver::DiagoBPCG::work
ct::Tensor work
work for some calculations within this class, including rotate_wf call
Definition diago_bpcg.h:118

hsolver::DiagoBPCG::device_type
ct::DeviceType device_type
Definition diago_bpcg.h:95

hsolver::PLinearTransform
B = alpha * A * U + beta * B. A and B are local matrices; U can be a local matrix or a global matrix.
Definition para_linear_transform.h:22

tensor.h

T
#define T
Definition exp.cpp:237

hamilt.h

hegvd_op.h

macros.h

math_kernel_op.h

memory_op.h

container::DataType
DataType
Enumeration of data types for tensors. The DataType enum lists the supported data types for tensors....
Definition tensor_types.h:50

container::DeviceType
DeviceType
The type of memory used by an allocator.
Definition tensor_types.h:73

hsolver
Definition diag_comm_info.h:9

psi
Definition exx_lip.h:23

para_gemm.h

para_linear_transform.h

GetTypeReal::type
T type
Definition macros.h:8

ModuleBase::gemm_op
Definition math_kernel_op.h:217

container::PsiToContainer
Definition tensor_types.h:113

structure_factor.h

tensor_map.h

types.h