abacus-develop/math__kernel__op_8h_source.html

// TODO: This is a temporary location for these functions;

// they will be moved to a global module (module base) later.

#ifndef MODULE_HSOLVER_MATH_KERNEL_H

#define MODULE_HSOLVER_MATH_KERNEL_H


#include "source_base/macros.h"


#include "source_base/parallel_reduce.h"


#include "source_base/module_device/memory_op.h"

#include "source_base/module_device/types.h"


#if defined(__CUDA) || defined(__UT_USE_CUDA)

#include <cuda_runtime.h>


#include "cublas_v2.h"

#endif //__CUDA || __UT_USE_CUDA


namespace ModuleBase {


//---------------------------------------------------------------------------------

//-----------------------------0. Tool Functions-----------------------------------

//---------------------------------------------------------------------------------


// Discards the imaginary part of a double-precision complex number.
// Returns a complex value whose real part equals x.real() and whose
// imaginary part is zero.
inline std::complex<double> set_real_tocomplex(const std::complex<double> &x)
{
    const double real_part = x.real();
    return std::complex<double>(real_part, 0.0);
}


// Discards the imaginary part of a single-precision complex number.
// Returns a complex value whose real part equals x.real() and whose
// imaginary part is zero.
inline std::complex<float> set_real_tocomplex(const std::complex<float> &x)
{
    const float real_part = x.real();
    return std::complex<float>(real_part, 0.0f);
}


// Real-valued (double) overload: there is no imaginary part to discard,
// so the argument is returned unchanged, by value.
inline double set_real_tocomplex(const double &x)
{
    return x;
}


// Real-valued (float) overload: there is no imaginary part to discard,
// so the argument is returned unchanged, by value.
inline float set_real_tocomplex(const float &x)
{
    return x;
}


// Complex conjugate of a double-precision complex number: keeps the real
// part and negates the imaginary part.
inline std::complex<double> get_conj(const std::complex<double> &x)
{
    const double re = x.real();
    const double negated_im = -x.imag();
    return std::complex<double>(re, negated_im);
}


// Complex conjugate of a single-precision complex number: keeps the real
// part and negates the imaginary part.
inline std::complex<float> get_conj(const std::complex<float> &x)
{
    const float re = x.real();
    const float negated_im = -x.imag();
    return std::complex<float>(re, negated_im);
}


// Real-valued (double) overload: a real number is its own conjugate, so the
// argument is returned unchanged, by value.
inline double get_conj(const double &x)
{
    return x;
}


// Real-valued (float) overload: a real number is its own conjugate, so the
// argument is returned unchanged, by value.
inline float get_conj(const float &x)
{
    return x;
}


//---------------------------------------------------------------------------------

//-----------------------------1. Vector Operations--------------------------------

//---------------------------------------------------------------------------------


// Functor for scaling a complex vector: x = alpha * x, where alpha and x are
// complex numbers. Only the call operator's declaration is given here.
//
// Template parameters:
//   FPTYPE - floating-point type underlying std::complex<FPTYPE>
//   Device - device tag type used to select an implementation
template <typename FPTYPE, typename Device>
struct scal_op
{
    // N     - element count (presumably the number of entries of X to scale)
    // alpha - pointer to the complex scaling factor
    // X     - complex vector that receives the scaled values
    // incx  - presumably the BLAS-style stride between elements of X - TODO confirm
    void operator()(const int& N,
                    const std::complex<FPTYPE>* alpha,
                    std::complex<FPTYPE>* X,
                    const int& incx);
};


// Functor for multiplying a vector by a real constant:
// result[i] = vector[i] * constant.
// Only the call operator's declaration is given here.
template <typename T, typename Device>
struct vector_mul_real_op
{
    // Real type associated with T via GetTypeReal.
    using Real = typename GetTypeReal<T>::type;

    // dim      - number of elements (taken by value, unlike sibling functors)
    // result   - output array
    // vector   - input array
    // constant - real multiplier
    void operator()(const int dim,
                    T* result,
                    const T* vector,
                    const Real constant);
};


// vector operator: result[i] = vector1[i](complex) * vector2[i](not complex)


// Functor for element-wise multiplication of a (possibly complex) vector by a
// real vector: result[i] = vector1[i] * vector2[i].
// Only the call operator's declaration is given here.
template <typename T, typename Device>
struct vector_mul_vector_op
{
    // Real type associated with T via GetTypeReal.
    using Real = typename GetTypeReal<T>::type;

    // dim     - number of elements
    // result  - output array
    // vector1 - input array of T
    // vector2 - input array of Real
    // add     - defaults to false; presumably accumulates into result when
    //           true instead of overwriting it - TODO confirm
    void operator()(const int& dim,
                    T* result,
                    const T* vector1,
                    const Real* vector2,
                    const bool& add = false);
};


// vector operator: result[i] = vector[i] / constant


// Functor for dividing a vector by a real constant:
// result[i] = vector[i] / constant.
// Only the call operator's declaration is given here.
template <typename T, typename Device>
struct vector_div_constant_op
{
    // Real type associated with T via GetTypeReal.
    using Real = typename GetTypeReal<T>::type;

    // dim      - number of elements
    // result   - output array
    // vector   - input array
    // constant - real divisor
    void operator()(const int& dim,
                    T* result,
                    const T* vector,
                    const Real constant);
};


// vector operator: result[i] = vector1[i](complex) / vector2[i](not complex)


// Functor for element-wise division of a (possibly complex) vector by a real
// vector: result[i] = vector1[i] / vector2[i].
// Only the call operator's declaration is given here.
template <typename T, typename Device>
struct vector_div_vector_op
{
    // Real type associated with T via GetTypeReal.
    using Real = typename GetTypeReal<T>::type;

    // dim     - number of elements
    // result  - output array
    // vector1 - numerator array of T
    // vector2 - denominator array of Real
    void operator()(const int& dim,
                    T* result,
                    const T* vector1,
                    const Real* vector2);
};


//  compute Y = alpha * X + Y


// Functor computing Y = alpha * X + Y.
// Only the call operator's declaration is given here.
template <typename T, typename Device>
struct axpy_op
{
    // N     - element count
    // alpha - pointer to the scalar multiplier
    // X     - input vector
    // incX  - presumably the BLAS-style stride of X - TODO confirm
    // Y     - vector that is both input and output
    // incY  - presumably the BLAS-style stride of Y - TODO confirm
    void operator()(const int& N,
                    const T* alpha,
                    const T* X,
                    const int& incX,
                    T* Y,
                    const int& incY);
};


// vector operator: result[i] = vector1[i] * constant1 + vector2[i] * constant2

// Functor computing a linear combination of two vectors with real weights:
// result[i] = vector1[i] * constant1 + vector2[i] * constant2.
// Only the call operator's declaration is given here.
template <typename T, typename Device>
struct vector_add_vector_op
{
    // Real type associated with T via GetTypeReal.
    using Real = typename GetTypeReal<T>::type;

    // dim       - number of elements
    // result    - output array
    // vector1   - first input array
    // constant1 - real weight applied to vector1
    // vector2   - second input array
    // constant2 - real weight applied to vector2
    void operator()(const int& dim,
                    T* result,
                    const T* vector1,
                    const Real constant1,
                    const T* vector2,
                    const Real constant2);
};


// Functor computing the dot product of two arrays and returning a real value;
// for complex T the arrays are treated as arrays of real numbers.
// Only the call operator's declaration is given here.
template <typename T, typename Device>
struct dot_real_op
{
    // Real type associated with T via GetTypeReal; also the return type.
    using Real = typename GetTypeReal<T>::type;

    // dim    - number of elements of T in each array
    // psi_L  - left operand
    // psi_R  - right operand
    // reduce - defaults to true; presumably requests a reduction of the
    //          result across processes - TODO confirm against the definition
    Real operator()(const int& dim,
                    const T* psi_L,
                    const T* psi_R,
                    const bool reduce = true);
};


//---------------------------------------------------------------------------------

//-----------------------------2. Matrix Operations--------------------------------

//---------------------------------------------------------------------------------


// compute y = alpha * op(A) * x + beta * y


// Functor for the matrix-vector product y = alpha * op(A) * x + beta * y.
// Only the call operator's declaration is given here.
template <typename T, typename Device>
struct gemv_op
{
    // trans - character selecting op(A) (presumably BLAS 'N'/'T'/'C') - TODO confirm
    // m, n  - matrix dimensions of A
    // alpha - pointer to the scalar applied to op(A) * x
    // A     - input matrix
    // lda   - leading dimension of A
    // X     - input vector
    // incx  - presumably the stride of X - TODO confirm
    // beta  - pointer to the scalar applied to the incoming Y
    // Y     - vector that is both input and output
    // incy  - presumably the stride of Y - TODO confirm
    void operator()(const char& trans,
                    const int& m,
                    const int& n,
                    const T* alpha,
                    const T* A,
                    const int& lda,
                    const T* X,
                    const int& incx,
                    const T* beta,
                    T* Y,
                    const int& incy);
};


// compute C = alpha * op(A) * op(B) + beta * C


// Functor for the matrix-matrix product C = alpha * op(A) * op(B) + beta * C.
// Only the call operator's declaration is given here.
template <typename T, typename Device>
struct gemm_op
{
    // transa, transb - characters selecting op(A) and op(B)
    //                  (presumably BLAS 'N'/'T'/'C') - TODO confirm
    // m, n, k        - problem dimensions
    // alpha          - pointer to the scalar applied to op(A) * op(B)
    // a, lda         - input matrix A and its leading dimension
    // b, ldb         - input matrix B and its leading dimension
    // beta           - pointer to the scalar applied to the incoming C
    // c, ldc         - input/output matrix C and its leading dimension
    void operator()(const char& transa,
                    const char& transb,
                    const int& m,
                    const int& n,
                    const int& k,
                    const T* alpha,
                    const T* a,
                    const int& lda,
                    const T* b,
                    const int& ldb,
                    const T* beta,
                    T* c,
                    const int& ldc);
};


#ifdef __DSP

// compute C = alpha * op(A) * op(B) + beta * C on DSP Hardware

// Functor for C = alpha * op(A) * op(B) + beta * C on DSP hardware.
// The parameter list mirrors gemm_op; only the declaration is given here.
template <typename T, typename Device>
struct gemm_op_mt
{
    // transa, transb - characters selecting op(A) and op(B)
    // m, n, k        - problem dimensions
    // alpha          - pointer to the scalar applied to op(A) * op(B)
    // a, lda         - input matrix A and its leading dimension
    // b, ldb         - input matrix B and its leading dimension
    // beta           - pointer to the scalar applied to the incoming C
    // c, ldc         - input/output matrix C and its leading dimension
    void operator()(const char& transa,
                    const char& transb,
                    const int& m,
                    const int& n,
                    const int& k,
                    const T* alpha,
                    const T* a,
                    const int& lda,
                    const T* b,
                    const int& ldb,
                    const T* beta,
                    T* c,
                    const int& ldc);
};

#endif


// Functor that transposes the input matrix into the output matrix.
// Only the call operator's declaration is given here.
template <typename T, typename Device>
struct matrixTranspose_op
{
    // row, col      - dimensions of the input matrix
    // input_matrix  - matrix to transpose (read-only)
    // output_matrix - destination for the transposed matrix
    void operator()(const int& row,
                    const int& col,
                    const T* input_matrix,
                    T* output_matrix);
};


// Functor that copies matrix A to matrix B; the two matrices may have
// different leading dimensions.
// Only the call operator's declaration is given here.
template <typename T, typename Device>
struct matrixCopy
{
    // n1, n2 - extents of the region to copy (which one counts rows and which
    //          counts columns is not visible here - TODO confirm)
    // A, LDA - source matrix and its leading dimension
    // B, LDB - destination matrix and its leading dimension
    void operator()(const int& n1,
                    const int& n2,
                    const T* A,
                    const int& LDA,
                    T* B,
                    const int& LDB);
};


// Functor that combines matrix a with the real vector b and the real scalar
// alpha, writing to matrix c. The generated documentation describes it as
// "a * b * beta by each column"; the exact formula is not visible in this
// header - TODO confirm against the definition.
template <typename T, typename Device>
struct matrix_mul_vector_op
{
    // Real type associated with T via GetTypeReal.
    using Real = typename GetTypeReal<T>::type;

    // m, n   - matrix dimensions
    // a, lda - matrix a (non-const pointer) and its leading dimension
    // b      - real vector
    // alpha  - real scalar
    // c, ldc - matrix c (non-const pointer) and its leading dimension
    void operator()(const int& m,
                    const int& n,
                    T* a,
                    const int& lda,
                    const Real* b,
                    const Real alpha,
                    T* c,
                    const int& ldc);
};


// Functor that writes to `result` using `vectors` and real `eigenvalues`.
// NOTE(review): the comment above the GPU specialization suggests
// result[i] = -lambda[i] * vector[i]; confirm against the definition.
// Only the call operator's declaration is given here.
template <typename T, typename Device>
struct apply_eigenvalues_op
{
    // Real type associated with T via GetTypeReal.
    using Real = typename GetTypeReal<T>::type;

    // d           - device tag pointer
    // nbase       - size parameter (meaning not visible here - TODO confirm)
    // nbase_x     - size parameter, presumably a leading dimension - TODO confirm
    // notconv     - presumably the number of not-yet-converged vectors - TODO confirm
    // result      - output array
    // vectors     - input array
    // eigenvalues - real input array
    void operator()(const Device* d,
                    const int& nbase,
                    const int& nbase_x,
                    const int& notconv,
                    T* result,
                    const T* vectors,
                    const Real* eigenvalues);
};


// Functor that modifies psi_iter using real `precondition` and `eigenvalues`
// arrays. The exact formula is not visible in this header - TODO confirm
// against the definition. Only the call operator's declaration is given here.
template <typename T, typename Device>
struct precondition_op
{
    // Real type associated with T via GetTypeReal.
    using Real = typename GetTypeReal<T>::type;

    // d            - device tag pointer
    // dim          - presumably the length of each vector - TODO confirm
    // psi_iter     - array that is read and written
    // nbase        - size/offset parameter (meaning not visible here)
    // notconv      - presumably the number of not-yet-converged vectors
    // precondition - real input array
    // eigenvalues  - real input array
    void operator()(const Device* d,
                    const int& dim,
                    T* psi_iter,
                    const int& nbase,
                    const int& notconv,
                    const Real* precondition,
                    const Real* eigenvalues);
};


// Functor that operates on psi_iter and can report values through the
// optional psi_norm output. Presumably normalizes the vectors held in
// psi_iter - TODO confirm against the definition.
// Only the call operator's declaration is given here.
template <typename T, typename Device>
struct normalize_op
{
    // Real type associated with T via GetTypeReal.
    using Real = typename GetTypeReal<T>::type;

    // d        - device tag pointer
    // dim      - presumably the length of each vector - TODO confirm
    // psi_iter - array that is read and written
    // nbase    - size/offset parameter (meaning not visible here)
    // notconv  - presumably the number of not-yet-converged vectors
    // psi_norm - optional real output array; defaults to nullptr
    void operator()(const Device* d,
                    const int& dim,
                    T* psi_iter,
                    const int& nbase,
                    const int& notconv,
                    Real* psi_norm = nullptr);
};


// Partial specialization of normalize_op for base_device::DEVICE_GPU.
// NOTE(review): psi_norm has no default argument here, whereas the primary
// template defaults it to nullptr; confirm whether this is intentional.
// NOTE(review): this specialization is declared outside the CUDA/ROCm
// preprocessor guard used for the other GPU specializations - confirm.
template <typename T>
struct normalize_op<T, base_device::DEVICE_GPU>
{
    // Real type associated with T via GetTypeReal.
    using Real = typename GetTypeReal<T>::type;

    // d        - GPU device tag pointer
    // dim      - presumably the length of each vector - TODO confirm
    // psi_iter - array that is read and written
    // nbase    - size/offset parameter (meaning not visible here)
    // notconv  - presumably the number of not-yet-converged vectors
    // psi_norm - real output array (must be passed explicitly)
    void operator()(const base_device::DEVICE_GPU* d,
                    const int& dim,
                    T* psi_iter,
                    const int& nbase,
                    const int& notconv,
                    Real* psi_norm);
};


#if __CUDA || __UT_USE_CUDA || __ROCM || __UT_USE_ROCM

// Partially specialize functor for base_device::GpuDevice.

// Partial specialization of dot_real_op for base_device::DEVICE_GPU.
// Same call signature as the primary template; declaration only.
template <typename T>
struct dot_real_op<T, base_device::DEVICE_GPU>
{
    // Real type associated with T via GetTypeReal; also the return type.
    using Real = typename GetTypeReal<T>::type;

    // dim    - number of elements of T in each array
    // psi_L  - left operand
    // psi_R  - right operand
    // reduce - defaults to true; presumably requests a cross-process
    //          reduction of the result - TODO confirm
    Real operator()(const int& dim,
                    const T* psi_L,
                    const T* psi_R,
                    const bool reduce = true);
};


// vector operator: result[i] = vector[i] * constant

// Partial specialization of vector_mul_real_op for base_device::DEVICE_GPU:
// result[i] = vector[i] * constant. Declaration only.
template <typename T>
struct vector_mul_real_op<T, base_device::DEVICE_GPU>
{
    // Real type associated with T via GetTypeReal.
    using Real = typename GetTypeReal<T>::type;

    // dim      - number of elements (taken by value)
    // result   - output array
    // vector   - input array
    // constant - real multiplier
    void operator()(const int dim,
                    T* result,
                    const T* vector,
                    const Real constant);
};


// vector operator: result[i] = vector1[i](complex) * vector2[i](not complex)

// Partial specialization of vector_mul_vector_op for base_device::DEVICE_GPU:
// result[i] = vector1[i] * vector2[i], with vector2 real. Declaration only.
template <typename T>
struct vector_mul_vector_op<T, base_device::DEVICE_GPU>
{
    // Real type associated with T via GetTypeReal.
    using Real = typename GetTypeReal<T>::type;

    // dim     - number of elements
    // result  - output array
    // vector1 - input array of T
    // vector2 - input array of Real
    // add     - defaults to false; presumably accumulates into result when
    //           true - TODO confirm
    void operator()(const int& dim,
                    T* result,
                    const T* vector1,
                    const Real* vector2,
                    const bool& add = false);
};


// vector operator: result[i] = vector[i] / constant

// Partial specialization of vector_div_constant_op for
// base_device::DEVICE_GPU: result[i] = vector[i] / constant. Declaration only.
template <typename T>
struct vector_div_constant_op<T, base_device::DEVICE_GPU>
{
    // Real type associated with T via GetTypeReal.
    using Real = typename GetTypeReal<T>::type;

    // dim      - number of elements
    // result   - output array
    // vector   - input array
    // constant - real divisor
    void operator()(const int& dim,
                    T* result,
                    const T* vector,
                    const Real constant);
};


// vector operator: result[i] = vector1[i](complex) / vector2[i](not complex)

// Partial specialization of vector_div_vector_op for base_device::DEVICE_GPU:
// result[i] = vector1[i] / vector2[i], with vector2 real. Declaration only.
template <typename T>
struct vector_div_vector_op<T, base_device::DEVICE_GPU>
{
    // Real type associated with T via GetTypeReal.
    using Real = typename GetTypeReal<T>::type;

    // dim     - number of elements
    // result  - output array
    // vector1 - numerator array of T
    // vector2 - denominator array of Real
    void operator()(const int& dim,
                    T* result,
                    const T* vector1,
                    const Real* vector2);
};


// vector operator: result[i] = vector1[i] * constant1 + vector2[i] * constant2

// Partial specialization of vector_add_vector_op for base_device::DEVICE_GPU:
// result[i] = vector1[i] * constant1 + vector2[i] * constant2.
// Declaration only.
template <typename T>
struct vector_add_vector_op<T, base_device::DEVICE_GPU>
{
    // Real type associated with T via GetTypeReal.
    using Real = typename GetTypeReal<T>::type;

    // dim       - number of elements
    // result    - output array
    // vector1   - first input array
    // constant1 - real weight applied to vector1
    // vector2   - second input array
    // constant2 - real weight applied to vector2
    void operator()(const int& dim,
                    T* result,
                    const T* vector1,
                    const Real constant1,
                    const T* vector2,
                    const Real constant2);
};


// Partial specialization of matrixCopy for base_device::DEVICE_GPU: copies
// matrix A (input) to matrix B (output). Declaration only.
template <typename T>
struct matrixCopy<T, base_device::DEVICE_GPU>
{
    // n1, n2 - extents of the region to copy (row/column roles not visible
    //          here - TODO confirm)
    // A, LDA - input matrix and its leading dimension
    // B, LDB - output matrix and its leading dimension
    void operator()(const int& n1, const int& n2,
                    const T* A, const int& LDA,
                    T* B, const int& LDB);
};


// Partial specialization of matrix_mul_vector_op for base_device::DEVICE_GPU.
// Same call signature as the primary template; the exact formula is not
// visible in this header - TODO confirm against the definition.
template <typename T>
struct matrix_mul_vector_op<T, base_device::DEVICE_GPU>
{
    // Real type associated with T via GetTypeReal.
    using Real = typename GetTypeReal<T>::type;

    // m, n   - matrix dimensions
    // a, lda - matrix a (non-const pointer) and its leading dimension
    // b      - real vector
    // alpha  - real scalar
    // c, ldc - matrix c (non-const pointer) and its leading dimension
    void operator()(const int& m, const int& n,
                    T* a, const int& lda,
                    const Real* b,
                    const Real alpha,
                    T* c, const int& ldc);
};


// Declarations of the GPU BLAS handle management routines; the definitions
// are not in this header. Presumably the first creates the handle used by
// the GPU functors and the second releases it - TODO confirm.
void createGpuBlasHandle();
// NOTE(review): "destory" is a misspelling of "destroy"; the name is kept
// as-is because callers depend on it.
void destoryBLAShandle();


// vector operator: result[i] = -lambda[i] * vector[i]

// Partial specialization of apply_eigenvalues_op for base_device::DEVICE_GPU.
// Same parameter list as the primary template, with the device pointer fixed
// to base_device::DEVICE_GPU. Declaration only.
template <typename T>
struct apply_eigenvalues_op<T, base_device::DEVICE_GPU>
{
    // Real type associated with T via GetTypeReal.
    using Real = typename GetTypeReal<T>::type;

    // d           - GPU device tag pointer
    // nbase       - size parameter (meaning not visible here - TODO confirm)
    // nbase_x     - size parameter, presumably a leading dimension - TODO confirm
    // notconv     - presumably the number of not-yet-converged vectors
    // result      - output array
    // vectors     - input array
    // eigenvalues - real input array
    void operator()(const base_device::DEVICE_GPU* d,
                    const int& nbase,
                    const int& nbase_x,
                    const int& notconv,
                    T* result,
                    const T* vectors,
                    const Real* eigenvalues);
};


// Partial specialization of precondition_op for base_device::DEVICE_GPU.
// Same parameter list as the primary template, with the device pointer fixed
// to base_device::DEVICE_GPU. Declaration only.
template <typename T>
struct precondition_op<T, base_device::DEVICE_GPU>
{
    // Real type associated with T via GetTypeReal.
    using Real = typename GetTypeReal<T>::type;

    // d            - GPU device tag pointer
    // dim          - presumably the length of each vector - TODO confirm
    // psi_iter     - array that is read and written
    // nbase        - size/offset parameter (meaning not visible here)
    // notconv      - presumably the number of not-yet-converged vectors
    // precondition - real input array
    // eigenvalues  - real input array
    void operator()(const base_device::DEVICE_GPU* d,
                    const int& dim,
                    T* psi_iter,
                    const int& nbase,
                    const int& notconv,
                    const Real* precondition,
                    const Real* eigenvalues);
};


#endif // __CUDA || __UT_USE_CUDA || __ROCM || __UT_USE_ROCM

} // namespace ModuleBase


#endif // MODULE_HSOLVER_MATH_KERNEL_H

N
#define N
Definition exp.cpp:24

T
#define T
Definition exp.cpp:237

macros.h

memory_op.h

ModuleBase
Definition array_pool.h:6

ModuleBase::set_real_tocomplex
std::complex< double > set_real_tocomplex(const std::complex< double > &x)
Definition math_kernel_op.h:24

ModuleBase::get_conj
std::complex< double > get_conj(const std::complex< double > &x)
Definition math_kernel_op.h:36

base_device
Definition device.cpp:20

parallel_reduce.h

GetTypeReal::type
T type
Definition macros.h:8

ModuleBase::apply_eigenvalues_op
Definition math_kernel_op.h:327

ModuleBase::apply_eigenvalues_op::operator()
void operator()(const Device *d, const int &nbase, const int &nbase_x, const int &notconv, T *result, const T *vectors, const Real *eigenvalues)

ModuleBase::apply_eigenvalues_op::Real
typename GetTypeReal< T >::type Real
Definition math_kernel_op.h:328

ModuleBase::axpy_op
Definition math_kernel_op.h:132

ModuleBase::axpy_op::operator()
void operator()(const int &N, const T *alpha, const T *X, const int &incX, T *Y, const int &incY)
Y = alpha * X + Y.

ModuleBase::dot_real_op
Definition math_kernel_op.h:168

ModuleBase::dot_real_op::Real
typename GetTypeReal< T >::type Real
Definition math_kernel_op.h:169

ModuleBase::dot_real_op::operator()
Real operator()(const int &dim, const T *psi_L, const T *psi_R, const bool reduce=true)
dot_real_op computes the dot product of the given complex arrays(treated as float arrays)....

ModuleBase::gemm_op
Definition math_kernel_op.h:217

ModuleBase::gemm_op::operator()
void operator()(const char &transa, const char &transb, const int &m, const int &n, const int &k, const T *alpha, const T *a, const int &lda, const T *b, const int &ldb, const T *beta, T *c, const int &ldc)
C = alpha * op(A) * op(B) + beta * C.

ModuleBase::gemv_op
Definition math_kernel_op.h:192

ModuleBase::gemv_op::operator()
void operator()(const char &trans, const int &m, const int &n, const T *alpha, const T *A, const int &lda, const T *X, const int &incx, const T *beta, T *Y, const int &incy)
y = alpha * op(A) * x + beta * y

ModuleBase::matrixCopy
Definition math_kernel_op.h:286

ModuleBase::matrixCopy::operator()
void operator()(const int &n1, const int &n2, const T *A, const int &LDA, T *B, const int &LDB)
copy matrix A to B, they can have different leading dimensions

ModuleBase::matrixTranspose_op
Definition math_kernel_op.h:272

ModuleBase::matrixTranspose_op::operator()
void operator()(const int &row, const int &col, const T *input_matrix, T *output_matrix)
transpose the input matrix

ModuleBase::matrix_mul_vector_op
Definition math_kernel_op.h:302

ModuleBase::matrix_mul_vector_op::operator()
void operator()(const int &m, const int &n, T *a, const int &lda, const Real *b, const Real alpha, T *c, const int &ldc)
a * b * beta by each column

ModuleBase::matrix_mul_vector_op::Real
typename GetTypeReal< T >::type Real
Definition math_kernel_op.h:303

ModuleBase::normalize_op< T, base_device::DEVICE_GPU >::operator()
void operator()(const base_device::DEVICE_GPU *d, const int &dim, T *psi_iter, const int &nbase, const int &notconv, Real *psi_norm)

ModuleBase::normalize_op< T, base_device::DEVICE_GPU >::Real
typename GetTypeReal< T >::type Real
Definition math_kernel_op.h:359

ModuleBase::normalize_op
Definition math_kernel_op.h:347

ModuleBase::normalize_op::Real
typename GetTypeReal< T >::type Real
Definition math_kernel_op.h:348

ModuleBase::normalize_op::operator()
void operator()(const Device *d, const int &dim, T *psi_iter, const int &nbase, const int &notconv, Real *psi_norm=nullptr)

ModuleBase::precondition_op
Definition math_kernel_op.h:335

ModuleBase::precondition_op::Real
typename GetTypeReal< T >::type Real
Definition math_kernel_op.h:336

ModuleBase::precondition_op::operator()
void operator()(const Device *d, const int &dim, T *psi_iter, const int &nbase, const int &notconv, const Real *precondition, const Real *eigenvalues)

ModuleBase::scal_op
Definition math_kernel_op.h:52

ModuleBase::scal_op::operator()
void operator()(const int &N, const std::complex< FPTYPE > *alpha, std::complex< FPTYPE > *X, const int &incx)
x = alpha * x, where alpha and x are complex numbers

ModuleBase::vector_add_vector_op
Definition math_kernel_op.h:151

ModuleBase::vector_add_vector_op::operator()
void operator()(const int &dim, T *result, const T *vector1, const Real constant1, const T *vector2, const Real constant2)
result[i] = vector1[i] * constant1 + vector2[i] * constant2

ModuleBase::vector_add_vector_op::Real
typename GetTypeReal< T >::type Real
Definition math_kernel_op.h:152

ModuleBase::vector_div_constant_op
Definition math_kernel_op.h:101

ModuleBase::vector_div_constant_op::Real
typename GetTypeReal< T >::type Real
Definition math_kernel_op.h:102

ModuleBase::vector_div_constant_op::operator()
void operator()(const int &dim, T *result, const T *vector, const Real constant)
result[i] = vector[i] / constant

ModuleBase::vector_div_vector_op
Definition math_kernel_op.h:116

ModuleBase::vector_div_vector_op::operator()
void operator()(const int &dim, T *result, const T *vector1, const Real *vector2)
result[i] = vector1[i](complex) / vector2[i](not complex)

ModuleBase::vector_div_vector_op::Real
typename GetTypeReal< T >::type Real
Definition math_kernel_op.h:117

ModuleBase::vector_mul_real_op
Definition math_kernel_op.h:68

ModuleBase::vector_mul_real_op::operator()
void operator()(const int dim, T *result, const T *vector, const Real constant)
result[i] = vector[i] * constant, where vector is complex number and constant is real number. It is d...

ModuleBase::vector_mul_real_op::Real
typename GetTypeReal< T >::type Real
Definition math_kernel_op.h:69

ModuleBase::vector_mul_vector_op
Definition math_kernel_op.h:85

ModuleBase::vector_mul_vector_op::Real
typename GetTypeReal< T >::type Real
Definition math_kernel_op.h:86

ModuleBase::vector_mul_vector_op::operator()
void operator()(const int &dim, T *result, const T *vector1, const Real *vector2, const bool &add=false)
result[i] = vector1[i](complex) * vector2[i](not complex)

types.h