ABACUS develop
Atomic-orbital Based Ab-initio Computation at UStc
Loading...
Searching...
No Matches
Classes | Functions
perf_math_kernel.cpp File Reference
#include "source_base/constants.h"
#include "source_base/module_device/memory_op.h"
#include "source_base/kernels/math_kernel_op.h"
#include <complex>
#include <benchmark/benchmark.h>
#include <iostream>
#include <cmath>
#include <cstdlib>
#include <chrono>
Include dependency graph for perf_math_kernel.cpp:

Classes

class  PerfModuleHsolverMathKernel
 

Functions

 BENCHMARK_DEFINE_F (PerfModuleHsolverMathKernel, BM_zdot_real_cpu_op)(benchmark::State &)
 
 BENCHMARK_DEFINE_F (PerfModuleHsolverMathKernel, BM_vector_mul_real_op_cpu)(benchmark::State &)
 
 BENCHMARK_DEFINE_F (PerfModuleHsolverMathKernel, BM_vector_mul_vector_op_cpu)(benchmark::State &)
 
 BENCHMARK_DEFINE_F (PerfModuleHsolverMathKernel, BM_vector_div_vector_op_cpu)(benchmark::State &)
 
 BENCHMARK_DEFINE_F (PerfModuleHsolverMathKernel, BM_vector_add_vector_op_cpu)(benchmark::State &)
 
 BENCHMARK_DEFINE_F (PerfModuleHsolverMathKernel, BM_axpy_op_cpu)(benchmark::State &)
 
 BENCHMARK_DEFINE_F (PerfModuleHsolverMathKernel, BM_scal_op_cpu)(benchmark::State &)
 
 BENCHMARK_REGISTER_F (PerfModuleHsolverMathKernel, BM_zdot_real_cpu_op) -> RangeMultiplier(10) ->Range(1, 10e6) ->Unit(benchmark::kMicrosecond)
 
 BENCHMARK_REGISTER_F (PerfModuleHsolverMathKernel, BM_vector_mul_real_op_cpu) -> RangeMultiplier(10) ->Range(1, 10e6) ->Unit(benchmark::kMicrosecond)
 
 BENCHMARK_REGISTER_F (PerfModuleHsolverMathKernel, BM_vector_mul_vector_op_cpu) -> RangeMultiplier(10) ->Range(1, 10e6) ->Unit(benchmark::kMicrosecond)
 
 BENCHMARK_REGISTER_F (PerfModuleHsolverMathKernel, BM_vector_div_vector_op_cpu) -> RangeMultiplier(10) ->Range(1, 10e6) ->Unit(benchmark::kMicrosecond)
 
 BENCHMARK_REGISTER_F (PerfModuleHsolverMathKernel, BM_vector_add_vector_op_cpu) -> RangeMultiplier(10) ->Range(1, 10e6) ->Unit(benchmark::kMicrosecond)
 
 BENCHMARK_REGISTER_F (PerfModuleHsolverMathKernel, BM_axpy_op_cpu) -> RangeMultiplier(10) ->Range(1, 10e6) ->Unit(benchmark::kMicrosecond)
 
 BENCHMARK_REGISTER_F (PerfModuleHsolverMathKernel, BM_scal_op_cpu) -> RangeMultiplier(10) ->Range(1, 10e6) ->Unit(benchmark::kMicrosecond)
 
 BENCHMARK_MAIN ()
 

Function Documentation

◆ BENCHMARK_DEFINE_F() [1/7]

BENCHMARK_DEFINE_F ( PerfModuleHsolverMathKernel  ,
BM_axpy_op_cpu   
)

◆ BENCHMARK_DEFINE_F() [2/7]

BENCHMARK_DEFINE_F ( PerfModuleHsolverMathKernel  ,
BM_scal_op_cpu   
)

◆ BENCHMARK_DEFINE_F() [3/7]

BENCHMARK_DEFINE_F ( PerfModuleHsolverMathKernel  ,
BM_vector_add_vector_op_cpu   
)

◆ BENCHMARK_DEFINE_F() [4/7]

BENCHMARK_DEFINE_F ( PerfModuleHsolverMathKernel  ,
BM_vector_div_vector_op_cpu   
)

◆ BENCHMARK_DEFINE_F() [5/7]

BENCHMARK_DEFINE_F ( PerfModuleHsolverMathKernel  ,
BM_vector_mul_real_op_cpu   
)

◆ BENCHMARK_DEFINE_F() [6/7]

BENCHMARK_DEFINE_F ( PerfModuleHsolverMathKernel  ,
BM_vector_mul_vector_op_cpu   
)

◆ BENCHMARK_DEFINE_F() [7/7]

BENCHMARK_DEFINE_F ( PerfModuleHsolverMathKernel  ,
BM_zdot_real_cpu_op   
)

◆ BENCHMARK_MAIN()

BENCHMARK_MAIN ( )

◆ BENCHMARK_REGISTER_F() [1/7]

BENCHMARK_REGISTER_F ( PerfModuleHsolverMathKernel  ,
BM_axpy_op_cpu   
) -> RangeMultiplier(10) ->Range(1, 10e6) ->Unit(benchmark::kMicrosecond)

◆ BENCHMARK_REGISTER_F() [2/7]

BENCHMARK_REGISTER_F ( PerfModuleHsolverMathKernel  ,
BM_scal_op_cpu   
) -> RangeMultiplier(10) ->Range(1, 10e6) ->Unit(benchmark::kMicrosecond)

◆ BENCHMARK_REGISTER_F() [3/7]

BENCHMARK_REGISTER_F ( PerfModuleHsolverMathKernel  ,
BM_vector_add_vector_op_cpu   
) -> RangeMultiplier(10) ->Range(1, 10e6) ->Unit(benchmark::kMicrosecond)

◆ BENCHMARK_REGISTER_F() [4/7]

BENCHMARK_REGISTER_F ( PerfModuleHsolverMathKernel  ,
BM_vector_div_vector_op_cpu   
) -> RangeMultiplier(10) ->Range(1, 10e6) ->Unit(benchmark::kMicrosecond)

◆ BENCHMARK_REGISTER_F() [5/7]

BENCHMARK_REGISTER_F ( PerfModuleHsolverMathKernel  ,
BM_vector_mul_real_op_cpu   
) -> RangeMultiplier(10) ->Range(1, 10e6) ->Unit(benchmark::kMicrosecond)

◆ BENCHMARK_REGISTER_F() [6/7]

BENCHMARK_REGISTER_F ( PerfModuleHsolverMathKernel  ,
BM_vector_mul_vector_op_cpu   
) -> RangeMultiplier(10) ->Range(1, 10e6) ->Unit(benchmark::kMicrosecond)

◆ BENCHMARK_REGISTER_F() [7/7]

BENCHMARK_REGISTER_F ( PerfModuleHsolverMathKernel  ,
BM_zdot_real_cpu_op   
) -> RangeMultiplier(10) ->Range(1, 10e6) ->Unit(benchmark::kMicrosecond)