Name | Module | Coverage (%) | Time (s) | Nb Threads | Deviation (coverage) | Deviation (time) |
orig | compilers/armclang_5 | orig | compilers/armclang_5 | orig | compilers/armclang_5 | orig | compilers/armclang_5 | orig | compilers/armclang_5 |
void miniqmcreference::MultiBsplineEvalRef::evaluate_v<double>(qmcplusplus::bspline_traits<double, 3u>::SplineType const*, double, double, double, double*, unsigned long) | exec | 29.32 | 29.23 | 16.33 | 16.36 | 80 | 80 | 0.37 | 0.38 | 0.21 | 0.24 |
void miniqmcreference::MultiBsplineEvalRef::evaluate_vgh<double>(qmcplusplus::bspline_traits<double, 3u>::SplineType const*, double, double, double, double*, double*, double*, unsigned long) | exec | 14.47 | 14.42 | 8.06 | 8.07 | 80 | 80 | 0.26 | 0.28 | 0.14 | 0.15 |
dgemm_vanilla_big_no_prefetch | libarmpl_mp.so | NA | 18 | NA | 10.07 | NA | 80 | NA | 0.37 | NA | 0.21 |
dgemm_vanilla_big_no_prefetch | libarmpl.so | 17.78 | NA | 9.91 | NA | 80 | NA | 0.35 | NA | 0.20 | NA |
qmcplusplus::SoaDistanceTableAAOMPTarget<double, 3u, 40>::update(int) | exec | 7.05 | 7.05 | 3.93 | 3.95 | 80 | 80 | 0.27 | 0.24 | 0.15 | 0.13 |
qmcplusplus::SoaDistanceTableABOMPTarget<double, 3u, 40>::evaluate(qmcplusplus::ParticleSet&) | exec | 4.35 | 4.36 | 2.42 | 2.44 | 80 | 80 | 0.13 | 0.15 | 0.07 | 0.08 |
n_interleave_kernel_d6 | libarmpl.so | 6.01 | NA | 3.35 | NA | 80 | NA | 0.35 | NA | 0.19 | NA |
n_interleave_kernel_d6 | libarmpl_mp.so | NA | 5.96 | NA | 3.34 | NA | 80 | NA | 0.35 | NA | 0.20 |
void qmcplusplus::DTD_BConds<double, 3u, 40>::computeDistances<qmcplusplus::TinyVector<double, 3u>, qmcplusplus::VectorSoAContainer<double, 3u, qmcplusplus::Mallocator<double, 32ul> >, qmcplusplus::VectorSoAContainer<double, 3... | exec | 2.32 | 2.32 | 1.29 | 1.3 | 80 | 80 | 0.16 | 0.16 | 0.09 | 0.09 |
miniqmcreference::TwoBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::evaluateRatios(qmcplusplus::VirtualParticleSet&, std::vector<double, std::allocator<double> >&) | exec | 1.69 | 1.68 | 0.94 | 0.94 | 80 | 80 | 0.12 | 0.13 | 0.06 | 0.07 |
dgemv_t_neon_kernel_serial | libarmpl.so | 3.27 | NA | 1.82 | NA | 80 | NA | 0.17 | NA | 0.09 | NA |
miniqmcreference::TwoBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::acceptMove(qmcplusplus::ParticleSet&, int) | exec | 1.64 | 1.62 | 0.91 | 0.91 | 80 | 80 | 0.12 | 0.12 | 0.07 | 0.07 |
dgemv_t_neon_kernel_serial | libarmpl_mp.so | NA | 3.23 | NA | 1.81 | NA | 80 | NA | 0.18 | NA | 0.10 |
kmp_flag_64<false, true>::wait(kmp_info*, int, void*) | libomp_with_lse.so | 1.29 | 1.21 | 0.72 | 0.68 | 80 | 80 | 0.32 | 0.30 | 0.18 | 0.17 |
__memcpy | libastring_aarch64.so | 1.03 | 1.02 | 0.57 | 0.57 | 80 | 80 | 0.09 | 0.10 | 0.05 | 0.06 |
dgemv_n_neon_kernel | libarmpl.so | 1.87 | NA | 1.04 | NA | 80 | NA | 0.12 | NA | 0.07 | NA |
dgemv_n_neon_kernel | libarmpl_mp.so | NA | 1.86 | NA | 1.04 | NA | 80 | NA | 0.11 | NA | 0.06 |
qmcplusplus::BsplineFunctor<double>::evaluateVGL(int, int, int, double const*, double*, double*, double*, double*, int*) const [clone .109] [clone .extracted] | exec | 0.9 | 0.9 | 0.5 | 0.5 | 80 | 80 | 0.09 | 0.10 | 0.05 | 0.06 |
miniqmcreference::einspline_spo_ref<double>::evaluate(qmcplusplus::ParticleSet const&, int, qmcplusplus::Vector<double, std::allocator<double> >&, qmcplusplus::Vector<qmcplusplus::TinyVector<double, 3u>, std::allocator<... | exec | 0.89 | 0.9 | 0.5 | 0.51 | 80 | 80 | 0.10 | 0.09 | 0.06 | 0.05 |
miniqmcreference::TwoBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::ratioGrad(qmcplusplus::ParticleSet&, int, qmcplusplus::TinyVector<double, 3u>&) | exec | 0.89 | 0.87 | 0.5 | 0.49 | 80 | 80 | 0.09 | 0.10 | 0.05 | 0.05 |
miniqmcreference::DiracDeterminantRef<qmcplusplus::DelayedUpdate<double, double> >::evaluateGL(qmcplusplus::ParticleSet&, qmcplusplus::ParticleAttrib<qmcplusplus::TinyVector<double, 3u>, std::allocator<qmcplusplus::TinyVector<... | exec | 0.84 | 0.83 | 0.47 | 0.47 | 80 | 80 | 0.04 | 0.03 | 0.02 | 0.02 |
miniqmcreference::DiracDeterminantRef<qmcplusplus::DelayedUpdate<double, double> >::evalGrad(qmcplusplus::ParticleSet&, int) | exec | 0.64 | 0.66 | 0.36 | 0.37 | 80 | 80 | 0.08 | 0.07 | 0.04 | 0.04 |
__memset | libastring_aarch64.so | 0.62 | 0.63 | 0.35 | 0.35 | 80 | 80 | 0.08 | 0.08 | 0.05 | 0.04 |
qmcplusplus::SPOSet::evaluateDetRatios(qmcplusplus::VirtualParticleSet const&, qmcplusplus::Vector<double, std::allocator<double> >&, qmcplusplus::Vector<double, std::allocator<double> > const&, std::vector<double, st... | exec | 0.34 | 0.35 | 0.19 | 0.2 | 80 | 80 | 0.05 | 0.06 | 0.03 | 0.04 |
t_interleave_kernel_d8 | libarmpl_mp.so | NA | 0.53 | NA | 0.3 | NA | 80 | NA | 0.07 | NA | 0.04 |
t_interleave_kernel_d8 | libarmpl.so | 0.46 | NA | 0.26 | NA | 80 | NA | 0.07 | NA | 0.04 | NA |
miniqmcreference::DiracDeterminantRef<qmcplusplus::DelayedUpdate<double, double> >::ratioGrad(qmcplusplus::ParticleSet&, int, qmcplusplus::TinyVector<double, 3u>&) | exec | 0.16 | 0.17 | 0.09 | 0.1 | 80 | 80 | 0.04 | 0.04 | 0.02 | 0.02 |
miniqmcreference::OneBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::evaluateRatios(qmcplusplus::VirtualParticleSet&, std::vector<double, std::allocator<double> >&) | exec | 0.13 | 0.14 | 0.07 | 0.08 | 80 | 80 | 0.04 | 0.04 | 0.02 | 0.02 |
qmcplusplus::DiracMatrix<double, double>::invert_transpose(qmcplusplus::Matrix<double, std::allocator<double> > const&, qmcplusplus::Matrix<double, std::allocator<double> >&, double&, double&) | exec | 0.13 | 0.14 | 0.07 | 0.08 | 80 | 80 | 0.02 | 0.02 | 0.01 | 0.01 |
qmcplusplus::NonLocalPP<double>::evaluate(qmcplusplus::ParticleSet const&, qmcplusplus::WaveFunction&) | exec | 0.12 | 0.11 | 0.07 | 0.06 | 80 | 80 | 0.03 | 0.03 | 0.02 | 0.02 |
miniqmcreference::OneBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::ratioGrad(qmcplusplus::ParticleSet&, int, qmcplusplus::TinyVector<double, 3u>&) | exec | 0.11 | 0.1 | 0.06 | 0.06 | 80 | 80 | 0.04 | 0.03 | 0.02 | 0.02 |
miniqmcreference::DiracDeterminantRef<qmcplusplus::DelayedUpdate<double, double> >::evaluateLog(qmcplusplus::ParticleSet&, qmcplusplus::ParticleAttrib<qmcplusplus::TinyVector<double, 3u>, std::allocator<qmcplusplus::TinyVector&l... | exec | 0.1 | 0.1 | 0.05 | 0.06 | 80 | 80 | 0.02 | 0.01 | 0.01 | 0.01 |
miniqmcreference::TwoBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::recompute(qmcplusplus::ParticleSet&) | exec | 0.07 | 0.07 | 0.04 | 0.04 | 80 | 80 | 0.02 | 0.02 | 0.01 | 0.01 |
dgeset | libarmpl_mp.so | NA | 0.13 | NA | 0.07 | NA | 80 | NA | 0.03 | NA | 0.02 |
n_interleave_kernel_d8 | libarmpl_mp.so | NA | 0.13 | NA | 0.07 | NA | 80 | NA | 0.03 | NA | 0.02 |
n_interleave_kernel_d8 | libarmpl.so | 0.12 | NA | 0.07 | NA | 80 | NA | 0.03 | NA | 0.02 | NA |
dgeset | libarmpl.so | 0.12 | NA | 0.07 | NA | 80 | NA | 0.04 | NA | 0.02 | NA |
qmcplusplus::TimerType<std::chrono::_V2::system_clock>::start() | exec | 0.06 | 0.06 | 0.04 | 0.03 | 80 | 80 | 0.02 | 0.02 | 0.01 | 0.01 |
qmcplusplus::Vector<double, std::allocator<double> >::resize(unsigned long, double) | exec | 0.05 | 0.04 | 0.03 | 0.02 | 80 | 78 | 0.01 | 0.02 | 0.01 | 0.01 |
miniqmcreference::OneBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::computeU3(qmcplusplus::ParticleSet&, int, double const*) | exec | 0.04 | 0.04 | 0.02 | 0.02 | 79 | 79 | 0.02 | 0.02 | 0.01 | 0.01 |
dgetrf7vn_ | libarmpl.so | 0.06 | NA | 0.04 | NA | 80 | NA | 0.02 | NA | 0.01 | NA |
.omp_outlined..64 | exec | 0.03 | 0.03 | 0.01 | 0.02 | 78 | 75 | 0.02 | 0.02 | 0.01 | 0.01 |
dgetrf7vn_ | libarmpl_mp.so | NA | 0.06 | NA | 0.04 | NA | 80 | NA | 0.02 | NA | 0.01 |
qmcplusplus::SoaDistanceTableABOMPTarget<double, 3u, 40>::move(qmcplusplus::ParticleSet const&, qmcplusplus::TinyVector<double, 3u> const&, int, bool) | exec | 0.03 | 0.03 | 0.01 | 0.02 | 75 | 77 | 0.01 | 0.01 | 0.01 | 0.01 |
qmcplusplus::ParticleSet::acceptMove(int) | exec | 0.03 | 0.03 | 0.01 | 0.02 | 76 | 76 | 0.02 | 0.01 | 0.01 | 0.01 |
__exp_finite | libamath_neoverse-n1.so | 0.03 | 0.03 | 0.02 | 0.02 | 75 | 77 | 0.02 | 0.02 | 0.01 | 0.01 |
qmcplusplus::TimerType<std::chrono::_V2::system_clock>::stop() | exec | 0.03 | 0.03 | 0.02 | 0.01 | 74 | 73 | 0.04 | 0.05 | 0.02 | 0.03 |
qmcplusplus::WaveFunction::ratioGrad(qmcplusplus::ParticleSet&, int, qmcplusplus::TinyVector<double, 3u>&) | exec | 0.02 | 0.03 | 0.01 | 0.01 | 63 | 75 | 0.01 | 0.01 | 0.01 | 0.01 |
qmcplusplus::SoaDistanceTableAAOMPTarget<double, 3u, 40>::move(qmcplusplus::ParticleSet const&, qmcplusplus::TinyVector<double, 3u> const&, int, bool) | exec | 0.02 | 0.03 | 0.01 | 0.01 | 76 | 76 | 0.01 | 0.02 | 0.01 | 0.01 |
qmcplusplus::WaveFunction::evaluateRatios(qmcplusplus::VirtualParticleSet&, std::vector<double, std::allocator<double> >&) | exec | 0.02 | 0.03 | 0.01 | 0.01 | 76 | 76 | 0.01 | 0.01 | 0.01 | 0.01 |
__kmp_get_global_thread_id_reg | libomp_with_lse.so | 0.03 | 0.02 | 0.02 | 0.01 | 79 | 74 | 0.02 | 0.01 | 0.01 | 0.01 |
@plt_start@ | libarmpl_mp.so | NA | 0.05 | NA | 0.03 | NA | 80 | NA | 0.02 | NA | 0.01 |
__GI___sched_yield | libc-2.28.so | 0.03 | 0.02 | 0.01 | 0.01 | 75 | 76 | 0.01 | 0.01 | 0.01 | 0.01 |
void armpl::clag::(anonymous namespace)::gemv_a_cntg_first<false, double, double, double, double>(long, long, double, double const*, long, long, double const*, long, double, double*, long) | libarmpl_mp.so | NA | 0.05 | NA | 0.03 | NA | 80 | NA | 0.02 | NA | 0.01 |
__kmp_api_omp_get_level | libomp_with_lse.so | 0.02 | 0.03 | 0.01 | 0.01 | 75 | 76 | 0.01 | 0.01 | 0.01 | 0.01 |
void qmcplusplus::DelayedUpdate<double, double>::getInvRow<qmcplusplus::Vector<double, std::allocator<double> > >(qmcplusplus::Matrix<double, std::allocator<double> > const&, int, qmcplusplus::Vector<double, std::... | exec | 0.02 | 0.02 | 0.01 | 0.01 | 66 | 64 | 0.01 | 0.01 | 0.01 | 0.01 |
qmcplusplus::ParticleSet::makeMove(int, qmcplusplus::TinyVector<double, 3u> const&, bool) | exec | 0.02 | 0.02 | 0.01 | 0.01 | 66 | 70 | 0.01 | 0.01 | 0.00 | 0.01 |
@plt_start@ | libarmpl.so | 0.04 | NA | 0.02 | NA | 79 | NA | 0.02 | NA | 0.01 | NA |
void armpl::clag::(anonymous namespace)::gemv_a_cntg_first<false, double, double, double, double>(long, long, double, double const*, long, long, double const*, long, double, double*, long) | libarmpl.so | 0.04 | NA | 0.02 | NA | 79 | NA | 0.02 | NA | 0.01 | NA |
__cxxabiv1::__vmi_class_type_info::__do_dyncast(long, __cxxabiv1::__class_type_info::__sub_kind, __cxxabiv1::__class_type_info const*, void const*, __cxxabiv1::__class_type_info const*, void const*, __cxxabiv1::__class_type_info::__dyncast_result&) co... | libarmpl.so | 0.04 | NA | 0.02 | NA | 78 | NA | 0.02 | NA | 0.01 | NA |
qmcplusplus::SoaDistanceTableABOMPTarget<double, 3u, 40>::update(int) | exec | 0.02 | 0.02 | 0.01 | 0.01 | 67 | 71 | 0.01 | 0.01 | 0.01 | 0.01 |
void armpl::clag::blas3_gemv::operator()<double, armpl::clag::spec::neoverse_n1_machine_spec>(armpl::clag::spec::problem_context<double, (armpl::clag::spec::problem_type)29, armpl::clag::spec::neoverse_n1_machine_spec> const&) const | libarmpl_mp.so | NA | 0.04 | NA | 0.02 | NA | 76 | NA | 0.02 | NA | 0.01 |
void qmcplusplus::DelayedUpdate<double, double>::acceptRow<qmcplusplus::Vector<double, std::allocator<double> > >(qmcplusplus::Matrix<double, std::allocator<double> >&, int, qmcplusplus::Vector<double, std::alloca... | exec | 0.02 | 0.02 | 0.01 | 0.01 | 73 | 68 | 0.01 | 0.01 | 0.01 | 0.01 |
unknown_function | exec | 0.02 | 0.02 | 0.01 | 0.01 | 78 | 69 | 0.01 | 0.01 | 0.01 | 0.01 |
void armpl::clag::(anonymous namespace)::trsm_kernel<double, true, true, true, false, false>(double const*, long, long, double*, long, long, long, long) | libarmpl_mp.so | NA | 0.04 | NA | 0.02 | NA | 78 | NA | 0.02 | NA | 0.01 |
miniqmcreference::einspline_spo_ref<double>::evaluate_v(qmcplusplus::ParticleSet const&, int) | exec | 0.02 | 0.02 | 0.01 | 0.01 | 73 | 75 | 0.01 | 0.02 | 0.01 | 0.01 |
unknown_function | Unknown module | 0.02 | 0.02 | 0.01 | 0.01 | 69 | 63 | 0.01 | 0.01 | 0.01 | 0.01 |
miniqmcreference::einspline_spo_ref<double>::evaluate_vgh(qmcplusplus::ParticleSet const&, int) | exec | 0.02 | 0.02 | 0.01 | 0.01 | 70 | 75 | 0.01 | 0.01 | 0.01 | 0.01 |
qmcplusplus::WaveFunction::evalGrad(qmcplusplus::ParticleSet&, int) | exec | 0.02 | 0.02 | 0.01 | 0.01 | 74 | 71 | 0.01 | 0.01 | 0.01 | 0.01 |
__dynamic_cast | libarmpl_mp.so | NA | 0.03 | NA | 0.01 | NA | 75 | NA | 0.02 | NA | 0.01 |
dlaswp_ | libarmpl_mp.so | NA | 0.03 | NA | 0.02 | NA | 79 | NA | 0.01 | NA | 0.01 |
__cxxabiv1::__vmi_class_type_info::__do_dyncast(long, __cxxabiv1::__class_type_info::__sub_kind, __cxxabiv1::__class_type_info const*, void const*, __cxxabiv1::__class_type_info const*, void const*, __cxxabiv1::__class_type_info::__dyncast_result&) co... | libarmpl_mp.so | NA | 0.03 | NA | 0.02 | NA | 78 | NA | 0.02 | NA | 0.01 |
miniqmcreference::TwoBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::evalGrad(qmcplusplus::ParticleSet&, int) | exec | 0.01 | 0.02 | 0.01 | 0.01 | 61 | 67 | 0.01 | 0.01 | 0.01 | 0.01 |
dlaswp_ | libarmpl.so | 0.03 | NA | 0.02 | NA | 76 | NA | 0.02 | NA | 0.01 | NA |
__dynamic_cast | libarmpl.so | 0.03 | NA | 0.02 | NA | 77 | NA | 0.02 | NA | 0.01 | NA |
void armpl::clag::(anonymous namespace)::trsm_kernel<double, true, true, true, false, false>(double const*, long, long, double*, long, long, long, long) | libarmpl.so | 0.03 | NA | 0.02 | NA | 80 | NA | 0.02 | NA | 0.01 | NA |
__strcmp | libastring_aarch64.so | 0.01 | 0.01 | 0.01 | 0 | 62 | 46 | 0.01 | 0.00 | 0.00 | 0.00 |
qmcplusplus::ParticleSet::update(bool) | exec | 0.01 | 0.01 | 0.01 | 0.01 | 59 | 58 | 0.01 | 0.01 | 0.00 | 0.01 |
qmcplusplus::VirtualParticleSet::makeMoves(qmcplusplus::ParticleSet const&, int, std::vector<qmcplusplus::TinyVector<double, 3u>, std::allocator<qmcplusplus::TinyVector<double, 3u> > > const&, bool, int) | exec | 0.01 | 0.01 | 0 | 0 | 48 | 46 | 0.01 | 0.01 | 0.00 | 0.00 |
miniqmcreference::DiracDeterminantRef<qmcplusplus::DelayedUpdate<double, double> >::acceptMove(qmcplusplus::ParticleSet&, int) | exec | 0.01 | 0.01 | 0.01 | 0.01 | 55 | 58 | 0.01 | 0.01 | 0.01 | 0.01 |
__kmp_get_ancestor_thread_num | libomp_with_lse.so | 0.01 | 0.01 | 0.01 | 0.01 | 60 | 58 | 0.01 | 0.01 | 0.01 | 0.00 |
f64xsubf128 | libm-2.28.so | 0.01 | 0.01 | 0.01 | 0 | 79 | 72 | 0.00 | 0.00 | 0.00 | 0.00 |
bool armpl::dispatch_atomic_neon<double>(armpl::armpl_trans, armpl::armpl_trans, long, long, long, double const*, long, double const*, long, double*, long, double, double) | libarmpl.so | 0.02 | NA | 0.01 | NA | 75 | NA | 0.01 | NA | 0.01 | NA |
qmcplusplus::ParticleSet::computeNewPosDistTables(int, qmcplusplus::TinyVector<double, 3u> const&, bool) | exec | 0.01 | 0.01 | 0.01 | 0.01 | 53 | 51 | 0.01 | 0.01 | 0.01 | 0.00 |
miniqmcreference::OneBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::recompute(qmcplusplus::ParticleSet&) | exec | 0.01 | 0.01 | 0.01 | 0.01 | 66 | 75 | 0.00 | 0.00 | 0.00 | 0.00 |
daxpy_kernel | libarmpl_mp.so | NA | 0.02 | NA | 0.01 | NA | 65 | NA | 0.02 | NA | 0.01 |
void armpl::clag::blas3_gemv::operator()<double, armpl::clag::spec::neoverse_n1_machine_spec>(armpl::clag::spec::problem_context<double, (armpl::clag::spec::problem_type)29, armpl::clag::spec::neoverse_n1_machine_spec> const&) const | libarmpl.so | 0.02 | NA | 0.01 | NA | 70 | NA | 0.01 | NA | 0.01 | NA |
miniqmcreference::OneBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::evalGrad(qmcplusplus::ParticleSet&, int) | exec | 0.01 | 0.01 | 0.01 | 0.01 | 56 | 60 | 0.01 | 0.01 | 0.00 | 0.00 |
daxpy_kernel | libarmpl.so | 0.02 | NA | 0.01 | NA | 66 | NA | 0.02 | NA | 0.01 | NA |
qmcplusplus::Vector<qmcplusplus::TinyVector<double, 3u>, std::allocator<qmcplusplus::TinyVector<double, 3u> > >::resize(unsigned long, qmcplusplus::TinyVector<double, 3u>) | exec | 0.01 | 0.01 | 0 | 0 | 42 | 42 | 0.01 | 0.01 | 0.00 | 0.00 |
qmcplusplus::WaveFunction::acceptMove(qmcplusplus::ParticleSet&, int) | exec | 0.01 | 0.01 | 0 | 0 | 44 | 52 | 0.01 | 0.00 | 0.00 | 0.00 |
miniqmcreference::einspline_spo_ref<double>::evaluate(qmcplusplus::ParticleSet const&, int, qmcplusplus::Vector<double, std::allocator<double> >&) | exec | 0.01 | 0.01 | 0 | 0.01 | 33 | 52 | 0.01 | 0.01 | 0.00 | 0.00 |
qmcplusplus::Vector<double, qmcplusplus::OMPallocator<double, qmcplusplus::Mallocator<double, 32ul> > >::resize(unsigned long, double) | exec | 0.01 | 0.01 | 0 | 0 | 37 | 44 | 0.01 | 0.01 | 0.00 | 0.00 |
unknown_function | [vdso] | 0.01 | 0.01 | 0 | 0 | 47 | 38 | 0.01 | 0.01 | 0.01 | 0.01 |
void armpl::clag::ger<true, int, false, double, armpl::clag::spec::neoverse_n1_machine_spec>(int const*, int const*, double const*, double const*, int const*, double const*, int const*, double*, int const*) | libarmpl_mp.so | NA | 0.01 | NA | 0.01 | NA | 61 | NA | 0.01 | NA | 0.01 |
void armpl::clag::ger<true, int, false, double, armpl::clag::spec::neoverse_n1_machine_spec>(int const*, int const*, double const*, double const*, int const*, double const*, int const*, double*, int const*) | libarmpl.so | 0.01 | NA | 0 | NA | 41 | NA | 0.01 | NA | 0.00 | NA |
dger_ | libarmpl_mp.so | NA | 0.01 | NA | 0 | NA | 46 | NA | 0.01 | NA | 0.00 |
lsame_ | libarmpl_mp.so | NA | 0.01 | NA | 0 | NA | 52 | NA | 0.01 | NA | 0.00 |
__cxxabiv1::__si_class_type_info::__do_dyncast(long, __cxxabiv1::__class_type_info::__sub_kind, __cxxabiv1::__class_type_info const*, void const*, __cxxabiv1::__class_type_info const*, void const*, __cxxabiv1::__class_type_info::__dyncast_result&) co... | libarmpl.so | 0.01 | NA | 0 | NA | 41 | NA | 0.01 | NA | 0.00 | NA |
void armpl::clag::(anonymous namespace)::outer_product_terminal<void (*)(long, double, double const*, double, double*, long, long)>::operator()<armpl::clag::general_matrix<armpl::clag::(anonymous namespace)::matrix_base<double const> >... | libarmpl_mp.so | NA | 0.01 | NA | 0 | NA | 48 | NA | 0.01 | NA | 0.00 |
void armpl::clag::gemv<true, int, double, double, double, double, armpl::clag::spec::neoverse_n1_machine_spec>(char const*, int const*, int const*, double const*, double const*, int const*, double const*, int const*, double const*, double*, int cons... | libarmpl_mp.so | NA | 0.01 | NA | 0 | NA | 44 | NA | 0.01 | NA | 0.00 |
void armpl::clag::(anonymous namespace)::outer_product_terminal<void (*)(long, double, double const*, double, double*, long, long)>::operator()<armpl::clag::general_matrix<armpl::clag::(anonymous namespace)::matrix_base<double const> >... | libarmpl.so | 0.01 | NA | 0 | NA | 40 | NA | 0.01 | NA | 0.00 | NA |
bool armpl::dispatch_atomic_neon<double>(armpl::armpl_trans, armpl::armpl_trans, long, long, long, double const*, long, double const*, long, double*, long, double, double) | libarmpl_mp.so | NA | 0.01 | NA | 0.01 | NA | 52 | NA | 0.01 | NA | 0.01 |
__fd_log_1 | libamath_neoverse-n1.so | 0.01 | 0 | 0 | 0 | 35 | 18 | 0.01 | 0.00 | 0.00 | 0.00 |
__kmp_api_omp_get_ancestor_thread_num | libomp_with_lse.so | 0 | 0.01 | 0 | 0 | 29 | 40 | 0.00 | 0.00 | 0.00 | 0.00 |
void armpl::clag::gemv<true, int, double, double, double, double, armpl::clag::spec::neoverse_n1_machine_spec>(char const*, int const*, int const*, double const*, double const*, int const*, double const*, int const*, double const*, double*, int cons... | libarmpl.so | 0.01 | NA | 0 | NA | 38 | NA | 0.01 | NA | 0.00 | NA |
miniqmcreference::OneBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::acceptMove(qmcplusplus::ParticleSet&, int) | exec | 0.01 | 0 | 0 | 0 | 39 | 32 | 0.00 | 0.00 | 0.00 | 0.00 |
void armpl::clag::gemm<true, int, double, double, double, armpl::clag::spec::neoverse_n1_machine_spec>(char const*, char const*, int const*, int const*, int const*, double const*, double const*, int const*, double const*, int const*, double const*, d... | libarmpl.so | 0.01 | NA | 0.01 | NA | 61 | NA | 0.01 | NA | 0.00 | NA |
lsame_ | libarmpl.so | 0.01 | NA | 0 | NA | 35 | NA | 0.01 | NA | 0.00 | NA |
ddot_kernel | libarmpl.so | 0.01 | NA | 0 | NA | 35 | NA | 0.01 | NA | 0.00 | NA |
void armpl::clag::gemm<true, int, double, double, double, armpl::clag::spec::neoverse_n1_machine_spec>(char const*, char const*, int const*, int const*, int const*, double const*, double const*, int const*, double const*, int const*, double const*, d... | libarmpl_mp.so | NA | 0 | NA | 0 | NA | 20 | NA | 0.00 | NA | 0.00 |
void armpl::clag::(anonymous namespace)::gemv_shim<true, double, &dgemv_t_neon_kernel_serial>(long, long, double, double const*, long, long, double const*, long, double, double*, long) | libarmpl_mp.so | NA | 0 | NA | 0 | NA | 12 | NA | 0.00 | NA | 0.00 |
__cxxabiv1::__si_class_type_info::__do_dyncast(long, __cxxabiv1::__class_type_info::__sub_kind, __cxxabiv1::__class_type_info const*, void const*, __cxxabiv1::__class_type_info const*, void const*, __cxxabiv1::__class_type_info::__dyncast_result&) co... | libarmpl_mp.so | NA | 0 | NA | 0 | NA | 22 | NA | 0.00 | NA | 0.00 |
void armpl::clag::blas1_axpby::operator()<double, armpl::clag::spec::neoverse_n1_machine_spec>(armpl::clag::spec::problem_context<double, (armpl::clag::spec::problem_type)46, armpl::clag::spec::neoverse_n1_machine_spec> const&) const | libarmpl_mp.so | NA | 0 | NA | 0 | NA | 8 | NA | 0.00 | NA | 0.00 |
kernel_dgemm_5_1_5_NT | libarmpl_mp.so | NA | 0 | NA | 0 | NA | 8 | NA | 0.00 | NA | 0.00 |
void armpl::clag::(anonymous namespace)::c_copy<double, armpl::clag::(anonymous namespace)::kernel_exec<void (*)(double const*, double const*, double*, long, long, long, long, double, double)> >::operator()<armpl::clag::(anonymous namespace)... | libarmpl_mp.so | NA | 0 | NA | 0 | NA | 1 | NA | 0.00 | NA | 0.00 |
void armpl::clag::(anonymous namespace)::axpby_fallback<false, double, double, double>(long, double, double const*, double, double*, long, long) | libarmpl_mp.so | NA | 0 | NA | 0 | NA | 8 | NA | 0.00 | NA | 0.00 |
void armpl::clag::(anonymous namespace)::neon_interleave::operator()<double const, double>(armpl::clag::general_matrix<armpl::clag::(anonymous namespace)::matrix_base<double const> > const&, armpl::clag::(anonymous namespace)::interle... | libarmpl_mp.so | NA | 0 | NA | 0 | NA | 1 | NA | 0.00 | NA | 0.00 |
idamax_kernel | libarmpl_mp.so | NA | 0 | NA | 0 | NA | 11 | NA | 0.01 | NA | 0.00 |
bool armpl::clag::gemm_atomic::use<armpl::clag::spec::problem_context<double, (armpl::clag::spec::problem_type)29, armpl::clag::spec::neoverse_n1_machine_spec> >(armpl::clag::spec::problem_context<double, (armpl::clag::spec::problem_type)29,... | libarmpl_mp.so | NA | 0 | NA | 0 | NA | 25 | NA | 0.00 | NA | 0.00 |
.text@start | libmlx5.so.1.24.44.0 | 0 | NA | 0 | NA | 1 | NA | 0.00 | NA | 0.00 | NA |
dgemv_ | libarmpl_mp.so | NA | 0 | NA | 0 | NA | 25 | NA | 0.00 | NA | 0.00 |
__kmp_get_max_active_levels | libomp_with_lse.so | NA | 0 | NA | 0 | NA | 8 | NA | 0.00 | NA | 0.00 |
__memmove | libastring_aarch64.so | 0 | 0 | 0 | 0 | 1 | 1 | 0.00 | 0.00 | 0.00 | 0.00 |
@plt_start@ | libucs.so.0.0.0 | 0 | NA | 0 | NA | 1 | NA | 0.00 | NA | 0.00 | NA |
bool armpl::dispatch_atomic<double>(armpl::armpl_trans, armpl::armpl_trans, long, long, long, double const*, long, double const*, long, double*, long, double, double) | libarmpl_mp.so | NA | 0 | NA | 0 | NA | 28 | NA | 0.00 | NA | 0.00 |
_ZSt13__invoke_implIvZN5armpl4clag4gemmIdLNS1_4spec12problem_typeE0ENS3_24neoverse_n1_machine_specEEEvRKNS3_15problem_contextIT_XT0_ET1_EEEUlDpRT_E_JRKNS1_18blas3_set_or_scaleERKNS1_11gemm_atomicERKNS1_9blas1_dotERKNS1_11blas1_axpbyERKNS1_10blas3_gemvERKNS... | libarmpl_mp.so | NA | 0 | NA | 0 | NA | 2 | NA | 0.00 | NA | 0.00 |
ddot_kernel | libarmpl_mp.so | NA | 0 | NA | 0 | NA | 33 | NA | 0.01 | NA | 0.00 |
___kmp_free | libomp_with_lse.so | 0 | 0 | 0 | 0 | 1 | 3 | 0.00 | 0.00 | 0.00 | 0.00 |
_ZSt13__invoke_implIvZN5armpl4clag4gemmIdLNS1_4spec12problem_typeE29ENS3_24neoverse_n1_machine_specEEEvRKNS3_15problem_contextIT_XT0_ET1_EEEUlDpRT_E_JRKNS1_18blas3_set_or_scaleERKNS1_11gemm_atomicERKNS1_9blas1_dotERKNS1_11blas1_axpbyERKNS1_10blas3_gemvEEES... | libarmpl_mp.so | NA | 0 | NA | 0 | NA | 29 | NA | 0.00 | NA | 0.00 |
__kmp_api_omp_get_thread_num | libomp_with_lse.so | NA | 0 | NA | 0 | NA | 33 | NA | 0.00 | NA | 0.00 |
void geset<double>(double, long, long, double const*, long) | libarmpl_mp.so | NA | 0 | NA | 0 | NA | 7 | NA | 0.00 | NA | 0.00 |
std::vector<qmcplusplus::BsplineFunctor<double>*, std::allocator<qmcplusplus::BsplineFunctor<double>*> >::_M_fill_insert(__gnu_cxx::__normal_iterator<qmcplusplus::BsplineFunctor<double>**, std::vector<qmcplusplus::Bsplin... | exec | NA | 0 | NA | 0 | NA | 1 | NA | 0.00 | NA | 0.00 |
kernel_dgemm_3_1_3_NT | libarmpl_mp.so | NA | 0 | NA | 0 | NA | 6 | NA | 0.00 | NA | 0.00 |
dgemm_ | libarmpl_mp.so | NA | 0 | NA | 0 | NA | 1 | NA | 0.00 | NA | 0.00 |
bool armpl::clag::gemm_atomic::use<armpl::clag::spec::problem_context<double, (armpl::clag::spec::problem_type)0, armpl::clag::spec::neoverse_n1_machine_spec> >(armpl::clag::spec::problem_context<double, (armpl::clag::spec::problem_type)0, a... | libarmpl_mp.so | NA | 0 | NA | 0 | NA | 1 | NA | 0.00 | NA | 0.00 |
operator delete(void*) | libarmpl_mp.so | NA | 0 | NA | 0 | NA | 1 | NA | 0.00 | NA | 0.00 |
__nv_dgetrf_nag__F1L101_1_ | libarmpl_mp.so | NA | 0 | NA | 0 | NA | 1 | NA | 0.00 | NA | 0.00 |
void armpl::clag::triangular_solve_resident<armpl::clag::(anonymous namespace)::gemm_exec<armpl::clag::spec::neoverse_n1_machine_spec>, armpl::clag::(anonymous namespace)::trsm_kernel_exec<double> >::operator()<armpl::clag::(anonymous ... | libarmpl_mp.so | NA | 0 | NA | 0 | NA | 1 | NA | 0.00 | NA | 0.00 |
void armpl::clag::triangular_solve_resident<armpl::clag::(anonymous namespace)::gemm_exec<armpl::clag::spec::neoverse_n1_machine_spec>, armpl::clag::triangular_solve_resident<armpl::clag::(anonymous namespace)::gemm_exec<armpl::clag::spec::n... | libarmpl_mp.so | NA | 0 | NA | 0 | NA | 1 | NA | 0.00 | NA | 0.00 |
void armpl::clag::triangular_solve_resident<armpl::clag::(anonymous namespace)::gemm_exec<armpl::clag::spec::neoverse_n1_machine_spec>, armpl::clag::triangular_solve_resident<armpl::clag::(anonymous namespace)::gemm_exec<armpl::clag::spec::n... | libarmpl_mp.so | NA | 0 | NA | 0 | NA | 1 | NA | 0.00 | NA | 0.00 |
dtrtri_ | libarmpl_mp.so | NA | 0 | NA | 0 | NA | 1 | NA | 0.00 | NA | 0.00 |
void armpl::clag::triangular_solve_resident<armpl::clag::(anonymous namespace)::gemm_exec<armpl::clag::spec::neoverse_n1_machine_spec>, armpl::clag::triangular_solve_resident<armpl::clag::(anonymous namespace)::gemm_exec<armpl::clag::spec::n... | libarmpl_mp.so | NA | 0 | NA | 0 | NA | 1 | NA | 0.00 | NA | 0.00 |
void armpl::clag::scal_impl<double, double, armpl::clag::spec::neoverse_n1_machine_spec>(armpl::clag::spec::problem_context_2T<double, double, (armpl::clag::spec::problem_type)41, armpl::clag::spec::neoverse_n1_machine_spec> const&) | libarmpl_mp.so | NA | 0 | NA | 0 | NA | 1 | NA | 0.00 | NA | 0.00 |
with_errno | libamath_neoverse-n1.so | NA | 0 | NA | 0 | NA | 1 | NA | 0.00 | NA | 0.00 |
std::vector<qmcplusplus::Vector<double, qmcplusplus::Mallocator<double, 32ul> >, std::allocator<qmcplusplus::Vector<double, qmcplusplus::Mallocator<double, 32ul> > > >::_M_default_append(unsigned long) [clone .39] [clone... | exec | NA | 0 | NA | 0 | NA | 1 | NA | 0.00 | NA | 0.00 |
frexpf128 | libm-2.28.so | NA | 0 | NA | 0 | NA | 1 | NA | 0.00 | NA | 0.00 |
check_match | ld-2.28.so | 0 | NA | 0 | NA | 1 | NA | 0.00 | NA | 0.00 | NA |
pthread_self | libpthread-2.28.so | NA | 0 | NA | 0 | NA | 1 | NA | 0.00 | NA | 0.00 |
__kmp_api_omp_get_max_active_levels | libomp_with_lse.so | NA | 0 | NA | 0 | NA | 1 | NA | 0.00 | NA | 0.00 |
.omp_outlined..16 | exec | NA | 0 | NA | 0 | NA | 1 | NA | 0.00 | NA | 0.00 |
__kmp_join_barrier(int) | libomp_with_lse.so | NA | 0 | NA | 0 | NA | 1 | NA | 0.00 | NA | 0.00 |
miniqmcreference::DiracDeterminantRef<qmcplusplus::DelayedUpdate<double, double> >::completeUpdates() | exec | NA | 0 | NA | 0 | NA | 1 | NA | 0.00 | NA | 0.00 |
void std::_Destroy_aux<false>::__destroy<std::unique_ptr<qmcplusplus::TimerType<std::chrono::_V2::system_clock>, std::default_delete<qmcplusplus::TimerType<std::chrono::_V2::system_clock> > >*>(std::unique_ptr<qmcplus... | exec | NA | 0 | NA | 0 | NA | 1 | NA | 0.00 | NA | 0.00 |
dtrsm_reference_ | libarmpl_mp.so | NA | 0 | NA | 0 | NA | 6 | NA | 0.00 | NA | 0.00 |
dgerb_ | libarmpl_mp.so | NA | 0 | NA | 0 | NA | 1 | NA | 0.00 | NA | 0.00 |
ucs_async_handler_get | libucs.so.0.0.0 | NA | 0 | NA | 0 | NA | 1 | NA | 0.00 | NA | 0.00 |
kernel_dgemm_2_1_2_NT | libarmpl_mp.so | NA | 0 | NA | 0 | NA | 3 | NA | 0.00 | NA | 0.00 |
dscal_kernel | libarmpl_mp.so | NA | 0 | NA | 0 | NA | 3 | NA | 0.00 | NA | 0.00 |
void armpl::clag::(anonymous namespace)::gemv_shim<false, double, &dgemv_n_neon_kernel>(long, long, double, double const*, long, long, double const*, long, double, double*, long) | libarmpl_mp.so | NA | 0 | NA | 0 | NA | 3 | NA | 0.00 | NA | 0.00 |
void armpl::clag::blas1_axpby::operator()<double, (armpl::clag::spec::problem_type)29, armpl::clag::spec::neoverse_n1_machine_spec>(armpl::clag::spec::problem_context<double, (armpl::clag::spec::problem_type)29, armpl::clag::spec::neoverse_n1_mach... | libarmpl_mp.so | NA | 0 | NA | 0 | NA | 2 | NA | 0.00 | NA | 0.00 |
void armpl::clag::(anonymous namespace)::axpy_axpby_shim<double, &daxpy_kernel>(long, double, double const*, double, double*, long, long) | libarmpl_mp.so | NA | 0 | NA | 0 | NA | 1 | NA | 0.00 | NA | 0.00 |
kernel_dgemm_4_1_4_NT | libarmpl_mp.so | NA | 0 | NA | 0 | NA | 5 | NA | 0.00 | NA | 0.00 |
dgetrf2_ | libarmpl_mp.so | NA | 0 | NA | 0 | NA | 3 | NA | 0.01 | NA | 0.00 |
void armpl::clag::trsm<true, int, double, armpl::clag::spec::neoverse_n1_machine_spec>(char const*, char const*, char const*, char const*, int const*, int const*, double const*, double const*, int const*, double*, int const*) | libarmpl_mp.so | NA | 0 | NA | 0 | NA | 6 | NA | 0.00 | NA | 0.00 |
void armpl::clag::(anonymous namespace)::kernel_exec<void (*)(double const*, double const*, double*, long, long, long, long, double, double)>::operator()<armpl::clag::(anonymous namespace)::interleaved_matrix<double>, armpl::clag::(anonymous... | libarmpl_mp.so | NA | 0 | NA | 0 | NA | 5 | NA | 0.00 | NA | 0.00 |
ilaenv_ | libarmpl_mp.so | NA | 0 | NA | 0 | NA | 1 | NA | 0.00 | NA | 0.00 |
kernel_dgemm_6_1_6_NT | libarmpl_mp.so | NA | 0 | NA | 0 | NA | 2 | NA | 0.00 | NA | 0.00 |
kernel_dgemm_1_1_1_NN | libarmpl_mp.so | NA | 0 | NA | 0 | NA | 2 | NA | 0.00 | NA | 0.00 |
__kmp_invoke_microtask | libomp_with_lse.so | NA | 0 | NA | 0 | NA | 2 | NA | 0.00 | NA | 0.00 |
qmcplusplus::SoaDistanceTableABOMPTarget<double, 3u, 40>::resize() [clone .41] [clone .extracted] | exec | NA | 0 | NA | 0 | NA | 2 | NA | 0.00 | NA | 0.00 |
__kmpc_master | libomp_with_lse.so | NA | 0 | NA | 0 | NA | 1 | NA | 0.00 | NA | 0.00 |
kernel_dgemm_1_1_1_NT | libarmpl_mp.so | NA | 0 | NA | 0 | NA | 2 | NA | 0.00 | NA | 0.00 |
dtrsm_ | libarmpl_mp.so | NA | 0 | NA | 0 | NA | 2 | NA | 0.00 | NA | 0.00 |
void armpl::clag::triangular_solve_resident<armpl::clag::(anonymous namespace)::gemm_exec<armpl::clag::spec::neoverse_n1_machine_spec>, armpl::clag::triangular_solve_resident<armpl::clag::(anonymous namespace)::gemm_exec<armpl::clag::spec::n... | libarmpl_mp.so | NA | 0 | NA | 0 | NA | 2 | NA | 0.00 | NA | 0.00 |
void armpl::clag::gemm_basic::operator()<double, armpl::clag::spec::neoverse_n1_machine_spec>(armpl::clag::spec::problem_context<double, (armpl::clag::spec::problem_type)0, armpl::clag::spec::neoverse_n1_machine_spec> const&) const | libarmpl_mp.so | NA | 0 | NA | 0 | NA | 2 | NA | 0.00 | NA | 0.00 |
void armpl::clag::triangular_solve_resident<armpl::clag::(anonymous namespace)::gemm_exec<armpl::clag::spec::neoverse_n1_machine_spec>, armpl::clag::triangular_solve_resident<armpl::clag::(anonymous namespace)::gemm_exec<armpl::clag::spec::n... | libarmpl_mp.so | NA | 0 | NA | 0 | NA | 2 | NA | 0.00 | NA | 0.00 |
do_lookup_x | ld-2.28.so | 0 | 0 | 0 | 0 | 1 | 1 | 0.00 | 0.00 | 0.00 | 0.00 |
void armpl::clag::triangular_solve_resident<armpl::clag::(anonymous namespace)::gemm_exec<armpl::clag::spec::neoverse_n1_machine_spec>, armpl::clag::triangular_solve_resident<armpl::clag::(anonymous namespace)::gemm_exec<armpl::clag::spec::n... | libarmpl.so | 0 | NA | 0 | NA | 3 | NA | 0.00 | NA | 0.00 | NA |
__errno_location | libpthread-2.28.so | 0 | NA | 0 | NA | 1 | NA | 0.00 | NA | 0.00 | NA |
void armpl::clag::(anonymous namespace)::gemm_exec<armpl::clag::spec::neoverse_n1_machine_spec>::operator()<armpl::clag::(anonymous namespace)::triangular_matrix<armpl::clag::(anonymous namespace)::matrix_base<double const> >, armpl::c... | libarmpl.so | 0 | NA | 0 | NA | 6 | NA | 0.00 | NA | 0.00 | NA |
sincos | libm-2.28.so | 0 | 0 | 0 | 0 | 6 | 8 | 0.00 | 0.00 | 0.00 | 0.00 |
miniqmcreference::TwoBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::evaluateGL(qmcplusplus::ParticleSet&, qmcplusplus::ParticleAttrib<qmcplusplus::TinyVector<double, 3u>, std::allocator<qmcplusplus::TinyVector<double, ... | exec | 0 | 0 | 0 | 0 | 6 | 4 | 0.00 | 0.00 | 0.00 | 0.00 |
__kmpc_end_serialized_parallel | libomp_with_lse.so | 0 | 0 | 0 | 0 | 5 | 3 | 0.00 | 0.00 | 0.00 | 0.00 |
kernel_dgemm_5_1_5_NT | libarmpl.so | 0 | NA | 0 | NA | 6 | NA | 0.00 | NA | 0.00 | NA |
qmcplusplus::RealSpacePositions::setAllParticlePos(qmcplusplus::ParticleAttrib<qmcplusplus::TinyVector<double, 3u>, std::allocator<qmcplusplus::TinyVector<double, 3u> > > const&) | exec | 0 | NA | 0 | NA | 6 | NA | 0.00 | NA | 0.00 | NA |
miniqmcreference::OneBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::evaluateGL(qmcplusplus::ParticleSet&, qmcplusplus::ParticleAttrib<qmcplusplus::TinyVector<double, 3u>, std::allocator<qmcplusplus::TinyVector<double, ... | exec | 0 | 0 | 0 | 0 | 7 | 8 | 0.00 | 0.00 | 0.00 | 0.00 |
.omp_outlined..11 | exec | 0 | 0 | 0 | 0 | 8 | 3 | 0.00 | 0.00 | 0.00 | 0.00 |
void armpl::clag::(anonymous namespace)::gemv_shim<true, double, &dgemv_t_neon_kernel_serial>(long, long, double, double const*, long, long, double const*, long, double, double*, long) | libarmpl.so | 0 | NA | 0 | NA | 7 | NA | 0.00 | NA | 0.00 | NA |
void geset<double>(double, long, long, double const*, long) | libarmpl.so | 0 | NA | 0 | NA | 7 | NA | 0.01 | NA | 0.00 | NA |
__divtf3 | libgcc_s.so.1 | 0 | 0 | 0 | 0 | 6 | 4 | 0.00 | 0.00 | 0.00 | 0.00 |
kernel_dgemm_2_1_2_NT | libarmpl.so | 0 | NA | 0 | NA | 5 | NA | 0.00 | NA | 0.00 | NA |
qmcplusplus::WaveFunction::restore(int) | exec | 0 | 0 | 0 | 0 | 5 | 3 | 0.00 | 0.00 | 0.00 | 0.00 |
void armpl::clag::trsm<true, int, double, armpl::clag::spec::neoverse_n1_machine_spec>(char const*, char const*, char const*, char const*, int const*, int const*, double const*, double const*, int const*, double*, int const*) | libarmpl.so | 0 | NA | 0 | NA | 4 | NA | 0.00 | NA | 0.00 | NA |
void armpl::clag::triangular_solve_resident<armpl::clag::(anonymous namespace)::gemm_exec<armpl::clag::spec::neoverse_n1_machine_spec>, armpl::clag::(anonymous namespace)::trsm_kernel_exec<double> >::operator()<armpl::clag::(anonymous ... | libarmpl.so | 0 | NA | 0 | NA | 3 | NA | 0.01 | NA | 0.00 | NA |
kernel_dgemm_4_1_4_NT | libarmpl.so | 0 | NA | 0 | NA | 5 | NA | 0.00 | NA | 0.00 | NA |
__logl_finite | libm-2.28.so | 0 | 0 | 0 | 0 | 5 | 5 | 0.00 | 0.00 | 0.00 | 0.00 |
qmcplusplus::RealSpacePositionsOMPTarget::getAllParticlePos() const | exec | 0 | 0 | 0 | 0 | 5 | 4 | 0.00 | 0.00 | 0.00 | 0.00 |
qmcplusplus::SPOSet::evaluate_notranspose(qmcplusplus::ParticleSet const&, int, int, qmcplusplus::Matrix<double, std::allocator<double> >&, qmcplusplus::Matrix<qmcplusplus::TinyVector<double, 3u>, std::allocator<qmcplusplus:... | exec | 0 | 0 | 0 | 0 | 5 | 6 | 0.00 | 0.00 | 0.00 | 0.00 |
dtrsm_reference_ | libarmpl.so | 0 | NA | 0 | NA | 5 | NA | 0.00 | NA | 0.00 | NA |
__kmp_join_call | libomp_with_lse.so | 0 | 0 | 0 | 0 | 4 | 6 | 0.00 | 0.00 | 0.00 | 0.00 |
qmcplusplus::ParticleSet::getDistTableAA(int) const | exec | 0 | 0 | 0 | 0 | 10 | 4 | 0.00 | 0.00 | 0.00 | 0.00 |
__kmp_now_nsec | libomp_with_lse.so | 0 | 0 | 0 | 0 | 10 | 15 | 0.00 | 0.00 | 0.00 | 0.00 |
_ZZN5armpl4clag4gemmIdLNS0_4spec12problem_typeE29ENS2_24neoverse_n1_machine_specEEEvRKNS2_15problem_contextIT_XT0_ET1_EEENKUlDpRT_E_clIJKNS0_18blas3_set_or_scaleEKNS0_11gemm_atomicEKNS0_9blas1_dotEKNS0_11blas1_axpbyEKNS0_10blas3_gemvEEEEDaSD_ | libarmpl.so | 0 | NA | 0 | NA | 30 | NA | 0.00 | NA | 0.00 | NA |
_dl_tlsdesc_return | ld-2.28.so | 0 | 0 | 0 | 0 | 28 | 8 | 0.00 | 0.00 | 0.00 | 0.00 |
@plt_start@ | libomp_with_lse.so | 0 | 0 | 0 | 0 | 27 | 23 | 0.00 | 0.00 | 0.00 | 0.00 |
__kmp_yield | libomp_with_lse.so | 0 | 0 | 0 | 0 | 26 | 22 | 0.00 | 0.00 | 0.00 | 0.00 |
qmcplusplus::RealSpacePositionsOMPTarget::setOneParticlePos(qmcplusplus::TinyVector<double, 3u> const&, unsigned long) | exec | 0 | 0 | 0 | 0 | 32 | 19 | 0.00 | 0.00 | 0.00 | 0.00 |
miniqmcreference::DiracDeterminantRef<qmcplusplus::DelayedUpdate<double, double> >::evaluateRatios(qmcplusplus::VirtualParticleSet&, std::vector<double, std::allocator<double> >&) | exec | 0 | 0 | 0 | 0 | 31 | 32 | 0.00 | 0.00 | 0.00 | 0.00 |
qmcplusplus::ParticleSet::getDistTableAB(int) const | exec | 0 | 0 | 0 | 0 | 31 | 23 | 0.01 | 0.00 | 0.00 | 0.00 |
bool armpl::dispatch_atomic<double>(armpl::armpl_trans, armpl::armpl_trans, long, long, long, double const*, long, double const*, long, double*, long, double, double) | libarmpl.so | 0 | NA | 0 | NA | 31 | NA | 0.01 | NA | 0.00 | NA |
dger_ | libarmpl.so | 0 | NA | 0 | NA | 34 | NA | 0.01 | NA | 0.00 | NA |
qmcplusplus::ParticleSet::rejectMove(int) | exec | 0 | 0 | 0 | 0 | 10 | 5 | 0.00 | 0.00 | 0.00 | 0.00 |
bool armpl::clag::gemm_atomic::use<armpl::clag::spec::problem_context<double, (armpl::clag::spec::problem_type)29, armpl::clag::spec::neoverse_n1_machine_spec> >(armpl::clag::spec::problem_context<double, (armpl::clag::spec::problem_type)29,... | libarmpl.so | 0 | NA | 0 | NA | 24 | NA | 0.00 | NA | 0.00 | NA |
void armpl::clag::(anonymous namespace)::neon_interleave::operator()<double const, double>(armpl::clag::general_matrix<armpl::clag::(anonymous namespace)::matrix_base<double const> > const&, armpl::clag::(anonymous namespace)::interle... | libarmpl.so | 0 | NA | 0 | NA | 3 | NA | 0.00 | NA | 0.00 | NA |
dscal_kernel | libarmpl.so | 0 | NA | 0 | NA | 12 | NA | 0.00 | NA | 0.00 | NA |
void armpl::clag::(anonymous namespace)::c_copy<double, armpl::clag::(anonymous namespace)::kernel_exec<void (*)(double const*, double const*, double*, long, long, long, long, double, double)> >::operator()<armpl::clag::(anonymous namespace)... | libarmpl.so | 0 | NA | 0 | NA | 11 | NA | 0.00 | NA | 0.00 | NA |
qmcplusplus::SoaDistanceTableAAOMPTarget<double, 3u, 40>::evaluate(qmcplusplus::ParticleSet&) | exec | 0 | 0 | 0 | 0 | 10 | 10 | 0.00 | 0.00 | 0.00 | 0.00 |
dgemv_ | libarmpl.so | 0 | NA | 0 | NA | 24 | NA | 0.00 | NA | 0.00 | NA |
idamax_kernel | libarmpl.so | 0 | NA | 0 | NA | 11 | NA | 0.00 | NA | 0.00 | NA |
__kmp_fork_call | libomp_with_lse.so | 0 | 0 | 0 | 0 | 14 | 12 | 0.00 | 0.00 | 0.00 | 0.00 |
__kmp_serialized_parallel | libomp_with_lse.so | 0 | 0 | 0 | 0 | 11 | 7 | 0.00 | 0.00 | 0.00 | 0.00 |
qmcplusplus::DelayedUpdate<double, double>::updateInvMat(qmcplusplus::Matrix<double, std::allocator<double> >&) | exec | 0 | 0 | 0 | 0 | 15 | 16 | 0.00 | 0.00 | 0.00 | 0.00 |
pthread_spin_lock | libpthread-2.28.so | 0 | NA | 0 | NA | 1 | NA | 0.00 | NA | 0.00 | NA |
__kmpc_fork_call | libomp_with_lse.so | 0 | 0 | 0 | 0 | 4 | 7 | 0.00 | 0.00 | 0.00 | 0.00 |
kernel_dgemm_1_1_1_NN | libarmpl.so | 0 | NA | 0 | NA | 3 | NA | 0.00 | NA | 0.00 | NA |
__math_divzero | libamath_neoverse-n1.so | 0 | NA | 0 | NA | 1 | NA | 0.00 | NA | 0.00 | NA |
qmcplusplus::BlasThreadingEnv::BlasThreadingEnv(int) | exec | 0 | NA | 0 | NA | 1 | NA | 0.00 | NA | 0.00 | NA |
__kmp_api_omp_get_num_threads | libomp_with_lse.so | 0 | NA | 0 | NA | 1 | NA | 0.00 | NA | 0.00 | NA |
qmcplusplus::SoaDistanceTableABOMPTarget<double, 3u, 40>::~SoaDistanceTableABOMPTarget() | exec | 0 | NA | 0 | NA | 1 | NA | 0.00 | NA | 0.00 | NA |
operator delete(void*) | libarmpl.so | 0 | NA | 0 | NA | 1 | NA | 0.00 | NA | 0.00 | NA |
dtrsm_ | libarmpl.so | 0 | NA | 0 | NA | 1 | NA | 0.00 | NA | 0.00 | NA |
dscal_ | libarmpl.so | 0 | NA | 0 | NA | 1 | NA | 0.00 | NA | 0.00 | NA |
dgetrf_nag_ | libarmpl.so | 0 | NA | 0 | NA | 1 | NA | 0.00 | NA | 0.00 | NA |
ilaenvkernel_neoverse_n1_ | libarmpl.so | 0 | NA | 0 | NA | 1 | NA | 0.00 | NA | 0.00 | NA |
kernel_dgemm_1_1_1_NT | libarmpl.so | 0 | NA | 0 | NA | 1 | NA | 0.00 | NA | 0.00 | NA |
std::vector<qmcplusplus::VectorSoAContainer<double, 3u, qmcplusplus::Mallocator<double, 32ul> >, std::allocator<qmcplusplus::VectorSoAContainer<double, 3u, qmcplusplus::Mallocator<double, 32ul> > > >::_M_default_append(u... | exec | 0 | 0 | 0 | 0 | 1 | 1 | 0.00 | 0.00 | 0.00 | 0.00 |
qmcplusplus::TimerManager<qmcplusplus::TimerType<std::chrono::_V2::system_clock> >::pop_timer(qmcplusplus::TimerType<std::chrono::_V2::system_clock>*) | exec | 0 | NA | 0 | NA | 1 | NA | 0.00 | NA | 0.00 | NA |
uct_ud_mlx5_iface_post_recv | libuct_ib.so.0.0.0 | 0 | NA | 0 | NA | 1 | NA | 0.00 | NA | 0.00 | NA |
qmcplusplus::DistanceTable::finalizePbyP(qmcplusplus::ParticleSet const&) | exec | 0 | NA | 0 | NA | 1 | NA | 0.00 | NA | 0.00 | NA |
void qmcplusplus::expandSuperCell<qmcplusplus::ParticleSet>(qmcplusplus::ParticleSet&, qmcplusplus::Tensor<int, 3u> const&) | exec | 0 | NA | 0 | NA | 1 | NA | 0.00 | NA | 0.00 | NA |
f90_str_copy_klen | libarmflang.so | 0 | NA | 0 | NA | 1 | NA | 0.00 | NA | 0.00 | NA |
ucs_get_cpu_clocks_per_sec | libucs.so.0.0.0 | 0 | NA | 0 | NA | 1 | NA | 0.00 | NA | 0.00 | NA |
ucs_vfs_node_find_by_obj | libucs.so.0.0.0 | 0 | NA | 0 | NA | 1 | NA | 0.00 | NA | 0.00 | NA |
uct_ud_mlx5_iface_async_progress | libuct_ib.so.0.0.0 | 0 | NA | 0 | NA | 1 | NA | 0.00 | NA | 0.00 | NA |
qmcplusplus::RealSpacePositions::resize(unsigned long) | exec | 0 | 0 | 0 | 0 | 1 | 1 | 0.00 | 0.00 | 0.00 | 0.00 |
double std::generate_canonical<double, 53ul, std::mersenne_twister_engine<unsigned long, 32ul, 624ul, 397ul, 31ul, 2567483615ul, 11ul, 4294967295ul, 7ul, 2636928640ul, 15ul, 4022730752ul, 18ul, 1812433253ul> >(std::mersenne_twister_engine<un... | exec | 0 | NA | 0 | NA | 4 | NA | 0.00 | NA | 0.00 | NA |
dtrsv_reference_ | libarmpl.so | 0 | NA | 0 | NA | 1 | NA | 0.00 | NA | 0.00 | NA |
__fixunstfdi | libgcc_s.so.1 | 0 | 0 | 0 | 0 | 2 | 1 | 0.00 | 0.00 | 0.00 | 0.00 |
__kmp_resume_if_soft_paused | libomp_with_lse.so | 0 | 0 | 0 | 0 | 3 | 2 | 0.00 | 0.00 | 0.00 | 0.00 |
kernel_dgemm_6_1_6_NT | libarmpl.so | 0 | NA | 0 | NA | 2 | NA | 0.00 | NA | 0.00 | NA |
kernel_dgemm_3_1_3_NT | libarmpl.so | 0 | NA | 0 | NA | 2 | NA | 0.00 | NA | 0.00 | NA |
dgetrf2_ | libarmpl.so | 0 | NA | 0 | NA | 2 | NA | 0.00 | NA | 0.00 | NA |
__kmp_push_current_task_to_thread | libomp_with_lse.so | 0 | 0 | 0 | 0 | 3 | 4 | 0.00 | 0.00 | 0.00 | 0.00 |
void armpl::clag::(anonymous namespace)::kernel_exec<void (*)(double const*, double const*, double*, long, long, long, long, double, double)>::operator()<armpl::clag::(anonymous namespace)::interleaved_matrix<double>, armpl::clag::(anonymous... | libarmpl.so | 0 | NA | 0 | NA | 3 | NA | 0.00 | NA | 0.00 | NA |
void armpl::clag::gerb<true, int, false, double, armpl::clag::spec::neoverse_n1_machine_spec>(int const*, int const*, double const*, double const*, int const*, double const*, int const*, double const*, double*, int const*) | libarmpl.so | 0 | NA | 0 | NA | 3 | NA | 0.00 | NA | 0.00 | NA |
___kmp_allocate | libomp_with_lse.so | NA | 0 | NA | 0 | NA | 1 | NA | 0.00 | NA | 0.00 |
@plt_start@ | libamath_neoverse-n1.so | 0 | 0 | 0 | 0 | 2 | 1 | 0.00 | 0.00 | 0.00 | 0.00 |
armpl::clag::use_overrides() | libarmpl.so | 0 | NA | 0 | NA | 2 | NA | 0.00 | NA | 0.00 | NA |
void armpl::clag::(anonymous namespace)::gemv_shim<false, double, &dgemv_n_neon_kernel>(long, long, double, double const*, long, long, double const*, long, double, double*, long) | libarmpl.so | 0 | NA | 0 | NA | 2 | NA | 0.00 | NA | 0.00 | NA |
opal_mem_hooks_release_hook | libopen-pal.so.40.30.2 | 0 | 0 | 0 | 0 | 2 | 3 | 0.00 | 0.00 | 0.00 | 0.00 |
__kmpc_serialized_parallel | libomp_with_lse.so | 0 | 0 | 0 | 0 | 2 | 2 | 0.00 | 0.00 | 0.00 | 0.00 |
__kmpc_bound_num_threads | libomp_with_lse.so | 0 | 0 | 0 | 0 | 2 | 1 | 0.00 | 0.00 | 0.00 | 0.00 |
void armpl::clag::(anonymous namespace)::axpy_axpby_shim<double, &daxpy_kernel>(long, double, double const*, double, double*, long, long) | libarmpl.so | 0 | NA | 0 | NA | 2 | NA | 0.00 | NA | 0.00 | NA |
__kmpc_end_master | libomp_with_lse.so | 0 | NA | 0 | NA | 2 | NA | 0.00 | NA | 0.00 | NA |
__math_invalid | libamath_neoverse-n1.so | 0 | NA | 0 | NA | 2 | NA | 0.00 | NA | 0.00 | NA |
qmcplusplus::Vector<double, qmcplusplus::Mallocator<double, 32ul> >::~Vector() | exec | 0 | NA | 0 | NA | 2 | NA | 0.00 | NA | 0.00 | NA |
void armpl::clag::(anonymous namespace)::axpby_fallback<false, double, double, double>(long, double, double const*, double, double*, long, long) | libarmpl.so | 0 | NA | 0 | NA | 2 | NA | 0.00 | NA | 0.00 | NA |
ucs_async_handler_dispatch | libucs.so.0.0.0 | NA | 0 | NA | 0 | NA | 1 | NA | 0.00 | NA | 0.00 |