options

Profiling MPI #0 - OMP #0.0 - node ip-172-31-38-240.ec2.internal - process 28951 - thread 28951

NameModuleCoverage (%)Time (s)
dgemm_sve_biglibarmpl_lp64.so42.0018.45
void miniqmcreference::MultiBsplineEvalRef::evaluate_v(qmcplusplus::bspline_traits::SplineType const*, double, double, double, double*, unsigned long)+exec14.496.37
Loop 813 - MultiBsplineRef.hpp:63-71 - exec+14.396.32
Loop 810 - MultiBsplineRef.hpp:68-71 - exec3.741.64
Loop 812 - MultiBsplineRef.hpp:68-71 - exec3.701.62
Loop 809 - MultiBsplineRef.hpp:68-71 - exec3.681.62
Loop 811 - MultiBsplineRef.hpp:68-71 - exec3.271.43
void miniqmcreference::MultiBsplineEvalRef::evaluate_vgh(qmcplusplus::bspline_traits::SplineType const*, double, double, double, double*, double*, double*, unsigned long)+exec12.145.34
Loop 819 - MultiBsplineRef.hpp:226-262 - exec+11.775.17
Loop 818 - MultiBsplineRef.hpp:242-262 - exec11.775.17
Loop 816 - MultiBsplineRef.hpp:276-286 - exec0.340.15
n_interleave_kernel_d8libarmpl_lp64.so6.352.79
qmcplusplus::SoaDistanceTableABOMPTarget::evaluate(qmcplusplus::ParticleSet&)+exec4.281.88
Loop 2052 - SoaDistanceTableABOMPTarget.h:214-228 - exec+4.261.87
Loop 2053 - ParticleBConds3DSoa.h:280-298 - exec+4.261.87
Loop 2055 - ParticleBConds3DSoa.h:280-298 - exec4.261.87
Loop 2057 - SoaDistanceTableABOMPTarget.h:194-196 - exec0.010.00
qmcplusplus::SoaDistanceTableAAOMPTarget::update(int)+exec3.861.69
Loop 1794 - VectorSoAContainer.h:244-263 - exec3.861.69
void qmcplusplus::DTD_BConds::computeDistances, qmcplusplus::VectorSoAContainer >, qmcplusplus::VectorSoAContainer+exec2.821.24
Loop 1262 - ParticleBConds3DSoa.h:235-255 - exec2.821.24
void armpl::clag::gemv_a_cntg_first(long, long, double, double const*, long, long, double const*, long, double, double*, long)libarmpl_lp64.so1.810.80
miniqmcreference::TwoBodyJastrowRef >::evaluateRatios(qmcplusplus::VirtualParticleSet&, std::vector >&)+exec1.400.61
Loop 323 - BsplineFunctor.h:233-260 - exec+0.110.05
Loop 324 - BsplineFunctor.h:233-260 - exec+0.110.05
Loop 325 - BsplineFunctor.h:233-260 - exec+0.110.05
Loop 326 - BsplineFunctor.h:246-260 - exec0.100.04
Loop 327 - BsplineFunctor.h:246-260 - exec0.010.00
auto armpl::clag::execute_strategy<15ul, std::tuplelibarmpl_lp64.so1.310.57
miniqmcreference::einspline_spo_ref::evaluate(qmcplusplus::ParticleSet const&, int, qmcplusplus::Vector >&, qmcplusplus::Vector, std::allocator >...+exec0.810.35
Loop 800 - einspline_spo_ref.hpp:219-227 - exec+0.800.35
Loop 801 - einspline_spo_ref.hpp:223-227 - exec0.800.35
void armpl::clag::gemv_a_strd_first_impl, double, armpl::clag::(anonymous namespace)::step_val_fixed<1l>, double, armpl::clag::(anonymous ...libarmpl_lp64.so0.680.30
miniqmcreference::TwoBodyJastrowRef >::acceptMove(qmcplusplus::ParticleSet&, int)+exec0.650.28
Loop 316 - TwoBodyJastrowRef.h:324-331 - exec0.260.12
Loop 314 - TwoBodyJastrowRef.h:342-347 - exec0.130.05
Loop 313 - TwoBodyJastrowRef.h:342-347 - exec0.130.05
Loop 315 - TwoBodyJastrowRef.h:342-347 - exec0.110.05
miniqmcreference::TwoBodyJastrowRef >::ratioGrad(qmcplusplus::ParticleSet&, int, qmcplusplus::TinyVector&)+exec0.640.28
Loop 300 - TwoBodyJastrowRef.h:155-156 - exec0.260.12
Loop 302 - TwoBodyJastrowRef.h:155-156 - exec0.130.05
Loop 301 - TwoBodyJastrowRef.h:155-156 - exec0.100.04
Loop 307 - stl_numeric.h:140-141 - exec0.100.04
Loop 308 - TwoBodyJastrowRef.h:269-274 - exec0.010.00
qmcplusplus::BsplineFunctor::evaluateVGL(int, int, int, double const*, double*, double*, double*, double*, int*) const+exec0.590.26
Loop 272 - BsplineFunctor.h:291-298 - exec0.510.22
Loop 271 - BsplineFunctor.h:303-336 - exec0.080.04
__GI___memcpy_svelibc.so.60.570.25
__GI___memset_genericlibc.so.60.560.24
dswap_libarmpl_lp64.so0.340.15
miniqmcreference::DiracDeterminantRef >::evaluateGL(qmcplusplus::ParticleSet&, qmcplusplus::ParticleAttrib, std::allocator > >&, qmcplusplus:...+exec0.310.13
Loop 920 - OhmmsVector.h:223-223 - exec+0.310.14
Loop 918 - inner_product.hpp:155-155 - exec0.230.10
Loop 922 - inner_product.hpp:82-155 - exec+0.080.04
Loop 919 - inner_product.hpp:82-83 - exec0.080.04
miniqmcreference::DiracDeterminantRef >::evalGrad(qmcplusplus::ParticleSet&, int)+exec0.270.12
Loop 910 - inner_product.hpp:155-155 - exec0.270.12
auto armpl::clag::execute_strategy<16ul, std::tuplelibarmpl_lp64.so0.220.09
miniqmcreference::DiracDeterminantRef >::ratioGrad(qmcplusplus::ParticleSet&, int, qmcplusplus::TinyVector&)+exec0.220.09
Loop 913 - inner_product.hpp:155-155 - exec0.140.06
Loop 912 - inner_product.hpp:82-83 - exec0.070.03
qmcplusplus::SPOSet::evaluateDetRatios(qmcplusplus::VirtualParticleSet const&, qmcplusplus::Vector >&, qmcplusplus::Vector > const&, std::vector >&)+exec0.220.09
Loop 804 - stl_vector.h:1131-1131 - exec+0.200.09
Loop 802 - inner_product.hpp:82-83 - exec0.200.09
miniqmcreference::TwoBodyJastrowRef >::recompute(qmcplusplus::ParticleSet&)+exec0.180.08
Loop 333 - TwoBodyJastrowRef.h:268-398 - exec+0.170.07
Loop 335 - TwoBodyJastrowRef.h:268-398 - exec+0.170.07
Loop 332 - TwoBodyJastrowRef.h:268-388 - exec+0.130.05
Loop 337 - TwoBodyJastrowRef.h:381-382 - exec0.060.03
Loop 338 - TwoBodyJastrowRef.h:381-382 - exec0.030.01
Loop 339 - TwoBodyJastrowRef.h:381-382 - exec0.010.00
Loop 344 - stl_numeric.h:140-141 - exec0.010.00
Loop 336 - TwoBodyJastrowRef.h:375-376 - exec0.010.00
Loop 334 - TwoBodyJastrowRef.h:388-391 - exec0.020.01
Loop 348 - TwoBodyJastrowRef.h:397-398 - exec0.010.00
Loop 351 - TwoBodyJastrowRef.h:397-398 - exec0.010.00
qmcplusplus::DiracMatrix::invert_transpose(qmcplusplus::Matrix > const&, qmcplusplus::Matrix >&, double&, double&)+exec0.140.06
Loop 891 - inner_product.hpp:210-212 - exec+0.140.06
Loop 892 - inner_product.hpp:211-212 - exec0.140.06
qmcplusplus::TimerType::stop()+exec0.130.05
Loop 1477 - NewTimer.h:119-119 - exec+0.030.01
Loop 1478 - stl_tree.h:1947-1947 - exec0.030.01
Loop 1475 - NewTimer.h:119-119 - exec+0.010.00
Loop 1476 - stl_tree.h:1947-1947 - exec0.010.00
qmcplusplus::BsplineAllocator >::setCoefficientsForOrbitals(int, int, Array&, multi_UBspline_3d_d*) [clone .omp_outlined]+exec0.100.04
Loop 786 - BsplineAllocator.hpp:172-180 - exec+0.100.04
Loop 790 - BsplineAllocator.hpp:179-180 - exec0.100.04
qmcplusplus::TimerType::start()exec0.080.04
__kmp_api_omp_get_levellibomp.so0.060.03
miniqmcreference::DiracDeterminantRef >::evaluateLog(qmcplusplus::ParticleSet&, qmcplusplus::ParticleAttrib, std::allocator > >&, qmcplusplus...+exec0.060.03
Loop 906 - inner_product.hpp:82-155 - exec+0.060.02
Loop 904 - inner_product.hpp:155-155 - exec0.030.01
Loop 908 - inner_product.hpp:82-155 - exec+0.020.01
Loop 905 - inner_product.hpp:82-83 - exec0.020.01
__kmp_get_global_thread_id_reglibomp.so0.050.02
main.omp_outlined.62exec0.050.02
void armpl::clag::compute_impl >, armpl::clag::general_matrix >, armpl::clag::general_...libarmpl_lp64.so0.030.01
auto armpl::clag::execute_strategy<11ul, std::tuplelibarmpl_lp64.so0.030.01
daxpby_sve_kernellibarmpl_lp64.so0.030.01
qmcplusplus::Vector, std::allocator > >::resize(unsigned long, qmcplusplus::TinyVector)+exec0.030.01
Loop 253 - stl_algobase.h:939-940 - exec0.030.01
miniqmcreference::OneBodyJastrowRef >::ratioGrad(qmcplusplus::ParticleSet&, int, qmcplusplus::TinyVector&)+exec0.030.01
Loop 224 - OneBodyJastrowRef.h:192-193 - exec0.010.00
Loop 226 - OneBodyJastrowRef.h:192-193 - exec0.010.00
qmcplusplus::NonLocalPP::evaluate(qmcplusplus::ParticleSet const&, qmcplusplus::WaveFunction&)+exec0.030.01
Loop 63 - NonLocalPP.hpp:122-135 - exec+0.010.00
Loop 64 - NonLocalPP.hpp:131-132 - exec0.010.00
void armpl::clag::lu_unblocked_direct_kernel(long, long, double*, long, int*, int&)libarmpl_lp64.so0.020.01
auto armpl::clag::spec::get_spec >, armpl::clag::general_matrix >, armpl::clag...libarmpl_lp64.so0.020.01
auto armpl::clag::execute_strategy<10ul, std::tuplelibarmpl_lp64.so0.020.01
auto armpl::clag::spec::get_spec, armpl::clag::matmul::matmul3 >, armpl::clag::general_matrixlibarmpl_lp64.so0.020.01
dgemm_reference_libarmpl_lp64.so0.020.01
qmcplusplus::SoaDistanceTableABOMPTarget::update(int)exec0.020.01
__GI___libc_malloclibc.so.60.020.01
qmcplusplus::SoaDistanceTableAAOMPTarget::move(qmcplusplus::ParticleSet const&, qmcplusplus::TinyVector const&, int, bool)exec0.020.01
miniqmcreference::einspline_spo_ref::evaluate_vgh(qmcplusplus::ParticleSet const&, int)+exec0.020.01
Loop 814 - einspline_spo_ref.hpp:206-208 - exec0.010.00
miniqmcreference::einspline_spo_ref::evaluate_v(qmcplusplus::ParticleSet const&, int)+exec0.020.01
Loop 808 - einspline_spo_ref.hpp:175-176 - exec0.010.00
__cxxabiv1::__vmi_class_type_info::__do_dyncast(long, __cxxabiv1::__class_type_info::__sub_kind, __cxxabiv1::__class_type_info const*, void const*, __cxxabiv1::__class_type_info const*, void const*, __cxxabiv1::__class_type_info::__dyncast_result&) constlibstdc++.so.6.0.330.020.01
__exp_finitelibm.so.60.020.01
qmcplusplus::BsplineFunctor::evaluateV(int, int, int, double const*, double*) const+exec0.020.01
Loop 277 - BsplineFunctor.h:236-241 - exec0.020.01
miniqmcreference::OneBodyJastrowRef >::computeU(double const*)+exec0.020.01
Loop 273 - OneBodyJastrowRef.h:143-146 - exec0.020.01
qmcplusplus::Vector >::resize(unsigned long, double)+exec0.020.01
Loop 249 - stl_algobase.h:951-952 - exec0.020.01
qmcplusplus::WaveFunction::ratioGrad(qmcplusplus::ParticleSet&, int, qmcplusplus::TinyVector&)+exec0.020.01
Loop 115 - WaveFunction.cpp:198-201 - exec0.020.01
dgemv_libarmpl_lp64.so0.010.00
__aarch64_ldadd8_acq_rellibarmpl_lp64.so0.010.00
armpl::machine::get_system_unsafe()libarmpl_lp64.so0.010.00
__GI___clock_gettimelibc.so.60.010.00
qmcplusplus::SoaDistanceTableABOMPTarget::move(qmcplusplus::ParticleSet const&, qmcplusplus::TinyVector const&, int, bool)exec0.010.00
__GI_strcmplibc.so.60.010.00
unlink_chunk.constprop.0libc.so.60.010.00
qmcplusplus::ParticleSet::makeMove(int, qmcplusplus::TinyVector const&, bool)exec0.010.00
qmcplusplus::ParticleSet::getDistTableAB(int) constexec0.010.00
qmcplusplus::Vector > >::resize(unsigned long, double)+exec0.010.00
Loop 979 - stl_algobase.h:951-952 - exec0.010.00
miniqmcreference::einspline_spo_ref::evaluate(qmcplusplus::ParticleSet const&, int, qmcplusplus::Vector >&)exec0.010.00
miniqmcreference::TwoBodyJastrowRef >::evaluateGL(qmcplusplus::ParticleSet&, qmcplusplus::ParticleAttrib, std::allocator > >&, qmcplusplus::Particle...+exec0.010.00
Loop 320 - TwoBodyJastrowRef.h:423-427 - exec0.010.00
_dl_tlsdesc_returnld-linux-aarch64.so.10.010.00
__dynamic_castlibstdc++.so.6.0.330.010.00
miniqmcreference::OneBodyJastrowRef >::computeU3(qmcplusplus::ParticleSet&, int, double const*)+exec0.010.00
Loop 270 - OneBodyJastrowRef.h:214-219 - exec0.010.00
miniqmcreference::OneBodyJastrowRef >::evalGrad(qmcplusplus::ParticleSet&, int)exec0.010.00
qmcplusplus::WaveFunction::acceptMove(qmcplusplus::ParticleSet&, int)+exec0.010.00
Loop 117 - WaveFunction.cpp:225-228 - exec0.010.00
_dl_lookup_symbol_xld-linux-aarch64.so.10.010.00
do_lookup_xld-linux-aarch64.so.10.010.00
×