options

Profiling MPI #0 - OMP #0.18 - node ip-172-31-38-240.ec2.internal - process 8744 - thread 8832

Name | Module | Coverage (%) | Time (s)
dgemm_sve_biglibarmpl_lp64.so32.5448.71
void miniqmcreference::MultiBsplineEvalRef::evaluate_v(qmcplusplus::bspline_traits::SplineType const*, double, double, double, double*, unsigned long)+exec23.5635.28
Loop 813 - MultiBsplineRef.hpp:63-71 - exec+23.5535.26
Loop 812 - MultiBsplineRef.hpp:68-71 - exec6.089.11
Loop 810 - MultiBsplineRef.hpp:68-71 - exec6.059.06
Loop 809 - MultiBsplineRef.hpp:68-71 - exec5.868.78
Loop 811 - MultiBsplineRef.hpp:68-71 - exec5.558.32
void miniqmcreference::MultiBsplineEvalRef::evaluate_vgh(qmcplusplus::bspline_traits::SplineType const*, double, double, double, double*, double*, double*, unsigned long)+exec8.0712.09
Loop 819 - MultiBsplineRef.hpp:226-262 - exec+7.9311.87
Loop 818 - MultiBsplineRef.hpp:242-262 - exec7.9311.87
Loop 816 - MultiBsplineRef.hpp:276-286 - exec0.130.20
qmcplusplus::SoaDistanceTableAAOMPTarget::update(int)+exec7.9111.85
Loop 1794 - VectorSoAContainer.h:244-263 - exec7.9111.85
n_interleave_kernel_d8libarmpl_lp64.so6.7610.13
qmcplusplus::SoaDistanceTableABOMPTarget::evaluate(qmcplusplus::ParticleSet&)+exec4.166.22
Loop 2052 - SoaDistanceTableABOMPTarget.h:214-228 - exec+4.116.15
Loop 2053 - ParticleBConds3DSoa.h:280-298 - exec+4.116.15
Loop 2055 - ParticleBConds3DSoa.h:280-298 - exec4.116.15
void armpl::clag::gemv_a_cntg_first(long, long, double, double const*, long, long, double const*, long, double, double*, long)libarmpl_lp64.so2.063.09
void qmcplusplus::DTD_BConds::computeDistances, qmcplusplus::VectorSoAContainer >, qmcplusplus::VectorSoAContainer+exec1.512.26
Loop 1262 - ParticleBConds3DSoa.h:235-255 - exec1.512.25
miniqmcreference::TwoBodyJastrowRef >::evaluateRatios(qmcplusplus::VirtualParticleSet&, std::vector >&)+exec1.412.11
Loop 323 - BsplineFunctor.h:233-260 - exec+0.020.04
Loop 324 - BsplineFunctor.h:233-260 - exec+0.020.04
Loop 325 - BsplineFunctor.h:233-260 - exec+0.020.04
Loop 326 - BsplineFunctor.h:246-260 - exec0.020.04
auto armpl::clag::execute_strategy<15ul, std::tuplelibarmpl_lp64.so1.321.97
void armpl::clag::gemv_a_strd_first_impl, double, armpl::clag::(anonymous namespace)::step_val_fixed<1l>, double, armpl::clag::(anonymous ...libarmpl_lp64.so1.191.78
kmp_flag_64::wait(kmp_info*, int, void*)libomp.so0.771.15
miniqmcreference::TwoBodyJastrowRef >::acceptMove(qmcplusplus::ParticleSet&, int)+exec0.771.15
Loop 314 - TwoBodyJastrowRef.h:342-347 - exec0.230.35
Loop 315 - TwoBodyJastrowRef.h:342-347 - exec0.200.30
Loop 313 - TwoBodyJastrowRef.h:342-347 - exec0.170.25
Loop 316 - TwoBodyJastrowRef.h:324-331 - exec0.150.22
miniqmcreference::DiracDeterminantRef >::evaluateGL(qmcplusplus::ParticleSet&, qmcplusplus::ParticleAttrib, std::allocator > >&, qmcplusplus:...+exec0.530.79
Loop 920 - OhmmsVector.h:223-223 - exec+0.530.79
Loop 918 - inner_product.hpp:155-155 - exec0.360.53
Loop 922 - inner_product.hpp:82-155 - exec+0.170.26
Loop 919 - inner_product.hpp:82-83 - exec0.170.26
__GI___memcpy_svelibc.so.60.490.73
qmcplusplus::BsplineFunctor::evaluateVGL(int, int, int, double const*, double*, double*, double*, double*, int*) const+exec0.400.60
Loop 272 - BsplineFunctor.h:291-298 - exec0.340.51
Loop 271 - BsplineFunctor.h:303-336 - exec0.040.06
miniqmcreference::TwoBodyJastrowRef >::ratioGrad(qmcplusplus::ParticleSet&, int, qmcplusplus::TinyVector&)+exec0.350.53
Loop 300 - TwoBodyJastrowRef.h:155-156 - exec0.110.17
Loop 301 - TwoBodyJastrowRef.h:155-156 - exec0.100.16
Loop 302 - TwoBodyJastrowRef.h:155-156 - exec0.100.15
Loop 307 - stl_numeric.h:140-141 - exec0.020.03
miniqmcreference::einspline_spo_ref::evaluate(qmcplusplus::ParticleSet const&, int, qmcplusplus::Vector >&, qmcplusplus::Vector, std::allocator >...+exec0.330.49
Loop 800 - einspline_spo_ref.hpp:219-227 - exec+0.330.49
Loop 801 - einspline_spo_ref.hpp:223-227 - exec0.330.49
miniqmcreference::DiracDeterminantRef >::evalGrad(qmcplusplus::ParticleSet&, int)+exec0.320.49
Loop 910 - inner_product.hpp:155-155 - exec0.320.48
qmcplusplus::SPOSet::evaluateDetRatios(qmcplusplus::VirtualParticleSet const&, qmcplusplus::Vector >&, qmcplusplus::Vector > const&, std::vector >&)+exec0.310.46
Loop 804 - stl_vector.h:1131-1131 - exec+0.280.41
Loop 802 - inner_product.hpp:82-83 - exec0.280.41
__GI___memset_genericlibc.so.60.300.44
dswap_libarmpl_lp64.so0.160.23
auto armpl::clag::execute_strategy<16ul, std::tuplelibarmpl_lp64.so0.150.22
miniqmcreference::DiracDeterminantRef >::ratioGrad(qmcplusplus::ParticleSet&, int, qmcplusplus::TinyVector&)+exec0.140.21
Loop 912 - inner_product.hpp:82-83 - exec0.070.10
Loop 913 - inner_product.hpp:155-155 - exec0.070.10
qmcplusplus::NonLocalPP::evaluate(qmcplusplus::ParticleSet const&, qmcplusplus::WaveFunction&)exec0.100.15
kmp_flag_native::notdone_check()libomp.so0.090.14
miniqmcreference::TwoBodyJastrowRef >::recompute(qmcplusplus::ParticleSet&)+exec0.080.12
Loop 333 - TwoBodyJastrowRef.h:268-398 - exec+0.050.08
Loop 335 - TwoBodyJastrowRef.h:268-398 - exec+0.050.08
Loop 332 - TwoBodyJastrowRef.h:268-388 - exec+0.040.06
Loop 339 - TwoBodyJastrowRef.h:381-382 - exec0.020.04
Loop 337 - TwoBodyJastrowRef.h:381-382 - exec0.010.02
Loop 334 - TwoBodyJastrowRef.h:388-391 - exec0.020.03
miniqmcreference::DiracDeterminantRef >::evaluateLog(qmcplusplus::ParticleSet&, qmcplusplus::ParticleAttrib, std::allocator > >&, qmcplusplus...+exec0.070.11
Loop 906 - inner_product.hpp:82-155 - exec+0.070.11
Loop 904 - inner_product.hpp:155-155 - exec0.050.08
Loop 908 - inner_product.hpp:82-155 - exec+0.020.03
Loop 905 - inner_product.hpp:82-83 - exec0.020.03
qmcplusplus::DiracMatrix::invert_transpose(qmcplusplus::Matrix > const&, qmcplusplus::Matrix >&, double&, double&)+exec0.070.10
Loop 891 - inner_product.hpp:210-212 - exec+0.070.10
Loop 892 - inner_product.hpp:211-212 - exec0.070.10
miniqmcreference::OneBodyJastrowRef >::ratioGrad(qmcplusplus::ParticleSet&, int, qmcplusplus::TinyVector&)+exec0.050.08
Loop 224 - OneBodyJastrowRef.h:192-193 - exec0.020.03
Loop 226 - OneBodyJastrowRef.h:192-193 - exec0.010.02
qmcplusplus::BsplineFunctor::evaluateV(int, int, int, double const*, double*) const+exec0.040.06
Loop 277 - BsplineFunctor.h:236-241 - exec0.030.04
void armpl::clag::lu_unblocked_direct_kernel(long, long, double*, long, int*, int&)libarmpl_lp64.so0.030.05
qmcplusplus::TimerType::start()exec0.030.05
__GI___sched_yieldlibc.so.60.020.04
auto armpl::clag::execute_strategy<10ul, std::tuplelibarmpl_lp64.so0.020.03
qmcplusplus::WaveFunction::evalGrad(qmcplusplus::ParticleSet&, int)+exec0.020.03
Loop 114 - WaveFunction.cpp:185-188 - exec0.020.03
daxpby_sve_kernellibarmpl_lp64.so0.020.03
qmcplusplus::TimerType::stop()exec0.020.03
miniqmcreference::einspline_spo_ref::evaluate_v(qmcplusplus::ParticleSet const&, int)+exec0.020.03
Loop 808 - einspline_spo_ref.hpp:175-176 - exec0.010.02
miniqmcreference::OneBodyJastrowRef >::evaluateRatios(qmcplusplus::VirtualParticleSet&, std::vector >&)+exec0.020.03
Loop 245 - OneBodyJastrowRef.h:134-135 - exec0.020.03
×