options

Expert Summary

Columns Filter

Source Location Source Function Level Max Time Over Threads (s) Time w.r.t. Wall Time (s) Coverage (% app. time) Speedup if no scalar integer Speedup if FP arith vectorized Speedup if fully vectorized Speedup if FP only Number of paths Vectorization Ratio (%) Vector Length Use (%) Flops (GFLOP/s) CQA cycles CQA cycles if no scalar integer CQA cycles if FP arith vectorized CQA cycles if fully vectorized CQA cycles if FP only
IDModuleSource LocationSource FunctionLevelMax Time Over Threads (s)Time w.r.t. Wall Time (s)Coverage (% app. time)Speedup if no scalar integerSpeedup if FP arith vectorizedSpeedup if fully vectorizedSpeedup if FP onlyNumber of pathsVectorization Ratio (%)Vector Length Use (%)Flops (GFLOP/s)CQA cyclesCQA cycles if no scalar integerCQA cycles if FP arith vectorizedCQA cycles if fully vectorizedCQA cycles if FP only
Loop 34845libarmpl_lp64.sodgemm_sve_bigInnermost25.7225.4116.75NANANANANANANA1408.48NANANANANA
Loop 34844libarmpl_lp64.sodgemm_sve_bigInBetween22.1121.4914.16NANANANANANANA209.81NANANANANA
Loop 1794execSoaDistanceTableAAOMPTarget.h:440-442,TinyVector.h:145-145,TinyVector.h:182-182,OhmmsVector.h:223-223,VectorSoAContainer.h:244-244,VectorSoAContainer.h:263-263qmcplusplus::SoaDistanceTableAAOMPTarget::update(int)Single12.8912.508.241.101.004.003.6710.0025.000.723.673.333.670.921.00
Loop 818execMultiBsplineRef.hpp:242-262void miniqmcreference::MultiBsplineEvalRef::evaluate_vgh(qmcplusplus::bspline_traits::SplineType const*, double, double, double, double*, double*, double*, unsigned long)Innermost12.2211.697.701.001.001.001.141100.00100.00396.6912.0012.0012.0012.0010.50
Loop 37166libarmpl_lp64.son_interleave_kernel_d8Innermost10.5310.016.60NANANANANANANA0.00NANANANANA
Loop 812execMultiBsplineRef.hpp:68-71void miniqmcreference::MultiBsplineEvalRef::evaluate_v(qmcplusplus::bspline_traits::SplineType const*, double, double, double, double*, unsigned long)Innermost9.509.065.971.001.001.001.501100.00100.0086.153.003.003.003.002.00
Loop 809execMultiBsplineRef.hpp:68-71void miniqmcreference::MultiBsplineEvalRef::evaluate_v(qmcplusplus::bspline_traits::SplineType const*, double, double, double, double*, unsigned long)Innermost9.439.005.931.001.001.001.501100.00100.0086.693.003.003.003.002.00
Loop 810execMultiBsplineRef.hpp:68-71void miniqmcreference::MultiBsplineEvalRef::evaluate_v(qmcplusplus::bspline_traits::SplineType const*, double, double, double, double*, unsigned long)Innermost9.408.885.851.001.001.001.501100.00100.0087.883.003.003.003.002.00
Loop 811execMultiBsplineRef.hpp:68-71void miniqmcreference::MultiBsplineEvalRef::evaluate_v(qmcplusplus::bspline_traits::SplineType const*, double, double, double, double*, unsigned long)Innermost9.468.885.851.001.001.001.501100.00100.0088.113.003.003.003.002.00
Loop 2055execParticleBConds3DSoa.h:280-298qmcplusplus::SoaDistanceTableABOMPTarget::evaluate(qmcplusplus::ParticleSet&)Innermost6.686.244.111.001.001.001.21 - 1.21194.00100.00383.0517.0017.0017.0017.0014.00 - 14.08
Loop 1262execParticleBConds3DSoa.h:235-255void qmcplusplus::DTD_BConds::computeDistances, qmcplusplus::VectorSoAContainer >, qmcplusplus::VectorSoAContainer > >(qmcplusplus::TinyVector const&, qmcplusplus::VectorSoAContainer > const&, double*, qmcplusplus::VectorSoAContainer >&, int, int, int) constSingle2.482.231.471.001.001.001.86 - 1.85189.0489.90552.1326.0026.0026.0026.0014.00 - 14.08
Loop 303984libarmpl_lp64.sovoid armpl::clag::gemv_a_cntg_first(long, long, double, double const*, long, long, double const*, long, double, double*, long)Innermost2.402.181.44NANANANANANANA102.47NANANANANA
Loop 324execBsplineFunctor.h:236-241miniqmcreference::TwoBodyJastrowRef >::evaluateRatios(qmcplusplus::VirtualParticleSet&, std::vector >&)InBetween2.252.071.373.001.006.793.5010.0021.1531.773.501.173.500.521.00
Loop 34842libarmpl_lp64.sodgemm_sve_bigInnermost2.162.031.34NANANANANANANA1214.60NANANANANA
Loop 303664libarmpl_lp64.sovoid armpl::clag::gemv_a_strd_first_impl, double, armpl::clag::(anonymous namespace)::step_val_fixed<1l>, double, armpl::clag::(anonymous namespace)::step_val_fixed<1l>, double>(long, long, double, double const*, long, armpl::clag::(anonymous namespace)::step_val_fixed<1l>, double const*, armpl::clag::(anonymous namespace)::step_val_fixed<1l>, double, double*, armpl::clag::(anonymous namespace)::step_val_fixed<1l>) [clone .isra.0]Innermost1.381.210.80NANANANANANANA117.55NANANANANA
Loop 304781libarmpl_lp64.soauto armpl::clag::execute_strategy<15ul, std::tuple, armpl::clag::matmul::large_no_sync, armpl::clag::matmul::rank_k_update_large, armpl::clag::matmul::rank_k_update_basic, armpl::clag::matmul::rank_one_update, armpl::clag::matmul::gemm_reference, armpl::clag::matmul::symm_hemm_l_reference, armpl::clag::matmul::symm_hemm_r_reference, armpl::clag::matmul::syrk_herk_reference, armpl::clag::matmul::backstop, armpl::clag::matmul::large_no_sync >, armpl::clag::spec::problem_context >, armpl::clag::general_matrix >, armpl::clag::general_matrix >, double>, armpl::clag::spec::sve_architecture_spec> >(std::tuple, armpl::clag::matmul::large_no_sync, armpl::clag::matmul::rank_k_update_large, armpl::clag::matmul::rank_k_update_basic, armpl::clag::matmul::rank_one_update, armpl::clag::matmul::gemm_reference, armpl::clag::matmul::symm_hemm_l_reference, armpl::clag::matmul::symm_hemm_r_reference, armpl::clag::matmul::syrk_herk_reference, armpl::clag::matmul::backstop, armpl::clag::matmul::large_no_sync > const&, armpl::clag::spec::problem_context >, armpl::clag::general_matrix >, armpl::clag::general_matrix >, double>, armpl::clag::spec::sve_architecture_spec> const&)Innermost1.321.130.75NANANANANANANA0.25NANANANANA
Loop 303980libarmpl_lp64.sovoid armpl::clag::gemv_a_cntg_first(long, long, double, double const*, long, long, double const*, long, double, double*, long)Innermost1.090.940.62NANANANANANANA66.88NANANANANA
Loop 304835libarmpl_lp64.soauto armpl::clag::execute_strategy<15ul, std::tuple, armpl::clag::matmul::large_no_sync, armpl::clag::matmul::rank_k_update_large, armpl::clag::matmul::rank_k_update_basic, armpl::clag::matmul::rank_one_update, armpl::clag::matmul::gemm_reference, armpl::clag::matmul::symm_hemm_l_reference, armpl::clag::matmul::symm_hemm_r_reference, armpl::clag::matmul::syrk_herk_reference, armpl::clag::matmul::backstop, armpl::clag::matmul::large_no_sync >, armpl::clag::spec::problem_context >, armpl::clag::general_matrix >, armpl::clag::general_matrix >, double>, armpl::clag::spec::sve_architecture_spec> >(std::tuple, armpl::clag::matmul::large_no_sync, armpl::clag::matmul::rank_k_update_large, armpl::clag::matmul::rank_k_update_basic, armpl::clag::matmul::rank_one_update, armpl::clag::matmul::gemm_reference, armpl::clag::matmul::symm_hemm_l_reference, armpl::clag::matmul::symm_hemm_r_reference, armpl::clag::matmul::syrk_herk_reference, armpl::clag::matmul::backstop, armpl::clag::matmul::large_no_sync > const&, armpl::clag::spec::problem_context >, armpl::clag::general_matrix >, armpl::clag::general_matrix >, double>, armpl::clag::spec::sve_architecture_spec> const&)Innermost1.050.920.60NANANANANANANA0.17NANANANANA
Loop 918execOperatorTags.h:63-63,OperatorTags.h:94-94,inner_product.hpp:155-155miniqmcreference::DiracDeterminantRef >::evaluateGL(qmcplusplus::ParticleSet&, qmcplusplus::ParticleAttrib, std::allocator > >&, qmcplusplus::ParticleAttrib >&, bool)Innermost0.670.550.361.001.751.471.00181.8259.0965.352.002.001.141.362.00
Loop 272execBsplineFunctor.h:291-298qmcplusplus::BsplineFunctor::evaluateVGL(int, int, int, double const*, double*, double*, double*, double*, int*) constSingle0.690.550.361.251.005.001.2520.0022.9244.711.251.001.250.251.00
Loop 910execOperatorTags.h:63-63,OperatorTags.h:94-94,inner_product.hpp:155-155miniqmcreference::DiracDeterminantRef >::evalGrad(qmcplusplus::ParticleSet&, int)Single0.730.530.351.001.751.471.00181.8259.0968.112.002.001.141.362.00
Loop 802execinner_product.hpp:82-83qmcplusplus::SPOSet::evaluateDetRatios(qmcplusplus::VirtualParticleSet const&, qmcplusplus::Vector >&, qmcplusplus::Vector > const&, std::vector >&)Innermost0.580.480.321.001.001.001.00185.7189.2997.962.002.002.002.002.00
Loop 801execTinyVector.h:145-145,einspline_spo_ref.hpp:223-227,OhmmsVector.h:223-223,VectorSoAContainer.h:231-231,VectorSoAContainer.h:271-271,stl_vector.h:1131-1131,stl_algobase.h:238-238miniqmcreference::einspline_spo_ref::evaluate(qmcplusplus::ParticleSet const&, int, qmcplusplus::Vector >&, qmcplusplus::Vector, std::allocator > >&, qmcplusplus::Vector >&)Innermost0.570.470.312.331.005.257.0019.0926.140.007.003.007.001.331.00
Loop 303666libarmpl_lp64.sovoid armpl::clag::gemv_a_strd_first_impl, double, armpl::clag::(anonymous namespace)::step_val_fixed<1l>, double, armpl::clag::(anonymous namespace)::step_val_fixed<1l>, double>(long, long, double, double const*, long, armpl::clag::(anonymous namespace)::step_val_fixed<1l>, double const*, armpl::clag::(anonymous namespace)::step_val_fixed<1l>, double, double*, armpl::clag::(anonymous namespace)::step_val_fixed<1l>) [clone .isra.0]Single0.520.420.28NANANANANANANA124.77NANANANANA
Loop 314execTwoBodyJastrowRef.h:342-347miniqmcreference::TwoBodyJastrowRef >::acceptMove(qmcplusplus::ParticleSet&, int)Single0.400.330.221.001.001.001.50195.2496.4392.196.006.006.006.004.00
Loop 315execTwoBodyJastrowRef.h:342-347miniqmcreference::TwoBodyJastrowRef >::acceptMove(qmcplusplus::ParticleSet&, int)Single0.400.330.221.001.001.001.50195.2496.4391.476.006.006.006.004.00
Loop 313execTwoBodyJastrowRef.h:342-347miniqmcreference::TwoBodyJastrowRef >::acceptMove(qmcplusplus::ParticleSet&, int)Single0.420.320.211.001.001.001.50195.2496.4394.876.006.006.006.004.00
Loop 919execinner_product.hpp:82-83miniqmcreference::DiracDeterminantRef >::evaluateGL(qmcplusplus::ParticleSet&, qmcplusplus::ParticleAttrib, std::allocator > >&, qmcplusplus::ParticleAttrib >&, bool)Innermost0.390.300.201.001.001.001.00185.7189.2940.012.002.002.002.002.00
Loop 316execTwoBodyJastrowRef.h:324-331miniqmcreference::TwoBodyJastrowRef >::acceptMove(qmcplusplus::ParticleSet&, int)Single0.390.270.181.001.001.001.43197.1497.86199.6910.0010.0010.0010.007.00
Loop 303660libarmpl_lp64.sovoid armpl::clag::gemv_a_strd_first_impl, double, armpl::clag::(anonymous namespace)::step_val_fixed<1l>, double, armpl::clag::(anonymous namespace)::step_val_fixed<1l>, double>(long, long, double, double const*, long, armpl::clag::(anonymous namespace)::step_val_fixed<1l>, double const*, armpl::clag::(anonymous namespace)::step_val_fixed<1l>, double, double*, armpl::clag::(anonymous namespace)::step_val_fixed<1l>) [clone .isra.0]Innermost0.340.250.16NANANANANANANA102.85NANANANANA
Loop 42542libarmpl_lp64.sodswap_Single0.340.250.16NANANANANANANA0.00NANANANANA
Loop 816execMultiBsplineRef.hpp:276-286void miniqmcreference::MultiBsplineEvalRef::evaluate_vgh(qmcplusplus::bspline_traits::SplineType const*, double, double, double, double*, double*, double*, unsigned long)Single0.310.230.151.001.001.002.001100.00100.00280.429.009.009.009.004.50
Loop 304604libarmpl_lp64.soauto armpl::clag::execute_strategy<16ul, std::tuple, armpl::clag::matmul::large_no_sync, armpl::clag::matmul::rank_k_update_large, armpl::clag::matmul::rank_k_update_basic, armpl::clag::matmul::rank_one_update, armpl::clag::matmul::gemm_reference, armpl::clag::matmul::symm_hemm_l_reference, armpl::clag::matmul::symm_hemm_r_reference, armpl::clag::matmul::syrk_herk_reference, armpl::clag::matmul::backstop, armpl::clag::matmul::large_no_sync >, armpl::clag::spec::problem_context >, armpl::clag::general_matrix >, armpl::clag::general_matrix >, double>, armpl::clag::spec::sve_architecture_spec> >(std::tuple, armpl::clag::matmul::large_no_sync, armpl::clag::matmul::rank_k_update_large, armpl::clag::matmul::rank_k_update_basic, armpl::clag::matmul::rank_one_update, armpl::clag::matmul::gemm_reference, armpl::clag::matmul::symm_hemm_l_reference, armpl::clag::matmul::symm_hemm_r_reference, armpl::clag::matmul::syrk_herk_reference, armpl::clag::matmul::backstop, armpl::clag::matmul::large_no_sync > const&, armpl::clag::spec::problem_context >, armpl::clag::general_matrix >, armpl::clag::general_matrix >, double>, armpl::clag::spec::sve_architecture_spec> const&)Innermost0.250.190.13NANANANANANANA0.35NANANANANA
Loop 300execTwoBodyJastrowRef.h:155-156miniqmcreference::TwoBodyJastrowRef >::ratioGrad(qmcplusplus::ParticleSet&, int, qmcplusplus::TinyVector&)Single0.250.180.121.001.001.001.00185.7189.29136.362.002.002.002.002.00
Loop 301execTwoBodyJastrowRef.h:155-156miniqmcreference::TwoBodyJastrowRef >::ratioGrad(qmcplusplus::ParticleSet&, int, qmcplusplus::TinyVector&)Single0.250.170.111.001.001.001.001100.00100.00143.352.002.002.002.002.00
Loop 302execTwoBodyJastrowRef.h:155-156miniqmcreference::TwoBodyJastrowRef >::ratioGrad(qmcplusplus::ParticleSet&, int, qmcplusplus::TinyVector&)Single0.260.150.101.001.001.001.00185.7189.29156.472.002.002.002.002.00
Loop 63execNonLocalPP.hpp:126-126,NonLocalPP.hpp:129-135,OhmmsVector.h:229-229,ParticleSet.h:277-277,stl_vector.h:993-993,stl_vector.h:1131-1131,stl_vector.h:1150-1150,unique_ptr.h:193-193qmcplusplus::NonLocalPP::evaluate(qmcplusplus::ParticleSet const&, qmcplusplus::WaveFunction&)Outermost0.190.130.089.001.005.8224.0010.0022.798.146.000.676.001.030.25
Loop 912execinner_product.hpp:82-83miniqmcreference::DiracDeterminantRef >::ratioGrad(qmcplusplus::ParticleSet&, int, qmcplusplus::TinyVector&)Single0.150.090.061.001.001.001.00185.7189.29128.672.002.002.002.002.00
Loop 892execinner_product.hpp:211-212qmcplusplus::DiracMatrix::invert_transpose(qmcplusplus::Matrix > const&, qmcplusplus::Matrix >&, double&, double&)Innermost0.110.090.061.001.004.002.6710.0025.000.002.672.672.670.671.00
Loop 904execOperatorTags.h:63-63,OperatorTags.h:94-94,inner_product.hpp:155-155miniqmcreference::DiracDeterminantRef >::evaluateLog(qmcplusplus::ParticleSet&, qmcplusplus::ParticleAttrib, std::allocator > >&, qmcplusplus::ParticleAttrib >&)Innermost0.140.090.061.001.751.471.00181.8259.0984.492.002.001.141.362.00
Loop 913execOperatorTags.h:63-63,OperatorTags.h:94-94,inner_product.hpp:155-155miniqmcreference::DiracDeterminantRef >::ratioGrad(qmcplusplus::ParticleSet&, int, qmcplusplus::TinyVector&)Single0.130.080.061.001.751.471.00181.8259.09426.302.002.001.141.362.00
Loop 271execstl_vector.h:1150-1150,BsplineFunctor.h:303-336qmcplusplus::BsplineFunctor::evaluateVGL(int, int, int, double const*, double*, double*, double*, double*, int*) constSingle0.120.060.041.001.001.011.19191.1498.10607.7525.5025.5025.5025.1321.50
Loop 304833libarmpl_lp64.soauto armpl::clag::execute_strategy<15ul, std::tuple, armpl::clag::matmul::large_no_sync, armpl::clag::matmul::rank_k_update_large, armpl::clag::matmul::rank_k_update_basic, armpl::clag::matmul::rank_one_update, armpl::clag::matmul::gemm_reference, armpl::clag::matmul::symm_hemm_l_reference, armpl::clag::matmul::symm_hemm_r_reference, armpl::clag::matmul::syrk_herk_reference, armpl::clag::matmul::backstop, armpl::clag::matmul::large_no_sync >, armpl::clag::spec::problem_context >, armpl::clag::general_matrix >, armpl::clag::general_matrix >, double>, armpl::clag::spec::sve_architecture_spec> >(std::tuple, armpl::clag::matmul::large_no_sync, armpl::clag::matmul::rank_k_update_large, armpl::clag::matmul::rank_k_update_basic, armpl::clag::matmul::rank_one_update, armpl::clag::matmul::gemm_reference, armpl::clag::matmul::symm_hemm_l_reference, armpl::clag::matmul::symm_hemm_r_reference, armpl::clag::matmul::syrk_herk_reference, armpl::clag::matmul::backstop, armpl::clag::matmul::large_no_sync > const&, armpl::clag::spec::problem_context >, armpl::clag::general_matrix >, armpl::clag::general_matrix >, double>, armpl::clag::spec::sve_architecture_spec> const&)InBetween0.110.060.04NANANANANANANA0.28NANANANANA
Loop 326execstl_vector.h:1150-1150,BsplineFunctor.h:246-260miniqmcreference::TwoBodyJastrowRef >::evaluateRatios(qmcplusplus::VirtualParticleSet&, std::vector >&)Innermost0.100.060.041.001.001.031.21175.0093.75690.6714.5014.5014.5014.1312.00
Loop 277execBsplineFunctor.h:236-241qmcplusplus::BsplineFunctor::evaluateV(int, int, int, double const*, double*) constSingle0.080.050.041.801.006.006.0010.0020.836.661.500.831.500.250.25
Loop 34841libarmpl_lp64.sodgemm_sve_bigInBetween0.070.040.02NANANANANANANA1245.29NANANANANA
Loop 803execOhmmsVector.h:178-178,SPOSet.h:83-86,ParticleSet.h:277-277,stl_vector.h:1131-1131,inner_product.hpp:82-82qmcplusplus::SPOSet::evaluateDetRatios(qmcplusplus::VirtualParticleSet const&, qmcplusplus::Vector >&, qmcplusplus::Vector > const&, std::vector >&)InBetween0.070.040.021.671.005.272.1710.0023.3341.993.632.173.630.691.67
Loop 323execBsplineFunctor.h:238-241miniqmcreference::TwoBodyJastrowRef >::evaluateRatios(qmcplusplus::VirtualParticleSet&, std::vector >&)Outermost0.060.030.021.201.004.004.0010.0025.0075.251.000.831.000.250.25
Loop 2053execSoaDistanceTableABOMPTarget.h:215-215,SoaDistanceTableABOMPTarget.h:222-222,SoaDistanceTableABOMPTarget.h:228-228,ParticleBConds3DSoa.h:298-298qmcplusplus::SoaDistanceTableABOMPTarget::evaluate(qmcplusplus::ParticleSet&)InBetween0.060.030.023.151.002.433.15202.5924.03185.5126.758.5026.7511.008.50
Loop 224execOneBodyJastrowRef.h:192-193miniqmcreference::OneBodyJastrowRef >::ratioGrad(qmcplusplus::ParticleSet&, int, qmcplusplus::TinyVector&)Single0.060.030.021.001.001.001.00185.7189.2974.282.002.002.002.002.00
Loop 304754libarmpl_lp64.soauto armpl::clag::execute_strategy<15ul, std::tuple, armpl::clag::matmul::large_no_sync, armpl::clag::matmul::rank_k_update_large, armpl::clag::matmul::rank_k_update_basic, armpl::clag::matmul::rank_one_update, armpl::clag::matmul::gemm_reference, armpl::clag::matmul::symm_hemm_l_reference, armpl::clag::matmul::symm_hemm_r_reference, armpl::clag::matmul::syrk_herk_reference, armpl::clag::matmul::backstop, armpl::clag::matmul::large_no_sync >, armpl::clag::spec::problem_context >, armpl::clag::general_matrix >, armpl::clag::general_matrix >, double>, armpl::clag::spec::sve_architecture_spec> >(std::tuple, armpl::clag::matmul::large_no_sync, armpl::clag::matmul::rank_k_update_large, armpl::clag::matmul::rank_k_update_basic, armpl::clag::matmul::rank_one_update, armpl::clag::matmul::gemm_reference, armpl::clag::matmul::symm_hemm_l_reference, armpl::clag::matmul::symm_hemm_r_reference, armpl::clag::matmul::syrk_herk_reference, armpl::clag::matmul::backstop, armpl::clag::matmul::large_no_sync > const&, armpl::clag::spec::problem_context >, armpl::clag::general_matrix >, armpl::clag::general_matrix >, double>, armpl::clag::spec::sve_architecture_spec> const&)InBetween0.060.030.02NANANANANANANA8.68NANANANANA
Loop 334699libarmpl_lp64.sovoid armpl::clag::lu_unblocked_direct_kernel(long, long, double*, long, int*, int&)Innermost0.060.030.02NANANANANANANA291.17NANANANANA
Loop 307execstl_numeric.h:140-141miniqmcreference::TwoBodyJastrowRef >::ratioGrad(qmcplusplus::ParticleSet&, int, qmcplusplus::TinyVector&)Single0.050.020.021.001.001.121.00180.0085.00374.942.002.002.001.792.00
Loop 905execinner_product.hpp:82-83miniqmcreference::DiracDeterminantRef >::evaluateLog(qmcplusplus::ParticleSet&, qmcplusplus::ParticleAttrib, std::allocator > >&, qmcplusplus::ParticleAttrib >&)Innermost0.060.020.011.001.001.001.00185.7189.2984.622.002.002.002.002.00
Loop 2052execSoaDistanceTableABOMPTarget.h:214-214qmcplusplus::SoaDistanceTableABOMPTarget::evaluate(qmcplusplus::ParticleSet&)Outermost0.050.020.011.211.001.2134.002058.8263.5367.2417.0014.0017.0014.000.50
Loop 325execTwoBodyJastrowRef.h:132-132,BsplineFunctor.h:236-241,BsplineFunctor.h:246-246miniqmcreference::TwoBodyJastrowRef >::evaluateRatios(qmcplusplus::VirtualParticleSet&, std::vector >&)InBetween0.050.020.011.031.001.219.07163.7760.5129.8911.3311.0011.339.381.25
Loop 245execOneBodyJastrowRef.h:134-135,OhmmsVector.h:223-223,OhmmsVector.h:249-249,stl_vector.h:993-993,stl_vector.h:1131-1131,stl_vector.h:1150-1150miniqmcreference::OneBodyJastrowRef >::evaluateRatios(qmcplusplus::VirtualParticleSet&, std::vector >&)Single0.050.020.011.421.706.181.4210.0022.502.132.832.001.670.462.00
Loop 33845libarmpl_lp64.sodaxpby_sve_kernelSingle0.050.020.01NANANANANANANA169.83NANANANANA
Loop 813execMultiBsplineRef.hpp:63-63,MultiBsplineRef.hpp:66-68void miniqmcreference::MultiBsplineEvalRef::evaluate_v(qmcplusplus::bspline_traits::SplineType const*, double, double, double, double*, unsigned long)Outermost0.050.020.01NANANANANANANA44.93NANANANANA
Loop 226execOneBodyJastrowRef.h:192-193miniqmcreference::OneBodyJastrowRef >::ratioGrad(qmcplusplus::ParticleSet&, int, qmcplusplus::TinyVector&)Single0.040.010.01NANANANANANANA70.00NANANANANA
Loop 225execOneBodyJastrowRef.h:192-193miniqmcreference::OneBodyJastrowRef >::ratioGrad(qmcplusplus::ParticleSet&, int, qmcplusplus::TinyVector&)Single0.060.010.01NANANANANANANA77.74NANANANANA
Loop 337execTwoBodyJastrowRef.h:381-382miniqmcreference::TwoBodyJastrowRef >::recompute(qmcplusplus::ParticleSet&)Innermost0.040.010.01NANANANANANANA88.02NANANANANA
Loop 114execOperatorTags.h:94-94,WaveFunction.cpp:185-188,refwrap.h:351-351,NewTimer.h:242-242,NewTimer.h:249-249,stl_vector.h:993-993,stl_vector.h:1131-1131qmcplusplus::WaveFunction::evalGrad(qmcplusplus::ParticleSet&, int)Single0.040.010.01NANANANANANANA1.16NANANANANA
Loop 28execTinyVector.h:62-62,refwrap.h:351-351,stl_vector.h:1131-1131,miniqmc.cpp:416-416,miniqmc.cpp:429-429,miniqmc.cpp:432-434,miniqmc.cpp:437-437,miniqmc.cpp:440-443,miniqmc.cpp:446-446,miniqmc.cpp:449-454,miniqmc.cpp:457-458main.omp_outlined.62Outermost0.040.010.01NANANANANANANA0.54NANANANANA
Loop 304782libarmpl_lp64.soauto armpl::clag::execute_strategy<15ul, std::tuple, armpl::clag::matmul::large_no_sync, armpl::clag::matmul::rank_k_update_large, armpl::clag::matmul::rank_k_update_basic, armpl::clag::matmul::rank_one_update, armpl::clag::matmul::gemm_reference, armpl::clag::matmul::symm_hemm_l_reference, armpl::clag::matmul::symm_hemm_r_reference, armpl::clag::matmul::syrk_herk_reference, armpl::clag::matmul::backstop, armpl::clag::matmul::large_no_sync >, armpl::clag::spec::problem_context >, armpl::clag::general_matrix >, armpl::clag::general_matrix >, double>, armpl::clag::spec::sve_architecture_spec> >(std::tuple, armpl::clag::matmul::large_no_sync, armpl::clag::matmul::rank_k_update_large, armpl::clag::matmul::rank_k_update_basic, armpl::clag::matmul::rank_one_update, armpl::clag::matmul::gemm_reference, armpl::clag::matmul::symm_hemm_l_reference, armpl::clag::matmul::symm_hemm_r_reference, armpl::clag::matmul::syrk_herk_reference, armpl::clag::matmul::backstop, armpl::clag::matmul::large_no_sync > const&, armpl::clag::spec::problem_context >, armpl::clag::general_matrix >, armpl::clag::general_matrix >, double>, armpl::clag::spec::sve_architecture_spec> const&)InBetween0.040.010.01NANANANANANANA0.24NANANANANA
Loop 322execOhmmsVector.h:223-223,OhmmsVector.h:229-229,TwoBodyJastrowRef.h:108-108,TwoBodyJastrowRef.h:126-127,ParticleSet.h:313-313,BsplineFunctor.h:233-233,BsplineFunctor.h:236-236miniqmcreference::TwoBodyJastrowRef >::evaluateRatios(qmcplusplus::VirtualParticleSet&, std::vector >&)InBetween0.040.010.01NANANANANANANA11.74NANANANANA
Loop 338execTwoBodyJastrowRef.h:381-382miniqmcreference::TwoBodyJastrowRef >::recompute(qmcplusplus::ParticleSet&)Innermost0.060.010.01NANANANANANANA96.72NANANANANA
Loop 366398libarmpl_lp64.sovoid armpl::clag::(anonymous namespace)::trsm_kernel(double const*, long, long, double*, long, long, long, long)Single0.040.010.01NANANANANANANA75.90NANANANANA
Loop 799execstl_algo.h:709-709,einspline_spo_ref.hpp:183-187,stl_algobase.h:238-238,stl_algobase.h:413-413,stl_algobase.h:450-452miniqmcreference::einspline_spo_ref::evaluate(qmcplusplus::ParticleSet const&, int, qmcplusplus::Vector >&)Single0.040.010.01NANANANANANANA0.00NANANANANA
Loop 339execTwoBodyJastrowRef.h:381-382miniqmcreference::TwoBodyJastrowRef >::recompute(qmcplusplus::ParticleSet&)Innermost0.070.010.01NANANANANANANA87.34NANANANANA
Loop 334execTwoBodyJastrowRef.h:388-391miniqmcreference::TwoBodyJastrowRef >::recompute(qmcplusplus::ParticleSet&)Innermost0.030.010.01NANANANANANANA234.45NANANANANA
Loop 303661libarmpl_lp64.sovoid armpl::clag::gemv_a_strd_first_impl, double, armpl::clag::(anonymous namespace)::step_val_fixed<1l>, double, armpl::clag::(anonymous namespace)::step_val_fixed<1l>, double>(long, long, double, double const*, long, armpl::clag::(anonymous namespace)::step_val_fixed<1l>, double const*, armpl::clag::(anonymous namespace)::step_val_fixed<1l>, double, double*, armpl::clag::(anonymous namespace)::step_val_fixed<1l>) [clone .isra.0]Single0.040.010.00NANANANANANANA67.75NANANANANA
Loop 253execstl_algobase.h:939-940qmcplusplus::Vector, std::allocator > >::resize(unsigned long, qmcplusplus::TinyVector)Single0.030.010.00NANANANANANANA0.00NANANANANA
Loop 1113execParticleSet.cpp:242-243,stl_vector.h:993-993,unique_ptr.h:193-193qmcplusplus::ParticleSet::update(bool)Single0.030.010.00NANANANANANANA0.00NANANANANA
Loop 814execeinspline_spo_ref.hpp:206-208,VectorSoAContainer.h:265-265,stl_vector.h:1131-1131,stl_vector.h:1263-1263miniqmcreference::einspline_spo_ref::evaluate_vgh(qmcplusplus::ParticleSet const&, int)Single0.040.010.00NANANANANANANA5.82NANANANANA
Loop 64execOperatorTags.h:43-43,OperatorTags.h:63-63,TinyVector.h:144-145,NonLocalPP.hpp:131-132,OhmmsVector.h:223-223,OhmmsVector.h:229-229,VectorSoAContainer.h:231-231,stl_vector.h:993-993,stl_vector.h:1131-1131qmcplusplus::NonLocalPP::evaluate(qmcplusplus::ParticleSet const&, qmcplusplus::WaveFunction&)Innermost0.030.000.00NANANANANANANA1.01NANANANANA
Loop 249execstl_algobase.h:951-952qmcplusplus::Vector >::resize(unsigned long, double)Single0.040.000.00NANANANANANANA0.00NANANANANA
Loop 808execeinspline_spo_ref.hpp:175-176,stl_vector.h:1131-1131,stl_vector.h:1263-1263miniqmcreference::einspline_spo_ref::evaluate_v(qmcplusplus::ParticleSet const&, int)Single0.040.000.00NANANANANANANA3.97NANANANANA
Loop 119execWaveFunction.cpp:269-269,WaveFunction.cpp:272-273,refwrap.h:351-351,NewTimer.h:242-242,NewTimer.h:249-249,stl_vector.h:993-993,stl_vector.h:1131-1131qmcplusplus::WaveFunction::evaluateRatios(qmcplusplus::VirtualParticleSet&, std::vector >&)InBetween0.030.000.00NANANANANANANA0.00NANANANANA
Loop 304547libarmpl_lp64.soauto armpl::clag::execute_strategy<16ul, std::tuple, armpl::clag::matmul::large_no_sync, armpl::clag::matmul::rank_k_update_large, armpl::clag::matmul::rank_k_update_basic, armpl::clag::matmul::rank_one_update, armpl::clag::matmul::gemm_reference, armpl::clag::matmul::symm_hemm_l_reference, armpl::clag::matmul::symm_hemm_r_reference, armpl::clag::matmul::syrk_herk_reference, armpl::clag::matmul::backstop, armpl::clag::matmul::large_no_sync >, armpl::clag::spec::problem_context >, armpl::clag::general_matrix >, armpl::clag::general_matrix >, double>, armpl::clag::spec::sve_architecture_spec> >(std::tuple, armpl::clag::matmul::large_no_sync, armpl::clag::matmul::rank_k_update_large, armpl::clag::matmul::rank_k_update_basic, armpl::clag::matmul::rank_one_update, armpl::clag::matmul::gemm_reference, armpl::clag::matmul::symm_hemm_l_reference, armpl::clag::matmul::symm_hemm_r_reference, armpl::clag::matmul::syrk_herk_reference, armpl::clag::matmul::backstop, armpl::clag::matmul::large_no_sync > const&, armpl::clag::spec::problem_context >, armpl::clag::general_matrix >, armpl::clag::general_matrix >, double>, armpl::clag::spec::sve_architecture_spec> const&)Innermost0.030.000.00NANANANANANANA0.00NANANANANA
Loop 115execWaveFunction.cpp:198-201,refwrap.h:351-351,NewTimer.h:242-242,NewTimer.h:249-249,stl_vector.h:993-993,stl_vector.h:1131-1131qmcplusplus::WaveFunction::ratioGrad(qmcplusplus::ParticleSet&, int, qmcplusplus::TinyVector&)Single0.030.000.00NANANANANANANA0.00NANANANANA
Loop 321execTwoBodyJastrowRef.h:107-108,TwoBodyJastrowRef.h:126-127,refwrap.h:351-351,optional:469-469,optional:991-991,stl_vector.h:993-993,stl_vector.h:1131-1131miniqmcreference::TwoBodyJastrowRef >::evaluateRatios(qmcplusplus::VirtualParticleSet&, std::vector >&)Innermost0.040.000.00NANANANANANANA12.49NANANANANA
Loop 304756libarmpl_lp64.soauto armpl::clag::execute_strategy<15ul, std::tuple, armpl::clag::matmul::large_no_sync, armpl::clag::matmul::rank_k_update_large, armpl::clag::matmul::rank_k_update_basic, armpl::clag::matmul::rank_one_update, armpl::clag::matmul::gemm_reference, armpl::clag::matmul::symm_hemm_l_reference, armpl::clag::matmul::symm_hemm_r_reference, armpl::clag::matmul::syrk_herk_reference, armpl::clag::matmul::backstop, armpl::clag::matmul::large_no_sync >, armpl::clag::spec::problem_context >, armpl::clag::general_matrix >, armpl::clag::general_matrix >, double>, armpl::clag::spec::sve_architecture_spec> >(std::tuple, armpl::clag::matmul::large_no_sync, armpl::clag::matmul::rank_k_update_large, armpl::clag::matmul::rank_k_update_basic, armpl::clag::matmul::rank_one_update, armpl::clag::matmul::gemm_reference, armpl::clag::matmul::symm_hemm_l_reference, armpl::clag::matmul::symm_hemm_r_reference, armpl::clag::matmul::syrk_herk_reference, armpl::clag::matmul::backstop, armpl::clag::matmul::large_no_sync > const&, armpl::clag::spec::problem_context >, armpl::clag::general_matrix >, armpl::clag::general_matrix >, double>, armpl::clag::spec::sve_architecture_spec> const&)InBetween0.040.000.00NANANANANANANA41.56NANANANANA
Loop 1478execstl_tree.h:1947-1947,NewTimer.h:119-119qmcplusplus::TimerType::stop()Innermost0.170.000.00NANANANANANANA0.00NANANANANA
Loop 819execMultiBsplineRef.hpp:226-227,MultiBsplineRef.hpp:234-239,MultiBsplineRef.hpp:242-242void miniqmcreference::MultiBsplineEvalRef::evaluate_vgh(qmcplusplus::bspline_traits::SplineType const*, double, double, double, double*, double*, double*, unsigned long)Outermost0.040.000.00NANANANANANANA185.10NANANANANA
Loop 351execTwoBodyJastrowRef.h:397-398miniqmcreference::TwoBodyJastrowRef >::recompute(qmcplusplus::ParticleSet&)Innermost0.030.000.00NANANANANANANA83.43NANANANANA
Loop 354execTwoBodyJastrowRef.h:397-398miniqmcreference::TwoBodyJastrowRef >::recompute(qmcplusplus::ParticleSet&)Innermost0.020.000.00NANANANANANANA115.48NANANANANA
Loop 304018libarmpl_lp64.soauto armpl::clag::execute_strategy<11ul, std::tuple, armpl::clag::matmul::large_no_sync, armpl::clag::matmul::rank_k_update_large, armpl::clag::matmul::rank_k_update_basic, armpl::clag::matmul::rank_one_update, armpl::clag::matmul::gemm_reference, armpl::clag::matmul::symm_hemm_l_reference, armpl::clag::matmul::symm_hemm_r_reference, armpl::clag::matmul::syrk_herk_reference, armpl::clag::matmul::backstop, armpl::clag::matmul::large_no_sync >, armpl::clag::spec::problem_context >, armpl::clag::general_matrix >, armpl::clag::general_matrix >, double>, armpl::clag::spec::sve_architecture_spec> >(std::tuple, armpl::clag::matmul::large_no_sync, armpl::clag::matmul::rank_k_update_large, armpl::clag::matmul::rank_k_update_basic, armpl::clag::matmul::rank_one_update, armpl::clag::matmul::gemm_reference, armpl::clag::matmul::symm_hemm_l_reference, armpl::clag::matmul::symm_hemm_r_reference, armpl::clag::matmul::syrk_herk_reference, armpl::clag::matmul::backstop, armpl::clag::matmul::large_no_sync > const&, armpl::clag::spec::problem_context >, armpl::clag::general_matrix >, armpl::clag::general_matrix >, double>, armpl::clag::spec::sve_architecture_spec> const&)Innermost0.020.000.00NANANANANANANA127.83NANANANANA
Loop 270execOneBodyJastrowRef.h:214-219,OhmmsVector.h:223-223,shared_ptr_base.h:1667-1667,ParticleSet.h:313-313,stl_vector.h:1131-1131,stl_vector.h:1263-1263miniqmcreference::OneBodyJastrowRef >::computeU3(qmcplusplus::ParticleSet&, int, double const*)Single0.030.000.00NANANANANANANA0.88NANANANANA
Loop 304492libarmpl_lp64.soauto armpl::clag::execute_strategy<16ul, std::tuple, armpl::clag::matmul::large_no_sync, armpl::clag::matmul::rank_k_update_large, armpl::clag::matmul::rank_k_update_basic, armpl::clag::matmul::rank_one_update, armpl::clag::matmul::gemm_reference, armpl::clag::matmul::symm_hemm_l_reference, armpl::clag::matmul::symm_hemm_r_reference, armpl::clag::matmul::syrk_herk_reference, armpl::clag::matmul::backstop, armpl::clag::matmul::large_no_sync >, armpl::clag::spec::problem_context >, armpl::clag::general_matrix >, armpl::clag::general_matrix >, double>, armpl::clag::spec::sve_architecture_spec> >(std::tuple, armpl::clag::matmul::large_no_sync, armpl::clag::matmul::rank_k_update_large, armpl::clag::matmul::rank_k_update_basic, armpl::clag::matmul::rank_one_update, armpl::clag::matmul::gemm_reference, armpl::clag::matmul::symm_hemm_l_reference, armpl::clag::matmul::symm_hemm_r_reference, armpl::clag::matmul::syrk_herk_reference, armpl::clag::matmul::backstop, armpl::clag::matmul::large_no_sync > const&, armpl::clag::spec::problem_context >, armpl::clag::general_matrix >, armpl::clag::general_matrix >, double>, armpl::clag::spec::sve_architecture_spec> const&)Innermost0.020.000.00NANANANANANANA0.00NANANANANA
Loop 348execTwoBodyJastrowRef.h:397-398miniqmcreference::TwoBodyJastrowRef >::recompute(qmcplusplus::ParticleSet&)Innermost0.020.000.00NANANANANANANA109.26NANANANANA
Loop 1476execstl_tree.h:1947-1947,NewTimer.h:119-119qmcplusplus::TimerType::stop()Innermost0.080.000.00NANANANANANANA0.00NANANANANA
Loop 35071libarmpl_lp64.soddot_kernelSingle0.030.000.00NANANANANANANA35.45NANANANANA
Loop 37170libarmpl_lp64.son_interleave_kernel_d8Outermost0.030.000.00NANANANANANANA0.00NANANANANA
Loop 304032libarmpl_lp64.soauto armpl::clag::execute_strategy<10ul, std::tuple, armpl::clag::matmul::large_no_sync, armpl::clag::matmul::rank_k_update_large, armpl::clag::matmul::rank_k_update_basic, armpl::clag::matmul::rank_one_update, armpl::clag::matmul::gemm_reference, armpl::clag::matmul::symm_hemm_l_reference, armpl::clag::matmul::symm_hemm_r_reference, armpl::clag::matmul::syrk_herk_reference, armpl::clag::matmul::backstop, armpl::clag::matmul::large_no_sync >, armpl::clag::spec::problem_context >, armpl::clag::general_matrix >, armpl::clag::general_matrix >, double>, armpl::clag::spec::sve_architecture_spec> >(std::tuple, armpl::clag::matmul::large_no_sync, armpl::clag::matmul::rank_k_update_large, armpl::clag::matmul::rank_k_update_basic, armpl::clag::matmul::rank_one_update, armpl::clag::matmul::gemm_reference, armpl::clag::matmul::symm_hemm_l_reference, armpl::clag::matmul::symm_hemm_r_reference, armpl::clag::matmul::syrk_herk_reference, armpl::clag::matmul::backstop, armpl::clag::matmul::large_no_sync > const&, armpl::clag::spec::problem_context >, armpl::clag::general_matrix >, armpl::clag::general_matrix >, double>, armpl::clag::spec::sve_architecture_spec> const&)Outermost0.020.000.00NANANANANANANA0.00NANANANANA
Loop 336execTwoBodyJastrowRef.h:375-376miniqmcreference::TwoBodyJastrowRef >::recompute(qmcplusplus::ParticleSet&)Innermost0.020.000.00NANANANANANANA199.79NANANANANA
Loop 37169libarmpl_lp64.son_interleave_kernel_d8Innermost0.020.000.00NANANANANANANA0.00NANANANANA
Loop 304493libarmpl_lp64.soauto armpl::clag::execute_strategy<16ul, std::tuple, armpl::clag::matmul::large_no_sync, armpl::clag::matmul::rank_k_update_large, armpl::clag::matmul::rank_k_update_basic, armpl::clag::matmul::rank_one_update, armpl::clag::matmul::gemm_reference, armpl::clag::matmul::symm_hemm_l_reference, armpl::clag::matmul::symm_hemm_r_reference, armpl::clag::matmul::syrk_herk_reference, armpl::clag::matmul::backstop, armpl::clag::matmul::large_no_sync >, armpl::clag::spec::problem_context >, armpl::clag::general_matrix >, armpl::clag::general_matrix >, double>, armpl::clag::spec::sve_architecture_spec> >(std::tuple, armpl::clag::matmul::large_no_sync, armpl::clag::matmul::rank_k_update_large, armpl::clag::matmul::rank_k_update_basic, armpl::clag::matmul::rank_one_update, armpl::clag::matmul::gemm_reference, armpl::clag::matmul::symm_hemm_l_reference, armpl::clag::matmul::symm_hemm_r_reference, armpl::clag::matmul::syrk_herk_reference, armpl::clag::matmul::backstop, armpl::clag::matmul::large_no_sync > const&, armpl::clag::spec::problem_context >, armpl::clag::general_matrix >, armpl::clag::general_matrix >, double>, armpl::clag::spec::sve_architecture_spec> const&)InBetween0.020.000.00NANANANANANANA0.00NANANANANA
Loop 34827libarmpl_lp64.sodgemm_reference_Innermost0.020.000.00NANANANANANANA0.00NANANANANA
Loop 37167libarmpl_lp64.son_interleave_kernel_d8Innermost0.020.000.00NANANANANANANA0.00NANANANANA
Loop 303659libarmpl_lp64.sovoid armpl::clag::gemv_a_strd_first_impl, double, armpl::clag::(anonymous namespace)::step_val_fixed<1l>, double, armpl::clag::(anonymous namespace)::step_val_fixed<1l>, double>(long, long, double, double const*, long, armpl::clag::(anonymous namespace)::step_val_fixed<1l>, double const*, armpl::clag::(anonymous namespace)::step_val_fixed<1l>, double, double*, armpl::clag::(anonymous namespace)::step_val_fixed<1l>) [clone .isra.0]Outermost0.020.000.00NANANANANANANA7.95NANANANANA
Loop 303979libarmpl_lp64.sovoid armpl::clag::gemv_a_cntg_first(long, long, double, double const*, long, long, double const*, long, double, double*, long)Outermost0.020.000.00NANANANANANANA15.89NANANANANA
Loop 37168libarmpl_lp64.son_interleave_kernel_d8Innermost0.020.000.00NANANANANANANA0.00NANANANANA
×