options

Expert Summary

Columns Filter

Source Location Source Function Level Max Time Over Threads (s) Time w.r.t. Wall Time (s) Coverage (% app. time) Speedup if no scalar integer Speedup if FP arith vectorized Speedup if fully vectorized Speedup if FP only Number of paths Vectorization Ratio (%) Vector Length Use (%) Flops (GFLOP/s) CQA cycles CQA cycles if no scalar integer CQA cycles if FP arith vectorized CQA cycles if fully vectorized CQA cycles if FP only
IDModuleSource LocationSource FunctionLevelMax Time Over Threads (s)Time w.r.t. Wall Time (s)Coverage (% app. time)Speedup if no scalar integerSpeedup if FP arith vectorizedSpeedup if fully vectorizedSpeedup if FP onlyNumber of pathsVectorization Ratio (%)Vector Length Use (%)Flops (GFLOP/s)CQA cyclesCQA cycles if no scalar integerCQA cycles if FP arith vectorizedCQA cycles if fully vectorizedCQA cycles if FP only
Loop 914execMultiBsplineRef.hpp:68-71miniqmcreference::einspline_spo_ref::evaluate(qmcplusplus::ParticleSet const&, int, qmcplusplus::Vector >&)Innermost36.7635.7823.341.001.001.001.001100.00100.0097.876.006.006.006.006.00
Loop 34845libarmpl_lp64.sodgemm_sve_bigInnermost25.7124.9816.29NANANANANANANA1433.88NANANANANA
Loop 34844libarmpl_lp64.sodgemm_sve_bigInBetween21.5121.1313.78NANANANANANANA212.52NANANANANA
Loop 946execMultiBsplineRef.hpp:242-262miniqmcreference::einspline_spo_ref::evaluate(qmcplusplus::ParticleSet const&, int, qmcplusplus::Vector >&, qmcplusplus::Vector, std::allocator > >&, qmcplusplus::Vector >&)Innermost15.3715.129.861.091.094.001.4010.0025.00317.708.758.008.002.196.25
Loop 2426execSoaDistanceTableAAOMPTarget.h:440-442,TinyVector.h:182-182,VectorSoAContainer.h:244-244,VectorSoAContainer.h:263-263qmcplusplus::SoaDistanceTableAAOMPTarget::update(int)Single12.6512.137.911.381.004.007.3310.0025.000.757.335.337.331.831.00
Loop 37166libarmpl_lp64.son_interleave_kernel_d8Innermost10.119.736.35NANANANANANANA0.00NANANANANA
Loop 3036execSoaDistanceTableABOMPTarget.h:228-228,ParticleBConds3DSoa.h:280-298qmcplusplus::SoaDistanceTableABOMPTarget::evaluate(qmcplusplus::ParticleSet&)Innermost8.327.835.112.922.504.001.2510.0025.00306.218.753.003.502.197.00
Loop 303984libarmpl_lp64.sovoid armpl::clag::gemv_a_cntg_first(long, long, double, double const*, long, long, double const*, long, double, double*, long)Innermost2.372.201.43NANANANANANANA101.15NANANANANA
Loop 295execBsplineFunctor.h:236-241miniqmcreference::TwoBodyJastrowRef >::evaluateRatios(qmcplusplus::VirtualParticleSet&, std::vector >&)Innermost2.322.071.351.591.004.2517.0065610.0020.1934.258.505.338.502.000.50
Loop 34842libarmpl_lp64.sodgemm_sve_bigInnermost2.122.001.30NANANANANANANA1233.32NANANANANA
Loop 303664libarmpl_lp64.sovoid armpl::clag::gemv_a_strd_first_impl, double, armpl::clag::(anonymous namespace)::step_val_fixed<1l>, double, armpl::clag::(anonymous namespace)::step_val_fixed<1l>, double>(long, long, double, double const*, long, armpl::clag::(anonymous namespace)::step_val_fixed<1l>, double const*, armpl::clag::(anonymous namespace)::step_val_fixed<1l>, double, double*, armpl::clag::(anonymous namespace)::step_val_fixed<1l>) [clone .isra.0]Innermost1.411.210.79NANANANANANANA118.81NANANANANA
Loop 304781libarmpl_lp64.soauto armpl::clag::execute_strategy<15ul, std::tuple, armpl::clag::matmul::large_no_sync, armpl::clag::matmul::rank_k_update_large, armpl::clag::matmul::rank_k_update_basic, armpl::clag::matmul::rank_one_update, armpl::clag::matmul::gemm_reference, armpl::clag::matmul::symm_hemm_l_reference, armpl::clag::matmul::symm_hemm_r_reference, armpl::clag::matmul::syrk_herk_reference, armpl::clag::matmul::backstop, armpl::clag::matmul::large_no_sync >, armpl::clag::spec::problem_context >, armpl::clag::general_matrix >, armpl::clag::general_matrix >, double>, armpl::clag::spec::sve_architecture_spec> >(std::tuple, armpl::clag::matmul::large_no_sync, armpl::clag::matmul::rank_k_update_large, armpl::clag::matmul::rank_k_update_basic, armpl::clag::matmul::rank_one_update, armpl::clag::matmul::gemm_reference, armpl::clag::matmul::symm_hemm_l_reference, armpl::clag::matmul::symm_hemm_r_reference, armpl::clag::matmul::syrk_herk_reference, armpl::clag::matmul::backstop, armpl::clag::matmul::large_no_sync > const&, armpl::clag::spec::problem_context >, armpl::clag::general_matrix >, armpl::clag::general_matrix >, double>, armpl::clag::spec::sve_architecture_spec> const&)Innermost1.241.120.73NANANANANANANA0.38NANANANANA
Loop 530execTwoBodyJastrowRef.h:342-347miniqmcreference::TwoBodyJastrowRef >::acceptMove(qmcplusplus::ParticleSet&, int)Innermost1.120.950.621.001.001.001.501100.00100.00112.503.003.003.003.002.00
Loop 303980libarmpl_lp64.sovoid armpl::clag::gemv_a_cntg_first(long, long, double, double const*, long, long, double const*, long, double, double*, long)Innermost1.130.930.61NANANANANANANA67.91NANANANANA
Loop 2564execParticleBConds3DSoa.h:237-255qmcplusplus::SoaDistanceTableAAOMPTarget::move(qmcplusplus::ParticleSet const&, qmcplusplus::TinyVector const&, int, bool)Single1.080.910.591.001.001.001.21 - 1.21165.5777.87599.6817.0017.0017.0017.0014.00 - 14.08
Loop 2563execParticleBConds3DSoa.h:237-255qmcplusplus::SoaDistanceTableAAOMPTarget::move(qmcplusplus::ParticleSet const&, qmcplusplus::TinyVector const&, int, bool)Single1.100.880.581.001.001.001.21 - 1.21165.5777.87613.2017.0017.0017.0017.0014.00 - 14.08
Loop 304835libarmpl_lp64.soauto armpl::clag::execute_strategy<15ul, std::tuple, armpl::clag::matmul::large_no_sync, armpl::clag::matmul::rank_k_update_large, armpl::clag::matmul::rank_k_update_basic, armpl::clag::matmul::rank_one_update, armpl::clag::matmul::gemm_reference, armpl::clag::matmul::symm_hemm_l_reference, armpl::clag::matmul::symm_hemm_r_reference, armpl::clag::matmul::syrk_herk_reference, armpl::clag::matmul::backstop, armpl::clag::matmul::large_no_sync >, armpl::clag::spec::problem_context >, armpl::clag::general_matrix >, armpl::clag::general_matrix >, double>, armpl::clag::spec::sve_architecture_spec> >(std::tuple, armpl::clag::matmul::large_no_sync, armpl::clag::matmul::rank_k_update_large, armpl::clag::matmul::rank_k_update_basic, armpl::clag::matmul::rank_one_update, armpl::clag::matmul::gemm_reference, armpl::clag::matmul::symm_hemm_l_reference, armpl::clag::matmul::symm_hemm_r_reference, armpl::clag::matmul::syrk_herk_reference, armpl::clag::matmul::backstop, armpl::clag::matmul::large_no_sync > const&, armpl::clag::spec::problem_context >, armpl::clag::general_matrix >, armpl::clag::general_matrix >, double>, armpl::clag::spec::sve_architecture_spec> const&)Innermost1.010.880.57NANANANANANANA0.21NANANANANA
Loop 944execMultiBsplineRef.hpp:276-286miniqmcreference::einspline_spo_ref::evaluate(qmcplusplus::ParticleSet const&, int, qmcplusplus::Vector >&, qmcplusplus::Vector, std::allocator > >&, qmcplusplus::Vector >&)Innermost0.750.630.411.001.004.002.6710.0025.00104.9912.0012.0012.003.004.50
Loop 1107execOperatorTags.h:63-63,OperatorTags.h:94-94,inner_product.hpp:155-155miniqmcreference::DiracDeterminantRef >::evaluateGL(qmcplusplus::ParticleSet&, qmcplusplus::ParticleAttrib, std::allocator > >&, qmcplusplus::ParticleAttrib >&, bool)Innermost0.660.520.341.001.411.451.001100.0060.8769.194.004.002.832.764.00
Loop 229execTwoBodyJastrowRef.h:155-156miniqmcreference::TwoBodyJastrowRef >::ratioGrad(qmcplusplus::ParticleSet&, int, qmcplusplus::TinyVector&)Innermost0.690.490.321.001.001.001.001100.00100.00147.292.002.002.002.002.00
Loop 1103execOperatorTags.h:63-63,OperatorTags.h:94-94miniqmcreference::DiracDeterminantRef >::evalGrad(qmcplusplus::ParticleSet&, int)Single0.580.470.311.001.711.421.001100.0063.6476.544.004.002.332.814.00
Loop 1102execinner_product.hpp:82-83miniqmcreference::DiracDeterminantRef >::evaluateRatios(qmcplusplus::VirtualParticleSet&, std::vector >&)Innermost0.590.450.291.001.001.001.001100.00100.00107.442.002.002.002.002.00
Loop 303666libarmpl_lp64.sovoid armpl::clag::gemv_a_strd_first_impl, double, armpl::clag::(anonymous namespace)::step_val_fixed<1l>, double, armpl::clag::(anonymous namespace)::step_val_fixed<1l>, double>(long, long, double, double const*, long, armpl::clag::(anonymous namespace)::step_val_fixed<1l>, double const*, armpl::clag::(anonymous namespace)::step_val_fixed<1l>, double, double*, armpl::clag::(anonymous namespace)::step_val_fixed<1l>) [clone .isra.0]Single0.510.410.27NANANANANANANA126.70NANANANANA
Loop 1108execinner_product.hpp:82-83miniqmcreference::DiracDeterminantRef >::evaluateGL(qmcplusplus::ParticleSet&, qmcplusplus::ParticleAttrib, std::allocator > >&, qmcplusplus::ParticleAttrib >&, bool)Innermost0.390.300.201.001.001.001.001100.00100.0039.572.002.002.002.002.00
Loop 233execBsplineFunctor.h:291-298miniqmcreference::TwoBodyJastrowRef >::ratioGrad(qmcplusplus::ParticleSet&, int, qmcplusplus::TinyVector&)Innermost0.370.300.201.921.005.1313.6765610.0018.8854.2810.255.3310.252.000.75
Loop 527execstl_vector.h:1128-1128,TwoBodyJastrowRef.h:324-331miniqmcreference::TwoBodyJastrowRef >::acceptMove(qmcplusplus::ParticleSet&, int)Single0.410.300.191.001.004.001.6710.0025.00182.4713.3313.3313.333.338.00
Loop 303660libarmpl_lp64.sovoid armpl::clag::gemv_a_strd_first_impl, double, armpl::clag::(anonymous namespace)::step_val_fixed<1l>, double, armpl::clag::(anonymous namespace)::step_val_fixed<1l>, double>(long, long, double, double const*, long, armpl::clag::(anonymous namespace)::step_val_fixed<1l>, double const*, armpl::clag::(anonymous namespace)::step_val_fixed<1l>, double, double*, armpl::clag::(anonymous namespace)::step_val_fixed<1l>) [clone .isra.0]Innermost0.300.240.16NANANANANANANA105.78NANANANANA
Loop 42542libarmpl_lp64.sodswap_Single0.270.240.15NANANANANANANA0.00NANANANANA
Loop 943execTinyVector.h:145-145,einspline_spo_ref.hpp:223-227miniqmcreference::einspline_spo_ref::evaluate(qmcplusplus::ParticleSet const&, int, qmcplusplus::Vector >&, qmcplusplus::Vector, std::allocator > >&, qmcplusplus::Vector >&)Innermost0.300.200.131.001.003.6012.00111.1127.780.0012.0012.0012.003.331.00
Loop 304604libarmpl_lp64.soauto armpl::clag::execute_strategy<16ul, std::tuple, armpl::clag::matmul::large_no_sync, armpl::clag::matmul::rank_k_update_large, armpl::clag::matmul::rank_k_update_basic, armpl::clag::matmul::rank_one_update, armpl::clag::matmul::gemm_reference, armpl::clag::matmul::symm_hemm_l_reference, armpl::clag::matmul::symm_hemm_r_reference, armpl::clag::matmul::syrk_herk_reference, armpl::clag::matmul::backstop, armpl::clag::matmul::large_no_sync >, armpl::clag::spec::problem_context >, armpl::clag::general_matrix >, armpl::clag::general_matrix >, double>, armpl::clag::spec::sve_architecture_spec> >(std::tuple, armpl::clag::matmul::large_no_sync, armpl::clag::matmul::rank_k_update_large, armpl::clag::matmul::rank_k_update_basic, armpl::clag::matmul::rank_one_update, armpl::clag::matmul::gemm_reference, armpl::clag::matmul::symm_hemm_l_reference, armpl::clag::matmul::symm_hemm_r_reference, armpl::clag::matmul::syrk_herk_reference, armpl::clag::matmul::backstop, armpl::clag::matmul::large_no_sync > const&, armpl::clag::spec::problem_context >, armpl::clag::general_matrix >, armpl::clag::general_matrix >, double>, armpl::clag::spec::sve_architecture_spec> const&)Innermost0.260.190.12NANANANANANANA0.24NANANANANA
Loop 525execBsplineFunctor.h:291-298miniqmcreference::TwoBodyJastrowRef >::computeU3(qmcplusplus::ParticleSet const&, int, double const*, double*, double*, double*, bool)Innermost0.240.180.111.921.005.1313.6765610.0019.3248.7610.255.3310.252.000.75
Loop 58execOperatorTags.h:43-43,OperatorTags.h:63-63,TinyVector.h:145-145,NonLocalPP.hpp:126-126,NonLocalPP.hpp:129-135,stl_vector.h:993-993,stl_vector.h:1131-1131,OhmmsVector.h:229-229,VectorSoAContainer.h:231-231,ParticleSet.h:277-277,unique_ptr.h:193-193main._omp_fn.1InBetween0.190.140.092.041.631.396.33611.4328.938.059.504.675.836.811.50
Loop 2818execParticleBConds3DSoa.h:237-255qmcplusplus::SoaDistanceTableABOMPTarget::move(qmcplusplus::ParticleSet const&, qmcplusplus::TinyVector const&, int, bool)Single0.190.110.071.001.001.001.21 - 1.21165.5777.87423.7917.0017.0017.0017.0014.00 - 14.08
Loop 2531execParticleBConds3DSoa.h:237-255qmcplusplus::SoaDistanceTableAAOMPTarget::evaluate(qmcplusplus::ParticleSet&)Innermost0.140.090.061.001.001.001.21 - 1.21165.5777.87579.9317.0017.0017.0017.0014.00 - 14.08
Loop 1097execinner_product.hpp:82-83miniqmcreference::DiracDeterminantRef >::ratioGrad(qmcplusplus::ParticleSet&, int, qmcplusplus::TinyVector&)Single0.160.090.061.001.001.001.001100.00100.00130.592.002.002.002.002.00
Loop 1126execinner_product.hpp:211-212miniqmcreference::DiracDeterminantRef >::evaluateLog(qmcplusplus::ParticleSet&, qmcplusplus::ParticleAttrib, std::allocator > >&, qmcplusplus::ParticleAttrib >&)Innermost0.100.090.061.001.003.501.17114.2928.570.004.674.674.671.334.00
Loop 2819execParticleBConds3DSoa.h:237-255qmcplusplus::SoaDistanceTableABOMPTarget::move(qmcplusplus::ParticleSet const&, qmcplusplus::TinyVector const&, int, bool)Single0.140.080.051.001.001.001.21 - 1.21165.5777.87582.0617.0017.0017.0017.0014.00 - 14.08
Loop 1118execOperatorTags.h:63-63,OperatorTags.h:94-94,inner_product.hpp:155-155miniqmcreference::DiracDeterminantRef >::evaluateLog(qmcplusplus::ParticleSet&, qmcplusplus::ParticleAttrib, std::allocator > >&, qmcplusplus::ParticleAttrib >&)Innermost0.100.070.051.001.411.451.001100.0060.8798.104.004.002.832.764.00
Loop 752execOneBodyJastrowRef.h:192-193miniqmcreference::OneBodyJastrowRef >::ratioGrad(qmcplusplus::ParticleSet&, int, qmcplusplus::TinyVector&)Innermost0.130.070.041.001.001.001.001100.00100.00100.122.002.002.002.002.00
Loop 1096execOperatorTags.h:63-63,OperatorTags.h:94-94miniqmcreference::DiracDeterminantRef >::ratioGrad(qmcplusplus::ParticleSet&, int, qmcplusplus::TinyVector&)Single0.120.060.041.001.411.471.001100.0060.87586.534.004.002.832.714.00
Loop 304833libarmpl_lp64.soauto armpl::clag::execute_strategy<15ul, std::tuple, armpl::clag::matmul::large_no_sync, armpl::clag::matmul::rank_k_update_large, armpl::clag::matmul::rank_k_update_basic, armpl::clag::matmul::rank_one_update, armpl::clag::matmul::gemm_reference, armpl::clag::matmul::symm_hemm_l_reference, armpl::clag::matmul::symm_hemm_r_reference, armpl::clag::matmul::syrk_herk_reference, armpl::clag::matmul::backstop, armpl::clag::matmul::large_no_sync >, armpl::clag::spec::problem_context >, armpl::clag::general_matrix >, armpl::clag::general_matrix >, double>, armpl::clag::spec::sve_architecture_spec> >(std::tuple, armpl::clag::matmul::large_no_sync, armpl::clag::matmul::rank_k_update_large, armpl::clag::matmul::rank_k_update_basic, armpl::clag::matmul::rank_one_update, armpl::clag::matmul::gemm_reference, armpl::clag::matmul::symm_hemm_l_reference, armpl::clag::matmul::symm_hemm_r_reference, armpl::clag::matmul::syrk_herk_reference, armpl::clag::matmul::backstop, armpl::clag::matmul::large_no_sync > const&, armpl::clag::spec::problem_context >, armpl::clag::general_matrix >, armpl::clag::general_matrix >, double>, armpl::clag::spec::sve_architecture_spec> const&)InBetween0.140.060.04NANANANANANANA0.29NANANANANA
Loop 202execBsplineFunctor.h:236-241miniqmcreference::OneBodyJastrowRef >::evaluateRatios(qmcplusplus::VirtualParticleSet&, std::vector >&)Innermost0.090.060.041.591.004.2517.0065610.0020.1914.138.505.338.502.000.50
Loop 296execstl_vector.h:1147-1147,BsplineFunctor.h:246-260miniqmcreference::TwoBodyJastrowRef >::evaluateRatios(qmcplusplus::VirtualParticleSet&, std::vector >&)Innermost0.090.050.031.001.001.001.60175.56100.00783.8940.0040.0040.0040.0025.00
Loop 545execTwoBodyJastrowRef.h:381-382miniqmcreference::TwoBodyJastrowRef >::recompute(qmcplusplus::ParticleSet&)Innermost0.080.040.031.001.001.001.001100.00100.00156.992.002.002.002.002.00
Loop 34841libarmpl_lp64.sodgemm_sve_bigInBetween0.080.040.03NANANANANANANA1159.96NANANANANA
Loop 234execstl_vector.h:1147-1147,BsplineFunctor.h:305-336miniqmcreference::TwoBodyJastrowRef >::ratioGrad(qmcplusplus::ParticleSet&, int, qmcplusplus::TinyVector&)Innermost0.070.040.021.001.001.011.35186.7098.18564.7969.0069.0069.0068.0351.00
Loop 1100execOhmmsVector.h:178-178,OhmmsVector.h:248-249,SPOSet.h:83-86,inner_product.hpp:82-83miniqmcreference::DiracDeterminantRef >::evaluateRatios(qmcplusplus::VirtualParticleSet&, std::vector >&)Outermost0.060.030.022.381.001.833.5747.1930.1931.494.461.884.462.441.25
Loop 293execrefwrap.h:351-351,stl_vector.h:993-993,OhmmsVector.h:223-223,OhmmsVector.h:249-249,TwoBodyJastrowRef.h:107-108,TwoBodyJastrowRef.h:125-127,BsplineFunctor.h:231-231,BsplineFunctor.h:246-246,optional:991-991miniqmcreference::TwoBodyJastrowRef >::evaluateRatios(qmcplusplus::VirtualParticleSet&, std::vector >&)Outermost0.070.030.025.001.591.585.8310000120.0026.656.785.831.173.673.691.00
Loop 232execstl_algobase.h:238-238,TwoBodyJastrowRef.h:269-271,ParticleSet.h:313-313,ParticleSet.h:316-316,BsplineFunctor.h:276-276,BsplineFunctor.h:283-284,BsplineFunctor.h:291-298,BsplineFunctor.h:336-336miniqmcreference::TwoBodyJastrowRef >::ratioGrad(qmcplusplus::ParticleSet&, int, qmcplusplus::TinyVector&)Outermost0.060.030.021.101.332.0575.00100001223.8941.0429.2737.5034.0028.1318.310.50
Loop 334699libarmpl_lp64.sovoid armpl::clag::lu_unblocked_direct_kernel(long, long, double*, long, int*, int&)Innermost0.050.020.02NANANANANANANA291.52NANANANANA
Loop 541execTwoBodyJastrowRef.h:397-398miniqmcreference::TwoBodyJastrowRef >::recompute(qmcplusplus::ParticleSet&)Innermost0.050.020.021.001.001.002.001100.00100.00234.872.002.002.002.001.00
Loop 304754libarmpl_lp64.soauto armpl::clag::execute_strategy<15ul, std::tuple, armpl::clag::matmul::large_no_sync, armpl::clag::matmul::rank_k_update_large, armpl::clag::matmul::rank_k_update_basic, armpl::clag::matmul::rank_one_update, armpl::clag::matmul::gemm_reference, armpl::clag::matmul::symm_hemm_l_reference, armpl::clag::matmul::symm_hemm_r_reference, armpl::clag::matmul::syrk_herk_reference, armpl::clag::matmul::backstop, armpl::clag::matmul::large_no_sync >, armpl::clag::spec::problem_context >, armpl::clag::general_matrix >, armpl::clag::general_matrix >, double>, armpl::clag::spec::sve_architecture_spec> >(std::tuple, armpl::clag::matmul::large_no_sync, armpl::clag::matmul::rank_k_update_large, armpl::clag::matmul::rank_k_update_basic, armpl::clag::matmul::rank_one_update, armpl::clag::matmul::gemm_reference, armpl::clag::matmul::symm_hemm_l_reference, armpl::clag::matmul::symm_hemm_r_reference, armpl::clag::matmul::syrk_herk_reference, armpl::clag::matmul::backstop, armpl::clag::matmul::large_no_sync > const&, armpl::clag::spec::problem_context >, armpl::clag::general_matrix >, armpl::clag::general_matrix >, double>, armpl::clag::spec::sve_architecture_spec> const&)InBetween0.050.020.02NANANANANANANA4.46NANANANANA
Loop 550execBsplineFunctor.h:291-298miniqmcreference::TwoBodyJastrowRef >::recompute(qmcplusplus::ParticleSet&)Innermost0.050.020.011.921.005.1313.6765610.0018.8858.5310.255.3310.252.000.75
Loop 199execOneBodyJastrowRef.h:134-135,OneBodyJastrowRef.h:140-141,OneBodyJastrowRef.h:151-151,OneBodyJastrowRef.h:154-155,stl_vector.h:993-993,stl_vector.h:1128-1128,stl_vector.h:1131-1131,OhmmsVector.h:223-223,OhmmsVector.h:229-229,OhmmsVector.h:249-249,BsplineFunctor.h:166-173,BsplineFunctor.h:179-182,BsplineFunctor.h:246-246miniqmcreference::OneBodyJastrowRef >::evaluateRatios(qmcplusplus::VirtualParticleSet&, std::vector >&)Outermost0.040.020.011.871.351.731.87100001211.4829.925.5812.136.509.007.026.50
Loop 231execstl_numeric.h:140-141miniqmcreference::TwoBodyJastrowRef >::ratioGrad(qmcplusplus::ParticleSet&, int, qmcplusplus::TinyVector&)Single0.050.020.011.001.001.001.001100.00100.00367.542.002.002.002.002.00
Loop 1117execinner_product.hpp:82-83miniqmcreference::DiracDeterminantRef >::evaluateLog(qmcplusplus::ParticleSet&, qmcplusplus::ParticleAttrib, std::allocator > >&, qmcplusplus::ParticleAttrib >&)Innermost0.050.020.011.001.001.001.001100.00100.0086.502.002.002.002.002.00
Loop 294execTwoBodyJastrowRef.h:127-129,TwoBodyJastrowRef.h:132-132,ParticleSet.h:313-313,ParticleSet.h:316-316,BsplineFunctor.h:232-232,BsplineFunctor.h:236-241,BsplineFunctor.h:246-246,BsplineFunctor.h:259-260miniqmcreference::TwoBodyJastrowRef >::evaluateRatios(qmcplusplus::VirtualParticleSet&, std::vector >&)InBetween0.050.020.011.281.011.238.7910000124.2323.2838.5515.3812.0015.2812.501.75
Loop 33845libarmpl_lp64.sodaxpby_sve_kernelSingle0.050.020.01NANANANANANANA185.26NANANANANA
Loop 913execstl_algobase.h:951-952,MultiBsplineEvalHelper.hpp:53-53,MultiBsplineEvalHelper.hpp:60-63,einspline_spo_ref.hpp:175-176,stl_vector.h:1263-1263,MultiBsplineRef.hpp:42-44,MultiBsplineRef.hpp:47-49,MultiBsplineRef.hpp:57-58,MultiBsplineRef.hpp:66-68,MultiBsplineData.hpp:54-57miniqmcreference::einspline_spo_ref::evaluate(qmcplusplus::ParticleSet const&, int, qmcplusplus::Vector >&)Outermost0.040.020.01NANANANANANANA55.40NANANANANA
Loop 526execstl_vector.h:1147-1147,BsplineFunctor.h:305-336miniqmcreference::TwoBodyJastrowRef >::computeU3(qmcplusplus::ParticleSet const&, int, double const*, double*, double*, double*, bool)Innermost0.050.010.01NANANANANANANA418.15NANANANANA
Loop 3034execOMPTargetMath.hpp:38-38,SoaDistanceTableABOMPTarget.h:215-215,SoaDistanceTableABOMPTarget.h:218-218,SoaDistanceTableABOMPTarget.h:222-222,SoaDistanceTableABOMPTarget.h:228-228,ParticleBConds3DSoa.h:284-286,ParticleBConds3DSoa.h:294-296qmcplusplus::SoaDistanceTableABOMPTarget::evaluate(qmcplusplus::ParticleSet&)InBetween0.050.010.01NANANANANANANA126.81NANANANANA
Loop 139execOperatorTags.h:94-94,WaveFunction.cpp:185-188,refwrap.h:351-351,stl_vector.h:993-993,stl_vector.h:1128-1128,NewTimer.h:242-242,NewTimer.h:249-249qmcplusplus::WaveFunction::evalGrad(qmcplusplus::ParticleSet&, int)Single0.040.010.01NANANANANANANA0.52NANANANANA
Loop 915execMultiBsplineRef.hpp:64-66miniqmcreference::einspline_spo_ref::evaluate(qmcplusplus::ParticleSet const&, int, qmcplusplus::Vector >&)InBetween0.050.010.01NANANANANANANA196.53NANANANANA
Loop 366398libarmpl_lp64.sovoid armpl::clag::(anonymous namespace)::trsm_kernel(double const*, long, long, double*, long, long, long, long)Single0.040.010.01NANANANANANANA69.42NANANANANA
Loop 304782libarmpl_lp64.soauto armpl::clag::execute_strategy<15ul, std::tuple, armpl::clag::matmul::large_no_sync, armpl::clag::matmul::rank_k_update_large, armpl::clag::matmul::rank_k_update_basic, armpl::clag::matmul::rank_one_update, armpl::clag::matmul::gemm_reference, armpl::clag::matmul::symm_hemm_l_reference, armpl::clag::matmul::symm_hemm_r_reference, armpl::clag::matmul::syrk_herk_reference, armpl::clag::matmul::backstop, armpl::clag::matmul::large_no_sync >, armpl::clag::spec::problem_context >, armpl::clag::general_matrix >, armpl::clag::general_matrix >, double>, armpl::clag::spec::sve_architecture_spec> >(std::tuple, armpl::clag::matmul::large_no_sync, armpl::clag::matmul::rank_k_update_large, armpl::clag::matmul::rank_k_update_basic, armpl::clag::matmul::rank_one_update, armpl::clag::matmul::gemm_reference, armpl::clag::matmul::symm_hemm_l_reference, armpl::clag::matmul::symm_hemm_r_reference, armpl::clag::matmul::syrk_herk_reference, armpl::clag::matmul::backstop, armpl::clag::matmul::large_no_sync > const&, armpl::clag::spec::problem_context >, armpl::clag::general_matrix >, armpl::clag::general_matrix >, double>, armpl::clag::spec::sve_architecture_spec> const&)InBetween0.040.010.01NANANANANANANA0.59NANANANANA
Loop 542execTwoBodyJastrowRef.h:388-391miniqmcreference::TwoBodyJastrowRef >::recompute(qmcplusplus::ParticleSet&)Innermost0.040.010.00NANANANANANANA207.17NANANANANA
Loop 912execstl_algobase.h:238-238,stl_algobase.h:413-413,stl_algobase.h:451-452,einspline_spo_ref.hpp:183-187,stl_algo.h:683-683,stl_algo.h:709-709,stl_vector.h:1263-1263miniqmcreference::einspline_spo_ref::evaluate(qmcplusplus::ParticleSet const&, int, qmcplusplus::Vector >&)Single0.040.010.00NANANANANANANA0.00NANANANANA
Loop 26execTinyVector.h:62-62,refwrap.h:351-351,stl_vector.h:1131-1131,miniqmc.cpp:429-458main._omp_fn.1Innermost0.040.010.00NANANANANANANA0.72NANANANANA
Loop 1158execstl_algobase.h:939-940miniqmcreference::DiracDeterminantRef >::resize(int, int)Innermost0.030.010.00NANANANANANANA0.00NANANANANA
Loop 303661libarmpl_lp64.sovoid armpl::clag::gemv_a_strd_first_impl, double, armpl::clag::(anonymous namespace)::step_val_fixed<1l>, double, armpl::clag::(anonymous namespace)::step_val_fixed<1l>, double>(long, long, double, double const*, long, armpl::clag::(anonymous namespace)::step_val_fixed<1l>, double const*, armpl::clag::(anonymous namespace)::step_val_fixed<1l>, double, double*, armpl::clag::(anonymous namespace)::step_val_fixed<1l>) [clone .isra.0]Single0.030.000.00NANANANANANANA68.85NANANANANA
Loop 524execstl_algobase.h:238-238,TwoBodyJastrowRef.h:269-271,ParticleSet.h:313-313,ParticleSet.h:316-316,BsplineFunctor.h:276-276,BsplineFunctor.h:283-284,BsplineFunctor.h:291-298,BsplineFunctor.h:336-336miniqmcreference::TwoBodyJastrowRef >::computeU3(qmcplusplus::ParticleSet const&, int, double const*, double*, double*, double*, bool)Outermost0.040.000.00NANANANANANANA19.85NANANANANA
Loop 201execOneBodyJastrowRef.h:143-146,shared_ptr_base.h:1667-1667,OhmmsVector.h:223-223,ParticleSet.h:313-313,ParticleSet.h:316-316,BsplineFunctor.h:231-232,BsplineFunctor.h:236-241,BsplineFunctor.h:246-246,BsplineFunctor.h:259-260miniqmcreference::OneBodyJastrowRef >::evaluateRatios(qmcplusplus::VirtualParticleSet&, std::vector >&)InBetween0.040.000.00NANANANANANANA5.47NANANANANA
Loop 945execstl_algobase.h:951-952,MultiBsplineEvalHelper.hpp:53-56,MultiBsplineEvalHelper.hpp:60-63,MultiBsplineEvalHelper.hpp:66-66,einspline_spo_ref.hpp:206-207,einspline_spo_ref.hpp:230-230,stl_vector.h:1263-1263,VectorSoAContainer.h:265-265,MultiBsplineRef.hpp:187-192,MultiBsplineRef.hpp:199-200,MultiBsplineRef.hpp:205-206,MultiBsplineRef.hpp:209-213,MultiBsplineRef.hpp:229-230,MultiBsplineRef.hpp:269-286,MultiBsplineData.hpp:68-79miniqmcreference::einspline_spo_ref::evaluate(qmcplusplus::ParticleSet const&, int, qmcplusplus::Vector >&, qmcplusplus::Vector, std::allocator > >&, qmcplusplus::Vector >&)Outermost0.030.000.00NANANANANANANA10.76NANANANANA
Loop 1968execNewTimer.h:119-119,stl_tree.h:786-786,stl_tree.h:1947-1949qmcplusplus::TimerType::stop()Single0.220.000.00NANANANANANANA0.35NANANANANA
Loop 145execWaveFunction.cpp:269-269,WaveFunction.cpp:272-274,refwrap.h:351-351,stl_vector.h:992-993,stl_vector.h:1131-1131,NewTimer.h:242-242,NewTimer.h:249-249qmcplusplus::WaveFunction::evaluateRatios(qmcplusplus::VirtualParticleSet&, std::vector >&)Outermost0.040.000.00NANANANANANANA0.00NANANANANA
Loop 1377execParticleSet.cpp:242-243,stl_vector.h:993-993,unique_ptr.h:193-193qmcplusplus::ParticleSet::update(bool)Single0.030.000.00NANANANANANANA0.00NANANANANA
Loop 916execMultiBsplineRef.hpp:63-66miniqmcreference::einspline_spo_ref::evaluate(qmcplusplus::ParticleSet const&, int, qmcplusplus::Vector >&)InBetween0.040.000.00NANANANANANANA104.35NANANANANA
Loop 1964execNewTimer.h:119-119,stl_tree.h:786-786,stl_tree.h:1947-1949qmcplusplus::TimerType::stop()Single0.130.000.00NANANANANANANA0.00NANANANANA
Loop 304018libarmpl_lp64.soauto armpl::clag::execute_strategy<11ul, std::tuple, armpl::clag::matmul::large_no_sync, armpl::clag::matmul::rank_k_update_large, armpl::clag::matmul::rank_k_update_basic, armpl::clag::matmul::rank_one_update, armpl::clag::matmul::gemm_reference, armpl::clag::matmul::symm_hemm_l_reference, armpl::clag::matmul::symm_hemm_r_reference, armpl::clag::matmul::syrk_herk_reference, armpl::clag::matmul::backstop, armpl::clag::matmul::large_no_sync >, armpl::clag::spec::problem_context >, armpl::clag::general_matrix >, armpl::clag::general_matrix >, double>, armpl::clag::spec::sve_architecture_spec> >(std::tuple, armpl::clag::matmul::large_no_sync, armpl::clag::matmul::rank_k_update_large, armpl::clag::matmul::rank_k_update_basic, armpl::clag::matmul::rank_one_update, armpl::clag::matmul::gemm_reference, armpl::clag::matmul::symm_hemm_l_reference, armpl::clag::matmul::symm_hemm_r_reference, armpl::clag::matmul::syrk_herk_reference, armpl::clag::matmul::backstop, armpl::clag::matmul::large_no_sync > const&, armpl::clag::spec::problem_context >, armpl::clag::general_matrix >, armpl::clag::general_matrix >, double>, armpl::clag::spec::sve_architecture_spec> const&)Innermost0.020.000.00NANANANANANANA98.92NANANANANA
Loop 304547libarmpl_lp64.soauto armpl::clag::execute_strategy<16ul, std::tuple, armpl::clag::matmul::large_no_sync, armpl::clag::matmul::rank_k_update_large, armpl::clag::matmul::rank_k_update_basic, armpl::clag::matmul::rank_one_update, armpl::clag::matmul::gemm_reference, armpl::clag::matmul::symm_hemm_l_reference, armpl::clag::matmul::symm_hemm_r_reference, armpl::clag::matmul::syrk_herk_reference, armpl::clag::matmul::backstop, armpl::clag::matmul::large_no_sync >, armpl::clag::spec::problem_context >, armpl::clag::general_matrix >, armpl::clag::general_matrix >, double>, armpl::clag::spec::sve_architecture_spec> >(std::tuple, armpl::clag::matmul::large_no_sync, armpl::clag::matmul::rank_k_update_large, armpl::clag::matmul::rank_k_update_basic, armpl::clag::matmul::rank_one_update, armpl::clag::matmul::gemm_reference, armpl::clag::matmul::symm_hemm_l_reference, armpl::clag::matmul::symm_hemm_r_reference, armpl::clag::matmul::syrk_herk_reference, armpl::clag::matmul::backstop, armpl::clag::matmul::large_no_sync > const&, armpl::clag::spec::problem_context >, armpl::clag::general_matrix >, armpl::clag::general_matrix >, double>, armpl::clag::spec::sve_architecture_spec> const&)Innermost0.030.000.00NANANANANANANA0.00NANANANANA
Loop 304756libarmpl_lp64.soauto armpl::clag::execute_strategy<15ul, std::tuple, armpl::clag::matmul::large_no_sync, armpl::clag::matmul::rank_k_update_large, armpl::clag::matmul::rank_k_update_basic, armpl::clag::matmul::rank_one_update, armpl::clag::matmul::gemm_reference, armpl::clag::matmul::symm_hemm_l_reference, armpl::clag::matmul::symm_hemm_r_reference, armpl::clag::matmul::syrk_herk_reference, armpl::clag::matmul::backstop, armpl::clag::matmul::large_no_sync >, armpl::clag::spec::problem_context >, armpl::clag::general_matrix >, armpl::clag::general_matrix >, double>, armpl::clag::spec::sve_architecture_spec> >(std::tuple, armpl::clag::matmul::large_no_sync, armpl::clag::matmul::rank_k_update_large, armpl::clag::matmul::rank_k_update_basic, armpl::clag::matmul::rank_one_update, armpl::clag::matmul::gemm_reference, armpl::clag::matmul::symm_hemm_l_reference, armpl::clag::matmul::symm_hemm_r_reference, armpl::clag::matmul::syrk_herk_reference, armpl::clag::matmul::backstop, armpl::clag::matmul::large_no_sync > const&, armpl::clag::spec::problem_context >, armpl::clag::general_matrix >, armpl::clag::general_matrix >, double>, armpl::clag::spec::sve_architecture_spec> const&)InBetween0.040.000.00NANANANANANANA32.49NANANANANA
Loop 140execWaveFunction.cpp:198-201,refwrap.h:351-351,stl_vector.h:993-993,NewTimer.h:242-242,NewTimer.h:249-249qmcplusplus::WaveFunction::ratioGrad(qmcplusplus::ParticleSet&, int, qmcplusplus::TinyVector&)Single0.030.000.00NANANANANANANA0.00NANANANANA
Loop 192execOneBodyJastrowRef.h:214-218,stl_vector.h:1131-1131,shared_ptr_base.h:1667-1667,OhmmsVector.h:223-223,ParticleSet.h:316-316miniqmcreference::OneBodyJastrowRef >::computeU3(qmcplusplus::ParticleSet&, int, double const*) [clone .isra.0]Single0.030.000.00NANANANANANANA1.86NANANANANA
Loop 304492libarmpl_lp64.soauto armpl::clag::execute_strategy<16ul, std::tuple, armpl::clag::matmul::large_no_sync, armpl::clag::matmul::rank_k_update_large, armpl::clag::matmul::rank_k_update_basic, armpl::clag::matmul::rank_one_update, armpl::clag::matmul::gemm_reference, armpl::clag::matmul::symm_hemm_l_reference, armpl::clag::matmul::symm_hemm_r_reference, armpl::clag::matmul::syrk_herk_reference, armpl::clag::matmul::backstop, armpl::clag::matmul::large_no_sync >, armpl::clag::spec::problem_context >, armpl::clag::general_matrix >, armpl::clag::general_matrix >, double>, armpl::clag::spec::sve_architecture_spec> >(std::tuple, armpl::clag::matmul::large_no_sync, armpl::clag::matmul::rank_k_update_large, armpl::clag::matmul::rank_k_update_basic, armpl::clag::matmul::rank_one_update, armpl::clag::matmul::gemm_reference, armpl::clag::matmul::symm_hemm_l_reference, armpl::clag::matmul::symm_hemm_r_reference, armpl::clag::matmul::syrk_herk_reference, armpl::clag::matmul::backstop, armpl::clag::matmul::large_no_sync > const&, armpl::clag::spec::problem_context >, armpl::clag::general_matrix >, armpl::clag::general_matrix >, double>, armpl::clag::spec::sve_architecture_spec> const&)Innermost0.020.000.00NANANANANANANA0.00NANANANANA
Loop 34827libarmpl_lp64.sodgemm_reference_Innermost0.030.000.00NANANANANANANA2.26NANANANANA
Loop 303983libarmpl_lp64.sovoid armpl::clag::gemv_a_cntg_first(long, long, double, double const*, long, long, double const*, long, double, double*, long)Outermost0.020.000.00NANANANANANANA37.74NANANANANA
Loop 942execstl_algobase.h:238-238,TinyVector.h:145-145,einspline_spo_ref.hpp:219-219,einspline_spo_ref.hpp:223-227,stl_vector.h:1131-1131,OhmmsVector.h:223-223,VectorSoAContainer.h:231-231,VectorSoAContainer.h:271-271miniqmcreference::einspline_spo_ref::evaluate(qmcplusplus::ParticleSet const&, int, qmcplusplus::Vector >&, qmcplusplus::Vector, std::allocator > >&, qmcplusplus::Vector >&)Outermost0.030.000.00NANANANANANANA0.00NANANANANA
Loop 57execNonLocalPP.hpp:122-122,NonLocalPP.hpp:126-126,stl_vector.h:1150-1150,ParticleSet.h:277-277main._omp_fn.1InBetween0.020.000.00NANANANANANANA0.00NANANANANA
Loop 334701libarmpl_lp64.sovoid armpl::clag::lu_unblocked_direct_kernel(long, long, double*, long, int*, int&)Innermost0.020.000.00NANANANANANANA94.97NANANANANA
Loop 2815execstl_algobase.h:413-413,stl_algobase.h:451-453,SoaDistanceTableABOMPTarget.h:375-376,stl_algo.h:683-683,stl_algo.h:709-709,stl_vector.h:1131-1131,VectorSoAContainer.h:271-271qmcplusplus::SoaDistanceTableABOMPTarget::update(int)Single0.020.000.00NANANANANANANA0.00NANANANANA
Loop 285execOneBodyJastrowRef.h:192-193miniqmcreference::OneBodyJastrowRef >::evaluateLog(qmcplusplus::ParticleSet&, qmcplusplus::ParticleAttrib, std::allocator > >&, qmcplusplus::ParticleAttrib >&)Innermost0.020.000.00NANANANANANANA85.92NANANANANA
Loop 304493libarmpl_lp64.soauto armpl::clag::execute_strategy<16ul, std::tuple, armpl::clag::matmul::large_no_sync, armpl::clag::matmul::rank_k_update_large, armpl::clag::matmul::rank_k_update_basic, armpl::clag::matmul::rank_one_update, armpl::clag::matmul::gemm_reference, armpl::clag::matmul::symm_hemm_l_reference, armpl::clag::matmul::symm_hemm_r_reference, armpl::clag::matmul::syrk_herk_reference, armpl::clag::matmul::backstop, armpl::clag::matmul::large_no_sync >, armpl::clag::spec::problem_context >, armpl::clag::general_matrix >, armpl::clag::general_matrix >, double>, armpl::clag::spec::sve_architecture_spec> >(std::tuple, armpl::clag::matmul::large_no_sync, armpl::clag::matmul::rank_k_update_large, armpl::clag::matmul::rank_k_update_basic, armpl::clag::matmul::rank_one_update, armpl::clag::matmul::gemm_reference, armpl::clag::matmul::symm_hemm_l_reference, armpl::clag::matmul::symm_hemm_r_reference, armpl::clag::matmul::syrk_herk_reference, armpl::clag::matmul::backstop, armpl::clag::matmul::large_no_sync > const&, armpl::clag::spec::problem_context >, armpl::clag::general_matrix >, armpl::clag::general_matrix >, double>, armpl::clag::spec::sve_architecture_spec> const&)InBetween0.020.000.00NANANANANANANA0.00NANANANANA
Loop 35071libarmpl_lp64.soddot_kernelSingle0.020.000.00NANANANANANANA39.57NANANANANA
Loop 948execMultiBsplineRef.hpp:226-226,MultiBsplineRef.hpp:234-236miniqmcreference::einspline_spo_ref::evaluate(qmcplusplus::ParticleSet const&, int, qmcplusplus::Vector >&, qmcplusplus::Vector, std::allocator > >&, qmcplusplus::Vector >&)InBetween0.020.000.00NANANANANANANA35.61NANANANANA
Loop 37170libarmpl_lp64.son_interleave_kernel_d8Outermost0.020.000.00NANANANANANANA0.00NANANANANA
Loop 37168libarmpl_lp64.son_interleave_kernel_d8Innermost0.020.000.00NANANANANANANA0.00NANANANANA
Loop 746execstl_vector.h:1147-1147,BsplineFunctor.h:305-336qmcplusplus::BsplineFunctor::evaluateVGL(int, int, int, double const*, double*, double*, double*, double*, int*) constSingle0.020.000.00NANANANANANANA0.00NANANANANA
Loop 303659libarmpl_lp64.sovoid armpl::clag::gemv_a_strd_first_impl, double, armpl::clag::(anonymous namespace)::step_val_fixed<1l>, double, armpl::clag::(anonymous namespace)::step_val_fixed<1l>, double>(long, long, double, double const*, long, armpl::clag::(anonymous namespace)::step_val_fixed<1l>, double const*, armpl::clag::(anonymous namespace)::step_val_fixed<1l>, double, double*, armpl::clag::(anonymous namespace)::step_val_fixed<1l>) [clone .isra.0]Outermost0.020.000.00NANANANANANANA7.91NANANANANA
Loop 1105execOperatorTags.h:61-63,OperatorTags.h:94-94,TinyVector.h:62-62,OhmmsMatrix.h:217-217,TinyVectorOps.h:129-131,OhmmsVector.h:248-248,inner_product.hpp:82-83,inner_product.hpp:155-156,DiracDeterminantRef.cpp:173-173,DiracDeterminantRef.cpp:178-178miniqmcreference::DiracDeterminantRef >::evaluateGL(qmcplusplus::ParticleSet&, qmcplusplus::ParticleAttrib, std::allocator > >&, qmcplusplus::ParticleAttrib >&, bool)Outermost0.020.000.00NANANANANANANA0.00NANANANANA
Loop 142execWaveFunction.cpp:225-228,refwrap.h:351-351,stl_vector.h:993-993,stl_vector.h:1128-1128,NewTimer.h:242-242,NewTimer.h:249-249qmcplusplus::WaveFunction::acceptMove(qmcplusplus::ParticleSet&, int)Single0.020.000.00NANANANANANANA0.00NANANANANA
×