| Loop id | Source Location | Source Function | Level | Max Thread Time / Walltime armclang_1 (%) | Exclusive Coverage armclang_1 (%) | Inclusive Coverage armclang_1 (%) | Max Exclusive Time Over Threads armclang_1 (s) | Max Inclusive Time Over Threads armclang_1 (s) | Exclusive Time w.r.t. Wall Time armclang_1 (s) | Inclusive Time w.r.t. Wall Time armclang_1 (s) | Nb Threads armclang_1 | GFLOPS armclang_1 | Vectorization Ratio (%) | Vector Length Use (%) | Speedup If No Scalar Integer | Speedup If FP Vectorized | Speedup If Fully Vectorized | Speedup If Perfect Load Balancing armclang_1 | Stride 0 | Stride 1 | Stride n | Stride Unknown | Stride Indirect | Array Access Efficiency |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 34845 | libarmpl_lp64.so - | dgemm_sve_big | Innermost | 16.34 | 16.75 | 16.75 | 25.72 | 25.72 | 25.41 | 25.41 | 64 | 1408.48 | 0 | 0 | 0 | 0 | 0 | 1.02 | 0 | 0 | 0 | 0 | 0 | 0.00 |
| 34844 | libarmpl_lp64.so - | dgemm_sve_big | InBetween | 14.05 | 14.16 | 30.91 | 22.11 | 47.46 | 21.49 | 46.91 | 64 | 209.81 | 0 | 0 | 0 | 0 | 0 | 1.04 | 0 | 0 | 0 | 0 | 0 | 0.00 |
| 1794 | exec - VectorSoAContainer.h:244-263 [...] | qmcplusplus::SoaDistanceTableAAOMPTarget<double, 3u, 40>::update(int) | Single | 8.19 | 8.24 | 8.24 | 12.89 | 12.89 | 12.50 | 12.50 | 64 | 0.72 | 0 | 25 | 1.1 | 1 | 4 | 1.04 | 2 | 0 | 4 | 2 | 0 | 75.00 |
| 818 | exec - MultiBsplineRef.hpp:242-262 | void miniqmcreference::MultiBsplineEvalRef::evaluate_vgh<double>(qmcplusplus::bspline_traits<double, 3u>::SplineType const*, double, double, double, double*, double*, double*, unsigned long) | Innermost | 7.77 | 7.70 | 7.70 | 12.22 | 12.22 | 11.69 | 11.69 | 64 | 396.69 | 100 | 100 | 1 | 1 | 1 | 1.05 | 0 | 0 | 0 | 14 | 0 | 50.00 |
| 37166 | libarmpl_lp64.so - | n_interleave_kernel_d8 | Innermost | 6.69 | 6.60 | 6.60 | 10.53 | 10.53 | 10.01 | 10.01 | 64 | 0.00 | 0 | 0 | 0 | 0 | 0 | 1.06 | 0 | 0 | 0 | 0 | 0 | 0.00 |
| 812 | exec - MultiBsplineRef.hpp:68-71 | void miniqmcreference::MultiBsplineEvalRef::evaluate_v<double>(qmcplusplus::bspline_traits<double, 3u>::SplineType const*, double, double, double, double*, unsigned long) | Innermost | 6.04 | 5.97 | 5.97 | 9.50 | 9.50 | 9.06 | 9.06 | 64 | 86.15 | 100 | 100 | 1 | 1 | 1 | 1.06 | 0 | 0 | 0 | 5 | 0 | 50.00 |
| 809 | exec - MultiBsplineRef.hpp:68-71 | void miniqmcreference::MultiBsplineEvalRef::evaluate_v<double>(qmcplusplus::bspline_traits<double, 3u>::SplineType const*, double, double, double, double*, unsigned long) | Innermost | 5.99 | 5.93 | 5.93 | 9.43 | 9.43 | 9.00 | 9.00 | 64 | 86.69 | 100 | 100 | 1 | 1 | 1 | 1.05 | 0 | 0 | 0 | 5 | 0 | 50.00 |
| 810 | exec - MultiBsplineRef.hpp:68-71 | void miniqmcreference::MultiBsplineEvalRef::evaluate_v<double>(qmcplusplus::bspline_traits<double, 3u>::SplineType const*, double, double, double, double*, unsigned long) | Innermost | 5.97 | 5.85 | 5.85 | 9.40 | 9.40 | 8.88 | 8.88 | 64 | 87.88 | 100 | 100 | 1 | 1 | 1 | 1.07 | 0 | 0 | 0 | 5 | 0 | 50.00 |
| 811 | exec - MultiBsplineRef.hpp:68-71 | void miniqmcreference::MultiBsplineEvalRef::evaluate_v<double>(qmcplusplus::bspline_traits<double, 3u>::SplineType const*, double, double, double, double*, unsigned long) | Innermost | 6.01 | 5.85 | 5.85 | 9.46 | 9.46 | 8.88 | 8.88 | 64 | 88.11 | 100 | 100 | 1 | 1 | 1 | 1.07 | 0 | 0 | 0 | 5 | 0 | 50.00 |
| 2055 | exec - ParticleBConds3DSoa.h:280-298 | qmcplusplus::SoaDistanceTableABOMPTarget<double, 3u, 40>::evaluate(qmcplusplus::ParticleSet&) | Innermost | 4.24 | 4.11 | 4.11 | 6.68 | 6.68 | 6.24 | 6.24 | 64 | 383.05 | 94 | 100 | 1 | 1 | 1 | 1.08 | 0 | 0 | 0 | 8 | 0 | 50.00 |
| 1262 | exec - ParticleBConds3DSoa.h:235-255 | void qmcplusplus::DTD_BConds<double, 3u, 40>::computeDistances<qmcplusplus::TinyVector<double, 3u>, qmcplusplus::VectorSoAContainer<double, 3u, qmcplusplus::Mallocator<double, 32ul> >, qmcplusplus::VectorSoAContainer<double, 3... | Single | 1.57 | 1.47 | 1.47 | 2.48 | 2.48 | 2.23 | 2.23 | 64 | 552.13 | 89.04 | 89.9 | 1 | 1 | 1 | 1.12 | 1 | 0 | 0 | 0 | 7 | 12.50 |
| 303984 | libarmpl_lp64.so - | void armpl::clag::gemv_a_cntg_first<false, armpl::clag::spec::sve_architecture_spec, double, double, double, double>(long, long, double, double const*, long, long, double const*, long, double, double*, long) | Innermost | 1.53 | 1.44 | 1.44 | 2.40 | 2.40 | 2.18 | 2.18 | 64 | 102.47 | 0 | 0 | 0 | 0 | 0 | 1.11 | 0 | 0 | 0 | 0 | 0 | 0.00 |
| 324 | exec - BsplineFunctor.h:233-260 [...] | miniqmcreference::TwoBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::evaluateRatios(qmcplusplus::VirtualParticleSet&, std::vector<double, std::allocator<double> >&) | InBetween | 1.43 | 1.37 | 1.42 | 2.25 | 2.37 | 2.07 | 2.16 | 64 | 31.77 | 0 | 21.15 | 3 | 1 | 6.79 | 1.1 | NA | NA | NA | NA | NA | 0.00 |
| 34842 | libarmpl_lp64.so - | dgemm_sve_big | Innermost | 1.38 | 1.34 | 1.34 | 2.16 | 2.16 | 2.03 | 2.03 | 64 | 1214.60 | 0 | 0 | 0 | 0 | 0 | 1.07 | 0 | 0 | 0 | 0 | 0 | 0.00 |
| 303664 | libarmpl_lp64.so - | void armpl::clag::gemv_a_strd_first_impl<false, armpl::clag::spec::sve_architecture_spec, double, long, armpl::clag::(anonymous namespace)::step_val_fixed<1l>, double, armpl::clag::(anonymous namespace)::step_val_fixed<1l>, double, armpl::cl... | Innermost | 0.88 | 0.80 | 0.80 | 1.38 | 1.38 | 1.21 | 1.21 | 64 | 117.55 | 0 | 0 | 0 | 0 | 0 | 1.15 | 0 | 0 | 0 | 0 | 0 | 0.00 |
| 304781 | libarmpl_lp64.so - | auto armpl::clag::execute_strategy<15ul, std::tuple<armpl::clag::matmul::set_or_scale, armpl::clag::matmul::compressed_general_matrix_vector, armpl::clag::matmul::symmetric_matrix_vector, armpl::clag::matmul::compressed_symmetric_matrix_vector, armpl... | Innermost | 0.84 | 0.75 | 0.75 | 1.32 | 1.32 | 1.13 | 1.13 | 64 | 0.25 | 0 | 0 | 0 | 0 | 0 | 1.17 | 0 | 0 | 0 | 0 | 0 | 0.00 |
| 303980 | libarmpl_lp64.so - | void armpl::clag::gemv_a_cntg_first<false, armpl::clag::spec::sve_architecture_spec, double, double, double, double>(long, long, double, double const*, long, long, double const*, long, double, double*, long) | Innermost | 0.69 | 0.62 | 0.62 | 1.09 | 1.09 | 0.94 | 0.94 | 64 | 66.88 | 0 | 0 | 0 | 0 | 0 | 1.17 | 0 | 0 | 0 | 0 | 0 | 0.00 |
| 304835 | libarmpl_lp64.so - | auto armpl::clag::execute_strategy<15ul, std::tuple<armpl::clag::matmul::set_or_scale, armpl::clag::matmul::compressed_general_matrix_vector, armpl::clag::matmul::symmetric_matrix_vector, armpl::clag::matmul::compressed_symmetric_matrix_vector, armpl... | Innermost | 0.67 | 0.60 | 0.60 | 1.05 | 1.05 | 0.92 | 0.92 | 64 | 0.17 | 0 | 0 | 0 | 0 | 0 | 1.15 | 0 | 0 | 0 | 0 | 0 | 0.00 |
| 918 | exec - inner_product.hpp:155-155 [...] | miniqmcreference::DiracDeterminantRef<qmcplusplus::DelayedUpdate<double, double> >::evaluateGL(qmcplusplus::ParticleSet&, qmcplusplus::ParticleAttrib<qmcplusplus::TinyVector<double, 3u>, std::allocator<qmcplusplus::TinyVector<... | Innermost | 0.42 | 0.36 | 0.36 | 0.67 | 0.67 | 0.55 | 0.55 | 64 | 65.35 | 81.82 | 59.09 | 1 | 1.75 | 1.47 | 1.21 | 0 | 0 | 1 | 1 | 0 | 62.50 |
| 272 | exec - BsplineFunctor.h:291-298 | qmcplusplus::BsplineFunctor<double>::evaluateVGL(int, int, int, double const*, double*, double*, double*, double*, int*) const | Single | 0.44 | 0.36 | 0.36 | 0.69 | 0.69 | 0.55 | 0.55 | 64 | 44.71 | 0 | 22.92 | 1.25 | 1 | 5 | 1.26 | 0 | 0 | 1.5 | 0 | 0 | 75.00 |
| 910 | exec - inner_product.hpp:155-155 [...] | miniqmcreference::DiracDeterminantRef<qmcplusplus::DelayedUpdate<double, double> >::evalGrad(qmcplusplus::ParticleSet&, int) | Single | 0.46 | 0.35 | 0.35 | 0.73 | 0.73 | 0.53 | 0.53 | 64 | 68.11 | 81.82 | 59.09 | 1 | 1.75 | 1.47 | 1.37 | 0 | 0 | 1 | 1 | 0 | 62.50 |
| 802 | exec - inner_product.hpp:82-83 | qmcplusplus::SPOSet::evaluateDetRatios(qmcplusplus::VirtualParticleSet const&, qmcplusplus::Vector<double, std::allocator<double> >&, qmcplusplus::Vector<double, std::allocator<double> > const&, std::vector<double, st... | Innermost | 0.37 | 0.32 | 0.32 | 0.58 | 0.58 | 0.48 | 0.48 | 64 | 97.96 | 85.71 | 89.29 | 1 | 1 | 1 | 1.22 | 0 | 0 | 0 | 2 | 0 | 50.00 |
| 801 | exec - einspline_spo_ref.hpp:223-227 [...] | miniqmcreference::einspline_spo_ref<double>::evaluate(qmcplusplus::ParticleSet const&, int, qmcplusplus::Vector<double, std::allocator<double> >&, qmcplusplus::Vector<qmcplusplus::TinyVector<double, 3u>, std::allocator<... | Innermost | 0.37 | 0.31 | 0.31 | 0.57 | 0.57 | 0.47 | 0.47 | 64 | 0.00 | 9.09 | 26.14 | 2.33 | 1 | 5.25 | 1.22 | 4 | 0 | 4 | 5 | 0 | 73.08 |
| 303666 | libarmpl_lp64.so - | void armpl::clag::gemv_a_strd_first_impl<false, armpl::clag::spec::sve_architecture_spec, double, long, armpl::clag::(anonymous namespace)::step_val_fixed<1l>, double, armpl::clag::(anonymous namespace)::step_val_fixed<1l>, double, armpl::cl... | Single | 0.33 | 0.28 | 0.28 | 0.52 | 0.52 | 0.42 | 0.42 | 64 | 124.77 | 0 | 0 | 0 | 0 | 0 | 1.24 | 0 | 0 | 0 | 0 | 0 | 0.00 |
| 314 | exec - TwoBodyJastrowRef.h:342-347 | miniqmcreference::TwoBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::acceptMove(qmcplusplus::ParticleSet&, int) | Single | 0.25 | 0.22 | 0.22 | 0.40 | 0.40 | 0.33 | 0.33 | 64 | 92.19 | 95.24 | 96.43 | 1 | 1 | 1 | 1.21 | 0 | 0 | 0 | 10 | 0 | 50.00 |
| 315 | exec - TwoBodyJastrowRef.h:342-347 | miniqmcreference::TwoBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::acceptMove(qmcplusplus::ParticleSet&, int) | Single | 0.25 | 0.22 | 0.22 | 0.40 | 0.40 | 0.33 | 0.33 | 64 | 91.47 | 95.24 | 96.43 | 1 | 1 | 1 | 1.23 | 0 | 0 | 0 | 10 | 0 | 50.00 |
| 313 | exec - TwoBodyJastrowRef.h:342-347 | miniqmcreference::TwoBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::acceptMove(qmcplusplus::ParticleSet&, int) | Single | 0.27 | 0.21 | 0.21 | 0.42 | 0.42 | 0.32 | 0.32 | 64 | 94.87 | 95.24 | 96.43 | 1 | 1 | 1 | 1.32 | 0 | 0 | 0 | 10 | 0 | 50.00 |
| 919 | exec - inner_product.hpp:82-83 | miniqmcreference::DiracDeterminantRef<qmcplusplus::DelayedUpdate<double, double> >::evaluateGL(qmcplusplus::ParticleSet&, qmcplusplus::ParticleAttrib<qmcplusplus::TinyVector<double, 3u>, std::allocator<qmcplusplus::TinyVector<... | Innermost | 0.24 | 0.20 | 0.20 | 0.39 | 0.39 | 0.30 | 0.30 | 64 | 40.01 | 85.71 | 89.29 | 1 | 1 | 1 | 1.28 | 0 | 0 | 0 | 2 | 0 | 50.00 |
| 316 | exec - TwoBodyJastrowRef.h:324-331 | miniqmcreference::TwoBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::acceptMove(qmcplusplus::ParticleSet&, int) | Single | 0.24 | 0.18 | 0.18 | 0.39 | 0.39 | 0.27 | 0.27 | 64 | 199.69 | 97.14 | 97.86 | 1 | 1 | 1 | 1.44 | 0 | 0 | 0 | 16 | 0 | 50.00 |
| 303660 | libarmpl_lp64.so - | void armpl::clag::gemv_a_strd_first_impl<false, armpl::clag::spec::sve_architecture_spec, double, long, armpl::clag::(anonymous namespace)::step_val_fixed<1l>, double, armpl::clag::(anonymous namespace)::step_val_fixed<1l>, double, armpl::cl... | Innermost | 0.22 | 0.16 | 0.16 | 0.34 | 0.34 | 0.25 | 0.25 | 64 | 102.85 | 0 | 0 | 0 | 0 | 0 | 1.4 | 0 | 0 | 0 | 0 | 0 | 0.00 |
| 42542 | libarmpl_lp64.so - | dswap_ | Single | 0.22 | 0.16 | 0.16 | 0.34 | 0.34 | 0.25 | 0.25 | 64 | 0.00 | 0 | 0 | 0 | 0 | 0 | 1.4 | 0 | 0 | 0 | 0 | 0 | 0.00 |
| 816 | exec - MultiBsplineRef.hpp:276-286 | void miniqmcreference::MultiBsplineEvalRef::evaluate_vgh<double>(qmcplusplus::bspline_traits<double, 3u>::SplineType const*, double, double, double, double*, double*, double*, unsigned long) | Single | 0.20 | 0.15 | 0.15 | 0.31 | 0.31 | 0.23 | 0.23 | 64 | 280.42 | 100 | 100 | 1 | 1 | 1 | 1.35 | 0 | 0 | 0 | 9 | 0 | 50.00 |
| 304604 | libarmpl_lp64.so - | auto armpl::clag::execute_strategy<16ul, std::tuple<armpl::clag::matmul::set_or_scale, armpl::clag::matmul::compressed_general_matrix_vector, armpl::clag::matmul::symmetric_matrix_vector, armpl::clag::matmul::compressed_symmetric_matrix_vector, armpl... | Innermost | 0.16 | 0.13 | 0.13 | 0.25 | 0.25 | 0.19 | 0.19 | 64 | 0.35 | 0 | 0 | 0 | 0 | 0 | 1.32 | 0 | 0 | 0 | 0 | 0 | 0.00 |
| 300 | exec - TwoBodyJastrowRef.h:155-156 | miniqmcreference::TwoBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::ratioGrad(qmcplusplus::ParticleSet&, int, qmcplusplus::TinyVector<double, 3u>&) | Single | 0.16 | 0.12 | 0.12 | 0.25 | 0.25 | 0.18 | 0.18 | 64 | 136.36 | 85.71 | 89.29 | 1 | 1 | 1 | 1.37 | 0 | 0 | 0 | 2 | 0 | 50.00 |
| 301 | exec - TwoBodyJastrowRef.h:155-156 | miniqmcreference::TwoBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::ratioGrad(qmcplusplus::ParticleSet&, int, qmcplusplus::TinyVector<double, 3u>&) | Single | 0.16 | 0.11 | 0.11 | 0.25 | 0.25 | 0.17 | 0.17 | 64 | 143.35 | 100 | 100 | 1 | 1 | 1 | 1.48 | 0 | 0 | 0 | 3 | 0 | 50.00 |
| 302 | exec - TwoBodyJastrowRef.h:155-156 | miniqmcreference::TwoBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::ratioGrad(qmcplusplus::ParticleSet&, int, qmcplusplus::TinyVector<double, 3u>&) | Single | 0.16 | 0.10 | 0.10 | 0.26 | 0.26 | 0.15 | 0.15 | 64 | 156.47 | 85.71 | 89.29 | 1 | 1 | 1 | 1.67 | 0 | 0 | 0 | 2 | 0 | 50.00 |
| 63 | exec - NonLocalPP.hpp:122-135 [...] | qmcplusplus::NonLocalPP<double>::evaluate(qmcplusplus::ParticleSet const&, qmcplusplus::WaveFunction&) | Outermost | 0.12 | 0.08 | 0.09 | 0.19 | 0.19 | 0.13 | 0.13 | 64 | 8.14 | 0 | 22.79 | 9 | 1 | 5.82 | 1.56 | NA | NA | NA | NA | NA | 0.00 |
| 912 | exec - inner_product.hpp:82-83 | miniqmcreference::DiracDeterminantRef<qmcplusplus::DelayedUpdate<double, double> >::ratioGrad(qmcplusplus::ParticleSet&, int, qmcplusplus::TinyVector<double, 3u>&) | Single | 0.10 | 0.06 | 0.06 | 0.15 | 0.15 | 0.09 | 0.09 | 64 | 128.67 | 85.71 | 89.29 | 1 | 1 | 1 | 1.61 | 0 | 0 | 0 | 2 | 0 | 50.00 |
| 892 | exec - inner_product.hpp:211-212 | qmcplusplus::DiracMatrix<double, double>::invert_transpose(qmcplusplus::Matrix<double, std::allocator<double> > const&, qmcplusplus::Matrix<double, std::allocator<double> >&, double&, double&) | Innermost | 0.07 | 0.06 | 0.06 | 0.11 | 0.11 | 0.09 | 0.09 | 64 | 0.00 | 0 | 25 | 1 | 1 | 4 | 1.24 | 0 | 0 | 1 | 1 | 0 | 62.50 |
| 904 | exec - inner_product.hpp:155-155 [...] | miniqmcreference::DiracDeterminantRef<qmcplusplus::DelayedUpdate<double, double> >::evaluateLog(qmcplusplus::ParticleSet&, qmcplusplus::ParticleAttrib<qmcplusplus::TinyVector<double, 3u>, std::allocator<qmcplusplus::TinyVector<... | Innermost | 0.09 | 0.06 | 0.06 | 0.14 | 0.14 | 0.09 | 0.09 | 64 | 84.49 | 81.82 | 59.09 | 1 | 1.75 | 1.47 | 1.71 | 0 | 0 | 1 | 1 | 0 | 62.50 |
| 913 | exec - inner_product.hpp:155-155 [...] | miniqmcreference::DiracDeterminantRef<qmcplusplus::DelayedUpdate<double, double> >::ratioGrad(qmcplusplus::ParticleSet&, int, qmcplusplus::TinyVector<double, 3u>&) | Single | 0.08 | 0.06 | 0.06 | 0.13 | 0.13 | 0.08 | 0.08 | 64 | 426.30 | 81.82 | 59.09 | 1 | 1.75 | 1.47 | 1.55 | 0 | 0 | 1 | 1 | 0 | 62.50 |
| 271 | exec - BsplineFunctor.h:303-336 [...] | qmcplusplus::BsplineFunctor<double>::evaluateVGL(int, int, int, double const*, double*, double*, double*, double*, int*) const | Single | 0.08 | 0.04 | 0.04 | 0.12 | 0.12 | 0.06 | 0.06 | 64 | 607.75 | 91.14 | 98.1 | 1 | 1 | 1.01 | 2.05 | 1 | 0 | 0 | 3 | 5 | 27.78 |
| 304833 | libarmpl_lp64.so - | auto armpl::clag::execute_strategy<15ul, std::tuple<armpl::clag::matmul::set_or_scale, armpl::clag::matmul::compressed_general_matrix_vector, armpl::clag::matmul::symmetric_matrix_vector, armpl::clag::matmul::compressed_symmetric_matrix_vector, armpl... | InBetween | 0.07 | 0.04 | 0.64 | 0.11 | 1.10 | 0.06 | 0.98 | 64 | 0.28 | 0 | 0 | 0 | 0 | 0 | 1.89 | 0 | 0 | 0 | 0 | 0 | 0.00 |
| 326 | exec - BsplineFunctor.h:246-260 [...] | miniqmcreference::TwoBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::evaluateRatios(qmcplusplus::VirtualParticleSet&, std::vector<double, std::allocator<double> >&) | Innermost | 0.06 | 0.04 | 0.04 | 0.10 | 0.10 | 0.06 | 0.06 | 64 | 690.67 | 75 | 93.75 | 1 | 1 | 1.03 | 1.71 | 0 | 0 | 0 | 2 | 2 | 25.00 |
| 277 | exec - BsplineFunctor.h:236-241 | qmcplusplus::BsplineFunctor<double>::evaluateV(int, int, int, double const*, double*) const | Single | 0.05 | 0.04 | 0.04 | 0.08 | 0.08 | 0.05 | 0.05 | 64 | 6.66 | 0 | 20.83 | 1.8 | 1 | 6 | 1.47 | NA | NA | NA | NA | NA | 0.00 |
| 34841 | libarmpl_lp64.so - | dgemm_sve_big | InBetween | 0.04 | 0.02 | 1.36 | 0.07 | 2.20 | 0.04 | 2.07 | 63 | 1245.29 | 0 | 0 | 0 | 0 | 0 | 1.71 | 0 | 0 | 0 | 0 | 0 | 0.00 |
| 803 | exec - inner_product.hpp:82-83 [...] | qmcplusplus::SPOSet::evaluateDetRatios(qmcplusplus::VirtualParticleSet const&, qmcplusplus::Vector<double, std::allocator<double> >&, qmcplusplus::Vector<double, std::allocator<double> > const&, std::vector<double, st... | InBetween | 0.04 | 0.02 | 0.02 | 0.07 | 0.07 | 0.04 | 0.04 | 60 | 41.99 | 0 | 23.33 | 1.67 | 1 | 5.27 | 1.65 | NA | NA | NA | NA | NA | 0.00 |
| 323 | exec - BsplineFunctor.h:233-260 [...] | miniqmcreference::TwoBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::evaluateRatios(qmcplusplus::VirtualParticleSet&, std::vector<double, std::allocator<double> >&) | Outermost | 0.04 | 0.02 | 1.44 | 0.06 | 2.42 | 0.03 | 2.19 | 54 | 75.25 | 0 | 25 | 1.2 | 1 | 4 | 1.92 | NA | NA | NA | NA | NA | 0.00 |
| 2053 | exec - ParticleBConds3DSoa.h:280-298 [...] | qmcplusplus::SoaDistanceTableABOMPTarget<double, 3u, 40>::evaluate(qmcplusplus::ParticleSet&) | InBetween | 0.04 | 0.02 | 4.13 | 0.06 | 6.72 | 0.03 | 6.27 | 54 | 185.51 | 2.59 | 24.03 | 3.15 | 1 | 2.43 | 1.81 | NA | NA | NA | NA | NA | 0.00 |
| 224 | exec - OneBodyJastrowRef.h:192-193 | miniqmcreference::OneBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::ratioGrad(qmcplusplus::ParticleSet&, int, qmcplusplus::TinyVector<double, 3u>&) | Single | 0.04 | 0.02 | 0.02 | 0.06 | 0.06 | 0.03 | 0.03 | 56 | 74.28 | 85.71 | 89.29 | 1 | 1 | 1 | 1.92 | 0 | 0 | 0 | 2 | 0 | 50.00 |
| 304754 | libarmpl_lp64.so - | auto armpl::clag::execute_strategy<15ul, std::tuple<armpl::clag::matmul::set_or_scale, armpl::clag::matmul::compressed_general_matrix_vector, armpl::clag::matmul::symmetric_matrix_vector, armpl::clag::matmul::compressed_symmetric_matrix_vector, armpl... | InBetween | 0.04 | 0.02 | 1.42 | 0.06 | 2.42 | 0.03 | 2.15 | 52 | 8.68 | 0 | 0 | 0 | 0 | 0 | 1.91 | 0 | 0 | 0 | 0 | 0 | 0.00 |
| 334699 | libarmpl_lp64.so - | void armpl::clag::lu_unblocked_direct_kernel<armpl::clag::spec::sve_architecture_spec, double, int>(long, long, double*, long, int*, int&) | Innermost | 0.04 | 0.02 | 0.02 | 0.06 | 0.06 | 0.03 | 0.03 | 54 | 291.17 | 0 | 0 | 0 | 0 | 0 | 2.17 | 0 | 0 | 0 | 0 | 0 | 0.00 |
| 307 | exec - stl_numeric.h:140-141 | miniqmcreference::TwoBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::ratioGrad(qmcplusplus::ParticleSet&, int, qmcplusplus::TinyVector<double, 3u>&) | Single | 0.03 | 0.02 | 0.02 | 0.05 | 0.05 | 0.02 | 0.02 | 50 | 374.94 | 80 | 85 | 1 | 1 | 1.12 | 1.6 | 0 | 0 | 0 | 1 | 0 | 50.00 |
| 905 | exec - inner_product.hpp:82-83 | miniqmcreference::DiracDeterminantRef<qmcplusplus::DelayedUpdate<double, double> >::evaluateLog(qmcplusplus::ParticleSet&, qmcplusplus::ParticleAttrib<qmcplusplus::TinyVector<double, 3u>, std::allocator<qmcplusplus::TinyVector<... | Innermost | 0.04 | 0.01 | 0.01 | 0.06 | 0.06 | 0.02 | 0.02 | 46 | 84.62 | 85.71 | 89.29 | 1 | 1 | 1 | 2.06 | 0 | 0 | 0 | 4 | 0 | 50.00 |
| 2052 | exec - SoaDistanceTableABOMPTarget.h:214-228 [...] | qmcplusplus::SoaDistanceTableABOMPTarget<double, 3u, 40>::evaluate(qmcplusplus::ParticleSet&) | Outermost | 0.03 | 0.01 | 4.14 | 0.05 | 6.73 | 0.02 | 6.29 | 48 | 67.24 | 58.82 | 63.53 | 1.21 | 1 | 1.21 | 1.85 | NA | NA | NA | NA | NA | 0.00 |
| 325 | exec - BsplineFunctor.h:233-260 [...] | miniqmcreference::TwoBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::evaluateRatios(qmcplusplus::VirtualParticleSet&, std::vector<double, std::allocator<double> >&) | InBetween | 0.03 | 0.01 | 0.06 | 0.05 | 0.14 | 0.02 | 0.09 | 42 | 29.89 | 63.77 | 60.51 | 1.03 | 1 | 1.21 | 2.04 | NA | NA | NA | NA | NA | 0.00 |
| 245 | exec - OneBodyJastrowRef.h:134-135 [...] | miniqmcreference::OneBodyJastrowRef<qmcplusplus::BsplineFunctor<double> >::evaluateRatios(qmcplusplus::VirtualParticleSet&, std::vector<double, std::allocator<double> >&) | Single | 0.03 | 0.01 | 0.01 | 0.05 | 0.05 | 0.02 | 0.02 | 38 | 2.13 | 0 | 22.5 | 1.42 | 1.7 | 6.18 | 2 | 3 | 0 | 2 | 1 | 1 | 71.43 |
| 33845 | libarmpl_lp64.so - | daxpby_sve_kernel | Single | 0.03 | 0.01 | 0.01 | 0.05 | 0.05 | 0.02 | 0.02 | 36 | 169.83 | 0 | 0 | 0 | 0 | 0 | 1.94 | 0 | 0 | 0 | 0 | 0 | 0.00 |