auto armpl::clag::spec::get_spec<armpl::clag::spec::strategy_tag<armpl::clag::matmul::gemv>, armpl::clag::matmul::matmul3<armpl::clag::general_matrix<armpl::clag::matrix_base<double const> >, armpl::clag::general_matrix<armpl::clag::matrix_base<double const> >, armpl::clag::general_matrix<armpl::clag::matrix_base<double> >, double> >(armpl::clag::spec::strategy_tag<armpl::clag::matmul::gemv>, armpl::clag::spec::problem_context<armpl::clag::matmul::matmul3<armpl::clag::general_matrix<armpl::clag::matrix_base<double const> >, armpl::clag::general_matrix<armpl::clag::matrix_base<double const> >, armpl::clag::general_matrix<armpl::clag::matrix_base<double> >, double>, armpl::clag::spec::sve_architecture_spec> const&) [clone .isra.0] - Load Distribution

minmedavgmax
Percentile Index10 20 30 40 50 60 70 80 90 100
Value


minmedavgmax
Percentile Index10 20 30 40 50 60 70 80 90 100
Value

auto armpl::clag::spec::get_spec<armpl::clag::spec::strategy_tag<armpl::clag::matmul::gemv>, armpl::clag::matmul::matmul3<armpl::clag::general_matrix<armpl::clag::matrix_base<double const> >, armpl::clag::general_matrix<armpl::clag::matrix_base<double const> >, armpl::clag::general_matrix<armpl::clag::matrix_base<double> >, double> >(armpl::clag::spec::strategy_tag<armpl::clag::matmul::gemv>, armpl::clag::spec::problem_context<armpl::clag::matmul::matmul3<armpl::clag::general_matrix<armpl::clag::matrix_base<double const> >, armpl::clag::general_matrix<armpl::clag::matrix_base<double const> >, armpl::clag::general_matrix<armpl::clag::matrix_base<double> >, double>, armpl::clag::spec::sve_architecture_spec> const&) [clone .isra.0] - Sorted Load Distribution

minmedavgmax
Percentile Index10 20 30 40 50 60 70 80 90 100
Value


minmedavgmax
Percentile Index10 20 30 40 50 60 70 80 90 100
Value

auto armpl::clag::spec::get_spec<armpl::clag::spec::strategy_tag<armpl::clag::matmul::gemv>, armpl::clag::matmul::matmul3<armpl::clag::general_matrix<armpl::clag::matrix_base<double const> >, armpl::clag::general_matrix<armpl::clag::matrix_base<double const> >, armpl::clag::general_matrix<armpl::clag::matrix_base<double> >, double> >(armpl::clag::spec::strategy_tag<armpl::clag::matmul::gemv>, armpl::clag::spec::problem_context<armpl::clag::matmul::matmul3<armpl::clag::general_matrix<armpl::clag::matrix_base<double const> >, armpl::clag::general_matrix<armpl::clag::matrix_base<double const> >, armpl::clag::general_matrix<armpl::clag::matrix_base<double> >, double>, armpl::clag::spec::sve_architecture_spec> const&) [clone .isra.0] - Load Distribution All Threads

minmedavgmax
Percentile Index10 20 30 40 50 60 70 80 90 100
Value


minmedavgmax
Percentile Index10 20 30 40 50 60 70 80 90 100
Value

auto armpl::clag::spec::get_spec<armpl::clag::spec::strategy_tag<armpl::clag::matmul::gemv>, armpl::clag::matmul::matmul3<armpl::clag::general_matrix<armpl::clag::matrix_base<double const> >, armpl::clag::general_matrix<armpl::clag::matrix_base<double const> >, armpl::clag::general_matrix<armpl::clag::matrix_base<double> >, double> >(armpl::clag::spec::strategy_tag<armpl::clag::matmul::gemv>, armpl::clag::spec::problem_context<armpl::clag::matmul::matmul3<armpl::clag::general_matrix<armpl::clag::matrix_base<double const> >, armpl::clag::general_matrix<armpl::clag::matrix_base<double const> >, armpl::clag::general_matrix<armpl::clag::matrix_base<double> >, double>, armpl::clag::spec::sve_architecture_spec> const&) [clone .isra.0]

Columns Filter

(1x1) Efficiency (1x1) Potential Speed-Up (%) (1x2) Efficiency (1x2) Potential Speed-Up (%) (1x4) Efficiency (1x4) Potential Speed-Up (%) (1x8) Efficiency (1x8) Potential Speed-Up (%) (1x16) Efficiency (1x16) Potential Speed-Up (%) (1x24) Efficiency (1x24) Potential Speed-Up (%) (1x32) Efficiency (1x32) Potential Speed-Up (%) (1x40) Efficiency (1x40) Potential Speed-Up (%) (1x48) Efficiency (1x48) Potential Speed-Up (%) (1x56) Efficiency (1x56) Potential Speed-Up (%) (1x64) Efficiency (1x64) Potential Speed-Up (%)
(1x1) Efficiency(1x1) Potential Speed-Up (%)(1x2) Efficiency(1x2) Potential Speed-Up (%)(1x4) Efficiency(1x4) Potential Speed-Up (%)(1x8) Efficiency(1x8) Potential Speed-Up (%)(1x16) Efficiency(1x16) Potential Speed-Up (%)(1x24) Efficiency(1x24) Potential Speed-Up (%)(1x32) Efficiency(1x32) Potential Speed-Up (%)(1x40) Efficiency(1x40) Potential Speed-Up (%)(1x48) Efficiency(1x48) Potential Speed-Up (%)(1x56) Efficiency(1x56) Potential Speed-Up (%)(1x64) Efficiency(1x64) Potential Speed-Up (%)
102.6607.97011.96031.810

Speed-Up and Efficiency

Coverage (%)NameSource LocationModule
100.00+void armpl::clag::compute_impl[...]libarmpl_lp64.so
void armpl::clag::gemv<true, i[...]libarmpl_lp64.so
void qmcplusplus::DelayedUpdat[...]DelayedUpdate.h:112exec
miniqmcreference::DiracDetermi[...]OhmmsVector.h:178exec
qmcplusplus::WaveFunction::eva[...]stl_vector.h:993exec
main.omp_outlined.62miniqmc.cpp:433exec
__kmp_invoke_microtasklibomp.so
__kmp_fork_calllibomp.so
__kmpc_fork_calllibomp.so
mainminiqmc.cpp:409exec
__libc_start_call_mainlibc.so.6
__libc_start_mainlibc.so.6
_startnew_allocator.h:172exec
No callchains for this object
Coverage (%)NameSource LocationModule
100.00+void armpl::clag::compute_impl[...]libarmpl_lp64.so
void armpl::clag::gemv<true, i[...]libarmpl_lp64.so
void qmcplusplus::DelayedUpdat[...]DelayedUpdate.h:112exec
miniqmcreference::DiracDetermi[...]OhmmsVector.h:178exec
qmcplusplus::WaveFunction::eva[...]stl_vector.h:993exec
main.omp_outlined.62miniqmc.cpp:433exec
__kmp_invoke_microtasklibomp.so
__kmp_invoke_task_funclibomp.so
__kmp_launch_threadlibomp.so
__kmp_launch_worker(void*)libomp.so
start_threadlibc.so.6
thread_startlibc.so.6
Coverage (%)NameSource LocationModule
100.00+void armpl::clag::compute_impl[...]libarmpl_lp64.so
void armpl::clag::gemv<true, i[...]libarmpl_lp64.so
void qmcplusplus::DelayedUpdat[...]DelayedUpdate.h:112exec
miniqmcreference::DiracDetermi[...]OhmmsVector.h:178exec
qmcplusplus::WaveFunction::eva[...]stl_vector.h:993exec
main.omp_outlined.62miniqmc.cpp:433exec
__kmp_invoke_microtasklibomp.so
__kmp_invoke_task_funclibomp.so
__kmp_launch_threadlibomp.so
__kmp_launch_worker(void*)libomp.so
start_threadlibc.so.6
thread_startlibc.so.6
No callchains for this object
Coverage (%)NameSource LocationModule
100.00+void armpl::clag::compute_impl[...]libarmpl_lp64.so
void armpl::clag::gemv<true, i[...]libarmpl_lp64.so
void qmcplusplus::DelayedUpdat[...]DelayedUpdate.h:112exec
miniqmcreference::DiracDetermi[...]OhmmsVector.h:178exec
qmcplusplus::WaveFunction::eva[...]stl_vector.h:993exec
main.omp_outlined.62miniqmc.cpp:433exec
__kmp_invoke_microtasklibomp.so
__kmp_invoke_task_funclibomp.so
__kmp_launch_threadlibomp.so
__kmp_launch_worker(void*)libomp.so
start_threadlibc.so.6
thread_startlibc.so.6
No callchains for this object
No callchains for this object
Coverage (%)NameSource LocationModule
33.33+void armpl::clag::compute_impl[...]libarmpl_lp64.so
void armpl::clag::gemv<true, i[...]libarmpl_lp64.so
void qmcplusplus::DelayedUpdat[...]DelayedUpdate.h:136exec
miniqmcreference::DiracDetermi[...]DiracDeterminantRef.cpp:129exec
qmcplusplus::WaveFunction::acc[...]stl_vector.h:993exec
main.omp_outlined.62miniqmc.cpp:450exec
__kmp_invoke_microtasklibomp.so
__kmp_invoke_task_funclibomp.so
__kmp_launch_threadlibomp.so
__kmp_launch_worker(void*)libomp.so
start_threadlibc.so.6
thread_startlibc.so.6
33.33+void armpl::clag::compute_impl[...]libarmpl_lp64.so
void armpl::clag::gemv<true, i[...]libarmpl_lp64.so
void qmcplusplus::DelayedUpdat[...]DelayedUpdate.h:112exec
miniqmcreference::DiracDetermi[...]OhmmsVector.h:178exec
qmcplusplus::WaveFunction::eva[...]stl_vector.h:993exec
main.omp_outlined.62miniqmc.cpp:433exec
__kmp_invoke_microtasklibomp.so
__kmp_invoke_task_funclibomp.so
__kmp_launch_threadlibomp.so
__kmp_launch_worker(void*)libomp.so
start_threadlibc.so.6
thread_startlibc.so.6
33.33+void armpl::clag::compute_impl[...]libarmpl_lp64.so
void armpl::clag::gemv<true, i[...]libarmpl_lp64.so
void qmcplusplus::DelayedUpdat[...]BLAS.hpp:187exec
miniqmcreference::DiracDetermi[...]OhmmsVector.h:178exec
qmcplusplus::WaveFunction::eva[...]stl_vector.h:993exec
main.omp_outlined.62miniqmc.cpp:433exec
__kmp_invoke_microtasklibomp.so
__kmp_invoke_task_funclibomp.so
__kmp_launch_threadlibomp.so
__kmp_launch_worker(void*)libomp.so
start_threadlibc.so.6
thread_startlibc.so.6
No callchains for this object
No callchains for this object
×