auto armpl::clag::spec::get_spec<armpl::clag::spec::strategy_tag<armpl::clag::matmul::l3_matmul_strategy_tag>, armpl::clag::matmul::matmul3<armpl::clag::general_matrix<armpl::clag::matrix_base<double const> >, armpl::clag::general_matrix<armpl::clag::matrix_base<double const> >, armpl::clag::general_matrix<armpl::clag::matrix_base<double> >, double> >(armpl::clag::spec::strategy_tag<armpl::clag::matmul::l3_matmul_strategy_tag>, armpl::clag::spec::problem_context<armpl::clag::matmul::matmul3<armpl::clag::general_matrix<armpl::clag::matrix_base<double const> >, armpl::clag::general_matrix<armpl::clag::matrix_base<double const> >, armpl::clag::general_matrix<armpl::clag::matrix_base<double> >, double>, armpl::clag::spec::sve_architecture_spec> const&) [clone .isra.0] - Load Distribution

minmedavgmax
Percentile Index10 20 30 40 50 60 70 80 90 100
Value


minmedavgmax
Percentile Index10 20 30 40 50 60 70 80 90 100
Value

auto armpl::clag::spec::get_spec<armpl::clag::spec::strategy_tag<armpl::clag::matmul::l3_matmul_strategy_tag>, armpl::clag::matmul::matmul3<armpl::clag::general_matrix<armpl::clag::matrix_base<double const> >, armpl::clag::general_matrix<armpl::clag::matrix_base<double const> >, armpl::clag::general_matrix<armpl::clag::matrix_base<double> >, double> >(armpl::clag::spec::strategy_tag<armpl::clag::matmul::l3_matmul_strategy_tag>, armpl::clag::spec::problem_context<armpl::clag::matmul::matmul3<armpl::clag::general_matrix<armpl::clag::matrix_base<double const> >, armpl::clag::general_matrix<armpl::clag::matrix_base<double const> >, armpl::clag::general_matrix<armpl::clag::matrix_base<double> >, double>, armpl::clag::spec::sve_architecture_spec> const&) [clone .isra.0] - Sorted Load Distribution

minmedavgmax
Percentile Index10 20 30 40 50 60 70 80 90 100
Value


minmedavgmax
Percentile Index10 20 30 40 50 60 70 80 90 100
Value

auto armpl::clag::spec::get_spec<armpl::clag::spec::strategy_tag<armpl::clag::matmul::l3_matmul_strategy_tag>, armpl::clag::matmul::matmul3<armpl::clag::general_matrix<armpl::clag::matrix_base<double const> >, armpl::clag::general_matrix<armpl::clag::matrix_base<double const> >, armpl::clag::general_matrix<armpl::clag::matrix_base<double> >, double> >(armpl::clag::spec::strategy_tag<armpl::clag::matmul::l3_matmul_strategy_tag>, armpl::clag::spec::problem_context<armpl::clag::matmul::matmul3<armpl::clag::general_matrix<armpl::clag::matrix_base<double const> >, armpl::clag::general_matrix<armpl::clag::matrix_base<double const> >, armpl::clag::general_matrix<armpl::clag::matrix_base<double> >, double>, armpl::clag::spec::sve_architecture_spec> const&) [clone .isra.0] - Load Distribution All Threads

minmedavgmax
Percentile Index10 20 30 40 50 60 70 80 90 100
Value


minmedavgmax
Percentile Index10 20 30 40 50 60 70 80 90 100
Value

auto armpl::clag::spec::get_spec<armpl::clag::spec::strategy_tag<armpl::clag::matmul::l3_matmul_strategy_tag>, armpl::clag::matmul::matmul3<armpl::clag::general_matrix<armpl::clag::matrix_base<double const> >, armpl::clag::general_matrix<armpl::clag::matrix_base<double const> >, armpl::clag::general_matrix<armpl::clag::matrix_base<double> >, double> >(armpl::clag::spec::strategy_tag<armpl::clag::matmul::l3_matmul_strategy_tag>, armpl::clag::spec::problem_context<armpl::clag::matmul::matmul3<armpl::clag::general_matrix<armpl::clag::matrix_base<double const> >, armpl::clag::general_matrix<armpl::clag::matrix_base<double const> >, armpl::clag::general_matrix<armpl::clag::matrix_base<double> >, double>, armpl::clag::spec::sve_architecture_spec> const&) [clone .isra.0]

Columns Filter

(1x1) Efficiency (1x1) Potential Speed-Up (%) (1x2) Efficiency (1x2) Potential Speed-Up (%) (1x4) Efficiency (1x4) Potential Speed-Up (%) (1x8) Efficiency (1x8) Potential Speed-Up (%) (1x16) Efficiency (1x16) Potential Speed-Up (%) (1x24) Efficiency (1x24) Potential Speed-Up (%) (1x32) Efficiency (1x32) Potential Speed-Up (%) (1x40) Efficiency (1x40) Potential Speed-Up (%) (1x48) Efficiency (1x48) Potential Speed-Up (%) (1x56) Efficiency (1x56) Potential Speed-Up (%) (1x64) Efficiency (1x64) Potential Speed-Up (%)
(1x1) Efficiency(1x1) Potential Speed-Up (%)(1x2) Efficiency(1x2) Potential Speed-Up (%)(1x4) Efficiency(1x4) Potential Speed-Up (%)(1x8) Efficiency(1x8) Potential Speed-Up (%)(1x16) Efficiency(1x16) Potential Speed-Up (%)(1x24) Efficiency(1x24) Potential Speed-Up (%)(1x32) Efficiency(1x32) Potential Speed-Up (%)(1x40) Efficiency(1x40) Potential Speed-Up (%)(1x48) Efficiency(1x48) Potential Speed-Up (%)(1x56) Efficiency(1x56) Potential Speed-Up (%)(1x64) Efficiency(1x64) Potential Speed-Up (%)
10

Speed-Up and Efficiency

No callchains for this object
Coverage (%)NameSource LocationModule
50.00+auto armpl::clag::execute_stra[...]libarmpl_lp64.so
void armpl::clag::compute_impl[...]libarmpl_lp64.so
void armpl::clag::gemm<true, i[...]libarmpl_lp64.so
qmcplusplus::DelayedUpdate<dou[...]DelayedUpdate.h:190exec
void qmcplusplus::DelayedUpdat[...]DelayedUpdate.h:153exec
miniqmcreference::DiracDetermi[...]DiracDeterminantRef.cpp:129exec
qmcplusplus::WaveFunction::acc[...]stl_vector.h:993exec
main.omp_outlined.62miniqmc.cpp:450exec
__kmp_invoke_microtasklibomp.so
__kmp_invoke_task_funclibomp.so
__kmp_fork_calllibomp.so
__kmpc_fork_calllibomp.so
mainminiqmc.cpp:409exec
__libc_start_call_mainlibc.so.6
__libc_start_mainlibc.so.6
_startnew_allocator.h:172exec
50.00+void armpl::clag::compute_impl[...]libarmpl_lp64.so
void armpl::clag::triangular_s[...]libarmpl_lp64.so
void armpl::clag::triangular_s[...]libarmpl_lp64.so
void armpl::clag::triangular_s[...]libarmpl_lp64.so
auto armpl::clag::execute_stra[...]libarmpl_lp64.so
void armpl::clag::compute_impl[...]libarmpl_lp64.so
auto armpl::clag::execute_stra[...]libarmpl_lp64.so
void armpl::clag::compute_impl[...]libarmpl_lp64.so
void armpl::clag::getrf<true, [...]libarmpl_lp64.so
qmcplusplus::DiracMatrix<doubl[...]BLAS.hpp:790exec
miniqmcreference::DiracDetermi[...]DelayedUpdate.h:79exec
miniqmcreference::DiracDetermi[...]DiracDeterminantRef.cpp:238exec
qmcplusplus::WaveFunction::eva[...]WaveFunction.cpp:171exec
main.omp_outlinedminiqmc.cpp:379exec
__kmp_invoke_microtasklibomp.so
__kmp_invoke_task_funclibomp.so
__kmp_launch_threadlibomp.so
__kmp_launch_worker(void*)libomp.so
start_threadlibc.so.6
thread_startlibc.so.6
No callchains for this object
No callchains for this object
No callchains for this object
No callchains for this object
No callchains for this object
No callchains for this object
No callchains for this object
No callchains for this object
No callchains for this object
×