options

Functions and Loops

Columns Filter

Coverage run_1_thread (%) Coverage run_2_threads (%) Coverage run_4_threads (%) Coverage run_8_threads (%) Coverage run_16_threads (%) Coverage run_32_threads (%) Coverage run_48_threads (%) Coverage run_64_threads (%) Coverage Excluding Loops run_1_thread (%) Coverage Excluding Loops run_2_threads (%) Coverage Excluding Loops run_4_threads (%) Coverage Excluding Loops run_8_threads (%) Coverage Excluding Loops run_16_threads (%) Coverage Excluding Loops run_32_threads (%) Coverage Excluding Loops run_48_threads (%) Coverage Excluding Loops run_64_threads (%) Max Inclusive Time Over Threads run_1_thread (s) Max Inclusive Time Over Threads run_2_threads (s) Max Inclusive Time Over Threads run_4_threads (s) Max Inclusive Time Over Threads run_8_threads (s) Max Inclusive Time Over Threads run_16_threads (s) Max Inclusive Time Over Threads run_32_threads (s) Max Inclusive Time Over Threads run_48_threads (s) Max Inclusive Time Over Threads run_64_threads (s) Max Exclusive Time Over Threads run_1_thread (s) Max Exclusive Time Over Threads run_2_threads (s) Max Exclusive Time Over Threads run_4_threads (s) Max Exclusive Time Over Threads run_8_threads (s) Max Exclusive Time Over Threads run_16_threads (s) Max Exclusive Time Over Threads run_32_threads (s) Max Exclusive Time Over Threads run_48_threads (s) Max Exclusive Time Over Threads run_64_threads (s) Inclusive Time w.r.t. Wall Time run_1_thread (s) Inclusive Time w.r.t. Wall Time run_2_threads (s) Inclusive Time w.r.t. Wall Time run_4_threads (s) Inclusive Time w.r.t. Wall Time run_8_threads (s) Inclusive Time w.r.t. Wall Time run_16_threads (s) Inclusive Time w.r.t. Wall Time run_32_threads (s) Inclusive Time w.r.t. Wall Time run_48_threads (s) Inclusive Time w.r.t. Wall Time run_64_threads (s) Exclusive Time w.r.t. Wall Time run_1_thread (s) Exclusive Time w.r.t. Wall Time run_2_threads (s) Exclusive Time w.r.t. Wall Time run_4_threads (s) Exclusive Time w.r.t. Wall Time run_8_threads (s) Exclusive Time w.r.t. Wall Time run_16_threads (s) Exclusive Time w.r.t. Wall Time run_32_threads (s) Exclusive Time w.r.t. Wall Time run_48_threads (s) Exclusive Time w.r.t. Wall Time run_64_threads (s) Nb Threads run_1_thread Nb Threads run_2_threads Nb Threads run_4_threads Nb Threads run_8_threads Nb Threads run_16_threads Nb Threads run_32_threads Nb Threads run_48_threads Nb Threads run_64_threads Deviation (coverage) run_1_thread Deviation (coverage) run_2_threads Deviation (coverage) run_4_threads Deviation (coverage) run_8_threads Deviation (coverage) run_16_threads Deviation (coverage) run_32_threads Deviation (coverage) run_48_threads Deviation (coverage) run_64_threads Deviation (walltime) run_1_thread Deviation (walltime) run_2_threads Deviation (walltime) run_4_threads Deviation (walltime) run_8_threads Deviation (walltime) run_16_threads Deviation (walltime) run_32_threads Deviation (walltime) run_48_threads Deviation (walltime) run_64_threads Categories run_1_thread Categories run_2_threads Categories run_4_threads Categories run_8_threads Categories run_16_threads Categories run_32_threads Categories run_48_threads Categories run_64_threads GFLOPS run_1_thread GFLOPS run_2_threads GFLOPS run_4_threads GFLOPS run_8_threads GFLOPS run_16_threads GFLOPS run_32_threads GFLOPS run_48_threads GFLOPS run_64_threads Compilation Options (run_1_thread) Efficiency (run_1_thread) Potential Speed-Up (%) (run_2_threads) Efficiency (run_2_threads) Potential Speed-Up (%) (run_4_threads) Efficiency (run_4_threads) Potential Speed-Up (%) (run_8_threads) Efficiency (run_8_threads) Potential Speed-Up (%) (run_16_threads) Efficiency (run_16_threads) Potential Speed-Up (%) (run_32_threads) Efficiency (run_32_threads) Potential Speed-Up (%) (run_48_threads) Efficiency (run_48_threads) Potential Speed-Up (%) (run_64_threads) Efficiency (run_64_threads) Potential Speed-Up (%)
NameModuleCoverage run_1_thread (%)Coverage run_2_threads (%)Coverage run_4_threads (%)Coverage run_8_threads (%)Coverage run_16_threads (%)Coverage run_32_threads (%)Coverage run_48_threads (%)Coverage run_64_threads (%)Coverage Excluding Loops run_1_thread (%)Coverage Excluding Loops run_2_threads (%)Coverage Excluding Loops run_4_threads (%)Coverage Excluding Loops run_8_threads (%)Coverage Excluding Loops run_16_threads (%)Coverage Excluding Loops run_32_threads (%)Coverage Excluding Loops run_48_threads (%)Coverage Excluding Loops run_64_threads (%)Max Inclusive Time Over Threads run_1_thread (s)Max Inclusive Time Over Threads run_2_threads (s)Max Inclusive Time Over Threads run_4_threads (s)Max Inclusive Time Over Threads run_8_threads (s)Max Inclusive Time Over Threads run_16_threads (s)Max Inclusive Time Over Threads run_32_threads (s)Max Inclusive Time Over Threads run_48_threads (s)Max Inclusive Time Over Threads run_64_threads (s)Max Exclusive Time Over Threads run_1_thread (s)Max Exclusive Time Over Threads run_2_threads (s)Max Exclusive Time Over Threads run_4_threads (s)Max Exclusive Time Over Threads run_8_threads (s)Max Exclusive Time Over Threads run_16_threads (s)Max Exclusive Time Over Threads run_32_threads (s)Max Exclusive Time Over Threads run_48_threads (s)Max Exclusive Time Over Threads run_64_threads (s)Inclusive Time w.r.t. Wall Time run_1_thread (s)Inclusive Time w.r.t. Wall Time run_2_threads (s)Inclusive Time w.r.t. Wall Time run_4_threads (s)Inclusive Time w.r.t. Wall Time run_8_threads (s)Inclusive Time w.r.t. Wall Time run_16_threads (s)Inclusive Time w.r.t. Wall Time run_32_threads (s)Inclusive Time w.r.t. Wall Time run_48_threads (s)Inclusive Time w.r.t. Wall Time run_64_threads (s)Exclusive Time w.r.t. Wall Time run_1_thread (s)Exclusive Time w.r.t. Wall Time run_2_threads (s)Exclusive Time w.r.t. Wall Time run_4_threads (s)Exclusive Time w.r.t. Wall Time run_8_threads (s)Exclusive Time w.r.t. Wall Time run_16_threads (s)Exclusive Time w.r.t. Wall Time run_32_threads (s)Exclusive Time w.r.t. Wall Time run_48_threads (s)Exclusive Time w.r.t. Wall Time run_64_threads (s)Nb Threads run_1_threadNb Threads run_2_threadsNb Threads run_4_threadsNb Threads run_8_threadsNb Threads run_16_threadsNb Threads run_32_threadsNb Threads run_48_threadsNb Threads run_64_threadsDeviation (coverage) run_1_threadDeviation (coverage) run_2_threadsDeviation (coverage) run_4_threadsDeviation (coverage) run_8_threadsDeviation (coverage) run_16_threadsDeviation (coverage) run_32_threadsDeviation (coverage) run_48_threadsDeviation (coverage) run_64_threadsDeviation (walltime) run_1_threadDeviation (walltime) run_2_threadsDeviation (walltime) run_4_threadsDeviation (walltime) run_8_threadsDeviation (walltime) run_16_threadsDeviation (walltime) run_32_threadsDeviation (walltime) run_48_threadsDeviation (walltime) run_64_threadsCategories run_1_threadCategories run_2_threadsCategories run_4_threadsCategories run_8_threadsCategories run_16_threadsCategories run_32_threadsCategories run_48_threadsCategories run_64_threadsGFLOPS run_1_threadGFLOPS run_2_threadsGFLOPS run_4_threadsGFLOPS run_8_threadsGFLOPS run_16_threadsGFLOPS run_32_threadsGFLOPS run_48_threadsGFLOPS run_64_threadsCompilation Options(run_1_thread) Efficiency(run_1_thread) Potential Speed-Up (%)(run_2_threads) Efficiency(run_2_threads) Potential Speed-Up (%)(run_4_threads) Efficiency(run_4_threads) Potential Speed-Up (%)(run_8_threads) Efficiency(run_8_threads) Potential Speed-Up (%)(run_16_threads) Efficiency(run_16_threads) Potential Speed-Up (%)(run_32_threads) Efficiency(run_32_threads) Potential Speed-Up (%)(run_48_threads) Efficiency(run_48_threads) Potential Speed-Up (%)(run_64_threads) Efficiency(run_64_threads) Potential Speed-Up (%)
k_means(int, point_t&, point_t&, int*, point_t&, int, int) [clone .omp_outlined]+kmeans-acfl-O3-soa95.8994.3391.3385.8376.8863.2553.7246.900.000.000.000.000.000.000.000.00215.89108.3254.0927.3313.616.854.583.440.000.000.000.000.000.000.000.00215.89110.9157.8431.3817.5810.207.455.970.000.000.000.000.000.000.000.001248163248640.003.194.044.664.733.883.112.610.000.190.060.040.020.010.010.01Exe (%): 100.00Exe (%): 100.00Exe (%): 100.00Exe (%): 100.00Exe (%): 100.00Exe (%): 100.00Exe (%): 100.00Exe (%): 100.004.158.0815.5028.5650.9987.88120.37150.11Arm C/C++/Fortran Compiler version 24.10.1 (build number 4) (based on LLVM 19.1.0) /opt/arm/arm-linux-compiler-24.10.1_Ubuntu-20.04/llvm-bin/clang-19 --driver-mode=g++ -I . -MMD -MP -march=native -std=c++14 -g -fno-omit-frame-pointer -fopenmp -O3 -grecord-...100.972.520.936.110.8612.030.7717.870.6621.410.621.270.5620.4
Loop 7 - main_soa.cpp:58-69 - kmeans-acfl-O3-soa+95.8994.3391.3385.8376.8863.2553.7246.900.000.000.000.000.000.000.000.00215.89108.5954.7227.6813.947.274.873.690.000.000.000.000.000.000.000.00215.89110.9157.8431.3817.5810.207.455.970.000.000.000.000.000.000.000.00000001000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.00
Loop 8 - main_soa.cpp:59-69 - kmeans-acfl-O3-soa+95.8994.3391.3385.8376.8863.2553.7246.9019.4019.1718.1717.4815.7512.8410.729.34215.89108.5954.7227.6813.947.274.873.6943.6722.2511.165.752.911.581.050.79215.89110.9157.8431.3817.5810.207.455.9743.6722.5411.516.393.602.071.491.191248163248640.000.351.051.241.051.200.970.900.000.380.320.150.090.090.060.064.017.8415.2727.5248.7784.70118.33146.77100.970.60.950.930.852.550.763.810.664.370.614.160.573.98
Loop 9 - main_soa.cpp:62-67 - kmeans-acfl-O3-soa76.5075.1673.1668.3561.1350.4143.0037.5676.5075.1673.1668.3561.1350.4143.0037.56172.2286.3443.5621.9211.035.693.822.89172.2286.3443.5621.9211.035.693.822.89172.2288.3846.3424.9913.988.135.964.78172.2288.3846.3424.9913.988.135.964.781248163248640.002.843.203.513.843.132.622.310.000.190.310.150.080.090.060.064.198.1415.5528.8251.5688.69120.88150.94100.971.920.935.180.869.470.7714.060.6617.040.617.110.5616.42
k_means(int, point_t&, point_t&, int*, point_t&, int, int)+kmeans-acfl-O3-soa4.114.033.913.653.272.682.281.990.000.000.000.000.000.000.000.009.249.249.249.269.249.269.289.290.000.000.000.000.000.000.010.009.244.742.471.330.750.430.320.250.000.000.000.000.000.000.000.00111111110.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.00Exe (%): 100.00Exe (%): 100.00Exe (%): 100.00Exe (%): 100.00Exe (%): 100.00Exe (%): 100.00Exe (%): 100.00Exe (%): 100.000.541.062.023.756.6911.5615.8519.77Arm C/C++/Fortran Compiler version 24.10.1 (build number 4) (based on LLVM 19.1.0) /opt/arm/arm-linux-compiler-24.10.1_Ubuntu-20.04/llvm-bin/clang-19 --driver-mode=g++ -I . -MMD -MP -march=native -std=c++14 -g -fno-omit-frame-pointer -fopenmp -O3 -grecord-...100.980.10.930.260.870.490.770.740.670.890.610.890.570.85
Loop 4 - main_soa.cpp:56-93 - kmeans-acfl-O3-soa [...]+4.114.033.913.653.272.682.271.990.000.000.000.000.000.000.000.009.249.249.249.269.249.269.279.290.000.000.000.000.000.000.000.009.244.742.471.330.750.430.320.250.000.000.000.000.000.000.000.00000000000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.00
Loop 6 - main_soa.cpp:81-84 - kmeans-acfl-O3-soa4.114.033.913.653.272.682.271.994.114.033.913.653.272.682.271.999.249.249.249.269.249.269.279.299.249.249.249.269.249.269.279.299.244.742.471.330.750.430.320.259.244.742.471.330.750.430.320.25111111110.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.541.062.023.756.6911.5615.8619.77100.980.10.930.260.870.490.770.740.670.890.610.880.570.85
Loop 5 - main_soa.cpp:86-93 - kmeans-acfl-O3-soa0.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.00000000000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.00
kmp_flag_native<unsigned long long, (flag_type)1, true>::notdone_check()libomp.so0.000.120.410.811.502.473.183.880.000.120.410.811.502.473.183.880.000.280.370.340.350.380.380.420.000.280.370.340.350.380.380.420.000.150.260.300.340.400.440.490.000.150.260.300.340.400.440.490138163147630.000.000.080.360.460.370.500.510.000.000.050.110.080.040.040.04NAOMP (%): 100.00OMP (%): 100.00OMP (%): 100.00OMP (%): 100.00OMP (%): 100.00OMP (%): 100.00OMP (%): 100.000.000.000.000.000.000.000.000.001010101010101010
unknown_functionlibc.so.60.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.00000000010.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.00NANANANANANANAPthread (%): 100.000.000.000.000.000.000.000.000.00
__sched_yieldlibc.so.60.000.070.170.370.781.281.741.990.000.070.170.370.781.281.741.990.000.150.160.170.210.180.200.210.000.150.160.170.210.180.200.210.000.080.110.130.180.210.240.250.000.080.110.130.180.210.240.250138153147630.000.000.060.160.190.170.310.370.000.000.040.050.030.020.030.03NAPthread (%): 100.00
System (%): 0.00
Pthread (%): 100.00Pthread (%): 99.47
OMP (%): 0.53
Pthread (%): 100.00
System (%): 0.00
Pthread (%): 100.00
System (%): 0.00
Pthread (%): 100.00
System (%): 0.00
Pthread (%): 100.00
System (%): 0.00
0.000.000.000.000.000.000.000.001010101010101010
unknown_function[vdso]0.000.010.030.070.140.200.280.330.000.000.000.000.000.000.000.000.000.020.030.060.050.060.050.050.000.000.000.000.000.000.000.000.000.010.020.030.030.030.040.040.000.000.000.000.000.000.000.000137153147630.000.000.010.060.060.100.120.150.000.000.010.020.010.010.010.01NAPthread (%): 100.00Pthread (%): 100.00Pthread (%): 100.00Pthread (%): 100.00
Others (%): 0.00
Pthread (%): 100.00Pthread (%): 100.00
Others (%): 0.00
Pthread (%): 100.00
Others (%): 0.00
0.000.000.000.000.000.000.000.001010101010101010
parse_printf_formatlibc.so.60.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.00000010010.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.00NANANANAIO (%): 100.00NANAIO (%): 100.000.000.000.000.000.000.000.000.00
__kmp_hyper_barrier_release(barrier_type, kmp_info*, int, int, int, void*)libomp.so0.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.00000000100.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.00NANANANANANAOMP (%): 100.00NA0.000.000.000.000.000.000.000.00
kmp_flag_64<false, true>::wait(kmp_info*, int, void*)libomp.so0.001.424.139.2217.3229.9338.6044.660.001.424.139.2217.3229.9338.6044.660.003.263.313.443.483.483.533.510.003.263.313.443.483.483.533.510.001.672.623.373.964.835.355.690.001.672.623.373.964.835.355.690138153248640.000.000.093.790.405.575.815.780.000.000.051.180.080.590.490.42NAOMP (%): 100.00OMP (%): 100.00OMP (%): 100.00OMP (%): 100.00OMP (%): 100.00OMP (%): 100.00OMP (%): 100.000.000.000.000.000.000.000.000.001010101010101010
__kmp_join_barrier(int)libomp.so0.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.00000000100.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.00NANANANANANAOMP (%): 100.00NA0.000.000.000.000.000.000.000.00
__kmp_yieldlibomp.so0.000.010.000.010.020.060.060.060.000.010.000.010.020.060.060.060.000.020.000.010.020.010.010.020.000.020.000.010.020.010.010.020.000.010.000.000.010.010.010.010.000.010.000.000.010.010.010.01012472629380.000.000.000.020.030.030.040.060.000.000.000.000.000.000.000.00NAOMP (%): 100.00OMP (%): 100.00OMP (%): 100.00OMP (%): 100.00OMP (%): 100.00OMP (%): 100.00OMP (%): 100.000.000.000.000.000.000.000.000.001010101010101010
__kmp_init_implicit_tasklibomp.so0.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.00000000100.000.000.000.000.000.000.000.000.000.000.000.000.000.000.000.00NANANANANANAOMP (%): 100.00NA0.000.000.000.000.000.000.000.00
×