options

Loops Index

57 loops have been discarded from the report because their ratio ((Max Inclusive Time Over Threads * 100) / Max Thread Active Time) is lower than the threshold set by object_coverage_threshold (0.01%). Together they represent about 0.02% of the application. To include them, change the value of object_coverage_threshold in the experiment directory configuration file, then rerun the command with the additional parameter --force-static-analysis.

Columns Filter

Level Max Thread Time / Walltime gcc_3 (%) Exclusive Coverage gcc_3 (%) Inclusive Coverage gcc_3 (%) Max Exclusive Time Over Threads gcc_3 (s) Max Inclusive Time Over Threads gcc_3 (s) Exclusive Time w.r.t. Wall Time gcc_3 (s) Inclusive Time w.r.t. Wall Time gcc_3 (s) Nb Threads gcc_3 GFLOPS gcc_3 Vectorization Ratio (%) Vector Length Use (%) Speedup If No Scalar Integer Speedup If FP Vectorized Speedup If Fully Vectorized Speedup If Perfect Load Balancing gcc_3 Stride 0 Stride 1 Stride n Stride Unknown Stride Indirect Array Access Efficiency Level Max Thread Time / Walltime Exclusive Coverage Inclusive Coverage Max Exclusive Time Over Threads Max Inclusive Time Over Threads Exclusive Time w.r.t. Wall Time Inclusive Time w.r.t. Wall Time Nb Threads GFLOPS Vectorization Ratio Vector Length Use Speedup If No Scalar Integer Speedup If FP Vectorized Speedup If Fully Vectorized Speedup If Perfect Load Balancing Stride 0 Stride 1 Stride n Stride Unknown Stride Indirect Array Access Efficiency
Loop idSource LocationSource FunctionLevelMax Thread Time / Walltime gcc_3 (%)Exclusive Coverage gcc_3 (%)Inclusive Coverage gcc_3 (%)Max Exclusive Time Over Threads gcc_3 (s)Max Inclusive Time Over Threads gcc_3 (s)Exclusive Time w.r.t. Wall Time gcc_3 (s)Inclusive Time w.r.t. Wall Time gcc_3 (s)Nb Threads gcc_3GFLOPS gcc_3Vectorization Ratio (%)Vector Length Use (%)Speedup If No Scalar IntegerSpeedup If FP VectorizedSpeedup If Fully VectorizedSpeedup If Perfect Load Balancing gcc_3Stride 0Stride 1Stride nStride UnknownStride IndirectArray Access Efficiency
29352exec - pair_eam_intel.cpp:312-323void LAMMPS_NS::PairEAMIntel::eval<1, 0, 1, float, double>(int, int, LAMMPS_NS::IntelBuffers<float, double>*, LAMMPS_NS::PairEAMIntel::ForceConst<float> const&, int, int) [clone ._omp_fn.0]Innermost9.2511.9911.9918.0918.0921.0621.06256227.9906.2512.91161.07NANANANANA0.00
29340exec - pair_eam_intel.cpp:513-527void LAMMPS_NS::PairEAMIntel::eval<1, 0, 1, float, double>(int, int, LAMMPS_NS::IntelBuffers<float, double>*, LAMMPS_NS::PairEAMIntel::ForceConst<float> const&, int, int) [clone ._omp_fn.0]Innermost9.1111.4711.4717.8317.8320.1520.15256239.6406.251.151.38161.1NANANANANA0.00
29341exec - pair_eam_intel.cpp:541-588 [...]void LAMMPS_NS::PairEAMIntel::eval<1, 0, 1, float, double>(int, int, LAMMPS_NS::IntelBuffers<float, double>*, LAMMPS_NS::PairEAMIntel::ForceConst<float> const&, int, int) [clone ._omp_fn.0]Innermost7.319.169.1614.3014.3016.0916.09256865.8114.899.971.021.989.221.111503175.00
26581exec - npair_intel.cpp:474-558 [...]void LAMMPS_NS::NPairIntel::bin_newton<float, double, 0, 0, 0, 0, 0>(int, LAMMPS_NS::NeighList*, LAMMPS_NS::IntelBuffers<float, double>*, int, int, int) [clone ._omp_fn.0]Innermost2.963.833.835.785.786.736.73256430.5306.251.12.36161.07NANANANANA0.00
29353exec - pair_eam_intel.cpp:335-359 [...]void LAMMPS_NS::PairEAMIntel::eval<1, 0, 1, float, double>(int, int, LAMMPS_NS::IntelBuffers<float, double>*, LAMMPS_NS::PairEAMIntel::ForceConst<float> const&, int, int) [clone ._omp_fn.0]Innermost2.663.363.365.215.215.905.90256704.5007.6611.8371.10005050.00
29351exec - pair_eam_intel.cpp:291-363 [...]void LAMMPS_NS::PairEAMIntel::eval<1, 0, 1, float, double>(int, int, LAMMPS_NS::IntelBuffers<float, double>*, LAMMPS_NS::PairEAMIntel::ForceConst<float> const&, int, int) [clone ._omp_fn.0]Outermost0.861.0216.371.6924.731.8028.76256339.853.647.951.673.1514.941.17NANANANANA0.00
26589exec - npair_intel.cpp:343-379 [...]void LAMMPS_NS::NPairIntel::bin_newton<float, double, 0, 0, 0, 0, 0>(int, LAMMPS_NS::NeighList*, LAMMPS_NS::IntelBuffers<float, double>*, int, int, int) [clone ._omp_fn.0]InBetween0.630.740.741.231.231.301.3025614.6831.3721.322.1719.421.18NANANANANA0.00
7258exec - fix_nve_intel.cpp:78-80LAMMPS_NS::FixNVEIntel::initial_integrate(int)Single0.750.730.731.461.461.281.28256156.281005011.1521.4203000100.00
29524exec - intel_buffers.h:228-231void LAMMPS_NS::PairEAMIntel::compute<float, double>(int, int, LAMMPS_NS::IntelBuffers<float, double>*, LAMMPS_NS::PairEAMIntel::ForceConst<float> const&) [clone ._omp_fn.0]Single0.600.660.661.181.181.161.162560.005014.06115.331.260128059.09
7072exec - fix_intel.cpp:884-885void LAMMPS_NS::FixIntel::add_oresults<LAMMPS_NS::IntelBuffers<float, double>::vec3_acc_t, double>(LAMMPS_NS::IntelBuffers<float, double>::vec3_acc_t const*, double const*, int, int, int, int) [clone ._omp_fn.0]Single0.590.590.591.141.141.041.0425666.94100501121.3802000100.00
26590exec - npair_intel.cpp:364-369void LAMMPS_NS::NPairIntel::bin_newton<float, double, 0, 0, 0, 0, 0>(int, LAMMPS_NS::NeighList*, LAMMPS_NS::IntelBuffers<float, double>*, int, int, int) [clone ._omp_fn.0]Innermost0.530.580.581.031.031.021.022560.0006.251.331161.260504077.78
29339exec - pair_eam_intel.cpp:484-606 [...]void LAMMPS_NS::PairEAMIntel::eval<1, 0, 1, float, double>(int, int, LAMMPS_NS::IntelBuffers<float, double>*, LAMMPS_NS::PairEAMIntel::ForceConst<float> const&, int, int) [clone ._omp_fn.0]Outermost0.480.5421.170.9433.080.9537.18256571.0012.99.881.92.0213.991.24NANANANANA0.00
7264exec - fix_nve_intel.cpp:134-135LAMMPS_NS::FixNVEIntel::final_integrate()Single0.490.420.420.960.960.740.74256134.371005011.0621.602000100.00
29328exec - pair_eam_intel.cpp:312-323void LAMMPS_NS::PairEAMIntel::eval<1, 1, 1, float, double>(int, int, LAMMPS_NS::IntelBuffers<float, double>*, LAMMPS_NS::PairEAMIntel::ForceConst<float> const&, int, int) [clone ._omp_fn.0]Innermost0.270.330.330.530.530.570.57256224.2706.2512.91161.14NANANANANA0.00
29315exec - pair_eam_intel.cpp:513-527void LAMMPS_NS::PairEAMIntel::eval<1, 1, 1, float, double>(int, int, LAMMPS_NS::IntelBuffers<float, double>*, LAMMPS_NS::PairEAMIntel::ForceConst<float> const&, int, int) [clone ._omp_fn.0]Innermost0.260.300.300.510.510.540.54256243.0006.251.151.38161.2NANANANANA0.00
26582exec - npair_intel.cpp:330-762 [...]void LAMMPS_NS::NPairIntel::bin_newton<float, double, 0, 0, 0, 0, 0>(int, LAMMPS_NS::NeighList*, LAMMPS_NS::IntelBuffers<float, double>*, int, int, int) [clone ._omp_fn.0]Outermost0.280.305.530.558.360.539.72256413.211.148.113.092.5614.691.3NANANANANA0.00
29317exec - pair_eam_intel.cpp:541-592 [...]void LAMMPS_NS::PairEAMIntel::eval<1, 1, 1, float, double>(int, int, LAMMPS_NS::IntelBuffers<float, double>*, LAMMPS_NS::PairEAMIntel::ForceConst<float> const&, int, int) [clone ._omp_fn.0]Innermost0.250.280.280.490.490.500.50256807.4413.739.81.011.9210.221.231503175.00
7889exec - atom_vec.cpp:735-739LAMMPS_NS::AtomVec::unpack_reverse(int, int*, double*)Single0.220.210.210.440.440.370.3725652.50012.51.141.2881.470044155.56
29342exec - pair_eam_intel.cpp:439-450void LAMMPS_NS::PairEAMIntel::eval<1, 0, 1, float, double>(int, int, LAMMPS_NS::IntelBuffers<float, double>*, LAMMPS_NS::PairEAMIntel::ForceConst<float> const&, int, int) [clone ._omp_fn.0]Single0.220.200.200.420.420.360.36256362.136.98.841.061.5612.521.471003241.67
9017exec - memory.h:53-80 [...]LAMMPS_NS::CommBrick::borders()Innermost0.170.170.170.330.330.300.302560.004.3511.552.72.1412.841.33NANANANANA0.00
1898exec - neighbor.cpp:2430-2435LAMMPS_NS::Neighbor::check_distance()Single0.210.170.170.410.410.290.29256150.842515.6311.086.121.740208060.00
8053exec - atom_vec.cpp:362-366LAMMPS_NS::AtomVec::pack_comm(int, int*, double*, int, int*)Single0.210.160.160.410.410.280.282560.00012.51.11181.80124156.25
7228exec - intel_buffers.h:210-214void LAMMPS_NS::NBinIntel::bin_atoms<float, double>(LAMMPS_NS::IntelBuffers<float, double>*) [clone ._omp_fn.0]Single0.130.130.130.250.250.230.232560.0033.3311.46115.331.310124064.29
29329exec - pair_eam_intel.cpp:335-359 [...]void LAMMPS_NS::PairEAMIntel::eval<1, 1, 1, float, double>(int, int, LAMMPS_NS::IntelBuffers<float, double>*, LAMMPS_NS::PairEAMIntel::ForceConst<float> const&, int, int) [clone ._omp_fn.0]Innermost0.100.090.090.210.210.170.17256671.0307.6611.8271.530005050.00
2000exec - neighbor.cpp:2480-2483LAMMPS_NS::Neighbor::build(int)Single0.100.090.090.190.190.150.152560.00012.51.11181.580208060.00
26588exec - npair_intel.cpp:414-457 [...]void LAMMPS_NS::NPairIntel::bin_newton<float, double, 0, 0, 0, 0, 0>(int, LAMMPS_NS::NeighList*, LAMMPS_NS::IntelBuffers<float, double>*, int, int, int) [clone ._omp_fn.0]Innermost0.080.070.070.170.170.130.13256306.6506.41.111.71161.62NANANANANA0.00
8969exec - comm_brick.cpp:709-1517 [...]LAMMPS_NS::CommBrick::exchange()Innermost0.070.060.060.140.140.100.102560.00510.942.63.0513.741.73NANANANANA0.00
20065exec - pair_eam.cpp:976-978LAMMPS_NS::PairEAM::unpack_reverse_comm(int, int*, double*)Single0.050.040.040.100.100.070.0725692.31012.51.041.4781.750208060.00
6231exec - domain_omp.cpp:57-57 [...]LAMMPS_NS::DomainOMP::pbc() [clone ._omp_fn.0]Single0.060.040.040.110.110.060.062560.00100501122.1701000100.00
7236exec - nbin_intel.cpp:220-225void LAMMPS_NS::NBinIntel::bin_atoms<float, double>(LAMMPS_NS::IntelBuffers<float, double>*)Single0.050.030.030.090.090.060.06256171.6107.811115.042.110012053.85
7722exec - atom.cpp:2414-2426LAMMPS_NS::Atom::sort()Single0.050.030.030.090.090.060.06256310.8509.381.522.1211.562.021004060.00
7992exec - atom_vec.cpp:1035-1041LAMMPS_NS::AtomVec::unpack_border(int, int, double*)Single0.050.030.030.090.090.050.052560.00010.582110.672.090064065.00
8015exec - atom_vec.cpp:804-810 [...]LAMMPS_NS::AtomVec::pack_border(int, int*, double*, int, int*)Single0.040.030.030.080.080.050.052560.0017.3912.231.1817.331.940122438.89
29327exec - pair_eam_intel.cpp:291-363 [...]void LAMMPS_NS::PairEAMIntel::eval<1, 1, 1, float, double>(int, int, LAMMPS_NS::IntelBuffers<float, double>*, LAMMPS_NS::PairEAMIntel::ForceConst<float> const&, int, int) [clone ._omp_fn.0]Outermost0.050.030.450.090.660.050.79256325.883.647.951.673.1514.942.46NANANANANA0.00
7235exec - nbin_intel.cpp:232-233void LAMMPS_NS::NBinIntel::bin_atoms<float, double>(LAMMPS_NS::IntelBuffers<float, double>*)Innermost0.040.030.030.070.070.050.052560.0009.38111620100150.00
8033exec - atom_vec.cpp:378-382LAMMPS_NS::AtomVec::pack_comm(int, int*, double*, int, int*)Single0.100.030.030.190.190.040.0418457.10012.51.111.1183.860124156.25
6230exec - domain_omp.cpp:74-150LAMMPS_NS::DomainOMP::pbc() [clone ._omp_fn.1]Single0.040.020.020.090.090.040.042560.09011.41.921.9211.572.47NANANANANA0.00
7721exec - atom.cpp:2439-2441LAMMPS_NS::Atom::sort()Innermost0.040.020.020.070.070.040.042560.0009.3811162.480100150.00
7170exec - intel_buffers.cpp:624-624LAMMPS_NS::IntelBuffers<float, double>::fdotr_reduce_l5(int, int, int, int, double&, double&, double&, double&, double&, double&)Single0.030.020.020.050.050.030.03256223.85011.2511.239.62.023040085.71
29207exec - pair_eam_intel.cpp:830-832LAMMPS_NS::PairEAMIntel::pack_forward_comm(int, int*, double*, int, int*)Single0.030.020.020.060.060.030.032550.0010039.291122.470110158.33
20064exec - pair_eam.cpp:965-965LAMMPS_NS::PairEAM::pack_reverse_comm(int, int, double*)Single0.030.020.020.050.050.030.032490.24100501122.2502000100.00
29314exec - pair_eam_intel.cpp:429-614 [...]void LAMMPS_NS::PairEAMIntel::eval<1, 1, 1, float, double>(int, int, LAMMPS_NS::IntelBuffers<float, double>*, LAMMPS_NS::PairEAMIntel::ForceConst<float> const&, int, int) [clone ._omp_fn.0]Outermost0.030.020.600.060.920.031.06256555.6322.0812.341.92.1413.052.79NANANANANA0.00
7234exec - nbin_intel.cpp:229-233void LAMMPS_NS::NBinIntel::bin_atoms<float, double>(LAMMPS_NS::IntelBuffers<float, double>*)Outermost0.030.010.040.060.110.030.072480.0006.771115.412.750002050.00
29205exec - pair_eam_intel.cpp:847-847LAMMPS_NS::PairEAMIntel::unpack_forward_comm(int, int, double*)Single0.030.010.010.050.050.020.022540.0010043.75112.42.5902000100.00
10532exec - compute_temp.cpp:90-92LAMMPS_NS::ComputeTemp::compute_scalar()Single0.020.010.010.040.040.020.02256171.23011.361.271.3102.49NANANANANA0.00
7719exec - atom.cpp:2462-2464LAMMPS_NS::Atom::sort()Innermost0.020.010.010.040.040.020.022450.0008.3311163.112001250.00
7720exec - atom.cpp:2437-2441LAMMPS_NS::Atom::sort()Outermost0.020.010.030.050.080.020.052340.0006.881115.33.070002050.00
29318exec - pair_eam_intel.cpp:439-461void LAMMPS_NS::PairEAMIntel::eval<1, 1, 1, float, double>(int, int, LAMMPS_NS::IntelBuffers<float, double>*, LAMMPS_NS::PairEAMIntel::ForceConst<float> const&, int, int) [clone ._omp_fn.0]Single0.020.010.010.030.030.010.01256539.073.968.8111.7412.172.92101258.33
7718exec - atom.cpp:2458-2467LAMMPS_NS::Atom::sort()Outermost0.020.010.020.040.060.010.032160.0006.631115.553.83NANANANANA70.00
8014exec - atom_vec.cpp:823-829 [...]LAMMPS_NS::AtomVec::pack_border(int, int*, double*, int, int*)Single0.030.010.010.050.050.010.0118353.9017.3912.231.11.17.334.490202437.50
26587exec - npair_intel.cpp:392-398void LAMMPS_NS::NPairIntel::bin_newton<float, double, 0, 0, 0, 0, 0>(int, LAMMPS_NS::NeighList*, LAMMPS_NS::IntelBuffers<float, double>*, int, int, int) [clone ._omp_fn.0]Innermost0.010.000.000.030.030.010.011780.0006.251.671162.950604080.00
4658exec - verlet.cpp:246-380 [...]LAMMPS_NS::Verlet::run(int)Single0.010.000.000.020.020.000.001391.511.927.813.01115.742.91NANANANANA0.00
×