| Function: ideal_gas_kernel(int, int, int, int, clover::Buffer2D<double>&, clover::Buffer2D<double>&, ... | Module: exec | Source: ideal_gas.cpp:37-45 [...] | Coverage (incl. loops): 6.90% | (excl. loops): 0.01% |
|---|
| Function: ideal_gas_kernel(int, int, int, int, clover::Buffer2D<double>&, clover::Buffer2D<double>&, ... | Module: exec | Source: ideal_gas.cpp:37-45 [...] | Coverage (incl. loops): 6.90% | (excl. loops): 0.01% |
|---|
/home/eoseret/qaas/qaas_runs/178-219-7589/intel/CloverLeaf2.0-CXX/build/CloverLeaf2.0-CXX/src/omp/ideal_gas.cpp: 37 - 45 |
-------------------------------------------------------------------------------- |
37: #pragma omp parallel for simd collapse(2) |
38: for (int j = (y_min + 1); j < (y_max + 2); j++) { |
39: for (int i = (x_min + 1); i < (x_max + 2); i++) { |
40: double v = 1.0 / density(i, j); |
41: pressure(i, j) = (1.4 - 1.0) * density(i, j) * energy(i, j); |
42: double pressurebyenergy = (1.4 - 1.0) * density(i, j); |
43: double pressurebyvolume = -density(i, j) * pressure(i, j); |
44: double sound_speed_squared = v * v * (pressure(i, j) * pressurebyenergy - pressurebyvolume); |
45: soundspeed(i, j) = std::sqrt(sound_speed_squared); |
/home/eoseret/qaas/qaas_runs/178-219-7589/intel/CloverLeaf2.0-CXX/build/CloverLeaf2.0-CXX/src/omp/context.h: 69 - 69 |
-------------------------------------------------------------------------------- |
69: T &operator()(size_t i, size_t j) const { return data[i + j * sizeX]; } |
0x437080 STP X29, X30, [SP, #-112]!
0x437084 ADD X29, SP, #0 |
0x437088 STP X19, X20, [SP, #16] |
0x43708c ORR X20, XZR, X0 |
0x437090 STP X21, X22, [SP, #32] |
0x437094 STP X23, X24, [SP, #48] |
0x437098 LDP W3, W22, [X0, #40] |
0x43709c LDR W23, [X0, #32] |
0x4370a0 LDR W0, [X0, #36] |
0x4370a4 ADD W1, W3, #1 |
0x4370a8 ADD W22, W22, #2 |
0x4370ac CMP W1, W22 |
0x4370b0 B.GE 437428 |
0x4370b4 ADD W23, W23, #1 |
0x4370b8 ADD W19, W0, #2 |
0x4370bc STP X25, X26, [SP, #64] |
0x4370c0 SUB W25, W22, W1 |
0x4370c4 STR W1, [SP, #108] |
0x4370c8 CMP W23, W19 |
0x4370cc B.GE 437424 |
0x4370d0 SUB W24, W19, W23 |
0x4370d4 BL 410210 |
0x4370d8 MUL W26, W25, W24 |
0x4370dc ORR W21, WZR, W0 |
0x4370e0 BL 410240 |
0x4370e4 LDR W6, [SP, #108] |
0x4370e8 ORR W4, WZR, W0 |
0x4370ec UDIV W2, W26, W21 |
0x4370f0 MSUB W5, W2, W21, W26 |
0x4370f4 CMP W0, W5 |
0x4370f8 B.CC 437458 |
0x4370fc MADD W21, W2, W4, W5 |
0x437100 ADD W7, W2, W21 |
0x437104 STR W7, [SP, #108] |
0x437108 CMP W21, W7 |
0x43710c B.CS 437424 |
0x437110 UDIV W8, W21, W24 |
0x437114 ORR X9, XZR, #0x66 |
0x437118 ADRP X10, <462118>
0x43711c MOVK X9, #16374 |
0x437120 STP X27, X28, [SP, #80] |
0x437124 FMOV D24, #1.0000000 |
0x437128 FMOV V27.2D, #1.0000000 |
0x43712c FMOV D26, X9 |
0x437130 LDR D25, [X10, #504] |
0x437134 LDP X28, X27, [X20] |
0x437138 LDP X26, X25, [X20, #16] |
0x43713c MSUB W11, W8, W24, W21 |
0x437140 ADD W12, W8, W6 |
0x437144 DUP V28.2D, V25.D[0] |
0x437148 SBFM X5, X12, #0, #31 |
0x43714c DUP V29.2D, V26.D[0] |
0x437150 ADD W4, W11, W23 |
0x437154 SUB W30, W19, W4 |
0x437158 HINT #0 |
0x43715c HINT #0 |
(246) 0x437160 CMP W2, W30 |
(246) 0x437164 CSEL W2, W2, W30, #9 |
(246) 0x437168 ADD W19, W21, W2 |
(246) 0x43716c CMP W21, W19 |
(246) 0x437170 B.CS 437404 |
(246) 0x437174 LDR X13, [X26] |
(246) 0x437178 LDR X14, [X25] |
(246) 0x43717c LDR X15, [X27] |
(246) 0x437180 MUL X12, X5, X13 |
(246) 0x437184 LDR X16, [X28] |
(246) 0x437188 MUL X14, X5, X14 |
(246) 0x43718c LDR X20, [X25, #16] |
(246) 0x437190 MUL X13, X5, X15 |
(246) 0x437194 LDR X21, [X26, #16] |
(246) 0x437198 MUL X10, X5, X16 |
(246) 0x43719c LDR X30, [X27, #16] |
(246) 0x4371a0 LDR X18, [X28, #16] |
(246) 0x4371a4 CMP W2, #1 |
(246) 0x4371a8 B.EQ 4373b4 |
(246) 0x4371ac UBFM W17, W2, #1, #31 |
(246) 0x4371b0 SBFM X3, X4, #0, #31 |
(246) 0x4371b4 UBFM X11, X17, #60, #59 |
(246) 0x4371b8 ADD X6, X10, X3 |
(246) 0x4371bc SUB X7, X11, #16 |
(246) 0x4371c0 ADD X17, X13, X3 |
(246) 0x4371c4 ADD X1, X18, X6,LSL #3 |
(246) 0x4371c8 UBFM X9, X7, #4, #63 |
(246) 0x4371cc ADD X16, X12, X3 |
(246) 0x4371d0 ADD X8, X30, X17,LSL #3 |
(246) 0x4371d4 ADD X15, X9, #1 |
(246) 0x4371d8 ADD X3, X14, X3 |
(246) 0x4371dc ADD X7, X21, X16,LSL #3 |
(246) 0x4371e0 ANDS X9, X15, #0x3 |
(246) 0x4371e4 MOVZ X0, #0 |
(246) 0x4371e8 UBFM X15, X6, #61, #60 |
(246) 0x4371ec UBFM X17, X17, #61, #60 |
(246) 0x4371f0 ADD X6, X20, X3,LSL #3 |
(246) 0x4371f4 UBFM X16, X16, #61, #60 |
(246) 0x4371f8 UBFM X3, X3, #61, #60 |
(246) 0x4371fc B.EQ 4372c0 |
(246) 0x437200 CMP X9, #1 |
(246) 0x437204 B.EQ 437280 |
(246) 0x437208 CMP X9, #2 |
(246) 0x43720c B.EQ 437248 |
(246) 0x437210 LDR Q23, [X18, X15] |
(246) 0x437214 MOVZ X0, #16 |
(246) 0x437218 LDR Q30, [X30, X17] |
(246) 0x43721c FDIV V31.2D, V27.2D, V23.2D |
(246) 0x437220 FMUL V0.2D, V30.2D, V23.2D |
(246) 0x437224 FMUL V1.2D, V31.2D, V31.2D |
(246) 0x437228 FMUL V2.2D, V0.2D, V28.2D |
(246) 0x43722c STR Q2, [X21, X16] |
(246) 0x437230 LDR Q3, [X18, X15] |
(246) 0x437234 FMUL V4.2D, V3.2D, V29.2D |
(246) 0x437238 FMUL V5.2D, V4.2D, V2.2D |
(246) 0x43723c FMUL V6.2D, V5.2D, V1.2D |
(246) 0x437240 FSQRT V7.2D, V6.2D |
(246) 0x437244 STR Q7, [X20, X3] |
(246) 0x437248 LDR Q16, [X1, X0] |
(246) 0x43724c LDR Q17, [X8, X0] |
(246) 0x437250 FDIV V18.2D, V27.2D, V16.2D |
(246) 0x437254 FMUL V19.2D, V17.2D, V16.2D |
(246) 0x437258 FMUL V20.2D, V18.2D, V18.2D |
(246) 0x43725c FMUL V21.2D, V19.2D, V28.2D |
(246) 0x437260 STR Q21, [X7, X0] |
(246) 0x437264 LDR Q22, [X1, X0] |
(246) 0x437268 FMUL V23.2D, V22.2D, V29.2D |
(246) 0x43726c FMUL V30.2D, V23.2D, V21.2D |
(246) 0x437270 FMUL V31.2D, V30.2D, V20.2D |
(246) 0x437274 FSQRT V0.2D, V31.2D |
(246) 0x437278 STR Q0, [X6, X0] |
(246) 0x43727c ADD X0, X0, #16 |
(246) 0x437280 LDR Q1, [X1, X0] |
(246) 0x437284 LDR Q2, [X8, X0] |
(246) 0x437288 FDIV V3.2D, V27.2D, V1.2D |
(246) 0x43728c FMUL V4.2D, V2.2D, V1.2D |
(246) 0x437290 FMUL V5.2D, V3.2D, V3.2D |
(246) 0x437294 FMUL V6.2D, V4.2D, V28.2D |
(246) 0x437298 STR Q6, [X7, X0] |
(246) 0x43729c LDR Q7, [X1, X0] |
(246) 0x4372a0 FMUL V16.2D, V7.2D, V29.2D |
(246) 0x4372a4 FMUL V17.2D, V16.2D, V6.2D |
(246) 0x4372a8 FMUL V18.2D, V17.2D, V5.2D |
(246) 0x4372ac FSQRT V19.2D, V18.2D |
(246) 0x4372b0 STR Q19, [X6, X0] |
(246) 0x4372b4 ADD X0, X0, #16 |
(246) 0x4372b8 CMP X11, X0 |
(246) 0x4372bc B.EQ 4373a8 |
(247) 0x4372c0 LDR Q20, [X1, X0] |
(247) 0x4372c4 ADD X17, X0, #16 |
(247) 0x4372c8 ADD X15, X0, #32 |
(247) 0x4372cc ADD X9, X0, #48 |
(247) 0x4372d0 LDR Q21, [X8, X0] |
(247) 0x4372d4 FDIV V22.2D, V27.2D, V20.2D |
(247) 0x4372d8 FMUL V30.2D, V21.2D, V20.2D |
(247) 0x4372dc FMUL V23.2D, V22.2D, V22.2D |
(247) 0x4372e0 FMUL V0.2D, V30.2D, V28.2D |
(247) 0x4372e4 STR Q0, [X7, X0] |
(247) 0x4372e8 LDR Q31, [X1, X0] |
(247) 0x4372ec FMUL V1.2D, V31.2D, V29.2D |
(247) 0x4372f0 FMUL V2.2D, V1.2D, V0.2D |
(247) 0x4372f4 FMUL V3.2D, V2.2D, V23.2D |
(247) 0x4372f8 FSQRT V4.2D, V3.2D |
(247) 0x4372fc STR Q4, [X6, X0] |
(247) 0x437300 ADD X0, X0, #64 |
(247) 0x437304 LDR Q5, [X1, X17] |
(247) 0x437308 LDR Q6, [X8, X17] |
(247) 0x43730c FDIV V7.2D, V27.2D, V5.2D |
(247) 0x437310 FMUL V16.2D, V6.2D, V5.2D |
(247) 0x437314 FMUL V17.2D, V7.2D, V7.2D |
(247) 0x437318 FMUL V18.2D, V16.2D, V28.2D |
(247) 0x43731c STR Q18, [X7, X17] |
(247) 0x437320 LDR Q19, [X1, X17] |
(247) 0x437324 FMUL V20.2D, V19.2D, V29.2D |
(247) 0x437328 FMUL V21.2D, V20.2D, V18.2D |
(247) 0x43732c FMUL V22.2D, V21.2D, V17.2D |
(247) 0x437330 FSQRT V30.2D, V22.2D |
(247) 0x437334 STR Q30, [X6, X17] |
(247) 0x437338 LDR Q23, [X1, X15] |
(247) 0x43733c LDR Q0, [X8, X15] |
(247) 0x437340 FDIV V31.2D, V27.2D, V23.2D |
(247) 0x437344 FMUL V1.2D, V0.2D, V23.2D |
(247) 0x437348 FMUL V2.2D, V31.2D, V31.2D |
(247) 0x43734c FMUL V3.2D, V1.2D, V28.2D |
(247) 0x437350 STR Q3, [X7, X15] |
(247) 0x437354 LDR Q4, [X1, X15] |
(247) 0x437358 FMUL V5.2D, V4.2D, V29.2D |
(247) 0x43735c FMUL V6.2D, V5.2D, V3.2D |
(247) 0x437360 FMUL V7.2D, V6.2D, V2.2D |
(247) 0x437364 FSQRT V16.2D, V7.2D |
(247) 0x437368 STR Q16, [X6, X15] |
(247) 0x43736c LDR Q17, [X1, X9] |
(247) 0x437370 LDR Q18, [X8, X9] |
(247) 0x437374 FDIV V19.2D, V27.2D, V17.2D |
(247) 0x437378 FMUL V20.2D, V18.2D, V17.2D |
(247) 0x43737c FMUL V21.2D, V19.2D, V19.2D |
(247) 0x437380 FMUL V22.2D, V20.2D, V28.2D |
(247) 0x437384 STR Q22, [X7, X9] |
(247) 0x437388 LDR Q30, [X1, X9] |
(247) 0x43738c FMUL V23.2D, V30.2D, V29.2D |
(247) 0x437390 FMUL V0.2D, V23.2D, V22.2D |
(247) 0x437394 FMUL V31.2D, V0.2D, V21.2D |
(247) 0x437398 FSQRT V1.2D, V31.2D |
(247) 0x43739c STR Q1, [X6, X9] |
(247) 0x4373a0 CMP X11, X0 |
(247) 0x4373a4 B.NE 4372c0 |
(246) 0x4373a8 TBZ W2, #0, 437400 |
(246) 0x4373ac AND W2, W2, #0xfffffffe |
(246) 0x4373b0 ADD W4, W4, W2 |
(246) 0x4373b4 SBFM X11, X4, #0, #31 |
(246) 0x4373b8 ADD X10, X10, X11 |
(246) 0x4373bc ADD X13, X13, X11 |
(246) 0x4373c0 UBFM X1, X10, #61, #60 |
(246) 0x4373c4 ADD X12, X12, X11 |
(246) 0x4373c8 LDR D2, [X30, X13,LSL #3] |
(246) 0x4373cc ADD X14, X14, X11 |
(246) 0x4373d0 LDR D3, [X18, X1] |
(246) 0x4373d4 FMUL D4, D3, D2 |
(246) 0x4373d8 FDIV D5, D24, D3 |
(246) 0x4373dc FMUL D6, D4, D25 |
(246) 0x4373e0 STR D6, [X21, X12,LSL #3] |
(246) 0x4373e4 LDR D7, [X18, X1] |
(246) 0x4373e8 FMUL D16, D5, D5 |
(246) 0x4373ec FMUL D17, D7, D26 |
(246) 0x4373f0 FMUL D18, D17, D6 |
(246) 0x4373f4 FMUL D19, D18, D16 |
(246) 0x4373f8 FSQRT D20, D19 |
(246) 0x4373fc STR D20, [X20, X14,LSL #3] |
(246) 0x437400 ORR W21, WZR, W19 |
(246) 0x437404 ADD X5, X5, #1 |
(246) 0x437408 CMP W22, W5 |
(246) 0x43740c B.LE 43743c |
(246) 0x437410 LDR W19, [SP, #108] |
(246) 0x437414 ORR W4, WZR, W23 |
(246) 0x437418 ORR W30, WZR, W24 |
(246) 0x43741c SUB W2, W19, W21 |
(246) 0x437420 B 437160 |
0x437424 LDP X25, X26, [SP, #64] |
0x437428 LDP X19, X20, [SP, #16] |
0x43742c LDP X21, X22, [SP, #32] |
0x437430 LDP X23, X24, [SP, #48] |
0x437434 LDP X29, X30, [SP], #112 |
0x437438 RET |
0x43743c LDP X25, X26, [SP, #64] |
0x437440 LDP X27, X28, [SP, #80] |
0x437444 LDP X19, X20, [SP, #16] |
0x437448 LDP X21, X22, [SP, #32] |
0x43744c LDP X23, X24, [SP, #48] |
0x437450 LDP X29, X30, [SP], #112 |
0x437454 RET |
0x437458 ADD W2, W2, #1 |
0x43745c MOVZ W5, #0 |
0x437460 B 4370fc |
| Coverage (%) | Name | Source Location | Module |
|---|---|---|---|
| ►47.07+ | GOMP_parallel | libgomp.so.1.0.0 | |
| ○ | ideal_gas(global_variables&, i[...] | ideal_gas.cpp:47 | exec |
| ○ | PdV(global_variables&, bool) | PdV.cpp:115 | exec |
| ○ | hydro(global_variables&, paral[...] | hydro.cpp:64 | exec |
| ○ | main | clover_leaf.cpp:209 | exec |
| ○ | __libc_start_call_main | libc.so.6 | |
| ○ | __libc_start_main | libc.so.6 | |
| ○ | _start | clover_leaf.cpp:51 | exec |
| ►46.98+ | GOMP_parallel | libgomp.so.1.0.0 | |
| ○ | ideal_gas(global_variables&, i[...] | ideal_gas.cpp:47 | exec |
| ○ | timestep(global_variables&, pa[...] | timestep.cpp:47 | exec |
| ○ | hydro(global_variables&, paral[...] | basic_string.h:1076 | exec |
| ○ | main | clover_leaf.cpp:209 | exec |
| ○ | __libc_start_call_main | libc.so.6 | |
| ○ | __libc_start_main | libc.so.6 | |
| ○ | _start | clover_leaf.cpp:51 | exec |
| ►4.33+ | GOMP_parallel | libgomp.so.1.0.0 | |
| ○ | ideal_gas(global_variables&, i[...] | ideal_gas.cpp:47 | exec |
| ○ | field_summary(global_variables[...] | field_summary.cpp:51 | exec |
| ○ | hydro(global_variables&, paral[...] | hydro.cpp:96 | exec |
| ○ | main | clover_leaf.cpp:209 | exec |
| ○ | __libc_start_call_main | libc.so.6 | |
| ○ | __libc_start_main | libc.so.6 | |
| ○ | _start | clover_leaf.cpp:51 | exec |
| Coverage (%) | Name | Source Location | Module |
|---|---|---|---|
| ►50.77+ | omp_fulfill_event | libgomp.so.1.0.0 | |
| ○ | start_thread | libc.so.6 | |
| ○ | thread_start | libc.so.6 | |
| ►23.16+ | GOMP_parallel | libgomp.so.1.0.0 | |
| ○ | ideal_gas(global_variables&, i[...] | ideal_gas.cpp:47 | exec |
| ○ | timestep(global_variables&, pa[...] | timestep.cpp:47 | exec |
| ○ | hydro(global_variables&, paral[...] | basic_string.h:1076 | exec |
| ○ | main | clover_leaf.cpp:209 | exec |
| ○ | __libc_start_call_main | libc.so.6 | |
| ○ | __libc_start_main | libc.so.6 | |
| ○ | _start | clover_leaf.cpp:51 | exec |
| ►23.14+ | GOMP_parallel | libgomp.so.1.0.0 | |
| ○ | ideal_gas(global_variables&, i[...] | ideal_gas.cpp:47 | exec |
| ○ | PdV(global_variables&, bool) | PdV.cpp:115 | exec |
| ○ | hydro(global_variables&, paral[...] | hydro.cpp:64 | exec |
| ○ | main | clover_leaf.cpp:209 | exec |
| ○ | __libc_start_call_main | libc.so.6 | |
| ○ | __libc_start_main | libc.so.6 | |
| ○ | _start | clover_leaf.cpp:51 | exec |
| ►2.14+ | GOMP_parallel | libgomp.so.1.0.0 | |
| ○ | ideal_gas(global_variables&, i[...] | ideal_gas.cpp:47 | exec |
| ○ | field_summary(global_variables[...] | field_summary.cpp:51 | exec |
| ○ | hydro(global_variables&, paral[...] | hydro.cpp:96 | exec |
| ○ | main | clover_leaf.cpp:209 | exec |
| ○ | __libc_start_call_main | libc.so.6 | |
| ○ | __libc_start_main | libc.so.6 | |
| ○ | _start | clover_leaf.cpp:51 | exec |
| Coverage (%) | Name | Source Location | Module |
|---|---|---|---|
| ►76.12+ | omp_fulfill_event | libgomp.so.1.0.0 | |
| ○ | start_thread | libc.so.6 | |
| ○ | thread_start | libc.so.6 | |
| ►11.23+ | GOMP_parallel | libgomp.so.1.0.0 | |
| ○ | ideal_gas(global_variables&, i[...] | ideal_gas.cpp:47 | exec |
| ○ | PdV(global_variables&, bool) | PdV.cpp:115 | exec |
| ○ | hydro(global_variables&, paral[...] | hydro.cpp:64 | exec |
| ○ | main | clover_leaf.cpp:209 | exec |
| ○ | __libc_start_call_main | libc.so.6 | |
| ○ | __libc_start_main | libc.so.6 | |
| ○ | _start | clover_leaf.cpp:51 | exec |
| ►11.22+ | GOMP_parallel | libgomp.so.1.0.0 | |
| ○ | ideal_gas(global_variables&, i[...] | ideal_gas.cpp:47 | exec |
| ○ | timestep(global_variables&, pa[...] | timestep.cpp:47 | exec |
| ○ | hydro(global_variables&, paral[...] | basic_string.h:1076 | exec |
| ○ | main | clover_leaf.cpp:209 | exec |
| ○ | __libc_start_call_main | libc.so.6 | |
| ○ | __libc_start_main | libc.so.6 | |
| ○ | _start | clover_leaf.cpp:51 | exec |
| ►1.04+ | GOMP_parallel | libgomp.so.1.0.0 | |
| ○ | ideal_gas(global_variables&, i[...] | ideal_gas.cpp:47 | exec |
| ○ | field_summary(global_variables[...] | field_summary.cpp:51 | exec |
| ○ | hydro(global_variables&, paral[...] | hydro.cpp:96 | exec |
| ○ | main | clover_leaf.cpp:209 | exec |
| ○ | __libc_start_call_main | libc.so.6 | |
| ○ | __libc_start_main | libc.so.6 | |
| ○ | _start | clover_leaf.cpp:51 | exec |
| Coverage (%) | Name | Source Location | Module |
|---|---|---|---|
| ►88.31+ | omp_fulfill_event | libgomp.so.1.0.0 | |
| ○ | start_thread | libc.so.6 | |
| ○ | thread_start | libc.so.6 | |
| ►5.52+ | GOMP_parallel | libgomp.so.1.0.0 | |
| ○ | ideal_gas(global_variables&, i[...] | ideal_gas.cpp:47 | exec |
| ○ | PdV(global_variables&, bool) | PdV.cpp:115 | exec |
| ○ | hydro(global_variables&, paral[...] | hydro.cpp:64 | exec |
| ○ | main | clover_leaf.cpp:209 | exec |
| ○ | __libc_start_call_main | libc.so.6 | |
| ○ | __libc_start_main | libc.so.6 | |
| ○ | _start | clover_leaf.cpp:51 | exec |
| ►5.48+ | GOMP_parallel | libgomp.so.1.0.0 | |
| ○ | ideal_gas(global_variables&, i[...] | ideal_gas.cpp:47 | exec |
| ○ | timestep(global_variables&, pa[...] | timestep.cpp:47 | exec |
| ○ | hydro(global_variables&, paral[...] | basic_string.h:1076 | exec |
| ○ | main | clover_leaf.cpp:209 | exec |
| ○ | __libc_start_call_main | libc.so.6 | |
| ○ | __libc_start_main | libc.so.6 | |
| ○ | _start | clover_leaf.cpp:51 | exec |
| Coverage (%) | Name | Source Location | Module |
|---|---|---|---|
| ►94.12+ | omp_fulfill_event | libgomp.so.1.0.0 | |
| ○ | start_thread | libc.so.6 | |
| ○ | thread_start | libc.so.6 | |
| ►2.79+ | GOMP_parallel | libgomp.so.1.0.0 | |
| ○ | ideal_gas(global_variables&, i[...] | ideal_gas.cpp:47 | exec |
| ○ | PdV(global_variables&, bool) | PdV.cpp:115 | exec |
| ○ | hydro(global_variables&, paral[...] | hydro.cpp:64 | exec |
| ○ | main | clover_leaf.cpp:209 | exec |
| ○ | __libc_start_call_main | libc.so.6 | |
| ○ | __libc_start_main | libc.so.6 | |
| ○ | _start | clover_leaf.cpp:51 | exec |
| ►2.74+ | GOMP_parallel | libgomp.so.1.0.0 | |
| ○ | ideal_gas(global_variables&, i[...] | ideal_gas.cpp:47 | exec |
| ○ | timestep(global_variables&, pa[...] | timestep.cpp:47 | exec |
| ○ | hydro(global_variables&, paral[...] | basic_string.h:1076 | exec |
| ○ | main | clover_leaf.cpp:209 | exec |
| ○ | __libc_start_call_main | libc.so.6 | |
| ○ | __libc_start_main | libc.so.6 | |
| ○ | _start | clover_leaf.cpp:51 | exec |
| Coverage (%) | Name | Source Location | Module |
|---|---|---|---|
| ►95.74+ | omp_fulfill_event | libgomp.so.1.0.0 | |
| ○ | start_thread | libc.so.6 | |
| ○ | thread_start | libc.so.6 | |
| ►2.01+ | GOMP_parallel | libgomp.so.1.0.0 | |
| ○ | ideal_gas(global_variables&, i[...] | ideal_gas.cpp:47 | exec |
| ○ | timestep(global_variables&, pa[...] | timestep.cpp:47 | exec |
| ○ | hydro(global_variables&, paral[...] | basic_string.h:1076 | exec |
| ○ | main | clover_leaf.cpp:209 | exec |
| ○ | __libc_start_call_main | libc.so.6 | |
| ○ | __libc_start_main | libc.so.6 | |
| ○ | _start | clover_leaf.cpp:51 | exec |
| ►2.00+ | GOMP_parallel | libgomp.so.1.0.0 | |
| ○ | ideal_gas(global_variables&, i[...] | ideal_gas.cpp:47 | exec |
| ○ | PdV(global_variables&, bool) | PdV.cpp:115 | exec |
| ○ | hydro(global_variables&, paral[...] | hydro.cpp:64 | exec |
| ○ | main | clover_leaf.cpp:209 | exec |
| ○ | __libc_start_call_main | libc.so.6 | |
| ○ | __libc_start_main | libc.so.6 | |
| ○ | _start | clover_leaf.cpp:51 | exec |
| Coverage (%) | Name | Source Location | Module |
|---|---|---|---|
| ►96.84+ | omp_fulfill_event | libgomp.so.1.0.0 | |
| ○ | start_thread | libc.so.6 | |
| ○ | thread_start | libc.so.6 | |
| ►1.50+ | GOMP_parallel | libgomp.so.1.0.0 | |
| ○ | ideal_gas(global_variables&, i[...] | ideal_gas.cpp:47 | exec |
| ○ | timestep(global_variables&, pa[...] | timestep.cpp:47 | exec |
| ○ | hydro(global_variables&, paral[...] | basic_string.h:1076 | exec |
| ○ | main | clover_leaf.cpp:209 | exec |
| ○ | __libc_start_call_main | libc.so.6 | |
| ○ | __libc_start_main | libc.so.6 | |
| ○ | _start | clover_leaf.cpp:51 | exec |
| ►1.48+ | GOMP_parallel | libgomp.so.1.0.0 | |
| ○ | ideal_gas(global_variables&, i[...] | ideal_gas.cpp:47 | exec |
| ○ | PdV(global_variables&, bool) | PdV.cpp:115 | exec |
| ○ | hydro(global_variables&, paral[...] | hydro.cpp:64 | exec |
| ○ | main | clover_leaf.cpp:209 | exec |
| ○ | __libc_start_call_main | libc.so.6 | |
| ○ | __libc_start_main | libc.so.6 | |
| ○ | _start | clover_leaf.cpp:51 | exec |
| Coverage (%) | Name | Source Location | Module |
|---|---|---|---|
| ►97.47+ | omp_fulfill_event | libgomp.so.1.0.0 | |
| ○ | start_thread | libc.so.6 | |
| ○ | thread_start | libc.so.6 | |
| ►1.20+ | GOMP_parallel | libgomp.so.1.0.0 | |
| ○ | ideal_gas(global_variables&, i[...] | ideal_gas.cpp:47 | exec |
| ○ | timestep(global_variables&, pa[...] | timestep.cpp:47 | exec |
| ○ | hydro(global_variables&, paral[...] | basic_string.h:1076 | exec |
| ○ | main | clover_leaf.cpp:209 | exec |
| ○ | __libc_start_call_main | libc.so.6 | |
| ○ | __libc_start_main | libc.so.6 | |
| ○ | _start | clover_leaf.cpp:51 | exec |
| ►1.18+ | GOMP_parallel | libgomp.so.1.0.0 | |
| ○ | ideal_gas(global_variables&, i[...] | ideal_gas.cpp:47 | exec |
| ○ | PdV(global_variables&, bool) | PdV.cpp:115 | exec |
| ○ | hydro(global_variables&, paral[...] | hydro.cpp:64 | exec |
| ○ | main | clover_leaf.cpp:209 | exec |
| ○ | __libc_start_call_main | libc.so.6 | |
| ○ | __libc_start_main | libc.so.6 | |
| ○ | _start | clover_leaf.cpp:51 | exec |
| Coverage (%) | Name | Source Location | Module |
|---|---|---|---|
| ►97.90+ | omp_fulfill_event | libgomp.so.1.0.0 | |
| ○ | start_thread | libc.so.6 | |
| ○ | thread_start | libc.so.6 |
| Coverage (%) | Name | Source Location | Module |
|---|---|---|---|
| ►98.21+ | omp_fulfill_event | libgomp.so.1.0.0 | |
| ○ | start_thread | libc.so.6 | |
| ○ | thread_start | libc.so.6 |
| Coverage (%) | Name | Source Location | Module |
|---|---|---|---|
| ►98.43+ | omp_fulfill_event | libgomp.so.1.0.0 | |
| ○ | start_thread | libc.so.6 | |
| ○ | thread_start | libc.so.6 |
| min | med | avg | max |
|---|---|---|---|
| Percentile Index | 10 | 20 | 30 | 40 | 50 | 60 | 70 | 80 | 90 | 100 |
|---|---|---|---|---|---|---|---|---|---|---|
| Value |
| min | med | avg | max |
|---|---|---|---|
| Percentile Index | 10 | 20 | 30 | 40 | 50 | 60 | 70 | 80 | 90 | 100 |
|---|---|---|---|---|---|---|---|---|---|---|
| Value |
| Path / |
The code analyzed by CQA in that panel excludes loops and represents 0.01% of application time for run 1x1
| Source file and lines | ideal_gas.cpp:37-45 |
| Module | exec |
| nb instructions | 72 |
| nb uops | 70 |
| loop length | 288 |
| used w registers | 20 |
| used x registers | 18 |
| used b registers | 0 |
| used h registers | 0 |
| used s registers | 1 |
| used d registers | 3 |
| used q registers | 0 |
| used v registers | 5 |
| used z registers | 0 |
| nb stack references | 20 |
| micro-operation queue | 8.75 cycles |
| front end | 8.75 cycles |
| P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | P12 | P13 | P14 | |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| uops | 4.50 | 4.50 | 8.25 | 8.25 | 8.25 | 8.25 | 1.25 | 1.25 | 1.25 | 1.25 | 8.67 | 8.67 | 8.67 | 4.00 | 4.00 |
| cycles | 4.50 | 4.50 | 8.25 | 8.25 | 8.25 | 8.25 | 1.25 | 1.25 | 1.25 | 1.25 | 8.67 | 8.67 | 8.67 | 4.00 | 4.00 |
| Cycles executing div or sqrt instructions | 10.00-25.00 |
| Front-end | 8.75 |
| Dispatch | 8.67 |
| DIV/SQRT | 10.00-25.00 |
| Overall L1 | 10.00-25.00 |
| all | 3% |
| load | 0% |
| store | 0% |
| mul | 0% |
| add-sub | 0% |
| fma | 0% |
| other | 15% |
| all | 33% |
| load | NA (no load vectorizable/vectorized instructions) |
| store | NA (no store vectorizable/vectorized instructions) |
| mul | NA (no mul vectorizable/vectorized instructions) |
| add-sub | NA (no add-sub vectorizable/vectorized instructions) |
| fma | NA (no fma vectorizable/vectorized instructions) |
| div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
| other | 33% |
| all | 5% |
| load | 0% |
| store | 0% |
| mul | 0% |
| add-sub | 0% |
| fma | 0% |
| div/sqrt | 0% |
| other | 20% |
| all | 29% |
| load | 41% |
| store | 40% |
| mul | 12% |
| add-sub | 13% |
| fma | 12% |
| other | 26% |
| all | 33% |
| load | NA (no load vectorizable/vectorized instructions) |
| store | NA (no store vectorizable/vectorized instructions) |
| mul | NA (no mul vectorizable/vectorized instructions) |
| add-sub | NA (no add-sub vectorizable/vectorized instructions) |
| fma | NA (no fma vectorizable/vectorized instructions) |
| div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
| other | 33% |
| all | 29% |
| load | 41% |
| store | 40% |
| mul | 12% |
| add-sub | 13% |
| fma | 12% |
| div/sqrt | 12% |
| other | 29% |
| Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | P12 | P13 | P14 | Latency | Recip. throughput | Vectorization |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| STP X29, X30, [SP, #-112]! | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 | scal (50.0%) |
| ADD X29, SP, #0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| STP X19, X20, [SP, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 | scal (50.0%) |
| ORR X20, XZR, X0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
| STP X21, X22, [SP, #32] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 | scal (50.0%) |
| STP X23, X24, [SP, #48] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 | scal (50.0%) |
| LDP W3, W22, [X0, #40] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 | scal (25.0%) |
| LDR W23, [X0, #32] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 | scal (12.5%) |
| LDR W0, [X0, #36] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 | N/A |
| ADD W1, W3, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
| ADD W22, W22, #2 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
| CMP W1, W22 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | scal (12.5%) |
| B.GE 437428 <_Z16ideal_gas_kerneliiiiRN6clover8Buffer2DIdEES2_S2_S2_._omp_fn.0+0x3a8> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
| ADD W23, W23, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
| ADD W19, W0, #2 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
| STP X25, X26, [SP, #64] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 | scal (50.0%) |
| SUB W25, W22, W1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
| STR W1, [SP, #108] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 | scal (12.5%) |
| CMP W23, W19 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | scal (12.5%) |
| B.GE 437424 <_Z16ideal_gas_kerneliiiiRN6clover8Buffer2DIdEES2_S2_S2_._omp_fn.0+0x3a4> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
| SUB W24, W19, W23 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
| BL 410210 <@plt_start@+0x1f0> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
| MUL W26, W25, W24 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 0.50 | scal (12.5%) |
| ORR W21, WZR, W0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
| BL 410240 <@plt_start@+0x220> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
| LDR W6, [SP, #108] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 | scal (12.5%) |
| ORR W4, WZR, W0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
| UDIV W2, W26, W21 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5-12 | 5-12.50 | N/A |
| MSUB W5, W2, W21, W26 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 | scal (12.5%) |
| CMP W0, W5 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | scal (12.5%) |
| B.CC 437458 <_Z16ideal_gas_kerneliiiiRN6clover8Buffer2DIdEES2_S2_S2_._omp_fn.0+0x3d8> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
| MADD W21, W2, W4, W5 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 | scal (12.5%) |
| ADD W7, W2, W21 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
| STR W7, [SP, #108] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 | scal (12.5%) |
| CMP W21, W7 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | scal (12.5%) |
| B.CS 437424 <_Z16ideal_gas_kerneliiiiRN6clover8Buffer2DIdEES2_S2_S2_._omp_fn.0+0x3a4> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
| UDIV W8, W21, W24 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5-12 | 5-12.50 | scal (12.5%) |
| ORR X9, XZR, #0x66 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| ADRP X10, <462118> | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
| MOVK X9, #16374 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| STP X27, X28, [SP, #80] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 | scal (50.0%) |
| FMOV D24, #1.0000000 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 2 | 0.25 | scal (25.0%) |
| FMOV V27.2D, #1.0000000 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 2 | 0.25 | vect (50.0%) |
| FMOV D26, X9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 2 | 0.25 | scal (25.0%) |
| LDR D25, [X10, #504] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 | scal (25.0%) |
| LDP X28, X27, [X20] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 | scal (50.0%) |
| LDP X26, X25, [X20, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 | scal (50.0%) |
| MSUB W11, W8, W24, W21 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 | scal (12.5%) |
| ADD W12, W8, W6 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
| DUP V28.2D, V25.D[0] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 2 | 0.25 | vect (50.0%) |
| SBFM X5, X12, #0, #31 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (100.0%) |
| DUP V29.2D, V26.D[0] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 2 | 0.25 | vect (50.0%) |
| ADD W4, W11, W23 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
| SUB W30, W19, W4 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
| HINT #0 | N/A | ||||||||||||||||||
| HINT #0 | N/A | ||||||||||||||||||
| LDP X25, X26, [SP, #64] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 | scal (50.0%) |
| LDP X19, X20, [SP, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 | N/A |
| LDP X21, X22, [SP, #32] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 | scal (50.0%) |
| LDP X23, X24, [SP, #48] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 | scal (50.0%) |
| LDP X29, X30, [SP], #112 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 | scal (50.0%) |
| RET | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
| LDP X25, X26, [SP, #64] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 | scal (50.0%) |
| LDP X27, X28, [SP, #80] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 | scal (50.0%) |
| LDP X19, X20, [SP, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 | N/A |
| LDP X21, X22, [SP, #32] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 | scal (50.0%) |
| LDP X23, X24, [SP, #48] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 | scal (50.0%) |
| LDP X29, X30, [SP], #112 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 | scal (50.0%) |
| RET | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
| ADD W2, W2, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
| MOVZ W5, #0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
| B 4370fc <_Z16ideal_gas_kerneliiiiRN6clover8Buffer2DIdEES2_S2_S2_._omp_fn.0+0x7c> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
The code analyzed by CQA in that panel excludes loops and represents 0.01% of application time for run 1x1
| Source file and lines | ideal_gas.cpp:37-45 |
| Module | exec |
| nb instructions | 72 |
| nb uops | 70 |
| loop length | 288 |
| used w registers | 20 |
| used x registers | 18 |
| used b registers | 0 |
| used h registers | 0 |
| used s registers | 1 |
| used d registers | 3 |
| used q registers | 0 |
| used v registers | 5 |
| used z registers | 0 |
| nb stack references | 20 |
| micro-operation queue | 8.75 cycles |
| front end | 8.75 cycles |
| | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | P12 | P13 | P14 |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| uops | 4.50 | 4.50 | 8.25 | 8.25 | 8.25 | 8.25 | 1.25 | 1.25 | 1.25 | 1.25 | 8.67 | 8.67 | 8.67 | 4.00 | 4.00 |
| cycles | 4.50 | 4.50 | 8.25 | 8.25 | 8.25 | 8.25 | 1.25 | 1.25 | 1.25 | 1.25 | 8.67 | 8.67 | 8.67 | 4.00 | 4.00 |
| Cycles executing div or sqrt instructions | 10.00-25.00 |
| Front-end | 8.75 |
| Dispatch | 8.67 |
| DIV/SQRT | 10.00-25.00 |
| Overall L1 | 10.00-25.00 |
| all | 3% |
| load | 0% |
| store | 0% |
| mul | 0% |
| add-sub | 0% |
| fma | 0% |
| other | 15% |
| all | 33% |
| load | NA (no load vectorizable/vectorized instructions) |
| store | NA (no store vectorizable/vectorized instructions) |
| mul | NA (no mul vectorizable/vectorized instructions) |
| add-sub | NA (no add-sub vectorizable/vectorized instructions) |
| fma | NA (no fma vectorizable/vectorized instructions) |
| div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
| other | 33% |
| all | 5% |
| load | 0% |
| store | 0% |
| mul | 0% |
| add-sub | 0% |
| fma | 0% |
| div/sqrt | 0% |
| other | 20% |
| all | 29% |
| load | 41% |
| store | 40% |
| mul | 12% |
| add-sub | 13% |
| fma | 12% |
| other | 26% |
| all | 33% |
| load | NA (no load vectorizable/vectorized instructions) |
| store | NA (no store vectorizable/vectorized instructions) |
| mul | NA (no mul vectorizable/vectorized instructions) |
| add-sub | NA (no add-sub vectorizable/vectorized instructions) |
| fma | NA (no fma vectorizable/vectorized instructions) |
| div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
| other | 33% |
| all | 29% |
| load | 41% |
| store | 40% |
| mul | 12% |
| add-sub | 13% |
| fma | 12% |
| div/sqrt | 12% |
| other | 29% |
| Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | P12 | P13 | P14 | Latency | Recip. throughput | Vectorization |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| STP X29, X30, [SP, #912]! | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 | scal (50.0%) |
| ADD X29, SP, #0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| STP X19, X20, [SP, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 | scal (50.0%) |
| ORR X20, XZR, X0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
| STP X21, X22, [SP, #32] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 | scal (50.0%) |
| STP X23, X24, [SP, #48] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 | scal (50.0%) |
| LDP W3, W22, [X0, #40] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 | scal (25.0%) |
| LDR W23, [X0, #32] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 | scal (12.5%) |
| LDR W0, [X0, #36] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 | N/A |
| ADD W1, W3, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
| ADD W22, W22, #2 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
| CMP W1, W22 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | scal (12.5%) |
| B.GE 437428 <_Z16ideal_gas_kerneliiiiRN6clover8Buffer2DIdEES2_S2_S2_._omp_fn.0+0x3a8> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
| ADD W23, W23, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
| ADD W19, W0, #2 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
| STP X25, X26, [SP, #64] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 | scal (50.0%) |
| SUB W25, W22, W1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
| STR W1, [SP, #108] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 | scal (12.5%) |
| CMP W23, W19 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | scal (12.5%) |
| B.GE 437424 <_Z16ideal_gas_kerneliiiiRN6clover8Buffer2DIdEES2_S2_S2_._omp_fn.0+0x3a4> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
| SUB W24, W19, W23 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
| BL 410210 <@plt_start@+0x1f0> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
| MUL W26, W25, W24 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 0.50 | scal (12.5%) |
| ORR W21, WZR, W0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
| BL 410240 <@plt_start@+0x220> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
| LDR W6, [SP, #108] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 | scal (12.5%) |
| ORR W4, WZR, W0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
| UDIV W2, W26, W21 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5-12 | 5-12.50 | N/A |
| MSUB W5, W2, W21, W26 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 | scal (12.5%) |
| CMP W0, W5 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | scal (12.5%) |
| B.CC 437458 <_Z16ideal_gas_kerneliiiiRN6clover8Buffer2DIdEES2_S2_S2_._omp_fn.0+0x3d8> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
| MADD W21, W2, W4, W5 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 | scal (12.5%) |
| ADD W7, W2, W21 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
| STR W7, [SP, #108] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 | scal (12.5%) |
| CMP W21, W7 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 | scal (12.5%) |
| B.CS 437424 <_Z16ideal_gas_kerneliiiiRN6clover8Buffer2DIdEES2_S2_S2_._omp_fn.0+0x3a4> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
| UDIV W8, W21, W24 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5-12 | 5-12.50 | scal (12.5%) |
| ORR X9, XZR, #0x66 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| ADRP X10, <462118> | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
| MOVK X9, #16374 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| STP X27, X28, [SP, #80] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 | scal (50.0%) |
| FMOV D24, #1.0000000 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 2 | 0.25 | scal (25.0%) |
| FMOV V27.2D, #1.0000000 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 2 | 0.25 | vect (50.0%) |
| FMOV D26, X9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 2 | 0.25 | scal (25.0%) |
| LDR D25, [X10, #504] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 | scal (25.0%) |
| LDP X28, X27, [X20] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 | scal (50.0%) |
| LDP X26, X25, [X20, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 | scal (50.0%) |
| MSUB W11, W8, W24, W21 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 | scal (12.5%) |
| ADD W12, W8, W6 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
| DUP V28.2D, V25.D[0] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 2 | 0.25 | vect (50.0%) |
| SBFM X5, X12, #0, #31 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (100.0%) |
| DUP V29.2D, V26.D[0] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 2 | 0.25 | vect (50.0%) |
| ADD W4, W11, W23 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
| SUB W30, W19, W4 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
| HINT #0 | N/A | ||||||||||||||||||
| HINT #0 | N/A | ||||||||||||||||||
| LDP X25, X26, [SP, #64] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 | scal (50.0%) |
| LDP X19, X20, [SP, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 | N/A |
| LDP X21, X22, [SP, #32] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 | scal (50.0%) |
| LDP X23, X24, [SP, #48] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 | scal (50.0%) |
| LDP X29, X30, [SP], #112 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 | scal (50.0%) |
| RET | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
| LDP X25, X26, [SP, #64] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 | scal (50.0%) |
| LDP X27, X28, [SP, #80] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 | scal (50.0%) |
| LDP X19, X20, [SP, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 | N/A |
| LDP X21, X22, [SP, #32] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 | scal (50.0%) |
| LDP X23, X24, [SP, #48] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 | scal (50.0%) |
| LDP X29, X30, [SP], #112 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 | scal (50.0%) |
| RET | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
| ADD W2, W2, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
| MOVZ W5, #0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (12.5%) |
| B 4370fc <_Z16ideal_gas_kerneliiiiRN6clover8Buffer2DIdEES2_S2_S2_._omp_fn.0+0x7c> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
| Run 1x1 | Number processes: 1; Number nodes: NA; Run Command: <executable>; MPI Command: mpirun -n <number_processes> --bind-to core --map-by package:PE=64 --rank-by fill --report-bindings; Dataset: ; Run Directory: /home/eoseret/qaas/qaas_runs/178-219-7589/intel/CloverLeaf2.0-CXX/run/oneview_runs/multicore/gcc_4/oneview_run_1782227431; OMP_PROC_BIND: spread; OMP_DISPLAY_AFFINITY: TRUE; OMP_AFFINITY_FORMAT: 'OMP: pid %P tid %i thread %n bound to OS proc set {%A}'; OMP_DISPLAY_ENV: TRUE; OMP_NUM_THREADS: 1; OMP_PLACES: threads |
|---|---|
| Run 1x2 | Number processes: 1; Run Command: <executable>; MPI Command: mpirun -n <number_processes> --bind-to core --map-by package:PE=64 --rank-by fill --report-bindings; Dataset: ; Run Directory: /home/eoseret/qaas/qaas_runs/178-219-7589/intel/CloverLeaf2.0-CXX/run/oneview_runs/multicore/gcc_4/oneview_run_1782227431; OMP_NUM_THREADS: 2; OMP_PROC_BIND: spread; OMP_DISPLAY_AFFINITY: TRUE; OMP_AFFINITY_FORMAT: 'OMP: pid %P tid %i thread %n bound to OS proc set {%A}'; OMP_DISPLAY_ENV: TRUE; OMP_PLACES: threads |
| Run 1x4 | Number processes: 1; Run Command: <executable>; MPI Command: mpirun -n <number_processes> --bind-to core --map-by package:PE=64 --rank-by fill --report-bindings; Dataset: ; Run Directory: /home/eoseret/qaas/qaas_runs/178-219-7589/intel/CloverLeaf2.0-CXX/run/oneview_runs/multicore/gcc_4/oneview_run_1782227431; OMP_NUM_THREADS: 4; OMP_PROC_BIND: spread; OMP_DISPLAY_AFFINITY: TRUE; OMP_AFFINITY_FORMAT: 'OMP: pid %P tid %i thread %n bound to OS proc set {%A}'; OMP_DISPLAY_ENV: TRUE; OMP_PLACES: threads |
| Run 1x8 | Number processes: 1; Run Command: <executable>; MPI Command: mpirun -n <number_processes> --bind-to core --map-by package:PE=64 --rank-by fill --report-bindings; Dataset: ; Run Directory: /home/eoseret/qaas/qaas_runs/178-219-7589/intel/CloverLeaf2.0-CXX/run/oneview_runs/multicore/gcc_4/oneview_run_1782227431; OMP_NUM_THREADS: 8; OMP_PROC_BIND: spread; OMP_DISPLAY_AFFINITY: TRUE; OMP_AFFINITY_FORMAT: 'OMP: pid %P tid %i thread %n bound to OS proc set {%A}'; OMP_DISPLAY_ENV: TRUE; OMP_PLACES: threads |
| Run 1x16 | Number processes: 1; Run Command: <executable>; MPI Command: mpirun -n <number_processes> --bind-to core --map-by package:PE=64 --rank-by fill --report-bindings; Dataset: ; Run Directory: /home/eoseret/qaas/qaas_runs/178-219-7589/intel/CloverLeaf2.0-CXX/run/oneview_runs/multicore/gcc_4/oneview_run_1782227431; OMP_NUM_THREADS: 16; OMP_PROC_BIND: spread; OMP_DISPLAY_AFFINITY: TRUE; OMP_AFFINITY_FORMAT: 'OMP: pid %P tid %i thread %n bound to OS proc set {%A}'; OMP_DISPLAY_ENV: TRUE; OMP_PLACES: threads |
| Run 1x24 | Number processes: 1; Run Command: <executable>; MPI Command: mpirun -n <number_processes> --bind-to core --map-by package:PE=64 --rank-by fill --report-bindings; Dataset: ; Run Directory: /home/eoseret/qaas/qaas_runs/178-219-7589/intel/CloverLeaf2.0-CXX/run/oneview_runs/multicore/gcc_4/oneview_run_1782227431; OMP_NUM_THREADS: 24; OMP_PROC_BIND: spread; OMP_DISPLAY_AFFINITY: TRUE; OMP_AFFINITY_FORMAT: 'OMP: pid %P tid %i thread %n bound to OS proc set {%A}'; OMP_DISPLAY_ENV: TRUE; OMP_PLACES: threads |
| Run 1x32 | Number processes: 1; Run Command: <executable>; MPI Command: mpirun -n <number_processes> --bind-to core --map-by package:PE=64 --rank-by fill --report-bindings; Dataset: ; Run Directory: /home/eoseret/qaas/qaas_runs/178-219-7589/intel/CloverLeaf2.0-CXX/run/oneview_runs/multicore/gcc_4/oneview_run_1782227431; OMP_NUM_THREADS: 32; OMP_PROC_BIND: spread; OMP_DISPLAY_AFFINITY: TRUE; OMP_AFFINITY_FORMAT: 'OMP: pid %P tid %i thread %n bound to OS proc set {%A}'; OMP_DISPLAY_ENV: TRUE; OMP_PLACES: threads |
| Run 1x40 | Number processes: 1; Run Command: <executable>; MPI Command: mpirun -n <number_processes> --bind-to core --map-by package:PE=64 --rank-by fill --report-bindings; Dataset: ; Run Directory: /home/eoseret/qaas/qaas_runs/178-219-7589/intel/CloverLeaf2.0-CXX/run/oneview_runs/multicore/gcc_4/oneview_run_1782227431; OMP_NUM_THREADS: 40; OMP_PROC_BIND: spread; OMP_DISPLAY_AFFINITY: TRUE; OMP_AFFINITY_FORMAT: 'OMP: pid %P tid %i thread %n bound to OS proc set {%A}'; OMP_DISPLAY_ENV: TRUE; OMP_PLACES: threads |
| Run 1x48 | Number processes: 1; Run Command: <executable>; MPI Command: mpirun -n <number_processes> --bind-to core --map-by package:PE=64 --rank-by fill --report-bindings; Dataset: ; Run Directory: /home/eoseret/qaas/qaas_runs/178-219-7589/intel/CloverLeaf2.0-CXX/run/oneview_runs/multicore/gcc_4/oneview_run_1782227431; OMP_NUM_THREADS: 48; OMP_PROC_BIND: spread; OMP_DISPLAY_AFFINITY: TRUE; OMP_AFFINITY_FORMAT: 'OMP: pid %P tid %i thread %n bound to OS proc set {%A}'; OMP_DISPLAY_ENV: TRUE; OMP_PLACES: threads |
| Run 1x56 | Number processes: 1; Run Command: <executable>; MPI Command: mpirun -n <number_processes> --bind-to core --map-by package:PE=64 --rank-by fill --report-bindings; Dataset: ; Run Directory: /home/eoseret/qaas/qaas_runs/178-219-7589/intel/CloverLeaf2.0-CXX/run/oneview_runs/multicore/gcc_4/oneview_run_1782227431; OMP_NUM_THREADS: 56; OMP_PROC_BIND: spread; OMP_DISPLAY_AFFINITY: TRUE; OMP_AFFINITY_FORMAT: 'OMP: pid %P tid %i thread %n bound to OS proc set {%A}'; OMP_DISPLAY_ENV: TRUE; OMP_PLACES: threads |
| Run 1x64 | Number processes: 1; Run Command: <executable>; MPI Command: mpirun -n <number_processes> --bind-to core --map-by package:PE=64 --rank-by fill --report-bindings; Dataset: ; Run Directory: /home/eoseret/qaas/qaas_runs/178-219-7589/intel/CloverLeaf2.0-CXX/run/oneview_runs/multicore/gcc_4/oneview_run_1782227431; OMP_NUM_THREADS: 64; OMP_PROC_BIND: spread; OMP_DISPLAY_AFFINITY: TRUE; OMP_AFFINITY_FORMAT: 'OMP: pid %P tid %i thread %n bound to OS proc set {%A}'; OMP_DISPLAY_ENV: TRUE; OMP_PLACES: threads |
| (1x1) Efficiency | (1x1) Potential Speed-Up (%) | (1x2) Efficiency | (1x2) Potential Speed-Up (%) | (1x4) Efficiency | (1x4) Potential Speed-Up (%) | (1x8) Efficiency | (1x8) Potential Speed-Up (%) | (1x16) Efficiency | (1x16) Potential Speed-Up (%) | (1x24) Efficiency | (1x24) Potential Speed-Up (%) | (1x32) Efficiency | (1x32) Potential Speed-Up (%) | (1x40) Efficiency | (1x40) Potential Speed-Up (%) | (1x48) Efficiency | (1x48) Potential Speed-Up (%) | (1x56) Efficiency | (1x56) Potential Speed-Up (%) | (1x64) Efficiency | (1x64) Potential Speed-Up (%) |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 1 | 0 | 1 | 0.02 | 0.99 | 0.06 | 0.98 | 0.1 | 0.9 | 0.41 | 0.66 | 1.39 | 0.52 | 2.02 | 0.43 | 2.51 | 0.35 | 2.91 | 0.3 | 3.2 | 0.26 | 3.4 |
| Run | Number of threads | Efficiency (ideal is 1) | Speedup | Ideal Speedup | Time (s) | Coverage (%) |
|---|---|---|---|---|---|---|
| 1x1 | 1 | 1 | 1 | 1 | 102.50501251221 | 6.8966107368469 |
| 1x2 | 2 | 1 | 1.99 | 2 | 52.024993896484 | 6.8535118103027 |
| 1x4 | 4 | 0.99 | 3.97 | 4 | 26.030002593994 | 6.7421908378601 |
| 1x8 | 8 | 0.98 | 7.87 | 8 | 13.065000534058 | 6.0031208992004 |
| 1x16 | 16 | 0.9 | 14.45 | 16 | 6.9199995994568 | 4.216733455658 |
| 1x24 | 24 | 0.66 | 15.9 | 24 | 6.4000020027161 | 4.1098318099976 |
| 1x32 | 32 | 0.52 | 16.74 | 32 | 6.0300002098083 | 4.2408084869385 |
| 1x40 | 40 | 0.43 | 17.09 | 40 | 5.8949995040894 | 4.3821244239807 |
| 1x48 | 48 | 0.35 | 16.94 | 48 | 5.9400005340576 | 4.4970636367798 |
| 1x56 | 56 | 0.3 | 16.73 | 56 | 6.0250000953674 | 4.5621814727783 |
| 1x64 | 64 | 0.26 | 16.59 | 64 | 6.1200017929077 | 4.5932712554932 |
| Name | Coverage (%) | Time (s) |
|---|---|---|
| ▼ideal_gas_kernel(int, int, int, int, clover::Buffer2D | 6.90 | 102.51 |
| ▼Loop 246 - ideal_gas.cpp:39-45 - exec– | 0.00 | 0.00 |
| ○Loop 247 - ideal_gas.cpp:40-45 - exec | 6.89 | 102.36 |
