Function: field_summary(global_variables&, parallel_&) [clone ._omp_fn.0] | Module: exec | Source: field_summary.cpp:75-91 [...] | Coverage: 0.34% |
---|
Function: field_summary(global_variables&, parallel_&) [clone ._omp_fn.0] | Module: exec | Source: field_summary.cpp:75-91 [...] | Coverage: 0.34% |
---|
/home/hbollore/qaas-runs/170-290-5445/intel/CloverLeafCXX/build/CloverLeafCXX/src/omp/context.h: 69 - 69 |
-------------------------------------------------------------------------------- |
69: T &operator()(size_t i, size_t j) const { return data[i + j * sizeX]; } |
/home/hbollore/qaas-runs/170-290-5445/intel/CloverLeafCXX/build/CloverLeafCXX/src/omp/field_summary.cpp: 75 - 91 |
-------------------------------------------------------------------------------- |
75: #pragma omp parallel for simd reduction(+ : press) reduction(+ : ke) reduction(+ : ie) reduction(+ : mass) reduction(+ : vol) |
76: for (int idx = (0); idx < ((ymax - ymin + 1) * (xmax - xmin + 1)); idx++) { |
77: const int j = xmin + 1 + idx % (xmax - xmin + 1); |
78: const int k = ymin + 1 + idx / (xmax - xmin + 1); |
79: double vsqrd = 0.0; |
80: for (int kv = k; kv <= k + 1; ++kv) { |
81: for (int jv = j; jv <= j + 1; ++jv) { |
82: vsqrd += 0.25 * (field.xvel0(jv, kv) * field.xvel0(jv, kv) + field.yvel0(jv, kv) * field.yvel0(jv, kv)); |
83: } |
84: } |
85: double cell_vol = field.volume(j, k); |
86: double cell_mass = cell_vol * field.density0(j, k); |
87: vol += cell_vol; |
88: mass += cell_mass; |
89: ie += cell_mass * field.energy0(j, k); |
90: ke += cell_mass * 0.5 * vsqrd; |
91: press += cell_vol * field.pressure(j, k); |
0x4262a0 STP X29, X30, [SP, #-176]! |
0x4262a4 ADD X29, SP, #0 |
0x4262a8 ADRP X1, <4622a8> |
0x4262ac STP X19, X20, [SP, #16] |
0x4262b0 STP X21, X22, [SP, #32] |
0x4262b4 ORR X21, XZR, X0 |
0x4262b8 STP X23, X24, [SP, #48] |
0x4262bc LDP W19, W24, [X0, #48] |
0x4262c0 LDR W4, [X21, #56] |
0x4262c4 LDR W23, [X21, #60] |
0x4262c8 SUB W0, W19, W24 |
0x4262cc STR D8, [SP, #88] |
0x4262d0 LDR X2, [X1, #3864] |
0x4262d4 ADD W3, W0, #1 |
0x4262d8 SUB W5, W4, W23 |
0x4262dc ADD W22, W5, #1 |
0x4262e0 LDR X0, [X2] |
0x4262e4 STR X0, [SP, #168] |
0x4262e8 MOVZ X0, #0 |
0x4262ec MADD W19, W5, W3, W3 |
0x4262f0 BL 403530 |
0x4262f4 ORR W20, WZR, W0 |
0x4262f8 BL 4033c0 |
0x4262fc SDIV W6, W19, W20 |
0x426300 MSUB W7, W6, W20, W19 |
0x426304 CMP W0, W7 |
0x426308 B.LT 42659c |
(310) 0x42630c MADD W5, W6, W0, W7 |
(310) 0x426310 ADD W7, W6, W5 |
(310) 0x426314 CMP W5, W7 |
(310) 0x426318 B.GE 426524 |
(310) 0x42631c MOVI D27, #0 |
(310) 0x426320 LDR X12, [X21] |
(310) 0x426324 FMOV D21, #0.1250000 |
(310) 0x426328 ADD W10, W23, #1 |
(310) 0x42632c ADD W11, W24, #1 |
(310) 0x426330 STP X25, X26, [SP, #64] |
(310) 0x426334 FMOV D19, D27 |
(310) 0x426338 FMOV D18, D27 |
(310) 0x42633c FMOV D17, D27 |
(310) 0x426340 FMOV D16, D27 |
(310) 0x426344 LDR X19, [X12] |
(310) 0x426348 LDR X18, [X12, #16] |
(310) 0x42634c LDR X17, [X12, #48] |
(310) 0x426350 LDR X16, [X12, #64] |
(310) 0x426354 LDR X15, [X12, #96] |
(310) 0x426358 LDR X14, [X12, #112] |
(310) 0x42635c LDR X9, [X12, #168] |
(310) 0x426360 LDR X0, [X12, #184] |
(310) 0x426364 LDR X8, [X12, #216] |
(310) 0x426368 LDR X6, [X12, #232] |
(310) 0x42636c LDR X13, [X12, #656] |
(310) 0x426370 LDR X12, [X12, #672] |
(310) 0x426374 STR X27, [SP, #80] |
(310) 0x426378 HINT #0 |
(310) 0x42637c HINT #0 |
(311) 0x426380 SDIV W25, W5, W22 |
(311) 0x426384 ADD W26, W25, W11 |
(311) 0x426388 MSUB W27, W25, W22, W5 |
(311) 0x42638c ADD W5, W5, #1 |
(311) 0x426390 SBFM X3, X26, #0, #31 |
(311) 0x426394 ADD W30, W26, #1 |
(311) 0x426398 SBFM X2, X30, #0, #31 |
(311) 0x42639c MADD X24, X8, X3, XZR |
(311) 0x4263a0 ADD W1, W27, W10 |
(311) 0x4263a4 SBFM X20, X1, #0, #31 |
(311) 0x4263a8 MADD X23, X9, X3, XZR |
(311) 0x4263ac ADD W4, W1, #1 |
(311) 0x4263b0 SBFM X27, X4, #0, #31 |
(311) 0x4263b4 MADD X30, X9, X2, XZR |
(311) 0x4263b8 ADD X25, X20, X24 |
(311) 0x4263bc ADD X4, X24, X27 |
(311) 0x4263c0 MADD X2, X8, X2, XZR |
(311) 0x4263c4 ADD X26, X20, X23 |
(311) 0x4263c8 ADD X23, X23, X27 |
(311) 0x4263cc MADD X24, X3, X13, X20 |
(311) 0x4263d0 LDR D2, [X6, X25,LSL #3] |
(311) 0x4263d4 ADD X25, X20, X30 |
(311) 0x4263d8 ADD X30, X27, X30 |
(311) 0x4263dc ADD X1, X27, X2 |
(311) 0x4263e0 ADD X2, X20, X2 |
(311) 0x4263e4 MADD X27, X3, X19, X20 |
(311) 0x4263e8 LDR D6, [X0, X26,LSL #3] |
(311) 0x4263ec MADD X26, X17, X3, X20 |
(311) 0x4263f0 MADD X3, X15, X3, X20 |
(311) 0x4263f4 LDR D1, [X0, X23,LSL #3] |
(311) 0x4263f8 FMUL D7, D2, D2 |
(311) 0x4263fc LDR D5, [X6, X4,LSL #3] |
(311) 0x426400 LDR D4, [X0, X25,LSL #3] |
(311) 0x426404 LDR D3, [X6, X2,LSL #3] |
(311) 0x426408 FMADD D20, D6, D6, D7 |
(311) 0x42640c LDR D22, [X12, X24,LSL #3] |
(311) 0x426410 LDR D23, [X18, X27,LSL #3] |
(311) 0x426414 FMADD D24, D1, D1, D20 |
(311) 0x426418 LDR D25, [X0, X30,LSL #3] |
(311) 0x42641c LDR D26, [X6, X1,LSL #3] |
(311) 0x426420 FADD D27, D27, D22 |
(311) 0x426424 FMUL D28, D22, D23 |
(311) 0x426428 LDR D29, [X16, X26,LSL #3] |
(311) 0x42642c FMADD D30, D5, D5, D24 |
(311) 0x426430 LDR D31, [X14, X3,LSL #3] |
(311) 0x426434 FMADD D0, D4, D4, D30 |
(311) 0x426438 FMUL D8, D28, D21 |
(311) 0x42643c FMADD D18, D28, D29, D18 |
(311) 0x426440 FADD D19, D19, D28 |
(311) 0x426444 FMADD D16, D22, D31, D16 |
(311) 0x426448 FMADD D2, D3, D3, D0 |
(311) 0x42644c FMADD D6, D25, D25, D2 |
(311) 0x426450 FMADD D1, D26, D26, D6 |
(311) 0x426454 FMADD D17, D8, D1, D17 |
(311) 0x426458 CMP W7, W5 |
(311) 0x42645c B.NE 426380 |
(310) 0x426460 CNTD X16, ALL |
(310) 0x426464 ADDVL X22, SP, #63 |
(310) 0x426468 DUP Z21.D, #0 |
(310) 0x42646c ADDVL X10, SP, #63 |
(310) 0x426470 ADDVL X11, SP, #63 |
(310) 0x426474 PTRUE P0.B, VL1 |
(310) 0x426478 ADDVL X19, SP, #63 |
(310) 0x42647c ADDVL X18, SP, #63 |
(310) 0x426480 ORR Z7.D, Z21.D, Z21.D |
(310) 0x426484 ADD X22, X22, #128 |
(310) 0x426488 ORR X7, XZR, X16 |
(310) 0x42648c ORR Z3.D, Z21.D, Z21.D |
(310) 0x426490 ADD X10, X10, #136 |
(310) 0x426494 ADD X11, X11, #144 |
(310) 0x426498 ORR Z20.D, Z21.D, Z21.D |
(310) 0x42649c ADD X19, X19, #152 |
(310) 0x4264a0 ADD X18, X18, #160 |
(310) 0x4264a4 ORR Z4.D, Z21.D, Z21.D |
(310) 0x4264a8 MOVZ X17, #1 |
(310) 0x4264ac STP D16, D17, [SP, #128] |
(310) 0x4264b0 STP D18, D19, [SP, #144] |
(310) 0x4264b4 STR D27, [SP, #160] |
(310) 0x4264b8 HINT #0 |
(310) 0x4264bc HINT #0 |
(312) 0x4264c0 LD1D {Z22.D}, P0/Z, [X22, X16,LSL #3] |
(312) 0x4264c4 LD1D {Z5.D}, P0/Z, [X10, X16,LSL #3] |
(312) 0x4264c8 LD1D {Z23.D}, P0/Z, [X11, X16,LSL #3] |
(312) 0x4264cc LD1D {Z24.D}, P0/Z, [X19, X16,LSL #3] |
(312) 0x4264d0 LD1D {Z25.D}, P0/Z, [X18, X16,LSL #3] |
(312) 0x4264d4 FADD Z4.D, P0/M, Z4.D, Z22.D |
(312) 0x4264d8 FADD Z20.D, P0/M, Z20.D, Z5.D |
(312) 0x4264dc FADD Z3.D, P0/M, Z3.D, Z23.D |
(312) 0x4264e0 FADD Z7.D, P0/M, Z7.D, Z24.D |
(312) 0x4264e4 FADD Z21.D, P0/M, Z21.D, Z25.D |
(312) 0x4264e8 WHILELO P0.D, X16, X17 |
(312) 0x4264ec ADD X16, X16, X7 |
(312) 0x4264f0 B.NE 4264c0 |
(310) 0x4264f4 PTRUE P1.B, ALL |
(310) 0x4264f8 FADDV D26, P1, Z21.D |
(310) 0x4264fc FADDV D27, P1, Z7.D |
(310) 0x426500 MOV V26.D[1], V27.D[0] |
(310) 0x426504 FADDV D0, P1, Z3.D |
(310) 0x426508 FADDV D28, P1, Z20.D |
(310) 0x42650c FADDV D8, P1, Z4.D |
(310) 0x426510 MOV V0.D[1], V28.D[0] |
(310) 0x426514 LDP X25, X26, [SP, #64] |
(310) 0x426518 STR Q26, [SP, #112] |
(310) 0x42651c LDR X27, [SP, #80] |
(310) 0x426520 B 426530 |
(310) 0x426524 MOVI V0.2D, #0 |
(310) 0x426528 MOVI D8, #0 |
(310) 0x42652c STR Q0, [SP, #112] |
(310) 0x426530 STR Q0, [SP, #96] |
(310) 0x426534 BL 4034e0 |
(310) 0x426538 LDUR Q29, [X21, #8] |
(310) 0x42653c LDUR Q30, [X21, #24] |
(310) 0x426540 LDR D31, [X21, #40] |
(310) 0x426544 LDR Q18, [SP, #96] |
(310) 0x426548 LDR Q0, [SP, #112] |
(310) 0x42654c FADD D8, D31, D8 |
(310) 0x426550 FADD V16.2D, V30.2D, V18.2D |
(310) 0x426554 FADD V19.2D, V29.2D, V0.2D |
(310) 0x426558 STR D8, [X21, #40] |
(310) 0x42655c STUR Q16, [X21, #24] |
(310) 0x426560 STUR Q19, [X21, #8] |
(310) 0x426564 ADRP X21, |
(310) 0x426568 BL 4033f0 |
(310) 0x42656c LDR X15, [X21, #3864] |
(310) 0x426570 LDR X2, [SP, #168] |
(310) 0x426574 LDR X1, [X15] |
(310) 0x426578 SUBS X2, X2, X1 |
(310) 0x42657c MOVZ X1, #0 |
(310) 0x426580 B.NE 4265a8 |
(310) 0x426584 LDP X19, X20, [SP, #16] |
(310) 0x426588 LDP X21, X22, [SP, #32] |
(310) 0x42658c LDP X23, X24, [SP, #48] |
(310) 0x426590 LDR D8, [SP, #88] |
(310) 0x426594 LDP X29, X30, [SP], #176 |
(310) 0x426598 RET |
(310) 0x42659c ADD W6, W6, #1 |
(310) 0x4265a0 MOVZ W7, #0 |
(310) 0x4265a4 B 42630c |
0x4265a8 STP X25, X26, [SP, #64] |
0x4265ac STR X27, [SP, #80] |
0x4265b0 BL 403150 |
0x4265b4 HINT #0 |
0x4265b8 HINT #0 |
0x4265bc HINT #0 |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►98.43+ | __kmp_GOMP_microtask_wrapper(i[...] | libomp.so | |
○ | __kmp_invoke_microtask | libomp.so | |
►1.26+ | GOMP_parallel | libomp.so | |
○ | field_summary(global_variables[...] | field_summary.cpp:75 | exec |
○ | hydro(global_variables&, paral[...] | hydro.cpp:96 | exec |
○ | main | iostream:74 | exec |
○ | __libc_start_main | libc-2.31.so | |
○ | _start | iostream:74 | exec |
Path / |
Source file and lines | field_summary.cpp:75-91 |
Module | exec |
nb instructions | 33 |
loop length | 132 |
nb stack references | 0 |
front end | 3.75 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | P12 | P13 | P14 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 2.00 | 2.00 | 4.25 | 4.25 | 4.25 | 4.25 | 0.50 | 0.50 | 0.00 | 0.00 | 4.33 | 4.33 | 4.33 | 3.50 | 3.50 |
cycles | 2.00 | 2.00 | 4.25 | 4.25 | 4.25 | 4.25 | 0.50 | 0.50 | 0.00 | 0.00 | 4.33 | 4.33 | 4.33 | 3.50 | 3.50 |
Cycles executing div or sqrt instructions | 1.00-0.50 |
Front-end | 3.75 |
Overall L1 | 4.33 |
all | 0% |
load | NA (no load vectorizable/vectorized instructions) |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | 0% |
div/sqrt | 0% |
other | 0% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | P12 | P13 | P14 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
STP X29, X30, [SP, #-176]! | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
ADD X29, SP, #0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADRP X1, <4622a8> | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STP X19, X20, [SP, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STP X21, X22, [SP, #32] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
ORR X21, XZR, X0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STP X23, X24, [SP, #48] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
LDP W19, W24, [X0, #48] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR W4, [X21, #56] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR W23, [X21, #60] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
SUB W0, W19, W24 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STR D8, [SP, #88] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
LDR X2, [X1, #3864] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
ADD W3, W0, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB W5, W4, W23 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD W22, W5, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LDR X0, [X2] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
STR X0, [SP, #168] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
MOVZ X0, #0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MADD W19, W5, W3, W3 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
BL 403530 <@plt_start@+0x4b0> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ORR W20, WZR, W0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
BL 4033c0 <@plt_start@+0x340> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
SDIV W6, W19, W20 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5-12 | 1-0.50 |
MSUB W7, W6, W20, W19 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
CMP W0, W7 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
B.LT 42659c <_Z13field_summaryR16global_variablesR9parallel_._omp_fn.0+0x2fc> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
STP X25, X26, [SP, #64] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STR X27, [SP, #80] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
BL 403150 <@plt_start@+0xd0> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
HINT #0 |
Source file and lines | field_summary.cpp:75-91 |
Module | exec |
nb instructions | 33 |
loop length | 132 |
nb stack references | 0 |
front end | 3.75 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | P12 | P13 | P14 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 2.00 | 2.00 | 4.25 | 4.25 | 4.25 | 4.25 | 0.50 | 0.50 | 0.00 | 0.00 | 4.33 | 4.33 | 4.33 | 3.50 | 3.50 |
cycles | 2.00 | 2.00 | 4.25 | 4.25 | 4.25 | 4.25 | 0.50 | 0.50 | 0.00 | 0.00 | 4.33 | 4.33 | 4.33 | 3.50 | 3.50 |
Cycles executing div or sqrt instructions | 1.00-0.50 |
Front-end | 3.75 |
Overall L1 | 4.33 |
all | 0% |
load | NA (no load vectorizable/vectorized instructions) |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | 0% |
div/sqrt | 0% |
other | 0% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | P12 | P13 | P14 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
STP X29, X30, [SP, #-176]! | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
ADD X29, SP, #0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADRP X1, <4622a8> | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STP X19, X20, [SP, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STP X21, X22, [SP, #32] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
ORR X21, XZR, X0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STP X23, X24, [SP, #48] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
LDP W19, W24, [X0, #48] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR W4, [X21, #56] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR W23, [X21, #60] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
SUB W0, W19, W24 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STR D8, [SP, #88] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
LDR X2, [X1, #3864] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
ADD W3, W0, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB W5, W4, W23 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD W22, W5, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LDR X0, [X2] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
STR X0, [SP, #168] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
MOVZ X0, #0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MADD W19, W5, W3, W3 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
BL 403530 <@plt_start@+0x4b0> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ORR W20, WZR, W0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
BL 4033c0 <@plt_start@+0x340> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
SDIV W6, W19, W20 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5-12 | 1-0.50 |
MSUB W7, W6, W20, W19 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
CMP W0, W7 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
B.LT 42659c <_Z13field_summaryR16global_variablesR9parallel_._omp_fn.0+0x2fc> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
STP X25, X26, [SP, #64] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STR X27, [SP, #80] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
BL 403150 <@plt_start@+0xd0> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
HINT #0 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼field_summary(global_variables&, parallel_&) [clone ._omp_fn.0]– | 0.34 | 0.45 |
▼Loop 310 - field_summary.cpp:75-91 - exec– | 0 | 0 |
○Loop 311 - context.h:69-69 - exec | 0.34 | 0.45 |
○Loop 312 - field_summary.cpp:76-76 - exec | 0 | 0 |