Function: advancePosition._omp_fn.0 | Module: exec | Source: timestep.c:85-94 | Coverage: 0.76% |
---|
Function: advancePosition._omp_fn.0 | Module: exec | Source: timestep.c:85-94 | Coverage: 0.76% |
---|
/home/hbollore/qaas-runs/170-265-5545/intel/CoMD/build/CoMD/CoMD/src-openmp/timestep.c: 85 - 94 |
-------------------------------------------------------------------------------- |
85: #pragma omp parallel for |
86: for (int iBox=0; iBox<nBoxes; iBox++) |
87: { |
88: for (int iOff=MAXATOMS*iBox,ii=0; ii<s->boxes->nAtoms[iBox]; ii++,iOff++) |
89: { |
90: int iSpecies = s->atoms->iSpecies[iOff]; |
91: real_t invMass = 1.0/s->species[iSpecies].mass; |
92: s->atoms->r[iOff][0] += dt*s->atoms->p[iOff][0]*invMass; |
93: s->atoms->r[iOff][1] += dt*s->atoms->p[iOff][1]*invMass; |
94: s->atoms->r[iOff][2] += dt*s->atoms->p[iOff][2]*invMass; |
0x40c740 STP X29, X30, [SP, #-48]! |
0x40c744 ADD X29, SP, #0 |
0x40c748 STR X21, [SP, #32] |
0x40c74c LDR W21, [X0, #16] |
0x40c750 STP X19, X20, [SP, #16] |
0x40c754 ORR X20, XZR, X0 |
0x40c758 BL 4024a0 |
0x40c75c ORR W19, WZR, W0 |
0x40c760 BL 4023f0 |
0x40c764 SDIV W1, W21, W19 |
0x40c768 ORR W14, WZR, W0 |
0x40c76c MSUB W2, W1, W19, W21 |
0x40c770 CMP W0, W2 |
0x40c774 B.LT 40c930 |
(115) 0x40c778 MADD W3, W1, W14, W2 |
(115) 0x40c77c ADD W16, W1, W3 |
(115) 0x40c780 CMP W3, W16 |
(115) 0x40c784 B.GE 40c920 |
(113) 0x40c788 LDR X17, [X20] |
(113) 0x40c78c UBFM W15, W3, #26, #25 |
(113) 0x40c790 MOVZ W0, #24 |
(113) 0x40c794 FMOV D4, #1.0000000 |
(113) 0x40c798 SBFM X14, X3, #0, #31 |
(113) 0x40c79c LDR D0, [X20, #8] |
(113) 0x40c7a0 SMADDL X15, W15, W0, XZR |
(113) 0x40c7a4 LDR X4, [X17, #24] |
(113) 0x40c7a8 LDR X18, [X4, #120] |
(113) 0x40c7ac LDR W5, [X18, X14,LSL #2] |
(113) 0x40c7b0 CMP W5, #0 |
(113) 0x40c7b4 B.LE 40c910 |
(113) 0x40c7b8 LDP X10, X13, [X17, #32] |
(113) 0x40c7bc SUB W9, W5, #1 |
(113) 0x40c7c0 UBFM X7, X14, #56, #55 |
(113) 0x40c7c4 ADD X8, X9, X14,LSL #6 |
(113) 0x40c7c8 ORR X0, XZR, X15 |
(113) 0x40c7cc LDP X6, X30, [X10, #16] |
(113) 0x40c7d0 LDR X20, [X10, #32] |
(113) 0x40c7d4 ADD X11, X6, #4 |
(113) 0x40c7d8 ADD X3, X6, X7 |
(113) 0x40c7dc ADD X21, X11, X8,LSL #2 |
(113) 0x40c7e0 ADD X19, X30, #8 |
(113) 0x40c7e4 ADD X2, X30, #16 |
(113) 0x40c7e8 SUB X1, X21, X3 |
(113) 0x40c7ec ADD X12, X20, #8 |
(113) 0x40c7f0 ADD X4, X20, #16 |
(113) 0x40c7f4 TBZ W1, #2, 40c860 |
0x40c7f8 LDRSW X5, [X6, X7] |
0x40c7fc ADD X3, X3, #4 |
0x40c800 ADD X0, X15, #24 |
0x40c804 LDR D3, [X20, X15] |
0x40c808 LDR D2, [X30, X15] |
0x40c80c ADD X9, X13, X5,LSL #4 |
0x40c810 LDR D1, [X9, #8] |
0x40c814 FMUL D5, D0, D3 |
0x40c818 FDIV D6, D4, D1 |
0x40c81c FMADD D7, D6, D5, D2 |
0x40c820 STR D7, [X30, X15] |
0x40c824 LDR D16, [X12, X15] |
0x40c828 LDR D17, [X19, X15] |
0x40c82c FMUL D18, D0, D16 |
0x40c830 FMADD D19, D6, D18, D17 |
0x40c834 STR D19, [X19, X15] |
0x40c838 LDR D20, [X4, X15] |
0x40c83c LDR D21, [X2, X15] |
0x40c840 FMUL D22, D0, D20 |
0x40c844 FMADD D23, D6, D22, D21 |
0x40c848 STR D23, [X2, X15] |
0x40c84c CMP X3, X21 |
0x40c850 B.EQ 40c910 |
0x40c854 HINT #0 |
0x40c858 HINT #0 |
0x40c85c HINT #0 |
(114) 0x40c860 ORR X8, XZR, X3 |
(114) 0x40c864 LDR D24, [X20, X0] |
(114) 0x40c868 ADD X10, X0, #24 |
(114) 0x40c86c LDRSW X7, [X8], #4 |
(114) 0x40c870 LDR D25, [X30, X0] |
(114) 0x40c874 FMUL D26, D0, D24 |
(114) 0x40c878 LDRSW X6, [X3, #4] |
(114) 0x40c87c ADD X11, X13, X7,LSL #4 |
(114) 0x40c880 ADD X3, X8, #4 |
(114) 0x40c884 LDR D27, [X11, #8] |
(114) 0x40c888 ADD X1, X13, X6,LSL #4 |
(114) 0x40c88c FDIV D28, D4, D27 |
(114) 0x40c890 FMADD D29, D28, D26, D25 |
(114) 0x40c894 STR D29, [X30, X0] |
(114) 0x40c898 LDR D30, [X12, X0] |
(114) 0x40c89c LDR D31, [X19, X0] |
(114) 0x40c8a0 FMUL D3, D0, D30 |
(114) 0x40c8a4 FMADD D2, D28, D3, D31 |
(114) 0x40c8a8 STR D2, [X19, X0] |
(114) 0x40c8ac LDR D5, [X4, X0] |
(114) 0x40c8b0 LDR D1, [X2, X0] |
(114) 0x40c8b4 FMUL D6, D0, D5 |
(114) 0x40c8b8 FMADD D7, D28, D6, D1 |
(114) 0x40c8bc STR D7, [X2, X0] |
(114) 0x40c8c0 ADD X0, X0, #48 |
(114) 0x40c8c4 LDR D19, [X1, #8] |
(114) 0x40c8c8 LDR D16, [X20, X10] |
(114) 0x40c8cc LDR D17, [X30, X10] |
(114) 0x40c8d0 FDIV D20, D4, D19 |
(114) 0x40c8d4 FMUL D18, D0, D16 |
(114) 0x40c8d8 FMADD D21, D20, D18, D17 |
(114) 0x40c8dc STR D21, [X30, X10] |
(114) 0x40c8e0 LDR D22, [X12, X10] |
(114) 0x40c8e4 LDR D23, [X19, X10] |
(114) 0x40c8e8 FMUL D24, D0, D22 |
(114) 0x40c8ec FMADD D25, D20, D24, D23 |
(114) 0x40c8f0 STR D25, [X19, X10] |
(114) 0x40c8f4 LDR D26, [X4, X10] |
(114) 0x40c8f8 LDR D27, [X2, X10] |
(114) 0x40c8fc FMUL D28, D0, D26 |
(114) 0x40c900 FMADD D29, D20, D28, D27 |
(114) 0x40c904 STR D29, [X2, X10] |
(114) 0x40c908 CMP X3, X21 |
(114) 0x40c90c B.NE 40c860 |
(113) 0x40c910 ADD X14, X14, #1 |
(113) 0x40c914 ADD X15, X15, #1536 |
(113) 0x40c918 CMP W16, W14 |
(113) 0x40c91c B.GT 40c7ac |
(115) 0x40c920 LDP X19, X20, [SP, #16] |
(115) 0x40c924 LDR X21, [SP, #32] |
(115) 0x40c928 LDP X29, X30, [SP], #48 |
(115) 0x40c92c RET |
(115) 0x40c930 ADD W1, W1, #1 |
(115) 0x40c934 MOVZ W2, #0 |
(115) 0x40c938 B 40c778 |
0x40c93c HINT #0 |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►97.93+ | __kmp_GOMP_microtask_wrapper(i[...] | libomp.so | |
○ | __kmp_invoke_microtask | libomp.so | |
►2.07+ | GOMP_parallel | libomp.so | |
○ | timestep | timestep.c:43 | exec |
○ | main | CoMD.c:125 | exec |
○ | __libc_start_main | libc-2.31.so | |
○ | _start | CoMD.c:266 | exec |
Path / |
Source file and lines | timestep.c:85-94 |
Module | exec |
nb instructions | 41 |
loop length | 164 |
nb stack references | 0 |
front end | 4.63 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | P12 | P13 | P14 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 2.00 | 2.00 | 3.50 | 3.50 | 3.50 | 3.50 | 2.50 | 2.50 | 2.50 | 2.50 | 5.00 | 5.00 | 5.00 | 1.50 | 1.50 |
cycles | 2.00 | 2.00 | 3.50 | 3.50 | 3.50 | 3.50 | 2.50 | 2.50 | 2.50 | 2.50 | 5.00 | 5.00 | 5.00 | 1.50 | 1.50 |
Cycles executing div or sqrt instructions | 2.00-1.00 |
Front-end | 4.63 |
Overall L1 | 5.00 |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 0% |
other | 0% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | P12 | P13 | P14 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
STP X29, X30, [SP, #-48]! | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
ADD X29, SP, #0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STR X21, [SP, #32] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
LDR W21, [X0, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
STP X19, X20, [SP, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
ORR X20, XZR, X0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
BL 4024a0 <@plt_start@+0x280> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ORR W19, WZR, W0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
BL 4023f0 <@plt_start@+0x1d0> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
SDIV W1, W21, W19 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5-12 | 1-0.50 |
ORR W14, WZR, W0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MSUB W2, W1, W19, W21 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
CMP W0, W2 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
B.LT 40c930 <advancePosition._omp_fn.0+0x1f0> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
LDRSW X5, [X6, X7] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
ADD X3, X3, #4 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X0, X15, #24 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LDR D3, [X20, X15] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
LDR D2, [X30, X15] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
ADD X9, X13, X5,LSL #4 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LDR D1, [X9, #8] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
FMUL D5, D0, D3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 3 | 0.25 |
FDIV D6, D4, D1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 7-15 | 1-0.50 |
FMADD D7, D6, D5, D2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 4 | 0.25 |
STR D7, [X30, X15] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
LDR D16, [X12, X15] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
LDR D17, [X19, X15] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
FMUL D18, D0, D16 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 3 | 0.25 |
FMADD D19, D6, D18, D17 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 4 | 0.25 |
STR D19, [X19, X15] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
LDR D20, [X4, X15] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
LDR D21, [X2, X15] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
FMUL D22, D0, D20 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 3 | 0.25 |
FMADD D23, D6, D22, D21 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 4 | 0.25 |
STR D23, [X2, X15] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
CMP X3, X21 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
B.EQ 40c910 <advancePosition._omp_fn.0+0x1d0> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
HINT #0 |
Source file and lines | timestep.c:85-94 |
Module | exec |
nb instructions | 41 |
loop length | 164 |
nb stack references | 0 |
front end | 4.63 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | P12 | P13 | P14 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 2.00 | 2.00 | 3.50 | 3.50 | 3.50 | 3.50 | 2.50 | 2.50 | 2.50 | 2.50 | 5.00 | 5.00 | 5.00 | 1.50 | 1.50 |
cycles | 2.00 | 2.00 | 3.50 | 3.50 | 3.50 | 3.50 | 2.50 | 2.50 | 2.50 | 2.50 | 5.00 | 5.00 | 5.00 | 1.50 | 1.50 |
Cycles executing div or sqrt instructions | 2.00-1.00 |
Front-end | 4.63 |
Overall L1 | 5.00 |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 0% |
other | 0% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | P12 | P13 | P14 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
STP X29, X30, [SP, #-48]! | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
ADD X29, SP, #0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STR X21, [SP, #32] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
LDR W21, [X0, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
STP X19, X20, [SP, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
ORR X20, XZR, X0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
BL 4024a0 <@plt_start@+0x280> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ORR W19, WZR, W0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
BL 4023f0 <@plt_start@+0x1d0> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
SDIV W1, W21, W19 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5-12 | 1-0.50 |
ORR W14, WZR, W0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MSUB W2, W1, W19, W21 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
CMP W0, W2 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
B.LT 40c930 <advancePosition._omp_fn.0+0x1f0> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
LDRSW X5, [X6, X7] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
ADD X3, X3, #4 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X0, X15, #24 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LDR D3, [X20, X15] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
LDR D2, [X30, X15] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
ADD X9, X13, X5,LSL #4 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LDR D1, [X9, #8] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
FMUL D5, D0, D3 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 3 | 0.25 |
FDIV D6, D4, D1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 7-15 | 1-0.50 |
FMADD D7, D6, D5, D2 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 4 | 0.25 |
STR D7, [X30, X15] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
LDR D16, [X12, X15] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
LDR D17, [X19, X15] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
FMUL D18, D0, D16 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 3 | 0.25 |
FMADD D19, D6, D18, D17 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 4 | 0.25 |
STR D19, [X19, X15] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
LDR D20, [X4, X15] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
LDR D21, [X2, X15] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
FMUL D22, D0, D20 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 3 | 0.25 |
FMADD D23, D6, D22, D21 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 4 | 0.25 |
STR D23, [X2, X15] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
CMP X3, X21 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
B.EQ 40c910 <advancePosition._omp_fn.0+0x1d0> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
HINT #0 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼advancePosition._omp_fn.0– | 0.76 | 0.13 |
▼Loop 113 - timestep.c:85-94 - exec– | 0 | 0 |
○Loop 114 - timestep.c:88-94 - exec | 0.71 | 0.12 |
○Loop 115 - timestep.c:85-86 - exec | 0 | 0 |