Function: sortAtomsInCell | Module: exec | Source: haloExchange.c:614-645 | Coverage: 0.68% |
---|
Function: sortAtomsInCell | Module: exec | Source: haloExchange.c:614-645 | Coverage: 0.68% |
---|
/home/hbollore/qaas/qaas-runs/169-814-5713/intel/CoMD/build/CoMD/CoMD/src-openmp/haloExchange.c: 614 - 645 |
-------------------------------------------------------------------------------- |
614: { |
615: int nAtoms = boxes->nAtoms[iBox]; |
616: |
617: AtomMsg tmp[nAtoms]; |
618: |
619: int begin = iBox*MAXATOMS; |
620: int end = begin + nAtoms; |
621: for (int ii=begin, iTmp=0; ii<end; ++ii, ++iTmp) |
622: { |
623: tmp[iTmp].gid = atoms->gid[ii]; |
624: tmp[iTmp].type = atoms->iSpecies[ii]; |
625: tmp[iTmp].rx = atoms->r[ii][0]; |
626: tmp[iTmp].ry = atoms->r[ii][1]; |
627: tmp[iTmp].rz = atoms->r[ii][2]; |
628: tmp[iTmp].px = atoms->p[ii][0]; |
629: tmp[iTmp].py = atoms->p[ii][1]; |
630: tmp[iTmp].pz = atoms->p[ii][2]; |
631: } |
632: qsort(&tmp, nAtoms, sizeof(AtomMsg), sortAtomsById); |
633: for (int ii=begin, iTmp=0; ii<end; ++ii, ++iTmp) |
634: { |
635: atoms->gid[ii] = tmp[iTmp].gid; |
636: atoms->iSpecies[ii] = tmp[iTmp].type; |
637: atoms->r[ii][0] = tmp[iTmp].rx; |
638: atoms->r[ii][1] = tmp[iTmp].ry; |
639: atoms->r[ii][2] = tmp[iTmp].rz; |
640: atoms->p[ii][0] = tmp[iTmp].px; |
641: atoms->p[ii][1] = tmp[iTmp].py; |
642: atoms->p[ii][2] = tmp[iTmp].pz; |
643: } |
644: |
645: } |
0x406c24 STP X29, X30, [SP, #944]! |
0x406c28 ADD X29, SP, #0 |
0x406c2c ADRP X3, <420c2c> |
0x406c30 LDR X4, [X1, #120] |
0x406c34 MOVZ W1, #56 |
0x406c38 STP X19, X20, [SP, #16] |
0x406c3c LDR X5, [X3, #4048] |
0x406c40 STP X21, X22, [SP, #32] |
0x406c44 ORR X22, XZR, X0 |
0x406c48 LDR W20, [X4, X2,SXTW #2] |
0x406c4c STR X23, [SP, #48] |
0x406c50 LDR X0, [X5] |
0x406c54 STR X0, [X29, #72] |
0x406c58 MOVZ X0, #0 |
0x406c5c SUB SP, SP, #16 |
0x406c60 SMADDL X0, W20, W1, XZR |
0x406c64 SBFM X1, X20, #0, #31 |
0x406c68 ADD X6, X0, #15 |
0x406c6c AND X7, X6, #7152 |
0x406c70 AND X8, X6, #7932 |
0x406c74 SUB X9, SP, X7,UXTX |
0x406c78 CMP SP, X9,UXTX |
0x406c7c B.EQ 406c90 |
(67) 0x406c80 SUB SP, SP, #16 |
(67) 0x406c84 STR XZR, [SP, #1024] |
(67) 0x406c88 CMP SP, X9,UXTX |
(67) 0x406c8c B.NE 406c80 |
0x406c90 AND X10, X8, #5056 |
0x406c94 SUB SP, SP, X10,UXTX |
0x406c98 STR XZR, [SP] |
0x406c9c CMP X10, #1024 |
0x406ca0 B.CS 407008 |
(64) 0x406ca4 UBFM W21, W2, #26, #25 |
(64) 0x406ca8 ADD X19, SP, #16 |
(64) 0x406cac ADD W20, W20, W21 |
(64) 0x406cb0 CMP W21, W20 |
(64) 0x406cb4 B.GE 407010 |
(64) 0x406cb8 MOVZ W11, #24 |
(64) 0x406cbc LDP X17, X18, [X22, #24] |
(64) 0x406cc0 SBFM X23, X21, #0, #31 |
(64) 0x406cc4 ORN W12, WZR, W21 |
(64) 0x406cc8 ADD X6, X23, #1 |
(64) 0x406ccc SMADDL X21, W21, W11, XZR |
(64) 0x406cd0 ADD W13, W20, W12 |
(64) 0x406cd4 ADD X10, X19, #56 |
(64) 0x406cd8 LDP X15, X16, [X22, #8] |
(64) 0x406cdc AND W14, W13, #0 |
(64) 0x406ce0 ADD X30, X17, X21 |
(64) 0x406ce4 ADD X0, X18, X21 |
(64) 0x406ce8 ADD X5, X30, #24 |
(64) 0x406cec ADD X4, X0, #24 |
(64) 0x406cf0 LDR D0, [X30] |
(64) 0x406cf4 LDR W3, [X15, X23,LSL #2] |
(64) 0x406cf8 STR W3, [X19] |
(64) 0x406cfc LDR W7, [X16, X23,LSL #2] |
(64) 0x406d00 STR D0, [X19, #8] |
(64) 0x406d04 LDR D1, [X30, #8] |
(64) 0x406d08 STR W7, [X19, #4] |
(64) 0x406d0c STR D1, [X19, #16] |
(64) 0x406d10 LDR D2, [X30, #16] |
(64) 0x406d14 STR D2, [X19, #24] |
(64) 0x406d18 LDR D3, [X0] |
(64) 0x406d1c STR D3, [X19, #32] |
(64) 0x406d20 LDR D4, [X0, #8] |
(64) 0x406d24 STR D4, [X19, #40] |
(64) 0x406d28 LDR D5, [X0, #16] |
(64) 0x406d2c STR D5, [X19, #48] |
(64) 0x406d30 CMP W20, W6 |
(64) 0x406d34 B.LE 406e48 |
(64) 0x406d38 CBZ W14, 406da0 |
0x406d3c LDR D6, [X5] |
0x406d40 LDR W8, [X15, X6,LSL #2] |
0x406d44 STR W8, [X10] |
0x406d48 LDR W9, [X16, X6,LSL #2] |
0x406d4c ADD X6, X6, #1 |
0x406d50 STR D6, [X10, #8] |
0x406d54 LDR D7, [X5, #8] |
0x406d58 STR W9, [X10, #4] |
0x406d5c STR D7, [X10, #16] |
0x406d60 LDR D16, [X5, #16] |
0x406d64 ADD X5, X30, #48 |
0x406d68 STR D16, [X10, #24] |
0x406d6c LDR D17, [X4] |
0x406d70 STR D17, [X10, #32] |
0x406d74 LDR D18, [X4, #8] |
0x406d78 STR D18, [X10, #40] |
0x406d7c LDR D19, [X4, #16] |
0x406d80 ADD X4, X0, #48 |
0x406d84 STR D19, [X10, #48] |
0x406d88 ADD X10, X19, #112 |
0x406d8c CMP W20, W6 |
0x406d90 B.LE 406e48 |
0x406d94 HINT #0 |
0x406d98 HINT #0 |
0x406d9c HINT #0 |
(66) 0x406da0 LDR D20, [X5] |
(66) 0x406da4 ADD X2, X6, #1 |
(66) 0x406da8 ADD X12, X10, #56 |
(66) 0x406dac ADD X13, X5, #24 |
(66) 0x406db0 ADD X14, X4, #24 |
(66) 0x406db4 LDR W11, [X15, X6,LSL #2] |
(66) 0x406db8 ADD X10, X10, #112 |
(66) 0x406dbc ADD X5, X5, #48 |
(66) 0x406dc0 ADD X4, X4, #48 |
(66) 0x406dc4 STUR W11, [X10, #400] |
(66) 0x406dc8 LDR W17, [X16, X6,LSL #2] |
(66) 0x406dcc ADD X6, X6, #2 |
(66) 0x406dd0 STUR D20, [X10, #408] |
(66) 0x406dd4 LDUR D21, [X5, #472] |
(66) 0x406dd8 STUR W17, [X10, #404] |
(66) 0x406ddc LDR W18, [X15, X2,LSL #2] |
(66) 0x406de0 STUR D21, [X10, #416] |
(66) 0x406de4 LDUR D22, [X5, #480] |
(66) 0x406de8 STUR D22, [X10, #424] |
(66) 0x406dec LDUR D23, [X4, #464] |
(66) 0x406df0 STUR D23, [X10, #432] |
(66) 0x406df4 LDUR D24, [X4, #472] |
(66) 0x406df8 STUR D24, [X10, #440] |
(66) 0x406dfc LDUR D25, [X4, #480] |
(66) 0x406e00 STUR W18, [X10, #456] |
(66) 0x406e04 LDR W30, [X16, X2,LSL #2] |
(66) 0x406e08 STUR D25, [X10, #448] |
(66) 0x406e0c LDUR D26, [X5, #488] |
(66) 0x406e10 STR W30, [X12, #4] |
(66) 0x406e14 STR D26, [X12, #8] |
(66) 0x406e18 LDR D27, [X13, #8] |
(66) 0x406e1c STR D27, [X12, #16] |
(66) 0x406e20 LDR D28, [X13, #16] |
(66) 0x406e24 STR D28, [X12, #24] |
(66) 0x406e28 LDUR D29, [X4, #488] |
(66) 0x406e2c STR D29, [X12, #32] |
(66) 0x406e30 LDR D30, [X14, #8] |
(66) 0x406e34 STR D30, [X12, #40] |
(66) 0x406e38 LDR D31, [X14, #16] |
(66) 0x406e3c STR D31, [X12, #48] |
(66) 0x406e40 CMP W20, W6 |
(66) 0x406e44 B.GT 406da0 |
(64) 0x406e48 ADRP X15, |
(64) 0x406e4c MOVZ X2, #56 |
(64) 0x406e50 ADD X3, X15, #3936 |
(64) 0x406e54 ORR X0, XZR, X19 |
(64) 0x406e58 BL 401de0 |
(64) 0x406e5c LDR W7, [X19] |
(64) 0x406e60 ORN W1, WZR, W23 |
(64) 0x406e64 ADD X4, X23, #1 |
(64) 0x406e68 LDP X9, X8, [X22, #8] |
(64) 0x406e6c ADD W3, W20, W1 |
(64) 0x406e70 ADD X13, X19, #56 |
(64) 0x406e74 AND W6, W3, #0 |
(64) 0x406e78 LDP X5, X0, [X22, #24] |
(64) 0x406e7c LDR D0, [X19, #8] |
(64) 0x406e80 STR W7, [X9, X23,LSL #2] |
(64) 0x406e84 ADD X10, X5, X21 |
(64) 0x406e88 ADD X21, X0, X21 |
(64) 0x406e8c LDR W22, [X19, #4] |
(64) 0x406e90 ADD X12, X10, #24 |
(64) 0x406e94 ADD X2, X21, #24 |
(64) 0x406e98 STR W22, [X8, X23,LSL #2] |
(64) 0x406e9c STR D0, [X10] |
(64) 0x406ea0 LDR D1, [X19, #16] |
(64) 0x406ea4 STR D1, [X10, #8] |
(64) 0x406ea8 LDR D2, [X19, #24] |
(64) 0x406eac STR D2, [X10, #16] |
(64) 0x406eb0 LDR D3, [X19, #32] |
(64) 0x406eb4 STR D3, [X21] |
(64) 0x406eb8 LDR D4, [X19, #40] |
(64) 0x406ebc STR D4, [X21, #8] |
(64) 0x406ec0 LDR D5, [X19, #48] |
(64) 0x406ec4 STR D5, [X21, #16] |
(64) 0x406ec8 CMP W20, W4 |
(64) 0x406ecc B.LE 406fd4 |
(64) 0x406ed0 CBZ W6, 406f2c |
0x406ed4 LDR W16, [X13] |
0x406ed8 LDR D6, [X13, #8] |
0x406edc STR W16, [X9, X4,LSL #2] |
0x406ee0 LDR W23, [X13, #4] |
0x406ee4 STR W23, [X8, X4,LSL #2] |
0x406ee8 ADD X4, X4, #1 |
0x406eec STR D6, [X12] |
0x406ef0 LDR D7, [X13, #16] |
0x406ef4 STR D7, [X12, #8] |
0x406ef8 LDR D16, [X13, #24] |
0x406efc STR D16, [X12, #16] |
0x406f00 ADD X12, X10, #48 |
0x406f04 LDR D17, [X13, #32] |
0x406f08 STR D17, [X2] |
0x406f0c LDR D18, [X13, #40] |
0x406f10 STR D18, [X2, #8] |
0x406f14 LDR D19, [X13, #48] |
0x406f18 ADD X13, X19, #112 |
0x406f1c STR D19, [X2, #16] |
0x406f20 ADD X2, X21, #48 |
0x406f24 CMP W20, W4 |
0x406f28 B.LE 406fd4 |
(65) 0x406f2c LDR W18, [X13] |
(65) 0x406f30 ADD X14, X13, #56 |
(65) 0x406f34 ADD X19, X4, #1 |
(65) 0x406f38 ADD X11, X12, #24 |
(65) 0x406f3c ADD X17, X2, #24 |
(65) 0x406f40 LDR D20, [X13, #8] |
(65) 0x406f44 ADD X12, X12, #48 |
(65) 0x406f48 ADD X13, X13, #112 |
(65) 0x406f4c ADD X2, X2, #48 |
(65) 0x406f50 STR W18, [X9, X4,LSL #2] |
(65) 0x406f54 LDUR W30, [X13, #404] |
(65) 0x406f58 STR W30, [X8, X4,LSL #2] |
(65) 0x406f5c ADD X4, X4, #2 |
(65) 0x406f60 LDUR W15, [X13, #456] |
(65) 0x406f64 STUR D20, [X12, #464] |
(65) 0x406f68 LDUR D21, [X13, #416] |
(65) 0x406f6c STUR D21, [X12, #472] |
(65) 0x406f70 LDUR D22, [X13, #424] |
(65) 0x406f74 STUR D22, [X12, #480] |
(65) 0x406f78 LDUR D23, [X13, #432] |
(65) 0x406f7c STUR D23, [X2, #464] |
(65) 0x406f80 LDUR D24, [X13, #440] |
(65) 0x406f84 STUR D24, [X2, #472] |
(65) 0x406f88 LDUR D25, [X13, #448] |
(65) 0x406f8c STUR D25, [X2, #480] |
(65) 0x406f90 STR W15, [X9, X19,LSL #2] |
(65) 0x406f94 LDR W1, [X14, #4] |
(65) 0x406f98 LDR D26, [X14, #8] |
(65) 0x406f9c STR W1, [X8, X19,LSL #2] |
(65) 0x406fa0 STUR D26, [X12, #488] |
(65) 0x406fa4 LDR D27, [X14, #16] |
(65) 0x406fa8 STUR D27, [X12, #496] |
(65) 0x406fac LDR D28, [X14, #24] |
(65) 0x406fb0 STR D28, [X11, #16] |
(65) 0x406fb4 LDR D29, [X14, #32] |
(65) 0x406fb8 STUR D29, [X2, #488] |
(65) 0x406fbc LDR D30, [X14, #40] |
(65) 0x406fc0 STR D30, [X17, #8] |
(65) 0x406fc4 LDR D31, [X14, #48] |
(65) 0x406fc8 STR D31, [X17, #16] |
(65) 0x406fcc CMP W20, W4 |
(65) 0x406fd0 B.GT 406f2c |
(64) 0x406fd4 ADRP X20, |
(64) 0x406fd8 LDR X3, [X20, #4048] |
(64) 0x406fdc LDR X2, [X29, #72] |
(64) 0x406fe0 LDR X1, [X3] |
(64) 0x406fe4 SUBS X2, X2, X1 |
(64) 0x406fe8 MOVZ X1, #0 |
(64) 0x406fec B.NE 407028 |
(64) 0x406ff0 ADD SP, X29, #0 |
(64) 0x406ff4 LDP X19, X20, [SP, #16] |
(64) 0x406ff8 LDP X21, X22, [SP, #32] |
(64) 0x406ffc LDR X23, [SP, #48] |
(64) 0x407000 LDP X29, X30, [SP], #80 |
(64) 0x407004 RET |
(64) 0x407008 STR XZR, [SP, #1024] |
(64) 0x40700c B 406ca4 |
(64) 0x407010 ADRP X2, |
(64) 0x407014 ORR X0, XZR, X19 |
(64) 0x407018 ADD X3, X2, #3936 |
(64) 0x40701c MOVZ X2, #56 |
(64) 0x407020 BL 401de0 |
(64) 0x407024 B 406fd4 |
0x407028 BL 401f10 |
0x40702c HINT #0 |
0x407030 HINT #0 |
0x407034 HINT #0 |
0x407038 HINT #0 |
0x40703c HINT #0 |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►18.18+ | redistributeAtoms._omp_fn.0 | timestep.c:154 | exec |
○ | GOMP_parallel | libomp.so | |
○ | redistributeAtoms | timestep.c:155 | exec |
○ | timestep | timestep.c:47 | exec |
○ | main | CoMD.c:125 | exec |
○ | __libc_start_main | libc-2.31.so | |
○ | _start | CoMD.c:150 | exec |
►16.36+ | redistributeAtoms._omp_fn.0 | timestep.c:154 | exec |
○ | GOMP_parallel | libomp.so | |
○ | redistributeAtoms | timestep.c:155 | exec |
○ | timestep | timestep.c:47 | exec |
○ | main | CoMD.c:125 | exec |
○ | __libc_start_main | libc-2.31.so | |
○ | _start | CoMD.c:150 | exec |
►16.36+ | redistributeAtoms._omp_fn.0 | timestep.c:154 | exec |
○ | GOMP_parallel | libomp.so | |
○ | redistributeAtoms | timestep.c:155 | exec |
○ | timestep | timestep.c:47 | exec |
○ | main | CoMD.c:125 | exec |
○ | __libc_start_main | libc-2.31.so | |
○ | _start | CoMD.c:150 | exec |
►16.36+ | redistributeAtoms._omp_fn.0 | timestep.c:154 | exec |
○ | GOMP_parallel | libomp.so | |
○ | redistributeAtoms | timestep.c:155 | exec |
○ | timestep | timestep.c:47 | exec |
○ | main | CoMD.c:125 | exec |
○ | __libc_start_main | libc-2.31.so | |
○ | _start | CoMD.c:150 | exec |
►12.73+ | redistributeAtoms._omp_fn.0 | timestep.c:154 | exec |
○ | GOMP_parallel | libomp.so | |
○ | redistributeAtoms | timestep.c:155 | exec |
○ | timestep | timestep.c:47 | exec |
○ | main | CoMD.c:125 | exec |
○ | __libc_start_main | libc-2.31.so | |
○ | _start | CoMD.c:150 | exec |
►10.91+ | redistributeAtoms._omp_fn.0 | timestep.c:154 | exec |
○ | GOMP_parallel | libomp.so | |
○ | redistributeAtoms | timestep.c:155 | exec |
○ | timestep | timestep.c:47 | exec |
○ | main | CoMD.c:125 | exec |
○ | __libc_start_main | libc-2.31.so | |
○ | _start | CoMD.c:150 | exec |
►5.45+ | redistributeAtoms._omp_fn.0 | timestep.c:154 | exec |
○ | GOMP_parallel | libomp.so | |
○ | redistributeAtoms | timestep.c:155 | exec |
○ | timestep | timestep.c:47 | exec |
○ | main | CoMD.c:125 | exec |
○ | __libc_start_main | libc-2.31.so | |
○ | _start | CoMD.c:150 | exec |
►3.64+ | redistributeAtoms._omp_fn.0 | timestep.c:154 | exec |
○ | GOMP_parallel | libomp.so | |
○ | redistributeAtoms | timestep.c:155 | exec |
○ | timestep | timestep.c:47 | exec |
○ | main | CoMD.c:125 | exec |
○ | __libc_start_main | libc-2.31.so | |
○ | _start | CoMD.c:150 | exec |
Path / |
Source file and lines | haloExchange.c:614-645 |
Module | exec |
nb instructions | 81 |
loop length | 324 |
nb stack references | 0 |
front end | 9.13 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | P12 | P13 | P14 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 2.50 | 2.50 | 7.00 | 7.00 | 7.00 | 7.00 | 6.00 | 6.00 | 0.00 | 0.00 | 14.00 | 14.00 | 14.00 | 5.00 | 5.00 |
cycles | 2.50 | 2.50 | 7.00 | 7.00 | 7.00 | 7.00 | 6.00 | 6.00 | 0.00 | 0.00 | 14.00 | 14.00 | 14.00 | 5.00 | 5.00 |
Cycles executing div or sqrt instructions | NA |
Front-end | 9.13 |
Overall L1 | 14.00 |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | 0% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | P12 | P13 | P14 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
STP X29, X30, [SP, #944]! | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
ADD X29, SP, #0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADRP X3, <420c2c> | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LDR X4, [X1, #120] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
MOVZ W1, #56 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STP X19, X20, [SP, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
LDR X5, [X3, #4048] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
STP X21, X22, [SP, #32] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
ORR X22, XZR, X0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LDR W20, [X4, X2,SXTW #2] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
STR X23, [SP, #48] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
LDR X0, [X5] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
STR X0, [X29, #72] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
MOVZ X0, #0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB SP, SP, #16 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SMADDL X0, W20, W1, XZR | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
SBFM X1, X20, #0, #31 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X6, X0, #15 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
AND X7, X6, #7152 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
AND X8, X6, #7932 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB X9, SP, X7,UXTX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 0.50 |
CMP SP, X9,UXTX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 0.50 |
B.EQ 406c90 <sortAtomsInCell+0x6c> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
AND X10, X8, #5056 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB SP, SP, X10,UXTX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 0.50 |
STR XZR, [SP] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
CMP X10, #1024 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
B.CS 407008 <sortAtomsInCell+0x3e4> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
LDR D6, [X5] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
LDR W8, [X15, X6,LSL #2] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
STR W8, [X10] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
LDR W9, [X16, X6,LSL #2] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
ADD X6, X6, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STR D6, [X10, #8] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
LDR D7, [X5, #8] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
STR W9, [X10, #4] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STR D7, [X10, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
LDR D16, [X5, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
ADD X5, X30, #48 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STR D16, [X10, #24] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
LDR D17, [X4] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
STR D17, [X10, #32] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
LDR D18, [X4, #8] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
STR D18, [X10, #40] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
LDR D19, [X4, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
ADD X4, X0, #48 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STR D19, [X10, #48] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
ADD X10, X19, #112 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP W20, W6 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
B.LE 406e48 <sortAtomsInCell+0x224> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
LDR W16, [X13] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR D6, [X13, #8] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
STR W16, [X9, X4,LSL #2] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
LDR W23, [X13, #4] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
STR W23, [X8, X4,LSL #2] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
ADD X4, X4, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STR D6, [X12] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
LDR D7, [X13, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
STR D7, [X12, #8] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
LDR D16, [X13, #24] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
STR D16, [X12, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
ADD X12, X10, #48 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LDR D17, [X13, #32] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
STR D17, [X2] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
LDR D18, [X13, #40] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
STR D18, [X2, #8] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
LDR D19, [X13, #48] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
ADD X13, X19, #112 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STR D19, [X2, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
ADD X2, X21, #48 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP W20, W4 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
B.LE 406fd4 <sortAtomsInCell+0x3b0> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
BL 401f10 <@plt_start@+0x1b0> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
HINT #0 |
Source file and lines | haloExchange.c:614-645 |
Module | exec |
nb instructions | 81 |
loop length | 324 |
nb stack references | 0 |
front end | 9.13 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | P12 | P13 | P14 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 2.50 | 2.50 | 7.00 | 7.00 | 7.00 | 7.00 | 6.00 | 6.00 | 0.00 | 0.00 | 14.00 | 14.00 | 14.00 | 5.00 | 5.00 |
cycles | 2.50 | 2.50 | 7.00 | 7.00 | 7.00 | 7.00 | 6.00 | 6.00 | 0.00 | 0.00 | 14.00 | 14.00 | 14.00 | 5.00 | 5.00 |
Cycles executing div or sqrt instructions | NA |
Front-end | 9.13 |
Overall L1 | 14.00 |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | 0% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | P12 | P13 | P14 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
STP X29, X30, [SP, #944]! | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
ADD X29, SP, #0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADRP X3, <420c2c> | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LDR X4, [X1, #120] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
MOVZ W1, #56 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STP X19, X20, [SP, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
LDR X5, [X3, #4048] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
STP X21, X22, [SP, #32] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
ORR X22, XZR, X0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LDR W20, [X4, X2,SXTW #2] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
STR X23, [SP, #48] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
LDR X0, [X5] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
STR X0, [X29, #72] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
MOVZ X0, #0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB SP, SP, #16 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SMADDL X0, W20, W1, XZR | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
SBFM X1, X20, #0, #31 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X6, X0, #15 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
AND X7, X6, #7152 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
AND X8, X6, #7932 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB X9, SP, X7,UXTX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 0.50 |
CMP SP, X9,UXTX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 0.50 |
B.EQ 406c90 <sortAtomsInCell+0x6c> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
AND X10, X8, #5056 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB SP, SP, X10,UXTX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 0.50 |
STR XZR, [SP] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
CMP X10, #1024 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
B.CS 407008 <sortAtomsInCell+0x3e4> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
LDR D6, [X5] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
LDR W8, [X15, X6,LSL #2] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
STR W8, [X10] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
LDR W9, [X16, X6,LSL #2] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
ADD X6, X6, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STR D6, [X10, #8] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
LDR D7, [X5, #8] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
STR W9, [X10, #4] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STR D7, [X10, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
LDR D16, [X5, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
ADD X5, X30, #48 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STR D16, [X10, #24] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
LDR D17, [X4] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
STR D17, [X10, #32] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
LDR D18, [X4, #8] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
STR D18, [X10, #40] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
LDR D19, [X4, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
ADD X4, X0, #48 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STR D19, [X10, #48] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
ADD X10, X19, #112 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP W20, W6 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
B.LE 406e48 <sortAtomsInCell+0x224> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
LDR W16, [X13] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR D6, [X13, #8] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
STR W16, [X9, X4,LSL #2] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
LDR W23, [X13, #4] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
STR W23, [X8, X4,LSL #2] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
ADD X4, X4, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STR D6, [X12] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
LDR D7, [X13, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
STR D7, [X12, #8] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
LDR D16, [X13, #24] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
STR D16, [X12, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
ADD X12, X10, #48 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LDR D17, [X13, #32] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
STR D17, [X2] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
LDR D18, [X13, #40] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
STR D18, [X2, #8] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
LDR D19, [X13, #48] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
ADD X13, X19, #112 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STR D19, [X2, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
ADD X2, X21, #48 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP W20, W4 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
B.LE 406fd4 <sortAtomsInCell+0x3b0> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
BL 401f10 <@plt_start@+0x1b0> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
HINT #0 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼sortAtomsInCell– | 0.68 | 0.28 |
▼Loop 64 - haloExchange.c:617-645 - exec– | 0.06 | 0.02 |
○Loop 66 - haloExchange.c:621-630 - exec | 0.43 | 0.17 |
○Loop 65 - haloExchange.c:633-642 - exec | 0.16 | 0.06 |
○Loop 67 - haloExchange.c:617-617 - exec | 0 | 0 |