Function: sortAtomsInCell | Module: exec | Source: haloExchange.c:614-645 | Coverage: 1.2% |
---|
Function: sortAtomsInCell | Module: exec | Source: haloExchange.c:614-645 | Coverage: 1.2% |
---|
/home/hbollore/qaas-runs/170-265-5545/intel/CoMD/build/CoMD/CoMD/src-openmp/haloExchange.c: 614 - 645 |
-------------------------------------------------------------------------------- |
614: { |
615: int nAtoms = boxes->nAtoms[iBox]; |
616: |
617: AtomMsg tmp[nAtoms]; |
618: |
619: int begin = iBox*MAXATOMS; |
620: int end = begin + nAtoms; |
621: for (int ii=begin, iTmp=0; ii<end; ++ii, ++iTmp) |
622: { |
623: tmp[iTmp].gid = atoms->gid[ii]; |
624: tmp[iTmp].type = atoms->iSpecies[ii]; |
625: tmp[iTmp].rx = atoms->r[ii][0]; |
626: tmp[iTmp].ry = atoms->r[ii][1]; |
627: tmp[iTmp].rz = atoms->r[ii][2]; |
628: tmp[iTmp].px = atoms->p[ii][0]; |
629: tmp[iTmp].py = atoms->p[ii][1]; |
630: tmp[iTmp].pz = atoms->p[ii][2]; |
631: } |
632: qsort(&tmp, nAtoms, sizeof(AtomMsg), sortAtomsById); |
633: for (int ii=begin, iTmp=0; ii<end; ++ii, ++iTmp) |
634: { |
635: atoms->gid[ii] = tmp[iTmp].gid; |
636: atoms->iSpecies[ii] = tmp[iTmp].type; |
637: atoms->r[ii][0] = tmp[iTmp].rx; |
638: atoms->r[ii][1] = tmp[iTmp].ry; |
639: atoms->r[ii][2] = tmp[iTmp].rz; |
640: atoms->p[ii][0] = tmp[iTmp].px; |
641: atoms->p[ii][1] = tmp[iTmp].py; |
642: atoms->p[ii][2] = tmp[iTmp].pz; |
643: } |
644: |
645: } |
0x407164 STP X29, X30, [SP, #944]! |
0x407168 ADD X29, SP, #0 |
0x40716c ADRP X3, <42116c> |
0x407170 LDR X4, [X1, #120] |
0x407174 MOVZ W1, #56 |
0x407178 STP X19, X20, [SP, #16] |
0x40717c LDR X5, [X3, #3976] |
0x407180 STP X21, X22, [SP, #32] |
0x407184 ORR X22, XZR, X0 |
0x407188 LDR W20, [X4, X2,SXTW #2] |
0x40718c STR X23, [SP, #48] |
0x407190 LDR X0, [X5] |
0x407194 STR X0, [X29, #72] |
0x407198 MOVZ X0, #0 |
0x40719c SUB SP, SP, #16 |
0x4071a0 SMADDL X0, W20, W1, XZR |
0x4071a4 SBFM X1, X20, #0, #31 |
0x4071a8 ADD X6, X0, #15 |
0x4071ac AND X7, X6, #7152 |
0x4071b0 AND X8, X6, #7932 |
0x4071b4 SUB X9, SP, X7,UXTX |
0x4071b8 CMP SP, X9,UXTX |
0x4071bc B.EQ 4071d0 |
(70) 0x4071c0 SUB SP, SP, #16 |
(70) 0x4071c4 STR XZR, [SP, #1024] |
(70) 0x4071c8 CMP SP, X9,UXTX |
(70) 0x4071cc B.NE 4071c0 |
0x4071d0 AND X10, X8, #5056 |
0x4071d4 SUB SP, SP, X10,UXTX |
0x4071d8 STR XZR, [SP] |
0x4071dc CMP X10, #1024 |
0x4071e0 B.CS 407548 |
(67) 0x4071e4 UBFM W21, W2, #26, #25 |
(67) 0x4071e8 ADD X19, SP, #16 |
(67) 0x4071ec ADD W20, W20, W21 |
(67) 0x4071f0 CMP W21, W20 |
(67) 0x4071f4 B.GE 407550 |
(67) 0x4071f8 MOVZ W11, #24 |
(67) 0x4071fc LDP X17, X18, [X22, #24] |
(67) 0x407200 SBFM X23, X21, #0, #31 |
(67) 0x407204 ORN W12, WZR, W21 |
(67) 0x407208 ADD X6, X23, #1 |
(67) 0x40720c SMADDL X21, W21, W11, XZR |
(67) 0x407210 ADD W13, W20, W12 |
(67) 0x407214 ADD X10, X19, #56 |
(67) 0x407218 LDP X15, X16, [X22, #8] |
(67) 0x40721c AND W14, W13, #0 |
(67) 0x407220 ADD X30, X17, X21 |
(67) 0x407224 ADD X0, X18, X21 |
(67) 0x407228 ADD X5, X30, #24 |
(67) 0x40722c ADD X4, X0, #24 |
(67) 0x407230 LDR D0, [X30] |
(67) 0x407234 LDR W3, [X15, X23,LSL #2] |
(67) 0x407238 STR W3, [X19] |
(67) 0x40723c LDR W7, [X16, X23,LSL #2] |
(67) 0x407240 STR D0, [X19, #8] |
(67) 0x407244 LDR D1, [X30, #8] |
(67) 0x407248 STR W7, [X19, #4] |
(67) 0x40724c STR D1, [X19, #16] |
(67) 0x407250 LDR D2, [X30, #16] |
(67) 0x407254 STR D2, [X19, #24] |
(67) 0x407258 LDR D3, [X0] |
(67) 0x40725c STR D3, [X19, #32] |
(67) 0x407260 LDR D4, [X0, #8] |
(67) 0x407264 STR D4, [X19, #40] |
(67) 0x407268 LDR D5, [X0, #16] |
(67) 0x40726c STR D5, [X19, #48] |
(67) 0x407270 CMP W20, W6 |
(67) 0x407274 B.LE 407388 |
(67) 0x407278 CBZ W14, 4072e0 |
0x40727c LDR D6, [X5] |
0x407280 LDR W8, [X15, X6,LSL #2] |
0x407284 STR W8, [X10] |
0x407288 LDR W9, [X16, X6,LSL #2] |
0x40728c ADD X6, X6, #1 |
0x407290 STR D6, [X10, #8] |
0x407294 LDR D7, [X5, #8] |
0x407298 STR W9, [X10, #4] |
0x40729c STR D7, [X10, #16] |
0x4072a0 LDR D16, [X5, #16] |
0x4072a4 ADD X5, X30, #48 |
0x4072a8 STR D16, [X10, #24] |
0x4072ac LDR D17, [X4] |
0x4072b0 STR D17, [X10, #32] |
0x4072b4 LDR D18, [X4, #8] |
0x4072b8 STR D18, [X10, #40] |
0x4072bc LDR D19, [X4, #16] |
0x4072c0 ADD X4, X0, #48 |
0x4072c4 STR D19, [X10, #48] |
0x4072c8 ADD X10, X19, #112 |
0x4072cc CMP W20, W6 |
0x4072d0 B.LE 407388 |
0x4072d4 HINT #0 |
0x4072d8 HINT #0 |
0x4072dc HINT #0 |
(69) 0x4072e0 LDR D20, [X5] |
(69) 0x4072e4 ADD X2, X6, #1 |
(69) 0x4072e8 ADD X12, X10, #56 |
(69) 0x4072ec ADD X13, X5, #24 |
(69) 0x4072f0 ADD X14, X4, #24 |
(69) 0x4072f4 LDR W11, [X15, X6,LSL #2] |
(69) 0x4072f8 ADD X10, X10, #112 |
(69) 0x4072fc ADD X5, X5, #48 |
(69) 0x407300 ADD X4, X4, #48 |
(69) 0x407304 STUR W11, [X10, #400] |
(69) 0x407308 LDR W17, [X16, X6,LSL #2] |
(69) 0x40730c ADD X6, X6, #2 |
(69) 0x407310 STUR D20, [X10, #408] |
(69) 0x407314 LDUR D21, [X5, #472] |
(69) 0x407318 STUR W17, [X10, #404] |
(69) 0x40731c LDR W18, [X15, X2,LSL #2] |
(69) 0x407320 STUR D21, [X10, #416] |
(69) 0x407324 LDUR D22, [X5, #480] |
(69) 0x407328 STUR D22, [X10, #424] |
(69) 0x40732c LDUR D23, [X4, #464] |
(69) 0x407330 STUR D23, [X10, #432] |
(69) 0x407334 LDUR D24, [X4, #472] |
(69) 0x407338 STUR D24, [X10, #440] |
(69) 0x40733c LDUR D25, [X4, #480] |
(69) 0x407340 STUR W18, [X10, #456] |
(69) 0x407344 LDR W30, [X16, X2,LSL #2] |
(69) 0x407348 STUR D25, [X10, #448] |
(69) 0x40734c LDUR D26, [X5, #488] |
(69) 0x407350 STR W30, [X12, #4] |
(69) 0x407354 STR D26, [X12, #8] |
(69) 0x407358 LDR D27, [X13, #8] |
(69) 0x40735c STR D27, [X12, #16] |
(69) 0x407360 LDR D28, [X13, #16] |
(69) 0x407364 STR D28, [X12, #24] |
(69) 0x407368 LDUR D29, [X4, #488] |
(69) 0x40736c STR D29, [X12, #32] |
(69) 0x407370 LDR D30, [X14, #8] |
(69) 0x407374 STR D30, [X12, #40] |
(69) 0x407378 LDR D31, [X14, #16] |
(69) 0x40737c STR D31, [X12, #48] |
(69) 0x407380 CMP W20, W6 |
(69) 0x407384 B.GT 4072e0 |
(67) 0x407388 ADRP X15, |
(67) 0x40738c MOVZ X2, #56 |
(67) 0x407390 ADD X3, X15, #928 |
(67) 0x407394 ORR X0, XZR, X19 |
(67) 0x407398 BL 402320 |
(67) 0x40739c LDR W7, [X19] |
(67) 0x4073a0 ORN W1, WZR, W23 |
(67) 0x4073a4 ADD X4, X23, #1 |
(67) 0x4073a8 LDP X9, X8, [X22, #8] |
(67) 0x4073ac ADD W3, W20, W1 |
(67) 0x4073b0 ADD X13, X19, #56 |
(67) 0x4073b4 AND W6, W3, #0 |
(67) 0x4073b8 LDP X5, X0, [X22, #24] |
(67) 0x4073bc LDR D0, [X19, #8] |
(67) 0x4073c0 STR W7, [X9, X23,LSL #2] |
(67) 0x4073c4 ADD X10, X5, X21 |
(67) 0x4073c8 ADD X21, X0, X21 |
(67) 0x4073cc LDR W22, [X19, #4] |
(67) 0x4073d0 ADD X12, X10, #24 |
(67) 0x4073d4 ADD X2, X21, #24 |
(67) 0x4073d8 STR W22, [X8, X23,LSL #2] |
(67) 0x4073dc STR D0, [X10] |
(67) 0x4073e0 LDR D1, [X19, #16] |
(67) 0x4073e4 STR D1, [X10, #8] |
(67) 0x4073e8 LDR D2, [X19, #24] |
(67) 0x4073ec STR D2, [X10, #16] |
(67) 0x4073f0 LDR D3, [X19, #32] |
(67) 0x4073f4 STR D3, [X21] |
(67) 0x4073f8 LDR D4, [X19, #40] |
(67) 0x4073fc STR D4, [X21, #8] |
(67) 0x407400 LDR D5, [X19, #48] |
(67) 0x407404 STR D5, [X21, #16] |
(67) 0x407408 CMP W20, W4 |
(67) 0x40740c B.LE 407514 |
(67) 0x407410 CBZ W6, 40746c |
0x407414 LDR W16, [X13] |
0x407418 LDR D6, [X13, #8] |
0x40741c STR W16, [X9, X4,LSL #2] |
0x407420 LDR W23, [X13, #4] |
0x407424 STR W23, [X8, X4,LSL #2] |
0x407428 ADD X4, X4, #1 |
0x40742c STR D6, [X12] |
0x407430 LDR D7, [X13, #16] |
0x407434 STR D7, [X12, #8] |
0x407438 LDR D16, [X13, #24] |
0x40743c STR D16, [X12, #16] |
0x407440 ADD X12, X10, #48 |
0x407444 LDR D17, [X13, #32] |
0x407448 STR D17, [X2] |
0x40744c LDR D18, [X13, #40] |
0x407450 STR D18, [X2, #8] |
0x407454 LDR D19, [X13, #48] |
0x407458 ADD X13, X19, #112 |
0x40745c STR D19, [X2, #16] |
0x407460 ADD X2, X21, #48 |
0x407464 CMP W20, W4 |
0x407468 B.LE 407514 |
(68) 0x40746c LDR W18, [X13] |
(68) 0x407470 ADD X14, X13, #56 |
(68) 0x407474 ADD X19, X4, #1 |
(68) 0x407478 ADD X11, X12, #24 |
(68) 0x40747c ADD X17, X2, #24 |
(68) 0x407480 LDR D20, [X13, #8] |
(68) 0x407484 ADD X12, X12, #48 |
(68) 0x407488 ADD X13, X13, #112 |
(68) 0x40748c ADD X2, X2, #48 |
(68) 0x407490 STR W18, [X9, X4,LSL #2] |
(68) 0x407494 LDUR W30, [X13, #404] |
(68) 0x407498 STR W30, [X8, X4,LSL #2] |
(68) 0x40749c ADD X4, X4, #2 |
(68) 0x4074a0 LDUR W15, [X13, #456] |
(68) 0x4074a4 STUR D20, [X12, #464] |
(68) 0x4074a8 LDUR D21, [X13, #416] |
(68) 0x4074ac STUR D21, [X12, #472] |
(68) 0x4074b0 LDUR D22, [X13, #424] |
(68) 0x4074b4 STUR D22, [X12, #480] |
(68) 0x4074b8 LDUR D23, [X13, #432] |
(68) 0x4074bc STUR D23, [X2, #464] |
(68) 0x4074c0 LDUR D24, [X13, #440] |
(68) 0x4074c4 STUR D24, [X2, #472] |
(68) 0x4074c8 LDUR D25, [X13, #448] |
(68) 0x4074cc STUR D25, [X2, #480] |
(68) 0x4074d0 STR W15, [X9, X19,LSL #2] |
(68) 0x4074d4 LDR W1, [X14, #4] |
(68) 0x4074d8 LDR D26, [X14, #8] |
(68) 0x4074dc STR W1, [X8, X19,LSL #2] |
(68) 0x4074e0 STUR D26, [X12, #488] |
(68) 0x4074e4 LDR D27, [X14, #16] |
(68) 0x4074e8 STUR D27, [X12, #496] |
(68) 0x4074ec LDR D28, [X14, #24] |
(68) 0x4074f0 STR D28, [X11, #16] |
(68) 0x4074f4 LDR D29, [X14, #32] |
(68) 0x4074f8 STUR D29, [X2, #488] |
(68) 0x4074fc LDR D30, [X14, #40] |
(68) 0x407500 STR D30, [X17, #8] |
(68) 0x407504 LDR D31, [X14, #48] |
(68) 0x407508 STR D31, [X17, #16] |
(68) 0x40750c CMP W20, W4 |
(68) 0x407510 B.GT 40746c |
(67) 0x407514 ADRP X20, |
(67) 0x407518 LDR X3, [X20, #3976] |
(67) 0x40751c LDR X2, [X29, #72] |
(67) 0x407520 LDR X1, [X3] |
(67) 0x407524 SUBS X2, X2, X1 |
(67) 0x407528 MOVZ X1, #0 |
(67) 0x40752c B.NE 407568 |
(67) 0x407530 ADD SP, X29, #0 |
(67) 0x407534 LDP X19, X20, [SP, #16] |
(67) 0x407538 LDP X21, X22, [SP, #32] |
(67) 0x40753c LDR X23, [SP, #48] |
(67) 0x407540 LDP X29, X30, [SP], #80 |
(67) 0x407544 RET |
(67) 0x407548 STR XZR, [SP, #1024] |
(67) 0x40754c B 4071e4 |
(67) 0x407550 ADRP X2, |
(67) 0x407554 ORR X0, XZR, X19 |
(67) 0x407558 ADD X3, X2, #928 |
(67) 0x40755c MOVZ X2, #56 |
(67) 0x407560 BL 402320 |
(67) 0x407564 B 407514 |
0x407568 BL 402290 |
0x40756c HINT #0 |
0x407570 HINT #0 |
0x407574 HINT #0 |
0x407578 HINT #0 |
0x40757c HINT #0 |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►13.03+ | redistributeAtoms._omp_fn.0 | timestep.c:154 | exec |
○ | __kmp_GOMP_microtask_wrapper(i[...] | libomp.so | |
○ | __kmp_invoke_microtask | libomp.so | |
►12.80+ | redistributeAtoms._omp_fn.0 | timestep.c:154 | exec |
○ | __kmp_GOMP_microtask_wrapper(i[...] | libomp.so | |
○ | __kmp_invoke_microtask | libomp.so | |
►12.57+ | redistributeAtoms._omp_fn.0 | timestep.c:154 | exec |
○ | __kmp_GOMP_microtask_wrapper(i[...] | libomp.so | |
○ | __kmp_invoke_microtask | libomp.so | |
►12.53+ | redistributeAtoms._omp_fn.0 | timestep.c:154 | exec |
○ | __kmp_GOMP_microtask_wrapper(i[...] | libomp.so | |
○ | __kmp_invoke_microtask | libomp.so | |
►12.10+ | redistributeAtoms._omp_fn.0 | timestep.c:154 | exec |
○ | __kmp_GOMP_microtask_wrapper(i[...] | libomp.so | |
○ | __kmp_invoke_microtask | libomp.so | |
►12.07+ | redistributeAtoms._omp_fn.0 | timestep.c:154 | exec |
○ | __kmp_GOMP_microtask_wrapper(i[...] | libomp.so | |
○ | __kmp_invoke_microtask | libomp.so | |
►11.99+ | redistributeAtoms._omp_fn.0 | timestep.c:154 | exec |
○ | __kmp_GOMP_microtask_wrapper(i[...] | libomp.so | |
○ | __kmp_invoke_microtask | libomp.so | |
►11.45+ | redistributeAtoms._omp_fn.0 | timestep.c:154 | exec |
○ | __kmp_GOMP_microtask_wrapper(i[...] | libomp.so | |
○ | __kmp_invoke_microtask | libomp.so |
Path / |
Source file and lines | haloExchange.c:614-645 |
Module | exec |
nb instructions | 81 |
loop length | 324 |
nb stack references | 0 |
front end | 9.13 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | P12 | P13 | P14 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 2.50 | 2.50 | 7.00 | 7.00 | 7.00 | 7.00 | 6.00 | 6.00 | 0.00 | 0.00 | 14.00 | 14.00 | 14.00 | 5.00 | 5.00 |
cycles | 2.50 | 2.50 | 7.00 | 7.00 | 7.00 | 7.00 | 6.00 | 6.00 | 0.00 | 0.00 | 14.00 | 14.00 | 14.00 | 5.00 | 5.00 |
Cycles executing div or sqrt instructions | NA |
Front-end | 9.13 |
Overall L1 | 14.00 |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | 0% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | P12 | P13 | P14 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
STP X29, X30, [SP, #944]! | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
ADD X29, SP, #0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADRP X3, <42116c> | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LDR X4, [X1, #120] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
MOVZ W1, #56 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STP X19, X20, [SP, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
LDR X5, [X3, #3976] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
STP X21, X22, [SP, #32] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
ORR X22, XZR, X0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LDR W20, [X4, X2,SXTW #2] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
STR X23, [SP, #48] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
LDR X0, [X5] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
STR X0, [X29, #72] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
MOVZ X0, #0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB SP, SP, #16 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SMADDL X0, W20, W1, XZR | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
SBFM X1, X20, #0, #31 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X6, X0, #15 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
AND X7, X6, #7152 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
AND X8, X6, #7932 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB X9, SP, X7,UXTX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 0.50 |
CMP SP, X9,UXTX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 0.50 |
B.EQ 4071d0 <sortAtomsInCell+0x6c> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
AND X10, X8, #5056 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB SP, SP, X10,UXTX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 0.50 |
STR XZR, [SP] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
CMP X10, #1024 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
B.CS 407548 <sortAtomsInCell+0x3e4> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
LDR D6, [X5] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
LDR W8, [X15, X6,LSL #2] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
STR W8, [X10] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
LDR W9, [X16, X6,LSL #2] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
ADD X6, X6, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STR D6, [X10, #8] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
LDR D7, [X5, #8] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
STR W9, [X10, #4] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STR D7, [X10, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
LDR D16, [X5, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
ADD X5, X30, #48 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STR D16, [X10, #24] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
LDR D17, [X4] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
STR D17, [X10, #32] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
LDR D18, [X4, #8] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
STR D18, [X10, #40] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
LDR D19, [X4, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
ADD X4, X0, #48 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STR D19, [X10, #48] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
ADD X10, X19, #112 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP W20, W6 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
B.LE 407388 <sortAtomsInCell+0x224> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
LDR W16, [X13] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR D6, [X13, #8] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
STR W16, [X9, X4,LSL #2] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
LDR W23, [X13, #4] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
STR W23, [X8, X4,LSL #2] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
ADD X4, X4, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STR D6, [X12] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
LDR D7, [X13, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
STR D7, [X12, #8] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
LDR D16, [X13, #24] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
STR D16, [X12, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
ADD X12, X10, #48 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LDR D17, [X13, #32] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
STR D17, [X2] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
LDR D18, [X13, #40] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
STR D18, [X2, #8] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
LDR D19, [X13, #48] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
ADD X13, X19, #112 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STR D19, [X2, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
ADD X2, X21, #48 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP W20, W4 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
B.LE 407514 <sortAtomsInCell+0x3b0> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
BL 402290 <@plt_start@+0x70> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
HINT #0 |
Source file and lines | haloExchange.c:614-645 |
Module | exec |
nb instructions | 81 |
loop length | 324 |
nb stack references | 0 |
front end | 9.13 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | P12 | P13 | P14 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 2.50 | 2.50 | 7.00 | 7.00 | 7.00 | 7.00 | 6.00 | 6.00 | 0.00 | 0.00 | 14.00 | 14.00 | 14.00 | 5.00 | 5.00 |
cycles | 2.50 | 2.50 | 7.00 | 7.00 | 7.00 | 7.00 | 6.00 | 6.00 | 0.00 | 0.00 | 14.00 | 14.00 | 14.00 | 5.00 | 5.00 |
Cycles executing div or sqrt instructions | NA |
Front-end | 9.13 |
Overall L1 | 14.00 |
all | 0% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | 0% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | P12 | P13 | P14 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
STP X29, X30, [SP, #944]! | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
ADD X29, SP, #0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADRP X3, <42116c> | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LDR X4, [X1, #120] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
MOVZ W1, #56 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STP X19, X20, [SP, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
LDR X5, [X3, #3976] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
STP X21, X22, [SP, #32] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
ORR X22, XZR, X0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LDR W20, [X4, X2,SXTW #2] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
STR X23, [SP, #48] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
LDR X0, [X5] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
STR X0, [X29, #72] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
MOVZ X0, #0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB SP, SP, #16 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SMADDL X0, W20, W1, XZR | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
SBFM X1, X20, #0, #31 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X6, X0, #15 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
AND X7, X6, #7152 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
AND X8, X6, #7932 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB X9, SP, X7,UXTX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 0.50 |
CMP SP, X9,UXTX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 0.50 |
B.EQ 4071d0 <sortAtomsInCell+0x6c> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
AND X10, X8, #5056 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB SP, SP, X10,UXTX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 0.50 |
STR XZR, [SP] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
CMP X10, #1024 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
B.CS 407548 <sortAtomsInCell+0x3e4> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
LDR D6, [X5] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
LDR W8, [X15, X6,LSL #2] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
STR W8, [X10] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
LDR W9, [X16, X6,LSL #2] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
ADD X6, X6, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STR D6, [X10, #8] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
LDR D7, [X5, #8] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
STR W9, [X10, #4] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STR D7, [X10, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
LDR D16, [X5, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
ADD X5, X30, #48 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STR D16, [X10, #24] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
LDR D17, [X4] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
STR D17, [X10, #32] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
LDR D18, [X4, #8] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
STR D18, [X10, #40] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
LDR D19, [X4, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
ADD X4, X0, #48 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STR D19, [X10, #48] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
ADD X10, X19, #112 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP W20, W6 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
B.LE 407388 <sortAtomsInCell+0x224> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
LDR W16, [X13] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR D6, [X13, #8] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
STR W16, [X9, X4,LSL #2] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
LDR W23, [X13, #4] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
STR W23, [X8, X4,LSL #2] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
ADD X4, X4, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STR D6, [X12] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
LDR D7, [X13, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
STR D7, [X12, #8] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
LDR D16, [X13, #24] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
STR D16, [X12, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
ADD X12, X10, #48 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LDR D17, [X13, #32] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
STR D17, [X2] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
LDR D18, [X13, #40] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
STR D18, [X2, #8] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
LDR D19, [X13, #48] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
ADD X13, X19, #112 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STR D19, [X2, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
ADD X2, X21, #48 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP W20, W4 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
B.LE 407514 <sortAtomsInCell+0x3b0> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
BL 402290 <@plt_start@+0x70> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
HINT #0 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼sortAtomsInCell– | 1.2 | 0.21 |
▼Loop 67 - haloExchange.c:617-645 - exec– | 0.35 | 0.06 |
○Loop 69 - haloExchange.c:621-630 - exec | 0.71 | 0.12 |
○Loop 68 - haloExchange.c:633-642 - exec | 0.12 | 0.02 |
○Loop 70 - haloExchange.c:617-617 - exec | 0 | 0 |