| Function: hypre_qsort2abs | Module: exec | Source: par_interp.c:3178-3192 | Coverage (incl. loops): 0.02% | (excl. loops): 0.01% |
|---|
| Function: hypre_qsort2abs | Module: exec | Source: par_interp.c:3178-3192 | Coverage (incl. loops): 0.02% | (excl. loops): 0.01% |
|---|
/home/eoseret/qaas/qaas_runs/178-188-3659/intel/AMG/build/AMG/AMG/parcsr_ls/par_interp.c: 3178 - 3192 |
-------------------------------------------------------------------------------- |
3178: { |
3179: HYPRE_Int i, last; |
3180: if (left >= right) |
3181: return; |
3182: hypre_swap2( v, w, left, (left+right)/2); |
3183: last = left; |
3184: for (i = left+1; i <= right; i++) |
3185: if (fabs(w[i]) > fabs(w[left])) |
3186: { |
3187: hypre_swap2(v, w, ++last, i); |
3188: } |
3189: hypre_swap2(v, w, left, last); |
3190: hypre_qsort2abs(v, w, left, last-1); |
3191: hypre_qsort2abs(v, w, last+1, right); |
3192: } |
0x45052c STP X29, X30, [SP, #-96]! |
0x450530 ADD X29, SP, #0 |
0x450534 STP X19, X20, [SP, #16] |
0x450538 ORR X20, XZR, X1 |
0x45053c STP X21, X22, [SP, #32] |
0x450540 ORR X22, XZR, X2 |
0x450544 STP X23, X24, [SP, #48] |
0x450548 ORR X24, XZR, X0 |
0x45054c STP X25, X26, [SP, #64] |
0x450550 ORR X25, XZR, X3 |
0x450554 STR X27, [SP, #80] |
(595) 0x450558 CMP X25, X22 |
(595) 0x45055c B.LE 4506f4 |
(596) 0x450560 ADD X3, X25, X22 |
(596) 0x450564 ORR X2, XZR, X22 |
(596) 0x450568 ADD X4, X3, X3,LSR #63 |
(596) 0x45056c ORR X1, XZR, X20 |
(596) 0x450570 ORR X0, XZR, X24 |
(596) 0x450574 ADD X19, X22, #1 |
(596) 0x450578 SBFM X3, X4, #1, #63 |
(596) 0x45057c BL 529a40 |
(596) 0x450580 CMP X25, X19 |
(596) 0x450584 B.LT 450a10 |
(596) 0x450588 UBFM X27, X22, #61, #60 |
(596) 0x45058c LDR D31, [X20, X19,LSL #3] |
(596) 0x450590 SUB X26, X25, X19 |
(596) 0x450594 ADD X23, X20, X22,LSL #3 |
(596) 0x450598 AND X26, X26, #0x7 |
(596) 0x45059c ORR X21, XZR, X22 |
(596) 0x4505a0 LDR D30, [X20, X27] |
(596) 0x4505a4 FABS D0, D31 |
(596) 0x4505a8 FABS D1, D30 |
(596) 0x4505ac FCMPE D0, D1 |
(596) 0x4505b0 B.GT 4509d8 |
(596) 0x4505b4 ADD X19, X19, #1 |
(596) 0x4505b8 CMP X25, X19 |
(596) 0x4505bc B.LT 4506c0 |
(596) 0x4505c0 CBZ X26, 4507f8 |
(596) 0x4505c4 CMP X26, #1 |
(596) 0x4505c8 B.EQ 45069c |
(596) 0x4505cc CMP X26, #2 |
(596) 0x4505d0 B.EQ 450680 |
(596) 0x4505d4 CMP X26, #3 |
(596) 0x4505d8 B.EQ 450664 |
(596) 0x4505dc CMP X26, #4 |
(596) 0x4505e0 B.EQ 450648 |
(596) 0x4505e4 CMP X26, #5 |
(596) 0x4505e8 B.EQ 45062c |
(596) 0x4505ec CMP X26, #6 |
(596) 0x4505f0 B.EQ 450610 |
(596) 0x4505f4 LDR D29, [X20, X19,LSL #3] |
(596) 0x4505f8 LDR D28, [X20, X27] |
(596) 0x4505fc FABS D2, D29 |
(596) 0x450600 FABS D3, D28 |
(596) 0x450604 FCMPE D2, D3 |
(596) 0x450608 B.GT 450a48 |
(596) 0x45060c ADD X19, X19, #1 |
(596) 0x450610 LDR D27, [X20, X19,LSL #3] |
(596) 0x450614 LDR D26, [X20, X27] |
(596) 0x450618 FABS D4, D27 |
(596) 0x45061c FABS D5, D26 |
(596) 0x450620 FCMPE D4, D5 |
(596) 0x450624 B.GT 450a2c |
(596) 0x450628 ADD X19, X19, #1 |
(596) 0x45062c LDR D25, [X20, X19,LSL #3] |
(596) 0x450630 LDR D24, [X20, X27] |
(596) 0x450634 FABS D6, D25 |
(596) 0x450638 FABS D7, D24 |
(596) 0x45063c FCMPE D6, D7 |
(596) 0x450640 B.GT 4509bc |
(596) 0x450644 ADD X19, X19, #1 |
(596) 0x450648 LDR D23, [X20, X19,LSL #3] |
(596) 0x45064c LDR D22, [X20, X27] |
(596) 0x450650 FABS D16, D23 |
(596) 0x450654 FABS D17, D22 |
(596) 0x450658 FCMPE D16, D17 |
(596) 0x45065c B.GT 4509a0 |
(596) 0x450660 ADD X19, X19, #1 |
(596) 0x450664 LDR D21, [X20, X19,LSL #3] |
(596) 0x450668 LDR D20, [X20, X27] |
(596) 0x45066c FABS D18, D21 |
(596) 0x450670 FABS D19, D20 |
(596) 0x450674 FCMPE D18, D19 |
(596) 0x450678 B.GT 450984 |
(596) 0x45067c ADD X19, X19, #1 |
(596) 0x450680 LDR D31, [X20, X19,LSL #3] |
(596) 0x450684 LDR D30, [X20, X27] |
(596) 0x450688 FABS D0, D31 |
(596) 0x45068c FABS D1, D30 |
(596) 0x450690 FCMPE D0, D1 |
(596) 0x450694 B.GT 450968 |
(596) 0x450698 ADD X19, X19, #1 |
(596) 0x45069c LDR D29, [X20, X19,LSL #3] |
(596) 0x4506a0 LDR D28, [X20, X27] |
(596) 0x4506a4 FABS D2, D29 |
(596) 0x4506a8 FABS D3, D28 |
(596) 0x4506ac FCMPE D2, D3 |
(596) 0x4506b0 B.GT 4509f4 |
(596) 0x4506b4 ADD X19, X19, #1 |
(596) 0x4506b8 CMP X25, X19 |
(596) 0x4506bc B.GE 4507f8 |
(596) 0x4506c0 ORR X2, XZR, X22 |
(596) 0x4506c4 ORR X3, XZR, X21 |
(596) 0x4506c8 ORR X1, XZR, X20 |
(596) 0x4506cc ORR X0, XZR, X24 |
(596) 0x4506d0 BL 529a40 |
(596) 0x4506d4 ORR X2, XZR, X22 |
(596) 0x4506d8 SUB X3, X21, #1 |
(596) 0x4506dc ORR X1, XZR, X20 |
(596) 0x4506e0 ORR X0, XZR, X24 |
(596) 0x4506e4 ADD X22, X21, #1 |
(596) 0x4506e8 BL 45052c |
(596) 0x4506ec CMP X22, X25 |
(596) 0x4506f0 B.LT 450560 |
0x4506f4 LDR X27, [SP, #80] |
0x4506f8 LDP X19, X20, [SP, #16] |
0x4506fc LDP X21, X22, [SP, #32] |
0x450700 LDP X23, X24, [SP, #48] |
0x450704 LDP X25, X26, [SP, #64] |
0x450708 LDP X29, X30, [SP], #96 |
0x45070c RET |
(597) 0x450710 ADD X21, X21, #1 |
(597) 0x450714 ORR X3, XZR, X19 |
(597) 0x450718 ORR X2, XZR, X21 |
(597) 0x45071c ORR X1, XZR, X20 |
(597) 0x450720 ORR X0, XZR, X24 |
(597) 0x450724 ADD X19, X19, #1 |
(597) 0x450728 BL 529a40 |
(597) 0x45072c LDR D25, [X20, X19,LSL #3] |
(597) 0x450730 LDR D6, [X23] |
(597) 0x450734 FABS D24, D25 |
(597) 0x450738 FABS D7, D6 |
(597) 0x45073c FCMPE D24, D7 |
(597) 0x450740 B.GT 45082c |
(597) 0x450744 ADD X3, X19, #1 |
(597) 0x450748 LDR D16, [X23] |
(597) 0x45074c LDR D23, [X20, X3,LSL #3] |
(597) 0x450750 FABS D17, D16 |
(597) 0x450754 FABS D22, D23 |
(597) 0x450758 FCMPE D22, D17 |
(597) 0x45075c B.GT 450860 |
(597) 0x450760 ADD X3, X19, #2 |
(597) 0x450764 LDR D18, [X23] |
(597) 0x450768 LDR D21, [X20, X3,LSL #3] |
(597) 0x45076c FABS D19, D18 |
(597) 0x450770 FABS D20, D21 |
(597) 0x450774 FCMPE D20, D19 |
(597) 0x450778 B.GT 450890 |
(597) 0x45077c ADD X3, X19, #3 |
(597) 0x450780 LDR D30, [X23] |
(597) 0x450784 LDR D31, [X20, X3,LSL #3] |
(597) 0x450788 FABS D1, D30 |
(597) 0x45078c FABS D0, D31 |
(597) 0x450790 FCMPE D0, D1 |
(597) 0x450794 B.GT 4508c0 |
(597) 0x450798 ADD X3, X19, #4 |
(597) 0x45079c LDR D28, [X23] |
(597) 0x4507a0 LDR D29, [X20, X3,LSL #3] |
(597) 0x4507a4 FABS D3, D28 |
(597) 0x4507a8 FABS D2, D29 |
(597) 0x4507ac FCMPE D2, D3 |
(597) 0x4507b0 B.GT 4508f0 |
(597) 0x4507b4 ADD X3, X19, #5 |
(597) 0x4507b8 LDR D26, [X23] |
(597) 0x4507bc LDR D27, [X20, X3,LSL #3] |
(597) 0x4507c0 FABS D5, D26 |
(597) 0x4507c4 FABS D4, D27 |
(597) 0x4507c8 FCMPE D4, D5 |
(597) 0x4507cc B.GT 450920 |
(597) 0x4507d0 ADD X3, X19, #6 |
(597) 0x4507d4 LDR D24, [X23] |
(597) 0x4507d8 LDR D25, [X20, X3,LSL #3] |
(597) 0x4507dc FABS D7, D24 |
(597) 0x4507e0 FABS D6, D25 |
(597) 0x4507e4 FCMPE D6, D7 |
(597) 0x4507e8 B.GT 450950 |
(597) 0x4507ec ADD X19, X19, #7 |
(597) 0x4507f0 CMP X25, X19 |
(597) 0x4507f4 B.LT 4506c0 |
(597) 0x4507f8 LDR D27, [X20, X19,LSL #3] |
(597) 0x4507fc LDR D4, [X23] |
(597) 0x450800 FABS D26, D27 |
(597) 0x450804 FABS D5, D4 |
(597) 0x450808 FCMPE D26, D5 |
(597) 0x45080c B.GT 450710 |
(597) 0x450810 ADD X19, X19, #1 |
(597) 0x450814 LDR D6, [X23] |
(597) 0x450818 LDR D25, [X20, X19,LSL #3] |
(597) 0x45081c FABS D7, D6 |
(597) 0x450820 FABS D24, D25 |
(597) 0x450824 FCMPE D24, D7 |
(597) 0x450828 B.LS 450744 |
(597) 0x45082c ADD X21, X21, #1 |
(597) 0x450830 ORR X3, XZR, X19 |
(597) 0x450834 ORR X2, XZR, X21 |
(597) 0x450838 ORR X1, XZR, X20 |
(597) 0x45083c ORR X0, XZR, X24 |
(597) 0x450840 BL 529a40 |
(597) 0x450844 ADD X3, X19, #1 |
(597) 0x450848 LDR D16, [X23] |
(597) 0x45084c LDR D23, [X20, X3,LSL #3] |
(597) 0x450850 FABS D17, D16 |
(597) 0x450854 FABS D22, D23 |
(597) 0x450858 FCMPE D22, D17 |
(597) 0x45085c B.LS 450760 |
(597) 0x450860 ADD X21, X21, #1 |
(597) 0x450864 ORR X1, XZR, X20 |
(597) 0x450868 ORR X2, XZR, X21 |
(597) 0x45086c ORR X0, XZR, X24 |
(597) 0x450870 BL 529a40 |
(597) 0x450874 ADD X3, X19, #2 |
(597) 0x450878 LDR D18, [X23] |
(597) 0x45087c LDR D21, [X20, X3,LSL #3] |
(597) 0x450880 FABS D19, D18 |
(597) 0x450884 FABS D20, D21 |
(597) 0x450888 FCMPE D20, D19 |
(597) 0x45088c B.LS 45077c |
(597) 0x450890 ADD X21, X21, #1 |
(597) 0x450894 ORR X1, XZR, X20 |
(597) 0x450898 ORR X2, XZR, X21 |
(597) 0x45089c ORR X0, XZR, X24 |
(597) 0x4508a0 BL 529a40 |
(597) 0x4508a4 ADD X3, X19, #3 |
(597) 0x4508a8 LDR D30, [X23] |
(597) 0x4508ac LDR D31, [X20, X3,LSL #3] |
(597) 0x4508b0 FABS D1, D30 |
(597) 0x4508b4 FABS D0, D31 |
(597) 0x4508b8 FCMPE D0, D1 |
(597) 0x4508bc B.LS 450798 |
(597) 0x4508c0 ADD X21, X21, #1 |
(597) 0x4508c4 ORR X1, XZR, X20 |
(597) 0x4508c8 ORR X2, XZR, X21 |
(597) 0x4508cc ORR X0, XZR, X24 |
(597) 0x4508d0 BL 529a40 |
(597) 0x4508d4 ADD X3, X19, #4 |
(597) 0x4508d8 LDR D28, [X23] |
(597) 0x4508dc LDR D29, [X20, X3,LSL #3] |
(597) 0x4508e0 FABS D3, D28 |
(597) 0x4508e4 FABS D2, D29 |
(597) 0x4508e8 FCMPE D2, D3 |
(597) 0x4508ec B.LS 4507b4 |
(597) 0x4508f0 ADD X21, X21, #1 |
(597) 0x4508f4 ORR X1, XZR, X20 |
(597) 0x4508f8 ORR X2, XZR, X21 |
(597) 0x4508fc ORR X0, XZR, X24 |
(597) 0x450900 BL 529a40 |
(597) 0x450904 ADD X3, X19, #5 |
(597) 0x450908 LDR D26, [X23] |
(597) 0x45090c LDR D27, [X20, X3,LSL #3] |
(597) 0x450910 FABS D5, D26 |
(597) 0x450914 FABS D4, D27 |
(597) 0x450918 FCMPE D4, D5 |
(597) 0x45091c B.LS 4507d0 |
(597) 0x450920 ADD X21, X21, #1 |
(597) 0x450924 ORR X1, XZR, X20 |
(597) 0x450928 ORR X2, XZR, X21 |
(597) 0x45092c ORR X0, XZR, X24 |
(597) 0x450930 BL 529a40 |
(597) 0x450934 ADD X3, X19, #6 |
(597) 0x450938 LDR D24, [X23] |
(597) 0x45093c LDR D25, [X20, X3,LSL #3] |
(597) 0x450940 FABS D7, D24 |
(597) 0x450944 FABS D6, D25 |
(597) 0x450948 FCMPE D6, D7 |
(597) 0x45094c B.LS 4507ec |
(597) 0x450950 ADD X21, X21, #1 |
(597) 0x450954 ORR X1, XZR, X20 |
(597) 0x450958 ORR X2, XZR, X21 |
(597) 0x45095c ORR X0, XZR, X24 |
(597) 0x450960 BL 529a40 |
(597) 0x450964 B 4507ec |
(596) 0x450968 ADD X21, X21, #1 |
(596) 0x45096c ORR X3, XZR, X19 |
(596) 0x450970 ORR X2, XZR, X21 |
(596) 0x450974 ORR X1, XZR, X20 |
(596) 0x450978 ORR X0, XZR, X24 |
(596) 0x45097c BL 529a40 |
(596) 0x450980 B 450698 |
(596) 0x450984 ADD X21, X21, #1 |
(596) 0x450988 ORR X3, XZR, X19 |
(596) 0x45098c ORR X2, XZR, X21 |
(596) 0x450990 ORR X1, XZR, X20 |
(596) 0x450994 ORR X0, XZR, X24 |
(596) 0x450998 BL 529a40 |
(596) 0x45099c B 45067c |
(596) 0x4509a0 ADD X21, X21, #1 |
(596) 0x4509a4 ORR X3, XZR, X19 |
(596) 0x4509a8 ORR X2, XZR, X21 |
(596) 0x4509ac ORR X1, XZR, X20 |
(596) 0x4509b0 ORR X0, XZR, X24 |
(596) 0x4509b4 BL 529a40 |
(596) 0x4509b8 B 450660 |
(596) 0x4509bc ADD X21, X21, #1 |
(596) 0x4509c0 ORR X3, XZR, X19 |
(596) 0x4509c4 ORR X2, XZR, X21 |
(596) 0x4509c8 ORR X1, XZR, X20 |
(596) 0x4509cc ORR X0, XZR, X24 |
(596) 0x4509d0 BL 529a40 |
(596) 0x4509d4 B 450644 |
(596) 0x4509d8 ORR X3, XZR, X19 |
(596) 0x4509dc ORR X2, XZR, X19 |
(596) 0x4509e0 ORR X1, XZR, X20 |
(596) 0x4509e4 ORR X0, XZR, X24 |
(596) 0x4509e8 ORR X21, XZR, X19 |
(596) 0x4509ec BL 529a40 |
(596) 0x4509f0 B 4505b4 |
(596) 0x4509f4 ADD X21, X21, #1 |
(596) 0x4509f8 ORR X3, XZR, X19 |
(596) 0x4509fc ORR X2, XZR, X21 |
(596) 0x450a00 ORR X1, XZR, X20 |
(596) 0x450a04 ORR X0, XZR, X24 |
(596) 0x450a08 BL 529a40 |
(596) 0x450a0c B 4506b4 |
(595) 0x450a10 ORR X3, XZR, X22 |
(595) 0x450a14 ORR X2, XZR, X22 |
(595) 0x450a18 ORR X1, XZR, X20 |
(595) 0x450a1c ORR X0, XZR, X24 |
(595) 0x450a20 SUB X25, X22, #1 |
(595) 0x450a24 BL 529a40 |
(595) 0x450a28 B 450558 |
(596) 0x450a2c ADD X21, X21, #1 |
(596) 0x450a30 ORR X3, XZR, X19 |
(596) 0x450a34 ORR X2, XZR, X21 |
(596) 0x450a38 ORR X1, XZR, X20 |
(596) 0x450a3c ORR X0, XZR, X24 |
(596) 0x450a40 BL 529a40 |
(596) 0x450a44 B 450628 |
(596) 0x450a48 ADD X21, X21, #1 |
(596) 0x450a4c ORR X3, XZR, X19 |
(596) 0x450a50 ORR X2, XZR, X21 |
(596) 0x450a54 ORR X1, XZR, X20 |
(596) 0x450a58 ORR X0, XZR, X24 |
(596) 0x450a5c BL 529a40 |
(596) 0x450a60 B 45060c |
| Coverage (%) | Name | Source Location | Module |
|---|---|---|---|
| ►46.15+ | hypre_BoomerAMGInterpTruncatio[...] | par_interp.c:2913 | exec |
| ○ | GOMP_parallel | libgomp.so.1.0.0 | |
| ○ | hypre_BoomerAMGInterpTruncatio[...] | par_interp.c:2726 | exec |
| ○ | hypre_BoomerAMGBuildExtPIInter[...] | par_lr_interp.c:1811 | exec |
| ○ | hypre_BoomerAMGSetup | par_amg_setup.c:850 | exec |
| ○ | hypre_PCGSetup | pcg.c:234 | exec |
| ○ | main | amg.c:398 | exec |
| ○ | __libc_start_call_main | libc.so.6 | |
| ○ | __libc_start_main | libc.so.6 | |
| ○ | _start | amg.c:253 | exec |
| ►30.77+ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_BoomerAMGInterpTruncatio[...] | par_interp.c:2913 | exec |
| ○ | GOMP_parallel | libgomp.so.1.0.0 | |
| ○ | hypre_BoomerAMGInterpTruncatio[...] | par_interp.c:2726 | exec |
| ○ | hypre_BoomerAMGBuildExtPIInter[...] | par_lr_interp.c:1811 | exec |
| ○ | hypre_BoomerAMGSetup | par_amg_setup.c:850 | exec |
| ○ | hypre_PCGSetup | pcg.c:234 | exec |
| ○ | main | amg.c:398 | exec |
| ○ | __libc_start_call_main | libc.so.6 | |
| ○ | __libc_start_main | libc.so.6 | |
| ○ | _start | amg.c:253 | exec |
| ►7.69+ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_BoomerAMGInterpTruncatio[...] | par_interp.c:2913 | exec |
| ○ | GOMP_parallel | libgomp.so.1.0.0 | |
| ○ | hypre_BoomerAMGInterpTruncatio[...] | par_interp.c:2726 | exec |
| ○ | hypre_BoomerAMGBuildExtPIInter[...] | par_lr_interp.c:1811 | exec |
| ○ | hypre_BoomerAMGSetup | par_amg_setup.c:850 | exec |
| ○ | hypre_PCGSetup | pcg.c:234 | exec |
| ○ | main | amg.c:398 | exec |
| ○ | __libc_start_call_main | libc.so.6 | |
| ○ | __libc_start_main | libc.so.6 | |
| ○ | _start | amg.c:253 | exec |
| ►7.69+ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_BoomerAMGInterpTruncatio[...] | par_interp.c:2913 | exec |
| ○ | GOMP_parallel | libgomp.so.1.0.0 | |
| ○ | hypre_BoomerAMGInterpTruncatio[...] | par_interp.c:2726 | exec |
| ○ | hypre_BoomerAMGBuildExtPIInter[...] | par_lr_interp.c:1811 | exec |
| ○ | hypre_BoomerAMGSetup | par_amg_setup.c:850 | exec |
| ○ | hypre_PCGSetup | pcg.c:234 | exec |
| ○ | main | amg.c:398 | exec |
| ○ | __libc_start_call_main | libc.so.6 | |
| ○ | __libc_start_main | libc.so.6 | |
| ○ | _start | amg.c:253 | exec |
| ►7.69+ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_BoomerAMGInterpTruncatio[...] | par_interp.c:2913 | exec |
| ○ | GOMP_parallel | libgomp.so.1.0.0 | |
| ○ | hypre_BoomerAMGInterpTruncatio[...] | par_interp.c:2726 | exec |
| ○ | hypre_BoomerAMGBuildExtPIInter[...] | par_lr_interp.c:1811 | exec |
| ○ | hypre_BoomerAMGSetup | par_amg_setup.c:850 | exec |
| ○ | hypre_PCGSetup | pcg.c:234 | exec |
| ○ | main | amg.c:398 | exec |
| ○ | __libc_start_call_main | libc.so.6 | |
| ○ | __libc_start_main | libc.so.6 | |
| ○ | _start | amg.c:253 | exec |
| Coverage (%) | Name | Source Location | Module |
|---|---|---|---|
| ►27.27+ | hypre_BoomerAMGInterpTruncatio[...] | par_interp.c:2913 | exec |
| ○ | GOMP_parallel | libgomp.so.1.0.0 | |
| ○ | hypre_BoomerAMGInterpTruncatio[...] | par_interp.c:2726 | exec |
| ○ | hypre_BoomerAMGBuildExtPIInter[...] | par_lr_interp.c:1811 | exec |
| ○ | hypre_BoomerAMGSetup | par_amg_setup.c:850 | exec |
| ○ | hypre_PCGSetup | pcg.c:234 | exec |
| ○ | main | amg.c:398 | exec |
| ○ | __libc_start_call_main | libc.so.6 | |
| ○ | __libc_start_main | libc.so.6 | |
| ○ | _start | amg.c:253 | exec |
| ►27.27+ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_BoomerAMGInterpTruncatio[...] | par_interp.c:2913 | exec |
| ○ | omp_fulfill_event | libgomp.so.1.0.0 | |
| ○ | start_thread | libc.so.6 | |
| ○ | thread_start | libc.so.6 | |
| ►18.18+ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_BoomerAMGInterpTruncatio[...] | par_interp.c:2913 | exec |
| ○ | GOMP_parallel | libgomp.so.1.0.0 | |
| ○ | hypre_BoomerAMGInterpTruncatio[...] | par_interp.c:2726 | exec |
| ○ | hypre_BoomerAMGBuildExtPIInter[...] | par_lr_interp.c:1811 | exec |
| ○ | hypre_BoomerAMGSetup | par_amg_setup.c:850 | exec |
| ○ | hypre_PCGSetup | pcg.c:234 | exec |
| ○ | main | amg.c:398 | exec |
| ○ | __libc_start_call_main | libc.so.6 | |
| ○ | __libc_start_main | libc.so.6 | |
| ○ | _start | amg.c:253 | exec |
| ►9.09+ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_BoomerAMGInterpTruncatio[...] | par_interp.c:2913 | exec |
| ○ | omp_fulfill_event | libgomp.so.1.0.0 | |
| ○ | start_thread | libc.so.6 | |
| ○ | thread_start | libc.so.6 | |
| ►9.09+ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_BoomerAMGInterpTruncatio[...] | par_interp.c:2913 | exec |
| ○ | GOMP_parallel | libgomp.so.1.0.0 | |
| ○ | hypre_BoomerAMGInterpTruncatio[...] | par_interp.c:2726 | exec |
| ○ | hypre_BoomerAMGBuildExtPIInter[...] | par_lr_interp.c:1811 | exec |
| ○ | hypre_BoomerAMGSetup | par_amg_setup.c:850 | exec |
| ○ | hypre_PCGSetup | pcg.c:234 | exec |
| ○ | main | amg.c:398 | exec |
| ○ | __libc_start_call_main | libc.so.6 | |
| ○ | __libc_start_main | libc.so.6 | |
| ○ | _start | amg.c:253 | exec |
| ►9.09+ | hypre_BoomerAMGInterpTruncatio[...] | par_interp.c:2913 | exec |
| ○ | omp_fulfill_event | libgomp.so.1.0.0 | |
| ○ | start_thread | libc.so.6 | |
| ○ | thread_start | libc.so.6 |
| Coverage (%) | Name | Source Location | Module |
|---|---|---|---|
| ►42.86+ | hypre_BoomerAMGInterpTruncatio[...] | par_interp.c:2913 | exec |
| ○ | omp_fulfill_event | libgomp.so.1.0.0 | |
| ○ | start_thread | libc.so.6 | |
| ○ | thread_start | libc.so.6 | |
| ►28.57+ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_BoomerAMGInterpTruncatio[...] | par_interp.c:2913 | exec |
| ○ | omp_fulfill_event | libgomp.so.1.0.0 | |
| ○ | start_thread | libc.so.6 | |
| ○ | thread_start | libc.so.6 | |
| ►14.29+ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_BoomerAMGInterpTruncatio[...] | par_interp.c:2913 | exec |
| ○ | omp_fulfill_event | libgomp.so.1.0.0 | |
| ○ | start_thread | libc.so.6 | |
| ○ | thread_start | libc.so.6 | |
| ►14.29+ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_BoomerAMGInterpTruncatio[...] | par_interp.c:2913 | exec |
| ○ | omp_fulfill_event | libgomp.so.1.0.0 | |
| ○ | start_thread | libc.so.6 | |
| ○ | thread_start | libc.so.6 |
| Coverage (%) | Name | Source Location | Module |
|---|---|---|---|
| ►33.33+ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_BoomerAMGInterpTruncatio[...] | par_interp.c:2913 | exec |
| ○ | omp_fulfill_event | libgomp.so.1.0.0 | |
| ○ | start_thread | libc.so.6 | |
| ○ | thread_start | libc.so.6 | |
| ►33.33+ | hypre_BoomerAMGInterpTruncatio[...] | par_interp.c:2913 | exec |
| ○ | omp_fulfill_event | libgomp.so.1.0.0 | |
| ○ | start_thread | libc.so.6 | |
| ○ | thread_start | libc.so.6 | |
| ►11.11+ | hypre_BoomerAMGInterpTruncatio[...] | par_interp.c:2913 | exec |
| ○ | GOMP_parallel | libgomp.so.1.0.0 | |
| ○ | hypre_BoomerAMGInterpTruncatio[...] | par_interp.c:2726 | exec |
| ○ | hypre_BoomerAMGBuildExtPIInter[...] | par_lr_interp.c:1811 | exec |
| ○ | hypre_BoomerAMGSetup | par_amg_setup.c:850 | exec |
| ○ | hypre_PCGSetup | pcg.c:234 | exec |
| ○ | main | amg.c:398 | exec |
| ○ | __libc_start_call_main | libc.so.6 | |
| ○ | __libc_start_main | libc.so.6 | |
| ○ | _start | amg.c:253 | exec |
| ►11.11+ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_BoomerAMGInterpTruncatio[...] | par_interp.c:2913 | exec |
| ○ | omp_fulfill_event | libgomp.so.1.0.0 | |
| ○ | start_thread | libc.so.6 | |
| ○ | thread_start | libc.so.6 | |
| ►5.56+ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_BoomerAMGInterpTruncatio[...] | par_interp.c:2913 | exec |
| ○ | omp_fulfill_event | libgomp.so.1.0.0 | |
| ○ | start_thread | libc.so.6 | |
| ○ | thread_start | libc.so.6 | |
| ►5.56+ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_BoomerAMGInterpTruncatio[...] | par_interp.c:2913 | exec |
| ○ | GOMP_parallel | libgomp.so.1.0.0 | |
| ○ | hypre_BoomerAMGInterpTruncatio[...] | par_interp.c:2726 | exec |
| ○ | hypre_BoomerAMGBuildExtPIInter[...] | par_lr_interp.c:1811 | exec |
| ○ | hypre_BoomerAMGSetup | par_amg_setup.c:850 | exec |
| ○ | hypre_PCGSetup | pcg.c:234 | exec |
| ○ | main | amg.c:398 | exec |
| ○ | __libc_start_call_main | libc.so.6 | |
| ○ | __libc_start_main | libc.so.6 | |
| ○ | _start | amg.c:253 | exec |
| Coverage (%) | Name | Source Location | Module |
|---|---|---|---|
| ►38.46+ | hypre_BoomerAMGInterpTruncatio[...] | par_interp.c:2913 | exec |
| ○ | omp_fulfill_event | libgomp.so.1.0.0 | |
| ○ | start_thread | libc.so.6 | |
| ○ | thread_start | libc.so.6 | |
| ►30.77+ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_BoomerAMGInterpTruncatio[...] | par_interp.c:2913 | exec |
| ○ | omp_fulfill_event | libgomp.so.1.0.0 | |
| ○ | start_thread | libc.so.6 | |
| ○ | thread_start | libc.so.6 | |
| ►23.08+ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_BoomerAMGInterpTruncatio[...] | par_interp.c:2913 | exec |
| ○ | omp_fulfill_event | libgomp.so.1.0.0 | |
| ○ | start_thread | libc.so.6 | |
| ○ | thread_start | libc.so.6 | |
| ►7.69+ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_BoomerAMGInterpTruncatio[...] | par_interp.c:2913 | exec |
| ○ | omp_fulfill_event | libgomp.so.1.0.0 | |
| ○ | start_thread | libc.so.6 | |
| ○ | thread_start | libc.so.6 |
| Coverage (%) | Name | Source Location | Module |
|---|---|---|---|
| ►57.14+ | hypre_BoomerAMGInterpTruncatio[...] | par_interp.c:2913 | exec |
| ○ | omp_fulfill_event | libgomp.so.1.0.0 | |
| ○ | start_thread | libc.so.6 | |
| ○ | thread_start | libc.so.6 | |
| ►28.57+ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_BoomerAMGInterpTruncatio[...] | par_interp.c:2913 | exec |
| ○ | omp_fulfill_event | libgomp.so.1.0.0 | |
| ○ | start_thread | libc.so.6 | |
| ○ | thread_start | libc.so.6 | |
| ►4.76+ | hypre_BoomerAMGInterpTruncatio[...] | par_interp.c:2913 | exec |
| ○ | GOMP_parallel | libgomp.so.1.0.0 | |
| ○ | hypre_BoomerAMGInterpTruncatio[...] | par_interp.c:2726 | exec |
| ○ | hypre_BoomerAMGBuildExtPIInter[...] | par_lr_interp.c:1811 | exec |
| ○ | hypre_BoomerAMGSetup | par_amg_setup.c:850 | exec |
| ○ | hypre_PCGSetup | pcg.c:234 | exec |
| ○ | main | amg.c:398 | exec |
| ○ | __libc_start_call_main | libc.so.6 | |
| ○ | __libc_start_main | libc.so.6 | |
| ○ | _start | amg.c:253 | exec |
| ►4.76+ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_BoomerAMGInterpTruncatio[...] | par_interp.c:2913 | exec |
| ○ | omp_fulfill_event | libgomp.so.1.0.0 | |
| ○ | start_thread | libc.so.6 | |
| ○ | thread_start | libc.so.6 | |
| ►4.76+ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_BoomerAMGInterpTruncatio[...] | par_interp.c:2913 | exec |
| ○ | omp_fulfill_event | libgomp.so.1.0.0 | |
| ○ | start_thread | libc.so.6 | |
| ○ | thread_start | libc.so.6 |
| Coverage (%) | Name | Source Location | Module |
|---|---|---|---|
| ►53.33+ | hypre_BoomerAMGInterpTruncatio[...] | par_interp.c:2913 | exec |
| ○ | omp_fulfill_event | libgomp.so.1.0.0 | |
| ○ | start_thread | libc.so.6 | |
| ○ | thread_start | libc.so.6 | |
| ►40.00+ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_BoomerAMGInterpTruncatio[...] | par_interp.c:2913 | exec |
| ○ | omp_fulfill_event | libgomp.so.1.0.0 | |
| ○ | start_thread | libc.so.6 | |
| ○ | thread_start | libc.so.6 | |
| ►6.67+ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_BoomerAMGInterpTruncatio[...] | par_interp.c:2913 | exec |
| ○ | omp_fulfill_event | libgomp.so.1.0.0 | |
| ○ | start_thread | libc.so.6 | |
| ○ | thread_start | libc.so.6 |
| Coverage (%) | Name | Source Location | Module |
|---|---|---|---|
| ►57.14+ | hypre_BoomerAMGInterpTruncatio[...] | par_interp.c:2913 | exec |
| ○ | omp_fulfill_event | libgomp.so.1.0.0 | |
| ○ | start_thread | libc.so.6 | |
| ○ | thread_start | libc.so.6 | |
| ►21.43+ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_BoomerAMGInterpTruncatio[...] | par_interp.c:2913 | exec |
| ○ | omp_fulfill_event | libgomp.so.1.0.0 | |
| ○ | start_thread | libc.so.6 | |
| ○ | thread_start | libc.so.6 | |
| ►14.29+ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_BoomerAMGInterpTruncatio[...] | par_interp.c:2913 | exec |
| ○ | omp_fulfill_event | libgomp.so.1.0.0 | |
| ○ | start_thread | libc.so.6 | |
| ○ | thread_start | libc.so.6 | |
| ►7.14+ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_BoomerAMGInterpTruncatio[...] | par_interp.c:2913 | exec |
| ○ | omp_fulfill_event | libgomp.so.1.0.0 | |
| ○ | start_thread | libc.so.6 | |
| ○ | thread_start | libc.so.6 |
| Coverage (%) | Name | Source Location | Module |
|---|---|---|---|
| ►46.15+ | hypre_BoomerAMGInterpTruncatio[...] | par_interp.c:2913 | exec |
| ○ | omp_fulfill_event | libgomp.so.1.0.0 | |
| ○ | start_thread | libc.so.6 | |
| ○ | thread_start | libc.so.6 | |
| ►38.46+ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_BoomerAMGInterpTruncatio[...] | par_interp.c:2913 | exec |
| ○ | omp_fulfill_event | libgomp.so.1.0.0 | |
| ○ | start_thread | libc.so.6 | |
| ○ | thread_start | libc.so.6 | |
| ►7.69+ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_BoomerAMGInterpTruncatio[...] | par_interp.c:2913 | exec |
| ○ | omp_fulfill_event | libgomp.so.1.0.0 | |
| ○ | start_thread | libc.so.6 | |
| ○ | thread_start | libc.so.6 | |
| ►7.69+ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_BoomerAMGInterpTruncatio[...] | par_interp.c:2913 | exec |
| ○ | omp_fulfill_event | libgomp.so.1.0.0 | |
| ○ | start_thread | libc.so.6 | |
| ○ | thread_start | libc.so.6 |
| Coverage (%) | Name | Source Location | Module |
|---|---|---|---|
| ►50.00+ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_BoomerAMGInterpTruncatio[...] | par_interp.c:2913 | exec |
| ○ | omp_fulfill_event | libgomp.so.1.0.0 | |
| ○ | start_thread | libc.so.6 | |
| ○ | thread_start | libc.so.6 | |
| ►42.86+ | hypre_BoomerAMGInterpTruncatio[...] | par_interp.c:2913 | exec |
| ○ | omp_fulfill_event | libgomp.so.1.0.0 | |
| ○ | start_thread | libc.so.6 | |
| ○ | thread_start | libc.so.6 | |
| ►7.14+ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_BoomerAMGInterpTruncatio[...] | par_interp.c:2913 | exec |
| ○ | omp_fulfill_event | libgomp.so.1.0.0 | |
| ○ | start_thread | libc.so.6 | |
| ○ | thread_start | libc.so.6 |
| Coverage (%) | Name | Source Location | Module |
|---|---|---|---|
| ►42.86+ | hypre_BoomerAMGInterpTruncatio[...] | par_interp.c:2913 | exec |
| ○ | omp_fulfill_event | libgomp.so.1.0.0 | |
| ○ | start_thread | libc.so.6 | |
| ○ | thread_start | libc.so.6 | |
| ►35.71+ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_BoomerAMGInterpTruncatio[...] | par_interp.c:2913 | exec |
| ○ | omp_fulfill_event | libgomp.so.1.0.0 | |
| ○ | start_thread | libc.so.6 | |
| ○ | thread_start | libc.so.6 | |
| ►14.29+ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_BoomerAMGInterpTruncatio[...] | par_interp.c:2913 | exec |
| ○ | omp_fulfill_event | libgomp.so.1.0.0 | |
| ○ | start_thread | libc.so.6 | |
| ○ | thread_start | libc.so.6 | |
| ►7.14+ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_qsort2abs | par_interp.c:3180 | exec |
| ○ | hypre_BoomerAMGInterpTruncatio[...] | par_interp.c:2913 | exec |
| ○ | omp_fulfill_event | libgomp.so.1.0.0 | |
| ○ | start_thread | libc.so.6 | |
| ○ | thread_start | libc.so.6 |
| min | med | avg | max |
|---|---|---|---|
| Percentile Index | 10 | 20 | 30 | 40 | 50 | 60 | 70 | 80 | 90 | 100 |
|---|---|---|---|---|---|---|---|---|---|---|
| Value |
| min | med | avg | max |
|---|---|---|---|
| Percentile Index | 10 | 20 | 30 | 40 | 50 | 60 | 70 | 80 | 90 | 100 |
|---|---|---|---|---|---|---|---|---|---|---|
| Value |
| Path / |
The code analyzed by CQA in that panel excludes loops and represents 0.01% of application time for run 1x1
| Source file and lines | par_interp.c:3178-3192 |
| Module | exec |
| nb instructions | 18 |
| nb uops | 18 |
| loop length | 72 |
| used w registers | 0 |
| used x registers | 16 |
| used b registers | 0 |
| used h registers | 0 |
| used s registers | 1 |
| used d registers | 0 |
| used q registers | 0 |
| used v registers | 0 |
| used z registers | 0 |
| nb stack references | 12 |
| micro-operation queue | 2.25 cycles |
| front end | 2.25 cycles |
| P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | P12 | P13 | P14 | |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| uops | 0.50 | 0.50 | 1.50 | 1.50 | 1.50 | 1.50 | 0.00 | 0.00 | 0.00 | 0.00 | 4.00 | 4.00 | 4.00 | 3.00 | 3.00 |
| cycles | 0.50 | 0.50 | 1.50 | 1.50 | 1.50 | 1.50 | 0.00 | 0.00 | 0.00 | 0.00 | 4.00 | 4.00 | 4.00 | 3.00 | 3.00 |
| Cycles executing div or sqrt instructions | NA |
| Front-end | 2.25 |
| Dispatch | 4.00 |
| Overall L1 | 4.00 |
| all | 0% |
| load | 0% |
| store | 0% |
| mul | NA (no mul vectorizable/vectorized instructions) |
| add-sub | NA (no add-sub vectorizable/vectorized instructions) |
| fma | NA (no fma vectorizable/vectorized instructions) |
| div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
| other | 0% |
| all | 40% |
| load | 45% |
| store | 45% |
| mul | NA (no mul vectorizable/vectorized instructions) |
| add-sub | NA (no add-sub vectorizable/vectorized instructions) |
| fma | NA (no fma vectorizable/vectorized instructions) |
| div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
| other | 25% |
| Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | P12 | P13 | P14 | Latency | Recip. throughput | Vectorization |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| STP X29, X30, [SP, #-96]! | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 | scal (50.0%) |
| ADD X29, SP, #0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
| STP X19, X20, [SP, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 | scal (50.0%) |
| ORR X20, XZR, X1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| STP X21, X22, [SP, #32] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 | scal (50.0%) |
| ORR X22, XZR, X2 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| STP X23, X24, [SP, #48] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 | scal (50.0%) |
| ORR X24, XZR, X0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| STP X25, X26, [SP, #64] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 | scal (50.0%) |
| ORR X25, XZR, X3 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| STR X27, [SP, #80] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 | scal (25.0%) |
| LDR X27, [SP, #80] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 | scal (25.0%) |
| LDP X19, X20, [SP, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 | scal (50.0%) |
| LDP X21, X22, [SP, #32] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 | scal (50.0%) |
| LDP X23, X24, [SP, #48] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 | scal (50.0%) |
| LDP X25, X26, [SP, #64] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 | scal (50.0%) |
| LDP X29, X30, [SP], #96 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 | N/A |
| RET | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
The code analyzed by CQA in that panel excludes loops and represents 0.01% of application time for run 1x1
| Source file and lines | par_interp.c:3178-3192 |
| Module | exec |
| nb instructions | 18 |
| nb uops | 18 |
| loop length | 72 |
| used w registers | 0 |
| used x registers | 16 |
| used b registers | 0 |
| used h registers | 0 |
| used s registers | 1 |
| used d registers | 0 |
| used q registers | 0 |
| used v registers | 0 |
| used z registers | 0 |
| nb stack references | 12 |
| micro-operation queue | 2.25 cycles |
| front end | 2.25 cycles |
| P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | P12 | P13 | P14 | |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| uops | 0.50 | 0.50 | 1.50 | 1.50 | 1.50 | 1.50 | 0.00 | 0.00 | 0.00 | 0.00 | 4.00 | 4.00 | 4.00 | 3.00 | 3.00 |
| cycles | 0.50 | 0.50 | 1.50 | 1.50 | 1.50 | 1.50 | 0.00 | 0.00 | 0.00 | 0.00 | 4.00 | 4.00 | 4.00 | 3.00 | 3.00 |
| Cycles executing div or sqrt instructions | NA |
| Front-end | 2.25 |
| Dispatch | 4.00 |
| Overall L1 | 4.00 |
| all | 0% |
| load | 0% |
| store | 0% |
| mul | NA (no mul vectorizable/vectorized instructions) |
| add-sub | NA (no add-sub vectorizable/vectorized instructions) |
| fma | NA (no fma vectorizable/vectorized instructions) |
| div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
| other | 0% |
| all | 40% |
| load | 45% |
| store | 45% |
| mul | NA (no mul vectorizable/vectorized instructions) |
| add-sub | NA (no add-sub vectorizable/vectorized instructions) |
| fma | NA (no fma vectorizable/vectorized instructions) |
| div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
| other | 25% |
| Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | P12 | P13 | P14 | Latency | Recip. throughput | Vectorization |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| STP X29, X30, [SP, #928]! | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 | scal (50.0%) |
| ADD X29, SP, #0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | N/A |
| STP X19, X20, [SP, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 | scal (50.0%) |
| ORR X20, XZR, X1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| STP X21, X22, [SP, #32] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 | scal (50.0%) |
| ORR X22, XZR, X2 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| STP X23, X24, [SP, #48] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 | scal (50.0%) |
| ORR X24, XZR, X0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| STP X25, X26, [SP, #64] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 | scal (50.0%) |
| ORR X25, XZR, X3 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 | scal (25.0%) |
| STR X27, [SP, #80] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 | scal (25.0%) |
| LDR X27, [SP, #80] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 | scal (25.0%) |
| LDP X19, X20, [SP, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 | scal (50.0%) |
| LDP X21, X22, [SP, #32] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 | scal (50.0%) |
| LDP X23, X24, [SP, #48] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 | scal (50.0%) |
| LDP X25, X26, [SP, #64] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 | scal (50.0%) |
| LDP X29, X30, [SP], #96 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 | N/A |
| RET | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 | N/A |
| Run 1x1 | Number processes: 1; Number nodes: NA; Run Command: <executable> -n 400 400 400; MPI Command: mpirun -n <number_processes> --bind-to core --map-by package:PE=64 --rank-by fill --report-bindings; Dataset: ; Run Directory: /home/eoseret/qaas/qaas_runs/178-188-3659/intel/AMG/run/oneview_runs/multicore/gcc_1/oneview_run_1781892409; OMP_PROC_BIND: spread; OMP_DISPLAY_AFFINITY: TRUE; OMP_AFFINITY_FORMAT: 'OMP: pid %P tid %i thread %n bound to OS proc set {%A}'; OMP_DISPLAY_ENV: TRUE; OMP_NUM_THREADS: 1; OMP_PLACES: threads |
|---|---|
| Run 1x2 | Number processes: 1; Run Command: <executable> -n 400 400 400; MPI Command: mpirun -n <number_processes> --bind-to core --map-by package:PE=64 --rank-by fill --report-bindings; Dataset: ; Run Directory: /home/eoseret/qaas/qaas_runs/178-188-3659/intel/AMG/run/oneview_runs/multicore/gcc_1/oneview_run_1781892409; OMP_NUM_THREADS: 2; OMP_PROC_BIND: spread; OMP_DISPLAY_AFFINITY: TRUE; OMP_AFFINITY_FORMAT: 'OMP: pid %P tid %i thread %n bound to OS proc set {%A}'; OMP_DISPLAY_ENV: TRUE; OMP_PLACES: threads |
| Run 1x4 | Number processes: 1; Run Command: <executable> -n 400 400 400; MPI Command: mpirun -n <number_processes> --bind-to core --map-by package:PE=64 --rank-by fill --report-bindings; Dataset: ; Run Directory: /home/eoseret/qaas/qaas_runs/178-188-3659/intel/AMG/run/oneview_runs/multicore/gcc_1/oneview_run_1781892409; OMP_NUM_THREADS: 4; OMP_PROC_BIND: spread; OMP_DISPLAY_AFFINITY: TRUE; OMP_AFFINITY_FORMAT: 'OMP: pid %P tid %i thread %n bound to OS proc set {%A}'; OMP_DISPLAY_ENV: TRUE; OMP_PLACES: threads |
| Run 1x8 | Number processes: 1; Run Command: <executable> -n 400 400 400; MPI Command: mpirun -n <number_processes> --bind-to core --map-by package:PE=64 --rank-by fill --report-bindings; Dataset: ; Run Directory: /home/eoseret/qaas/qaas_runs/178-188-3659/intel/AMG/run/oneview_runs/multicore/gcc_1/oneview_run_1781892409; OMP_NUM_THREADS: 8; OMP_PROC_BIND: spread; OMP_DISPLAY_AFFINITY: TRUE; OMP_AFFINITY_FORMAT: 'OMP: pid %P tid %i thread %n bound to OS proc set {%A}'; OMP_DISPLAY_ENV: TRUE; OMP_PLACES: threads |
| Run 1x16 | Number processes: 1; Run Command: <executable> -n 400 400 400; MPI Command: mpirun -n <number_processes> --bind-to core --map-by package:PE=64 --rank-by fill --report-bindings; Dataset: ; Run Directory: /home/eoseret/qaas/qaas_runs/178-188-3659/intel/AMG/run/oneview_runs/multicore/gcc_1/oneview_run_1781892409; OMP_NUM_THREADS: 16; OMP_PROC_BIND: spread; OMP_DISPLAY_AFFINITY: TRUE; OMP_AFFINITY_FORMAT: 'OMP: pid %P tid %i thread %n bound to OS proc set {%A}'; OMP_DISPLAY_ENV: TRUE; OMP_PLACES: threads |
| Run 1x24 | Number processes: 1; Run Command: <executable> -n 400 400 400; MPI Command: mpirun -n <number_processes> --bind-to core --map-by package:PE=64 --rank-by fill --report-bindings; Dataset: ; Run Directory: /home/eoseret/qaas/qaas_runs/178-188-3659/intel/AMG/run/oneview_runs/multicore/gcc_1/oneview_run_1781892409; OMP_NUM_THREADS: 24; OMP_PROC_BIND: spread; OMP_DISPLAY_AFFINITY: TRUE; OMP_AFFINITY_FORMAT: 'OMP: pid %P tid %i thread %n bound to OS proc set {%A}'; OMP_DISPLAY_ENV: TRUE; OMP_PLACES: threads |
| Run 1x32 | Number processes: 1; Run Command: <executable> -n 400 400 400; MPI Command: mpirun -n <number_processes> --bind-to core --map-by package:PE=64 --rank-by fill --report-bindings; Dataset: ; Run Directory: /home/eoseret/qaas/qaas_runs/178-188-3659/intel/AMG/run/oneview_runs/multicore/gcc_1/oneview_run_1781892409; OMP_NUM_THREADS: 32; OMP_PROC_BIND: spread; OMP_DISPLAY_AFFINITY: TRUE; OMP_AFFINITY_FORMAT: 'OMP: pid %P tid %i thread %n bound to OS proc set {%A}'; OMP_DISPLAY_ENV: TRUE; OMP_PLACES: threads |
| Run 1x40 | Number processes: 1; Run Command: <executable> -n 400 400 400; MPI Command: mpirun -n <number_processes> --bind-to core --map-by package:PE=64 --rank-by fill --report-bindings; Dataset: ; Run Directory: /home/eoseret/qaas/qaas_runs/178-188-3659/intel/AMG/run/oneview_runs/multicore/gcc_1/oneview_run_1781892409; OMP_NUM_THREADS: 40; OMP_PROC_BIND: spread; OMP_DISPLAY_AFFINITY: TRUE; OMP_AFFINITY_FORMAT: 'OMP: pid %P tid %i thread %n bound to OS proc set {%A}'; OMP_DISPLAY_ENV: TRUE; OMP_PLACES: threads |
| Run 1x48 | Number processes: 1; Run Command: <executable> -n 400 400 400; MPI Command: mpirun -n <number_processes> --bind-to core --map-by package:PE=64 --rank-by fill --report-bindings; Dataset: ; Run Directory: /home/eoseret/qaas/qaas_runs/178-188-3659/intel/AMG/run/oneview_runs/multicore/gcc_1/oneview_run_1781892409; OMP_NUM_THREADS: 48; OMP_PROC_BIND: spread; OMP_DISPLAY_AFFINITY: TRUE; OMP_AFFINITY_FORMAT: 'OMP: pid %P tid %i thread %n bound to OS proc set {%A}'; OMP_DISPLAY_ENV: TRUE; OMP_PLACES: threads |
| Run 1x56 | Number processes: 1; Run Command: <executable> -n 400 400 400; MPI Command: mpirun -n <number_processes> --bind-to core --map-by package:PE=64 --rank-by fill --report-bindings; Dataset: ; Run Directory: /home/eoseret/qaas/qaas_runs/178-188-3659/intel/AMG/run/oneview_runs/multicore/gcc_1/oneview_run_1781892409; OMP_NUM_THREADS: 56; OMP_PROC_BIND: spread; OMP_DISPLAY_AFFINITY: TRUE; OMP_AFFINITY_FORMAT: 'OMP: pid %P tid %i thread %n bound to OS proc set {%A}'; OMP_DISPLAY_ENV: TRUE; OMP_PLACES: threads |
| Run 1x64 | Number processes: 1; Run Command: <executable> -n 400 400 400; MPI Command: mpirun -n <number_processes> --bind-to core --map-by package:PE=64 --rank-by fill --report-bindings; Dataset: ; Run Directory: /home/eoseret/qaas/qaas_runs/178-188-3659/intel/AMG/run/oneview_runs/multicore/gcc_1/oneview_run_1781892409; OMP_NUM_THREADS: 64; OMP_PROC_BIND: spread; OMP_DISPLAY_AFFINITY: TRUE; OMP_AFFINITY_FORMAT: 'OMP: pid %P tid %i thread %n bound to OS proc set {%A}'; OMP_DISPLAY_ENV: TRUE; OMP_PLACES: threads |
| (1x1) Efficiency | (1x1) Potential Speed-Up (%) | (1x2) Efficiency | (1x2) Potential Speed-Up (%) | (1x4) Efficiency | (1x4) Potential Speed-Up (%) | (1x8) Efficiency | (1x8) Potential Speed-Up (%) | (1x16) Efficiency | (1x16) Potential Speed-Up (%) | (1x24) Efficiency | (1x24) Potential Speed-Up (%) | (1x32) Efficiency | (1x32) Potential Speed-Up (%) | (1x40) Efficiency | (1x40) Potential Speed-Up (%) | (1x48) Efficiency | (1x48) Potential Speed-Up (%) | (1x56) Efficiency | (1x56) Potential Speed-Up (%) | (1x64) Efficiency | (1x64) Potential Speed-Up (%) |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 1 | 0 | 2.28 | 0 | 6.69 | 0 | 4.69 | 0 | 12.25 | 0 | 10.92 | 0 | 19.85 | 0 | 26.61 | 0 | 33.47 | 0 | 36.66 | 0 | 41.2 | 0 |
| Run | Number of threads | Efficiency (ideal is 1) | Speedup | Ideal Speedup | Time (s) | Coverage (%) |
|---|---|---|---|---|---|---|
| 1x1 | 1 | 1 | 1 | 1 | 0.065000005066395 | 0.01878073439002 |
| 1x2 | 2 | 2.28 | 2.28 | 2 | 0.029999997466803 | 0.015233279205859 |
| 1x4 | 2 | 6.69 | 6.69 | 4 | 0.02000000141561 | 0.009482198394835 |
| 1x8 | 7 | 4.69 | 4.69 | 8 | 0.019999999552965 | 0.022413088008761 |
| 1x16 | 11 | 12.25 | 12.25 | 16 | 0.010000000707805 | 0.010092378593981 |
| 1x24 | 17 | 10.92 | 10.92 | 24 | 0.0099999997764826 | 0.011917351745069 |
| 1x32 | 12 | 19.85 | 19.85 | 32 | 0.010000000707805 | 0.0070075336843729 |
| 1x40 | 13 | 26.61 | 26.61 | 40 | 0.0099999997764826 | 0.0055314064957201 |
| 1x48 | 12 | 33.47 | 33.47 | 48 | 0.010000000707805 | 0.0043834773823619 |
| 1x56 | 12 | 36.66 | 36.66 | 56 | 0.010000000707805 | 0.0040665143169463 |
| 1x64 | 13 | 41.2 | 41.2 | 64 | 0.010000000707805 | 0.0035514950286597 |
| Name | Coverage (%) | Time (s) |
|---|---|---|
| ▼hypre_qsort2abs– | 0.02 | 0.06 |
| ▼Loop 595 - par_interp.c:3180-3191 - exec– | 0.00 | 0.00 |
| ▼Loop 596 - par_interp.c:3180-3191 - exec– | 0.01 | 0.05 |
| ○Loop 597 - par_interp.c:3184-3187 - exec | 0.00 | 0.00 |
