Function: .omp_outlined. | Module: exec | Source: accelerate.cpp:40-53 [...] | Coverage: 7.28% |
---|
Function: .omp_outlined. | Module: exec | Source: accelerate.cpp:40-53 [...] | Coverage: 7.28% |
---|
/home/hbollore/qaas-runs/170-290-5445/intel/CloverLeafCXX/build/CloverLeafCXX/src/omp/context.h: 69 - 69 |
-------------------------------------------------------------------------------- |
69: T &operator()(size_t i, size_t j) const { return data[i + j * sizeX]; } |
/home/hbollore/qaas-runs/170-290-5445/intel/CloverLeafCXX/build/CloverLeafCXX/src/omp/accelerate.cpp: 40 - 53 |
-------------------------------------------------------------------------------- |
40: #pragma omp parallel for simd collapse(2) |
41: for (int j = (y_min + 1); j < (y_max + 1 + 2); j++) { |
42: for (int i = (x_min + 1); i < (x_max + 1 + 2); i++) { |
43: double stepbymass_s = halfdt / ((density0(i - 1, j - 1) * volume(i - 1, j - 1) + density0(i - 1, j + 0) * volume(i - 1, j + 0) + |
44: density0(i, j) * volume(i, j) + density0(i + 0, j - 1) * volume(i + 0, j - 1)) * |
45: 0.25); |
46: xvel1(i, j) = xvel0(i, j) - stepbymass_s * (xarea(i, j) * (pressure(i, j) - pressure(i - 1, j + 0)) + |
47: xarea(i + 0, j - 1) * (pressure(i + 0, j - 1) - pressure(i - 1, j - 1))); |
48: yvel1(i, j) = yvel0(i, j) - stepbymass_s * (yarea(i, j) * (pressure(i, j) - pressure(i + 0, j - 1)) + |
49: yarea(i - 1, j + 0) * (pressure(i - 1, j + 0) - pressure(i - 1, j - 1))); |
50: xvel1(i, j) = xvel1(i, j) - stepbymass_s * (xarea(i, j) * (viscosity(i, j) - viscosity(i - 1, j + 0)) + |
51: xarea(i + 0, j - 1) * (viscosity(i + 0, j - 1) - viscosity(i - 1, j - 1))); |
52: yvel1(i, j) = yvel1(i, j) - stepbymass_s * (yarea(i, j) * (viscosity(i, j) - viscosity(i + 0, j - 1)) + |
53: yarea(i - 1, j + 0) * (viscosity(i - 1, j + 0) - viscosity(i - 1, j - 1))); |
0x419aa0 STP D15, D14, [SP, #864]! |
0x419aa4 STP D13, D12, [SP, #16] |
0x419aa8 STP D11, D10, [SP, #32] |
0x419aac STP D9, D8, [SP, #48] |
0x419ab0 STP X29, X30, [SP, #64] |
0x419ab4 STP X28, X27, [SP, #80] |
0x419ab8 STP X26, X25, [SP, #96] |
0x419abc STP X24, X23, [SP, #112] |
0x419ac0 STP X22, X21, [SP, #128] |
0x419ac4 STP X20, X19, [SP, #144] |
0x419ac8 ADD X29, SP, #64 |
0x419acc ADDVL SP, SP, #60 |
0x419ad0 SUB SP, SP, #208 |
0x419ad4 LDR W10, [X2] |
0x419ad8 LDR W8, [X3] |
0x419adc ADD W11, W10, #1 |
0x419ae0 ADD W8, W8, #3 |
0x419ae4 SUBS W8, W8, W11 |
0x419ae8 B.LE 41a114 |
0x419aec LDR W12, [X4] |
0x419af0 LDR W9, [X5] |
0x419af4 ADD W2, W12, #1 |
0x419af8 ADD W9, W9, #3 |
0x419afc CMP W9, W2 |
0x419b00 B.LE 41a114 |
0x419b04 STP X12, X11, [SP, #136] |
0x419b08 LDP X13, X12, [X29, #136] |
0x419b0c LDP X15, X14, [X29, #120] |
0x419b10 ADD X4, SP, #200 |
0x419b14 ADD X5, SP, #192 |
0x419b18 LDP X17, X16, [X29, #104] |
0x419b1c LDR X18, [X29, #96] |
0x419b20 STP X10, X6, [SP, #152] |
0x419b24 ADD X6, SP, #184 |
0x419b28 LDP X11, X10, [X29, #152] |
0x419b2c LDR X3, [X7] |
0x419b30 LDR X25, [X7, #16] |
0x419b34 MOVZ W7, #1 |
0x419b38 LDR X1, [X18] |
0x419b3c LDR X27, [X18, #16] |
0x419b40 LDR X18, [X17] |
0x419b44 LDR X20, [X17, #16] |
0x419b48 LDR X17, [X16] |
0x419b4c LDR X22, [X16, #16] |
0x419b50 LDR X16, [X15] |
0x419b54 LDR X21, [X15, #16] |
0x419b58 LDR X15, [X14] |
0x419b5c LDR X19, [X14, #16] |
0x419b60 LDR X14, [X13] |
0x419b64 LDR X28, [X13, #16] |
0x419b68 LDR X13, [X12] |
0x419b6c LDR X12, [X12, #16] |
0x419b70 LDR X24, [X11, #16] |
0x419b74 LDR X23, [X10, #16] |
0x419b78 STR X2, [SP, #112] |
0x419b7c STR WZR, [SP, #180] |
0x419b80 STP X12, X13, [SP, #48] |
0x419b84 LDR X12, [X11] |
0x419b88 SUB W11, W9, W2 |
0x419b8c MOVN X9, #0 |
0x419b90 MOVZ W2, #34 |
0x419b94 UMADDL X26, W11, W8, X9 |
0x419b98 STP X1, X3, [SP, #80] |
0x419b9c LDR X9, [X10] |
0x419ba0 LDR W1, [X0] |
0x419ba4 MOVZ W8, #1 |
0x419ba8 ADRP X0, <462ba8> |
0x419bac ADD X0, X0, #2952 |
0x419bb0 ADD X3, SP, #180 |
0x419bb4 STP X17, X18, [SP, #120] |
0x419bb8 STR X16, [SP, #24] |
0x419bbc STP X14, X15, [SP, #64] |
0x419bc0 STR X11, [SP, #168] |
0x419bc4 STR X8, [SP, #184] |
0x419bc8 STR X8, [SP] |
0x419bcc STP X26, XZR, [SP, #192] |
0x419bd0 STR W1, [SP, #100] |
0x419bd4 STP X9, X12, [SP, #32] |
0x419bd8 BL 402ee0 |
0x419bdc LDP X8, X13, [SP, #192] |
0x419be0 CMP X8, X26 |
0x419be4 CSEL X8, X8, X26, LT |
0x419be8 CMP X13, X8 |
0x419bec B.GT 41a104 |
0x419bf0 ADD X4, X8, #1 |
0x419bf4 CNTD X10, ALL |
0x419bf8 ORR X9, XZR, X13 |
0x419bfc SUB X11, X4, X13 |
0x419c00 CMP X11, X10 |
0x419c04 B.CC 419ef0 |
0x419c08 UDIV X9, X11, X10 |
0x419c0c SUB X8, X29, #64 |
0x419c10 PTRUE P0.D, ALL |
0x419c14 MADD X12, X9, X10, XZR |
0x419c18 DUP Z1.D, X10 |
0x419c1c STR Z1, [X8, #511, MUL VL] |
0x419c20 LDR X8, [SP, #168] |
0x419c24 ADD X9, X13, X12 |
0x419c28 SUB X11, X11, X12 |
0x419c2c INDEX Z0.D, X13, #1 |
0x419c30 LDR X13, [SP, #144] |
0x419c34 DUP Z2.D, X8 |
0x419c38 SUB X8, X29, #64 |
0x419c3c DUP Z1.D, X13 |
0x419c40 STR Z1, [X8, #510, MUL VL] |
0x419c44 LDR X8, [SP, #112] |
0x419c48 DUP Z1.D, X8 |
0x419c4c SUB X8, X29, #64 |
0x419c50 STR Z1, [X8, #509, MUL VL] |
0x419c54 SUB X8, X29, #64 |
0x419c58 LDR X13, [SP, #136] |
0x419c5c DUP Z1.D, X13 |
0x419c60 STR Z1, [X8, #508, MUL VL] |
0x419c64 LDR X8, [SP, #120] |
0x419c68 LDR X13, [SP, #152] |
0x419c6c DUP Z17.D, X8 |
0x419c70 LDR X8, [SP, #24] |
0x419c74 DUP Z6.D, X13 |
0x419c78 LDR X13, [SP, #88] |
0x419c7c DUP Z18.D, X8 |
0x419c80 DUP Z7.D, X13 |
0x419c84 LDP X8, X13, [SP, #72] |
0x419c88 DUP Z19.D, X8 |
0x419c8c LDR X8, [SP, #128] |
0x419c90 DUP Z16.D, X13 |
0x419c94 LDR X13, [SP, #160] |
0x419c98 DUP Z20.D, X8 |
0x419c9c LDR X8, [SP, #56] |
0x419ca0 DUP Z21.D, X8 |
0x419ca4 LDR X8, [SP, #40] |
0x419ca8 DUP Z22.D, X8 |
0x419cac LDR X8, [SP, #64] |
0x419cb0 DUP Z23.D, X8 |
0x419cb4 LDR X8, [SP, #32] |
0x419cb8 DUP Z25.D, X8 |
0x419cbc LDR X8, [SP, #48] |
(188) 0x419cc0 SUB X14, X29, #64 |
(188) 0x419cc4 MOVPRFX Z28, Z0 |
(188) 0x419cc8 SDIV Z28.D, P0/M, Z28.D, Z2.D |
(188) 0x419ccc MOVPRFX Z27, Z0 |
(188) 0x419cd0 MLS Z27.D, P0/M, Z28.D, Z2.D |
(188) 0x419cd4 SUBS X12, X12, X10 |
(188) 0x419cd8 LDR Z1, [X14, #510, MUL VL] |
(188) 0x419cdc SUB X14, X29, #64 |
(188) 0x419ce0 ADD Z29.D, Z1.D, Z28.D |
(188) 0x419ce4 LDR Z1, [X14, #509, MUL VL] |
(188) 0x419ce8 SUB X14, X29, #64 |
(188) 0x419cec ADD Z28.D, Z6.D, Z28.D |
(188) 0x419cf0 SXTW Z28.D, P0/M, Z28.D |
(188) 0x419cf4 MOVPRFX Z31, Z7 |
(188) 0x419cf8 MUL Z31.D, P0/M, Z31.D, Z28.D |
(188) 0x419cfc MOVPRFX Z9, Z16 |
(188) 0x419d00 MUL Z9.D, P0/M, Z9.D, Z28.D |
(188) 0x419d04 SXTW Z29.D, P0/M, Z29.D |
(188) 0x419d08 MOVPRFX Z11, Z7 |
(188) 0x419d0c MUL Z11.D, P0/M, Z11.D, Z29.D |
(188) 0x419d10 MOVPRFX Z13, Z16 |
(188) 0x419d14 MUL Z13.D, P0/M, Z13.D, Z29.D |
(188) 0x419d18 ADD Z26.D, Z1.D, Z27.D |
(188) 0x419d1c LDR Z1, [X14, #508, MUL VL] |
(188) 0x419d20 LD1RD {Z30.D}, P0/Z, [X13] |
(188) 0x419d24 SUB X14, X29, #64 |
(188) 0x419d28 ADD Z27.D, Z1.D, Z27.D |
(188) 0x419d2c ADR Z8.D, [Z31, Z27.D,SXTW] |
(188) 0x419d30 ADR Z10.D, [Z9, Z27.D,SXTW] |
(188) 0x419d34 ADR Z12.D, [Z11, Z27.D,SXTW] |
(188) 0x419d38 ADR Z14.D, [Z13, Z27.D,SXTW] |
(188) 0x419d3c ADR Z11.D, [Z11, Z26.D,SXTW] |
(188) 0x419d40 ADR Z31.D, [Z31, Z26.D,SXTW] |
(188) 0x419d44 ADR Z9.D, [Z9, Z26.D,SXTW] |
(188) 0x419d48 LD1D {Z8.D}, P0/Z, [X25, Z8.D,LSL #3] |
(188) 0x419d4c LD1D {Z10.D}, P0/Z, [X27, Z10.D,LSL #3] |
(188) 0x419d50 LD1D {Z12.D}, P0/Z, [X25, Z12.D,LSL #3] |
(188) 0x419d54 LD1D {Z14.D}, P0/Z, [X27, Z14.D,LSL #3] |
(188) 0x419d58 LD1D {Z11.D}, P0/Z, [X25, Z11.D,LSL #3] |
(188) 0x419d5c FMUL Z12.D, Z12.D, Z14.D |
(188) 0x419d60 MOVPRFX Z14, Z26 |
(188) 0x419d64 SXTW Z14.D, P0/M, Z26.D |
(188) 0x419d68 MOVPRFX Z24, Z14 |
(188) 0x419d6c MLA Z24.D, P0/M, Z18.D, Z28.D |
(188) 0x419d70 FMAD Z8.D, P0/M, Z10.D, Z12.D |
(188) 0x419d74 ADR Z10.D, [Z13, Z26.D,SXTW] |
(188) 0x419d78 LD1D {Z10.D}, P0/Z, [X27, Z10.D,LSL #3] |
(188) 0x419d7c LD1D {Z31.D}, P0/Z, [X25, Z31.D,LSL #3] |
(188) 0x419d80 LD1D {Z9.D}, P0/Z, [X27, Z9.D,LSL #3] |
(188) 0x419d84 FMLA Z8.D, P0/M, Z11.D, Z10.D |
(188) 0x419d88 MOVPRFX Z11, Z19 |
(188) 0x419d8c MUL Z11.D, P0/M, Z11.D, Z29.D |
(188) 0x419d90 ADR Z12.D, [Z11, Z26.D,SXTW] |
(188) 0x419d94 ADR Z11.D, [Z11, Z27.D,SXTW] |
(188) 0x419d98 MOVPRFX Z10, Z14 |
(188) 0x419d9c MLA Z10.D, P0/M, Z17.D, Z29.D |
(188) 0x419da0 LD1D {Z10.D}, P0/Z, [X22, Z10.D,LSL #3] |
(188) 0x419da4 FMAD Z31.D, P0/M, Z9.D, Z8.D |
(188) 0x419da8 MOVPRFX Z8, Z14 |
(188) 0x419dac MLA Z8.D, P0/M, Z18.D, Z29.D |
(188) 0x419db0 LD1D {Z9.D}, P0/Z, [X21, Z8.D,LSL #3] |
(188) 0x419db4 LD1D {Z13.D}, P0/Z, [X19, Z12.D,LSL #3] |
(188) 0x419db8 LD1D {Z15.D}, P0/Z, [X19, Z11.D,LSL #3] |
(188) 0x419dbc LD1D {Z1.D}, P0/Z, [X21, Z24.D,LSL #3] |
(188) 0x419dc0 FSUB Z13.D, Z13.D, Z15.D |
(188) 0x419dc4 MOVPRFX Z15, Z19 |
(188) 0x419dc8 MUL Z15.D, P0/M, Z15.D, Z28.D |
(188) 0x419dcc ADR Z3.D, [Z15, Z26.D,SXTW] |
(188) 0x419dd0 ADR Z15.D, [Z15, Z27.D,SXTW] |
(188) 0x419dd4 MUL Z28.D, P0/M, Z28.D, Z25.D |
(188) 0x419dd8 LD1D {Z4.D}, P0/Z, [X19, Z3.D,LSL #3] |
(188) 0x419ddc LD1D {Z5.D}, P0/Z, [X19, Z15.D,LSL #3] |
(188) 0x419de0 FSUB Z4.D, Z4.D, Z5.D |
(188) 0x419de4 MOVPRFX Z5, Z30 |
(188) 0x419de8 FNEG Z5.D, P0/M, Z30.D |
(188) 0x419dec MOVPRFX Z30, Z22 |
(188) 0x419df0 MUL Z30.D, P0/M, Z30.D, Z29.D |
(188) 0x419df4 FMUL Z1.D, Z1.D, Z4.D |
(188) 0x419df8 FDUP Z4.D, #0.25 |
(188) 0x419dfc FMUL Z4.D, Z31.D, Z4.D |
(188) 0x419e00 ADR Z31.D, [Z30, Z26.D,SXTW] |
(188) 0x419e04 ADR Z30.D, [Z30, Z27.D,SXTW] |
(188) 0x419e08 FMLA Z1.D, P0/M, Z9.D, Z13.D |
(188) 0x419e0c FDIVR Z4.D, P0/M, Z4.D, Z5.D |
(188) 0x419e10 MOVPRFX Z5, Z14 |
(188) 0x419e14 MLA Z5.D, P0/M, Z20.D, Z29.D |
(188) 0x419e18 FMAD Z1.D, P0/M, Z4.D, Z10.D |
(188) 0x419e1c ST1D {Z1.D}, P0, [X20, Z5.D,LSL #3] |
(188) 0x419e20 MOVPRFX Z1, Z14 |
(188) 0x419e24 MLA Z1.D, P0/M, Z21.D, Z29.D |
(188) 0x419e28 LD1D {Z1.D}, P0/Z, [X8, Z1.D,LSL #3] |
(188) 0x419e2c LD1D {Z9.D}, P0/Z, [X24, Z31.D,LSL #3] |
(188) 0x419e30 LD1D {Z10.D}, P0/Z, [X19, Z12.D,LSL #3] |
(188) 0x419e34 LD1D {Z3.D}, P0/Z, [X19, Z3.D,LSL #3] |
(188) 0x419e38 FSUB Z3.D, Z10.D, Z3.D |
(188) 0x419e3c LD1D {Z10.D}, P0/Z, [X24, Z30.D,LSL #3] |
(188) 0x419e40 LD1D {Z11.D}, P0/Z, [X19, Z11.D,LSL #3] |
(188) 0x419e44 LD1D {Z12.D}, P0/Z, [X19, Z15.D,LSL #3] |
(188) 0x419e48 FSUB Z11.D, Z11.D, Z12.D |
(188) 0x419e4c FMUL Z10.D, Z10.D, Z11.D |
(188) 0x419e50 FMAD Z3.D, P0/M, Z9.D, Z10.D |
(188) 0x419e54 FMLA Z1.D, P0/M, Z4.D, Z3.D |
(188) 0x419e58 MOVPRFX Z3, Z14 |
(188) 0x419e5c MLA Z3.D, P0/M, Z23.D, Z29.D |
(188) 0x419e60 MUL Z29.D, P0/M, Z29.D, Z25.D |
(188) 0x419e64 ST1D {Z1.D}, P0, [X28, Z3.D,LSL #3] |
(188) 0x419e68 ADR Z9.D, [Z29, Z26.D,SXTW] |
(188) 0x419e6c ADR Z29.D, [Z29, Z27.D,SXTW] |
(188) 0x419e70 ADR Z26.D, [Z28, Z26.D,SXTW] |
(188) 0x419e74 ADR Z27.D, [Z28, Z27.D,SXTW] |
(188) 0x419e78 LD1D {Z1.D}, P0/Z, [X20, Z5.D,LSL #3] |
(188) 0x419e7c LD1D {Z8.D}, P0/Z, [X21, Z8.D,LSL #3] |
(188) 0x419e80 LD1D {Z10.D}, P0/Z, [X23, Z9.D,LSL #3] |
(188) 0x419e84 LD1D {Z11.D}, P0/Z, [X23, Z29.D,LSL #3] |
(188) 0x419e88 LD1D {Z24.D}, P0/Z, [X21, Z24.D,LSL #3] |
(188) 0x419e8c LD1D {Z12.D}, P0/Z, [X23, Z26.D,LSL #3] |
(188) 0x419e90 LD1D {Z28.D}, P0/Z, [X23, Z27.D,LSL #3] |
(188) 0x419e94 FSUB Z28.D, Z12.D, Z28.D |
(188) 0x419e98 FMUL Z24.D, Z24.D, Z28.D |
(188) 0x419e9c FSUB Z28.D, Z10.D, Z11.D |
(188) 0x419ea0 FMLA Z24.D, P0/M, Z8.D, Z28.D |
(188) 0x419ea4 FMLA Z1.D, P0/M, Z4.D, Z24.D |
(188) 0x419ea8 ST1D {Z1.D}, P0, [X20, Z5.D,LSL #3] |
(188) 0x419eac LD1D {Z1.D}, P0/Z, [X28, Z3.D,LSL #3] |
(188) 0x419eb0 LD1D {Z5.D}, P0/Z, [X24, Z31.D,LSL #3] |
(188) 0x419eb4 LD1D {Z24.D}, P0/Z, [X23, Z9.D,LSL #3] |
(188) 0x419eb8 LD1D {Z26.D}, P0/Z, [X23, Z26.D,LSL #3] |
(188) 0x419ebc LD1D {Z28.D}, P0/Z, [X24, Z30.D,LSL #3] |
(188) 0x419ec0 FSUB Z24.D, Z24.D, Z26.D |
(188) 0x419ec4 LD1D {Z26.D}, P0/Z, [X23, Z29.D,LSL #3] |
(188) 0x419ec8 LD1D {Z27.D}, P0/Z, [X23, Z27.D,LSL #3] |
(188) 0x419ecc FSUB Z26.D, Z26.D, Z27.D |
(188) 0x419ed0 FMUL Z26.D, Z28.D, Z26.D |
(188) 0x419ed4 FMAD Z5.D, P0/M, Z24.D, Z26.D |
(188) 0x419ed8 FMLA Z1.D, P0/M, Z4.D, Z5.D |
(188) 0x419edc LDR Z4, [X14, #511, MUL VL] |
(188) 0x419ee0 ST1D {Z1.D}, P0, [X28, Z3.D,LSL #3] |
(188) 0x419ee4 ADD Z0.D, Z0.D, Z4.D |
(188) 0x419ee8 B.NE 419cc0 |
0x419eec CBZ X11, 41a104 |
0x419ef0 LDR X8, [SP, #168] |
0x419ef4 LDP X30, X7, [SP, #80] |
0x419ef8 STR X22, [SP, #104] |
0x419efc FMOV D0, #-0.2500000 |
0x419f00 SUB W8, WZR, W8 |
0x419f04 LDP X26, X10, [SP, #24] |
0x419f08 LDP X22, X3, [SP, #64] |
0x419f0c LDP X6, X5, [SP, #48] |
0x419f10 STR W8, [SP, #112] |
0x419f14 LDR X8, [SP, #40] |
0x419f18 HINT #0 |
0x419f1c HINT #0 |
(187) 0x419f20 LDR X11, [SP, #168] |
(187) 0x419f24 LDR X12, [SP, #144] |
(187) 0x419f28 LDR W14, [SP, #112] |
(187) 0x419f2c SDIV X11, X9, X11 |
(187) 0x419f30 ADD W13, W12, W11 |
(187) 0x419f34 LDP X2, X12, [SP, #128] |
(187) 0x419f38 SBFM X13, X13, #0, #31 |
(187) 0x419f3c ADD W12, W12, W9 |
(187) 0x419f40 ADD X9, X9, #1 |
(187) 0x419f44 CMP X4, X9 |
(187) 0x419f48 MADD W14, W14, W11, W12 |
(187) 0x419f4c LDR X12, [SP, #152] |
(187) 0x419f50 ADD W12, W12, W11 |
(187) 0x419f54 SBFM X11, X14, #0, #31 |
(187) 0x419f58 ADD W14, W14, #1 |
(187) 0x419f5c SBFM X14, X14, #0, #31 |
(187) 0x419f60 SBFM X12, X12, #0, #31 |
(187) 0x419f64 MADD X2, X2, X13, X14 |
(187) 0x419f68 MADD X15, X7, X12, XZR |
(187) 0x419f6c ADD X16, X15, X11 |
(187) 0x419f70 ADD X15, X15, X14 |
(187) 0x419f74 LDR D1, [X25, X16,LSL #3] |
(187) 0x419f78 MADD X16, X30, X12, XZR |
(187) 0x419f7c ADD X17, X16, X11 |
(187) 0x419f80 LDR D2, [X27, X17,LSL #3] |
(187) 0x419f84 MADD X17, X7, X13, XZR |
(187) 0x419f88 ADD X18, X17, X11 |
(187) 0x419f8c ADD X17, X17, X14 |
(187) 0x419f90 LDR D3, [X25, X18,LSL #3] |
(187) 0x419f94 MADD X18, X30, X13, XZR |
(187) 0x419f98 ADD X0, X18, X11 |
(187) 0x419f9c LDR D4, [X27, X0,LSL #3] |
(187) 0x419fa0 LDR X0, [SP, #160] |
(187) 0x419fa4 FMUL D3, D3, D4 |
(187) 0x419fa8 FMADD D1, D1, D2, D3 |
(187) 0x419fac LDR D3, [X25, X17,LSL #3] |
(187) 0x419fb0 ADD X17, X18, X14 |
(187) 0x419fb4 LDR D2, [X0] |
(187) 0x419fb8 MADD X0, X3, X12, XZR |
(187) 0x419fbc MADD X18, X26, X12, X14 |
(187) 0x419fc0 MADD X12, X10, X12, XZR |
(187) 0x419fc4 LDR D4, [X27, X17,LSL #3] |
(187) 0x419fc8 ADD X1, X0, X14 |
(187) 0x419fcc ADD X0, X0, X11 |
(187) 0x419fd0 LDR D7, [X19, X1,LSL #3] |
(187) 0x419fd4 LDR D16, [X19, X0,LSL #3] |
(187) 0x419fd8 FMADD D1, D3, D4, D1 |
(187) 0x419fdc LDR D3, [X25, X15,LSL #3] |
(187) 0x419fe0 ADD X15, X16, X14 |
(187) 0x419fe4 LDR X16, [SP, #104] |
(187) 0x419fe8 LDR D4, [X27, X15,LSL #3] |
(187) 0x419fec LDR X15, [SP, #120] |
(187) 0x419ff0 FSUB D7, D7, D16 |
(187) 0x419ff4 MADD X15, X15, X13, X14 |
(187) 0x419ff8 FMADD D1, D3, D4, D1 |
(187) 0x419ffc LDR D3, [X16, X15,LSL #3] |
(187) 0x41a000 MADD X16, X3, X13, XZR |
(187) 0x41a004 MADD X15, X26, X13, X14 |
(187) 0x41a008 ADD X17, X16, X14 |
(187) 0x41a00c ADD X16, X16, X11 |
(187) 0x41a010 LDR D4, [X21, X15,LSL #3] |
(187) 0x41a014 LDR D5, [X19, X17,LSL #3] |
(187) 0x41a018 LDR D6, [X19, X16,LSL #3] |
(187) 0x41a01c FMUL D1, D1, D0 |
(187) 0x41a020 FDIV D1, D2, D1 |
(187) 0x41a024 FSUB D5, D5, D6 |
(187) 0x41a028 LDR D6, [X21, X18,LSL #3] |
(187) 0x41a02c FMUL D6, D6, D7 |
(187) 0x41a030 FMADD D4, D4, D5, D6 |
(187) 0x41a034 FMADD D2, D1, D4, D3 |
(187) 0x41a038 STR D2, [X20, X2,LSL #3] |
(187) 0x41a03c LDR D2, [X19, X17,LSL #3] |
(187) 0x41a040 LDR D3, [X19, X1,LSL #3] |
(187) 0x41a044 MADD X17, X5, X13, X14 |
(187) 0x41a048 MADD X1, X8, X13, XZR |
(187) 0x41a04c LDR D5, [X19, X16,LSL #3] |
(187) 0x41a050 LDR D7, [X19, X0,LSL #3] |
(187) 0x41a054 MADD X0, X22, X13, X14 |
(187) 0x41a058 MADD X13, X10, X13, XZR |
(187) 0x41a05c LDR D4, [X6, X17,LSL #3] |
(187) 0x41a060 ADD X17, X1, X11 |
(187) 0x41a064 ADD X16, X1, X14 |
(187) 0x41a068 LDR D6, [X24, X16,LSL #3] |
(187) 0x41a06c FSUB D2, D2, D3 |
(187) 0x41a070 LDR D3, [X24, X17,LSL #3] |
(187) 0x41a074 FSUB D5, D5, D7 |
(187) 0x41a078 FMUL D3, D3, D5 |
(187) 0x41a07c FMADD D2, D6, D2, D3 |
(187) 0x41a080 FMADD D2, D1, D2, D4 |
(187) 0x41a084 STR D2, [X28, X0,LSL #3] |
(187) 0x41a088 LDR D2, [X21, X18,LSL #3] |
(187) 0x41a08c ADD X18, X13, X14 |
(187) 0x41a090 ADD X13, X13, X11 |
(187) 0x41a094 ADD X14, X12, X14 |
(187) 0x41a098 ADD X11, X12, X11 |
(187) 0x41a09c LDR D3, [X21, X15,LSL #3] |
(187) 0x41a0a0 LDR D4, [X20, X2,LSL #3] |
(187) 0x41a0a4 LDR D7, [X23, X14,LSL #3] |
(187) 0x41a0a8 LDR D16, [X23, X11,LSL #3] |
(187) 0x41a0ac LDR D5, [X23, X18,LSL #3] |
(187) 0x41a0b0 LDR D6, [X23, X13,LSL #3] |
(187) 0x41a0b4 FSUB D7, D7, D16 |
(187) 0x41a0b8 FSUB D5, D5, D6 |
(187) 0x41a0bc FMUL D2, D2, D7 |
(187) 0x41a0c0 FMADD D2, D3, D5, D2 |
(187) 0x41a0c4 FMADD D2, D1, D2, D4 |
(187) 0x41a0c8 STR D2, [X20, X2,LSL #3] |
(187) 0x41a0cc LDR D2, [X23, X18,LSL #3] |
(187) 0x41a0d0 LDR D3, [X23, X14,LSL #3] |
(187) 0x41a0d4 LDR D5, [X23, X13,LSL #3] |
(187) 0x41a0d8 LDR D6, [X23, X11,LSL #3] |
(187) 0x41a0dc LDR D4, [X24, X17,LSL #3] |
(187) 0x41a0e0 LDR D7, [X24, X16,LSL #3] |
(187) 0x41a0e4 LDR D16, [X28, X0,LSL #3] |
(187) 0x41a0e8 FSUB D2, D2, D3 |
(187) 0x41a0ec FSUB D3, D5, D6 |
(187) 0x41a0f0 FMUL D3, D4, D3 |
(187) 0x41a0f4 FMADD D2, D7, D2, D3 |
(187) 0x41a0f8 FMADD D1, D1, D2, D16 |
(187) 0x41a0fc STR D1, [X28, X0,LSL #3] |
(187) 0x41a100 B.NE 419f20 |
0x41a104 LDR W1, [SP, #100] |
0x41a108 ADRP X0, |
0x41a10c ADD X0, X0, #2976 |
0x41a110 BL 402d80 |
0x41a114 ADDVL SP, SP, #4 |
0x41a118 ADD SP, SP, #208 |
0x41a11c LDP D9, D8, [SP, #48] |
0x41a120 LDP D11, D10, [SP, #32] |
0x41a124 LDP D13, D12, [SP, #16] |
0x41a128 LDP X20, X19, [SP, #144] |
0x41a12c LDP X22, X21, [SP, #128] |
0x41a130 LDP X24, X23, [SP, #112] |
0x41a134 LDP X26, X25, [SP, #96] |
0x41a138 LDP X28, X27, [SP, #80] |
0x41a13c LDP X29, X30, [SP, #64] |
0x41a140 LDP D15, D14, [SP], #160 |
0x41a144 RET |
0x41a148 HINT #0 |
0x41a14c HINT #0 |
0x42a4dc HINT #0 |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
○100.00 | __kmp_invoke_microtask | libomp.so |
Path / |
Source file and lines | accelerate.cpp:40-53 |
Module | exec |
nb instructions | 169 |
loop length | 676 |
nb stack references | 0 |
front end | 20.50 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | P12 | P13 | P14 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 4.00 | 4.00 | 13.50 | 13.25 | 23.00 | 13.25 | 2.50 | 2.50 | 2.50 | 2.50 | 31.83 | 31.50 | 31.67 | 11.50 | 11.50 |
cycles | 4.00 | 4.00 | 13.50 | 13.25 | 23.00 | 13.25 | 2.50 | 2.50 | 2.50 | 2.50 | 31.83 | 31.50 | 31.67 | 11.50 | 11.50 |
Cycles executing div or sqrt instructions | 1.00-0.50 |
Front-end | 20.50 |
Overall L1 | 31.83 |
all | 30% |
load | 100% |
store | 100% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | 0% |
div/sqrt | 0% |
other | 0% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | P12 | P13 | P14 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
STP D15, D14, [SP, #864]! | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
STP D13, D12, [SP, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
STP D11, D10, [SP, #32] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
STP D9, D8, [SP, #48] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
STP X29, X30, [SP, #64] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STP X28, X27, [SP, #80] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STP X26, X25, [SP, #96] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STP X24, X23, [SP, #112] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STP X22, X21, [SP, #128] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STP X20, X19, [SP, #144] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
ADD X29, SP, #64 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADDVL SP, SP, #60 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
SUB SP, SP, #208 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LDR W10, [X2] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR W8, [X3] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
ADD W11, W10, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD W8, W8, #3 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUBS W8, W8, W11 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
B.LE 41a114 <.omp_outlined.+0x674> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
LDR W12, [X4] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR W9, [X5] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
ADD W2, W12, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD W9, W9, #3 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP W9, W2 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
B.LE 41a114 <.omp_outlined.+0x674> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
STP X12, X11, [SP, #136] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
LDP X13, X12, [X29, #136] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDP X15, X14, [X29, #120] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
ADD X4, SP, #200 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X5, SP, #192 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LDP X17, X16, [X29, #104] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDR X18, [X29, #96] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
STP X10, X6, [SP, #152] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
ADD X6, SP, #184 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LDP X11, X10, [X29, #152] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDR X3, [X7] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR X25, [X7, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
MOVZ W7, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LDR X1, [X18] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR X27, [X18, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR X18, [X17] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR X20, [X17, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR X17, [X16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR X22, [X16, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR X16, [X15] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR X21, [X15, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR X15, [X14] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR X19, [X14, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR X14, [X13] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR X28, [X13, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR X13, [X12] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR X12, [X12, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR X24, [X11, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR X23, [X10, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
STR X2, [SP, #112] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STR WZR, [SP, #180] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STP X12, X13, [SP, #48] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
LDR X12, [X11] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
SUB W11, W9, W2 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOVN X9, #0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOVZ W2, #34 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
UMADDL X26, W11, W8, X9 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
STP X1, X3, [SP, #80] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
LDR X9, [X10] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR W1, [X0] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
MOVZ W8, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADRP X0, <462ba8> | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X0, X0, #2952 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X3, SP, #180 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STP X17, X18, [SP, #120] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STR X16, [SP, #24] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STP X14, X15, [SP, #64] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STR X11, [SP, #168] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STR X8, [SP, #184] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STR X8, [SP] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STP X26, XZR, [SP, #192] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STR W1, [SP, #100] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STP X9, X12, [SP, #32] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
BL 402ee0 <@plt_start@+0x190> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
LDP X8, X13, [SP, #192] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
CMP X8, X26 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
CSEL X8, X8, X26, LT | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP X13, X8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
B.GT 41a104 <.omp_outlined.+0x664> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADD X4, X8, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CNTD X10, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
ORR X9, XZR, X13 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB X11, X4, X13 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP X11, X10 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
B.CC 419ef0 <.omp_outlined.+0x450> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
UDIV X9, X11, X10 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5-20 | 1-0.50 |
SUB X8, X29, #64 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
PTRUE P0.D, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
MADD X12, X9, X10, XZR | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
DUP Z1.D, X10 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
STR Z1, [X8, #511, MUL VL] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
LDR X8, [SP, #168] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
ADD X9, X13, X12 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB X11, X11, X12 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
INDEX Z0.D, X13, #1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5 | 2 |
LDR X13, [SP, #144] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
DUP Z2.D, X8 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
SUB X8, X29, #64 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
DUP Z1.D, X13 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
STR Z1, [X8, #510, MUL VL] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
LDR X8, [SP, #112] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
DUP Z1.D, X8 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
SUB X8, X29, #64 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STR Z1, [X8, #509, MUL VL] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
SUB X8, X29, #64 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LDR X13, [SP, #136] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
DUP Z1.D, X13 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
STR Z1, [X8, #508, MUL VL] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
LDR X8, [SP, #120] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR X13, [SP, #152] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
DUP Z17.D, X8 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LDR X8, [SP, #24] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
DUP Z6.D, X13 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LDR X13, [SP, #88] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
DUP Z18.D, X8 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
DUP Z7.D, X13 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LDP X8, X13, [SP, #72] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
DUP Z19.D, X8 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LDR X8, [SP, #128] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
DUP Z16.D, X13 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LDR X13, [SP, #160] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
DUP Z20.D, X8 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LDR X8, [SP, #56] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
DUP Z21.D, X8 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LDR X8, [SP, #40] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
DUP Z22.D, X8 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LDR X8, [SP, #64] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
DUP Z23.D, X8 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LDR X8, [SP, #32] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
DUP Z25.D, X8 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LDR X8, [SP, #48] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
CBZ X11, 41a104 <.omp_outlined.+0x664> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
LDR X8, [SP, #168] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDP X30, X7, [SP, #80] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
STR X22, [SP, #104] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
FMOV D0, #-0.2500000 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 2 | 0.25 |
SUB W8, WZR, W8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LDP X26, X10, [SP, #24] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDP X22, X3, [SP, #64] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDP X6, X5, [SP, #48] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
STR W8, [SP, #112] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
LDR X8, [SP, #40] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
LDR W1, [SP, #100] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
ADRP X0, <462108> | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X0, X0, #2976 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
BL 402d80 <@plt_start@+0x30> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADDVL SP, SP, #4 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
ADD SP, SP, #208 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LDP D9, D8, [SP, #48] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
LDP D11, D10, [SP, #32] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
LDP D13, D12, [SP, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
LDP X20, X19, [SP, #144] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDP X22, X21, [SP, #128] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDP X24, X23, [SP, #112] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDP X26, X25, [SP, #96] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDP X28, X27, [SP, #80] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDP X29, X30, [SP, #64] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDP D15, D14, [SP], #160 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
RET | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
HINT #0 |
Source file and lines | accelerate.cpp:40-53 |
Module | exec |
nb instructions | 169 |
loop length | 676 |
nb stack references | 0 |
front end | 20.50 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | P12 | P13 | P14 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 4.00 | 4.00 | 13.50 | 13.25 | 23.00 | 13.25 | 2.50 | 2.50 | 2.50 | 2.50 | 31.83 | 31.50 | 31.67 | 11.50 | 11.50 |
cycles | 4.00 | 4.00 | 13.50 | 13.25 | 23.00 | 13.25 | 2.50 | 2.50 | 2.50 | 2.50 | 31.83 | 31.50 | 31.67 | 11.50 | 11.50 |
Cycles executing div or sqrt instructions | 1.00-0.50 |
Front-end | 20.50 |
Overall L1 | 31.83 |
all | 30% |
load | 100% |
store | 100% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | 0% |
div/sqrt | 0% |
other | 0% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | P12 | P13 | P14 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
STP D15, D14, [SP, #864]! | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
STP D13, D12, [SP, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
STP D11, D10, [SP, #32] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
STP D9, D8, [SP, #48] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
STP X29, X30, [SP, #64] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STP X28, X27, [SP, #80] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STP X26, X25, [SP, #96] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STP X24, X23, [SP, #112] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STP X22, X21, [SP, #128] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STP X20, X19, [SP, #144] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
ADD X29, SP, #64 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADDVL SP, SP, #60 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
SUB SP, SP, #208 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LDR W10, [X2] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR W8, [X3] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
ADD W11, W10, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD W8, W8, #3 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUBS W8, W8, W11 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
B.LE 41a114 <.omp_outlined.+0x674> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
LDR W12, [X4] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR W9, [X5] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
ADD W2, W12, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD W9, W9, #3 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP W9, W2 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
B.LE 41a114 <.omp_outlined.+0x674> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
STP X12, X11, [SP, #136] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
LDP X13, X12, [X29, #136] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDP X15, X14, [X29, #120] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
ADD X4, SP, #200 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X5, SP, #192 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LDP X17, X16, [X29, #104] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDR X18, [X29, #96] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
STP X10, X6, [SP, #152] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
ADD X6, SP, #184 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LDP X11, X10, [X29, #152] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDR X3, [X7] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR X25, [X7, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
MOVZ W7, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LDR X1, [X18] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR X27, [X18, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR X18, [X17] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR X20, [X17, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR X17, [X16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR X22, [X16, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR X16, [X15] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR X21, [X15, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR X15, [X14] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR X19, [X14, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR X14, [X13] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR X28, [X13, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR X13, [X12] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR X12, [X12, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR X24, [X11, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR X23, [X10, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
STR X2, [SP, #112] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STR WZR, [SP, #180] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STP X12, X13, [SP, #48] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
LDR X12, [X11] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
SUB W11, W9, W2 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOVN X9, #0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOVZ W2, #34 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
UMADDL X26, W11, W8, X9 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
STP X1, X3, [SP, #80] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
LDR X9, [X10] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR W1, [X0] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
MOVZ W8, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADRP X0, <462ba8> | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X0, X0, #2952 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X3, SP, #180 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STP X17, X18, [SP, #120] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STR X16, [SP, #24] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STP X14, X15, [SP, #64] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STR X11, [SP, #168] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STR X8, [SP, #184] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STR X8, [SP] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STP X26, XZR, [SP, #192] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STR W1, [SP, #100] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STP X9, X12, [SP, #32] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
BL 402ee0 <@plt_start@+0x190> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
LDP X8, X13, [SP, #192] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
CMP X8, X26 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
CSEL X8, X8, X26, #11 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP X13, X8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
B.GT 41a104 <.omp_outlined.+0x664> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADD X4, X8, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CNTD X10, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
ORR X9, XZR, X13 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB X11, X4, X13 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP X11, X10 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
B.CC 419ef0 <.omp_outlined.+0x450> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
UDIV X9, X11, X10 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5-20 | 1-0.50 |
SUB X8, X29, #64 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
PTRUE P0.D, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
MADD X12, X9, X10, XZR | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
DUP Z1.D, X10 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
STR Z1, [X8, #511, MUL VL] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
LDR X8, [SP, #168] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
ADD X9, X13, X12 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB X11, X11, X12 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
INDEX Z0.D, X13, #1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5 | 2 |
LDR X13, [SP, #144] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
DUP Z2.D, X8 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
SUB X8, X29, #64 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
DUP Z1.D, X13 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
STR Z1, [X8, #510, MUL VL] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
LDR X8, [SP, #112] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
DUP Z1.D, X8 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
SUB X8, X29, #64 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STR Z1, [X8, #509, MUL VL] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
SUB X8, X29, #64 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LDR X13, [SP, #136] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
DUP Z1.D, X13 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
STR Z1, [X8, #508, MUL VL] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
LDR X8, [SP, #120] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR X13, [SP, #152] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
DUP Z17.D, X8 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LDR X8, [SP, #24] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
DUP Z6.D, X13 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LDR X13, [SP, #88] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
DUP Z18.D, X8 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
DUP Z7.D, X13 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LDP X8, X13, [SP, #72] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
DUP Z19.D, X8 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LDR X8, [SP, #128] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
DUP Z16.D, X13 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LDR X13, [SP, #160] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
DUP Z20.D, X8 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LDR X8, [SP, #56] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
DUP Z21.D, X8 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LDR X8, [SP, #40] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
DUP Z22.D, X8 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LDR X8, [SP, #64] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
DUP Z23.D, X8 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LDR X8, [SP, #32] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
DUP Z25.D, X8 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LDR X8, [SP, #48] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
CBZ X11, 41a104 <.omp_outlined.+0x664> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
LDR X8, [SP, #168] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDP X30, X7, [SP, #80] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
STR X22, [SP, #104] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
FMOV D0, #-0.2500000 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 2 | 0.25 |
SUB W8, WZR, W8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LDP X26, X10, [SP, #24] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDP X22, X3, [SP, #64] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDP X6, X5, [SP, #48] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
STR W8, [SP, #112] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
LDR X8, [SP, #40] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
LDR W1, [SP, #100] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
ADRP X0, <462108> | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X0, X0, #2976 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
BL 402d80 <@plt_start@+0x30> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADDVL SP, SP, #4 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
ADD SP, SP, #208 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LDP D9, D8, [SP, #48] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
LDP D11, D10, [SP, #32] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
LDP D13, D12, [SP, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
LDP X20, X19, [SP, #144] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDP X22, X21, [SP, #128] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDP X24, X23, [SP, #112] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDP X26, X25, [SP, #96] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDP X28, X27, [SP, #80] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDP X29, X30, [SP, #64] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDP D15, D14, [SP], #160 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
RET | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
HINT #0 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼.omp_outlined.– | 7.28 | 9.72 |
○Loop 188 - accelerate.cpp:40-53 - exec | 7.28 | 9.68 |
○Loop 187 - accelerate.cpp:41-53 - exec | 0 | 0 |