Function: hypre_CSRMatrixMatvecOutOfPlace._omp_fn.6 | Module: exec | Source: csr_matvec.c:243-404 [...] | Coverage: 46.55% |
---|
Function: hypre_CSRMatrixMatvecOutOfPlace._omp_fn.6 | Module: exec | Source: csr_matvec.c:243-404 [...] | Coverage: 46.55% |
---|
/home/hbollore/qaas/qaas-runs/169-817-3176/intel/AMG/build/AMG/AMG/seq_mv/csr_matvec.c: 243 - 404 |
-------------------------------------------------------------------------------- |
243: #pragma omp parallel private(i,jj,tempx) |
244: #endif |
245: { |
246: HYPRE_Int iBegin = hypre_CSRMatrixGetLoadBalancedPartitionBegin(A); |
247: HYPRE_Int iEnd = hypre_CSRMatrixGetLoadBalancedPartitionEnd(A); |
248: hypre_assert(iBegin <= iEnd); |
249: hypre_assert(iBegin >= 0 && iBegin <= num_rows); |
250: hypre_assert(iEnd >= 0 && iEnd <= num_rows); |
251: |
252: if (0 == temp) |
253: { |
254: if (1 == alpha) // JSP: a common path |
255: { |
256: for (i = iBegin; i < iEnd; i++) |
257: { |
258: tempx = 0.0; |
259: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
260: { |
261: tempx += A_data[jj] * x_data[A_j[jj]]; |
262: } |
263: y_data[i] = tempx; |
264: } |
265: } // y = A*x |
266: else if (-1 == alpha) |
267: { |
268: for (i = iBegin; i < iEnd; i++) |
269: { |
270: tempx = 0.0; |
271: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
272: { |
273: tempx -= A_data[jj] * x_data[A_j[jj]]; |
274: } |
275: y_data[i] = tempx; |
276: } |
277: } // y = -A*x |
278: else |
279: { |
280: for (i = iBegin; i < iEnd; i++) |
281: { |
282: tempx = 0.0; |
283: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
284: { |
285: tempx += A_data[jj] * x_data[A_j[jj]]; |
286: } |
287: y_data[i] = alpha*tempx; |
288: } |
289: } // y = alpha*A*x |
290: } // temp == 0 |
291: else if (-1 == temp) // beta == -alpha |
292: { |
293: if (1 == alpha) // JSP: a common path |
294: { |
295: for (i = iBegin; i < iEnd; i++) |
296: { |
297: tempx = -b_data[i]; |
298: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
299: { |
300: tempx += A_data[jj] * x_data[A_j[jj]]; |
301: } |
302: y_data[i] = tempx; |
303: } |
304: } // y = A*x - y |
305: else if (-1 == alpha) // JSP: a common path |
306: { |
307: for (i = iBegin; i < iEnd; i++) |
308: { |
309: tempx = b_data[i]; |
310: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
311: { |
312: tempx -= A_data[jj] * x_data[A_j[jj]]; |
313: } |
314: y_data[i] = tempx; |
315: } |
316: } // y = -A*x + y |
317: else |
318: { |
319: for (i = iBegin; i < iEnd; i++) |
320: { |
321: tempx = -b_data[i]; |
322: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
323: { |
324: tempx += A_data[jj] * x_data[A_j[jj]]; |
325: } |
326: y_data[i] = alpha*tempx; |
327: } |
328: } // y = alpha*(A*x - y) |
329: } // temp == -1 |
330: else if (1 == temp) |
331: { |
332: if (1 == alpha) // JSP: a common path |
333: { |
334: for (i = iBegin; i < iEnd; i++) |
335: { |
336: tempx = b_data[i]; |
337: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
338: { |
339: tempx += A_data[jj] * x_data[A_j[jj]]; |
340: } |
341: y_data[i] = tempx; |
342: } |
343: } // y = A*x + y |
344: else if (-1 == alpha) |
345: { |
346: for (i = iBegin; i < iEnd; i++) |
347: { |
348: tempx = -b_data[i]; |
349: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
350: { |
351: tempx -= A_data[jj] * x_data[A_j[jj]]; |
352: } |
353: y_data[i] = tempx; |
354: } |
355: } // y = -A*x - y |
356: else |
357: { |
358: for (i = iBegin; i < iEnd; i++) |
359: { |
360: tempx = b_data[i]; |
361: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
362: { |
363: tempx += A_data[jj] * x_data[A_j[jj]]; |
364: } |
365: y_data[i] = alpha*tempx; |
[...] |
371: if (1 == alpha) // JSP: a common path |
372: { |
373: for (i = iBegin; i < iEnd; i++) |
374: { |
375: tempx = b_data[i]*temp; |
376: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
377: { |
378: tempx += A_data[jj] * x_data[A_j[jj]]; |
379: } |
380: y_data[i] = tempx; |
381: } |
382: } // y = A*x + temp*y |
383: else if (-1 == alpha) |
384: { |
385: for (i = iBegin; i < iEnd; i++) |
386: { |
387: tempx = -b_data[i]*temp; |
388: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
389: { |
390: tempx -= A_data[jj] * x_data[A_j[jj]]; |
391: } |
392: y_data[i] = tempx; |
393: } |
394: } // y = -A*x - temp*y |
395: else |
396: { |
397: for (i = iBegin; i < iEnd; i++) |
398: { |
399: tempx = b_data[i]*temp; |
400: for (jj = A_i[i]; jj < A_i[i+1]; jj++) |
401: { |
402: tempx += A_data[jj] * x_data[A_j[jj]]; |
403: } |
404: y_data[i] = alpha*tempx; |
0x4f8ecc STP X29, X30, [SP, #-112]! |
0x4f8ed0 ORR X1, XZR, X0 |
0x4f8ed4 ADD X29, SP, #0 |
0x4f8ed8 STP X21, X22, [SP, #32] |
0x4f8edc STP X25, X26, [SP, #64] |
0x4f8ee0 LDP X21, X25, [X0, #8] |
0x4f8ee4 STP D8, D9, [SP, #96] |
0x4f8ee8 LDR D9, [X0] |
0x4f8eec ORR X0, XZR, X21 |
0x4f8ef0 STP X19, X20, [SP, #16] |
0x4f8ef4 LDR D8, [X1, #72] |
0x4f8ef8 STP X23, X24, [SP, #48] |
0x4f8efc LDP X22, X24, [X1, #24] |
0x4f8f00 LDP X20, X26, [X1, #48] |
0x4f8f04 LDR X23, [X1, #64] |
0x4f8f08 STR X27, [SP, #80] |
0x4f8f0c LDR X27, [X1, #40] |
0x4f8f10 BL 4f7f80 |
0x4f8f14 ORR X19, XZR, X0 |
0x4f8f18 ORR X0, XZR, X21 |
0x4f8f1c BL 4f8024 |
0x4f8f20 ORR X21, XZR, X0 |
0x4f8f24 CMP X19, X0 |
0x4f8f28 B.GT 4f9270 |
0x4f8f2c CMP X19, #0 |
0x4f8f30 CCMP X27, X19, #1, #10 |
0x4f8f34 B.LT 4f9234 |
0x4f8f38 CMP X21, #0 |
0x4f8f3c CCMP X27, X21, #1, #10 |
0x4f8f40 B.LT 4f91f8 |
0x4f8f44 FCMP D8, #0 |
0x4f8f48 B.EQ 4f9018 |
0x4f8f4c FMOV D0, #-1.0000000 |
0x4f8f50 FMOV D1, #1.0000000 |
0x4f8f54 FCMP D8, D0 |
0x4f8f58 B.NE 4f9148 |
0x4f8f5c FCMP D9, D1 |
0x4f8f60 B.EQ 4f92ac |
0x4f8f64 FCMP D9, D0 |
0x4f8f68 B.EQ 4f9508 |
0x4f8f6c CMP X19, X21 |
0x4f8f70 B.GE 4f8ff8 |
0x4f8f74 ADD X8, X22, #8 |
0x4f8f78 CNTD X9, ALL |
0x4f8f7c PTRUE P4.B, ALL |
(3780) 0x4f8f80 LDR D27, [X26, X19,LSL #3] |
(3780) 0x4f8f84 LDR X10, [X22, X19,LSL #3] |
(3780) 0x4f8f88 LDR X0, [X8, X19,LSL #3] |
(3780) 0x4f8f8c FNEG D0, D27 |
(3780) 0x4f8f90 CMP X10, X0 |
(3780) 0x4f8f94 B.GE 4f8fe4 |
(3780) 0x4f8f98 UBFM X11, X10, #61, #60 |
(3780) 0x4f8f9c MOVZ X15, #0 |
(3780) 0x4f8fa0 DUP Z28.D, #0 |
(3780) 0x4f8fa4 ADD X12, X25, X11 |
(3780) 0x4f8fa8 ADD X13, X24, X11 |
(3780) 0x4f8fac SUB X14, X0, X10 |
(3780) 0x4f8fb0 WHILELO P5.D, XZR, X14 |
(3780) 0x4f8fb4 HINT #0 |
(3780) 0x4f8fb8 HINT #0 |
(3780) 0x4f8fbc HINT #0 |
(3781) 0x4f8fc0 LD1D {Z29.D}, P5/Z, [X13, X15,LSL #3] |
(3781) 0x4f8fc4 LD1D {Z30.D}, P5/Z, [X12, X15,LSL #3] |
(3781) 0x4f8fc8 LD1D {Z31.D}, P5/Z, [X20, Z29.D,LSL #3] |
(3781) 0x4f8fcc ADD X15, X15, X9 |
(3781) 0x4f8fd0 FMLA Z28.D, P5/M, Z31.D, Z30.D |
(3781) 0x4f8fd4 WHILELO P5.D, X15, X14 |
(3781) 0x4f8fd8 B.NE 4f8fc0 |
(3780) 0x4f8fdc FADDV D8, P4, Z28.D |
(3780) 0x4f8fe0 FSUB D0, D8, D27 |
(3780) 0x4f8fe4 FMUL D1, D9, D0 |
(3780) 0x4f8fe8 STR D1, [X23, X19,LSL #3] |
(3780) 0x4f8fec ADD X19, X19, #1 |
(3780) 0x4f8ff0 CMP X21, X19 |
(3780) 0x4f8ff4 B.NE 4f8f80 |
(3754) 0x4f8ff8 LDP X19, X20, [SP, #16] |
(3754) 0x4f8ffc LDP X21, X22, [SP, #32] |
(3754) 0x4f9000 LDP X23, X24, [SP, #48] |
(3754) 0x4f9004 LDP X25, X26, [SP, #64] |
(3754) 0x4f9008 LDR X27, [SP, #80] |
(3754) 0x4f900c LDP D8, D9, [SP, #96] |
(3754) 0x4f9010 LDP X29, X30, [SP], #112 |
(3754) 0x4f9014 RET |
(3754) 0x4f9018 FMOV D22, #1.0000000 |
(3754) 0x4f901c FCMP D9, D22 |
(3754) 0x4f9020 B.NE 4f90ac |
(3754) 0x4f9024 CMP X19, X21 |
(3754) 0x4f9028 B.GE 4f8ff8 |
(3754) 0x4f902c ADD X11, X22, #8 |
(3754) 0x4f9030 LDR X26, [X22, X19,LSL #3] |
(3754) 0x4f9034 CNTD X12, ALL |
(3754) 0x4f9038 PTRUE P6.B, ALL |
(3754) 0x4f903c LDR X13, [X11, X19,LSL #3] |
(3754) 0x4f9040 CMP X13, X26 |
(3754) 0x4f9044 B.LE 4f90a4 |
(3762) 0x4f9048 UBFM X3, X26, #61, #60 |
(3762) 0x4f904c MOVZ X1, #0 |
(3762) 0x4f9050 DUP Z9.D, #0 |
(3762) 0x4f9054 ADD X14, X25, X3 |
(3762) 0x4f9058 ADD X15, X24, X3 |
(3762) 0x4f905c SUB X16, X13, X26 |
(3762) 0x4f9060 WHILELO P7.D, XZR, X16 |
(3761) 0x4f9064 LD1D {Z4.D}, P7/Z, [X15, X1,LSL #3] |
(3761) 0x4f9068 LD1D {Z5.D}, P7/Z, [X14, X1,LSL #3] |
(3761) 0x4f906c LD1D {Z2.D}, P7/Z, [X20, Z4.D,LSL #3] |
(3761) 0x4f9070 ADD X1, X1, X12 |
(3761) 0x4f9074 FMLA Z9.D, P7/M, Z2.D, Z5.D |
(3761) 0x4f9078 WHILELO P7.D, X1, X16 |
(3761) 0x4f907c B.NE 4f9064 |
(3762) 0x4f9080 FADDV D6, P6, Z9.D |
(3762) 0x4f9084 STR D6, [X23, X19,LSL #3] |
(3762) 0x4f9088 ADD X19, X19, #1 |
(3762) 0x4f908c CMP X21, X19 |
(3762) 0x4f9090 B.EQ 4f8ff8 |
(3762) 0x4f9094 LDR X26, [X22, X19,LSL #3] |
(3762) 0x4f9098 LDR X13, [X11, X19,LSL #3] |
(3762) 0x4f909c CMP X13, X26 |
(3762) 0x4f90a0 B.GT 4f9048 |
(3763) 0x4f90a4 MOVI D6, #0 |
(3763) 0x4f90a8 B 4f9084 |
(3754) 0x4f90ac FMOV D23, #-1.0000000 |
(3754) 0x4f90b0 FCMP D9, D23 |
(3754) 0x4f90b4 B.NE 4f93f8 |
(3754) 0x4f90b8 CMP X19, X21 |
(3754) 0x4f90bc B.GE 4f8ff8 |
(3754) 0x4f90c0 ADD X6, X22, #8 |
(3754) 0x4f90c4 LDR X5, [X22, X19,LSL #3] |
(3754) 0x4f90c8 CNTD X4, ALL |
(3754) 0x4f90cc PTRUE P4.B, ALL |
(3754) 0x4f90d0 LDR X7, [X6, X19,LSL #3] |
(3754) 0x4f90d4 CMP X5, X7 |
(3754) 0x4f90d8 B.GE 4f9140 |
(3754) 0x4f90dc HINT #0 |
(3759) 0x4f90e0 UBFM X8, X5, #61, #60 |
(3759) 0x4f90e4 MOVZ X2, #0 |
(3759) 0x4f90e8 DUP Z30.D, #0 |
(3759) 0x4f90ec ADD X9, X25, X8 |
(3759) 0x4f90f0 ADD X10, X24, X8 |
(3759) 0x4f90f4 SUB X0, X7, X5 |
(3759) 0x4f90f8 WHILELO P5.D, XZR, X0 |
(3759) 0x4f90fc HINT #0 |
(3758) 0x4f9100 LD1D {Z31.D}, P5/Z, [X10, X2,LSL #3] |
(3758) 0x4f9104 LD1D {Z8.D}, P5/Z, [X9, X2,LSL #3] |
(3758) 0x4f9108 LD1D {Z0.D}, P5/Z, [X20, Z31.D,LSL #3] |
(3758) 0x4f910c ADD X2, X2, X4 |
(3758) 0x4f9110 FMLS Z30.D, P5/M, Z0.D, Z8.D |
(3758) 0x4f9114 WHILELO P5.D, X2, X0 |
(3758) 0x4f9118 B.NE 4f9100 |
(3759) 0x4f911c FADDV D1, P4, Z30.D |
(3759) 0x4f9120 STR D1, [X23, X19,LSL #3] |
(3759) 0x4f9124 ADD X19, X19, #1 |
(3759) 0x4f9128 CMP X21, X19 |
(3759) 0x4f912c B.EQ 4f8ff8 |
(3759) 0x4f9130 LDR X5, [X22, X19,LSL #3] |
(3759) 0x4f9134 LDR X7, [X6, X19,LSL #3] |
(3759) 0x4f9138 CMP X5, X7 |
(3759) 0x4f913c B.LT 4f90e0 |
(3760) 0x4f9140 MOVI D1, #0 |
(3760) 0x4f9144 B 4f9120 |
0x4f9148 FCMP D8, D1 |
0x4f914c B.NE 4f9354 |
0x4f9150 FCMP D9, D1 |
0x4f9154 B.EQ 4f948c |
0x4f9158 FCMP D9, D0 |
0x4f915c B.NE 4f9618 |
0x4f9160 CMP X19, X21 |
0x4f9164 B.GE 4f8ff8 |
0x4f9168 ADD X10, X22, #8 |
0x4f916c CNTD X11, ALL |
0x4f9170 PTRUE P1.B, ALL |
0x4f9174 HINT #0 |
0x4f9178 HINT #0 |
0x4f917c HINT #0 |
(3774) 0x4f9180 LDR D6, [X26, X19,LSL #3] |
(3774) 0x4f9184 LDR X12, [X22, X19,LSL #3] |
(3774) 0x4f9188 LDR X13, [X10, X19,LSL #3] |
(3774) 0x4f918c FNEG D20, D6 |
(3774) 0x4f9190 CMP X12, X13 |
(3774) 0x4f9194 B.GE 4f91e4 |
(3774) 0x4f9198 UBFM X14, X12, #61, #60 |
(3774) 0x4f919c MOVZ X18, #0 |
(3774) 0x4f91a0 DUP Z7.D, #0 |
(3774) 0x4f91a4 ADD X15, X25, X14 |
(3774) 0x4f91a8 ADD X16, X24, X14 |
(3774) 0x4f91ac SUB X17, X13, X12 |
(3774) 0x4f91b0 WHILELO P0.D, XZR, X17 |
(3774) 0x4f91b4 HINT #0 |
(3774) 0x4f91b8 HINT #0 |
(3774) 0x4f91bc HINT #0 |
(3775) 0x4f91c0 LD1D {Z16.D}, P0/Z, [X16, X18,LSL #3] |
(3775) 0x4f91c4 LD1D {Z17.D}, P0/Z, [X15, X18,LSL #3] |
(3775) 0x4f91c8 LD1D {Z18.D}, P0/Z, [X20, Z16.D,LSL #3] |
(3775) 0x4f91cc ADD X18, X18, X11 |
(3775) 0x4f91d0 FMLS Z7.D, P0/M, Z18.D, Z17.D |
(3775) 0x4f91d4 WHILELO P0.D, X18, X17 |
(3775) 0x4f91d8 B.NE 4f91c0 |
(3774) 0x4f91dc FADDV D19, P1, Z7.D |
(3774) 0x4f91e0 FSUB D20, D19, D6 |
(3774) 0x4f91e4 STR D20, [X23, X19,LSL #3] |
(3774) 0x4f91e8 ADD X19, X19, #1 |
(3774) 0x4f91ec CMP X21, X19 |
(3774) 0x4f91f0 B.NE 4f9180 |
0x4f91f4 B 4f8ff8 |
0x4f91f8 ADRP X11, |
0x4f91fc ADRP X12, |
0x4f9200 LDR X13, [X11, #3912] |
0x4f9204 ADRP X14, |
0x4f9208 ADD X2, X12, #3616 |
0x4f920c ADD X1, X14, #424 |
0x4f9210 LDR X0, [X13] |
0x4f9214 BL 503b24 |
0x4f9218 ADRP X15, |
0x4f921c MOVZ X3, #0 |
0x4f9220 ADD X0, X15, #3648 |
0x4f9224 MOVZ X2, #1 |
0x4f9228 MOVZ X1, #250 |
0x4f922c BL 506500 |
0x4f9230 B 4f8f44 |
0x4f9234 ADRP X6, |
0x4f9238 ADRP X7, |
0x4f923c LDR X8, [X6, #3912] |
0x4f9240 ADRP X9, |
0x4f9244 ADD X2, X7, #3736 |
0x4f9248 ADD X1, X9, #424 |
0x4f924c LDR X0, [X8] |
0x4f9250 BL 503b24 |
0x4f9254 ADRP X10, |
0x4f9258 MOVZ X3, #0 |
0x4f925c ADD X0, X10, #3648 |
0x4f9260 MOVZ X2, #1 |
0x4f9264 MOVZ X1, #249 |
0x4f9268 BL 506500 |
0x4f926c B 4f8f38 |
0x4f9270 ADRP X0, |
0x4f9274 ADRP X4, |
0x4f9278 LDR X3, [X0, #3912] |
0x4f927c ADRP X2, |
0x4f9280 ADD X1, X4, #424 |
0x4f9284 ADD X2, X2, #3176 |
0x4f9288 LDR X0, [X3] |
0x4f928c BL 503b24 |
0x4f9290 ADRP X5, |
0x4f9294 MOVZ X3, #0 |
0x4f9298 ADD X0, X5, #3648 |
0x4f929c MOVZ X2, #1 |
0x4f92a0 MOVZ X1, #248 |
0x4f92a4 BL 506500 |
0x4f92a8 B 4f8f2c |
0x4f92ac CMP X19, X21 |
0x4f92b0 B.GE 4f8ff8 |
0x4f92b4 ADD X8, X22, #8 |
0x4f92b8 CNTD X9, ALL |
0x4f92bc PTRUE P1.B, ALL |
(3776) 0x4f92c0 LDR D7, [X26, X19,LSL #3] |
(3776) 0x4f92c4 LDR X10, [X22, X19,LSL #3] |
(3776) 0x4f92c8 LDR X0, [X8, X19,LSL #3] |
(3776) 0x4f92cc FNEG D21, D7 |
(3776) 0x4f92d0 CMP X10, X0 |
(3776) 0x4f92d4 B.GE 4f9324 |
(3776) 0x4f92d8 UBFM X2, X10, #61, #60 |
(3776) 0x4f92dc MOVZ X1, #0 |
(3776) 0x4f92e0 DUP Z16.D, #0 |
(3776) 0x4f92e4 ADD X3, X25, X2 |
(3776) 0x4f92e8 ADD X11, X24, X2 |
(3776) 0x4f92ec SUB X12, X0, X10 |
(3776) 0x4f92f0 WHILELO P0.D, XZR, X12 |
(3776) 0x4f92f4 HINT #0 |
(3776) 0x4f92f8 HINT #0 |
(3776) 0x4f92fc HINT #0 |
(3777) 0x4f9300 LD1D {Z17.D}, P0/Z, [X11, X1,LSL #3] |
(3777) 0x4f9304 LD1D {Z18.D}, P0/Z, [X3, X1,LSL #3] |
(3777) 0x4f9308 LD1D {Z19.D}, P0/Z, [X20, Z17.D,LSL #3] |
(3777) 0x4f930c ADD X1, X1, X9 |
(3777) 0x4f9310 FMLA Z16.D, P0/M, Z19.D, Z18.D |
(3777) 0x4f9314 WHILELO P0.D, X1, X12 |
(3777) 0x4f9318 B.NE 4f9300 |
(3776) 0x4f931c FADDV D20, P1, Z16.D |
(3776) 0x4f9320 FSUB D21, D20, D7 |
(3776) 0x4f9324 STR D21, [X23, X19,LSL #3] |
(3776) 0x4f9328 ADD X19, X19, #1 |
(3776) 0x4f932c CMP X21, X19 |
(3776) 0x4f9330 B.NE 4f92c0 |
0x4f9334 LDP X19, X20, [SP, #16] |
0x4f9338 LDP X21, X22, [SP, #32] |
0x4f933c LDP X23, X24, [SP, #48] |
0x4f9340 LDP X25, X26, [SP, #64] |
0x4f9344 LDR X27, [SP, #80] |
0x4f9348 LDP D8, D9, [SP, #96] |
0x4f934c LDP X29, X30, [SP], #112 |
0x4f9350 RET |
0x4f9354 FCMP D9, D1 |
0x4f9358 B.EQ 4f9588 |
0x4f935c FCMP D9, D0 |
0x4f9360 B.NE 4f969c |
0x4f9364 CMP X19, X21 |
0x4f9368 B.GE 4f8ff8 |
0x4f936c ADD X6, X22, #8 |
0x4f9370 CNTD X4, ALL |
0x4f9374 PTRUE P2.B, ALL |
0x4f9378 HINT #0 |
0x4f937c HINT #0 |
(3768) 0x4f9380 LDR D18, [X26, X19,LSL #3] |
(3768) 0x4f9384 LDR X5, [X22, X19,LSL #3] |
(3768) 0x4f9388 LDR X7, [X6, X19,LSL #3] |
(3768) 0x4f938c FMUL D19, D8, D18 |
(3768) 0x4f9390 FNEG D25, D19 |
(3768) 0x4f9394 CMP X5, X7 |
(3768) 0x4f9398 B.GE 4f93e4 |
(3768) 0x4f939c UBFM X8, X5, #61, #60 |
(3768) 0x4f93a0 MOVZ X12, #0 |
(3768) 0x4f93a4 DUP Z20.D, #0 |
(3768) 0x4f93a8 ADD X9, X25, X8 |
(3768) 0x4f93ac ADD X10, X24, X8 |
(3768) 0x4f93b0 SUB X11, X7, X5 |
(3768) 0x4f93b4 WHILELO P3.D, XZR, X11 |
(3768) 0x4f93b8 HINT #0 |
(3768) 0x4f93bc HINT #0 |
(3769) 0x4f93c0 LD1D {Z21.D}, P3/Z, [X10, X12,LSL #3] |
(3769) 0x4f93c4 LD1D {Z22.D}, P3/Z, [X9, X12,LSL #3] |
(3769) 0x4f93c8 LD1D {Z23.D}, P3/Z, [X20, Z21.D,LSL #3] |
(3769) 0x4f93cc ADD X12, X12, X4 |
(3769) 0x4f93d0 FMLS Z20.D, P3/M, Z23.D, Z22.D |
(3769) 0x4f93d4 WHILELO P3.D, X12, X11 |
(3769) 0x4f93d8 B.NE 4f93c0 |
(3768) 0x4f93dc FADDV D24, P2, Z20.D |
(3768) 0x4f93e0 FSUB D25, D24, D19 |
(3768) 0x4f93e4 STR D25, [X23, X19,LSL #3] |
(3768) 0x4f93e8 ADD X19, X19, #1 |
(3768) 0x4f93ec CMP X21, X19 |
(3768) 0x4f93f0 B.NE 4f9380 |
0x4f93f4 B 4f8ff8 |
(3754) 0x4f93f8 CMP X19, X21 |
(3754) 0x4f93fc B.GE 4f8ff8 |
(3754) 0x4f9400 ADD X26, X22, #8 |
(3754) 0x4f9404 LDR X14, [X22, X19,LSL #3] |
(3754) 0x4f9408 CNTD X13, ALL |
(3754) 0x4f940c PTRUE P2.B, ALL |
(3754) 0x4f9410 LDR X15, [X26, X19,LSL #3] |
(3754) 0x4f9414 CMP X14, X15 |
(3754) 0x4f9418 B.GE 4f9484 |
(3754) 0x4f941c HINT #0 |
(3756) 0x4f9420 UBFM X16, X14, #61, #60 |
(3756) 0x4f9424 MOVZ X27, #0 |
(3756) 0x4f9428 DUP Z24.D, #0 |
(3756) 0x4f942c ADD X17, X25, X16 |
(3756) 0x4f9430 ADD X18, X24, X16 |
(3756) 0x4f9434 SUB X30, X15, X14 |
(3756) 0x4f9438 WHILELO P3.D, XZR, X30 |
(3756) 0x4f943c HINT #0 |
(3755) 0x4f9440 LD1D {Z25.D}, P3/Z, [X18, X27,LSL #3] |
(3755) 0x4f9444 LD1D {Z26.D}, P3/Z, [X17, X27,LSL #3] |
(3755) 0x4f9448 LD1D {Z27.D}, P3/Z, [X20, Z25.D,LSL #3] |
(3755) 0x4f944c ADD X27, X27, X13 |
(3755) 0x4f9450 FMLA Z24.D, P3/M, Z27.D, Z26.D |
(3755) 0x4f9454 WHILELO P3.D, X27, X30 |
(3755) 0x4f9458 B.NE 4f9440 |
(3756) 0x4f945c FADDV D28, P2, Z24.D |
(3756) 0x4f9460 FMUL D29, D9, D28 |
(3756) 0x4f9464 STR D29, [X23, X19,LSL #3] |
(3756) 0x4f9468 ADD X19, X19, #1 |
(3756) 0x4f946c CMP X21, X19 |
(3756) 0x4f9470 B.EQ 4f8ff8 |
(3756) 0x4f9474 LDR X14, [X22, X19,LSL #3] |
(3756) 0x4f9478 LDR X15, [X26, X19,LSL #3] |
(3756) 0x4f947c CMP X14, X15 |
(3756) 0x4f9480 B.LT 4f9420 |
(3757) 0x4f9484 MOVI D29, #0 |
(3757) 0x4f9488 B 4f9464 |
0x4f948c CMP X19, X21 |
0x4f9490 B.GE 4f8ff8 |
0x4f9494 ADD X30, X22, #8 |
0x4f9498 CNTD X27, ALL |
0x4f949c PTRUE P2.B, ALL |
(3770) 0x4f94a0 LDR X6, [X22, X19,LSL #3] |
(3770) 0x4f94a4 LDR X4, [X30, X19,LSL #3] |
(3770) 0x4f94a8 LDR D26, [X26, X19,LSL #3] |
(3770) 0x4f94ac CMP X6, X4 |
(3770) 0x4f94b0 B.GE 4f94f4 |
(3770) 0x4f94b4 UBFM X5, X6, #61, #60 |
(3770) 0x4f94b8 MOVZ X1, #0 |
(3770) 0x4f94bc DUP Z21.D, #0 |
(3770) 0x4f94c0 ADD X7, X25, X5 |
(3770) 0x4f94c4 ADD X2, X24, X5 |
(3770) 0x4f94c8 SUB X3, X4, X6 |
(3770) 0x4f94cc WHILELO P3.D, XZR, X3 |
(3771) 0x4f94d0 LD1D {Z22.D}, P3/Z, [X2, X1,LSL #3] |
(3771) 0x4f94d4 LD1D {Z23.D}, P3/Z, [X7, X1,LSL #3] |
(3771) 0x4f94d8 LD1D {Z24.D}, P3/Z, [X20, Z22.D,LSL #3] |
(3771) 0x4f94dc ADD X1, X1, X27 |
(3771) 0x4f94e0 FMLA Z21.D, P3/M, Z24.D, Z23.D |
(3771) 0x4f94e4 WHILELO P3.D, X1, X3 |
(3771) 0x4f94e8 B.NE 4f94d0 |
(3770) 0x4f94ec FADDV D25, P2, Z21.D |
(3770) 0x4f94f0 FADD D26, D26, D25 |
(3770) 0x4f94f4 STR D26, [X23, X19,LSL #3] |
(3770) 0x4f94f8 ADD X19, X19, #1 |
(3770) 0x4f94fc CMP X21, X19 |
(3770) 0x4f9500 B.NE 4f94a0 |
0x4f9504 B 4f8ff8 |
0x4f9508 CMP X19, X21 |
0x4f950c B.GE 4f8ff8 |
0x4f9510 ADD X16, X22, #8 |
0x4f9514 CNTD X17, ALL |
0x4f9518 PTRUE P6.B, ALL |
0x4f951c HINT #0 |
(3778) 0x4f9520 LDR X18, [X22, X19,LSL #3] |
(3778) 0x4f9524 LDR X30, [X16, X19,LSL #3] |
(3778) 0x4f9528 LDR D3, [X26, X19,LSL #3] |
(3778) 0x4f952c CMP X18, X30 |
(3778) 0x4f9530 B.GE 4f9574 |
(3778) 0x4f9534 UBFM X27, X18, #61, #60 |
(3778) 0x4f9538 MOVZ X7, #0 |
(3778) 0x4f953c DUP Z9.D, #0 |
(3778) 0x4f9540 ADD X6, X25, X27 |
(3778) 0x4f9544 ADD X4, X24, X27 |
(3778) 0x4f9548 SUB X5, X30, X18 |
(3778) 0x4f954c WHILELO P7.D, XZR, X5 |
(3779) 0x4f9550 LD1D {Z4.D}, P7/Z, [X4, X7,LSL #3] |
(3779) 0x4f9554 LD1D {Z5.D}, P7/Z, [X6, X7,LSL #3] |
(3779) 0x4f9558 LD1D {Z2.D}, P7/Z, [X20, Z4.D,LSL #3] |
(3779) 0x4f955c ADD X7, X7, X17 |
(3779) 0x4f9560 FMLS Z9.D, P7/M, Z2.D, Z5.D |
(3779) 0x4f9564 WHILELO P7.D, X7, X5 |
(3779) 0x4f9568 B.NE 4f9550 |
(3778) 0x4f956c FADDV D6, P6, Z9.D |
(3778) 0x4f9570 FADD D3, D3, D6 |
(3778) 0x4f9574 STR D3, [X23, X19,LSL #3] |
(3778) 0x4f9578 ADD X19, X19, #1 |
(3778) 0x4f957c CMP X21, X19 |
(3778) 0x4f9580 B.NE 4f9520 |
0x4f9584 B 4f8ff8 |
0x4f9588 CMP X19, X21 |
0x4f958c B.GE 4f8ff8 |
0x4f9590 ADD X13, X22, #8 |
0x4f9594 CNTD X14, ALL |
0x4f9598 PTRUE P4.B, ALL |
0x4f959c HINT #0 |
(3764) 0x4f95a0 LDR D26, [X26, X19,LSL #3] |
(3764) 0x4f95a4 LDR X15, [X22, X19,LSL #3] |
(3764) 0x4f95a8 LDR X16, [X13, X19,LSL #3] |
(3764) 0x4f95ac FMUL D9, D8, D26 |
(3764) 0x4f95b0 CMP X15, X16 |
(3764) 0x4f95b4 B.GE 4f9604 |
(3764) 0x4f95b8 UBFM X17, X15, #61, #60 |
(3764) 0x4f95bc MOVZ X1, #0 |
(3764) 0x4f95c0 DUP Z27.D, #0 |
(3764) 0x4f95c4 ADD X18, X25, X17 |
(3764) 0x4f95c8 ADD X30, X24, X17 |
(3764) 0x4f95cc SUB X27, X16, X15 |
(3764) 0x4f95d0 WHILELO P5.D, XZR, X27 |
(3764) 0x4f95d4 HINT #0 |
(3764) 0x4f95d8 HINT #0 |
(3764) 0x4f95dc HINT #0 |
(3765) 0x4f95e0 LD1D {Z28.D}, P5/Z, [X30, X1,LSL #3] |
(3765) 0x4f95e4 LD1D {Z29.D}, P5/Z, [X18, X1,LSL #3] |
(3765) 0x4f95e8 LD1D {Z30.D}, P5/Z, [X20, Z28.D,LSL #3] |
(3765) 0x4f95ec ADD X1, X1, X14 |
(3765) 0x4f95f0 FMLA Z27.D, P5/M, Z30.D, Z29.D |
(3765) 0x4f95f4 WHILELO P5.D, X1, X27 |
(3765) 0x4f95f8 B.NE 4f95e0 |
(3764) 0x4f95fc FADDV D31, P4, Z27.D |
(3764) 0x4f9600 FADD D9, D9, D31 |
(3764) 0x4f9604 STR D9, [X23, X19,LSL #3] |
(3764) 0x4f9608 ADD X19, X19, #1 |
(3764) 0x4f960c CMP X21, X19 |
(3764) 0x4f9610 B.NE 4f95a0 |
0x4f9614 B 4f8ff8 |
0x4f9618 CMP X19, X21 |
0x4f961c B.GE 4f8ff8 |
0x4f9620 ADD X6, X22, #8 |
0x4f9624 CNTD X4, ALL |
0x4f9628 PTRUE P6.B, ALL |
(3772) 0x4f962c LDR X5, [X22, X19,LSL #3] |
(3772) 0x4f9630 LDR X7, [X6, X19,LSL #3] |
(3772) 0x4f9634 LDR D3, [X26, X19,LSL #3] |
(3772) 0x4f9638 CMP X5, X7 |
(3772) 0x4f963c B.GE 4f9684 |
(3772) 0x4f9640 UBFM X2, X5, #61, #60 |
(3772) 0x4f9644 MOVZ X0, #0 |
(3772) 0x4f9648 DUP Z8.D, #0 |
(3772) 0x4f964c ADD X3, X25, X2 |
(3772) 0x4f9650 ADD X8, X24, X2 |
(3772) 0x4f9654 SUB X9, X7, X5 |
(3772) 0x4f9658 WHILELO P7.D, XZR, X9 |
(3772) 0x4f965c HINT #0 |
(3773) 0x4f9660 LD1D {Z0.D}, P7/Z, [X8, X0,LSL #3] |
(3773) 0x4f9664 LD1D {Z1.D}, P7/Z, [X3, X0,LSL #3] |
(3773) 0x4f9668 LD1D {Z4.D}, P7/Z, [X20, Z0.D,LSL #3] |
(3773) 0x4f966c ADD X0, X0, X4 |
(3773) 0x4f9670 FMLA Z8.D, P7/M, Z4.D, Z1.D |
(3773) 0x4f9674 WHILELO P7.D, X0, X9 |
(3773) 0x4f9678 B.NE 4f9660 |
(3772) 0x4f967c FADDV D5, P6, Z8.D |
(3772) 0x4f9680 FADD D3, D3, D5 |
(3772) 0x4f9684 FMUL D2, D9, D3 |
(3772) 0x4f9688 STR D2, [X23, X19,LSL #3] |
(3772) 0x4f968c ADD X19, X19, #1 |
(3772) 0x4f9690 CMP X21, X19 |
(3772) 0x4f9694 B.NE 4f962c |
0x4f9698 B 4f8ff8 |
0x4f969c CMP X19, X21 |
0x4f96a0 B.GE 4f8ff8 |
0x4f96a4 ADD X16, X22, #8 |
0x4f96a8 CNTD X17, ALL |
0x4f96ac PTRUE P1.B, ALL |
(3766) 0x4f96b0 LDR D3, [X26, X19,LSL #3] |
(3766) 0x4f96b4 LDR X18, [X22, X19,LSL #3] |
(3766) 0x4f96b8 LDR X30, [X16, X19,LSL #3] |
(3766) 0x4f96bc FMUL D16, D8, D3 |
(3766) 0x4f96c0 CMP X18, X30 |
(3766) 0x4f96c4 B.GE 4f9708 |
(3766) 0x4f96c8 UBFM X1, X18, #61, #60 |
(3766) 0x4f96cc MOVZ X0, #0 |
(3766) 0x4f96d0 DUP Z4.D, #0 |
(3766) 0x4f96d4 ADD X27, X25, X1 |
(3766) 0x4f96d8 ADD X2, X24, X1 |
(3766) 0x4f96dc SUB X3, X30, X18 |
(3766) 0x4f96e0 WHILELO P0.D, XZR, X3 |
(3767) 0x4f96e4 LD1D {Z5.D}, P0/Z, [X2, X0,LSL #3] |
(3767) 0x4f96e8 LD1D {Z2.D}, P0/Z, [X27, X0,LSL #3] |
(3767) 0x4f96ec LD1D {Z6.D}, P0/Z, [X20, Z5.D,LSL #3] |
(3767) 0x4f96f0 ADD X0, X0, X17 |
(3767) 0x4f96f4 FMLA Z4.D, P0/M, Z6.D, Z2.D |
(3767) 0x4f96f8 WHILELO P0.D, X0, X3 |
(3767) 0x4f96fc B.NE 4f96e4 |
(3766) 0x4f9700 FADDV D7, P1, Z4.D |
(3766) 0x4f9704 FADD D16, D16, D7 |
(3766) 0x4f9708 FMUL D17, D9, D16 |
(3766) 0x4f970c STR D17, [X23, X19,LSL #3] |
(3766) 0x4f9710 ADD X19, X19, #1 |
(3766) 0x4f9714 CMP X21, X19 |
(3766) 0x4f9718 B.NE 4f96b0 |
0x4f971c B 4f8ff8 |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►62.79+ | GOMP_parallel | libomp.so | |
○ | hypre_CSRMatrixMatvecOutOfPlac[...] | csr_matvec.c:243 | exec |
○ | hypre_ParCSRMatrixMatvecOutOfP[...] | par_csr_matvec.c:216 | exec |
○ | hypre_ParCSRRelax | ams.c:78 | exec |
○ | hypre_BoomerAMGCycle | par_cycle.c:394 | exec |
○ | hypre_BoomerAMGSolve | par_amg_solve.c:235 | exec |
○ | hypre_PCGSolve | pcg.c:545 | exec |
○ | main | amg.c:419 | exec |
○ | __libc_start_main | libc-2.31.so | |
○ | _start | amg.c:599 | exec |
►15.05+ | GOMP_parallel | libomp.so | |
○ | hypre_CSRMatrixMatvecOutOfPlac[...] | csr_matvec.c:243 | exec |
○ | hypre_ParCSRMatrixMatvecOutOfP[...] | par_csr_matvec.c:216 | exec |
○ | hypre_BoomerAMGCycle | par_cycle.c:428 | exec |
○ | hypre_BoomerAMGSolve | par_amg_solve.c:235 | exec |
○ | hypre_PCGSolve | pcg.c:545 | exec |
○ | main | amg.c:419 | exec |
○ | __libc_start_main | libc-2.31.so | |
○ | _start | amg.c:599 | exec |
►14.63+ | GOMP_parallel | libomp.so | |
○ | hypre_CSRMatrixMatvecOutOfPlac[...] | csr_matvec.c:243 | exec |
○ | hypre_ParCSRMatrixMatvecOutOfP[...] | par_csr_matvec.c:216 | exec |
○ | hypre_PCGSolve | pcg.c:496 | exec |
○ | main | amg.c:419 | exec |
○ | __libc_start_main | libc-2.31.so | |
○ | _start | amg.c:599 | exec |
►3.14+ | GOMP_parallel | libomp.so | |
○ | hypre_CSRMatrixMatvecOutOfPlac[...] | csr_matvec.c:243 | exec |
○ | hypre_ParCSRMatrixMatvecOutOfP[...] | par_csr_matvec.c:216 | exec |
○ | hypre_BoomerAMGCycle | par_cycle.c:461 | exec |
○ | hypre_BoomerAMGSolve | par_amg_solve.c:235 | exec |
○ | hypre_PCGSolve | pcg.c:545 | exec |
○ | main | amg.c:419 | exec |
○ | __libc_start_main | libc-2.31.so | |
○ | _start | amg.c:599 | exec |
►2.79+ | GOMP_parallel | libomp.so | |
○ | hypre_CSRMatrixMatvecOutOfPlac[...] | csr_matvec.c:243 | exec |
○ | hypre_ParCSRMatrixMatvecOutOfP[...] | par_csr_matvec.c:216 | exec |
○ | hypre_ParCSRRelax | ams.c:78 | exec |
○ | hypre_BoomerAMGCycle | par_cycle.c:394 | exec |
○ | hypre_BoomerAMGSolve | par_amg_solve.c:235 | exec |
○ | hypre_PCGSolve | pcg.c:424 | exec |
○ | main | amg.c:419 | exec |
○ | __libc_start_main | libc-2.31.so | |
○ | _start | amg.c:599 | exec |
Path / |
Source file and lines | csr_matvec.c:243-404 |
Module | exec |
nb instructions | 162 |
loop length | 648 |
nb stack references | 0 |
front end | 19.38 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | P12 | P13 | P14 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 20.00 | 20.00 | 21.50 | 21.50 | 21.50 | 21.50 | 9.00 | 1.00 | 1.00 | 1.00 | 9.17 | 8.83 | 9.00 | 3.00 | 3.00 |
cycles | 20.00 | 20.00 | 21.50 | 21.50 | 21.50 | 21.50 | 9.00 | 1.00 | 1.00 | 1.00 | 9.17 | 8.83 | 9.00 | 3.00 | 3.00 |
Cycles executing div or sqrt instructions | NA |
Front-end | 19.38 |
Overall L1 | 21.50 |
all | 3% |
load | 33% |
store | 100% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | P12 | P13 | P14 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
STP X29, X30, [SP, #-112]! | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
ORR X1, XZR, X0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X29, SP, #0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STP X21, X22, [SP, #32] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STP X25, X26, [SP, #64] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
LDP X21, X25, [X0, #8] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
STP D8, D9, [SP, #96] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
LDR D9, [X0] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
ORR X0, XZR, X21 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STP X19, X20, [SP, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
LDR D8, [X1, #72] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
STP X23, X24, [SP, #48] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
LDP X22, X24, [X1, #24] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDP X20, X26, [X1, #48] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDR X23, [X1, #64] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
STR X27, [SP, #80] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
LDR X27, [X1, #40] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
BL 4f7f80 <hypre_CSRMatrixGetLoadBalancedPartitionBegin> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ORR X19, XZR, X0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ORR X0, XZR, X21 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
BL 4f8024 <hypre_CSRMatrixGetLoadBalancedPartitionEnd> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ORR X21, XZR, X0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP X19, X0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
B.GT 4f9270 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.6+0x3a4> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMP X19, #0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
CCMP X27, X19, #1, #10 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
B.LT 4f9234 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.6+0x368> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMP X21, #0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
CCMP X27, X21, #1, #10 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
B.LT 4f91f8 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.6+0x32c> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
FCMP D8, #0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
B.EQ 4f9018 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.6+0x14c> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
FMOV D0, #-1.0000000 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 2 | 0.25 |
FMOV D1, #1.0000000 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 2 | 0.25 |
FCMP D8, D0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
B.NE 4f9148 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.6+0x27c> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
FCMP D9, D1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
B.EQ 4f92ac <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.6+0x3e0> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
FCMP D9, D0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
B.EQ 4f9508 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.6+0x63c> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMP X19, X21 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
B.GE 4f8ff8 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.6+0x12c> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADD X8, X22, #8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CNTD X9, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
PTRUE P4.B, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
FCMP D8, D1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
B.NE 4f9354 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.6+0x488> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
FCMP D9, D1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
B.EQ 4f948c <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.6+0x5c0> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
FCMP D9, D0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
B.NE 4f9618 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.6+0x74c> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMP X19, X21 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
B.GE 4f8ff8 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.6+0x12c> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADD X10, X22, #8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CNTD X11, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
PTRUE P1.B, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
B 4f8ff8 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.6+0x12c> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADRP X11, <52d1f8> | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADRP X12, <50c1fc> | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LDR X13, [X11, #3912] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
ADRP X14, <50c204> | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X2, X12, #3616 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X1, X14, #424 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LDR X0, [X13] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
BL 503b24 <hypre_fprintf> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADRP X15, <50c218> | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOVZ X3, #0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X0, X15, #3648 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOVZ X2, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOVZ X1, #250 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
BL 506500 <hypre_error_handler> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
B 4f8f44 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.6+0x78> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADRP X6, <52d234> | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADRP X7, <50c238> | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LDR X8, [X6, #3912] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
ADRP X9, <50c240> | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X2, X7, #3736 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X1, X9, #424 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LDR X0, [X8] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
BL 503b24 <hypre_fprintf> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADRP X10, <50c254> | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOVZ X3, #0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X0, X10, #3648 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOVZ X2, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOVZ X1, #249 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
BL 506500 <hypre_error_handler> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
B 4f8f38 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.6+0x6c> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADRP X0, <52d270> | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADRP X4, <50c274> | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LDR X3, [X0, #3912] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
ADRP X2, <50c27c> | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X1, X4, #424 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X2, X2, #3176 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LDR X0, [X3] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
BL 503b24 <hypre_fprintf> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADRP X5, <50c290> | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOVZ X3, #0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X0, X5, #3648 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOVZ X2, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOVZ X1, #248 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
BL 506500 <hypre_error_handler> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
B 4f8f2c <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.6+0x60> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMP X19, X21 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
B.GE 4f8ff8 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.6+0x12c> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADD X8, X22, #8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CNTD X9, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
PTRUE P1.B, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
LDP X19, X20, [SP, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDP X21, X22, [SP, #32] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDP X23, X24, [SP, #48] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDP X25, X26, [SP, #64] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDR X27, [SP, #80] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDP D8, D9, [SP, #96] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
LDP X29, X30, [SP], #112 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
RET | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
FCMP D9, D1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
B.EQ 4f9588 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.6+0x6bc> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
FCMP D9, D0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
B.NE 4f969c <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.6+0x7d0> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMP X19, X21 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
B.GE 4f8ff8 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.6+0x12c> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADD X6, X22, #8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CNTD X4, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
PTRUE P2.B, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
B 4f8ff8 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.6+0x12c> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMP X19, X21 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
B.GE 4f8ff8 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.6+0x12c> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADD X30, X22, #8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CNTD X27, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
PTRUE P2.B, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
B 4f8ff8 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.6+0x12c> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMP X19, X21 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
B.GE 4f8ff8 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.6+0x12c> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADD X16, X22, #8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CNTD X17, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
PTRUE P6.B, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
HINT #0 | ||||||||||||||||||
B 4f8ff8 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.6+0x12c> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMP X19, X21 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
B.GE 4f8ff8 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.6+0x12c> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADD X13, X22, #8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CNTD X14, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
PTRUE P4.B, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
HINT #0 | ||||||||||||||||||
B 4f8ff8 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.6+0x12c> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMP X19, X21 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
B.GE 4f8ff8 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.6+0x12c> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADD X6, X22, #8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CNTD X4, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
PTRUE P6.B, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
B 4f8ff8 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.6+0x12c> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMP X19, X21 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
B.GE 4f8ff8 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.6+0x12c> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADD X16, X22, #8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CNTD X17, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
PTRUE P1.B, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
B 4f8ff8 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.6+0x12c> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
Source file and lines | csr_matvec.c:243-404 |
Module | exec |
nb instructions | 162 |
loop length | 648 |
nb stack references | 0 |
front end | 19.38 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | P12 | P13 | P14 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 20.00 | 20.00 | 21.50 | 21.50 | 21.50 | 21.50 | 9.00 | 1.00 | 1.00 | 1.00 | 9.17 | 8.83 | 9.00 | 3.00 | 3.00 |
cycles | 20.00 | 20.00 | 21.50 | 21.50 | 21.50 | 21.50 | 9.00 | 1.00 | 1.00 | 1.00 | 9.17 | 8.83 | 9.00 | 3.00 | 3.00 |
Cycles executing div or sqrt instructions | NA |
Front-end | 19.38 |
Overall L1 | 21.50 |
all | 3% |
load | 33% |
store | 100% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | P12 | P13 | P14 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
STP X29, X30, [SP, #912]! | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
ORR X1, XZR, X0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X29, SP, #0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STP X21, X22, [SP, #32] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STP X25, X26, [SP, #64] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
LDP X21, X25, [X0, #8] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
STP D8, D9, [SP, #96] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
LDR D9, [X0] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
ORR X0, XZR, X21 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STP X19, X20, [SP, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
LDR D8, [X1, #72] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
STP X23, X24, [SP, #48] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
LDP X22, X24, [X1, #24] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDP X20, X26, [X1, #48] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDR X23, [X1, #64] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
STR X27, [SP, #80] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
LDR X27, [X1, #40] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
BL 4f7f80 <hypre_CSRMatrixGetLoadBalancedPartitionBegin> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ORR X19, XZR, X0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ORR X0, XZR, X21 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
BL 4f8024 <hypre_CSRMatrixGetLoadBalancedPartitionEnd> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ORR X21, XZR, X0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CMP X19, X0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
B.GT 4f9270 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.6+0x3a4> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMP X19, #0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
CCMP X27, X19, #1, #10 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
B.LT 4f9234 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.6+0x368> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMP X21, #0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
CCMP X27, X21, #1, #10 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
B.LT 4f91f8 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.6+0x32c> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
FCMP D8, #0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
B.EQ 4f9018 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.6+0x14c> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
FMOV D0, #-1.0000000 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 2 | 0.25 |
FMOV D1, #1.0000000 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 2 | 0.25 |
FCMP D8, D0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
B.NE 4f9148 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.6+0x27c> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
FCMP D9, D1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
B.EQ 4f92ac <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.6+0x3e0> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
FCMP D9, D0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
B.EQ 4f9508 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.6+0x63c> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMP X19, X21 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
B.GE 4f8ff8 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.6+0x12c> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADD X8, X22, #8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CNTD X9, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
PTRUE P4.B, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
FCMP D8, D1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
B.NE 4f9354 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.6+0x488> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
FCMP D9, D1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
B.EQ 4f948c <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.6+0x5c0> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
FCMP D9, D0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
B.NE 4f9618 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.6+0x74c> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMP X19, X21 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
B.GE 4f8ff8 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.6+0x12c> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADD X10, X22, #8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CNTD X11, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
PTRUE P1.B, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
B 4f8ff8 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.6+0x12c> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADRP X11, <52d1f8> | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADRP X12, <50c1fc> | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LDR X13, [X11, #3912] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
ADRP X14, <50c204> | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X2, X12, #3616 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X1, X14, #424 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LDR X0, [X13] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
BL 503b24 <hypre_fprintf> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADRP X15, <50c218> | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOVZ X3, #0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X0, X15, #3648 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOVZ X2, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOVZ X1, #250 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
BL 506500 <hypre_error_handler> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
B 4f8f44 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.6+0x78> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADRP X6, <52d234> | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADRP X7, <50c238> | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LDR X8, [X6, #3912] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
ADRP X9, <50c240> | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X2, X7, #3736 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X1, X9, #424 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LDR X0, [X8] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
BL 503b24 <hypre_fprintf> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADRP X10, <50c254> | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOVZ X3, #0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X0, X10, #3648 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOVZ X2, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOVZ X1, #249 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
BL 506500 <hypre_error_handler> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
B 4f8f38 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.6+0x6c> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADRP X0, <52d270> | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADRP X4, <50c274> | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LDR X3, [X0, #3912] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
ADRP X2, <50c27c> | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X1, X4, #424 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X2, X2, #3176 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LDR X0, [X3] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
BL 503b24 <hypre_fprintf> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADRP X5, <50c290> | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOVZ X3, #0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X0, X5, #3648 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOVZ X2, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOVZ X1, #248 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
BL 506500 <hypre_error_handler> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
B 4f8f2c <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.6+0x60> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMP X19, X21 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
B.GE 4f8ff8 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.6+0x12c> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADD X8, X22, #8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CNTD X9, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
PTRUE P1.B, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
LDP X19, X20, [SP, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDP X21, X22, [SP, #32] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDP X23, X24, [SP, #48] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDP X25, X26, [SP, #64] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDR X27, [SP, #80] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDP D8, D9, [SP, #96] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
LDP X29, X30, [SP], #112 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
RET | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
FCMP D9, D1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
B.EQ 4f9588 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.6+0x6bc> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
FCMP D9, D0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
B.NE 4f969c <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.6+0x7d0> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMP X19, X21 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
B.GE 4f8ff8 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.6+0x12c> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADD X6, X22, #8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CNTD X4, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
PTRUE P2.B, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
B 4f8ff8 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.6+0x12c> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMP X19, X21 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
B.GE 4f8ff8 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.6+0x12c> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADD X30, X22, #8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CNTD X27, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
PTRUE P2.B, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
B 4f8ff8 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.6+0x12c> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMP X19, X21 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
B.GE 4f8ff8 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.6+0x12c> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADD X16, X22, #8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CNTD X17, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
PTRUE P6.B, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
HINT #0 | ||||||||||||||||||
B 4f8ff8 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.6+0x12c> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMP X19, X21 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
B.GE 4f8ff8 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.6+0x12c> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADD X13, X22, #8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CNTD X14, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
PTRUE P4.B, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
HINT #0 | ||||||||||||||||||
B 4f8ff8 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.6+0x12c> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMP X19, X21 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
B.GE 4f8ff8 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.6+0x12c> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADD X6, X22, #8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CNTD X4, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
PTRUE P6.B, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
B 4f8ff8 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.6+0x12c> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
CMP X19, X21 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
B.GE 4f8ff8 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.6+0x12c> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ADD X16, X22, #8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CNTD X17, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
PTRUE P1.B, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
B 4f8ff8 <hypre_CSRMatrixMatvecOutOfPlace._omp_fn.6+0x12c> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼hypre_CSRMatrixMatvecOutOfPlace._omp_fn.6– | 46.55 | 7.17 |
▼Loop 3778 - csr_matvec.c:307-314 - exec– | 2.82 | 0.43 |
○Loop 3779 - csr_matvec.c:310-312 - exec | 35.36 | 5.45 |
▼Loop 3770 - csr_matvec.c:334-341 - exec– | 0.42 | 0.06 |
○Loop 3771 - csr_matvec.c:337-339 - exec | 1.14 | 0.17 |
▼Loop 3764 - csr_matvec.c:373-380 - exec– | 0 | 0 |
○Loop 3765 - csr_matvec.c:376-378 - exec | 0 | 0 |
▼Loop 3754 - csr_matvec.c:243-287 - exec– | 0 | 0 |
▼Loop 3762 - csr_matvec.c:256-263 - exec– | 0.26 | 0.04 |
○Loop 3761 - csr_matvec.c:259-261 - exec | 6.55 | 1.01 |
○Loop 3760 - csr_matvec.c:270-270 - exec | 0 | 0 |
▼Loop 3756 - csr_matvec.c:280-287 - exec– | 0 | 0 |
○Loop 3755 - csr_matvec.c:283-285 - exec | 0 | 0 |
○Loop 3757 - csr_matvec.c:283-283 - exec | 0 | 0 |
○Loop 3763 - csr_matvec.c:258-258 - exec | 0 | 0 |
▼Loop 3759 - csr_matvec.c:268-275 - exec– | 0 | 0 |
○Loop 3758 - csr_matvec.c:271-273 - exec | 0 | 0 |
▼Loop 3766 - csr_matvec.c:397-404 - exec– | 0 | 0 |
○Loop 3767 - csr_matvec.c:400-402 - exec | 0 | 0 |
▼Loop 3776 - csr_matvec.c:295-302 - exec– | 0 | 0 |
○Loop 3777 - csr_matvec.c:298-300 - exec | 0 | 0 |
▼Loop 3774 - csr_matvec.c:346-353 - exec– | 0 | 0 |
○Loop 3775 - csr_matvec.c:349-351 - exec | 0 | 0 |
▼Loop 3768 - csr_matvec.c:385-392 - exec– | 0 | 0 |
○Loop 3769 - csr_matvec.c:388-390 - exec | 0 | 0 |
▼Loop 3780 - csr_matvec.c:319-326 - exec– | 0 | 0 |
○Loop 3781 - csr_matvec.c:322-324 - exec | 0 | 0 |
▼Loop 3772 - csr_matvec.c:358-365 - exec– | 0 | 0 |
○Loop 3773 - csr_matvec.c:361-363 - exec | 0 | 0 |