Function: __nv_viscosity_kernel_module_viscosity_kernel__F1L50_1_ | Module: exec | Source: viscosity_kernel.f90-pp.f90:50-96 | Coverage: 13.32% |
---|
Function: __nv_viscosity_kernel_module_viscosity_kernel__F1L50_1_ | Module: exec | Source: viscosity_kernel.f90-pp.f90:50-96 | Coverage: 13.32% |
---|
/home/hbollore/qaas-runs/170-307-1706/intel/CloverLeafFC/build/build/CMakeFiles/clover_leaf.dir/CloverLeaf_ref/kernels/viscosity_kernel.f90-pp.f90: 50 - 96 |
-------------------------------------------------------------------------------- |
50: # 50 "/home/hbollore/qaas-runs/170-307-1706/intel/CloverLeafFC/build/CloverLeafFC/CloverLeaf_ref/kernels/viscosity_kernel.f90" |
51: !$OMP PARALLEL |
52: # 52 "/home/hbollore/qaas-runs/170-307-1706/intel/CloverLeafFC/build/CloverLeafFC/CloverLeaf_ref/kernels/viscosity_kernel.f90" |
53: !$OMP DO PRIVATE(ugrad,vgrad,div,strain2,pgradx,pgrady,pgradx2,pgrady2,limiter,pgrad,xgrad,ygrad,grad,grad2,dirx,diry) |
54: DO k=y_min,y_max |
55: !$OMP SIMD |
56: DO j=x_min,x_max |
57: ugrad=(xvel0(j+1,k )+xvel0(j+1,k+1))-(xvel0(j ,k )+xvel0(j ,k+1)) |
58: # 58 "/home/hbollore/qaas-runs/170-307-1706/intel/CloverLeafFC/build/CloverLeafFC/CloverLeaf_ref/kernels/viscosity_kernel.f90" |
59: vgrad=(yvel0(j ,k+1)+yvel0(j+1,k+1))-(yvel0(j ,k )+yvel0(j+1,k )) |
60: # 60 "/home/hbollore/qaas-runs/170-307-1706/intel/CloverLeafFC/build/CloverLeafFC/CloverLeaf_ref/kernels/viscosity_kernel.f90" |
61: div = (celldx(j)*(ugrad)+ celldy(k)*(vgrad)) |
62: # 62 "/home/hbollore/qaas-runs/170-307-1706/intel/CloverLeafFC/build/CloverLeafFC/CloverLeaf_ref/kernels/viscosity_kernel.f90" |
63: strain2 = 0.5_8*(xvel0(j, k+1) + xvel0(j+1,k+1)-xvel0(j ,k )-xvel0(j+1,k ))/celldy(k) & |
64: + 0.5_8*(yvel0(j+1,k ) + yvel0(j+1,k+1)-yvel0(j ,k )-yvel0(j ,k+1))/celldx(j) |
65: # 65 "/home/hbollore/qaas-runs/170-307-1706/intel/CloverLeafFC/build/CloverLeafFC/CloverLeaf_ref/kernels/viscosity_kernel.f90" |
66: pgradx=(pressure(j+1,k)-pressure(j-1,k))/(celldx(j)+celldx(j+1)) |
67: pgrady=(pressure(j,k+1)-pressure(j,k-1))/(celldy(k)+celldy(k+1)) |
68: # 68 "/home/hbollore/qaas-runs/170-307-1706/intel/CloverLeafFC/build/CloverLeafFC/CloverLeaf_ref/kernels/viscosity_kernel.f90" |
69: pgradx2 = pgradx*pgradx |
70: pgrady2 = pgrady*pgrady |
71: # 71 "/home/hbollore/qaas-runs/170-307-1706/intel/CloverLeafFC/build/CloverLeafFC/CloverLeaf_ref/kernels/viscosity_kernel.f90" |
72: limiter = ((0.5_8*(ugrad)/celldx(j))*pgradx2+(0.5_8*(vgrad)/celldy(k))*pgrady2+strain2*pgradx*pgrady) & |
73: /MAX(pgradx2+pgrady2,1.0e-16_8) |
74: # 74 "/home/hbollore/qaas-runs/170-307-1706/intel/CloverLeafFC/build/CloverLeafFC/CloverLeaf_ref/kernels/viscosity_kernel.f90" |
75: IF ((limiter.GT.0.0).OR.(div.GE.0.0))THEN |
76: viscosity(j,k) = 0.0 |
77: ELSE |
78: dirx=1.0_8 |
79: IF(pgradx.LT.0.0) dirx=-1.0_8 |
80: pgradx = dirx*MAX(1.0e-16_8,ABS(pgradx)) |
81: diry=1.0_8 |
82: IF(pgradx.LT.0.0) diry=-1.0_8 |
83: pgrady = diry*MAX(1.0e-16_8,ABS(pgrady)) |
84: pgrad = SQRT(pgradx**2+pgrady**2) |
85: xgrad = ABS(celldx(j)*pgrad/pgradx) |
86: ygrad = ABS(celldy(k)*pgrad/pgrady) |
87: grad = MIN(xgrad,ygrad) |
88: grad2 = grad*grad |
89: # 89 "/home/hbollore/qaas-runs/170-307-1706/intel/CloverLeafFC/build/CloverLeafFC/CloverLeaf_ref/kernels/viscosity_kernel.f90" |
90: viscosity(j,k)=2.0_8*density0(j,k)*grad2*limiter*limiter |
91: ENDIF |
92: # 92 "/home/hbollore/qaas-runs/170-307-1706/intel/CloverLeafFC/build/CloverLeafFC/CloverLeaf_ref/kernels/viscosity_kernel.f90" |
93: ENDDO |
94: ENDDO |
95: !$OMP END DO |
96: # 96 "/home/hbollore/qaas-runs/170-307-1706/intel/CloverLeafFC/build/CloverLeafFC/CloverLeaf_ref/kernels/viscosity_kernel.f90" |
0x44c8f0 SUB SP, SP, #288 |
0x44c8f4 STP X29, X30, [SP, #192] |
0x44c8f8 STP X28, X27, [SP, #208] |
0x44c8fc STP X26, X25, [SP, #224] |
0x44c900 STP X24, X23, [SP, #240] |
0x44c904 STP X22, X21, [SP, #256] |
0x44c908 STP X20, X19, [SP, #272] |
0x44c90c LDP X8, X9, [X2] |
0x44c910 LDR W20, [X0] |
0x44c914 ORR X0, XZR, XZR |
0x44c918 STR X2, [SP, #144] |
0x44c91c ADD X3, SP, #188 |
0x44c920 ADD X4, SP, #184 |
0x44c924 ADD X5, SP, #180 |
0x44c928 ADD X6, SP, #176 |
0x44c92c MOVZ W2, #34 |
0x44c930 MOVZ W7, #1 |
0x44c934 STR WZR, [SP, #188] |
0x44c938 LDR W19, [X9] |
0x44c93c LDR W8, [X8] |
0x44c940 ORR W1, WZR, W20 |
0x44c944 STP W19, W8, [SP, #180] |
0x44c948 MOVZ W8, #1 |
0x44c94c STR W8, [SP, #176] |
0x44c950 STR W8, [SP] |
0x44c954 BL 404b70 |
0x44c958 LDRSW X21, [SP, #184] |
0x44c95c CMP W21, W19 |
0x44c960 B.GT 44cf94 |
0x44c964 LDR W9, [SP, #180] |
0x44c968 SUBS W9, W9, W21 |
0x44c96c B.MI 44cf94 |
0x44c970 LDR X8, [SP, #144] |
0x44c974 LDP X12, X10, [X8, #16] |
0x44c978 LDR W11, [X10] |
0x44c97c LDRSW X3, [X12] |
0x44c980 SUBS W10, W11, W3 |
0x44c984 B.MI 44cf94 |
0x44c988 LDR X8, [SP, #144] |
0x44c98c STR W20, [SP, #20] |
0x44c990 ADD W20, W9, #1 |
0x44c994 ADD W18, W10, #1 |
0x44c998 SUB W17, W11, W3 |
0x44c99c ADD X16, X21, #1 |
0x44c9a0 FMOV D3, #0.5000000 |
0x44c9a4 DUP Z4.D, #0 |
0x44c9a8 LDR X10, [X8, #56] |
0x44c9ac LDP X14, X9, [X8, #128] |
0x44c9b0 LDR X19, [X8, #144] |
0x44c9b4 LDP X4, X23, [X8, #168] |
0x44c9b8 ADD X12, X8, #208 |
0x44c9bc LDR X11, [X8, #32] |
0x44c9c0 LDR X0, [X8, #192] |
0x44c9c4 LDR X5, [X8, #112] |
0x44c9c8 CMP W18, #1 |
0x44c9cc STR W18, [SP, #140] |
0x44c9d0 CSINC W18, W18, WZR, #11 |
0x44c9d4 SUB W17, W17, W18 |
0x44c9d8 ORR X25, XZR, X3 |
0x44c9dc UBFM X15, X3, #61, #60 |
0x44c9e0 INDEX Z0.D, X3, #1 |
0x44c9e4 SUB X2, X21, #1 |
0x44c9e8 PTRUE P0.D, ALL |
0x44c9ec ADRP X1, <4609ec> |
0x44c9f0 LDR D1, [X1, #1328] |
0x44c9f4 CNTD X13, ALL |
0x44c9f8 DUP Z5.D, X13 |
0x44c9fc ADD W17, W17, #1 |
0x44ca00 LDR X6, [X10] |
0x44ca04 LDR X7, [X14] |
0x44ca08 LDR X9, [X9] |
0x44ca0c LDP X10, X14, [X8, #96] |
0x44ca10 ADD X8, X19, #8 |
0x44ca14 ADD X18, X23, #8 |
0x44ca18 SUB X1, X23, #8 |
0x44ca1c STP X8, X19, [SP, #96] |
0x44ca20 ADD X8, X14, #8 |
0x44ca24 LDR X10, [X10] |
0x44ca28 UBFM X3, X6, #61, #60 |
0x44ca2c UBFM X9, X9, #61, #60 |
0x44ca30 MADD X2, X7, X2, XZR |
0x44ca34 STR X7, [SP, #128] |
0x44ca38 STP X8, X23, [SP, #48] |
0x44ca3c LDR X8, [X4] |
0x44ca40 MADD X4, X6, X21, XZR |
0x44ca44 SUB X24, X4, X10 |
0x44ca48 STR X8, [SP, #88] |
0x44ca4c ADD X8, X11, #8 |
0x44ca50 STR X8, [SP, #40] |
0x44ca54 ADD X8, X17, #1 |
0x44ca58 MADD X17, X6, X16, XZR |
0x44ca5c MADD X16, X7, X16, XZR |
0x44ca60 ADD X19, X15, X17,LSL #3 |
0x44ca64 STP X6, X8, [SP, #112] |
0x44ca68 LDR X8, [X0] |
0x44ca6c UBFM X6, X7, #61, #60 |
0x44ca70 UBFM X0, X10, #61, #60 |
0x44ca74 STP X6, X3, [SP, #72] |
0x44ca78 SUB X3, X17, X10 |
0x44ca7c ADD X10, X16, X25 |
0x44ca80 SUB X6, X15, X9 |
0x44ca84 ADD X15, X15, X4,LSL #3 |
0x44ca88 ORR X4, XZR, X25 |
0x44ca8c MADD X7, X7, X21, XZR |
0x44ca90 SUB X17, X19, X0 |
0x44ca94 SUB X15, X15, X0 |
0x44ca98 ADD X22, X5, X6 |
0x44ca9c STR X4, [SP, #64] |
0x44caa0 SUB X10, X10, X8 |
0x44caa4 SUB X29, X2, X8 |
0x44caa8 SUB X30, X16, X8 |
0x44caac STR X8, [SP, #24] |
0x44cab0 MOVZ X16, #1 |
0x44cab4 ADD X26, X11, X17 |
0x44cab8 ADD X28, X11, X15 |
0x44cabc ADD X11, X2, X25 |
0x44cac0 ADD X25, X14, X17 |
0x44cac4 ADD X27, X14, X15 |
0x44cac8 ORR X14, XZR, X4 |
0x44cacc ADD X19, X23, X10,LSL #3 |
0x44cad0 ADRP X10, <460ad0> |
0x44cad4 ADD X10, X10, #1328 |
0x44cad8 LD1RD {Z2.D}, P0/Z, [X10] |
0x44cadc SUB X11, X11, X8 |
0x44cae0 UBFM X10, X7, #61, #60 |
0x44cae4 SUB X0, X10, X8,LSL #3 |
0x44cae8 ADD X6, X23, X11,LSL #3 |
0x44caec ORR X23, XZR, X3 |
0x44caf0 SUB X3, X7, X8 |
0x44caf4 SUB X8, X5, X9 |
0x44caf8 ORR X7, XZR, X4 |
0x44cafc STR X8, [SP, #32] |
0x44cb00 B 44cb5c |
(1091) 0x44cb04 LDR X21, [SP, #168] |
(1091) 0x44cb08 LDR X7, [SP, #64] |
(1091) 0x44cb0c LDR W20, [SP, #164] |
(1091) 0x44cb10 LDR X23, [SP, #152] |
(1093) 0x44cb14 LDP X10, X8, [SP, #72] |
(1093) 0x44cb18 LDR X9, [SP, #128] |
(1093) 0x44cb1c ADD X21, X21, #1 |
(1093) 0x44cb20 SUBS W20, W20, #1 |
(1093) 0x44cb24 ADD X25, X25, X8 |
(1093) 0x44cb28 ADD X26, X26, X8 |
(1093) 0x44cb2c ADD X27, X27, X8 |
(1093) 0x44cb30 ADD X28, X28, X8 |
(1093) 0x44cb34 LDR X8, [SP, #112] |
(1093) 0x44cb38 ADD X19, X19, X10 |
(1093) 0x44cb3c ADD X6, X6, X10 |
(1093) 0x44cb40 ADD X29, X29, X9 |
(1093) 0x44cb44 ADD X30, X30, X9 |
(1093) 0x44cb48 ADD X0, X0, X10 |
(1093) 0x44cb4c ADD X3, X3, X9 |
(1093) 0x44cb50 ADD X23, X23, X8 |
(1093) 0x44cb54 ADD X24, X24, X8 |
(1093) 0x44cb58 B.LE 44cf90 |
(1093) 0x44cb5c LDR X8, [SP, #88] |
(1093) 0x44cb60 LDR W17, [SP, #140] |
(1093) 0x44cb64 SUB X9, X21, X8 |
(1093) 0x44cb68 LDR X8, [SP, #104] |
(1093) 0x44cb6c LDR D6, [X8, X9,LSL #3] |
(1093) 0x44cb70 LDR X8, [SP, #96] |
(1093) 0x44cb74 LDR D7, [X8, X9,LSL #3] |
(1093) 0x44cb78 LDR X8, [SP, #120] |
(1093) 0x44cb7c ORR X9, XZR, X7 |
(1093) 0x44cb80 CMP X8, X13 |
(1093) 0x44cb84 FADD D7, D6, D7 |
(1093) 0x44cb88 B.CC 44cd98 |
(1093) 0x44cb8c LDR X8, [SP, #128] |
(1093) 0x44cb90 ORR X14, XZR, XZR |
(1093) 0x44cb94 DUP Z16.D, Z6.D[0] |
(1093) 0x44cb98 DUP Z17.D, Z7.D[0] |
(1093) 0x44cb9c MADD X10, X8, X21, XZR |
(1093) 0x44cba0 LDR X8, [SP, #120] |
(1093) 0x44cba4 ORR Z19.D, Z0.D, Z0.D |
(1093) 0x44cba8 UDIV X9, X8, X13 |
(1093) 0x44cbac MADD X15, X9, X13, XZR |
(1093) 0x44cbb0 SUB X11, X8, X15 |
(1093) 0x44cbb4 LDR W8, [SP, #140] |
(1093) 0x44cbb8 ADD X9, X15, X7 |
(1093) 0x44cbbc SUB W17, W8, W15 |
(1093) 0x44cbc0 LDR X8, [SP, #24] |
(1093) 0x44cbc4 SUB X10, X10, X8 |
(1093) 0x44cbc8 LDR X8, [SP, #144] |
(1093) 0x44cbcc DUP Z18.D, X10 |
(1093) 0x44cbd0 LDR X10, [X8, #200] |
(1093) 0x44cbd4 HINT #0 |
(1093) 0x44cbd8 HINT #0 |
(1093) 0x44cbdc HINT #0 |
(1092) 0x44cbe0 UBFM X2, X14, #61, #60 |
(1092) 0x44cbe4 ADD X4, X26, X2 |
(1092) 0x44cbe8 ADD X5, X28, X2 |
(1092) 0x44cbec LD1D {Z20.D}, P0/Z, [X4, X16,LSL #3] |
(1092) 0x44cbf0 LD1D {Z21.D}, P0/Z, [X5, X16,LSL #3] |
(1092) 0x44cbf4 LD1D {Z23.D}, P0/Z, [X4, MUL VL] |
(1092) 0x44cbf8 ADD X4, X25, X2 |
(1092) 0x44cbfc LD1D {Z24.D}, P0/Z, [X5, MUL VL] |
(1092) 0x44cc00 LD1D {Z26.D}, P0/Z, [X4, X16,LSL #3] |
(1092) 0x44cc04 LD1D {Z27.D}, P0/Z, [X4, MUL VL] |
(1092) 0x44cc08 ADD X4, X27, X2 |
(1092) 0x44cc0c ADD X2, X22, X2 |
(1092) 0x44cc10 LD1D {Z28.D}, P0/Z, [X4, X16,LSL #3] |
(1092) 0x44cc14 FADD Z25.D, Z23.D, Z24.D |
(1092) 0x44cc18 LD1D {Z29.D}, P0/Z, [X4, MUL VL] |
(1092) 0x44cc1c LD1D {Z31.D}, P0/Z, [X2, MUL VL] |
(1092) 0x44cc20 FADD Z22.D, Z20.D, Z21.D |
(1092) 0x44cc24 FADD Z20.D, Z20.D, Z23.D |
(1092) 0x44cc28 FSUB Z22.D, Z22.D, Z25.D |
(1092) 0x44cc2c FADD Z25.D, Z26.D, Z27.D |
(1092) 0x44cc30 FSUB Z20.D, Z20.D, Z24.D |
(1092) 0x44cc34 FADD Z26.D, Z26.D, Z28.D |
(1092) 0x44cc38 FSUB Z20.D, Z20.D, Z21.D |
(1092) 0x44cc3c FADD Z30.D, Z28.D, Z29.D |
(1092) 0x44cc40 FSUB Z26.D, Z26.D, Z29.D |
(1092) 0x44cc44 FMUL Z20.D, P0/M, Z20.D, #0.5 |
(1092) 0x44cc48 MOVPRFX Z21, Z20 |
(1092) 0x44cc4c FDIV Z21.D, P0/M, Z21.D, Z16.D |
(1092) 0x44cc50 ADD Z20.D, Z18.D, Z19.D |
(1092) 0x44cc54 FSUB Z25.D, Z25.D, Z30.D |
(1092) 0x44cc58 MOVPRFX Z29, Z25 |
(1092) 0x44cc5c FMUL Z29.D, P0/M, Z29.D, #0.5 |
(1092) 0x44cc60 FDIV Z29.D, P0/M, Z29.D, Z16.D |
(1092) 0x44cc64 ADD Z19.D, Z19.D, Z5.D |
(1092) 0x44cc68 FSUB Z26.D, Z26.D, Z27.D |
(1092) 0x44cc6c FMOV X4, D20 |
(1092) 0x44cc70 FMUL Z27.D, Z22.D, Z31.D |
(1092) 0x44cc74 FMUL Z22.D, P0/M, Z22.D, #0.5 |
(1092) 0x44cc78 FMUL Z26.D, P0/M, Z26.D, #0.5 |
(1092) 0x44cc7c LD1D {Z23.D}, P0/Z, [X18, X4,LSL #3] |
(1092) 0x44cc80 LD1D {Z24.D}, P0/Z, [X1, X4,LSL #3] |
(1092) 0x44cc84 FDIV Z22.D, P0/M, Z22.D, Z31.D |
(1092) 0x44cc88 FMAD Z25.D, P0/M, Z16.D, Z27.D |
(1092) 0x44cc8c FDIV Z26.D, P0/M, Z26.D, Z31.D |
(1092) 0x44cc90 FCMGE P2.D, P0/Z, Z25.D, #0 |
(1092) 0x44cc94 FSUB Z23.D, Z23.D, Z24.D |
(1092) 0x44cc98 LD1D {Z24.D}, P0/Z, [X2, X16,LSL #3] |
(1092) 0x44cc9c FADD Z24.D, Z31.D, Z24.D |
(1092) 0x44cca0 FDIV Z23.D, P0/M, Z23.D, Z24.D |
(1092) 0x44cca4 LD1D {Z24.D}, P0/Z, [X19, X14,LSL #3] |
(1092) 0x44cca8 FADD Z21.D, Z21.D, Z26.D |
(1092) 0x44ccac LD1D {Z26.D}, P0/Z, [X6, X14,LSL #3] |
(1092) 0x44ccb0 ADD X14, X14, X13 |
(1092) 0x44ccb4 CMP X15, X14 |
(1092) 0x44ccb8 FSUB Z24.D, Z24.D, Z26.D |
(1092) 0x44ccbc FDIV Z24.D, P0/M, Z24.D, Z17.D |
(1092) 0x44ccc0 FMUL Z26.D, Z23.D, Z23.D |
(1092) 0x44ccc4 FMUL Z21.D, Z21.D, Z23.D |
(1092) 0x44ccc8 FMUL Z22.D, Z22.D, Z26.D |
(1092) 0x44cccc FMUL Z28.D, Z24.D, Z24.D |
(1092) 0x44ccd0 FMLA Z22.D, P0/M, Z28.D, Z29.D |
(1092) 0x44ccd4 FMAD Z21.D, P0/M, Z24.D, Z22.D |
(1092) 0x44ccd8 FADD Z22.D, Z26.D, Z28.D |
(1092) 0x44ccdc FCMGE P1.D, P0/Z, Z22.D, Z2.D |
(1092) 0x44cce0 SEL Z22.D, P1, Z22.D, Z2.D |
(1092) 0x44cce4 FDIV Z21.D, P0/M, Z21.D, Z22.D |
(1092) 0x44cce8 MOVPRFX Z22, Z23 |
(1092) 0x44ccec FABS Z22.D, P0/M, Z23.D |
(1092) 0x44ccf0 FCMGE P3.D, P0/Z, Z22.D, Z2.D |
(1092) 0x44ccf4 SEL Z22.D, P3, Z22.D, Z2.D |
(1092) 0x44ccf8 FCMLT P3.D, P0/Z, Z23.D, #0 |
(1092) 0x44ccfc MOVPRFX Z23, Z22 |
(1092) 0x44cd00 FNEG Z23.D, P0/M, Z22.D |
(1092) 0x44cd04 EOR P3.B, P0/Z, P3.B, P0.B |
(1092) 0x44cd08 SEL Z22.D, P3, Z22.D, Z23.D |
(1092) 0x44cd0c MOVPRFX Z23, Z24 |
(1092) 0x44cd10 FABS Z23.D, P0/M, Z24.D |
(1092) 0x44cd14 FCMLT P3.D, P0/Z, Z22.D, #0 |
(1092) 0x44cd18 EOR P3.B, P0/Z, P3.B, P0.B |
(1092) 0x44cd1c FCMGT P1.D, P0/Z, Z21.D, #0 |
(1092) 0x44cd20 EOR P1.B, P0/Z, P1.B, P0.B |
(1092) 0x44cd24 BIC P1.B, P1/Z, P1.B, P2.B |
(1092) 0x44cd28 FCMGE P2.D, P0/Z, Z23.D, Z2.D |
(1092) 0x44cd2c SEL Z23.D, P2, Z23.D, Z2.D |
(1092) 0x44cd30 MOVPRFX Z24, Z23 |
(1092) 0x44cd34 FNEG Z24.D, P0/M, Z23.D |
(1092) 0x44cd38 SEL Z23.D, P3, Z23.D, Z24.D |
(1092) 0x44cd3c FMUL Z24.D, Z23.D, Z23.D |
(1092) 0x44cd40 FMLA Z24.D, P0/M, Z22.D, Z22.D |
(1092) 0x44cd44 FSQRT Z24.D, P0/M, Z24.D |
(1092) 0x44cd48 FMUL Z25.D, Z31.D, Z24.D |
(1092) 0x44cd4c FMUL Z24.D, Z16.D, Z24.D |
(1092) 0x44cd50 FDIVR Z22.D, P0/M, Z22.D, Z25.D |
(1092) 0x44cd54 FDIVR Z23.D, P0/M, Z23.D, Z24.D |
(1092) 0x44cd58 FABS Z22.D, P0/M, Z22.D |
(1092) 0x44cd5c FABS Z23.D, P0/M, Z23.D |
(1092) 0x44cd60 FCMGE P2.D, P0/Z, Z22.D, Z23.D |
(1092) 0x44cd64 SEL Z22.D, P2, Z23.D, Z22.D |
(1092) 0x44cd68 LD1D {Z23.D}, P1/Z, [X12, Z4.D,LSL #3] |
(1092) 0x44cd6c FMUL Z22.D, Z22.D, Z22.D |
(1092) 0x44cd70 ADR Z23.D, [Z23, Z20.D,LSL #3] |
(1092) 0x44cd74 LD1D {Z23.D}, P1/Z, [Z23.D] |
(1092) 0x44cd78 FADD Z23.D, Z23.D, Z23.D |
(1092) 0x44cd7c FMUL Z22.D, Z22.D, Z23.D |
(1092) 0x44cd80 FMUL Z22.D, Z21.D, Z22.D |
(1092) 0x44cd84 FMUL Z21.D, Z21.D, Z22.D |
(1092) 0x44cd88 SEL Z21.D, P1, Z21.D, Z4.D |
(1092) 0x44cd8c ST1D {Z21.D}, P0, [X10, Z20.D,LSL #3] |
(1092) 0x44cd90 B.NE 44cbe0 |
(1093) 0x44cd94 CBZ X11, 44cb14 |
(1091) 0x44cd98 LDR X8, [SP, #144] |
(1091) 0x44cd9c ADD X14, X9, X29 |
(1091) 0x44cda0 STR X23, [SP, #152] |
(1091) 0x44cda4 STR W20, [SP, #164] |
(1091) 0x44cda8 ADD W20, W17, #1 |
(1091) 0x44cdac ADD X15, X9, X24 |
(1091) 0x44cdb0 ORR X11, XZR, XZR |
(1091) 0x44cdb4 UBFM X15, X15, #61, #60 |
(1091) 0x44cdb8 STR X21, [SP, #168] |
(1091) 0x44cdbc LDR X10, [X8, #200] |
(1091) 0x44cdc0 LDP X7, X8, [SP, #48] |
(1091) 0x44cdc4 ADD X2, X8, X14,LSL #3 |
(1091) 0x44cdc8 ADD X14, X9, X23 |
(1091) 0x44cdcc LDR X23, [SP, #40] |
(1091) 0x44cdd0 ADD X21, X7, X15 |
(1091) 0x44cdd4 UBFM X14, X14, #61, #60 |
(1091) 0x44cdd8 ADD X4, X7, X14 |
(1091) 0x44cddc ADD X17, X23, X14 |
(1091) 0x44cde0 ADD X14, X9, X30 |
(1091) 0x44cde4 ADD X15, X23, X15 |
(1091) 0x44cde8 ADD X5, X8, X14,LSL #3 |
(1091) 0x44cdec UBFM X8, X9, #61, #60 |
(1091) 0x44cdf0 ADD X9, X9, X3 |
(1091) 0x44cdf4 ADD X14, X0, X8 |
(1091) 0x44cdf8 UBFM X7, X9, #61, #60 |
(1091) 0x44cdfc ADD X9, X10, X7 |
(1091) 0x44ce00 LDR X10, [SP, #32] |
(1091) 0x44ce04 ADD X7, X1, X7 |
(1091) 0x44ce08 ADD X10, X10, X8 |
(1091) 0x44ce0c B 44ce34 |
0x44ce10 HINT #0 |
0x44ce14 HINT #0 |
0x44ce18 HINT #0 |
0x44ce1c HINT #0 |
(1091) 0x44ce20 SUB W20, W20, #1 |
(1091) 0x44ce24 STR D22, [X9, X11] |
(1091) 0x44ce28 ADD X11, X11, #8 |
(1091) 0x44ce2c CMP W20, #1 |
(1091) 0x44ce30 B.LE 44cb04 |
(1091) 0x44ce34 ADD X8, X17, X11 |
(1091) 0x44ce38 ADD X23, X15, X11 |
(1091) 0x44ce3c LDP D21, D19, [X8, #1016] |
(1091) 0x44ce40 LDP D22, D20, [X23, #1016] |
(1091) 0x44ce44 ADD X8, X4, X11 |
(1091) 0x44ce48 FADD D16, D19, D20 |
(1091) 0x44ce4c FADD D17, D21, D22 |
(1091) 0x44ce50 FADD D19, D19, D21 |
(1091) 0x44ce54 FSUB D17, D16, D17 |
(1091) 0x44ce58 LDP D23, D16, [X8, #1016] |
(1091) 0x44ce5c ADD X8, X21, X11 |
(1091) 0x44ce60 FSUB D19, D19, D22 |
(1091) 0x44ce64 LDR D22, [X2, X11] |
(1091) 0x44ce68 LDP D25, D24, [X8, #1016] |
(1091) 0x44ce6c ADD X8, X10, X11 |
(1091) 0x44ce70 FSUB D19, D19, D20 |
(1091) 0x44ce74 FMUL D19, D19, D3 |
(1091) 0x44ce78 FADD D18, D16, D23 |
(1091) 0x44ce7c FADD D16, D16, D24 |
(1091) 0x44ce80 FDIV D19, D19, D6 |
(1091) 0x44ce84 FSUB D16, D16, D25 |
(1091) 0x44ce88 FADD D26, D24, D25 |
(1091) 0x44ce8c FMUL D25, D17, D3 |
(1091) 0x44ce90 FSUB D16, D16, D23 |
(1091) 0x44ce94 FSUB D18, D18, D26 |
(1091) 0x44ce98 FMUL D23, D16, D3 |
(1091) 0x44ce9c LDP D16, D24, [X8] |
(1091) 0x44cea0 ADD X8, X7, X11 |
(1091) 0x44cea4 LDR D20, [X8, #16] |
(1091) 0x44cea8 LDR D21, [X8] |
(1091) 0x44ceac FDIV D23, D23, D16 |
(1091) 0x44ceb0 FDIV D25, D25, D16 |
(1091) 0x44ceb4 FSUB D20, D20, D21 |
(1091) 0x44ceb8 FADD D21, D16, D24 |
(1091) 0x44cebc FMUL D24, D18, D3 |
(1091) 0x44cec0 FDIV D20, D20, D21 |
(1091) 0x44cec4 LDR D21, [X5, X11] |
(1091) 0x44cec8 FDIV D24, D24, D6 |
(1091) 0x44cecc FSUB D21, D21, D22 |
(1091) 0x44ced0 FDIV D21, D21, D7 |
(1091) 0x44ced4 FADD D19, D19, D23 |
(1091) 0x44ced8 FMUL D22, D20, D20 |
(1091) 0x44cedc FMUL D19, D19, D20 |
(1091) 0x44cee0 FMUL D25, D25, D22 |
(1091) 0x44cee4 FMUL D23, D21, D21 |
(1091) 0x44cee8 FMADD D24, D23, D24, D25 |
(1091) 0x44ceec FADD D22, D22, D23 |
(1091) 0x44cef0 FMAXNM D22, D22, D1 |
(1091) 0x44cef4 FMADD D19, D21, D19, D24 |
(1091) 0x44cef8 FDIV D19, D19, D22 |
(1091) 0x44cefc MOVI D22, #0 |
(1091) 0x44cf00 FCMP D19, #0 |
(1091) 0x44cf04 B.GT 44ce20 |
(1091) 0x44cf08 FMUL D17, D17, D16 |
(1091) 0x44cf0c FMADD D17, D6, D18, D17 |
(1091) 0x44cf10 FCMP D17, #0 |
(1091) 0x44cf14 B.GE 44ce20 |
(1091) 0x44cf18 FABS D17, D20 |
(1091) 0x44cf1c FCMP D20, #0 |
(1091) 0x44cf20 LDR X8, [X12] |
(1091) 0x44cf24 ADD X8, X8, X14 |
(1091) 0x44cf28 FMAXNM D17, D17, D1 |
(1091) 0x44cf2c FNEG D18, D17 |
(1091) 0x44cf30 FCSEL D17, D17, D18, #5 |
(1091) 0x44cf34 FABS D18, D21 |
(1091) 0x44cf38 FMAXNM D18, D18, D1 |
(1091) 0x44cf3c FCMP D17, #0 |
(1091) 0x44cf40 FNEG D20, D18 |
(1091) 0x44cf44 FCSEL D18, D18, D20, #5 |
(1091) 0x44cf48 FMUL D20, D18, D18 |
(1091) 0x44cf4c FMADD D20, D17, D17, D20 |
(1091) 0x44cf50 FSQRT D20, D20 |
(1091) 0x44cf54 FMUL D16, D16, D20 |
(1091) 0x44cf58 FDIV D16, D16, D17 |
(1091) 0x44cf5c FMUL D17, D6, D20 |
(1091) 0x44cf60 FDIV D17, D17, D18 |
(1091) 0x44cf64 FABS D16, D16 |
(1091) 0x44cf68 FABS D17, D17 |
(1091) 0x44cf6c FCMP D16, D17 |
(1091) 0x44cf70 FCSEL D16, D17, D16, #10 |
(1091) 0x44cf74 LDR D17, [X8, X11] |
(1091) 0x44cf78 FMUL D16, D16, D16 |
(1091) 0x44cf7c FADD D17, D17, D17 |
(1091) 0x44cf80 FMUL D16, D16, D17 |
(1091) 0x44cf84 FMUL D16, D19, D16 |
(1091) 0x44cf88 FMUL D22, D19, D16 |
(1091) 0x44cf8c B 44ce20 |
0x44cf90 LDR W20, [SP, #20] |
0x44cf94 ORR X0, XZR, XZR |
0x44cf98 ORR W1, WZR, W20 |
0x44cf9c BL 404c90 |
0x44cfa0 ORR X0, XZR, XZR |
0x44cfa4 ORR W1, WZR, W20 |
0x44cfa8 BL 404870 |
0x44cfac LDP X20, X19, [SP, #272] |
0x44cfb0 LDP X22, X21, [SP, #256] |
0x44cfb4 LDP X24, X23, [SP, #240] |
0x44cfb8 LDP X26, X25, [SP, #224] |
0x44cfbc LDP X28, X27, [SP, #208] |
0x44cfc0 LDP X29, X30, [SP, #192] |
0x44cfc4 ADD SP, SP, #288 |
0x44cfc8 RET |
0x44cfcc HINT #0 |
0x44cfd0 HINT #0 |
0x44cfd4 HINT #0 |
0x44cfd8 HINT #0 |
0x44cfdc HINT #0 |
Path / |
Source file and lines | viscosity_kernel.f90-pp.f90:50-96 |
Module | exec |
nb instructions | 157 |
loop length | 628 |
nb stack references | 0 |
front end | 18.50 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | P12 | P13 | P14 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 4.00 | 4.00 | 20.75 | 20.75 | 20.75 | 20.75 | 1.00 | 1.00 | 0.50 | 0.50 | 19.00 | 19.00 | 19.00 | 11.50 | 11.50 |
cycles | 4.00 | 4.00 | 20.75 | 20.75 | 20.75 | 20.75 | 1.00 | 1.00 | 0.50 | 0.50 | 19.00 | 19.00 | 19.00 | 11.50 | 11.50 |
Cycles executing div or sqrt instructions | NA |
Front-end | 18.50 |
Overall L1 | 20.75 |
all | 0% |
load | 0% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | 0% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | P12 | P13 | P14 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
SUB SP, SP, #288 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STP X29, X30, [SP, #192] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STP X28, X27, [SP, #208] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STP X26, X25, [SP, #224] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STP X24, X23, [SP, #240] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STP X22, X21, [SP, #256] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STP X20, X19, [SP, #272] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
LDP X8, X9, [X2] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDR W20, [X0] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
ORR X0, XZR, XZR | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STR X2, [SP, #144] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
ADD X3, SP, #188 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X4, SP, #184 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X5, SP, #180 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X6, SP, #176 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOVZ W2, #34 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOVZ W7, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STR WZR, [SP, #188] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
LDR W19, [X9] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR W8, [X8] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
ORR W1, WZR, W20 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STP W19, W8, [SP, #180] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
MOVZ W8, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STR W8, [SP, #176] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STR W8, [SP] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
BL 404b70 <@plt_start@+0x330> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
LDRSW X21, [SP, #184] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
CMP W21, W19 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
B.GT 44cf94 <__nv_viscosity_kernel_module_viscosity_kernel__F1L50_1_+0x6a4> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
LDR W9, [SP, #180] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
SUBS W9, W9, W21 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
B.MI 44cf94 <__nv_viscosity_kernel_module_viscosity_kernel__F1L50_1_+0x6a4> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
LDR X8, [SP, #144] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDP X12, X10, [X8, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDR W11, [X10] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDRSW X3, [X12] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
SUBS W10, W11, W3 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
B.MI 44cf94 <__nv_viscosity_kernel_module_viscosity_kernel__F1L50_1_+0x6a4> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
LDR X8, [SP, #144] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
STR W20, [SP, #20] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
ADD W20, W9, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD W18, W10, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB W17, W11, W3 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X16, X21, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
FMOV D3, #0.5000000 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 2 | 0.25 |
DUP Z4.D, #0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 0.50 |
LDR X10, [X8, #56] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDP X14, X9, [X8, #128] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDR X19, [X8, #144] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDP X4, X23, [X8, #168] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
ADD X12, X8, #208 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LDR X11, [X8, #32] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR X0, [X8, #192] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR X5, [X8, #112] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
CMP W18, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
STR W18, [SP, #140] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
CSINC W18, W18, WZR, #11 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB W17, W17, W18 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ORR X25, XZR, X3 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
UBFM X15, X3, #61, #60 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
INDEX Z0.D, X3, #1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5 | 2 |
SUB X2, X21, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
PTRUE P0.D, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
ADRP X1, <4609ec> | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LDR D1, [X1, #1328] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
CNTD X13, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
DUP Z5.D, X13 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD W17, W17, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LDR X6, [X10] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR X7, [X14] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR X9, [X9] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDP X10, X14, [X8, #96] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
ADD X8, X19, #8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X18, X23, #8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB X1, X23, #8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STP X8, X19, [SP, #96] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
ADD X8, X14, #8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LDR X10, [X10] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
UBFM X3, X6, #61, #60 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
UBFM X9, X9, #61, #60 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MADD X2, X7, X2, XZR | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
STR X7, [SP, #128] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STP X8, X23, [SP, #48] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
LDR X8, [X4] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
MADD X4, X6, X21, XZR | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
SUB X24, X4, X10 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STR X8, [SP, #88] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
ADD X8, X11, #8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STR X8, [SP, #40] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
ADD X8, X17, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MADD X17, X6, X16, XZR | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
MADD X16, X7, X16, XZR | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
ADD X19, X15, X17,LSL #3 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STP X6, X8, [SP, #112] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
LDR X8, [X0] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
UBFM X6, X7, #61, #60 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
UBFM X0, X10, #61, #60 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STP X6, X3, [SP, #72] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
SUB X3, X17, X10 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X10, X16, X25 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB X6, X15, X9 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X15, X15, X4,LSL #3 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ORR X4, XZR, X25 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MADD X7, X7, X21, XZR | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
SUB X17, X19, X0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB X15, X15, X0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X22, X5, X6 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STR X4, [SP, #64] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
SUB X10, X10, X8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB X29, X2, X8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB X30, X16, X8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STR X8, [SP, #24] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
MOVZ X16, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X26, X11, X17 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X28, X11, X15 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X11, X2, X25 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X25, X14, X17 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X27, X14, X15 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ORR X14, XZR, X4 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X19, X23, X10,LSL #3 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADRP X10, <460ad0> | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X10, X10, #1328 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LD1RD {Z2.D}, P0/Z, [X10] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 6 | 0.50 |
SUB X11, X11, X8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
UBFM X10, X7, #61, #60 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB X0, X10, X8,LSL #3 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X6, X23, X11,LSL #3 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ORR X23, XZR, X3 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB X3, X7, X8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB X8, X5, X9 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ORR X7, XZR, X4 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STR X8, [SP, #32] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
B 44cb5c <__nv_viscosity_kernel_module_viscosity_kernel__F1L50_1_+0x26c> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
LDR W20, [SP, #20] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
ORR X0, XZR, XZR | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ORR W1, WZR, W20 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
BL 404c90 <@plt_start@+0x450> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ORR X0, XZR, XZR | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ORR W1, WZR, W20 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
BL 404870 <@plt_start@+0x30> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
LDP X20, X19, [SP, #272] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDP X22, X21, [SP, #256] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDP X24, X23, [SP, #240] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDP X26, X25, [SP, #224] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDP X28, X27, [SP, #208] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDP X29, X30, [SP, #192] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
ADD SP, SP, #288 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
RET | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
HINT #0 |
Source file and lines | viscosity_kernel.f90-pp.f90:50-96 |
Module | exec |
nb instructions | 157 |
loop length | 628 |
nb stack references | 0 |
front end | 18.50 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | P12 | P13 | P14 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 4.00 | 4.00 | 20.75 | 20.75 | 20.75 | 20.75 | 1.00 | 1.00 | 0.50 | 0.50 | 19.00 | 19.00 | 19.00 | 11.50 | 11.50 |
cycles | 4.00 | 4.00 | 20.75 | 20.75 | 20.75 | 20.75 | 1.00 | 1.00 | 0.50 | 0.50 | 19.00 | 19.00 | 19.00 | 11.50 | 11.50 |
Cycles executing div or sqrt instructions | NA |
Front-end | 18.50 |
Overall L1 | 20.75 |
all | 0% |
load | 0% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | 0% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | P12 | P13 | P14 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
SUB SP, SP, #288 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STP X29, X30, [SP, #192] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STP X28, X27, [SP, #208] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STP X26, X25, [SP, #224] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STP X24, X23, [SP, #240] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STP X22, X21, [SP, #256] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STP X20, X19, [SP, #272] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
LDP X8, X9, [X2] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDR W20, [X0] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
ORR X0, XZR, XZR | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STR X2, [SP, #144] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
ADD X3, SP, #188 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X4, SP, #184 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X5, SP, #180 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X6, SP, #176 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOVZ W2, #34 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOVZ W7, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STR WZR, [SP, #188] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
LDR W19, [X9] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR W8, [X8] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
ORR W1, WZR, W20 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STP W19, W8, [SP, #180] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
MOVZ W8, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STR W8, [SP, #176] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STR W8, [SP] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
BL 404b70 <@plt_start@+0x330> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
LDRSW X21, [SP, #184] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
CMP W21, W19 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
B.GT 44cf94 <__nv_viscosity_kernel_module_viscosity_kernel__F1L50_1_+0x6a4> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
LDR W9, [SP, #180] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
SUBS W9, W9, W21 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
B.MI 44cf94 <__nv_viscosity_kernel_module_viscosity_kernel__F1L50_1_+0x6a4> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
LDR X8, [SP, #144] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDP X12, X10, [X8, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDR W11, [X10] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDRSW X3, [X12] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
SUBS W10, W11, W3 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
B.MI 44cf94 <__nv_viscosity_kernel_module_viscosity_kernel__F1L50_1_+0x6a4> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
LDR X8, [SP, #144] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
STR W20, [SP, #20] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
ADD W20, W9, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD W18, W10, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB W17, W11, W3 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X16, X21, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
FMOV D3, #0.5000000 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 2 | 0.25 |
DUP Z4.D, #0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 0.50 |
LDR X10, [X8, #56] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDP X14, X9, [X8, #128] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDR X19, [X8, #144] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDP X4, X23, [X8, #168] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
ADD X12, X8, #208 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LDR X11, [X8, #32] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR X0, [X8, #192] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR X5, [X8, #112] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
CMP W18, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
STR W18, [SP, #140] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
CSINC W18, W18, WZR, #11 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB W17, W17, W18 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ORR X25, XZR, X3 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
UBFM X15, X3, #61, #60 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
INDEX Z0.D, X3, #1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5 | 2 |
SUB X2, X21, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
PTRUE P0.D, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
ADRP X1, <4609ec> | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LDR D1, [X1, #1328] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
CNTD X13, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
DUP Z5.D, X13 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD W17, W17, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LDR X6, [X10] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR X7, [X14] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR X9, [X9] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDP X10, X14, [X8, #96] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
ADD X8, X19, #8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X18, X23, #8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB X1, X23, #8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STP X8, X19, [SP, #96] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
ADD X8, X14, #8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LDR X10, [X10] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
UBFM X3, X6, #61, #60 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
UBFM X9, X9, #61, #60 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MADD X2, X7, X2, XZR | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
STR X7, [SP, #128] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STP X8, X23, [SP, #48] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
LDR X8, [X4] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
MADD X4, X6, X21, XZR | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
SUB X24, X4, X10 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STR X8, [SP, #88] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
ADD X8, X11, #8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STR X8, [SP, #40] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
ADD X8, X17, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MADD X17, X6, X16, XZR | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
MADD X16, X7, X16, XZR | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
ADD X19, X15, X17,LSL #3 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STP X6, X8, [SP, #112] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
LDR X8, [X0] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
UBFM X6, X7, #61, #60 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
UBFM X0, X10, #61, #60 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STP X6, X3, [SP, #72] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
SUB X3, X17, X10 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X10, X16, X25 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB X6, X15, X9 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X15, X15, X4,LSL #3 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ORR X4, XZR, X25 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MADD X7, X7, X21, XZR | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
SUB X17, X19, X0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB X15, X15, X0 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X22, X5, X6 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STR X4, [SP, #64] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
SUB X10, X10, X8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB X29, X2, X8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB X30, X16, X8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STR X8, [SP, #24] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
MOVZ X16, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X26, X11, X17 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X28, X11, X15 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X11, X2, X25 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X25, X14, X17 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X27, X14, X15 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ORR X14, XZR, X4 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X19, X23, X10,LSL #3 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADRP X10, <460ad0> | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X10, X10, #1328 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LD1RD {Z2.D}, P0/Z, [X10] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 6 | 0.50 |
SUB X11, X11, X8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
UBFM X10, X7, #61, #60 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB X0, X10, X8,LSL #3 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X6, X23, X11,LSL #3 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ORR X23, XZR, X3 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB X3, X7, X8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB X8, X5, X9 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ORR X7, XZR, X4 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STR X8, [SP, #32] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
B 44cb5c <__nv_viscosity_kernel_module_viscosity_kernel__F1L50_1_+0x26c> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
LDR W20, [SP, #20] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
ORR X0, XZR, XZR | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ORR W1, WZR, W20 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
BL 404c90 <@plt_start@+0x450> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ORR X0, XZR, XZR | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ORR W1, WZR, W20 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
BL 404870 <@plt_start@+0x30> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
LDP X20, X19, [SP, #272] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDP X22, X21, [SP, #256] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDP X24, X23, [SP, #240] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDP X26, X25, [SP, #224] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDP X28, X27, [SP, #208] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDP X29, X30, [SP, #192] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
ADD SP, SP, #288 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
RET | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
HINT #0 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼__nv_viscosity_kernel_module_viscosity_kernel__F1L50_1_– | 13.32 | 3.02 |
▼Loop 1091 - viscosity_kernel.f90-pp.f90:53-93 - exec– | 0 | 0 |
▼Loop 1093 - viscosity_kernel.f90-pp.f90:53-93 - exec– | 0 | 0 |
○Loop 1092 - viscosity_kernel.f90-pp.f90:56-89 - exec | 13.32 | 3.02 |