Function: __nv_viscosity_kernel_module_viscosity_kernel__F1L50_1_ | Module: exec | Source: viscosity_kernel.f90-pp.f90:50-96 | Coverage: 11.51% |
---|
Function: __nv_viscosity_kernel_module_viscosity_kernel__F1L50_1_ | Module: exec | Source: viscosity_kernel.f90-pp.f90:50-96 | Coverage: 11.51% |
---|
/home/hbollore/qaas-runs/170-307-1706/intel/CloverLeafFC/build/armclang_5/CMakeFiles/clover_leaf.dir/CloverLeaf_ref/kernels/viscosity_kernel.f90-pp.f90: 50 - 96 |
-------------------------------------------------------------------------------- |
50: # 50 "/home/hbollore/qaas-runs/170-307-1706/intel/CloverLeafFC/build/CloverLeafFC/CloverLeaf_ref/kernels/viscosity_kernel.f90" |
51: !$OMP PARALLEL |
52: # 52 "/home/hbollore/qaas-runs/170-307-1706/intel/CloverLeafFC/build/CloverLeafFC/CloverLeaf_ref/kernels/viscosity_kernel.f90" |
53: !$OMP DO PRIVATE(ugrad,vgrad,div,strain2,pgradx,pgrady,pgradx2,pgrady2,limiter,pgrad,xgrad,ygrad,grad,grad2,dirx,diry) |
54: DO k=y_min,y_max |
55: !$OMP SIMD |
56: DO j=x_min,x_max |
57: ugrad=(xvel0(j+1,k )+xvel0(j+1,k+1))-(xvel0(j ,k )+xvel0(j ,k+1)) |
58: # 58 "/home/hbollore/qaas-runs/170-307-1706/intel/CloverLeafFC/build/CloverLeafFC/CloverLeaf_ref/kernels/viscosity_kernel.f90" |
59: vgrad=(yvel0(j ,k+1)+yvel0(j+1,k+1))-(yvel0(j ,k )+yvel0(j+1,k )) |
60: # 60 "/home/hbollore/qaas-runs/170-307-1706/intel/CloverLeafFC/build/CloverLeafFC/CloverLeaf_ref/kernels/viscosity_kernel.f90" |
61: div = (celldx(j)*(ugrad)+ celldy(k)*(vgrad)) |
62: # 62 "/home/hbollore/qaas-runs/170-307-1706/intel/CloverLeafFC/build/CloverLeafFC/CloverLeaf_ref/kernels/viscosity_kernel.f90" |
63: strain2 = 0.5_8*(xvel0(j, k+1) + xvel0(j+1,k+1)-xvel0(j ,k )-xvel0(j+1,k ))/celldy(k) & |
64: + 0.5_8*(yvel0(j+1,k ) + yvel0(j+1,k+1)-yvel0(j ,k )-yvel0(j ,k+1))/celldx(j) |
65: # 65 "/home/hbollore/qaas-runs/170-307-1706/intel/CloverLeafFC/build/CloverLeafFC/CloverLeaf_ref/kernels/viscosity_kernel.f90" |
66: pgradx=(pressure(j+1,k)-pressure(j-1,k))/(celldx(j)+celldx(j+1)) |
67: pgrady=(pressure(j,k+1)-pressure(j,k-1))/(celldy(k)+celldy(k+1)) |
68: # 68 "/home/hbollore/qaas-runs/170-307-1706/intel/CloverLeafFC/build/CloverLeafFC/CloverLeaf_ref/kernels/viscosity_kernel.f90" |
69: pgradx2 = pgradx*pgradx |
70: pgrady2 = pgrady*pgrady |
71: # 71 "/home/hbollore/qaas-runs/170-307-1706/intel/CloverLeafFC/build/CloverLeafFC/CloverLeaf_ref/kernels/viscosity_kernel.f90" |
72: limiter = ((0.5_8*(ugrad)/celldx(j))*pgradx2+(0.5_8*(vgrad)/celldy(k))*pgrady2+strain2*pgradx*pgrady) & |
73: /MAX(pgradx2+pgrady2,1.0e-16_8) |
74: # 74 "/home/hbollore/qaas-runs/170-307-1706/intel/CloverLeafFC/build/CloverLeafFC/CloverLeaf_ref/kernels/viscosity_kernel.f90" |
75: IF ((limiter.GT.0.0).OR.(div.GE.0.0))THEN |
76: viscosity(j,k) = 0.0 |
77: ELSE |
78: dirx=1.0_8 |
79: IF(pgradx.LT.0.0) dirx=-1.0_8 |
80: pgradx = dirx*MAX(1.0e-16_8,ABS(pgradx)) |
81: diry=1.0_8 |
82: IF(pgradx.LT.0.0) diry=-1.0_8 |
83: pgrady = diry*MAX(1.0e-16_8,ABS(pgrady)) |
84: pgrad = SQRT(pgradx**2+pgrady**2) |
85: xgrad = ABS(celldx(j)*pgrad/pgradx) |
86: ygrad = ABS(celldy(k)*pgrad/pgrady) |
87: grad = MIN(xgrad,ygrad) |
88: grad2 = grad*grad |
89: # 89 "/home/hbollore/qaas-runs/170-307-1706/intel/CloverLeafFC/build/CloverLeafFC/CloverLeaf_ref/kernels/viscosity_kernel.f90" |
90: viscosity(j,k)=2.0_8*density0(j,k)*grad2*limiter*limiter |
91: ENDIF |
92: # 92 "/home/hbollore/qaas-runs/170-307-1706/intel/CloverLeafFC/build/CloverLeafFC/CloverLeaf_ref/kernels/viscosity_kernel.f90" |
93: ENDDO |
94: ENDDO |
95: !$OMP END DO |
96: # 96 "/home/hbollore/qaas-runs/170-307-1706/intel/CloverLeafFC/build/CloverLeafFC/CloverLeaf_ref/kernels/viscosity_kernel.f90" |
0x44cb90 SUB SP, SP, #320 |
0x44cb94 STR D10, [SP, #192] |
0x44cb98 STP D9, D8, [SP, #208] |
0x44cb9c STP X29, X30, [SP, #224] |
0x44cba0 STP X28, X27, [SP, #240] |
0x44cba4 STP X26, X25, [SP, #256] |
0x44cba8 STP X24, X23, [SP, #272] |
0x44cbac STP X22, X21, [SP, #288] |
0x44cbb0 STP X20, X19, [SP, #304] |
0x44cbb4 LDP X8, X9, [X2] |
0x44cbb8 LDR W20, [X0] |
0x44cbbc ORR X0, XZR, XZR |
0x44cbc0 STR X2, [SP, #152] |
0x44cbc4 ADD X3, SP, #204 |
0x44cbc8 ADD X4, SP, #200 |
0x44cbcc ADD X5, SP, #188 |
0x44cbd0 ADD X6, SP, #184 |
0x44cbd4 MOVZ W2, #34 |
0x44cbd8 MOVZ W7, #1 |
0x44cbdc STR WZR, [SP, #204] |
0x44cbe0 LDR W8, [X8] |
0x44cbe4 LDR W19, [X9] |
0x44cbe8 ORR W1, WZR, W20 |
0x44cbec STR W8, [SP, #200] |
0x44cbf0 MOVZ W8, #1 |
0x44cbf4 STP W8, W19, [SP, #184] |
0x44cbf8 STR W8, [SP] |
0x44cbfc BL 404ae0 |
0x44cc00 LDRSW X21, [SP, #200] |
0x44cc04 CMP W21, W19 |
0x44cc08 B.GT 44d1e8 |
0x44cc0c LDR W9, [SP, #188] |
0x44cc10 SUBS W9, W9, W21 |
0x44cc14 B.MI 44d1e8 |
0x44cc18 LDR X8, [SP, #152] |
0x44cc1c LDP X11, X10, [X8, #16] |
0x44cc20 LDR W13, [X10] |
0x44cc24 LDRSW X7, [X11] |
0x44cc28 SUBS W10, W13, W7 |
0x44cc2c B.MI 44d1e8 |
0x44cc30 LDR X8, [SP, #152] |
0x44cc34 ADD W18, W10, #1 |
0x44cc38 STR W20, [SP, #28] |
0x44cc3c ADD W20, W9, #1 |
0x44cc40 SUB W16, W13, W7 |
0x44cc44 UBFM X14, X7, #61, #60 |
0x44cc48 STR X7, [SP, #72] |
0x44cc4c FMOV D3, #1.0000000 |
0x44cc50 CMP W18, #1 |
0x44cc54 STR W18, [SP, #148] |
0x44cc58 INDEX Z0.D, X7, #1 |
0x44cc5c ADRP X1, |
0x44cc60 ADD X15, X21, #1 |
0x44cc64 LDR D1, [X1, #1584] |
0x44cc68 CSINC W18, W18, WZR, #11 |
0x44cc6c SUB X0, X21, #1 |
0x44cc70 PTRUE P0.D, ALL |
0x44cc74 FMOV D4, #0.5000000 |
0x44cc78 DUP Z5.D, #0 |
0x44cc7c LDP X11, X10, [X8, #128] |
0x44cc80 LDR X9, [X8, #56] |
0x44cc84 LDR X17, [X8, #192] |
0x44cc88 ADD X12, X8, #208 |
0x44cc8c LDR X2, [X8, #144] |
0x44cc90 LDR X4, [X8, #32] |
0x44cc94 SUB W16, W16, W18 |
0x44cc98 CNTD X13, ALL |
0x44cc9c DUP Z6.D, X13 |
0x44cca0 ADD W16, W16, #1 |
0x44cca4 ADD X16, X16, #1 |
0x44cca8 LDR X10, [X10] |
0x44ccac LDR X5, [X9] |
0x44ccb0 LDR X19, [X11] |
0x44ccb4 LDP X9, X11, [X8, #96] |
0x44ccb8 LDR X23, [X17] |
0x44ccbc LDP X17, X6, [X8, #168] |
0x44ccc0 LDR X8, [X8, #112] |
0x44ccc4 ADD X1, X4, #8 |
0x44ccc8 STR X2, [SP, #112] |
0x44cccc ADD X2, X2, #8 |
0x44ccd0 STR X1, [SP, #48] |
0x44ccd4 STR X2, [SP, #104] |
0x44ccd8 UBFM X10, X10, #61, #60 |
0x44ccdc ADD X22, X11, #8 |
0x44cce0 LDR X9, [X9] |
0x44cce4 LDR X17, [X17] |
0x44cce8 STP X5, X16, [SP, #120] |
0x44ccec MADD X16, X5, X15, XZR |
0x44ccf0 MADD X1, X5, X21, XZR |
0x44ccf4 MADD X15, X19, X15, XZR |
0x44ccf8 UBFM X3, X5, #61, #60 |
0x44ccfc UBFM X5, X19, #61, #60 |
0x44cd00 MADD X0, X19, X0, XZR |
0x44cd04 STR X19, [SP, #136] |
0x44cd08 STR X23, [SP, #32] |
0x44cd0c ADD X18, X6, #8 |
0x44cd10 SUB X2, X6, #8 |
0x44cd14 STP X22, X6, [SP, #56] |
0x44cd18 SUB X7, X14, X10 |
0x44cd1c STP X5, X3, [SP, #80] |
0x44cd20 MADD X5, X19, X21, XZR |
0x44cd24 ADD X19, X14, X16,LSL #3 |
0x44cd28 ADD X14, X14, X1,LSL #3 |
0x44cd2c SUB X29, X0, X23 |
0x44cd30 SUB X30, X15, X23 |
0x44cd34 ADD X22, X8, X7 |
0x44cd38 LDR X7, [SP, #72] |
0x44cd3c SUB X8, X8, X10 |
0x44cd40 STR X17, [SP, #96] |
0x44cd44 UBFM X17, X9, #61, #60 |
0x44cd48 SUB X3, X16, X9 |
0x44cd4c SUB X24, X1, X9 |
0x44cd50 SUB X16, X19, X17 |
0x44cd54 SUB X14, X14, X17 |
0x44cd58 STR X8, [SP, #40] |
0x44cd5c ADD X9, X15, X7 |
0x44cd60 ADD X25, X11, X16 |
0x44cd64 ADD X27, X11, X14 |
0x44cd68 ADD X11, X0, X7 |
0x44cd6c ADD X26, X4, X16 |
0x44cd70 ADD X28, X4, X14 |
0x44cd74 MOVZ X0, #1 |
0x44cd78 SUB X9, X9, X23 |
0x44cd7c SUB X11, X11, X23 |
0x44cd80 ADD X19, X6, X9,LSL #3 |
0x44cd84 ADRP X9, |
0x44cd88 ADD X9, X9, #1584 |
0x44cd8c ADD X16, X6, X11,LSL #3 |
0x44cd90 LD1RD {Z2.D}, P0/Z, [X9] |
0x44cd94 UBFM X9, X5, #61, #60 |
0x44cd98 SUB X5, X5, X23 |
0x44cd9c SUB X1, X9, X23,LSL #3 |
0x44cda0 ORR X23, XZR, X3 |
0x44cda4 B 44ce00 |
(1095) 0x44cda8 LDR X21, [SP, #176] |
(1095) 0x44cdac LDR X7, [SP, #72] |
(1095) 0x44cdb0 LDR W20, [SP, #172] |
(1095) 0x44cdb4 LDR X23, [SP, #160] |
(1095) 0x44cdb8 LDP X10, X8, [SP, #80] |
(1095) 0x44cdbc LDR X9, [SP, #136] |
(1095) 0x44cdc0 ADD X21, X21, #1 |
(1095) 0x44cdc4 SUBS W20, W20, #1 |
(1095) 0x44cdc8 ADD X25, X25, X8 |
(1095) 0x44cdcc ADD X26, X26, X8 |
(1095) 0x44cdd0 ADD X27, X27, X8 |
(1095) 0x44cdd4 ADD X28, X28, X8 |
(1095) 0x44cdd8 LDR X8, [SP, #120] |
(1095) 0x44cddc ADD X19, X19, X10 |
(1095) 0x44cde0 ADD X16, X16, X10 |
(1095) 0x44cde4 ADD X29, X29, X9 |
(1095) 0x44cde8 ADD X30, X30, X9 |
(1095) 0x44cdec ADD X1, X1, X10 |
(1095) 0x44cdf0 ADD X5, X5, X9 |
(1095) 0x44cdf4 ADD X23, X23, X8 |
(1095) 0x44cdf8 ADD X24, X24, X8 |
(1095) 0x44cdfc B.LE 44d1e4 |
(1095) 0x44ce00 LDR X8, [SP, #96] |
(1095) 0x44ce04 LDR W14, [SP, #148] |
(1095) 0x44ce08 SUB X9, X21, X8 |
(1095) 0x44ce0c LDR X8, [SP, #112] |
(1095) 0x44ce10 LDR D7, [X8, X9,LSL #3] |
(1095) 0x44ce14 LDR X8, [SP, #104] |
(1095) 0x44ce18 LDR D16, [X8, X9,LSL #3] |
(1095) 0x44ce1c LDR X8, [SP, #128] |
(1095) 0x44ce20 ORR X9, XZR, X7 |
(1095) 0x44ce24 CMP X8, X13 |
(1095) 0x44ce28 FADD D17, D16, D7 |
(1095) 0x44ce2c FDIV D16, D3, D7 |
(1095) 0x44ce30 B.CC 44d004 |
(1095) 0x44ce34 LDP X11, X8, [SP, #128] |
(1095) 0x44ce38 FDIV D21, D3, D17 |
(1095) 0x44ce3c ORR X10, XZR, XZR |
(1095) 0x44ce40 DUP Z18.D, Z7.D[0] |
(1095) 0x44ce44 DUP Z19.D, Z16.D[0] |
(1095) 0x44ce48 UDIV X9, X11, X13 |
(1095) 0x44ce4c MADD X17, X8, X21, XZR |
(1095) 0x44ce50 LDR W8, [SP, #148] |
(1095) 0x44ce54 ORR Z22.D, Z0.D, Z0.D |
(1095) 0x44ce58 DUP Z21.D, Z21.D[0] |
(1095) 0x44ce5c MADD X15, X9, X13, XZR |
(1095) 0x44ce60 SUB W14, W8, W15 |
(1095) 0x44ce64 LDR X8, [SP, #32] |
(1095) 0x44ce68 SUB X11, X11, X15 |
(1095) 0x44ce6c ADD X9, X15, X7 |
(1095) 0x44ce70 SUB X17, X17, X8 |
(1095) 0x44ce74 LDR X8, [SP, #152] |
(1095) 0x44ce78 DUP Z20.D, X17 |
(1095) 0x44ce7c LDR X17, [X8, #200] |
(1097) 0x44ce80 UBFM X3, X10, #61, #60 |
(1097) 0x44ce84 ADD X4, X26, X3 |
(1097) 0x44ce88 ADD X6, X28, X3 |
(1097) 0x44ce8c LD1D {Z23.D}, P0/Z, [X4, X0,LSL #3] |
(1097) 0x44ce90 LD1D {Z24.D}, P0/Z, [X6, X0,LSL #3] |
(1097) 0x44ce94 LD1D {Z25.D}, P0/Z, [X4, MUL VL] |
(1097) 0x44ce98 LD1D {Z26.D}, P0/Z, [X6, MUL VL] |
(1097) 0x44ce9c ADD X4, X25, X3 |
(1097) 0x44cea0 LD1D {Z29.D}, P0/Z, [X4, X0,LSL #3] |
(1097) 0x44cea4 LD1D {Z30.D}, P0/Z, [X4, MUL VL] |
(1097) 0x44cea8 ADD X4, X27, X3 |
(1097) 0x44ceac ADD X3, X22, X3 |
(1097) 0x44ceb0 FADD Z28.D, Z25.D, Z26.D |
(1097) 0x44ceb4 FADD Z27.D, Z24.D, Z23.D |
(1097) 0x44ceb8 FADD Z23.D, Z23.D, Z25.D |
(1097) 0x44cebc FADD Z24.D, Z24.D, Z26.D |
(1097) 0x44cec0 FSUB Z23.D, Z23.D, Z24.D |
(1097) 0x44cec4 ADD Z24.D, Z20.D, Z22.D |
(1097) 0x44cec8 FSUB Z27.D, Z27.D, Z28.D |
(1097) 0x44cecc LD1D {Z28.D}, P0/Z, [X4, X0,LSL #3] |
(1097) 0x44ced0 LD1D {Z31.D}, P0/Z, [X4, MUL VL] |
(1097) 0x44ced4 LD1D {Z10.D}, P0/Z, [X3, MUL VL] |
(1097) 0x44ced8 FADD Z8.D, Z30.D, Z29.D |
(1097) 0x44cedc ADD Z22.D, Z22.D, Z6.D |
(1097) 0x44cee0 FMOV X4, D24 |
(1097) 0x44cee4 FMUL Z23.D, P0/M, Z23.D, #0 |
(1097) 0x44cee8 LD1D {Z25.D}, P0/Z, [X18, X4,LSL #3] |
(1097) 0x44ceec LD1D {Z26.D}, P0/Z, [X2, X4,LSL #3] |
(1097) 0x44cef0 FADD Z9.D, Z28.D, Z31.D |
(1097) 0x44cef4 FADD Z28.D, Z29.D, Z28.D |
(1097) 0x44cef8 FADD Z29.D, Z30.D, Z31.D |
(1097) 0x44cefc FSUB Z28.D, Z28.D, Z29.D |
(1097) 0x44cf00 FSUB Z30.D, Z8.D, Z9.D |
(1097) 0x44cf04 MOVPRFX Z8, Z27 |
(1097) 0x44cf08 FMUL Z8.D, P0/M, Z8.D, #0 |
(1097) 0x44cf0c FMUL Z28.D, P0/M, Z28.D, #0 |
(1097) 0x44cf10 FSUB Z25.D, Z25.D, Z26.D |
(1097) 0x44cf14 LD1D {Z26.D}, P0/Z, [X3, X0,LSL #3] |
(1097) 0x44cf18 FDIV Z28.D, P0/M, Z28.D, Z10.D |
(1097) 0x44cf1c FADD Z26.D, Z26.D, Z10.D |
(1097) 0x44cf20 FDIV Z25.D, P0/M, Z25.D, Z26.D |
(1097) 0x44cf24 LD1D {Z26.D}, P0/Z, [X19, X10,LSL #3] |
(1097) 0x44cf28 FMAD Z23.D, P0/M, Z19.D, Z28.D |
(1097) 0x44cf2c LD1D {Z28.D}, P0/Z, [X16, X10,LSL #3] |
(1097) 0x44cf30 ADD X10, X10, X13 |
(1097) 0x44cf34 CMP X15, X10 |
(1097) 0x44cf38 FMUL Z29.D, Z25.D, Z25.D |
(1097) 0x44cf3c FSUB Z26.D, Z26.D, Z28.D |
(1097) 0x44cf40 FMUL Z23.D, Z25.D, Z23.D |
(1097) 0x44cf44 FMUL Z28.D, Z18.D, Z30.D |
(1097) 0x44cf48 FMUL Z30.D, P0/M, Z30.D, #0 |
(1097) 0x44cf4c FCMGE P2.D, P0/Z, Z25.D, #0 |
(1097) 0x44cf50 FABS Z25.D, P0/M, Z25.D |
(1097) 0x44cf54 FMUL Z26.D, Z26.D, Z21.D |
(1097) 0x44cf58 FMAXNM Z25.D, P0/M, Z25.D, Z2.D |
(1097) 0x44cf5c FMUL Z8.D, Z8.D, Z29.D |
(1097) 0x44cf60 FMAD Z27.D, P0/M, Z10.D, Z28.D |
(1097) 0x44cf64 FMUL Z31.D, Z26.D, Z26.D |
(1097) 0x44cf68 FDIV Z8.D, P0/M, Z8.D, Z10.D |
(1097) 0x44cf6c FMUL Z30.D, Z30.D, Z31.D |
(1097) 0x44cf70 FADD Z28.D, Z31.D, Z29.D |
(1097) 0x44cf74 FMAXNM Z28.D, P0/M, Z28.D, Z2.D |
(1097) 0x44cf78 FMAD Z23.D, P0/M, Z26.D, Z8.D |
(1097) 0x44cf7c FABS Z26.D, P0/M, Z26.D |
(1097) 0x44cf80 FMAXNM Z26.D, P0/M, Z26.D, Z2.D |
(1097) 0x44cf84 FMLA Z23.D, P0/M, Z30.D, Z19.D |
(1097) 0x44cf88 FDIV Z23.D, P0/M, Z23.D, Z28.D |
(1097) 0x44cf8c FCMLE P1.D, P0/Z, Z23.D, #0 |
(1097) 0x44cf90 FCMLT P1.D, P1/Z, Z27.D, #0 |
(1097) 0x44cf94 MOVPRFX Z27, Z25 |
(1097) 0x44cf98 FNEG Z27.D, P0/M, Z25.D |
(1097) 0x44cf9c SEL Z25.D, P2, Z25.D, Z27.D |
(1097) 0x44cfa0 MOVPRFX Z27, Z26 |
(1097) 0x44cfa4 FNEG Z27.D, P0/M, Z26.D |
(1097) 0x44cfa8 FCMGE P2.D, P0/Z, Z25.D, #0 |
(1097) 0x44cfac SEL Z26.D, P2, Z26.D, Z27.D |
(1097) 0x44cfb0 FMUL Z27.D, Z25.D, Z25.D |
(1097) 0x44cfb4 FMLA Z27.D, P0/M, Z26.D, Z26.D |
(1097) 0x44cfb8 FSQRT Z27.D, P0/M, Z27.D |
(1097) 0x44cfbc FMUL Z28.D, Z27.D, Z10.D |
(1097) 0x44cfc0 FMUL Z27.D, Z27.D, Z18.D |
(1097) 0x44cfc4 FDIVR Z25.D, P0/M, Z25.D, Z28.D |
(1097) 0x44cfc8 FDIVR Z26.D, P0/M, Z26.D, Z27.D |
(1097) 0x44cfcc FABS Z25.D, P0/M, Z25.D |
(1097) 0x44cfd0 FABS Z26.D, P0/M, Z26.D |
(1097) 0x44cfd4 FMINNM Z25.D, P0/M, Z25.D, Z26.D |
(1097) 0x44cfd8 LD1D {Z26.D}, P1/Z, [X12, Z5.D,LSL #3] |
(1097) 0x44cfdc FMUL Z23.D, Z25.D, Z23.D |
(1097) 0x44cfe0 ADR Z26.D, [Z26, Z24.D,LSL #3] |
(1097) 0x44cfe4 FMUL Z23.D, Z23.D, Z23.D |
(1097) 0x44cfe8 LD1D {Z26.D}, P1/Z, [V26.D] |
(1097) 0x44cfec FADD Z25.D, Z26.D, Z26.D |
(1097) 0x44cff0 FMUL Z23.D, Z23.D, Z25.D |
(1097) 0x44cff4 SEL Z23.D, P1, Z23.D, Z5.D |
(1097) 0x44cff8 ST1D {Z23.D}, P0, [X17, Z24.D,LSL #3] |
(1097) 0x44cffc B.NE 44ce80 |
(1095) 0x44d000 CBZ X11, 44cdb8 |
(1095) 0x44d004 LDR X8, [SP, #152] |
(1095) 0x44d008 STR X21, [SP, #176] |
(1095) 0x44d00c ADD X10, X9, X29 |
(1095) 0x44d010 FDIV D17, D3, D17 |
(1095) 0x44d014 STR X23, [SP, #160] |
(1095) 0x44d018 ADD X15, X9, X24 |
(1095) 0x44d01c STR W20, [SP, #172] |
(1095) 0x44d020 ORR X11, XZR, XZR |
(1095) 0x44d024 ADD W20, W14, #1 |
(1095) 0x44d028 UBFM X15, X15, #61, #60 |
(1095) 0x44d02c LDR X7, [X8, #200] |
(1095) 0x44d030 LDP X21, X8, [SP, #56] |
(1095) 0x44d034 ADD X3, X8, X10,LSL #3 |
(1095) 0x44d038 ADD X10, X9, X23 |
(1095) 0x44d03c LDR X23, [SP, #48] |
(1095) 0x44d040 UBFM X10, X10, #61, #60 |
(1095) 0x44d044 ADD X4, X21, X10 |
(1095) 0x44d048 ADD X21, X21, X15 |
(1095) 0x44d04c ADD X17, X23, X10 |
(1095) 0x44d050 ADD X10, X9, X30 |
(1095) 0x44d054 ADD X15, X23, X15 |
(1095) 0x44d058 ADD X6, X8, X10,LSL #3 |
(1095) 0x44d05c UBFM X10, X9, #61, #60 |
(1095) 0x44d060 ADD X9, X9, X5 |
(1095) 0x44d064 ADD X14, X1, X10 |
(1095) 0x44d068 UBFM X8, X9, #61, #60 |
(1095) 0x44d06c ADD X9, X7, X8 |
(1095) 0x44d070 ADD X7, X2, X8 |
(1095) 0x44d074 LDR X8, [SP, #40] |
(1095) 0x44d078 ADD X10, X8, X10 |
(1095) 0x44d07c B 44d094 |
(1096) 0x44d080 SUB W20, W20, #1 |
(1096) 0x44d084 STR D24, [X9, X11] |
(1096) 0x44d088 ADD X11, X11, #8 |
(1096) 0x44d08c CMP W20, #1 |
(1096) 0x44d090 B.LE 44cda8 |
(1096) 0x44d094 ADD X8, X17, X11 |
(1096) 0x44d098 ADD X23, X15, X11 |
(1096) 0x44d09c LDP D23, D21, [X8, #1016] |
(1096) 0x44d0a0 LDP D24, D22, [X23, #1016] |
(1096) 0x44d0a4 ADD X8, X4, X11 |
(1096) 0x44d0a8 FADD D18, D22, D21 |
(1096) 0x44d0ac FADD D19, D23, D24 |
(1096) 0x44d0b0 FADD D21, D21, D23 |
(1096) 0x44d0b4 FADD D22, D22, D24 |
(1096) 0x44d0b8 LDR D24, [X3, X11] |
(1096) 0x44d0bc FSUB D19, D18, S19 |
(1096) 0x44d0c0 LDP D25, D18, [X8, #1016] |
(1096) 0x44d0c4 ADD X8, X21, X11 |
(1096) 0x44d0c8 FSUB D21, D21, S22 |
(1096) 0x44d0cc LDP D27, D26, [X8, #1016] |
(1096) 0x44d0d0 ADD X8, X10, X11 |
(1096) 0x44d0d4 FMUL D21, D21, D4 |
(1096) 0x44d0d8 FADD D20, D25, D18 |
(1096) 0x44d0dc FADD D18, D18, D26 |
(1096) 0x44d0e0 FADD D25, D25, D27 |
(1096) 0x44d0e4 FADD D28, D26, D27 |
(1096) 0x44d0e8 FMUL D27, D19, D4 |
(1096) 0x44d0ec FSUB D18, D18, S25 |
(1096) 0x44d0f0 FSUB D20, D20, S28 |
(1096) 0x44d0f4 FMUL D25, D18, D4 |
(1096) 0x44d0f8 LDP D18, D26, [X8] |
(1096) 0x44d0fc ADD X8, X7, X11 |
(1096) 0x44d100 LDR D22, [X8, #16] |
(1096) 0x44d104 LDR D23, [X8] |
(1096) 0x44d108 FDIV D25, D25, D18 |
(1096) 0x44d10c FSUB D22, D22, S23 |
(1096) 0x44d110 FADD D23, D26, D18 |
(1096) 0x44d114 FMUL D26, D20, D4 |
(1096) 0x44d118 FDIV D22, D22, D23 |
(1096) 0x44d11c LDR D23, [X6, X11] |
(1096) 0x44d120 FSUB D23, D23, S24 |
(1096) 0x44d124 FMUL D23, D23, D17 |
(1096) 0x44d128 FMADD D21, D21, D16, D25 |
(1096) 0x44d12c FMUL D25, D23, D23 |
(1096) 0x44d130 FMUL D26, D26, D25 |
(1096) 0x44d134 FMUL D24, D22, D22 |
(1096) 0x44d138 FMUL D28, D22, D23 |
(1096) 0x44d13c FMUL D27, D27, D24 |
(1096) 0x44d140 FADD D24, D25, D24 |
(1096) 0x44d144 FMAXNM D24, D24, D1 |
(1096) 0x44d148 FDIV D27, D27, D18 |
(1096) 0x44d14c FMADD D21, D28, D21, D27 |
(1096) 0x44d150 FMADD D21, D26, D16, D21 |
(1096) 0x44d154 FDIV D21, D21, D24 |
(1096) 0x44d158 MOVI D24, #0 |
(1096) 0x44d15c FCMP D21, #0 |
(1096) 0x44d160 B.GT 44d080 |
(1096) 0x44d164 FMUL D20, D7, D20 |
(1096) 0x44d168 FMADD D19, D18, D19, D20 |
(1096) 0x44d16c FCMP D19, #0 |
(1096) 0x44d170 B.GE 44d080 |
(1096) 0x44d174 FABS D19, D22 |
(1096) 0x44d178 FCMP D22, #0 |
(1096) 0x44d17c LDR X8, [X12] |
(1096) 0x44d180 ADD X8, X8, X14 |
(1096) 0x44d184 FMAXNM D19, D19, D1 |
(1096) 0x44d188 FNEG D20, D19 |
(1096) 0x44d18c FCSEL D19, D19, D20, #10 |
(1096) 0x44d190 FABS D20, D23 |
(1096) 0x44d194 FMAXNM D20, D20, D1 |
(1096) 0x44d198 FCMP D19, #0 |
(1096) 0x44d19c FNEG D22, D20 |
(1096) 0x44d1a0 FCSEL D20, D20, D22, #10 |
(1096) 0x44d1a4 FMUL D22, D19, D19 |
(1096) 0x44d1a8 FMADD D22, D20, D20, D22 |
(1096) 0x44d1ac FSQRT D22, D22 |
(1096) 0x44d1b0 FMUL D18, D22, D18 |
(1096) 0x44d1b4 FDIV D18, D18, D19 |
(1096) 0x44d1b8 FMUL D19, D22, D7 |
(1096) 0x44d1bc FDIV D19, D19, D20 |
(1096) 0x44d1c0 FABS D18, D18 |
(1096) 0x44d1c4 FABS D19, D19 |
(1096) 0x44d1c8 FMINNM D18, D18, D19 |
(1096) 0x44d1cc LDR D19, [X8, X11] |
(1096) 0x44d1d0 FMUL D18, D18, D21 |
(1096) 0x44d1d4 FMUL D18, D18, D18 |
(1096) 0x44d1d8 FADD D19, D19, D19 |
(1096) 0x44d1dc FMUL D24, D18, D19 |
(1096) 0x44d1e0 B 44d080 |
0x44d1e4 LDR W20, [SP, #28] |
0x44d1e8 ORR X0, XZR, XZR |
0x44d1ec ORR W1, WZR, W20 |
0x44d1f0 BL 404bf0 |
0x44d1f4 ORR X0, XZR, XZR |
0x44d1f8 ORR W1, WZR, W20 |
0x44d1fc BL 4047f0 |
0x44d200 LDP D9, D8, [SP, #208] |
0x44d204 LDR D10, [SP, #192] |
0x44d208 LDP X20, X19, [SP, #304] |
0x44d20c LDP X22, X21, [SP, #288] |
0x44d210 LDP X24, X23, [SP, #272] |
0x44d214 LDP X26, X25, [SP, #256] |
0x44d218 LDP X28, X27, [SP, #240] |
0x44d21c LDP X29, X30, [SP, #224] |
0x44d220 ADD SP, SP, #320 |
0x44d224 RET |
0x44d228 HINT #0 |
0x44d22c HINT #0 |
0x44d230 HINT #0 |
0x44d234 HINT #0 |
0x44d238 HINT #0 |
0x44d23c HINT #0 |
Path / |
Source file and lines | viscosity_kernel.f90-pp.f90:50-96 |
Module | exec |
nb instructions | 157 |
loop length | 628 |
nb stack references | 0 |
front end | 18.88 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | P12 | P13 | P14 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 4.00 | 4.00 | 19.75 | 19.75 | 19.75 | 19.75 | 2.00 | 2.00 | 1.00 | 1.00 | 21.17 | 20.83 | 21.00 | 12.00 | 12.00 |
cycles | 4.00 | 4.00 | 19.75 | 19.75 | 19.75 | 19.75 | 2.00 | 2.00 | 1.00 | 1.00 | 21.17 | 20.83 | 21.00 | 12.00 | 12.00 |
Cycles executing div or sqrt instructions | NA |
Front-end | 18.88 |
Overall L1 | 21.17 |
all | 4% |
load | 25% |
store | 50% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | 0% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | P12 | P13 | P14 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
SUB SP, SP, #320 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STR D10, [SP, #192] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
STP D9, D8, [SP, #208] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
STP X29, X30, [SP, #224] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STP X28, X27, [SP, #240] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STP X26, X25, [SP, #256] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STP X24, X23, [SP, #272] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STP X22, X21, [SP, #288] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STP X20, X19, [SP, #304] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
LDP X8, X9, [X2] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDR W20, [X0] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
ORR X0, XZR, XZR | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STR X2, [SP, #152] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
ADD X3, SP, #204 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X4, SP, #200 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X5, SP, #188 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X6, SP, #184 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOVZ W2, #34 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOVZ W7, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STR WZR, [SP, #204] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
LDR W8, [X8] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR W19, [X9] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
ORR W1, WZR, W20 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STR W8, [SP, #200] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
MOVZ W8, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STP W8, W19, [SP, #184] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STR W8, [SP] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
BL 404ae0 <@plt_start@+0x320> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
LDRSW X21, [SP, #200] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
CMP W21, W19 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
B.GT 44d1e8 <__nv_viscosity_kernel_module_viscosity_kernel__F1L50_1_+0x658> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
LDR W9, [SP, #188] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
SUBS W9, W9, W21 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
B.MI 44d1e8 <__nv_viscosity_kernel_module_viscosity_kernel__F1L50_1_+0x658> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
LDR X8, [SP, #152] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDP X11, X10, [X8, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDR W13, [X10] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDRSW X7, [X11] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
SUBS W10, W13, W7 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
B.MI 44d1e8 <__nv_viscosity_kernel_module_viscosity_kernel__F1L50_1_+0x658> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
LDR X8, [SP, #152] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
ADD W18, W10, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STR W20, [SP, #28] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
ADD W20, W9, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB W16, W13, W7 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
UBFM X14, X7, #61, #60 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STR X7, [SP, #72] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
FMOV D3, #1.0000000 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 2 | 0.25 |
CMP W18, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
STR W18, [SP, #148] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
INDEX Z0.D, X7, #1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5 | 2 |
ADRP X1, <460c5c> | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X15, X21, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LDR D1, [X1, #1584] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
CSINC W18, W18, WZR, #11 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB X0, X21, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
PTRUE P0.D, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
FMOV D4, #0.5000000 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 2 | 0.25 |
DUP Z5.D, #0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 0.50 |
LDP X11, X10, [X8, #128] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDR X9, [X8, #56] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR X17, [X8, #192] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
ADD X12, X8, #208 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LDR X2, [X8, #144] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR X4, [X8, #32] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
SUB W16, W16, W18 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CNTD X13, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
DUP Z6.D, X13 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD W16, W16, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X16, X16, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LDR X10, [X10] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR X5, [X9] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR X19, [X11] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDP X9, X11, [X8, #96] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDR X23, [X17] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDP X17, X6, [X8, #168] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDR X8, [X8, #112] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
ADD X1, X4, #8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STR X2, [SP, #112] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
ADD X2, X2, #8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STR X1, [SP, #48] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STR X2, [SP, #104] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
UBFM X10, X10, #61, #60 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X22, X11, #8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LDR X9, [X9] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR X17, [X17] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
STP X5, X16, [SP, #120] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
MADD X16, X5, X15, XZR | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
MADD X1, X5, X21, XZR | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
MADD X15, X19, X15, XZR | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
UBFM X3, X5, #61, #60 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
UBFM X5, X19, #61, #60 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MADD X0, X19, X0, XZR | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
STR X19, [SP, #136] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STR X23, [SP, #32] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
ADD X18, X6, #8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB X2, X6, #8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STP X22, X6, [SP, #56] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
SUB X7, X14, X10 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STP X5, X3, [SP, #80] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
MADD X5, X19, X21, XZR | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
ADD X19, X14, X16,LSL #3 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X14, X14, X1,LSL #3 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB X29, X0, X23 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB X30, X15, X23 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X22, X8, X7 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LDR X7, [SP, #72] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
SUB X8, X8, X10 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STR X17, [SP, #96] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
UBFM X17, X9, #61, #60 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB X3, X16, X9 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB X24, X1, X9 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB X16, X19, X17 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB X14, X14, X17 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STR X8, [SP, #40] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
ADD X9, X15, X7 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X25, X11, X16 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X27, X11, X14 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X11, X0, X7 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X26, X4, X16 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X28, X4, X14 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOVZ X0, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB X9, X9, X23 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB X11, X11, X23 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X19, X6, X9,LSL #3 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADRP X9, <460d84> | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X9, X9, #1584 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X16, X6, X11,LSL #3 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LD1RD {Z2.D}, P0/Z, [X9] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 6 | 0.50 |
UBFM X9, X5, #61, #60 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB X5, X5, X23 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB X1, X9, X23,LSL #3 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ORR X23, XZR, X3 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
B 44ce00 <__nv_viscosity_kernel_module_viscosity_kernel__F1L50_1_+0x270> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
LDR W20, [SP, #28] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
ORR X0, XZR, XZR | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ORR W1, WZR, W20 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
BL 404bf0 <@plt_start@+0x430> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ORR X0, XZR, XZR | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ORR W1, WZR, W20 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
BL 4047f0 <@plt_start@+0x30> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
LDP D9, D8, [SP, #208] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
LDR D10, [SP, #192] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
LDP X20, X19, [SP, #304] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDP X22, X21, [SP, #288] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDP X24, X23, [SP, #272] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDP X26, X25, [SP, #256] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDP X28, X27, [SP, #240] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDP X29, X30, [SP, #224] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
ADD SP, SP, #320 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
RET | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
HINT #0 |
Source file and lines | viscosity_kernel.f90-pp.f90:50-96 |
Module | exec |
nb instructions | 157 |
loop length | 628 |
nb stack references | 0 |
front end | 18.88 cycles |
| | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | P12 | P13 | P14 |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 4.00 | 4.00 | 19.75 | 19.75 | 19.75 | 19.75 | 2.00 | 2.00 | 1.00 | 1.00 | 21.17 | 20.83 | 21.00 | 12.00 | 12.00 |
cycles | 4.00 | 4.00 | 19.75 | 19.75 | 19.75 | 19.75 | 2.00 | 2.00 | 1.00 | 1.00 | 21.17 | 20.83 | 21.00 | 12.00 | 12.00 |
Cycles executing div or sqrt instructions | NA |
Front-end | 18.88 |
Overall L1 | 21.17 |
all | 4% |
load | 25% |
store | 50% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | 0% |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | P12 | P13 | P14 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
SUB SP, SP, #320 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STR D10, [SP, #192] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
STP D9, D8, [SP, #208] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 2 | 0.50 |
STP X29, X30, [SP, #224] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STP X28, X27, [SP, #240] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STP X26, X25, [SP, #256] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STP X24, X23, [SP, #272] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STP X22, X21, [SP, #288] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STP X20, X19, [SP, #304] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
LDP X8, X9, [X2] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDR W20, [X0] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
ORR X0, XZR, XZR | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STR X2, [SP, #152] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
ADD X3, SP, #204 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X4, SP, #200 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X5, SP, #188 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X6, SP, #184 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOVZ W2, #34 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOVZ W7, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STR WZR, [SP, #204] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
LDR W8, [X8] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR W19, [X9] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
ORR W1, WZR, W20 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STR W8, [SP, #200] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
MOVZ W8, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STP W8, W19, [SP, #184] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STR W8, [SP] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
BL 404ae0 <@plt_start@+0x320> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
LDRSW X21, [SP, #200] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
CMP W21, W19 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
B.GT 44d1e8 <__nv_viscosity_kernel_module_viscosity_kernel__F1L50_1_+0x658> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
LDR W9, [SP, #188] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
SUBS W9, W9, W21 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
B.MI 44d1e8 <__nv_viscosity_kernel_module_viscosity_kernel__F1L50_1_+0x658> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
LDR X8, [SP, #152] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDP X11, X10, [X8, #16] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDR W13, [X10] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDRSW X7, [X11] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
SUBS W10, W13, W7 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
B.MI 44d1e8 <__nv_viscosity_kernel_module_viscosity_kernel__F1L50_1_+0x658> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
LDR X8, [SP, #152] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
ADD W18, W10, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STR W20, [SP, #28] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
ADD W20, W9, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB W16, W13, W7 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
UBFM X14, X7, #61, #60 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STR X7, [SP, #72] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
FMOV D3, #1.0000000 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 2 | 0.25 |
CMP W18, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
STR W18, [SP, #148] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
INDEX Z0.D, X7, #1 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5 | 2 |
ADRP X1, <460c5c> | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X15, X21, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LDR D1, [X1, #1584] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
CSINC W18, W18, WZR, #11 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB X0, X21, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
PTRUE P0.D, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
FMOV D4, #0.5000000 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 2 | 0.25 |
DUP Z5.D, #0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 0.50 |
LDP X11, X10, [X8, #128] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDR X9, [X8, #56] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR X17, [X8, #192] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
ADD X12, X8, #208 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LDR X2, [X8, #144] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR X4, [X8, #32] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
SUB W16, W16, W18 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
CNTD X13, ALL | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
DUP Z6.D, X13 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD W16, W16, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X16, X16, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LDR X10, [X10] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR X5, [X9] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR X19, [X11] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDP X9, X11, [X8, #96] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDR X23, [X17] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDP X17, X6, [X8, #168] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDR X8, [X8, #112] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
ADD X1, X4, #8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STR X2, [SP, #112] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
ADD X2, X2, #8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STR X1, [SP, #48] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STR X2, [SP, #104] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
UBFM X10, X10, #61, #60 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X22, X11, #8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LDR X9, [X9] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
LDR X17, [X17] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
STP X5, X16, [SP, #120] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
MADD X16, X5, X15, XZR | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
MADD X1, X5, X21, XZR | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
MADD X15, X19, X15, XZR | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
UBFM X3, X5, #61, #60 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
UBFM X5, X19, #61, #60 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MADD X0, X19, X0, XZR | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
STR X19, [SP, #136] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
STR X23, [SP, #32] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
ADD X18, X6, #8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB X2, X6, #8 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STP X22, X6, [SP, #56] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
SUB X7, X14, X10 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STP X5, X3, [SP, #80] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
MADD X5, X19, X21, XZR | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2 | 1 |
ADD X19, X14, X16,LSL #3 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X14, X14, X1,LSL #3 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB X29, X0, X23 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB X30, X15, X23 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X22, X8, X7 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LDR X7, [SP, #72] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
SUB X8, X8, X10 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STR X17, [SP, #96] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
UBFM X17, X9, #61, #60 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB X3, X16, X9 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB X24, X1, X9 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB X16, X19, X17 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB X14, X14, X17 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
STR X8, [SP, #40] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0.50 | 0.50 | 1 | 0.50 |
ADD X9, X15, X7 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X25, X11, X16 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X27, X11, X14 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X11, X0, X7 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X26, X4, X16 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X28, X4, X14 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
MOVZ X0, #1 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB X9, X9, X23 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB X11, X11, X23 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X19, X6, X9,LSL #3 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADRP X9, <460d84> | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X9, X9, #1584 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ADD X16, X6, X11,LSL #3 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
LD1RD {Z2.D}, P0/Z, [X9] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0.50 | 0 | 0 | 0 | 6 | 0.50 |
UBFM X9, X5, #61, #60 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB X5, X5, X23 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
SUB X1, X9, X23,LSL #3 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ORR X23, XZR, X3 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
B 44ce00 <__nv_viscosity_kernel_module_viscosity_kernel__F1L50_1_+0x270> | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
LDR W20, [SP, #28] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 0.33 |
ORR X0, XZR, XZR | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ORR W1, WZR, W20 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
BL 404bf0 <@plt_start@+0x430> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
ORR X0, XZR, XZR | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
ORR W1, WZR, W20 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
BL 4047f0 <@plt_start@+0x30> | 1 | 0.50 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
LDP D9, D8, [SP, #208] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
LDR D10, [SP, #192] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 6 | 0.33 |
LDP X20, X19, [SP, #304] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDP X22, X21, [SP, #288] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDP X24, X23, [SP, #272] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDP X26, X25, [SP, #256] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDP X28, X27, [SP, #240] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
LDP X29, X30, [SP, #224] | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 0.33 | 0.33 | 0 | 0 | 4 | 1 |
ADD SP, SP, #320 | 1 | 0 | 0 | 0.25 | 0.25 | 0.25 | 0.25 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.25 |
RET | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
HINT #0 | ||||||||||||||||||
HINT #0 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼__nv_viscosity_kernel_module_viscosity_kernel__F1L50_1_– | 11.51 | 2.32 |
▼Loop 1095 - viscosity_kernel.f90-pp.f90:53-93 - exec– | 0 | 0 |
○Loop 1097 - viscosity_kernel.f90-pp.f90:56-89 - exec | 11.51 | 2.32 |
○Loop 1096 - viscosity_kernel.f90-pp.f90:56-92 - exec | 0 | 0 |