Function: viscosity_kernel_.DIR.OMP.PARALLEL.2 | Module: exec | Source: viscosity_kernel.f90:50-94 | Coverage: 4.23% |
---|
Function: viscosity_kernel_.DIR.OMP.PARALLEL.2 | Module: exec | Source: viscosity_kernel.f90:50-94 | Coverage: 4.23% |
---|
/scratch_na/users/xoserete/qaas_runs/171-419-3245/intel/CloverLeafFC/build/CloverLeafFC/CloverLeaf_ref/kernels/viscosity_kernel.f90: 50 - 94 |
-------------------------------------------------------------------------------- |
50: !$OMP PARALLEL |
51: |
52: !$OMP DO PRIVATE(ugrad,vgrad,div,strain2,pgradx,pgrady,pgradx2,pgrady2,limiter,pgrad,xgrad,ygrad,grad,grad2,dirx,diry) |
53: DO k=y_min,y_max |
54: !$OMP SIMD |
55: DO j=x_min,x_max |
56: ugrad=(xvel0(j+1,k )+xvel0(j+1,k+1))-(xvel0(j ,k )+xvel0(j ,k+1)) |
57: |
58: vgrad=(yvel0(j ,k+1)+yvel0(j+1,k+1))-(yvel0(j ,k )+yvel0(j+1,k )) |
59: |
60: div = (celldx(j)*(ugrad)+ celldy(k)*(vgrad)) |
61: |
62: strain2 = 0.5_8*(xvel0(j, k+1) + xvel0(j+1,k+1)-xvel0(j ,k )-xvel0(j+1,k ))/celldy(k) & |
63: + 0.5_8*(yvel0(j+1,k ) + yvel0(j+1,k+1)-yvel0(j ,k )-yvel0(j ,k+1))/celldx(j) |
64: |
65: pgradx=(pressure(j+1,k)-pressure(j-1,k))/(celldx(j)+celldx(j+1)) |
66: pgrady=(pressure(j,k+1)-pressure(j,k-1))/(celldy(k)+celldy(k+1)) |
67: |
68: pgradx2 = pgradx*pgradx |
69: pgrady2 = pgrady*pgrady |
70: |
71: limiter = ((0.5_8*(ugrad)/celldx(j))*pgradx2+(0.5_8*(vgrad)/celldy(k))*pgrady2+strain2*pgradx*pgrady) & |
72: /MAX(pgradx2+pgrady2,1.0e-16_8) |
73: |
74: IF ((limiter.GT.0.0).OR.(div.GE.0.0))THEN |
75: viscosity(j,k) = 0.0 |
76: ELSE |
77: dirx=1.0_8 |
78: IF(pgradx.LT.0.0) dirx=-1.0_8 |
79: pgradx = dirx*MAX(1.0e-16_8,ABS(pgradx)) |
80: diry=1.0_8 |
81: IF(pgradx.LT.0.0) diry=-1.0_8 |
82: pgrady = diry*MAX(1.0e-16_8,ABS(pgrady)) |
83: pgrad = SQRT(pgradx**2+pgrady**2) |
84: xgrad = ABS(celldx(j)*pgrad/pgradx) |
85: ygrad = ABS(celldy(k)*pgrad/pgrady) |
86: grad = MIN(xgrad,ygrad) |
87: grad2 = grad*grad |
88: |
89: viscosity(j,k)=2.0_8*density0(j,k)*grad2*limiter*limiter |
90: ENDIF |
91: |
92: ENDDO |
93: ENDDO |
94: !$OMP END DO |
0x468800 PUSH %RBP |
0x468801 MOV %RSP,%RBP |
0x468804 PUSH %R15 |
0x468806 PUSH %R14 |
0x468808 PUSH %R13 |
0x46880a PUSH %R12 |
0x46880c PUSH %RBX |
0x46880d AND $-0x20,%RSP |
0x468811 SUB $0x2c0,%RSP |
0x468818 MOV 0x50(%RBP),%EBX |
0x46881b MOV 0x48(%RBP),%EAX |
0x46881e SUB %EBX,%EAX |
0x468820 MOVL $0,0x3c(%RSP) |
0x468828 JS 4688a5 |
0x46882a MOV %R9,%R15 |
0x46882d MOV %RCX,%R12 |
0x468830 MOV %RDI,0x70(%RSP) |
0x468835 MOV (%RDI),%ESI |
0x468837 MOVL $0,0x14(%RSP) |
0x46883f MOV %EAX,0x10(%RSP) |
0x468843 MOVL $0x1,0x38(%RSP) |
0x46884b SUB $0x8,%RSP |
0x46884f LEA 0x40(%RSP),%RAX |
0x468854 LEA 0x44(%RSP),%RCX |
0x468859 LEA 0x1c(%RSP),%R8 |
0x46885e LEA 0x18(%RSP),%R9 |
0x468863 MOV $0x73a630,%EDI |
0x468868 MOV %ESI,0x34(%RSP) |
0x46886c MOV $0x22,%EDX |
0x468871 PUSH $0x1 |
0x468873 PUSH $0x1 |
0x468875 PUSH %RAX |
0x468876 CALL 404520 <__kmpc_for_static_init_4@plt> |
0x46887b ADD $0x20,%RSP |
0x46887f MOV 0x14(%RSP),%EAX |
0x468883 MOV 0x10(%RSP),%ECX |
0x468887 SUB %EAX,%ECX |
0x468889 MOV %ECX,0x30(%RSP) |
0x46888d JAE 4688c0 |
0x46888f MOV $0x73a650,%EDI |
0x468894 MOV 0x2c(%RSP),%ESI |
0x468898 VZEROUPPER |
0x46889b CALL 404110 <__kmpc_for_static_fini@plt> |
0x4688a0 MOV 0x70(%RSP),%RDI |
0x4688a5 MOV (%RDI),%ESI |
0x4688a7 MOV $0x73a670,%EDI |
0x4688ac CALL 4045e0 <__kmpc_barrier@plt> |
0x4688b1 LEA -0x28(%RBP),%RSP |
0x4688b5 POP %RBX |
0x4688b6 POP %R12 |
0x4688b8 POP %R13 |
0x4688ba POP %R14 |
0x4688bc POP %R15 |
0x4688be POP %RBP |
0x4688bf RET |
0x4688c0 MOV %RAX,%RSI |
0x4688c3 MOV 0x60(%RBP),%RAX |
0x4688c7 MOV 0x58(%RBP),%RCX |
0x4688cb MOVSXD (%RAX),%RDI |
0x4688ce MOV (%RCX),%ECX |
0x4688d0 SUB %EDI,%ECX |
0x4688d2 ADD %EBX,%ESI |
0x4688d4 LEA -0x2(%R12),%EAX |
0x4688d9 CLTQ |
0x4688db MOV %RAX,0x100(%RSP) |
0x4688e3 MOV %RCX,0x138(%RSP) |
0x4688eb LEA 0x1(%RCX),%EAX |
0x4688ee CMP $0x2,%EAX |
0x4688f1 MOV $0x1,%ECX |
0x4688f6 CMOVGE %EAX,%ECX |
0x4688f9 MOV %RCX,0x48(%RSP) |
0x4688fe AND $0x7ffffffc,%ECX |
0x468904 MOV %RCX,0x20(%RSP) |
0x468909 MOVSXD %R12D,%RCX |
0x46890c MOVSXD %R15D,%RDX |
0x46890f LEA -0x2(%RDX),%RAX |
0x468913 MOV %RAX,0xd8(%RSP) |
0x46891b MOV %RDI,0xe0(%RSP) |
0x468923 LEA (,%RDI,8),%RAX |
0x46892b SAL $0x3,%RDX |
0x46892f SUB %RDX,%RAX |
0x468932 MOV $0x2,%EDI |
0x468937 SUB %RCX,%RDI |
0x46893a MOV %RDI,0xf8(%RSP) |
0x468942 MOV $0x1,%EDI |
0x468947 SUB %RCX,%RDI |
0x46894a MOV %RDI,0xf0(%RSP) |
0x468952 MOV $0x10,%EDI |
0x468957 SUB %RDX,%RDI |
0x46895a MOV $0x18,%R8D |
0x468960 SUB %RDX,%R8 |
0x468963 MOV $0x3,%EDX |
0x468968 SUB %RCX,%RDX |
0x46896b MOV %RDX,0xe8(%RSP) |
0x468973 ADD $-0x2,%RCX |
0x468977 MOV %RCX,0x40(%RSP) |
0x46897c MOV 0x40(%RBP),%RCX |
0x468980 MOV 0x30(%RBP),%RDX |
0x468984 MOV 0x28(%RBP),%R9 |
0x468988 MOV 0x20(%RBP),%R10 |
0x46898c MOV 0x18(%RBP),%RBX |
0x468990 MOV 0x10(%RBP),%R14 |
0x468994 LEA 0x18(%R9,%RAX,1),%R11 |
0x468999 MOV %R11,0x98(%RSP) |
0x4689a1 LEA 0x10(%R10,%RAX,1),%R11 |
0x4689a6 MOV %R11,0x90(%RSP) |
0x4689ae LEA 0x10(%RDX,%RAX,1),%R11 |
0x4689b3 MOV %R11,0x158(%RSP) |
0x4689bb LEA 0x10(%R9,%RAX,1),%R11 |
0x4689c0 MOV %R11,0x88(%RSP) |
0x4689c8 LEA 0x18(%RCX,%RAX,1),%R11 |
0x4689cd LEA 0x18(%R14,%RAX,1),%R15 |
0x4689d2 MOV %R15,0x80(%RSP) |
0x4689da ADD %RBX,%RAX |
0x4689dd ADD $0x18,%RAX |
0x4689e1 MOV %RAX,0x78(%RSP) |
0x4689e6 ADD %RDI,%R10 |
0x4689e9 MOV %R10,0xb8(%RSP) |
0x4689f1 ADD %RDI,%RDX |
0x4689f4 MOV %RDX,0xc0(%RSP) |
0x4689fc ADD %R9,%RDI |
0x4689ff MOV %RDI,0xd0(%RSP) |
0x468a07 LEA (%RCX,%R8,1),%RAX |
0x468a0b MOV %RAX,0xb0(%RSP) |
0x468a13 LEA (%R9,%R8,1),%RAX |
0x468a17 MOV %RAX,0xa8(%RSP) |
0x468a1f LEA (%R14,%R8,1),%RAX |
0x468a23 MOV %RAX,0xa0(%RSP) |
0x468a2b ADD %RBX,%R8 |
0x468a2e MOV %R8,0xc8(%RSP) |
0x468a36 VMOVSD 0x89ae2(%RIP),%XMM15 |
0x468a3e VMOVSD 0x8a7ba(%RIP),%XMM1 |
0x468a46 VMOVSD 0xa7448(%RIP),%XMM16 |
0x468a50 VMOVSD 0xa7446(%RIP),%XMM17 |
0x468a5a VBROADCASTSD 0x89abc(%RIP),%YMM20 |
0x468a64 VXORPD %XMM18,%XMM18,%XMM18 |
0x468a6a XOR %EDI,%EDI |
0x468a6c MOV %RSI,0x108(%RSP) |
0x468a74 MOV %ESI,%ECX |
0x468a76 JMP 468a9d |
0x468a78 NOPL (%RAX,%RAX,1) |
(1026) 0x468a80 MOV 0x150(%RSP),%RDX |
(1026) 0x468a88 LEA 0x1(%RDX),%EAX |
(1026) 0x468a8b MOV 0x34(%RSP),%ECX |
(1026) 0x468a8f INC %ECX |
(1026) 0x468a91 CMP 0x30(%RSP),%EDX |
(1026) 0x468a95 MOV %EAX,%EDI |
(1026) 0x468a97 JE 46888f |
(1026) 0x468a9d CMPL $0,0x138(%RSP) |
(1026) 0x468aa5 MOV %ECX,0x34(%RSP) |
(1026) 0x468aa9 MOV %RDI,0x150(%RSP) |
(1026) 0x468ab1 JS 468a80 |
(1026) 0x468ab3 MOVSXD %ECX,%RBX |
(1026) 0x468ab6 MOV 0xf8(%RSP),%RAX |
(1026) 0x468abe LEA (%RAX,%RBX,1),%R8 |
(1026) 0x468ac2 MOV 0xf0(%RSP),%RAX |
(1026) 0x468aca LEA (%RAX,%RBX,1),%R14 |
(1026) 0x468ace ADD 0xe8(%RSP),%RBX |
(1026) 0x468ad6 MOV 0x108(%RSP),%RCX |
(1026) 0x468ade LEA (%RCX,%RDI,1),%EAX |
(1026) 0x468ae1 MOVSXD %EAX,%R13 |
(1026) 0x468ae4 MOV %R13,%RAX |
(1026) 0x468ae7 MOV 0x100(%RSP),%RDX |
(1026) 0x468aef SUB %RDX,%RAX |
(1026) 0x468af2 ADD %EDI,%ECX |
(1026) 0x468af4 INC %ECX |
(1026) 0x468af6 MOVSXD %ECX,%RCX |
(1026) 0x468af9 SUB %RDX,%RCX |
(1026) 0x468afc MOV 0x68(%RBP),%RDX |
(1026) 0x468b00 MOV (%RDX),%R12 |
(1026) 0x468b03 MOV 0x38(%RBP),%RDX |
(1026) 0x468b07 VMOVSD (%RDX,%RAX,8),%XMM4 |
(1026) 0x468b0c MOV 0x70(%RBP),%RAX |
(1026) 0x468b10 MOV (%RAX),%R9 |
(1026) 0x468b13 MOV 0x78(%RBP),%RAX |
(1026) 0x468b17 MOV (%RAX),%RDI |
(1026) 0x468b1a VADDSD (%RDX,%RCX,8),%XMM4,%XMM2 |
(1026) 0x468b1f MOV 0x80(%RBP),%RAX |
(1026) 0x468b26 MOV (%RAX),%R10 |
(1026) 0x468b29 CMPQ $0,0x20(%RSP) |
(1026) 0x468b2f VMOVAPD %XMM4,0x180(%RSP) |
(1026) 0x468b38 MOV %R12,0x148(%RSP) |
(1026) 0x468b40 MOV %R9,0x140(%RSP) |
(1026) 0x468b48 JE 4691f0 |
(1026) 0x468b4e VMOVAPD %XMM13,0x60(%RSP) |
(1026) 0x468b54 VMOVAPD %XMM31,%XMM0 |
(1026) 0x468b5a VBROADCASTSD %XMM13,%YMM31 |
(1026) 0x468b60 VBROADCASTSD %XMM14,%YMM29 |
(1026) 0x468b66 VMOVAPD %XMM19,0x1b0(%RSP) |
(1026) 0x468b6e VBROADCASTSD %XMM19,%YMM27 |
(1026) 0x468b74 VMOVAPD %XMM30,0x1a0(%RSP) |
(1026) 0x468b7c VBROADCASTSD %XMM30,%YMM25 |
(1026) 0x468b82 VBROADCASTSD 0x170(%RSP),%YMM24 |
(1026) 0x468b8a VMOVAPD %XMM0,0x190(%RSP) |
(1026) 0x468b93 VBROADCASTSD %XMM0,%YMM23 |
(1026) 0x468b99 VBROADCASTSD 0x160(%RSP),%YMM22 |
(1026) 0x468ba1 SUB 0x40(%RSP),%R13 |
(1026) 0x468ba6 MOV %R12,%RAX |
(1026) 0x468ba9 IMUL %R13,%RAX |
(1026) 0x468bad MOV %RAX,0x18(%RSP) |
(1026) 0x468bb2 LEA 0x1(%R13),%RCX |
(1026) 0x468bb6 MOV %R12,%RAX |
(1026) 0x468bb9 IMUL %RCX,%RAX |
(1026) 0x468bbd MOV %RAX,0x110(%RSP) |
(1026) 0x468bc5 IMUL %R9,%RCX |
(1026) 0x468bc9 MOV %RCX,0x58(%RSP) |
(1026) 0x468bce MOV %R9,%RAX |
(1026) 0x468bd1 IMUL %R13,%RAX |
(1026) 0x468bd5 MOV %RAX,0x50(%RSP) |
(1026) 0x468bda VBROADCASTSD %XMM4,%YMM26 |
(1026) 0x468be0 IMUL %RDI,%R13 |
(1026) 0x468be4 VDIVSD %XMM4,%XMM15,%XMM0 |
(1026) 0x468be8 VBROADCASTSD %XMM0,%YMM28 |
(1026) 0x468bee VMOVSD %XMM2,0x130(%RSP) |
(1026) 0x468bf7 VDIVSD %XMM2,%XMM15,%XMM0 |
(1026) 0x468bfb VBROADCASTSD %XMM0,%YMM30 |
(1026) 0x468c01 MOV %RDI,%RSI |
(1026) 0x468c04 IMUL %R8,%RSI |
(1026) 0x468c08 ADD 0x98(%RSP),%RSI |
(1026) 0x468c10 MOV %R10,0x118(%RSP) |
(1026) 0x468c18 IMUL %R8,%R10 |
(1026) 0x468c1c ADD 0x90(%RSP),%R10 |
(1026) 0x468c24 MOV %RDI,%RDX |
(1026) 0x468c27 MOV %R14,0x128(%RSP) |
(1026) 0x468c2f IMUL %R14,%RDX |
(1026) 0x468c33 MOV 0x88(%RSP),%RAX |
(1026) 0x468c3b ADD %RAX,%RDX |
(1026) 0x468c3e MOV %RDI,0x120(%RSP) |
(1026) 0x468c46 MOV %RDI,%R14 |
(1026) 0x468c49 IMUL %RBX,%R14 |
(1026) 0x468c4d ADD %RAX,%R14 |
(1026) 0x468c50 MOV %R9,%R15 |
(1026) 0x468c53 IMUL %R8,%R15 |
(1026) 0x468c57 MOV 0x80(%RSP),%RAX |
(1026) 0x468c5f ADD %RAX,%R15 |
(1026) 0x468c62 IMUL %RBX,%R9 |
(1026) 0x468c66 ADD %RAX,%R9 |
(1026) 0x468c69 MOV %R12,%RCX |
(1026) 0x468c6c IMUL %RBX,%RCX |
(1026) 0x468c70 MOV 0x78(%RSP),%RDI |
(1026) 0x468c75 ADD %RDI,%RCX |
(1026) 0x468c78 MOV %R12,%RAX |
(1026) 0x468c7b IMUL %R8,%RAX |
(1026) 0x468c7f ADD %RDI,%RAX |
(1026) 0x468c82 VPCMPEQD %YMM12,%YMM12,%YMM12 |
(1026) 0x468c87 XOR %R12D,%R12D |
(1026) 0x468c8a VPCMPEQD %YMM11,%YMM11,%YMM11 |
(1026) 0x468c8f VPCMPEQD %YMM3,%YMM3,%YMM3 |
(1026) 0x468c93 VPCMPEQD %YMM6,%YMM6,%YMM6 |
(1026) 0x468c97 VPCMPEQD %YMM9,%YMM9,%YMM9 |
(1026) 0x468c9c VPCMPEQD %YMM2,%YMM2,%YMM2 |
(1026) 0x468ca0 VPCMPEQD %YMM0,%YMM0,%YMM0 |
(1026) 0x468ca4 VBROADCASTSD 0xa71eb(%RIP),%YMM1 |
(1026) 0x468cad JMP 468de7 |
0x468cb2 NOPW %CS:(%RAX,%RAX,1) |
(1028) 0x468cc0 VCMPPD $0x1,%YMM13,%YMM18,%K2 |
(1028) 0x468cc7 VBROADCASTSD 0xa71d0(%RIP),%YMM7 |
(1028) 0x468cd0 VBLENDMPD %YMM7,%YMM20,%YMM4{%K2} |
(1028) 0x468cd6 VBROADCASTSD 0x896c8(%RIP),%YMM19 |
(1028) 0x468ce0 VANDPD %YMM19,%YMM18,%YMM5 |
(1028) 0x468ce6 VMAXPD %YMM1,%YMM5,%YMM5 |
(1028) 0x468cea VMULPD %YMM5,%YMM4,%YMM5 |
(1028) 0x468cee VCMPPD $0x1,%YMM13,%YMM5,%K2 |
(1028) 0x468cf5 VBLENDMPD %YMM7,%YMM20,%YMM7{%K2} |
(1028) 0x468cfb VANDPD %YMM19,%YMM17,%YMM8 |
(1028) 0x468d01 VMAXPD %YMM1,%YMM8,%YMM8 |
(1028) 0x468d05 VMULPD %YMM7,%YMM8,%YMM8 |
(1028) 0x468d09 VMULPD %YMM5,%YMM5,%YMM10 |
(1028) 0x468d0d VFMADD231PD %YMM8,%YMM8,%YMM10 |
(1028) 0x468d12 VSQRTPD %YMM10,%YMM10 |
(1028) 0x468d17 VMULPD %YMM21,%YMM10,%YMM15 |
(1028) 0x468d1d VDIVPD %YMM5,%YMM15,%YMM5 |
(1028) 0x468d21 VANDPD %YMM19,%YMM5,%YMM5 |
(1028) 0x468d27 VMULPD %YMM26,%YMM10,%YMM15 |
(1028) 0x468d2d VDIVPD %YMM8,%YMM15,%YMM8 |
(1028) 0x468d32 VANDPD %YMM19,%YMM8,%YMM8 |
(1028) 0x468d38 VMINPD %YMM8,%YMM5,%YMM15 |
(1028) 0x468d3d VMULPD %YMM15,%YMM15,%YMM17 |
(1028) 0x468d43 VMULPD %YMM16,%YMM16,%YMM16 |
(1028) 0x468d49 VADDPD %YMM17,%YMM17,%YMM18 |
(1028) 0x468d4f VMULPD %YMM18,%YMM16,%YMM16 |
(1028) 0x468d55 IMUL %R8,%RDI |
(1028) 0x468d59 ADD 0x158(%RSP),%RDI |
(1028) 0x468d61 VMOVUPD (%RDI,%R12,8),%YMM18{%K1}{z} |
(1028) 0x468d68 VPBROADCASTQ %R12,%YMM19 |
(1028) 0x468d6e VPADDQ 0x89448(%RIP),%YMM19,%YMM19 |
(1028) 0x468d78 VMOVDQA64 %YMM19,%YMM0{%K1} |
(1028) 0x468d7e VMOVAPD %YMM4,%YMM31{%K1} |
(1028) 0x468d84 VMOVDQA64 %YMM19,%YMM2{%K1} |
(1028) 0x468d8a VMOVAPD %YMM7,%YMM29{%K1} |
(1028) 0x468d90 VMOVDQA64 %YMM19,%YMM9{%K1} |
(1028) 0x468d96 VMOVAPD %YMM10,%YMM27{%K1} |
(1028) 0x468d9c VMOVDQA64 %YMM19,%YMM6{%K1} |
(1028) 0x468da2 VMOVAPD %YMM5,%YMM25{%K1} |
(1028) 0x468da8 VMOVDQA64 %YMM19,%YMM3{%K1} |
(1028) 0x468dae VMOVAPD %YMM8,%YMM24{%K1} |
(1028) 0x468db4 VMOVDQA64 %YMM19,%YMM11{%K1} |
(1028) 0x468dba VMOVAPD %YMM15,%YMM23{%K1} |
(1028) 0x468dc0 VMOVDQA64 %YMM19,%YMM12{%K1} |
(1028) 0x468dc6 VMOVAPD %YMM17,%YMM22{%K1} |
(1028) 0x468dcc VMULPD %YMM18,%YMM16,%YMM4{%K1}{z} |
(1028) 0x468dd2 VMOVUPD %YMM4,(%R10,%R12,8) |
(1028) 0x468dd8 ADD $0x4,%R12 |
(1028) 0x468ddc CMP 0x20(%RSP),%R12 |
(1028) 0x468de1 JAE 468f60 |
(1028) 0x468de7 VMOVUPD -0x8(%RAX,%R12,8),%YMM16 |
(1028) 0x468df2 VMOVUPD (%RAX,%R12,8),%YMM17 |
(1028) 0x468df9 VMOVUPD -0x8(%RCX,%R12,8),%YMM18 |
(1028) 0x468e04 VMOVUPD (%RCX,%R12,8),%YMM19 |
(1028) 0x468e0b VADDPD %YMM17,%YMM19,%YMM21 |
(1028) 0x468e11 VADDPD %YMM18,%YMM16,%YMM5 |
(1028) 0x468e17 VSUBPD %YMM5,%YMM21,%YMM5 |
(1028) 0x468e1d VMOVUPD -0x8(%R9,%R12,8),%YMM7 |
(1028) 0x468e24 VMOVAPD %YMM20,%YMM13 |
(1028) 0x468e2a VMOVUPD (%R9,%R12,8),%YMM20 |
(1028) 0x468e31 VMOVUPD -0x8(%R15,%R12,8),%YMM15 |
(1028) 0x468e38 VMOVUPD (%R15,%R12,8),%YMM4 |
(1028) 0x468e3e VADDPD %YMM7,%YMM20,%YMM8 |
(1028) 0x468e44 VADDPD %YMM4,%YMM15,%YMM10 |
(1028) 0x468e48 VMOVUPD -0x8(%R11,%R12,8),%YMM21 |
(1028) 0x468e53 VSUBPD %YMM10,%YMM8,%YMM8 |
(1028) 0x468e58 VMULPD %YMM5,%YMM21,%YMM10 |
(1028) 0x468e5e VFMADD231PD %YMM8,%YMM26,%YMM10 |
(1028) 0x468e64 VADDPD %YMM16,%YMM17,%YMM16 |
(1028) 0x468e6a VSUBPD %YMM16,%YMM19,%YMM16 |
(1028) 0x468e70 VADDPD %YMM18,%YMM16,%YMM16 |
(1028) 0x468e76 VBROADCASTSD 0x8a380(%RIP),%YMM19 |
(1028) 0x468e80 VMULPD %YMM19,%YMM16,%YMM16 |
(1028) 0x468e86 VADDPD %YMM7,%YMM15,%YMM7 |
(1028) 0x468e8a VSUBPD %YMM7,%YMM20,%YMM7 |
(1028) 0x468e90 VMOVAPD %YMM13,%YMM20 |
(1028) 0x468e96 VXORPD %XMM13,%XMM13,%XMM13 |
(1028) 0x468e9b VADDPD %YMM4,%YMM7,%YMM4 |
(1028) 0x468e9f VMULPD %YMM19,%YMM4,%YMM4 |
(1028) 0x468ea5 VDIVPD %YMM21,%YMM20,%YMM7 |
(1028) 0x468eab VMULPD %YMM7,%YMM4,%YMM4 |
(1028) 0x468eaf VFMADD231PD %YMM16,%YMM28,%YMM4 |
(1028) 0x468eb5 VMOVUPD (%RSI,%R12,8),%YMM15 |
(1028) 0x468ebb VSUBPD -0x10(%RSI,%R12,8),%YMM15,%YMM15 |
(1028) 0x468ec2 VADDPD (%R11,%R12,8),%YMM21,%YMM16 |
(1028) 0x468ec9 VMOVUPD (%R14,%R12,8),%YMM17 |
(1028) 0x468ed0 VSUBPD (%RDX,%R12,8),%YMM17,%YMM17 |
(1028) 0x468ed7 VDIVPD %YMM16,%YMM15,%YMM18 |
(1028) 0x468edd VMULPD %YMM30,%YMM17,%YMM17 |
(1028) 0x468ee3 VMULPD %YMM18,%YMM18,%YMM15 |
(1028) 0x468ee9 VMULPD %YMM17,%YMM17,%YMM16 |
(1028) 0x468eef VMULPD %YMM19,%YMM5,%YMM5 |
(1028) 0x468ef5 VMULPD %YMM7,%YMM5,%YMM5 |
(1028) 0x468ef9 VMULPD %YMM5,%YMM15,%YMM5 |
(1028) 0x468efd VMULPD %YMM19,%YMM8,%YMM7 |
(1028) 0x468f03 VMULPD %YMM16,%YMM7,%YMM7 |
(1028) 0x468f09 VMULPD %YMM4,%YMM18,%YMM4 |
(1028) 0x468f0f VFMADD213PD %YMM5,%YMM17,%YMM4 |
(1028) 0x468f15 VFMADD231PD %YMM7,%YMM28,%YMM4 |
(1028) 0x468f1b VADDPD %YMM15,%YMM16,%YMM5 |
(1028) 0x468f21 VMAXPD %YMM1,%YMM5,%YMM5 |
(1028) 0x468f25 VDIVPD %YMM5,%YMM4,%YMM16 |
(1028) 0x468f2b VCMPPD $0x6,%YMM10,%YMM13,%K1 |
(1028) 0x468f32 VCMPPD $0x5,%YMM16,%YMM13,%K1{%K1} |
(1028) 0x468f39 KORTESTB %K1,%K1 |
(1028) 0x468f3d JE 468cc0 |
(1028) 0x468f43 MOV 0x88(%RBP),%RDI |
(1028) 0x468f4a MOV (%RDI),%RDI |
(1028) 0x468f4d JMP 468cc0 |
0x468f52 NOPW %CS:(%RAX,%RAX,1) |
(1026) 0x468f60 VPCMPEQD %YMM7,%YMM7,%YMM7 |
(1026) 0x468f64 VPTEST %YMM7,%YMM0 |
(1026) 0x468f69 VMOVAPD 0x60(%RSP),%XMM13 |
(1026) 0x468f6f JB 468faf |
(1026) 0x468f71 VEXTRACTI128 $0x1,%YMM0,%XMM4 |
(1026) 0x468f77 VPMAXSQ %XMM4,%XMM0,%XMM4 |
(1026) 0x468f7d VPSHUFD $-0x12,%XMM4,%XMM5 |
(1026) 0x468f82 VPMAXSQ %XMM5,%XMM4,%XMM4 |
(1026) 0x468f88 VPBROADCASTQ %XMM4,%YMM4 |
(1026) 0x468f8d VPCMPEQQ %YMM4,%YMM0,%K0 |
(1026) 0x468f93 KMOVD %K0,%EAX |
(1026) 0x468f97 TZCNT %EAX,%EAX |
(1026) 0x468f9b VMOVAPD %YMM31,0x280(%RSP) |
(1026) 0x468fa3 AND $0x3,%EAX |
(1026) 0x468fa6 VMOVSD 0x280(%RSP,%RAX,8),%XMM13 |
(1026) 0x468faf VPTEST %YMM7,%YMM2 |
(1026) 0x468fb4 VMOVAPD 0x1a0(%RSP),%XMM30 |
(1026) 0x468fbc MOV 0x128(%RSP),%R14 |
(1026) 0x468fc4 MOV 0x120(%RSP),%RDI |
(1026) 0x468fcc MOV 0x118(%RSP),%R10 |
(1026) 0x468fd4 MOV 0x110(%RSP),%R15 |
(1026) 0x468fdc JB 46901c |
(1026) 0x468fde VEXTRACTI128 $0x1,%YMM2,%XMM0 |
(1026) 0x468fe4 VPMAXSQ %XMM0,%XMM2,%XMM0 |
(1026) 0x468fea VPSHUFD $-0x12,%XMM0,%XMM4 |
(1026) 0x468fef VPMAXSQ %XMM4,%XMM0,%XMM0 |
(1026) 0x468ff5 VPBROADCASTQ %XMM0,%YMM0 |
(1026) 0x468ffa VPCMPEQQ %YMM0,%YMM2,%K0 |
(1026) 0x469000 KMOVD %K0,%EAX |
(1026) 0x469004 TZCNT %EAX,%EAX |
(1026) 0x469008 VMOVAPD %YMM29,0x260(%RSP) |
(1026) 0x469010 AND $0x3,%EAX |
(1026) 0x469013 VMOVSD 0x260(%RSP,%RAX,8),%XMM14 |
(1026) 0x46901c VPTEST %YMM7,%YMM9 |
(1026) 0x469021 VMOVAPD 0x1b0(%RSP),%XMM19 |
(1026) 0x469029 VMOVAPD 0x190(%RSP),%XMM31 |
(1026) 0x469031 JB 469070 |
(1026) 0x469033 VEXTRACTI128 $0x1,%YMM9,%XMM0 |
(1026) 0x469039 VPMAXSQ %XMM0,%XMM9,%XMM0 |
(1026) 0x46903f VPSHUFD $-0x12,%XMM0,%XMM2 |
(1026) 0x469044 VPMAXSQ %XMM2,%XMM0,%XMM0 |
(1026) 0x46904a VPBROADCASTQ %XMM0,%YMM0 |
(1026) 0x46904f VPCMPEQQ %YMM0,%YMM9,%K0 |
(1026) 0x469055 KMOVD %K0,%EAX |
(1026) 0x469059 TZCNT %EAX,%EAX |
(1026) 0x46905d VMOVAPD %YMM27,0x240(%RSP) |
(1026) 0x469065 AND $0x3,%EAX |
(1026) 0x469068 VMOVSD 0x240(%RSP,%RAX,8),%XMM19 |
(1026) 0x469070 VPTEST %YMM7,%YMM6 |
(1026) 0x469075 VMOVSD 0x894a3(%RIP),%XMM15 |
(1026) 0x46907d VMOVSD 0xa6e11(%RIP),%XMM16 |
(1026) 0x469087 VMOVSD 0xa6e0f(%RIP),%XMM17 |
(1026) 0x469091 VMOVSD 0x8a167(%RIP),%XMM1 |
(1026) 0x469099 VXORPD %XMM18,%XMM18,%XMM18 |
(1026) 0x46909f VMOVAPD 0x180(%RSP),%XMM4 |
(1026) 0x4690a8 JB 4690e7 |
(1026) 0x4690aa VEXTRACTI128 $0x1,%YMM6,%XMM0 |
(1026) 0x4690b0 VPMAXSQ %XMM0,%XMM6,%XMM0 |
(1026) 0x4690b6 VPSHUFD $-0x12,%XMM0,%XMM2 |
(1026) 0x4690bb VPMAXSQ %XMM2,%XMM0,%XMM0 |
(1026) 0x4690c1 VPBROADCASTQ %XMM0,%YMM0 |
(1026) 0x4690c6 VPCMPEQQ %YMM0,%YMM6,%K0 |
(1026) 0x4690cc KMOVD %K0,%EAX |
(1026) 0x4690d0 TZCNT %EAX,%EAX |
(1026) 0x4690d4 VMOVAPD %YMM25,0x220(%RSP) |
(1026) 0x4690dc AND $0x3,%EAX |
(1026) 0x4690df VMOVSD 0x220(%RSP,%RAX,8),%XMM30 |
(1026) 0x4690e7 VPTEST %YMM7,%YMM3 |
(1026) 0x4690ec JB 469135 |
(1026) 0x4690ee VEXTRACTI128 $0x1,%YMM3,%XMM0 |
(1026) 0x4690f4 VPMAXSQ %XMM0,%XMM3,%XMM0 |
(1026) 0x4690fa VPSHUFD $-0x12,%XMM0,%XMM2 |
(1026) 0x4690ff VPMAXSQ %XMM2,%XMM0,%XMM0 |
(1026) 0x469105 VPBROADCASTQ %XMM0,%YMM0 |
(1026) 0x46910a VPCMPEQQ %YMM0,%YMM3,%K0 |
(1026) 0x469110 KMOVD %K0,%EAX |
(1026) 0x469114 TZCNT %EAX,%EAX |
(1026) 0x469118 VMOVAPD %YMM24,0x200(%RSP) |
(1026) 0x469120 AND $0x3,%EAX |
(1026) 0x469123 VMOVQ 0x200(%RSP,%RAX,8),%XMM0 |
(1026) 0x46912c VMOVDQA %XMM0,0x170(%RSP) |
(1026) 0x469135 VPTEST %YMM7,%YMM11 |
(1026) 0x46913a JB 469179 |
(1026) 0x46913c VEXTRACTI128 $0x1,%YMM11,%XMM0 |
(1026) 0x469142 VPMAXSQ %XMM0,%XMM11,%XMM0 |
(1026) 0x469148 VPSHUFD $-0x12,%XMM0,%XMM2 |
(1026) 0x46914d VPMAXSQ %XMM2,%XMM0,%XMM0 |
(1026) 0x469153 VPBROADCASTQ %XMM0,%YMM0 |
(1026) 0x469158 VPCMPEQQ %YMM0,%YMM11,%K0 |
(1026) 0x46915e KMOVD %K0,%EAX |
(1026) 0x469162 TZCNT %EAX,%EAX |
(1026) 0x469166 VMOVAPD %YMM23,0x1e0(%RSP) |
(1026) 0x46916e AND $0x3,%EAX |
(1026) 0x469171 VMOVSD 0x1e0(%RSP,%RAX,8),%XMM31 |
(1026) 0x469179 VPTEST %YMM7,%YMM12 |
(1026) 0x46917e JB 4691c7 |
(1026) 0x469180 VEXTRACTI128 $0x1,%YMM12,%XMM0 |
(1026) 0x469186 VPMAXSQ %XMM0,%XMM12,%XMM0 |
(1026) 0x46918c VPSHUFD $-0x12,%XMM0,%XMM2 |
(1026) 0x469191 VPMAXSQ %XMM2,%XMM0,%XMM0 |
(1026) 0x469197 VPBROADCASTQ %XMM0,%YMM0 |
(1026) 0x46919c VPCMPEQQ %YMM0,%YMM12,%K0 |
(1026) 0x4691a2 KMOVD %K0,%EAX |
(1026) 0x4691a6 TZCNT %EAX,%EAX |
(1026) 0x4691aa VMOVAPD %YMM22,0x1c0(%RSP) |
(1026) 0x4691b2 AND $0x3,%EAX |
(1026) 0x4691b5 VMOVQ 0x1c0(%RSP,%RAX,8),%XMM0 |
(1026) 0x4691be VMOVDQA %XMM0,0x160(%RSP) |
(1026) 0x4691c7 MOV 0x20(%RSP),%RAX |
(1026) 0x4691cc MOV %RAX,%RDX |
(1026) 0x4691cf CMP 0x48(%RSP),%RAX |
(1026) 0x4691d4 VMOVSD 0x130(%RSP),%XMM2 |
(1026) 0x4691dd JE 468a80 |
(1026) 0x4691e3 JMP 469224 |
0x4691e5 NOPW %CS:(%RAX,%RAX,1) |
(1026) 0x4691f0 SUB 0x40(%RSP),%R13 |
(1026) 0x4691f5 MOV %R9,%RAX |
(1026) 0x4691f8 IMUL %R13,%RAX |
(1026) 0x4691fc MOV %RAX,0x50(%RSP) |
(1026) 0x469201 LEA 0x1(%R13),%R15 |
(1026) 0x469205 IMUL %R15,%R9 |
(1026) 0x469209 MOV %R9,0x58(%RSP) |
(1026) 0x46920e MOV %R12,%RAX |
(1026) 0x469211 IMUL %R13,%RAX |
(1026) 0x469215 MOV %RAX,0x18(%RSP) |
(1026) 0x46921a IMUL %R12,%R15 |
(1026) 0x46921e IMUL %RDI,%R13 |
(1026) 0x469222 XOR %EDX,%EDX |
(1026) 0x469224 MOV 0x10(%RBP),%RCX |
(1026) 0x469228 MOV 0x50(%RSP),%R12 |
(1026) 0x46922d ADD %RCX,%R12 |
(1026) 0x469230 MOV 0xe0(%RSP),%RAX |
(1026) 0x469238 MOV %RDX,0x60(%RSP) |
(1026) 0x46923d ADD %RAX,%RDX |
(1026) 0x469240 MOV %RDX,%R9 |
(1026) 0x469243 MOV 0xd8(%RSP),%RSI |
(1026) 0x46924b SUB %RSI,%R9 |
(1026) 0x46924e VMOVSD (%R12,%R9,8),%XMM3 |
(1026) 0x469254 MOV 0x58(%RSP),%RAX |
(1026) 0x469259 ADD %RCX,%RAX |
(1026) 0x46925c VMOVSD (%RAX,%R9,8),%XMM12 |
(1026) 0x469262 MOV 0x18(%RBP),%RAX |
(1026) 0x469266 MOV 0x18(%RSP),%RCX |
(1026) 0x46926b ADD %RAX,%RCX |
(1026) 0x46926e VMOVSD (%RCX,%R9,8),%XMM11 |
(1026) 0x469274 NOT %RSI |
(1026) 0x469277 ADD %RDX,%RSI |
(1026) 0x46927a ADD %RAX,%R15 |
(1026) 0x46927d VMOVSD (%R15,%R9,8),%XMM6 |
(1026) 0x469283 IMUL %R8,%R10 |
(1026) 0x469287 LEA (%R10,%RDX,8),%RAX |
(1026) 0x46928b MOV 0xc0(%RSP),%RCX |
(1026) 0x469293 LEA (%RCX,%RDX,8),%RCX |
(1026) 0x469297 MOV %RCX,0x18(%RSP) |
(1026) 0x46929c ADD 0x28(%RBP),%R13 |
(1026) 0x4692a0 VMOVSD (%R13,%RSI,8),%XMM24 |
(1026) 0x4692a8 IMUL %RDI,%R14 |
(1026) 0x4692ac LEA (%R14,%RDX,8),%R10 |
(1026) 0x4692b0 MOV %RDI,%RSI |
(1026) 0x4692b3 IMUL %RBX,%RSI |
(1026) 0x4692b7 LEA (%RSI,%RDX,8),%RSI |
(1026) 0x4692bb VMOVSD (%R13,%R9,8),%XMM22 |
(1026) 0x4692c3 IMUL %R8,%RDI |
(1026) 0x4692c7 LEA (%RDI,%RDX,8),%RDI |
(1026) 0x4692cb MOV 0x140(%RSP),%RCX |
(1026) 0x4692d3 MOV %RCX,%R14 |
(1026) 0x4692d6 IMUL %R8,%R14 |
(1026) 0x4692da LEA (%R14,%RDX,8),%R13 |
(1026) 0x4692de IMUL %RBX,%RCX |
(1026) 0x4692e2 LEA (%RCX,%RDX,8),%R12 |
(1026) 0x4692e6 MOV 0x148(%RSP),%RCX |
(1026) 0x4692ee IMUL %RCX,%RBX |
(1026) 0x4692f2 LEA (%RBX,%RDX,8),%RBX |
(1026) 0x4692f6 IMUL %R8,%RCX |
(1026) 0x4692fa LEA (%RCX,%RDX,8),%R14 |
(1026) 0x4692fe MOV 0xb0(%RSP),%RCX |
(1026) 0x469306 LEA (%RCX,%RDX,8),%R15 |
(1026) 0x46930a MOV 0x40(%RBP),%RCX |
(1026) 0x46930e VMOVSD (%RCX,%R9,8),%XMM0 |
(1026) 0x469314 VDIVSD %XMM4,%XMM15,%XMM9 |
(1026) 0x469318 VDIVSD %XMM2,%XMM15,%XMM2 |
(1026) 0x46931c MOV 0x48(%RSP),%RDX |
(1026) 0x469321 SUB 0x60(%RSP),%RDX |
(1026) 0x469326 ADD 0xb8(%RSP),%RAX |
(1026) 0x46932e MOV 0xd0(%RSP),%RCX |
(1026) 0x469336 ADD %RCX,%R10 |
(1026) 0x469339 ADD %RCX,%RSI |
(1026) 0x46933c ADD 0xa8(%RSP),%RDI |
(1026) 0x469344 MOV 0xa0(%RSP),%RCX |
(1026) 0x46934c ADD %RCX,%R13 |
(1026) 0x46934f ADD %RCX,%R12 |
(1026) 0x469352 MOV 0xc8(%RSP),%RCX |
(1026) 0x46935a ADD %RCX,%RBX |
(1026) 0x46935d ADD %RCX,%R14 |
(1026) 0x469360 XOR %R9D,%R9D |
(1026) 0x469363 JMP 469389 |
0x469365 NOPW %CS:(%RAX,%RAX,1) |
(1027) 0x469370 VMOVSD %XMM26,(%RAX,%R9,8) |
(1027) 0x469377 INC %R9 |
(1027) 0x46937a VMOVAPD %XMM23,%XMM24 |
(1027) 0x469380 CMP %R9,%RDX |
(1027) 0x469383 JE 468a80 |
(1027) 0x469389 VMOVAPD %XMM0,%XMM25 |
(1027) 0x46938f VMOVAPD %XMM22,%XMM23 |
(1027) 0x469395 VMOVAPD %XMM6,%XMM0 |
(1027) 0x469399 VMOVAPD %XMM11,%XMM4 |
(1027) 0x46939d VMOVAPD %XMM12,%XMM5 |
(1027) 0x4693a1 VMOVAPD %XMM3,%XMM7 |
(1027) 0x4693a5 VMOVSD (%R14,%R9,8),%XMM11 |
(1027) 0x4693ab VMOVSD (%RBX,%R9,8),%XMM6 |
(1027) 0x4693b1 VADDSD %XMM6,%XMM11,%XMM8 |
(1027) 0x4693b5 VADDSD %XMM0,%XMM4,%XMM10 |
(1027) 0x4693b9 VMOVSD (%R12,%R9,8),%XMM12 |
(1027) 0x4693bf VMOVSD (%R13,%R9,8),%XMM3 |
(1027) 0x4693c6 VSUBSD %XMM10,%XMM8,%XMM29 |
(1027) 0x4693cc VADDSD %XMM5,%XMM12,%XMM8 |
(1027) 0x4693d0 VADDSD %XMM3,%XMM7,%XMM10 |
(1027) 0x4693d4 VSUBSD %XMM10,%XMM8,%XMM28 |
(1027) 0x4693da VADDSD %XMM4,%XMM11,%XMM4 |
(1027) 0x4693de VSUBSD %XMM4,%XMM6,%XMM4 |
(1027) 0x4693e2 VADDSD %XMM0,%XMM4,%XMM0 |
(1027) 0x4693e6 VMULSD %XMM1,%XMM0,%XMM0 |
(1027) 0x4693ea VADDSD %XMM7,%XMM5,%XMM4 |
(1027) 0x4693ee VSUBSD %XMM4,%XMM12,%XMM4 |
(1027) 0x4693f2 VADDSD %XMM3,%XMM4,%XMM4 |
(1027) 0x4693f6 VMULSD %XMM1,%XMM4,%XMM4 |
(1027) 0x4693fa VDIVSD %XMM25,%XMM15,%XMM5 |
(1027) 0x469400 VMULSD %XMM5,%XMM4,%XMM4 |
(1027) 0x469404 VFMADD231SD %XMM0,%XMM9,%XMM4 |
(1027) 0x469409 VMOVSD (%RDI,%R9,8),%XMM22 |
(1027) 0x469410 VSUBSD %XMM24,%XMM22,%XMM7 |
(1027) 0x469416 VMOVSD (%R15,%R9,8),%XMM0 |
(1027) 0x46941c VADDSD %XMM25,%XMM0,%XMM8 |
(1027) 0x469422 VDIVSD %XMM8,%XMM7,%XMM27 |
(1027) 0x469428 VMOVSD (%RSI,%R9,8),%XMM7 |
(1027) 0x46942e VSUBSD (%R10,%R9,8),%XMM7,%XMM7 |
(1027) 0x469434 VMULSD %XMM2,%XMM7,%XMM24 |
(1027) 0x46943a VMULSD %XMM27,%XMM27,%XMM7 |
(1027) 0x469440 VMULSD %XMM24,%XMM24,%XMM8 |
(1027) 0x469446 VMULSD %XMM1,%XMM29,%XMM10 |
(1027) 0x46944c VMULSD %XMM5,%XMM10,%XMM5 |
(1027) 0x469450 VMULSD %XMM7,%XMM5,%XMM5 |
(1027) 0x469454 VMULSD %XMM1,%XMM28,%XMM10 |
(1027) 0x46945a VMULSD %XMM8,%XMM10,%XMM10 |
(1027) 0x46945f VMULSD %XMM4,%XMM27,%XMM4 |
(1027) 0x469465 VFMADD213SD %XMM5,%XMM24,%XMM4 |
(1027) 0x46946b VFMADD231SD %XMM10,%XMM9,%XMM4 |
(1027) 0x469470 VADDSD %XMM7,%XMM8,%XMM5 |
(1027) 0x469474 VMAXSD %XMM16,%XMM5,%XMM5 |
(1027) 0x46947a VDIVSD %XMM5,%XMM4,%XMM21 |
(1027) 0x469480 VXORPD %XMM26,%XMM26,%XMM26 |
(1027) 0x469486 VUCOMISD %XMM26,%XMM21 |
(1027) 0x46948c JA 469370 |
(1027) 0x469492 VMULSD %XMM29,%XMM25,%XMM4 |
(1027) 0x469498 VMOVAPD 0x180(%RSP),%XMM10 |
(1027) 0x4694a1 VFMADD213SD %XMM4,%XMM10,%XMM28 |
(1027) 0x4694a7 VUCOMISD %XMM18,%XMM28 |
(1027) 0x4694ad JAE 469370 |
(1027) 0x4694b3 VCMPSD $0x1,%XMM18,%XMM27,%K1 |
(1027) 0x4694ba VMOVAPD %XMM15,%XMM13 |
(1027) 0x4694bf VMOVSD %XMM17,%XMM13,%XMM13{%K1} |
(1027) 0x4694c5 VMOVDDUP 0x88edb(%RIP),%XMM4 |
(1027) 0x4694cd VANDPD %XMM4,%XMM27,%XMM5 |
(1027) 0x4694d3 VMAXSD %XMM16,%XMM5,%XMM5 |
(1027) 0x4694d9 VMULSD %XMM5,%XMM13,%XMM5 |
(1027) 0x4694dd VCMPSD $0x1,%XMM18,%XMM5,%K1 |
(1027) 0x4694e4 VMOVAPD %XMM15,%XMM14 |
(1027) 0x4694e9 VMOVSD %XMM17,%XMM14,%XMM14{%K1} |
(1027) 0x4694ef VANDPD %XMM4,%XMM24,%XMM7 |
(1027) 0x4694f5 VMAXSD %XMM16,%XMM7,%XMM7 |
(1027) 0x4694fb VMULSD %XMM7,%XMM14,%XMM7 |
(1027) 0x4694ff VMULSD %XMM5,%XMM5,%XMM8 |
(1027) 0x469503 VFMADD231SD %XMM7,%XMM7,%XMM8 |
(1027) 0x469508 VSQRTSD %XMM8,%XMM8,%XMM19 |
(1027) 0x46950e VMULSD %XMM25,%XMM19,%XMM8 |
(1027) 0x469514 VDIVSD %XMM5,%XMM8,%XMM5 |
(1027) 0x469518 VANDPD %XMM4,%XMM5,%XMM30 |
(1027) 0x46951e VMULSD %XMM10,%XMM19,%XMM5 |
(1027) 0x469524 VDIVSD %XMM7,%XMM5,%XMM5 |
(1027) 0x469528 VANDPD %XMM4,%XMM5,%XMM4 |
(1027) 0x46952c VMOVAPD %XMM4,0x170(%RSP) |
(1027) 0x469535 VMINSD %XMM4,%XMM30,%XMM31 |
(1027) 0x46953b VMULSD %XMM31,%XMM31,%XMM5 |
(1027) 0x469541 VMULSD %XMM21,%XMM21,%XMM4 |
(1027) 0x469547 VMOVAPD %XMM5,0x160(%RSP) |
(1027) 0x469550 VADDSD %XMM5,%XMM5,%XMM5 |
(1027) 0x469554 VMULSD %XMM5,%XMM4,%XMM4 |
(1027) 0x469558 MOV 0x88(%RBP),%RCX |
(1027) 0x46955f MOV (%RCX),%RCX |
(1027) 0x469562 IMUL %R8,%RCX |
(1027) 0x469566 ADD 0x18(%RSP),%RCX |
(1027) 0x46956b VMULSD (%RCX,%R9,8),%XMM4,%XMM26 |
(1027) 0x469572 JMP 469370 |
0x469577 NOPW (%RAX,%RAX,1) |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
►100.00+ | __kmp_invoke_microtask | libiomp5.so | |
○ | __kmp_invoke_task_func | libiomp5.so |
Path / |
Source file and lines | viscosity_kernel.f90:50-94 |
Module | exec |
nb instructions | 146 |
nb uops | 150 |
loop length | 699 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 5 |
used ymm registers | 1 |
used zmm registers | 0 |
nb stack references | 46 |
micro-operation queue | 25.00 cycles |
front end | 25.00 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 9.10 | 9.00 | 10.00 | 10.00 | 21.50 | 9.07 | 8.90 | 21.50 | 21.50 | 21.50 | 8.93 | 10.00 |
cycles | 9.10 | 13.37 | 10.00 | 10.00 | 21.50 | 9.07 | 8.90 | 21.50 | 21.50 | 21.50 | 8.93 | 10.00 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 24.53-24.58 |
Stall cycles | 0.00 |
Front-end | 25.00 |
Dispatch | 21.50 |
Overall L1 | 25.00 |
all | 2% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 20% |
all | 16% |
load | 0% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 50% |
all | 4% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 28% |
all | 11% |
load | 6% |
store | 11% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 6% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 13% |
all | 14% |
load | 12% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 18% |
all | 11% |
load | 10% |
store | 11% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 6% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 15% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
AND $-0x20,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SUB $0x2c0,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x50(%RBP),%EBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x48(%RBP),%EAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SUB %EBX,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOVL $0,0x3c(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JS 4688a5 <viscosity_kernel_module_mp_viscosity_kernel_.DIR.OMP.PARALLEL.2+0xa5> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R9,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RCX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDI,0x70(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVL $0,0x14(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %EAX,0x10(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVL $0x1,0x38(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB $0x8,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA 0x40(%RSP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x44(%RSP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x1c(%RSP),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x18(%RSP),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0x73a630,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %ESI,0x34(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x22,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
CALL 404520 <__kmpc_for_static_init_4@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
ADD $0x20,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x14(%RSP),%EAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RSP),%ECX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SUB %EAX,%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %ECX,0x30(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JAE 4688c0 <viscosity_kernel_module_mp_viscosity_kernel_.DIR.OMP.PARALLEL.2+0xc0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV $0x73a650,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x2c(%RSP),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 404110 <__kmpc_for_static_fini@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x70(%RSP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x73a670,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 4045e0 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
LEA -0x28(%RBP),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
MOV %RAX,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x60(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x58(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVSXD (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RCX),%ECX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SUB %EDI,%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %EBX,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
LEA -0x2(%R12),%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
CLTQ | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
MOV %RAX,0x100(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,0x138(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA 0x1(%RCX),%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
CMP $0x2,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVGE %EAX,%ECX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RCX,0x48(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
AND $0x7ffffffc,%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV %RCX,0x20(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVSXD %R12D,%RCX | 1 | 0 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0.33 | 0 | 1 | 0.33 |
MOVSXD %R15D,%RDX | 1 | 0 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0.33 | 0 | 1 | 0.33 |
LEA -0x2(%RDX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,0xd8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,0xe0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (,%RDI,8),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SAL $0x3,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
SUB %RDX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x2,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SUB %RCX,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RDI,0xf8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x1,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SUB %RCX,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RDI,0xf0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x10,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SUB %RDX,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x18,%R8D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SUB %RDX,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x3,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SUB %RCX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RDX,0xe8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD $-0x2,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RCX,0x40(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x40(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x30(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x28(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x20(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x18(%R9,%RAX,1),%R11 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R11,0x98(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA 0x10(%R10,%RAX,1),%R11 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R11,0x90(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA 0x10(%RDX,%RAX,1),%R11 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R11,0x158(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA 0x10(%R9,%RAX,1),%R11 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R11,0x88(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA 0x18(%RCX,%RAX,1),%R11 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA 0x18(%R14,%RAX,1),%R15 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R15,0x80(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD %RBX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD $0x18,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RAX,0x78(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD %RDI,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R10,0xb8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD %RDI,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RDX,0xc0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD %R9,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RDI,0xd0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%RCX,%R8,1),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,0xb0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%R9,%R8,1),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,0xa8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%R14,%R8,1),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,0xa0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD %RBX,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R8,0xc8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD 0x89ae2(%RIP),%XMM15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x8a7ba(%RIP),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0xa7448(%RIP),%XMM16 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0xa7446(%RIP),%XMM17 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VBROADCASTSD 0x89abc(%RIP),%YMM20 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VXORPD %XMM18,%XMM18,%XMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,0x108(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %ESI,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JMP 468a9d <viscosity_kernel_module_mp_viscosity_kernel_.DIR.OMP.PARALLEL.2+0x29d> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Source file and lines | viscosity_kernel.f90:50-94 |
Module | exec |
nb instructions | 146 |
nb uops | 150 |
loop length | 699 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 5 |
used ymm registers | 1 |
used zmm registers | 0 |
nb stack references | 46 |
micro-operation queue | 25.00 cycles |
front end | 25.00 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 9.10 | 9.00 | 10.00 | 10.00 | 21.50 | 9.07 | 8.90 | 21.50 | 21.50 | 21.50 | 8.93 | 10.00 |
cycles | 9.10 | 13.37 | 10.00 | 10.00 | 21.50 | 9.07 | 8.90 | 21.50 | 21.50 | 21.50 | 8.93 | 10.00 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 24.53-24.58 |
Stall cycles | 0.00 |
Front-end | 25.00 |
Dispatch | 21.50 |
Overall L1 | 25.00 |
all | 2% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 20% |
all | 16% |
load | 0% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 50% |
all | 4% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 28% |
all | 11% |
load | 6% |
store | 11% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 6% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 13% |
all | 14% |
load | 12% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 18% |
all | 11% |
load | 10% |
store | 11% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | 6% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 15% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
AND $-0x20,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SUB $0x2c0,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x50(%RBP),%EBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x48(%RBP),%EAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SUB %EBX,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOVL $0,0x3c(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JS 4688a5 <viscosity_kernel_module_mp_viscosity_kernel_.DIR.OMP.PARALLEL.2+0xa5> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %R9,%R15 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RCX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDI,0x70(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVL $0,0x14(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %EAX,0x10(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVL $0x1,0x38(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB $0x8,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA 0x40(%RSP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x44(%RSP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x1c(%RSP),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x18(%RSP),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0x73a630,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %ESI,0x34(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x22,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
CALL 404520 <__kmpc_for_static_init_4@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
ADD $0x20,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x14(%RSP),%EAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RSP),%ECX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SUB %EAX,%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %ECX,0x30(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JAE 4688c0 <viscosity_kernel_module_mp_viscosity_kernel_.DIR.OMP.PARALLEL.2+0xc0> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV $0x73a650,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x2c(%RSP),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 404110 <__kmpc_for_static_fini@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x70(%RSP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x73a670,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 4045e0 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
LEA -0x28(%RBP),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
MOV %RAX,%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x60(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x58(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVSXD (%RAX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RCX),%ECX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SUB %EDI,%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %EBX,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
LEA -0x2(%R12),%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
CLTQ | 1 | 0 | 0.50 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.33 |
MOV %RAX,0x100(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RCX,0x138(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA 0x1(%RCX),%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
CMP $0x2,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVGE %EAX,%ECX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RCX,0x48(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
AND $0x7ffffffc,%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV %RCX,0x20(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVSXD %R12D,%RCX | 1 | 0 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0.33 | 0 | 1 | 0.33 |
MOVSXD %R15D,%RDX | 1 | 0 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0.33 | 0 | 1 | 0.33 |
LEA -0x2(%RDX),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,0xd8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,0xe0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (,%RDI,8),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SAL $0x3,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
SUB %RDX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x2,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SUB %RCX,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RDI,0xf8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x1,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SUB %RCX,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RDI,0xf0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x10,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SUB %RDX,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x18,%R8D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SUB %RDX,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x3,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SUB %RCX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RDX,0xe8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD $-0x2,%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RCX,0x40(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x40(%RBP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x30(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x28(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x20(%RBP),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RBP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x18(%R9,%RAX,1),%R11 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R11,0x98(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA 0x10(%R10,%RAX,1),%R11 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R11,0x90(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA 0x10(%RDX,%RAX,1),%R11 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R11,0x158(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA 0x10(%R9,%RAX,1),%R11 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R11,0x88(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA 0x18(%RCX,%RAX,1),%R11 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA 0x18(%R14,%RAX,1),%R15 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R15,0x80(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD %RBX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD $0x18,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RAX,0x78(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD %RDI,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R10,0xb8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD %RDI,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RDX,0xc0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD %R9,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RDI,0xd0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%RCX,%R8,1),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,0xb0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%R9,%R8,1),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,0xa8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%R14,%R8,1),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,0xa0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD %RBX,%R8 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R8,0xc8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD 0x89ae2(%RIP),%XMM15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x8a7ba(%RIP),%XMM1 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0xa7448(%RIP),%XMM16 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0xa7446(%RIP),%XMM17 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VBROADCASTSD 0x89abc(%RIP),%YMM20 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VXORPD %XMM18,%XMM18,%XMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %EDI,%EDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,0x108(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %ESI,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JMP 468a9d <viscosity_kernel_module_mp_viscosity_kernel_.DIR.OMP.PARALLEL.2+0x29d> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼viscosity_kernel_.DIR.OMP.PARALLEL.2– | 4.23 | 1.36 |
▼Loop 1026 - viscosity_kernel.f90:53-89 - exec– | 0 | 0 |
○Loop 1028 - viscosity_kernel.f90:53-89 - exec | 4.23 | 1.35 |
○Loop 1027 - viscosity_kernel.f90:55-89 - exec | 0 | 0 |