Function: viscosity_kernel_.DIR.OMP.PARALLEL.2 | Module: exec | Source: viscosity_kernel.f90:50-94 | Coverage: 2.21% |
---|
Function: viscosity_kernel_.DIR.OMP.PARALLEL.2 | Module: exec | Source: viscosity_kernel.f90:50-94 | Coverage: 2.21% |
---|
/home/eoseret/qaas_runs_CPU_9468/171-152-3172/intel/CloverLeafFC/build/CloverLeafFC/CloverLeaf_ref/kernels/viscosity_kernel.f90: 50 - 94 |
-------------------------------------------------------------------------------- |
50: !$OMP PARALLEL |
51: ! Per-cell viscosity: k rows are shared out by OMP DO, the inner j loop is marked SIMD. |
52: !$OMP DO PRIVATE(ugrad,vgrad,div,strain2,pgradx,pgrady,pgradx2,pgrady2,limiter,pgrad,xgrad,ygrad,grad,grad2,dirx,diry) |
53: DO k=y_min,y_max |
54: !$OMP SIMD |
55: DO j=x_min,x_max |
56: ugrad=(xvel0(j+1,k )+xvel0(j+1,k+1))-(xvel0(j ,k )+xvel0(j ,k+1)) |
57: ! ugrad/vgrad: difference of xvel0 between columns j+1 and j, and of yvel0 between rows k+1 and k. |
58: vgrad=(yvel0(j ,k+1)+yvel0(j+1,k+1))-(yvel0(j ,k )+yvel0(j+1,k )) |
59: ! div: ugrad and vgrad weighted by celldx(j) and celldy(k). |
60: div = (celldx(j)*(ugrad)+ celldy(k)*(vgrad)) |
61: ! strain2: half the k-difference of xvel0 over celldy(k) plus half the j-difference of yvel0 over celldx(j). |
62: strain2 = 0.5_8*(xvel0(j, k+1) + xvel0(j+1,k+1)-xvel0(j ,k )-xvel0(j+1,k ))/celldy(k) & |
63: + 0.5_8*(yvel0(j+1,k ) + yvel0(j+1,k+1)-yvel0(j ,k )-yvel0(j ,k+1))/celldx(j) |
64: ! pgradx/pgrady: pressure difference between the j+1/j-1 (k+1/k-1) neighbours over the sum of two cell widths. |
65: pgradx=(pressure(j+1,k)-pressure(j-1,k))/(celldx(j)+celldx(j+1)) |
66: pgrady=(pressure(j,k+1)-pressure(j,k-1))/(celldy(k)+celldy(k+1)) |
67: |
68: pgradx2 = pgradx*pgradx |
69: pgrady2 = pgrady*pgrady |
70: ! limiter: the MAX floor of 1.0e-16 keeps the denominator away from zero when both gradients vanish. |
71: limiter = ((0.5_8*(ugrad)/celldx(j))*pgradx2+(0.5_8*(vgrad)/celldy(k))*pgrady2+strain2*pgradx*pgrady) & |
72: /MAX(pgradx2+pgrady2,1.0e-16_8) |
73: ! Viscosity is zero when limiter > 0 or div >= 0; otherwise it is built from the clamped gradients. |
74: IF ((limiter.GT.0.0).OR.(div.GE.0.0))THEN |
75: viscosity(j,k) = 0.0 |
76: ELSE |
77: dirx=1.0_8 |
78: IF(pgradx.LT.0.0) dirx=-1.0_8 |
79: pgradx = dirx*MAX(1.0e-16_8,ABS(pgradx)) |
80: diry=1.0_8 |
81: IF(pgrady.LT.0.0) diry=-1.0_8 ! sign of pgrady itself (was pgradx, already clamped on line 79) |
82: pgrady = diry*MAX(1.0e-16_8,ABS(pgrady)) |
83: pgrad = SQRT(pgradx**2+pgrady**2) |
84: xgrad = ABS(celldx(j)*pgrad/pgradx) |
85: ygrad = ABS(celldy(k)*pgrad/pgrady) |
86: grad = MIN(xgrad,ygrad) |
87: grad2 = grad*grad |
88: ! pgradx/pgrady reach grad only through squares and ABS, so the dirx/diry signs do not change viscosity. |
89: viscosity(j,k)=2.0_8*density0(j,k)*grad2*limiter*limiter |
90: ENDIF |
91: ! NOTE: the disassembly in this report was built from the earlier line 81 and still tests pgradx for diry. |
92: ENDDO |
93: ENDDO |
94: !$OMP END DO |
0x46b220 PUSH %RBP |
0x46b221 MOV %RSP,%RBP |
0x46b224 PUSH %R15 |
0x46b226 PUSH %R14 |
0x46b228 PUSH %R13 |
0x46b22a PUSH %R12 |
0x46b22c PUSH %RBX |
0x46b22d AND $-0x20,%RSP |
0x46b231 SUB $0x300,%RSP |
0x46b238 MOV %R9,0x30(%RSP) |
0x46b23d MOV %R8,0x28(%RSP) |
0x46b242 MOV 0x40(%RBP),%EBX |
0x46b245 MOV 0x38(%RBP),%EAX |
0x46b248 SUB %EBX,%EAX |
0x46b24a MOVL $0,0x24(%RSP) |
0x46b252 JS 46b2cf |
0x46b254 MOV %RCX,%R12 |
0x46b257 MOV %RDX,%R13 |
0x46b25a MOV %RDI,0x48(%RSP) |
0x46b25f MOV (%RDI),%ESI |
0x46b261 MOVL $0,0x10(%RSP) |
0x46b269 MOV %EAX,0xc(%RSP) |
0x46b26d MOVL $0x1,0x20(%RSP) |
0x46b275 SUB $0x8,%RSP |
0x46b279 LEA 0x28(%RSP),%RAX |
0x46b27e LEA 0x2c(%RSP),%RCX |
0x46b283 LEA 0x18(%RSP),%R8 |
0x46b288 LEA 0x14(%RSP),%R9 |
0x46b28d MOV $0x53d630,%EDI |
0x46b292 MOV %ESI,0x1c(%RSP) |
0x46b296 MOV $0x22,%EDX |
0x46b29b PUSH $0x1 |
0x46b29d PUSH $0x1 |
0x46b29f PUSH %RAX |
0x46b2a0 CALL 404670 <__kmpc_for_static_init_4@plt> |
0x46b2a5 ADD $0x20,%RSP |
0x46b2a9 MOV 0x10(%RSP),%EAX |
0x46b2ad MOV 0xc(%RSP),%ECX |
0x46b2b1 SUB %EAX,%ECX |
0x46b2b3 MOV %ECX,0x18(%RSP) |
0x46b2b7 JAE 46b2ea |
0x46b2b9 MOV $0x53d650,%EDI |
0x46b2be MOV 0x14(%RSP),%ESI |
0x46b2c2 VZEROUPPER |
0x46b2c5 CALL 404230 <__kmpc_for_static_fini@plt> |
0x46b2ca MOV 0x48(%RSP),%RDI |
0x46b2cf MOV (%RDI),%ESI |
0x46b2d1 MOV $0x53d670,%EDI |
0x46b2d6 CALL 404740 <__kmpc_barrier@plt> |
0x46b2db LEA -0x28(%RBP),%RSP |
0x46b2df POP %RBX |
0x46b2e0 POP %R12 |
0x46b2e2 POP %R13 |
0x46b2e4 POP %R14 |
0x46b2e6 POP %R15 |
0x46b2e8 POP %RBP |
0x46b2e9 RET |
0x46b2ea MOV %RAX,%RDI |
0x46b2ed MOV 0x50(%RBP),%RDX |
0x46b2f1 MOV 0x48(%RBP),%RSI |
0x46b2f5 SAL $0x20,%R12 |
0x46b2f9 MOV $-0x200000000,%RAX |
0x46b303 LEA (%R12,%RAX,1),%RCX |
0x46b307 MOV %RCX,%R8 |
0x46b30a SAR $0x20,%R8 |
0x46b30e SAL $0x20,%R13 |
0x46b312 ADD %R13,%RAX |
0x46b315 MOV %RAX,%R9 |
0x46b318 SAR $0x20,%R9 |
0x46b31c MOVSXD (%RDX),%R10 |
0x46b31f MOV (%RSI),%EDX |
0x46b321 SUB %R10D,%EDX |
0x46b324 ADD %EBX,%EDI |
0x46b326 MOV %RDX,0x130(%RSP) |
0x46b32e INC %EDX |
0x46b330 CMP $0x2,%EDX |
0x46b333 MOV $0x1,%ESI |
0x46b338 CMOVGE %EDX,%ESI |
0x46b33b MOV %RSI,0x38(%RSP) |
0x46b340 AND $0x7ffffffc,%ESI |
0x46b346 MOV %RSI,0xd8(%RSP) |
0x46b34e TEST %RCX,%RCX |
0x46b351 MOV $-0x1,%RSI |
0x46b358 CMOVNS %RCX,%RSI |
0x46b35c TEST %RSI,%RSI |
0x46b35f MOV $0x1,%R11D |
0x46b365 CMOVG %R11,%RSI |
0x46b369 MOV $0x200000000,%RBX |
0x46b373 MOV %RBX,%RDX |
0x46b376 SUB %R12,%RDX |
0x46b379 CMP %RDX,%RCX |
0x46b37c CMOVG %RCX,%RDX |
0x46b380 LEA (,%R10,8),%RCX |
0x46b388 SHR $0x20,%RDX |
0x46b38c IMUL %RSI,%RDX |
0x46b390 MOV $-0x1,%RSI |
0x46b397 SAL $0x3,%RDX |
0x46b39b SUB %RDX,%RCX |
0x46b39e TEST %RAX,%RAX |
0x46b3a1 CMOVNS %RAX,%RSI |
0x46b3a5 TEST %RSI,%RSI |
0x46b3a8 CMOVG %R11,%RSI |
0x46b3ac SUB %R13,%RBX |
0x46b3af MOV 0x30(%RBP),%R14 |
0x46b3b3 CMP %RBX,%RAX |
0x46b3b6 CMOVG %RAX,%RBX |
0x46b3ba MOV %R8,%RAX |
0x46b3bd NOT %RAX |
0x46b3c0 MOV %RAX,0xa8(%RSP) |
0x46b3c8 SHR $0x20,%RBX |
0x46b3cc IMUL %RSI,%RBX |
0x46b3d0 NEG %RBX |
0x46b3d3 MOV %RBX,0xc8(%RSP) |
0x46b3db MOV $0x8,%ESI |
0x46b3e0 SUB %RDX,%RSI |
0x46b3e3 MOV %R9,%RAX |
0x46b3e6 NOT %RAX |
0x46b3e9 MOV %RAX,0xc0(%RSP) |
0x46b3f1 MOV %R9,0xe0(%RSP) |
0x46b3f9 SUB %R9,%R11 |
0x46b3fc MOV %R11,0xd0(%RSP) |
0x46b404 MOV 0x20(%RBP),%RAX |
0x46b408 MOV 0x18(%RBP),%R9 |
0x46b40c MOV 0x10(%RBP),%RDX |
0x46b410 LEA 0x8(%R9,%RCX,1),%R11 |
0x46b415 MOV %R11,0x78(%RSP) |
0x46b41a ADD %RCX,%RDX |
0x46b41d MOV %RDX,0x70(%RSP) |
0x46b422 LEA (%RAX,%RCX,1),%RAX |
0x46b426 MOV %RAX,0x68(%RSP) |
0x46b42b LEA (%R9,%RCX,1),%RAX |
0x46b42f MOV %RAX,0x60(%RSP) |
0x46b434 LEA 0x8(%R14,%RCX,1),%RAX |
0x46b439 MOV %RAX,0x158(%RSP) |
0x46b441 MOV 0x28(%RSP),%RDX |
0x46b446 LEA 0x8(%RDX,%RCX,1),%RAX |
0x46b44b MOV %RAX,0x58(%RSP) |
0x46b450 MOV 0x30(%RSP),%RAX |
0x46b455 LEA 0x8(%RAX,%RCX,1),%RCX |
0x46b45a MOV %RCX,0x50(%RSP) |
0x46b45f MOV %R10,0xb0(%RSP) |
0x46b467 MOV %R8,0xb8(%RSP) |
0x46b46f SUB %R8,%R10 |
0x46b472 MOV %R10,0x98(%RSP) |
0x46b47a LEA (%R14,%RSI,1),%RCX |
0x46b47e MOV %RCX,0x90(%RSP) |
0x46b486 LEA (%R9,%RSI,1),%RCX |
0x46b48a MOV %RCX,0x88(%RSP) |
0x46b492 LEA (%RDX,%RSI,1),%RCX |
0x46b496 MOV %RCX,0x80(%RSP) |
0x46b49e ADD %RAX,%RSI |
0x46b4a1 MOV %RSI,0xa0(%RSP) |
0x46b4a9 VMOVSD 0x89ecd(%RIP),%XMM21 |
0x46b4b3 VMOVSD 0x8ab43(%RIP),%XMM22 |
0x46b4bd VMOVSD 0xa6b19(%RIP),%XMM23 |
0x46b4c7 VMOVSD 0xa6b17(%RIP),%XMM25 |
0x46b4d1 VBROADCASTSD 0x89ea6(%RIP),%YMM14 |
0x46b4da VXORPD %XMM18,%XMM18,%XMM18 |
0x46b4e0 XOR %R9D,%R9D |
0x46b4e3 MOV %RDI,0xe8(%RSP) |
0x46b4eb MOV %EDI,%ESI |
0x46b4ed JMP 46b50e |
0x46b4ef NOP |
(1026) 0x46b4f0 MOV 0x150(%RSP),%RCX |
(1026) 0x46b4f8 LEA 0x1(%RCX),%EAX |
(1026) 0x46b4fb MOV 0x1c(%RSP),%ESI |
(1026) 0x46b4ff INC %ESI |
(1026) 0x46b501 CMP 0x18(%RSP),%ECX |
(1026) 0x46b505 MOV %EAX,%R9D |
(1026) 0x46b508 JE 46b2b9 |
(1026) 0x46b50e CMPL $0,0x130(%RSP) |
(1026) 0x46b516 MOV %ESI,0x1c(%RSP) |
(1026) 0x46b51a MOV %R9,0x150(%RSP) |
(1026) 0x46b522 JS 46b4f0 |
(1026) 0x46b524 MOVSXD %ESI,%R8 |
(1026) 0x46b527 MOV 0xc8(%RSP),%RAX |
(1026) 0x46b52f LEA (%RAX,%R8,1),%RBX |
(1026) 0x46b533 MOV 0xc0(%RSP),%RAX |
(1026) 0x46b53b LEA (%RAX,%R8,1),%R13 |
(1026) 0x46b53f ADD 0xd0(%RSP),%R8 |
(1026) 0x46b547 MOV 0xe8(%RSP),%RCX |
(1026) 0x46b54f LEA (%RCX,%R9,1),%EAX |
(1026) 0x46b553 MOVSXD %EAX,%R10 |
(1026) 0x46b556 MOV 0xe0(%RSP),%RDX |
(1026) 0x46b55e SUB %RDX,%R10 |
(1026) 0x46b561 LEA (%RCX,%R9,1),%EAX |
(1026) 0x46b565 INC %EAX |
(1026) 0x46b567 CLTQ |
(1026) 0x46b569 SUB %RDX,%RAX |
(1026) 0x46b56c MOV 0x58(%RBP),%RCX |
(1026) 0x46b570 MOV (%RCX),%R15 |
(1026) 0x46b573 MOV 0x28(%RBP),%RDX |
(1026) 0x46b577 VMOVSD (%RDX,%R10,8),%XMM20 |
(1026) 0x46b57e MOV 0x60(%RBP),%RCX |
(1026) 0x46b582 MOV (%RCX),%R14 |
(1026) 0x46b585 MOV 0x68(%RBP),%RCX |
(1026) 0x46b589 MOV (%RCX),%R11 |
(1026) 0x46b58c VADDSD (%RDX,%RAX,8),%XMM20,%XMM1 |
(1026) 0x46b593 MOV 0x70(%RBP),%RAX |
(1026) 0x46b597 MOV (%RAX),%R12 |
(1026) 0x46b59a MOV 0xd8(%RSP),%RDI |
(1026) 0x46b5a2 TEST %RDI,%RDI |
(1026) 0x46b5a5 VMOVAPD %XMM20,0x170(%RSP) |
(1026) 0x46b5ad MOV %R8,0x148(%RSP) |
(1026) 0x46b5b5 MOV %R12,0x140(%RSP) |
(1026) 0x46b5bd MOV %R14,0x138(%RSP) |
(1026) 0x46b5c5 JE 46bd20 |
(1026) 0x46b5cb VMOVAPD %XMM8,0x1f0(%RSP) |
(1026) 0x46b5d4 VBROADCASTSD %XMM8,%YMM4 |
(1026) 0x46b5d9 VMOVAPD %XMM26,0x1e0(%RSP) |
(1026) 0x46b5e1 VBROADCASTSD %XMM26,%YMM17 |
(1026) 0x46b5e7 VMOVAPD %XMM27,0x1d0(%RSP) |
(1026) 0x46b5ef VBROADCASTSD %XMM27,%YMM16 |
(1026) 0x46b5f5 VMOVAPD %XMM28,0x1c0(%RSP) |
(1026) 0x46b5fd VBROADCASTSD %XMM28,%YMM15 |
(1026) 0x46b603 VMOVAPD %XMM31,0x1b0(%RSP) |
(1026) 0x46b60b VBROADCASTSD %XMM31,%YMM19 |
(1026) 0x46b611 VMOVAPD %XMM29,0x160(%RSP) |
(1026) 0x46b619 VBROADCASTSD %XMM29,%YMM0 |
(1026) 0x46b61f VMOVAPD %XMM30,0x1a0(%RSP) |
(1026) 0x46b627 VBROADCASTSD %XMM30,%YMM27 |
(1026) 0x46b62d MOV %R15,%RAX |
(1026) 0x46b630 IMUL %R10,%RAX |
(1026) 0x46b634 MOV %RAX,0x100(%RSP) |
(1026) 0x46b63c LEA 0x1(%R10),%RCX |
(1026) 0x46b640 MOV %R15,%RAX |
(1026) 0x46b643 IMUL %RCX,%RAX |
(1026) 0x46b647 MOV %RAX,0x108(%RSP) |
(1026) 0x46b64f IMUL %R14,%RCX |
(1026) 0x46b653 MOV %RCX,0xf8(%RSP) |
(1026) 0x46b65b MOV %R14,%RAX |
(1026) 0x46b65e IMUL %R10,%RAX |
(1026) 0x46b662 MOV %RAX,0xf0(%RSP) |
(1026) 0x46b66a VBROADCASTSD %XMM20,%YMM24 |
(1026) 0x46b670 VDIVSD %XMM20,%XMM21,%XMM2 |
(1026) 0x46b676 VBROADCASTSD %XMM2,%YMM26 |
(1026) 0x46b67c IMUL %R11,%R10 |
(1026) 0x46b680 MOV %R10,0x40(%RSP) |
(1026) 0x46b685 VMOVSD %XMM1,0x118(%RSP) |
(1026) 0x46b68e VDIVSD %XMM1,%XMM21,%XMM2 |
(1026) 0x46b694 VBROADCASTSD %XMM2,%YMM1 |
(1026) 0x46b699 VMOVAPD %YMM1,0x180(%RSP) |
(1026) 0x46b6a2 MOV %R11,%RAX |
(1026) 0x46b6a5 IMUL %RBX,%RAX |
(1026) 0x46b6a9 ADD 0x78(%RSP),%RAX |
(1026) 0x46b6ae IMUL %RBX,%R12 |
(1026) 0x46b6b2 ADD 0x70(%RSP),%R12 |
(1026) 0x46b6b7 MOV %R11,%RDX |
(1026) 0x46b6ba MOV %R13,0x128(%RSP) |
(1026) 0x46b6c2 IMUL %R13,%R11 |
(1026) 0x46b6c6 MOV 0x60(%RSP),%RCX |
(1026) 0x46b6cb ADD %RCX,%R11 |
(1026) 0x46b6ce MOV %R15,%R10 |
(1026) 0x46b6d1 MOV %RDX,0x110(%RSP) |
(1026) 0x46b6d9 MOV %RDX,%R15 |
(1026) 0x46b6dc IMUL %R8,%R15 |
(1026) 0x46b6e0 ADD %RCX,%R15 |
(1026) 0x46b6e3 MOV %R14,%RSI |
(1026) 0x46b6e6 IMUL %RBX,%RSI |
(1026) 0x46b6ea MOV 0x58(%RSP),%RCX |
(1026) 0x46b6ef ADD %RCX,%RSI |
(1026) 0x46b6f2 MOV %R14,%RDX |
(1026) 0x46b6f5 IMUL %R8,%RDX |
(1026) 0x46b6f9 ADD %RCX,%RDX |
(1026) 0x46b6fc MOV %R10,%R14 |
(1026) 0x46b6ff IMUL %R8,%R14 |
(1026) 0x46b703 MOV 0x50(%RSP),%RCX |
(1026) 0x46b708 ADD %RCX,%R14 |
(1026) 0x46b70b MOV %R10,0x120(%RSP) |
(1026) 0x46b713 MOV %RBX,%R8 |
(1026) 0x46b716 IMUL %RBX,%R10 |
(1026) 0x46b71a ADD %RCX,%R10 |
(1026) 0x46b71d VPCMPEQD %YMM7,%YMM7,%YMM7 |
(1026) 0x46b721 XOR %R13D,%R13D |
(1026) 0x46b724 VPCMPEQD %YMM12,%YMM12,%YMM12 |
(1026) 0x46b729 VPCMPEQD %YMM11,%YMM11,%YMM11 |
(1026) 0x46b72e VPCMPEQD %YMM3,%YMM3,%YMM3 |
(1026) 0x46b732 VPCMPEQD %YMM6,%YMM6,%YMM6 |
(1026) 0x46b736 VPCMPEQD %YMM9,%YMM9,%YMM9 |
(1026) 0x46b73b VPCMPEQD %YMM5,%YMM5,%YMM5 |
(1026) 0x46b73f MOV 0x68(%RSP),%R9 |
(1026) 0x46b744 VMOVAPD %YMM14,%YMM18 |
(1026) 0x46b74a VBROADCASTSD 0xa688d(%RIP),%YMM8 |
(1026) 0x46b753 VXORPD %XMM28,%XMM28,%XMM28 |
(1026) 0x46b759 JMP 46b8c9 |
0x46b75e XCHG %AX,%AX |
(1028) 0x46b760 VCMPPD $0x1,%YMM13,%YMM22,%K3 |
(1028) 0x46b767 VBROADCASTSD 0xa6878(%RIP),%YMM8 |
(1028) 0x46b770 VBLENDMPD %YMM8,%YMM18,%YMM31{%K3} |
(1028) 0x46b776 VBROADCASTSD 0x89a80(%RIP),%YMM29 |
(1028) 0x46b780 VANDPD %YMM29,%YMM22,%YMM1 |
(1028) 0x46b786 VMAXPD %YMM1,%YMM14,%YMM1 |
(1028) 0x46b78a VMULPD %YMM31,%YMM1,%YMM1 |
(1028) 0x46b790 VCMPPD $0x1,%YMM13,%YMM1,%K3 |
(1028) 0x46b797 VBLENDMPD %YMM8,%YMM18,%YMM25{%K3} |
(1028) 0x46b79d VANDPD %YMM29,%YMM21,%YMM13 |
(1028) 0x46b7a3 VMAXPD %YMM13,%YMM14,%YMM13 |
(1028) 0x46b7a8 VMULPD %YMM25,%YMM13,%YMM13 |
(1028) 0x46b7ae VMULPD %YMM1,%YMM1,%YMM20 |
(1028) 0x46b7b4 VFMADD231PD %YMM13,%YMM13,%YMM20 |
(1028) 0x46b7ba VXORPD %XMM28,%XMM28,%XMM28 |
(1028) 0x46b7c0 VSQRTPD %YMM20,%YMM23 |
(1028) 0x46b7c6 VMULPD %YMM2,%YMM23,%YMM2 |
(1028) 0x46b7cc VDIVPD %YMM1,%YMM2,%YMM1 |
(1028) 0x46b7d0 VANDPD %YMM29,%YMM1,%YMM22 |
(1028) 0x46b7d6 VMULPD %YMM24,%YMM23,%YMM1 |
(1028) 0x46b7dc VDIVPD %YMM13,%YMM1,%YMM1 |
(1028) 0x46b7e1 VANDPD %YMM29,%YMM1,%YMM21 |
(1028) 0x46b7e7 VCMPPD $0x2,%YMM21,%YMM22,%K3 |
(1028) 0x46b7ee VBLENDMPD %YMM22,%YMM21,%YMM30{%K3} |
(1028) 0x46b7f4 VMULPD %YMM30,%YMM30,%YMM29 |
(1028) 0x46b7fa VMULPD %YMM10,%YMM10,%YMM1 |
(1028) 0x46b7ff IMUL %R8,%RCX |
(1028) 0x46b803 ADD %R9,%RCX |
(1028) 0x46b806 VMOVUPD (%RCX,%R13,8),%YMM2{%K2}{z} |
(1028) 0x46b80d VADDPD %YMM29,%YMM29,%YMM10 |
(1028) 0x46b813 VMULPD %YMM2,%YMM1,%YMM1 |
(1028) 0x46b817 VMULPD %YMM1,%YMM10,%YMM1 |
(1028) 0x46b81b VPBROADCASTQ %R13,%YMM2 |
(1028) 0x46b821 VPADDQ 0x897f7(%RIP),%YMM2,%YMM2 |
(1028) 0x46b829 VPBLENDMQ %YMM5,%YMM2,%YMM5{%K1} |
(1028) 0x46b82f VMOVAPD %YMM4,%YMM31{%K1} |
(1028) 0x46b835 VPBLENDMQ %YMM9,%YMM2,%YMM9{%K1} |
(1028) 0x46b83b VMOVAPD %YMM17,%YMM25{%K1} |
(1028) 0x46b841 VPBLENDMQ %YMM6,%YMM2,%YMM6{%K1} |
(1028) 0x46b847 VMOVAPD %YMM16,%YMM23{%K1} |
(1028) 0x46b84d VPBLENDMQ %YMM3,%YMM2,%YMM3{%K1} |
(1028) 0x46b853 VMOVAPD %YMM15,%YMM22{%K1} |
(1028) 0x46b859 VPBLENDMQ %YMM11,%YMM2,%YMM11{%K1} |
(1028) 0x46b85f VMOVAPD %YMM19,%YMM21{%K1} |
(1028) 0x46b865 VPBLENDMQ %YMM12,%YMM2,%YMM12{%K1} |
(1028) 0x46b86b VMOVAPD %YMM0,%YMM30{%K1} |
(1028) 0x46b871 VMOVDQA64 %YMM7,%YMM2{%K1} |
(1028) 0x46b877 VMOVAPD %YMM27,%YMM29{%K1} |
(1028) 0x46b87d VMOVAPD %YMM28,%YMM1{%K1} |
(1028) 0x46b883 VMOVUPD %YMM1,(%R12,%R13,8) |
(1028) 0x46b889 ADD $0x4,%R13 |
(1028) 0x46b88d VMOVDQA %YMM2,%YMM7 |
(1028) 0x46b891 VMOVAPD %YMM29,%YMM27 |
(1028) 0x46b897 VMOVAPD %YMM30,%YMM0 |
(1028) 0x46b89d VMOVAPD %YMM21,%YMM19 |
(1028) 0x46b8a3 VMOVAPD %YMM22,%YMM15 |
(1028) 0x46b8a9 VMOVAPD %YMM23,%YMM16 |
(1028) 0x46b8af VMOVAPD %YMM25,%YMM17 |
(1028) 0x46b8b5 VMOVAPD %YMM31,%YMM4 |
(1028) 0x46b8bb CMP %RDI,%R13 |
(1028) 0x46b8be VMOVAPD %YMM14,%YMM8 |
(1028) 0x46b8c3 JAE 46ba60 |
(1028) 0x46b8c9 VMOVUPD -0x8(%R10,%R13,8),%YMM10 |
(1028) 0x46b8d0 VMOVUPD (%R10,%R13,8),%YMM21 |
(1028) 0x46b8d7 VMOVUPD -0x8(%R14,%R13,8),%YMM22 |
(1028) 0x46b8e2 VMOVUPD (%R14,%R13,8),%YMM23 |
(1028) 0x46b8e9 VADDPD %YMM21,%YMM23,%YMM2 |
(1028) 0x46b8ef VADDPD %YMM22,%YMM10,%YMM25 |
(1028) 0x46b8f5 VMOVUPD -0x8(%RDX,%R13,8),%YMM29 |
(1028) 0x46b900 VMOVUPD (%RDX,%R13,8),%YMM30 |
(1028) 0x46b907 VSUBPD %YMM25,%YMM2,%YMM25 |
(1028) 0x46b90d VMOVUPD -0x8(%RSI,%R13,8),%YMM31 |
(1028) 0x46b918 VMOVUPD (%RSI,%R13,8),%YMM20 |
(1028) 0x46b91f VADDPD %YMM29,%YMM30,%YMM2 |
(1028) 0x46b925 VADDPD %YMM20,%YMM31,%YMM1 |
(1028) 0x46b92b VSUBPD %YMM1,%YMM2,%YMM1 |
(1028) 0x46b92f MOV 0x158(%RSP),%RCX |
(1028) 0x46b937 VMOVUPD -0x8(%RCX,%R13,8),%YMM2 |
(1028) 0x46b93e VMULPD %YMM25,%YMM2,%YMM13 |
(1028) 0x46b944 VFMADD231PD %YMM1,%YMM24,%YMM13 |
(1028) 0x46b94a VADDPD %YMM10,%YMM21,%YMM10 |
(1028) 0x46b950 VSUBPD %YMM10,%YMM23,%YMM10 |
(1028) 0x46b956 VADDPD %YMM22,%YMM10,%YMM10 |
(1028) 0x46b95c VBROADCASTSD 0x8a69b(%RIP),%YMM14 |
(1028) 0x46b965 VMULPD %YMM14,%YMM10,%YMM10 |
(1028) 0x46b96a VADDPD %YMM31,%YMM29,%YMM21 |
(1028) 0x46b970 VSUBPD %YMM21,%YMM30,%YMM21 |
(1028) 0x46b976 VADDPD %YMM20,%YMM21,%YMM20 |
(1028) 0x46b97c VMULPD %YMM14,%YMM20,%YMM20 |
(1028) 0x46b982 VDIVPD %YMM2,%YMM18,%YMM23 |
(1028) 0x46b988 VMULPD %YMM23,%YMM20,%YMM20 |
(1028) 0x46b98e VMOVUPD (%RAX,%R13,8),%YMM21 |
(1028) 0x46b995 VFMADD231PD %YMM10,%YMM26,%YMM20 |
(1028) 0x46b99b VSUBPD -0x10(%RAX,%R13,8),%YMM21,%YMM10 |
(1028) 0x46b9a6 VADDPD (%RCX,%R13,8),%YMM2,%YMM21 |
(1028) 0x46b9ad VDIVPD %YMM21,%YMM10,%YMM22 |
(1028) 0x46b9b3 VMOVUPD (%R15,%R13,8),%YMM10 |
(1028) 0x46b9b9 VSUBPD (%R11,%R13,8),%YMM10,%YMM10 |
(1028) 0x46b9bf VMULPD 0x180(%RSP),%YMM10,%YMM21 |
(1028) 0x46b9c7 VMULPD %YMM22,%YMM22,%YMM10 |
(1028) 0x46b9cd VMULPD %YMM21,%YMM21,%YMM29 |
(1028) 0x46b9d3 VMULPD %YMM14,%YMM25,%YMM25 |
(1028) 0x46b9d9 VMULPD %YMM23,%YMM25,%YMM23 |
(1028) 0x46b9df VMULPD %YMM10,%YMM23,%YMM23 |
(1028) 0x46b9e5 VMULPD %YMM1,%YMM14,%YMM1 |
(1028) 0x46b9e9 VMULPD %YMM29,%YMM1,%YMM1 |
(1028) 0x46b9ef VMULPD %YMM20,%YMM22,%YMM20 |
(1028) 0x46b9f5 VFMADD213PD %YMM23,%YMM21,%YMM20 |
(1028) 0x46b9fb VFMADD231PD %YMM1,%YMM26,%YMM20 |
(1028) 0x46ba01 VADDPD %YMM10,%YMM29,%YMM1 |
(1028) 0x46ba07 VMAXPD %YMM8,%YMM1,%YMM1 |
(1028) 0x46ba0c VDIVPD %YMM1,%YMM20,%YMM10 |
(1028) 0x46ba12 VCMPPD $0x1,%YMM10,%YMM28,%K1 |
(1028) 0x46ba19 VCMPPD $0x2,%YMM13,%YMM28,%K0 |
(1028) 0x46ba20 VCMPPD $0x6,%YMM13,%YMM28,%K1{%K1} |
(1028) 0x46ba27 KORW %K1,%K0,%K1 |
(1028) 0x46ba2b KNOTW %K1,%K2 |
(1028) 0x46ba2f KMOVD %K2,%EBX |
(1028) 0x46ba33 TEST $0xf,%BL |
(1028) 0x46ba36 VMOVAPD %YMM8,%YMM14 |
(1028) 0x46ba3b VXORPD %XMM13,%XMM13,%XMM13 |
(1028) 0x46ba40 JE 46b760 |
(1028) 0x46ba46 MOV 0x78(%RBP),%RCX |
(1028) 0x46ba4a MOV (%RCX),%RCX |
(1028) 0x46ba4d JMP 46b760 |
0x46ba52 NOPW %CS:(%RAX,%RAX,1) |
(1026) 0x46ba60 VMOVAPD %YMM18,%YMM14 |
(1026) 0x46ba66 VPCMPEQD %YMM4,%YMM4,%YMM4 |
(1026) 0x46ba6a VPTEST %YMM4,%YMM5 |
(1026) 0x46ba6f VMOVAPD 0x1f0(%RSP),%XMM8 |
(1026) 0x46ba78 JB 46bab8 |
(1026) 0x46ba7a VEXTRACTI128 $0x1,%YMM5,%XMM0 |
(1026) 0x46ba80 VPMAXSQ %XMM0,%XMM5,%XMM0 |
(1026) 0x46ba86 VPSHUFD $-0x12,%XMM0,%XMM1 |
(1026) 0x46ba8b VPMAXSQ %XMM1,%XMM0,%XMM0 |
(1026) 0x46ba91 VPBROADCASTQ %XMM0,%YMM0 |
(1026) 0x46ba96 VPCMPEQQ %YMM0,%YMM5,%K0 |
(1026) 0x46ba9c KMOVD %K0,%EAX |
(1026) 0x46baa0 TZCNT %EAX,%EAX |
(1026) 0x46baa4 VMOVAPD %YMM31,0x2c0(%RSP) |
(1026) 0x46baac AND $0x3,%EAX |
(1026) 0x46baaf VMOVSD 0x2c0(%RSP,%RAX,8),%XMM8 |
(1026) 0x46bab8 VPTEST %YMM4,%YMM9 |
(1026) 0x46babd VXORPD %XMM18,%XMM18,%XMM18 |
(1026) 0x46bac3 VMOVAPD 0x1e0(%RSP),%XMM26 |
(1026) 0x46bacb VMOVAPD 0x1d0(%RSP),%XMM27 |
(1026) 0x46bad3 VMOVAPD 0x1c0(%RSP),%XMM28 |
(1026) 0x46badb MOV 0x128(%RSP),%R13 |
(1026) 0x46bae3 MOV 0x120(%RSP),%R15 |
(1026) 0x46baeb MOV 0x110(%RSP),%R11 |
(1026) 0x46baf3 MOV 0x108(%RSP),%RSI |
(1026) 0x46bafb MOV 0xf8(%RSP),%R9 |
(1026) 0x46bb03 MOV 0xf0(%RSP),%RBX |
(1026) 0x46bb0b JB 46bb4a |
(1026) 0x46bb0d VEXTRACTI128 $0x1,%YMM9,%XMM0 |
(1026) 0x46bb13 VPMAXSQ %XMM0,%XMM9,%XMM0 |
(1026) 0x46bb19 VPSHUFD $-0x12,%XMM0,%XMM1 |
(1026) 0x46bb1e VPMAXSQ %XMM1,%XMM0,%XMM0 |
(1026) 0x46bb24 VPBROADCASTQ %XMM0,%YMM0 |
(1026) 0x46bb29 VPCMPEQQ %YMM0,%YMM9,%K0 |
(1026) 0x46bb2f KMOVD %K0,%EAX |
(1026) 0x46bb33 TZCNT %EAX,%EAX |
(1026) 0x46bb37 VMOVAPD %YMM25,0x2a0(%RSP) |
(1026) 0x46bb3f AND $0x3,%EAX |
(1026) 0x46bb42 VMOVSD 0x2a0(%RSP,%RAX,8),%XMM26 |
(1026) 0x46bb4a VPTEST %YMM4,%YMM6 |
(1026) 0x46bb4f VMOVAPD 0x1b0(%RSP),%XMM31 |
(1026) 0x46bb57 JB 46bb96 |
(1026) 0x46bb59 VEXTRACTI128 $0x1,%YMM6,%XMM0 |
(1026) 0x46bb5f VPMAXSQ %XMM0,%XMM6,%XMM0 |
(1026) 0x46bb65 VPSHUFD $-0x12,%XMM0,%XMM1 |
(1026) 0x46bb6a VPMAXSQ %XMM1,%XMM0,%XMM0 |
(1026) 0x46bb70 VPBROADCASTQ %XMM0,%YMM0 |
(1026) 0x46bb75 VPCMPEQQ %YMM0,%YMM6,%K0 |
(1026) 0x46bb7b KMOVD %K0,%EAX |
(1026) 0x46bb7f TZCNT %EAX,%EAX |
(1026) 0x46bb83 VMOVAPD %YMM23,0x280(%RSP) |
(1026) 0x46bb8b AND $0x3,%EAX |
(1026) 0x46bb8e VMOVSD 0x280(%RSP,%RAX,8),%XMM27 |
(1026) 0x46bb96 VPTEST %YMM4,%YMM3 |
(1026) 0x46bb9b VMOVSD 0xa6443(%RIP),%XMM25 |
(1026) 0x46bba5 VMOVAPD 0x170(%RSP),%XMM20 |
(1026) 0x46bbad JB 46bbec |
(1026) 0x46bbaf VEXTRACTI128 $0x1,%YMM3,%XMM0 |
(1026) 0x46bbb5 VPMAXSQ %XMM0,%XMM3,%XMM0 |
(1026) 0x46bbbb VPSHUFD $-0x12,%XMM0,%XMM1 |
(1026) 0x46bbc0 VPMAXSQ %XMM1,%XMM0,%XMM0 |
(1026) 0x46bbc6 VPBROADCASTQ %XMM0,%YMM0 |
(1026) 0x46bbcb VPCMPEQQ %YMM0,%YMM3,%K0 |
(1026) 0x46bbd1 KMOVD %K0,%EAX |
(1026) 0x46bbd5 TZCNT %EAX,%EAX |
(1026) 0x46bbd9 VMOVAPD %YMM22,0x260(%RSP) |
(1026) 0x46bbe1 AND $0x3,%EAX |
(1026) 0x46bbe4 VMOVSD 0x260(%RSP,%RAX,8),%XMM28 |
(1026) 0x46bbec VPTEST %YMM4,%YMM11 |
(1026) 0x46bbf1 VMOVSD 0xa63e5(%RIP),%XMM23 |
(1026) 0x46bbfb JB 46bc3a |
(1026) 0x46bbfd VEXTRACTI128 $0x1,%YMM11,%XMM0 |
(1026) 0x46bc03 VPMAXSQ %XMM0,%XMM11,%XMM0 |
(1026) 0x46bc09 VPSHUFD $-0x12,%XMM0,%XMM1 |
(1026) 0x46bc0e VPMAXSQ %XMM1,%XMM0,%XMM0 |
(1026) 0x46bc14 VPBROADCASTQ %XMM0,%YMM0 |
(1026) 0x46bc19 VPCMPEQQ %YMM0,%YMM11,%K0 |
(1026) 0x46bc1f KMOVD %K0,%EAX |
(1026) 0x46bc23 TZCNT %EAX,%EAX |
(1026) 0x46bc27 VMOVAPD %YMM21,0x240(%RSP) |
(1026) 0x46bc2f AND $0x3,%EAX |
(1026) 0x46bc32 VMOVSD 0x240(%RSP,%RAX,8),%XMM31 |
(1026) 0x46bc3a VPTEST %YMM4,%YMM12 |
(1026) 0x46bc3f VMOVSD 0x8a3b7(%RIP),%XMM22 |
(1026) 0x46bc49 JB 46bc92 |
(1026) 0x46bc4b VEXTRACTI128 $0x1,%YMM12,%XMM0 |
(1026) 0x46bc51 VPMAXSQ %XMM0,%XMM12,%XMM0 |
(1026) 0x46bc57 VPSHUFD $-0x12,%XMM0,%XMM1 |
(1026) 0x46bc5c VPMAXSQ %XMM1,%XMM0,%XMM0 |
(1026) 0x46bc62 VPBROADCASTQ %XMM0,%YMM0 |
(1026) 0x46bc67 VPCMPEQQ %YMM0,%YMM12,%K0 |
(1026) 0x46bc6d KMOVD %K0,%EAX |
(1026) 0x46bc71 TZCNT %EAX,%EAX |
(1026) 0x46bc75 VMOVAPD %YMM30,0x220(%RSP) |
(1026) 0x46bc7d AND $0x3,%EAX |
(1026) 0x46bc80 VMOVSD 0x220(%RSP,%RAX,8),%XMM0 |
(1026) 0x46bc89 VMOVAPD %XMM0,0x160(%RSP) |
(1026) 0x46bc92 VPTEST %YMM4,%YMM2 |
(1026) 0x46bc97 VMOVSD 0x896df(%RIP),%XMM21 |
(1026) 0x46bca1 VMOVAPD 0x1a0(%RSP),%XMM30 |
(1026) 0x46bca9 JB 46bce8 |
(1026) 0x46bcab VEXTRACTI128 $0x1,%YMM2,%XMM0 |
(1026) 0x46bcb1 VPMAXSQ %XMM0,%XMM2,%XMM0 |
(1026) 0x46bcb7 VPSHUFD $-0x12,%XMM0,%XMM1 |
(1026) 0x46bcbc VPMAXSQ %XMM1,%XMM0,%XMM0 |
(1026) 0x46bcc2 VPBROADCASTQ %XMM0,%YMM0 |
(1026) 0x46bcc7 VPCMPEQQ %YMM0,%YMM2,%K0 |
(1026) 0x46bccd KMOVD %K0,%EAX |
(1026) 0x46bcd1 TZCNT %EAX,%EAX |
(1026) 0x46bcd5 VMOVAPD %YMM29,0x200(%RSP) |
(1026) 0x46bcdd AND $0x3,%EAX |
(1026) 0x46bce0 VMOVSD 0x200(%RSP,%RAX,8),%XMM30 |
(1026) 0x46bce8 MOV %RDI,%RDX |
(1026) 0x46bceb CMP 0x38(%RSP),%RDI |
(1026) 0x46bcf0 VMOVAPD 0x160(%RSP),%XMM29 |
(1026) 0x46bcf8 VMOVSD 0x118(%RSP),%XMM1 |
(1026) 0x46bd01 MOV 0x100(%RSP),%RDI |
(1026) 0x46bd09 JE 46b4f0 |
(1026) 0x46bd0f JMP 46bd4b |
0x46bd11 NOPW %CS:(%RAX,%RAX,1) |
(1026) 0x46bd20 MOV %RBX,%R8 |
(1026) 0x46bd23 MOV %R14,%RBX |
(1026) 0x46bd26 IMUL %R10,%RBX |
(1026) 0x46bd2a LEA 0x1(%R10),%RSI |
(1026) 0x46bd2e MOV %R14,%R9 |
(1026) 0x46bd31 IMUL %RSI,%R9 |
(1026) 0x46bd35 MOV %R15,%RDI |
(1026) 0x46bd38 IMUL %R10,%RDI |
(1026) 0x46bd3c IMUL %R15,%RSI |
(1026) 0x46bd40 IMUL %R11,%R10 |
(1026) 0x46bd44 MOV %R10,0x40(%RSP) |
(1026) 0x46bd49 XOR %EDX,%EDX |
(1026) 0x46bd4b MOV 0x28(%RSP),%RAX |
(1026) 0x46bd50 ADD %RAX,%RBX |
(1026) 0x46bd53 MOV 0xb0(%RSP),%RCX |
(1026) 0x46bd5b LEA (%RCX,%RDX,1),%R10 |
(1026) 0x46bd5f MOV %R10,%R14 |
(1026) 0x46bd62 SUB 0xb8(%RSP),%R14 |
(1026) 0x46bd6a VMOVSD (%RBX,%R14,8),%XMM3 |
(1026) 0x46bd70 ADD %RAX,%R9 |
(1026) 0x46bd73 VMOVSD (%R9,%R14,8),%XMM11 |
(1026) 0x46bd79 MOV 0x30(%RSP),%RAX |
(1026) 0x46bd7e ADD %RAX,%RDI |
(1026) 0x46bd81 VMOVSD (%RDI,%R14,8),%XMM12 |
(1026) 0x46bd87 MOV 0xa8(%RSP),%RCX |
(1026) 0x46bd8f ADD %R10,%RCX |
(1026) 0x46bd92 ADD %RAX,%RSI |
(1026) 0x46bd95 VMOVSD (%RSI,%R14,8),%XMM24 |
(1026) 0x46bd9c IMUL %R11,%R13 |
(1026) 0x46bda0 MOV %R11,%R9 |
(1026) 0x46bda3 MOV %R8,%R12 |
(1026) 0x46bda6 IMUL %R8,%R11 |
(1026) 0x46bdaa LEA (%R11,%R10,8),%RAX |
(1026) 0x46bdae MOV 0x18(%RBP),%RSI |
(1026) 0x46bdb2 MOV 0x40(%RSP),%R8 |
(1026) 0x46bdb7 ADD %RSI,%R8 |
(1026) 0x46bdba VMOVSD (%R8,%RCX,8),%XMM4 |
(1026) 0x46bdc0 MOV 0x138(%RSP),%RSI |
(1026) 0x46bdc8 MOV %RSI,%RCX |
(1026) 0x46bdcb IMUL %R12,%RCX |
(1026) 0x46bdcf LEA (%RCX,%R10,8),%R11 |
(1026) 0x46bdd3 MOV 0x148(%RSP),%RCX |
(1026) 0x46bddb IMUL %RCX,%RSI |
(1026) 0x46bddf LEA (%RSI,%R10,8),%RSI |
(1026) 0x46bde3 IMUL %RCX,%R9 |
(1026) 0x46bde7 IMUL %R15,%RCX |
(1026) 0x46bdeb LEA (%RCX,%R10,8),%RBX |
(1026) 0x46bdef IMUL %R12,%R15 |
(1026) 0x46bdf3 LEA (%R15,%R10,8),%RCX |
(1026) 0x46bdf7 MOV 0x90(%RSP),%RDI |
(1026) 0x46bdff LEA (%RDI,%R10,8),%R15 |
(1026) 0x46be03 VMOVQ (%R8,%R14,8),%XMM9 |
(1026) 0x46be09 MOV 0x30(%RBP),%RDI |
(1026) 0x46be0d VMOVSD (%RDI,%R14,8),%XMM0 |
(1026) 0x46be13 VDIVSD %XMM20,%XMM21,%XMM6 |
(1026) 0x46be19 VDIVSD %XMM1,%XMM21,%XMM2 |
(1026) 0x46be1f MOV 0x38(%RSP),%R8 |
(1026) 0x46be24 SUB %RDX,%R8 |
(1026) 0x46be27 MOV %R12,0x180(%RSP) |
(1026) 0x46be2f MOV 0x140(%RSP),%RDI |
(1026) 0x46be37 IMUL %R12,%RDI |
(1026) 0x46be3b ADD 0x98(%RSP),%RDX |
(1026) 0x46be43 LEA (%RDI,%RDX,8),%R12 |
(1026) 0x46be47 ADD 0x10(%RBP),%R12 |
(1026) 0x46be4b MOV 0x20(%RBP),%RDI |
(1026) 0x46be4f LEA (%RDI,%RDX,8),%R14 |
(1026) 0x46be53 LEA (%R13,%RDX,8),%R13 |
(1026) 0x46be58 MOV 0x18(%RBP),%RDI |
(1026) 0x46be5c ADD %RDI,%R13 |
(1026) 0x46be5f LEA (%R9,%RDX,8),%RDX |
(1026) 0x46be63 ADD %RDI,%RDX |
(1026) 0x46be66 ADD 0x88(%RSP),%RAX |
(1026) 0x46be6e MOV 0x80(%RSP),%RDI |
(1026) 0x46be76 ADD %RDI,%R11 |
(1026) 0x46be79 ADD %RDI,%RSI |
(1026) 0x46be7c MOV 0xa0(%RSP),%RDI |
(1026) 0x46be84 ADD %RDI,%RBX |
(1026) 0x46be87 ADD %RDI,%RCX |
(1026) 0x46be8a XOR %R10D,%R10D |
(1026) 0x46be8d JMP 46beaf |
0x46be8f NOP |
(1027) 0x46be90 VMOVSD %XMM17,(%R12,%R10,8) |
(1027) 0x46be97 INC %R10 |
(1027) 0x46be9a VMOVDQA %XMM9,%XMM4 |
(1027) 0x46be9e VMOVAPD %XMM5,%XMM9 |
(1027) 0x46bea2 VMOVAPD %XMM7,%XMM0 |
(1027) 0x46bea6 CMP %R10,%R8 |
(1027) 0x46bea9 JE 46b4f0 |
(1027) 0x46beaf VMOVAPD %XMM24,%XMM1 |
(1027) 0x46beb5 VMOVAPD %XMM12,%XMM5 |
(1027) 0x46beb9 VMOVSD (%RCX,%R10,8),%XMM12 |
(1027) 0x46bebf VMOVSD (%RBX,%R10,8),%XMM24 |
(1027) 0x46bec6 VMOVAPD %XMM11,%XMM7 |
(1027) 0x46beca VMOVAPD %XMM3,%XMM10 |
(1027) 0x46bece VADDSD %XMM12,%XMM24,%XMM3 |
(1027) 0x46bed4 VADDSD %XMM1,%XMM5,%XMM11 |
(1027) 0x46bed8 VSUBSD %XMM11,%XMM3,%XMM13 |
(1027) 0x46bedd VMOVSD (%RSI,%R10,8),%XMM11 |
(1027) 0x46bee3 VMOVSD (%R11,%R10,8),%XMM3 |
(1027) 0x46bee9 VADDSD %XMM7,%XMM11,%XMM15 |
(1027) 0x46beed VADDSD %XMM3,%XMM10,%XMM16 |
(1027) 0x46bef3 VSUBSD %XMM16,%XMM15,%XMM17 |
(1027) 0x46bef9 VMULSD %XMM13,%XMM0,%XMM19 |
(1027) 0x46beff VFMADD231SD %XMM17,%XMM20,%XMM19 |
(1027) 0x46bf05 VADDSD %XMM5,%XMM12,%XMM5 |
(1027) 0x46bf09 VSUBSD %XMM5,%XMM24,%XMM5 |
(1027) 0x46bf0f VADDSD %XMM1,%XMM5,%XMM1 |
(1027) 0x46bf13 VMULSD %XMM22,%XMM1,%XMM1 |
(1027) 0x46bf19 VADDSD %XMM7,%XMM10,%XMM5 |
(1027) 0x46bf1d VSUBSD %XMM5,%XMM11,%XMM5 |
(1027) 0x46bf21 VADDSD %XMM3,%XMM5,%XMM5 |
(1027) 0x46bf25 VMULSD %XMM22,%XMM5,%XMM5 |
(1027) 0x46bf2b VDIVSD %XMM0,%XMM21,%XMM10 |
(1027) 0x46bf31 VMULSD %XMM10,%XMM5,%XMM20 |
(1027) 0x46bf37 VFMADD231SD %XMM1,%XMM6,%XMM20 |
(1027) 0x46bf3d VMOVSD (%RAX,%R10,8),%XMM5 |
(1027) 0x46bf43 VSUBSD %XMM4,%XMM5,%XMM1 |
(1027) 0x46bf47 VMOVSD (%R15,%R10,8),%XMM7 |
(1027) 0x46bf4d VADDSD %XMM0,%XMM7,%XMM4 |
(1027) 0x46bf51 VDIVSD %XMM4,%XMM1,%XMM16 |
(1027) 0x46bf57 VMOVSD (%RDX,%R10,8),%XMM1 |
(1027) 0x46bf5d VSUBSD (%R13,%R10,8),%XMM1,%XMM1 |
(1027) 0x46bf64 VMULSD %XMM2,%XMM1,%XMM15 |
(1027) 0x46bf68 VMULSD %XMM16,%XMM16,%XMM1 |
(1027) 0x46bf6e VMULSD %XMM15,%XMM15,%XMM4 |
(1027) 0x46bf73 VMULSD %XMM22,%XMM13,%XMM13 |
(1027) 0x46bf79 VMULSD %XMM10,%XMM13,%XMM10 |
(1027) 0x46bf7e VMULSD %XMM1,%XMM10,%XMM10 |
(1027) 0x46bf82 VMULSD %XMM22,%XMM17,%XMM13 |
(1027) 0x46bf88 VMULSD %XMM4,%XMM13,%XMM13 |
(1027) 0x46bf8c VMULSD %XMM20,%XMM16,%XMM17 |
(1027) 0x46bf92 VMOVAPD 0x170(%RSP),%XMM20 |
(1027) 0x46bf9a VFMADD213SD %XMM10,%XMM15,%XMM17 |
(1027) 0x46bfa0 VFMADD231SD %XMM13,%XMM6,%XMM17 |
(1027) 0x46bfa6 VADDSD %XMM1,%XMM4,%XMM1 |
(1027) 0x46bfaa VMAXSD %XMM23,%XMM1,%XMM1 |
(1027) 0x46bfb0 VDIVSD %XMM1,%XMM17,%XMM4 |
(1027) 0x46bfb6 VXORPD %XMM17,%XMM17,%XMM17 |
(1027) 0x46bfbc XOR %EDI,%EDI |
(1027) 0x46bfbe VUCOMISD %XMM17,%XMM4 |
(1027) 0x46bfc4 SETBE %DIL |
(1027) 0x46bfc8 XOR %R9D,%R9D |
(1027) 0x46bfcb VUCOMISD %XMM17,%XMM19 |
(1027) 0x46bfd1 SETB %R9B |
(1027) 0x46bfd5 CMP %R9B,%DIL |
(1027) 0x46bfd8 CMOVB %EDI,%R9D |
(1027) 0x46bfdc CMP $0x1,%R9B |
(1027) 0x46bfe0 JNE 46be90 |
(1027) 0x46bfe6 VCMPSD $0x1,%XMM18,%XMM16,%K1 |
(1027) 0x46bfed VMOVAPD %XMM21,%XMM8 |
(1027) 0x46bff3 VMOVSD %XMM25,%XMM8,%XMM8{%K1} |
(1027) 0x46bff9 VMOVDDUP 0x891ff(%RIP),%XMM1 |
(1027) 0x46c001 VANDPD %XMM1,%XMM16,%XMM10 |
(1027) 0x46c007 VMAXSD %XMM10,%XMM23,%XMM10 |
(1027) 0x46c00d VMULSD %XMM8,%XMM10,%XMM10 |
(1027) 0x46c012 VCMPSD $0x1,%XMM18,%XMM10,%K1 |
(1027) 0x46c019 VMOVAPD %XMM21,%XMM26 |
(1027) 0x46c01f VMOVSD %XMM25,%XMM26,%XMM26{%K1} |
(1027) 0x46c025 VANDPD %XMM1,%XMM15,%XMM13 |
(1027) 0x46c029 VMAXSD %XMM13,%XMM23,%XMM13 |
(1027) 0x46c02f VMULSD %XMM26,%XMM13,%XMM13 |
(1027) 0x46c035 VMULSD %XMM10,%XMM10,%XMM15 |
(1027) 0x46c03a VFMADD231SD %XMM13,%XMM13,%XMM15 |
(1027) 0x46c03f VSQRTSD %XMM15,%XMM15,%XMM27 |
(1027) 0x46c045 VMULSD %XMM0,%XMM27,%XMM0 |
(1027) 0x46c04b VDIVSD %XMM10,%XMM0,%XMM0 |
(1027) 0x46c050 VANDPD %XMM1,%XMM0,%XMM28 |
(1027) 0x46c056 VMULSD %XMM20,%XMM27,%XMM0 |
(1027) 0x46c05c VDIVSD %XMM13,%XMM0,%XMM0 |
(1027) 0x46c061 VANDPD %XMM1,%XMM0,%XMM31 |
(1027) 0x46c067 VCMPSD $0x2,%XMM31,%XMM28,%K1 |
(1027) 0x46c06e VMOVAPD %XMM31,%XMM29 |
(1027) 0x46c074 VMOVSD %XMM28,%XMM29,%XMM29{%K1} |
(1027) 0x46c07a VMULSD %XMM29,%XMM29,%XMM30 |
(1027) 0x46c080 VMULSD %XMM4,%XMM4,%XMM0 |
(1027) 0x46c084 VADDSD %XMM30,%XMM30,%XMM1 |
(1027) 0x46c08a VMULSD %XMM1,%XMM0,%XMM0 |
(1027) 0x46c08e MOV 0x78(%RBP),%RDI |
(1027) 0x46c092 MOV (%RDI),%RDI |
(1027) 0x46c095 IMUL 0x180(%RSP),%RDI |
(1027) 0x46c09e ADD %R14,%RDI |
(1027) 0x46c0a1 VMULSD (%RDI,%R10,8),%XMM0,%XMM17 |
(1027) 0x46c0a8 JMP 46be90 |
0x46c0ad NOPL (%RAX) |
Path / |
Source file and lines | viscosity_kernel.f90:50-94 |
Module | exec |
nb instructions | 168 |
nb uops | 172 |
loop length | 755 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 5 |
used ymm registers | 1 |
used zmm registers | 0 |
nb stack references | 43 |
micro-operation queue | 28.67 cycles |
front end | 28.67 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 12.30 | 12.20 | 10.00 | 10.00 | 22.00 | 12.20 | 12.10 | 22.00 | 22.00 | 22.00 | 12.20 | 10.00 |
cycles | 12.30 | 13.60 | 10.00 | 10.00 | 22.00 | 12.20 | 12.10 | 22.00 | 22.00 | 22.00 | 12.20 | 10.00 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 28.14-28.20 |
Stall cycles | 0.00 |
Front-end | 28.67 |
Dispatch | 22.00 |
Overall L1 | 28.67 |
all | 1% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 5% |
all | 16% |
load | 0% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 50% |
all | 3% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 10% |
all | 11% |
load | 6% |
store | 11% |
mul | 12% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 12% |
all | 14% |
load | 12% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 18% |
all | 11% |
load | 11% |
store | 11% |
mul | 12% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 13% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
AND $-0x20,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SUB $0x300,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R9,0x30(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,0x28(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x40(%RBP),%EBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x38(%RBP),%EAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SUB %EBX,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOVL $0,0x24(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JS 46b2cf <viscosity_kernel_module_mp_viscosity_kernel_.DIR.OMP.PARALLEL.2+0xaf> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RCX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDI,0x48(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVL $0,0x10(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %EAX,0xc(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVL $0x1,0x20(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB $0x8,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA 0x28(%RSP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x2c(%RSP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x18(%RSP),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x14(%RSP),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0x53d630,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %ESI,0x1c(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x22,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
CALL 404670 <__kmpc_for_static_init_4@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
ADD $0x20,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x10(%RSP),%EAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xc(%RSP),%ECX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SUB %EAX,%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %ECX,0x18(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JAE 46b2ea <viscosity_kernel_module_mp_viscosity_kernel_.DIR.OMP.PARALLEL.2+0xca> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV $0x53d650,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x14(%RSP),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 404230 <__kmpc_for_static_fini@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x48(%RSP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x53d670,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 404740 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
LEA -0x28(%RBP),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
MOV %RAX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x50(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x48(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SAL $0x20,%R12 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV $-0x200000000,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.28 |
LEA (%R12,%RAX,1),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RCX,%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SAR $0x20,%R8 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
SAL $0x20,%R13 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
ADD %R13,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RAX,%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SAR $0x20,%R9 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOVSXD (%RDX),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%EDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SUB %R10D,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %EBX,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RDX,0x130(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
INC %EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMP $0x2,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVGE %EDX,%ESI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RSI,0x38(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
AND $0x7ffffffc,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV %RSI,0xd8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
TEST %RCX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
MOV $-0x1,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVNS %RCX,%RSI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
TEST %RSI,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
MOV $0x1,%R11D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVG %R11,%RSI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV $0x200000000,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.28 |
MOV %RBX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %R12,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMP %RDX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVG %RCX,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
LEA (,%R10,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SHR $0x20,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
IMUL %RSI,%RDX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV $-0x1,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SAL $0x3,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
SUB %RDX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
TEST %RAX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
CMOVNS %RAX,%RSI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
TEST %RSI,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
CMOVG %R11,%RSI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
SUB %R13,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x30(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RBX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVG %RAX,%RBX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %R8,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RAX,0xa8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SHR $0x20,%RBX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
IMUL %RSI,%RBX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
NEG %RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RBX,0xc8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SUB %RDX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R9,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RAX,0xc0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R9,0xe0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB %R9,%R11 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R11,0xd0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x20(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x8(%R9,%RCX,1),%R11 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R11,0x78(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD %RCX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RDX,0x70(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%RAX,%RCX,1),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,0x68(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%R9,%RCX,1),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,0x60(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA 0x8(%R14,%RCX,1),%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %RAX,0x158(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x28(%RSP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x8(%RDX,%RCX,1),%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %RAX,0x58(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x30(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x8(%RAX,%RCX,1),%RCX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %RCX,0x50(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R10,0xb0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,0xb8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB %R8,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R10,0x98(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%R14,%RSI,1),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RCX,0x90(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%R9,%RSI,1),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RCX,0x88(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%RDX,%RSI,1),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RCX,0x80(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RSI,0xa0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD 0x89ecd(%RIP),%XMM21 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x8ab43(%RIP),%XMM22 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0xa6b19(%RIP),%XMM23 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0xa6b17(%RIP),%XMM25 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VBROADCASTSD 0x89ea6(%RIP),%YMM14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VXORPD %XMM18,%XMM18,%XMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R9D,%R9D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDI,0xe8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %EDI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JMP 46b50e <viscosity_kernel_module_mp_viscosity_kernel_.DIR.OMP.PARALLEL.2+0x2ee> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Source file and lines | viscosity_kernel.f90:50-94 |
Module | exec |
nb instructions | 168 |
nb uops | 172 |
loop length | 755 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 5 |
used ymm registers | 1 |
used zmm registers | 0 |
nb stack references | 43 |
micro-operation queue | 28.67 cycles |
front end | 28.67 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 12.30 | 12.20 | 10.00 | 10.00 | 22.00 | 12.20 | 12.10 | 22.00 | 22.00 | 22.00 | 12.20 | 10.00 |
cycles | 12.30 | 13.60 | 10.00 | 10.00 | 22.00 | 12.20 | 12.10 | 22.00 | 22.00 | 22.00 | 12.20 | 10.00 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 28.14-28.20 |
Stall cycles | 0.00 |
Front-end | 28.67 |
Dispatch | 22.00 |
Overall L1 | 28.67 |
all | 1% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 5% |
all | 16% |
load | 0% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 50% |
all | 3% |
load | 0% |
store | 0% |
mul | 0% |
add-sub | 0% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 10% |
all | 11% |
load | 6% |
store | 11% |
mul | 12% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 12% |
all | 14% |
load | 12% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 18% |
all | 11% |
load | 11% |
store | 11% |
mul | 12% |
add-sub | 12% |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 13% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
AND $-0x20,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SUB $0x300,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R9,0x30(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,0x28(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x40(%RBP),%EBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x38(%RBP),%EAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SUB %EBX,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOVL $0,0x24(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JS 46b2cf <viscosity_kernel_module_mp_viscosity_kernel_.DIR.OMP.PARALLEL.2+0xaf> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %RCX,%R12 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDX,%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RDI,0x48(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOVL $0,0x10(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %EAX,0xc(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVL $0x1,0x20(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB $0x8,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA 0x28(%RSP),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x2c(%RSP),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x18(%RSP),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA 0x14(%RSP),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0x53d630,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %ESI,0x1c(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x22,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH $0x1 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RAX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
CALL 404670 <__kmpc_for_static_init_4@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
ADD $0x20,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x10(%RSP),%EAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xc(%RSP),%ECX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SUB %EAX,%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %ECX,0x18(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JAE 46b2ea <viscosity_kernel_module_mp_viscosity_kernel_.DIR.OMP.PARALLEL.2+0xca> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV $0x53d650,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x14(%RSP),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
CALL 404230 <__kmpc_for_static_fini@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x48(%RSP),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RDI),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV $0x53d670,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 404740 <__kmpc_barrier@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
LEA -0x28(%RBP),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
MOV %RAX,%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV 0x50(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x48(%RBP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SAL $0x20,%R12 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV $-0x200000000,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.28 |
LEA (%R12,%RAX,1),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RCX,%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SAR $0x20,%R8 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
SAL $0x20,%R13 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
ADD %R13,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RAX,%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SAR $0x20,%R9 | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOVSXD (%RDX),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RSI),%EDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
SUB %R10D,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %EBX,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RDX,0x130(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
INC %EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMP $0x2,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x1,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVGE %EDX,%ESI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %RSI,0x38(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
AND $0x7ffffffc,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV %RSI,0xd8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
TEST %RCX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
MOV $-0x1,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVNS %RCX,%RSI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
TEST %RSI,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
MOV $0x1,%R11D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVG %R11,%RSI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV $0x200000000,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.28 |
MOV %RBX,%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
SUB %R12,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMP %RDX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVG %RCX,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
LEA (,%R10,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
SHR $0x20,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
IMUL %RSI,%RDX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV $-0x1,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SAL $0x3,%RDX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
SUB %RDX,%RCX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
TEST %RAX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
CMOVNS %RAX,%RSI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
TEST %RSI,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
CMOVG %R11,%RSI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
SUB %R13,%RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x30(%RBP),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %RBX,%RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMOVG %RAX,%RBX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
MOV %R8,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RAX,0xa8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SHR $0x20,%RBX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
IMUL %RSI,%RBX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
NEG %RBX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RBX,0xc8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV $0x8,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SUB %RDX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R9,%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %RAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RAX,0xc0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R9,0xe0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB %R9,%R11 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R11,0xd0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x20(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x18(%RBP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x10(%RBP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x8(%R9,%RCX,1),%R11 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R11,0x78(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD %RCX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RDX,0x70(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%RAX,%RCX,1),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,0x68(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%R9,%RCX,1),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,0x60(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA 0x8(%R14,%RCX,1),%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %RAX,0x158(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x28(%RSP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x8(%RDX,%RCX,1),%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %RAX,0x58(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x30(%RSP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x8(%RAX,%RCX,1),%RCX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %RCX,0x50(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R10,0xb0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,0xb8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB %R8,%R10 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R10,0x98(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%R14,%RSI,1),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RCX,0x90(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%R9,%RSI,1),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RCX,0x88(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%RDX,%RSI,1),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RCX,0x80(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD %RAX,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RSI,0xa0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVSD 0x89ecd(%RIP),%XMM21 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x8ab43(%RIP),%XMM22 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0xa6b19(%RIP),%XMM23 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0xa6b17(%RIP),%XMM25 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VBROADCASTSD 0x89ea6(%RIP),%YMM14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 3 | 0.33 |
VXORPD %XMM18,%XMM18,%XMM18 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %R9D,%R9D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDI,0xe8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %EDI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
JMP 46b50e <viscosity_kernel_module_mp_viscosity_kernel_.DIR.OMP.PARALLEL.2+0x2ee> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼viscosity_kernel_.DIR.OMP.PARALLEL.2– | 2.21 | 1.68 |
▼Loop 1026 - viscosity_kernel.f90:53-89 - exec– | 0 | 0 |
○Loop 1028 - viscosity_kernel.f90:53-89 - exec | 2.2 | 1.68 |
○Loop 1027 - viscosity_kernel.f90:55-89 - exec | 0 | 0 |