Function: __accelerate_kernel_module_MOD_accelerate_kernel._omp_fn.0 | Module: exec | Source: accelerate_kernel.f90:57-76 [...] | Coverage: 4.56% |
---|
Function: __accelerate_kernel_module_MOD_accelerate_kernel._omp_fn.0 | Module: exec | Source: accelerate_kernel.f90:57-76 [...] | Coverage: 4.56% |
---|
/scratch_na/users/xoserete/qaas_runs/171-415-7190/intel/CloverLeafFC/build/CloverLeafFC/CloverLeaf_ref/kernels/accelerate_kernel.f90: 57 - 76 |
-------------------------------------------------------------------------------- |
57: !$OMP PARALLEL |
58: |
59: !$OMP DO PRIVATE(j,k,stepbymass_s) |
60: DO k=y_min,y_max+1 |
61: !$OMP SIMD |
[...] |
67: *0.25_8) |
68: |
69: xvel1(j,k)=xvel0(j,k)-stepbymass_s*(xarea(j ,k )*(pressure(j ,k )-pressure(j-1,k )) & |
70: +xarea(j ,k-1)*(pressure(j ,k-1)-pressure(j-1,k-1))) |
71: yvel1(j,k)=yvel0(j,k)-stepbymass_s*(yarea(j ,k )*(pressure(j ,k )-pressure(j ,k-1)) & |
72: +yarea(j-1,k )*(pressure(j-1,k )-pressure(j-1,k-1))) |
73: xvel1(j,k)=xvel1(j,k)-stepbymass_s*(xarea(j ,k )*(viscosity(j ,k )-viscosity(j-1,k )) & |
74: +xarea(j ,k-1)*(viscosity(j ,k-1)-viscosity(j-1,k-1))) |
75: yvel1(j,k)=yvel1(j,k)-stepbymass_s*(yarea(j ,k )*(viscosity(j ,k )-viscosity(j ,k-1)) & |
76: +yarea(j-1,k )*(viscosity(j-1,k )-viscosity(j-1,k-1))) |
0x407180 PUSH %RBP |
0x407181 MOV %RSP,%RBP |
0x407184 PUSH %R15 |
0x407186 PUSH %R14 |
0x407188 PUSH %R13 |
0x40718a PUSH %R12 |
0x40718c PUSH %RBX |
0x40718d MOV %RDI,%RBX |
0x407190 AND $-0x20,%RSP |
0x407194 SUB $0x320,%RSP |
0x40719b MOV 0x10(%RDI),%RAX |
0x40719f MOV (%RAX),%R12D |
0x4071a2 CALL 402080 <@plt_start@+0x60> |
0x4071a7 MOV %EAX,%R13D |
0x4071aa CALL 402180 <@plt_start@+0x160> |
0x4071af MOV 0x18(%RBX),%RDX |
0x4071b3 MOV %EAX,%ECX |
0x4071b5 MOV (%RDX),%EAX |
0x4071b7 ADD $0x2,%EAX |
0x4071ba SUB %R12D,%EAX |
0x4071bd CLTD |
0x4071be IDIV %R13D |
0x4071c1 CMP %EDX,%ECX |
0x4071c3 JL 40824f |
0x4071c9 IMUL %EAX,%ECX |
0x4071cc ADD %ECX,%EDX |
0x4071ce ADD %EDX,%EAX |
0x4071d0 CMP %EAX,%EDX |
0x4071d2 JGE 40822d |
0x4071d8 ADD %R12D,%EAX |
0x4071db MOV 0x98(%RBX),%R14 |
0x4071e2 LEA (%R12,%RDX,1),%R13D |
0x4071e6 MOV 0xa0(%RBX),%RSI |
0x4071ed MOV 0x78(%RBX),%R15 |
0x4071f1 MOV (%RBX),%R12 |
0x4071f4 MOV %EAX,0xbc(%RSP) |
0x4071fb MOV 0x8(%RBX),%RAX |
0x4071ff MOV 0xb8(%RBX),%RDI |
0x407206 MOV %R14,0x1d0(%RSP) |
0x40720e MOVSXD (%R12),%RDX |
0x407212 MOV 0xa8(%RBX),%RCX |
0x407219 MOV %RSI,0xc8(%RSP) |
0x407221 MOV (%RAX),%R14D |
0x407224 MOV 0x88(%RBX),%R10 |
0x40722b MOV %R15,0xc0(%RSP) |
0x407233 MOV 0x70(%RBX),%RSI |
0x407237 MOV 0x30(%RBX),%R12 |
0x40723b MOV %RDI,0x108(%RSP) |
0x407243 MOV 0x50(%RBX),%RAX |
0x407247 LEA 0x2(%R14),%R15D |
0x40724b MOV 0xc0(%RBX),%R8 |
0x407252 MOV %R14D,0x2e0(%RSP) |
0x40725a MOV 0x20(%RBX),%R14 |
0x40725e MOV 0xb0(%RBX),%R9 |
0x407265 MOV %RCX,0x100(%RSP) |
0x40726d MOV 0x90(%RBX),%R11 |
0x407274 VMOVSD 0x80(%RBX),%XMM4 |
0x40727c MOV %R10,0xf8(%RSP) |
0x407284 MOV %RSI,0xf0(%RSP) |
0x40728c MOV %R13D,0x1dc(%RSP) |
0x407294 VMOVDDUP %XMM4,%XMM7 |
0x407298 VBROADCASTSD %XMM4,%YMM3 |
0x40729d MOV %R15D,0xb8(%RSP) |
0x4072a5 MOV 0x38(%RBX),%R15 |
0x4072a9 MOV %R12,0x2d0(%RSP) |
0x4072b1 MOV %RAX,0x280(%RSP) |
0x4072b9 MOV %R14,0x2c8(%RSP) |
0x4072c1 MOV 0x58(%RBX),%RAX |
0x4072c5 MOV 0x60(%RBX),%R12 |
0x4072c9 MOV 0x40(%RBX),%R14 |
0x4072cd MOV %R9,0x38(%RSP) |
0x4072d2 ADD %RDX,%R9 |
0x4072d5 MOV %RAX,0x270(%RSP) |
0x4072dd MOV 0x68(%RBX),%RAX |
0x4072e1 MOV %R9,0x118(%RSP) |
0x4072e9 MOV %RAX,0x260(%RSP) |
0x4072f1 LEA (,%RSI,8),%RAX |
0x4072f9 MOV %RAX,0x50(%RSP) |
0x4072fe MOVSXD %R13D,%RAX |
0x407301 MOV 0xc0(%RSP),%R13 |
0x407309 IMUL %RAX,%RSI |
0x40730d MOV %R12,0x278(%RSP) |
0x407315 MOV 0x28(%RBX),%R12 |
0x407319 ADD %RDX,%R13 |
0x40731c MOV %EDX,0x1d8(%RSP) |
0x407323 MOV %R13,0x110(%RSP) |
0x40732b MOV %RSI,0x258(%RSP) |
0x407333 ADD %R13,%RSI |
0x407336 LEA (,%RCX,8),%R13 |
0x40733e IMUL %RAX,%RCX |
0x407342 MOV %RSI,0x170(%RSP) |
0x40734a LEA (%R15,%RSI,8),%RSI |
0x40734e MOV %RSI,0x300(%RSP) |
0x407356 MOV %R13,0x48(%RSP) |
0x40735b MOV 0xd0(%RBX),%R13 |
0x407362 ADD %RCX,%R9 |
0x407365 MOV %RCX,0x250(%RSP) |
0x40736d MOV 0x2d0(%RSP),%RCX |
0x407375 MOV %R9,0x178(%RSP) |
0x40737d LEA (%RCX,%R9,8),%R9 |
0x407381 LEA (%R13,%RDX,1),%RCX |
0x407386 MOV %R13,0x2a8(%RSP) |
0x40738e MOV %R9,0x2d8(%RSP) |
0x407396 MOV 0xc8(%RBX),%R9 |
0x40739d LEA (,%RDI,8),%R13 |
0x4073a5 IMUL %RAX,%RDI |
0x4073a9 MOV %R12,0x268(%RSP) |
0x4073b1 MOV 0x48(%RBX),%R12 |
0x4073b5 LEA (,%R9,8),%RSI |
0x4073bd MOV %R9,0xb0(%RSP) |
0x4073c5 IMUL %RAX,%R9 |
0x4073c9 MOV %RSI,0xa8(%RSP) |
0x4073d1 MOV 0x280(%RSP),%RSI |
0x4073d9 MOV %R9,0x2b0(%RSP) |
0x4073e1 ADD %RCX,%R9 |
0x4073e4 MOV %R9,0x188(%RSP) |
0x4073ec LEA (%RSI,%R9,8),%R9 |
0x4073f0 LEA (,%R10,8),%RSI |
0x4073f8 MOV %R9,0x2c0(%RSP) |
0x407400 MOV 0xd8(%RBX),%R9 |
0x407407 IMUL %RAX,%R10 |
0x40740b MOV %R8,0x40(%RSP) |
0x407410 LEA (%R8,%RDX,1),%R8 |
0x407414 MOV 0x2c8(%RSP),%RCX |
0x40741c MOV %R13,0xa0(%RSP) |
0x407424 LEA (,%R9,8),%R13 |
0x40742c MOV %R8,0x120(%RSP) |
0x407434 MOV %RDI,0x2a0(%RSP) |
0x40743c ADD %R8,%RDI |
0x40743f MOV 0xe0(%RBX),%R8 |
0x407446 MOV %R9,0x90(%RSP) |
0x40744e IMUL %RAX,%R9 |
0x407452 MOV %R11,0x30(%RSP) |
0x407457 ADD %RDX,%R11 |
0x40745a MOV %R13,0x88(%RSP) |
0x407462 MOV 0xf8(%RBX),%R13 |
0x407469 MOV %RDI,0x168(%RSP) |
0x407471 LEA (%RCX,%RDI,8),%RDI |
0x407475 LEA (%R8,%RDX,1),%RCX |
0x407479 MOV %RSI,0x98(%RSP) |
0x407481 MOV 0x278(%RSP),%RSI |
0x407489 MOV %R11,0x128(%RSP) |
0x407491 ADD %R10,%R11 |
0x407494 MOV %RDI,0x308(%RSP) |
0x40749c LEA (%RCX,%R9,1),%RDI |
0x4074a0 MOV 0x100(%RBX),%RCX |
0x4074a7 MOV %R11,0x180(%RSP) |
0x4074af LEA (%R14,%R11,8),%R11 |
0x4074b3 MOV %R8,0x298(%RSP) |
0x4074bb LEA (,%R13,8),%R8 |
0x4074c3 MOV %R13,0x80(%RSP) |
0x4074cb IMUL %RAX,%R13 |
0x4074cf MOV %R11,0x318(%RSP) |
0x4074d7 MOV %R9,%R11 |
0x4074da LEA (%RSI,%RDI,8),%R9 |
0x4074de MOV %RDI,0x160(%RSP) |
0x4074e6 LEA (%RCX,%RDX,1),%RDI |
0x4074ea MOV %R9,0xe8(%RSP) |
0x4074f2 MOV 0x270(%RSP),%R9 |
0x4074fa LEA (%RDI,%R13,1),%RSI |
0x4074fe MOV %R8,0x78(%RSP) |
0x407503 MOV 0xe8(%RBX),%R8 |
0x40750a MOV %RCX,0x288(%RSP) |
0x407512 MOV %R13,0x290(%RSP) |
0x40751a LEA (,%R8,8),%RCX |
0x407522 LEA (%R9,%RSI,8),%R13 |
0x407526 MOV %RSI,0x158(%RSP) |
0x40752e MOV %R13,0x2b8(%RSP) |
0x407536 MOV %R8,0x70(%RSP) |
0x40753b IMUL %RAX,%R8 |
0x40753f MOV %RCX,0x68(%RSP) |
0x407544 MOV 0xf0(%RBX),%R9 |
0x40754b MOV 0x268(%RSP),%R13 |
0x407553 LEA (%R9,%RDX,1),%RDI |
0x407557 ADD %R8,%R9 |
0x40755a LEA (%RDI,%R8,1),%RSI |
0x40755e LEA (%R13,%RSI,8),%RCX |
0x407563 MOV %RSI,0x150(%RSP) |
0x40756b MOV 0x108(%RBX),%RSI |
0x407572 MOV 0x260(%RSP),%R13 |
0x40757a MOV %RCX,0x310(%RSP) |
0x407582 LEA (,%RSI,8),%RDI |
0x40758a MOV %RSI,0x138(%RSP) |
0x407592 MOV %RDI,0x60(%RSP) |
0x407597 IMUL %RAX,%RSI |
0x40759b MOV 0x110(%RBX),%RDI |
0x4075a2 LEA (%RDI,%RDX,1),%RBX |
0x4075a6 LEA (%RBX,%RSI,1),%RCX |
0x4075aa LEA (%RSI,%RDI,1),%R8 |
0x4075ae LEA (%R13,%RCX,8),%RBX |
0x4075b3 MOV %RCX,0x148(%RSP) |
0x4075bb MOV 0x1d0(%RSP),%RCX |
0x4075c3 MOV %RBX,0xe0(%RSP) |
0x4075cb MOV 0xc8(%RSP),%RBX |
0x4075d3 IMUL %RCX,%RAX |
0x4075d7 LEA (,%RCX,8),%R13 |
0x4075df LEA (%RBX,%RDX,1),%RDX |
0x4075e3 MOV %R13,0x58(%RSP) |
0x4075e8 MOV 0x258(%RSP),%RBX |
0x4075f0 MOV %RDX,0x130(%RSP) |
0x4075f8 MOV 0xc0(%RSP),%R13 |
0x407600 ADD %RAX,%RDX |
0x407603 LEA (%R12,%RDX,8),%RCX |
0x407607 MOV %RDX,0x140(%RSP) |
0x40760f MOV 0x250(%RSP),%RDX |
0x407617 ADD %RBX,%R13 |
0x40761a MOV %RCX,0xd8(%RSP) |
0x407622 MOV 0x38(%RSP),%RCX |
0x407627 MOV %R13,0x258(%RSP) |
0x40762f MOV 0x2a8(%RSP),%R13 |
0x407637 LEA (%RDX,%RCX,1),%RBX |
0x40763b MOV 0x2b0(%RSP),%RDX |
0x407643 MOV 0x2a0(%RSP),%RCX |
0x40764b MOV %RBX,0x210(%RSP) |
0x407653 MOV 0x40(%RSP),%RBX |
0x407658 ADD %RDX,%R13 |
0x40765b MOV %R13,0x218(%RSP) |
0x407663 LEA (%RCX,%RBX,1),%RDX |
0x407667 MOV 0x30(%RSP),%R13 |
0x40766c MOV 0x298(%RSP),%RCX |
0x407674 MOV %RDX,0x220(%RSP) |
0x40767c LEA (%R10,%R13,1),%R10 |
0x407680 LEA (%R11,%RCX,1),%R11 |
0x407684 MOV %R10,0x228(%RSP) |
0x40768c MOV %R11,0x230(%RSP) |
0x407694 MOV 0x1d8(%RSP),%EDI |
0x40769b MOV 0x2e0(%RSP),%ESI |
0x4076a2 MOV 0x290(%RSP),%RBX |
0x4076aa MOV %R9,0x240(%RSP) |
0x4076b2 MOV 0xc8(%RSP),%R9 |
0x4076ba MOV 0x288(%RSP),%RDX |
0x4076c2 MOV %R8,0x248(%RSP) |
0x4076ca SUB %EDI,%ESI |
0x4076cc VMOVSD 0x7d6ac(%RIP),%XMM5 |
0x4076d4 LEA 0x2(%RSI),%R13D |
0x4076d8 ADD %RAX,%R9 |
0x4076db ADD %RBX,%RDX |
0x4076de MOV %ESI,0x24(%RSP) |
0x4076e2 MOV %R13D,%EAX |
0x4076e5 MOV %R13D,%R10D |
0x4076e8 LEA 0x1(%RSI),%ECX |
0x4076eb AND $0x3,%R13D |
0x4076ef AND $-0x4,%R10D |
0x4076f3 SHR $0x2,%EAX |
0x4076f6 MOV %RDX,0x238(%RSP) |
0x4076fe VMOVDDUP %XMM5,%XMM6 |
0x407702 MOV %R10D,0x20(%RSP) |
0x407707 SAL $0x5,%RAX |
0x40770b ADD %EDI,%R10D |
0x40770e VBROADCASTSD %XMM5,%YMM2 |
0x407713 MOV %R9,0x250(%RSP) |
0x40771b MOV %RAX,0x208(%RSP) |
0x407723 MOV %R10D,0x1c(%RSP) |
0x407728 MOV %ECX,0x2c(%RSP) |
0x40772c MOV %R13D,0x28(%RSP) |
0x407731 NOPL (%RAX) |
(15) 0x407738 MOV 0xb8(%RSP),%R11D |
(15) 0x407740 CMP %R11D,0x1d8(%RSP) |
(15) 0x407748 JGE 408084 |
(15) 0x40774e MOV 0x1dc(%RSP),%EAX |
(15) 0x407755 MOV 0xf0(%RSP),%R8 |
(15) 0x40775d MOV 0xc0(%RSP),%RBX |
(15) 0x407765 MOV 0x100(%RSP),%R9 |
(15) 0x40776d DEC %EAX |
(15) 0x40776f MOV 0x108(%RSP),%R10 |
(15) 0x407777 MOV 0x38(%RSP),%RSI |
(15) 0x40777c CLTQ |
(15) 0x40777e MOV 0x40(%RSP),%R13 |
(15) 0x407783 MOV 0x30(%RSP),%R11 |
(15) 0x407788 IMUL %RAX,%R8 |
(15) 0x40778c IMUL %RAX,%R9 |
(15) 0x407790 IMUL %RAX,%R10 |
(15) 0x407794 LEA (%RBX,%R8,1),%RDX |
(15) 0x407798 MOV 0xf8(%RSP),%RBX |
(15) 0x4077a0 MOV %R8,0x1c8(%RSP) |
(15) 0x4077a8 MOV %RDX,0x200(%RSP) |
(15) 0x4077b0 MOV 0x1d0(%RSP),%RDX |
(15) 0x4077b8 LEA (%RSI,%R9,1),%RDI |
(15) 0x4077bc IMUL %RAX,%RBX |
(15) 0x4077c0 MOV 0xc8(%RSP),%RSI |
(15) 0x4077c8 LEA (%R13,%R10,1),%RCX |
(15) 0x4077cd MOV %R9,0x1c0(%RSP) |
(15) 0x4077d5 IMUL %RDX,%RAX |
(15) 0x4077d9 MOV %RDI,0x1f8(%RSP) |
(15) 0x4077e1 MOV %R10,0x1b8(%RSP) |
(15) 0x4077e9 ADD %RBX,%R11 |
(15) 0x4077ec MOV %RCX,0x1f0(%RSP) |
(15) 0x4077f4 ADD %RAX,%RSI |
(15) 0x4077f7 CMPL $0x2,0x2c(%RSP) |
(15) 0x4077fc MOV %RBX,0x1b0(%RSP) |
(15) 0x407804 MOV %RAX,%R13 |
(15) 0x407807 MOV %R11,0x1e8(%RSP) |
(15) 0x40780f MOV %RAX,0x190(%RSP) |
(15) 0x407817 MOV %RSI,0x1e0(%RSP) |
(15) 0x40781f JBE 408240 |
(15) 0x407825 MOV 0x110(%RSP),%RDI |
(15) 0x40782d MOV 0x118(%RSP),%R11 |
(15) 0x407835 MOV %R15,0x1a8(%RSP) |
(15) 0x40783d MOV 0x2d0(%RSP),%RDX |
(15) 0x407845 MOV %R12,0xd0(%RSP) |
(15) 0x40784d LEA (%R8,%RDI,1),%R8 |
(15) 0x407851 ADD %R11,%R9 |
(15) 0x407854 MOV 0x300(%RSP),%RDI |
(15) 0x40785c MOV 0x318(%RSP),%R11 |
(15) 0x407864 SAL $0x3,%R8 |
(15) 0x407868 SAL $0x3,%R9 |
(15) 0x40786c MOV %R14,0x1a0(%RSP) |
(15) 0x407874 LEA -0x8(%R15,%R8,1),%RCX |
(15) 0x407879 LEA (%R15,%R8,1),%RAX |
(15) 0x40787d MOV 0x2d8(%RSP),%R8 |
(15) 0x407885 SUB $0x8,%RDI |
(15) 0x407889 MOV %RCX,0x2b0(%RSP) |
(15) 0x407891 LEA -0x8(%RDX,%R9,1),%RSI |
(15) 0x407896 LEA (%RDX,%R9,1),%R9 |
(15) 0x40789a MOV 0x120(%RSP),%RDX |
(15) 0x4078a2 LEA -0x8(%R8),%RCX |
(15) 0x4078a6 MOV %RAX,0x2a0(%RSP) |
(15) 0x4078ae MOV 0x128(%RSP),%RAX |
(15) 0x4078b6 LEA -0x8(%R11),%R11 |
(15) 0x4078ba MOV %RCX,0x288(%RSP) |
(15) 0x4078c2 MOV 0x130(%RSP),%RCX |
(15) 0x4078ca LEA (%R10,%RDX,1),%R10 |
(15) 0x4078ce LEA (%RBX,%RAX,1),%RBX |
(15) 0x4078d2 MOV %RSI,0x2a8(%RSP) |
(15) 0x4078da MOV 0x2c8(%RSP),%RSI |
(15) 0x4078e2 XOR %EAX,%EAX |
(15) 0x4078e4 SAL $0x3,%RBX |
(15) 0x4078e8 ADD %RCX,%R13 |
(15) 0x4078eb MOV %R9,0x298(%RSP) |
(15) 0x4078f3 SAL $0x3,%R13 |
(15) 0x4078f7 LEA (%R14,%RBX,1),%R9 |
(15) 0x4078fb LEA -0x8(%R14,%RBX,1),%R8 |
(15) 0x407900 MOV %RDI,0x290(%RSP) |
(15) 0x407908 MOV 0xd8(%RSP),%RBX |
(15) 0x407910 MOV 0x310(%RSP),%RDI |
(15) 0x407918 LEA (%R12,%R13,1),%RCX |
(15) 0x40791c LEA -0x8(%R12,%R13,1),%RDX |
(15) 0x407921 MOV 0xe8(%RSP),%R12 |
(15) 0x407929 MOV 0xe0(%RSP),%R13 |
(15) 0x407931 LEA (%RSI,%R10,8),%R10 |
(15) 0x407935 LEA -0x8(%RDI),%RDI |
(15) 0x407939 LEA -0x8(%RBX),%RSI |
(15) 0x40793d MOV %RBX,%R14 |
(16) 0x407940 MOV 0x298(%RSP),%R15 |
(16) 0x407948 MOV 0x2a0(%RSP),%RBX |
(16) 0x407950 VMOVUPD (%R15,%RAX,1),%YMM0 |
(16) 0x407956 MOV 0x2b0(%RSP),%R15 |
(16) 0x40795e VMULPD (%RBX,%RAX,1),%YMM0,%YMM8 |
(16) 0x407963 VMOVUPD (%R15,%RAX,1),%YMM1 |
(16) 0x407969 VMOVAPD %YMM0,0x2e0(%RSP) |
(16) 0x407972 MOV 0x2a8(%RSP),%RBX |
(16) 0x40797a MOV 0x290(%RSP),%R15 |
(16) 0x407982 VMOVUPD (%R15,%RAX,1),%YMM9 |
(16) 0x407988 MOV 0x2d8(%RSP),%R15 |
(16) 0x407990 VFMADD231PD (%RBX,%RAX,1),%YMM1,%YMM8 |
(16) 0x407996 MOV 0x288(%RSP),%RBX |
(16) 0x40799e VMULPD (%RBX,%RAX,1),%YMM9,%YMM10 |
(16) 0x4079a3 MOV 0x300(%RSP),%RBX |
(16) 0x4079ab VMOVUPD (%RBX,%RAX,1),%YMM11 |
(16) 0x4079b0 MOV 0x318(%RSP),%RBX |
(16) 0x4079b8 VMOVUPD (%RBX,%RAX,1),%YMM15 |
(16) 0x4079bd MOV 0x2c0(%RSP),%RBX |
(16) 0x4079c5 VFMADD231PD (%R15,%RAX,1),%YMM11,%YMM10 |
(16) 0x4079cb MOV 0x308(%RSP),%R15 |
(16) 0x4079d3 VSUBPD (%R11,%RAX,1),%YMM15,%YMM0 |
(16) 0x4079d9 VADDPD %YMM10,%YMM8,%YMM12 |
(16) 0x4079de VMOVUPD (%R9,%RAX,1),%YMM8 |
(16) 0x4079e4 VSUBPD (%R8,%RAX,1),%YMM8,%YMM1 |
(16) 0x4079ea VMULPD %YMM2,%YMM12,%YMM13 |
(16) 0x4079ee VMULPD (%R10,%RAX,1),%YMM1,%YMM9 |
(16) 0x4079f4 VDIVPD %YMM13,%YMM3,%YMM14 |
(16) 0x4079f9 VFMADD132PD (%R15,%RAX,1),%YMM9,%YMM0 |
(16) 0x4079ff MOV 0x318(%RSP),%R15 |
(16) 0x407a07 VFNMADD213PD (%RBX,%RAX,1),%YMM14,%YMM0 |
(16) 0x407a0d VMOVUPD %YMM0,(%R12,%RAX,1) |
(16) 0x407a13 VMOVUPD (%R15,%RAX,1),%YMM10 |
(16) 0x407a19 VMOVUPD (%R11,%RAX,1),%YMM11 |
(16) 0x407a1f VSUBPD (%R9,%RAX,1),%YMM10,%YMM12 |
(16) 0x407a25 VSUBPD (%R8,%RAX,1),%YMM11,%YMM13 |
(16) 0x407a2b MOV 0x310(%RSP),%RBX |
(16) 0x407a33 MOV 0x2b8(%RSP),%R15 |
(16) 0x407a3b VMULPD (%RDI,%RAX,1),%YMM13,%YMM15 |
(16) 0x407a40 VFMADD132PD (%RBX,%RAX,1),%YMM15,%YMM12 |
(16) 0x407a46 MOV 0x308(%RSP),%RBX |
(16) 0x407a4e VFNMADD213PD (%R15,%RAX,1),%YMM14,%YMM12 |
(16) 0x407a54 MOV 0x310(%RSP),%R15 |
(16) 0x407a5c VMOVUPD %YMM12,(%R13,%RAX,1) |
(16) 0x407a63 VMOVUPD (%RCX,%RAX,1),%YMM8 |
(16) 0x407a68 VMOVUPD (%R14,%RAX,1),%YMM0 |
(16) 0x407a6e VSUBPD (%RDX,%RAX,1),%YMM8,%YMM9 |
(16) 0x407a73 VSUBPD (%RSI,%RAX,1),%YMM0,%YMM1 |
(16) 0x407a78 VMULPD (%R10,%RAX,1),%YMM9,%YMM10 |
(16) 0x407a7e VFMADD132PD (%RBX,%RAX,1),%YMM10,%YMM1 |
(16) 0x407a84 MOV 0x208(%RSP),%RBX |
(16) 0x407a8c VFNMADD213PD (%R12,%RAX,1),%YMM14,%YMM1 |
(16) 0x407a92 VMOVUPD %YMM1,(%R12,%RAX,1) |
(16) 0x407a98 VMOVUPD (%RSI,%RAX,1),%YMM13 |
(16) 0x407a9d VMOVUPD (%R14,%RAX,1),%YMM12 |
(16) 0x407aa3 VSUBPD (%RDX,%RAX,1),%YMM13,%YMM15 |
(16) 0x407aa8 VSUBPD (%RCX,%RAX,1),%YMM12,%YMM11 |
(16) 0x407aad VMULPD (%RDI,%RAX,1),%YMM15,%YMM0 |
(16) 0x407ab2 VFMADD132PD (%R15,%RAX,1),%YMM0,%YMM11 |
(16) 0x407ab8 VFNMADD213PD (%R13,%RAX,1),%YMM11,%YMM14 |
(16) 0x407abf VMOVUPD %YMM14,(%R13,%RAX,1) |
(16) 0x407ac6 ADD $0x20,%RAX |
(16) 0x407aca CMP %RBX,%RAX |
(16) 0x407acd JNE 407940 |
(15) 0x407ad3 MOV 0x28(%RSP),%R11D |
(15) 0x407ad8 MOV 0x1a8(%RSP),%R15 |
(15) 0x407ae0 MOV 0x1a0(%RSP),%R14 |
(15) 0x407ae8 MOV 0xd0(%RSP),%R12 |
(15) 0x407af0 TEST %R11D,%R11D |
(15) 0x407af3 JE 408084 |
(15) 0x407af9 MOV 0x20(%RSP),%EAX |
(15) 0x407afd MOV 0x1c(%RSP),%R9D |
(15) 0x407b02 MOV 0x24(%RSP),%R10D |
(15) 0x407b07 SUB %EAX,%R10D |
(15) 0x407b0a LEA 0x2(%R10),%R8D |
(15) 0x407b0e MOV %R8D,0xd0(%RSP) |
(15) 0x407b16 CMP $-0x1,%R10D |
(15) 0x407b1a JE 407e7e |
(15) 0x407b20 MOV 0x1c8(%RSP),%RDI |
(15) 0x407b28 MOV 0x110(%RSP),%RSI |
(15) 0x407b30 MOV 0x1c0(%RSP),%RDX |
(15) 0x407b38 MOV 0x118(%RSP),%RCX |
(15) 0x407b40 MOV 0x170(%RSP),%R11 |
(15) 0x407b48 ADD %RSI,%RDI |
(15) 0x407b4b MOV 0x178(%RSP),%R10 |
(15) 0x407b53 LEA (%RDI,%RAX,1),%RBX |
(15) 0x407b57 ADD %RCX,%RDX |
(15) 0x407b5a MOV 0x188(%RSP),%RDI |
(15) 0x407b62 MOV 0x168(%RSP),%RSI |
(15) 0x407b6a ADD %RAX,%R11 |
(15) 0x407b6d LEA (%RDX,%RAX,1),%R13 |
(15) 0x407b71 LEA (%R10,%RAX,1),%R8 |
(15) 0x407b75 MOV %R11,0x2a0(%RSP) |
(15) 0x407b7d MOV 0x180(%RSP),%R11 |
(15) 0x407b85 LEA (%RSI,%RAX,1),%RDX |
(15) 0x407b89 MOV %R13,0x1a8(%RSP) |
(15) 0x407b91 LEA (%RDI,%RAX,1),%R13 |
(15) 0x407b95 MOV 0x2c8(%RSP),%RDI |
(15) 0x407b9d LEA (%R11,%RAX,1),%R10 |
(15) 0x407ba1 MOV 0x1b8(%RSP),%RSI |
(15) 0x407ba9 MOV %R8,0x298(%RSP) |
(15) 0x407bb1 LEA (%RDI,%RDX,8),%RCX |
(15) 0x407bb5 SAL $0x3,%R10 |
(15) 0x407bb9 MOV 0x120(%RSP),%RDX |
(15) 0x407bc1 LEA (%R14,%R10,1),%R11 |
(15) 0x407bc5 LEA -0x8(%R14,%R10,1),%R8 |
(15) 0x407bca MOV %RCX,0x290(%RSP) |
(15) 0x407bd2 MOV 0x128(%RSP),%R10 |
(15) 0x407bda MOV 0x1b0(%RSP),%RCX |
(15) 0x407be2 ADD %RDX,%RSI |
(15) 0x407be5 MOV 0x278(%RSP),%RDX |
(15) 0x407bed MOV %R8,0x288(%RSP) |
(15) 0x407bf5 ADD %RAX,%RSI |
(15) 0x407bf8 ADD %R10,%RCX |
(15) 0x407bfb LEA (%RDI,%RSI,8),%RDI |
(15) 0x407bff MOV 0x160(%RSP),%RSI |
(15) 0x407c07 ADD %RAX,%RCX |
(15) 0x407c0a MOV %RDI,0x2e0(%RSP) |
(15) 0x407c12 SAL $0x3,%RCX |
(15) 0x407c16 ADD %RAX,%RSI |
(15) 0x407c19 LEA -0x8(%R14,%RCX,1),%R8 |
(15) 0x407c1e LEA (%R14,%RCX,1),%R10 |
(15) 0x407c22 MOV 0x158(%RSP),%RCX |
(15) 0x407c2a MOV %R8,0x2b0(%RSP) |
(15) 0x407c32 MOV 0x150(%RSP),%R8 |
(15) 0x407c3a LEA (%RDX,%RSI,8),%RDI |
(15) 0x407c3e MOV %RDI,0x1c8(%RSP) |
(15) 0x407c46 MOV 0x268(%RSP),%RDI |
(15) 0x407c4e ADD %RAX,%RCX |
(15) 0x407c51 LEA (%RAX,%R8,1),%RSI |
(15) 0x407c55 MOV %RCX,0x1a0(%RSP) |
(15) 0x407c5d MOV 0x148(%RSP),%R8 |
(15) 0x407c65 SAL $0x3,%RSI |
(15) 0x407c69 LEA (%RDI,%RSI,1),%RDX |
(15) 0x407c6d LEA -0x8(%RDI,%RSI,1),%RCX |
(15) 0x407c72 MOV 0x260(%RSP),%RDI |
(15) 0x407c7a MOV %RCX,0x1b8(%RSP) |
(15) 0x407c82 LEA (%RAX,%R8,1),%RSI |
(15) 0x407c86 MOV %RDX,0x1c0(%RSP) |
(15) 0x407c8e MOV 0x140(%RSP),%RDX |
(15) 0x407c96 LEA (%RDI,%RSI,8),%RCX |
(15) 0x407c9a VMOVUPD (%R15,%RBX,8),%XMM1 |
(15) 0x407ca0 VMOVUPD -0x8(%R15,%RBX,8),%XMM12 |
(15) 0x407ca7 LEA (%RAX,%RDX,1),%RSI |
(15) 0x407cab MOV 0x190(%RSP),%RDX |
(15) 0x407cb3 MOV 0x288(%RSP),%RBX |
(15) 0x407cbb SAL $0x3,%RSI |
(15) 0x407cbf VMOVUPD (%R11),%XMM15 |
(15) 0x407cc4 LEA (%R12,%RSI,1),%R8 |
(15) 0x407cc8 LEA -0x8(%R12,%RSI,1),%RDI |
(15) 0x407ccd MOV 0x130(%RSP),%RSI |
(15) 0x407cd5 ADD %RSI,%RDX |
(15) 0x407cd8 MOV 0x298(%RSP),%RSI |
(15) 0x407ce0 ADD %RDX,%RAX |
(15) 0x407ce3 SAL $0x3,%RAX |
(15) 0x407ce7 LEA (%R12,%RAX,1),%RDX |
(15) 0x407ceb LEA -0x8(%R12,%RAX,1),%RAX |
(15) 0x407cf0 MOV %RDX,0x2a8(%RSP) |
(15) 0x407cf8 MOV 0x2d0(%RSP),%RDX |
(15) 0x407d00 MOV %RAX,0x1b0(%RSP) |
(15) 0x407d08 MOV 0x2a0(%RSP),%RAX |
(15) 0x407d10 VMOVUPD (%RDX,%RSI,8),%XMM14 |
(15) 0x407d15 MOV 0x1a8(%RSP),%RSI |
(15) 0x407d1d VMULPD (%R15,%RAX,8),%XMM14,%XMM8 |
(15) 0x407d23 MOV 0x298(%RSP),%RAX |
(15) 0x407d2b VMOVAPD %XMM14,0x190(%RSP) |
(15) 0x407d34 VSUBPD (%RBX),%XMM15,%XMM14 |
(15) 0x407d38 VMOVUPD -0x8(%RDX,%RAX,8),%XMM9 |
(15) 0x407d3e MOV 0x2a0(%RSP),%RAX |
(15) 0x407d46 VMULPD -0x8(%R15,%RAX,8),%XMM9,%XMM10 |
(15) 0x407d4d MOV 0x2e0(%RSP),%RAX |
(15) 0x407d55 VFMADD231PD (%RDX,%RSI,8),%XMM1,%XMM8 |
(15) 0x407d5b VFMADD231PD -0x8(%RDX,%RSI,8),%XMM12,%XMM10 |
(15) 0x407d62 MOV 0x2b0(%RSP),%RSI |
(15) 0x407d6a MOV 0x280(%RSP),%RDX |
(15) 0x407d72 VADDPD %XMM10,%XMM8,%XMM11 |
(15) 0x407d77 VMOVUPD (%R10),%XMM8 |
(15) 0x407d7c VSUBPD (%RSI),%XMM8,%XMM1 |
(15) 0x407d80 VMULPD %XMM6,%XMM11,%XMM13 |
(15) 0x407d84 VMULPD (%RAX),%XMM1,%XMM9 |
(15) 0x407d88 MOV 0x290(%RSP),%RAX |
(15) 0x407d90 VDIVPD %XMM13,%XMM7,%XMM0 |
(15) 0x407d95 VFMADD132PD (%RAX),%XMM9,%XMM14 |
(15) 0x407d9a VFNMADD213PD (%RDX,%R13,8),%XMM0,%XMM14 |
(15) 0x407da0 MOV 0x1c8(%RSP),%RDX |
(15) 0x407da8 MOV 0x2b0(%RSP),%R13 |
(15) 0x407db0 MOV 0x1a0(%RSP),%RSI |
(15) 0x407db8 VMOVUPD %XMM14,(%RDX) |
(15) 0x407dbc VMOVUPD (%RBX),%XMM11 |
(15) 0x407dc0 VMOVUPD (%R11),%XMM10 |
(15) 0x407dc5 MOV 0x1b8(%RSP),%R11 |
(15) 0x407dcd MOV 0x270(%RSP),%RBX |
(15) 0x407dd5 VSUBPD (%R13),%XMM11,%XMM13 |
(15) 0x407ddb VSUBPD (%R10),%XMM10,%XMM12 |
(15) 0x407de0 MOV 0x1c0(%RSP),%R10 |
(15) 0x407de8 MOV 0x2a8(%RSP),%R13 |
(15) 0x407df0 VMULPD (%R11),%XMM13,%XMM15 |
(15) 0x407df5 VFMADD132PD (%R10),%XMM15,%XMM12 |
(15) 0x407dfa VFNMADD213PD (%RBX,%RSI,8),%XMM0,%XMM12 |
(15) 0x407e00 MOV 0x1b0(%RSP),%RSI |
(15) 0x407e08 MOV 0x2e0(%RSP),%RBX |
(15) 0x407e10 VMOVUPD %XMM12,(%RCX) |
(15) 0x407e14 VMOVUPD (%R13),%XMM8 |
(15) 0x407e1a VMOVUPD (%R8),%XMM14 |
(15) 0x407e1f VSUBPD (%RSI),%XMM8,%XMM9 |
(15) 0x407e23 VSUBPD (%RDI),%XMM14,%XMM1 |
(15) 0x407e27 VMULPD (%RBX),%XMM9,%XMM10 |
(15) 0x407e2b VFMADD132PD (%RAX),%XMM10,%XMM1 |
(15) 0x407e30 VFNMADD213PD (%RDX),%XMM0,%XMM1 |
(15) 0x407e35 VMOVUPD %XMM1,(%RDX) |
(15) 0x407e39 VMOVUPD (%RDI),%XMM13 |
(15) 0x407e3d VMOVUPD (%R8),%XMM12 |
(15) 0x407e42 MOV 0x2a8(%RSP),%R8 |
(15) 0x407e4a VSUBPD (%RSI),%XMM13,%XMM15 |
(15) 0x407e4e VSUBPD (%R8),%XMM12,%XMM11 |
(15) 0x407e53 VMULPD (%R11),%XMM15,%XMM14 |
(15) 0x407e58 VFMADD132PD (%R10),%XMM14,%XMM11 |
(15) 0x407e5d VFNMADD213PD (%RCX),%XMM11,%XMM0 |
(15) 0x407e62 VMOVUPD %XMM0,(%RCX) |
(15) 0x407e66 MOV 0xd0(%RSP),%ECX |
(15) 0x407e6d TEST $0x1,%CL |
(15) 0x407e70 JE 408084 |
(15) 0x407e76 MOV %ECX,%EDI |
(15) 0x407e78 AND $-0x2,%EDI |
(15) 0x407e7b ADD %EDI,%R9D |
(15) 0x407e7e MOV 0x200(%RSP),%R13 |
(15) 0x407e86 LEA -0x1(%R9),%EAX |
(15) 0x407e8a MOV 0x258(%RSP),%R11 |
(15) 0x407e92 MOVSXD %EAX,%RDX |
(15) 0x407e95 MOVSXD %R9D,%RAX |
(15) 0x407e98 MOV 0x210(%RSP),%RBX |
(15) 0x407ea0 MOV 0x1f8(%RSP),%RSI |
(15) 0x407ea8 LEA (%R13,%RDX,1),%R8 |
(15) 0x407ead ADD %RAX,%R13 |
(15) 0x407eb0 LEA (%R11,%RAX,1),%R10 |
(15) 0x407eb4 VMOVSD (%R15,%R13,8),%XMM1 |
(15) 0x407eba LEA (%R11,%RDX,1),%R13 |
(15) 0x407ebe VMOVSD (%R15,%R10,8),%XMM0 |
(15) 0x407ec4 MOV %RBX,%R9 |
(15) 0x407ec7 MOV 0x2d0(%RSP),%R10 |
(15) 0x407ecf VMOVSD (%R15,%R13,8),%XMM9 |
(15) 0x407ed5 LEA (%RBX,%RDX,1),%RCX |
(15) 0x407ed9 ADD %RAX,%R9 |
(15) 0x407edc VMOVSD (%R15,%R8,8),%XMM12 |
(15) 0x407ee2 LEA (%RSI,%RDX,1),%RDI |
(15) 0x407ee6 ADD %RAX,%RSI |
(15) 0x407ee9 MOV 0x1e8(%RSP),%R11 |
(15) 0x407ef1 VMULSD (%R10,%R9,8),%XMM0,%XMM8 |
(15) 0x407ef7 MOV 0x220(%RSP),%R8 |
(15) 0x407eff VMULSD (%R10,%RCX,8),%XMM9,%XMM10 |
(15) 0x407f05 LEA (%R11,%RAX,1),%RCX |
(15) 0x407f09 LEA (%R11,%RDX,1),%R13 |
(15) 0x407f0d MOV 0x280(%RSP),%RBX |
(15) 0x407f15 LEA (%R8,%RAX,1),%R9 |
(15) 0x407f19 VFMADD231SD (%R10,%RSI,8),%XMM1,%XMM8 |
(15) 0x407f1f MOV 0x228(%RSP),%RSI |
(15) 0x407f27 VFMADD231SD (%R10,%RDI,8),%XMM12,%XMM10 |
(15) 0x407f2d MOV 0x1f0(%RSP),%R10 |
(15) 0x407f35 LEA (%RSI,%RAX,1),%R8 |
(15) 0x407f39 ADD %RDX,%RSI |
(15) 0x407f3c MOV 0x218(%RSP),%RDI |
(15) 0x407f44 ADD %RAX,%R10 |
(15) 0x407f47 VMOVSD (%R14,%R8,8),%XMM14 |
(15) 0x407f4d ADD %RAX,%RDI |
(15) 0x407f50 VSUBSD (%R14,%RSI,8),%XMM14,%XMM0 |
(15) 0x407f56 MOV 0x230(%RSP),%RSI |
(15) 0x407f5e VADDSD %XMM10,%XMM8,%XMM11 |
(15) 0x407f63 VMOVSD (%R14,%RCX,8),%XMM8 |
(15) 0x407f69 LEA (%RSI,%RAX,1),%R11 |
(15) 0x407f6d VSUBSD (%R14,%R13,8),%XMM8,%XMM1 |
(15) 0x407f73 MOV 0x2c8(%RSP),%R13 |
(15) 0x407f7b VMULSD %XMM5,%XMM11,%XMM13 |
(15) 0x407f7f VMULSD (%R13,%R10,8),%XMM1,%XMM9 |
(15) 0x407f86 VDIVSD %XMM13,%XMM4,%XMM15 |
(15) 0x407f8b VFMADD132SD (%R13,%R9,8),%XMM9,%XMM0 |
(15) 0x407f92 VFNMADD213SD (%RBX,%RDI,8),%XMM15,%XMM0 |
(15) 0x407f98 MOV 0x278(%RSP),%RDI |
(15) 0x407fa0 LEA (%RDI,%R11,8),%RSI |
(15) 0x407fa4 MOV 0x238(%RSP),%R11 |
(15) 0x407fac MOV 0x240(%RSP),%RDI |
(15) 0x407fb4 ADD %RAX,%RDI |
(15) 0x407fb7 LEA (%R11,%RAX,1),%R11 |
(15) 0x407fbb VMOVSD %XMM0,(%RSI) |
(15) 0x407fbf MOV 0x268(%RSP),%RBX |
(15) 0x407fc7 VMOVUPD -0x8(%R14,%R8,8),%XMM10 |
(15) 0x407fce MOV 0x248(%RSP),%R8 |
(15) 0x407fd6 VSUBPD -0x8(%R14,%RCX,8),%XMM10,%XMM12 |
(15) 0x407fdd LEA (%RBX,%RDI,8),%RDI |
(15) 0x407fe1 MOV 0x270(%RSP),%RBX |
(15) 0x407fe9 LEA (%R8,%RAX,1),%RCX |
(15) 0x407fed VMULPD -0x8(%RDI),%XMM12,%XMM11 |
(15) 0x407ff2 VUNPCKHPD %XMM11,%XMM11,%XMM13 |
(15) 0x407ff7 VADDPD %XMM11,%XMM13,%XMM14 |
(15) 0x407ffc VFNMADD213SD (%RBX,%R11,8),%XMM15,%XMM14 |
(15) 0x408002 MOV 0x260(%RSP),%R11 |
(15) 0x40800a MOV 0x1e0(%RSP),%RBX |
(15) 0x408012 LEA (%R11,%RCX,8),%RCX |
(15) 0x408016 MOV 0x250(%RSP),%R11 |
(15) 0x40801e LEA (%R11,%RAX,1),%R8 |
(15) 0x408022 ADD %RBX,%RAX |
(15) 0x408025 ADD %RDX,%R11 |
(15) 0x408028 ADD %RBX,%RDX |
(15) 0x40802b VMOVSD %XMM14,(%RCX) |
(15) 0x40802f VMOVSD (%R12,%RAX,8),%XMM8 |
(15) 0x408035 VMOVSD (%R12,%R8,8),%XMM0 |
(15) 0x40803b VSUBSD (%R12,%RDX,8),%XMM8,%XMM9 |
(15) 0x408041 VSUBSD (%R12,%R11,8),%XMM0,%XMM1 |
(15) 0x408047 VMULSD (%R13,%R10,8),%XMM9,%XMM10 |
(15) 0x40804e VFMADD132SD (%R13,%R9,8),%XMM10,%XMM1 |
(15) 0x408055 VFNMADD213SD (%RSI),%XMM15,%XMM1 |
(15) 0x40805a VMOVSD %XMM1,(%RSI) |
(15) 0x40805e VMOVUPD -0x8(%R12,%R8,8),%XMM12 |
(15) 0x408065 VSUBPD -0x8(%R12,%RAX,8),%XMM12,%XMM11 |
(15) 0x40806c VMULPD -0x8(%RDI),%XMM11,%XMM13 |
(15) 0x408071 VUNPCKHPD %XMM13,%XMM13,%XMM14 |
(15) 0x408076 VADDPD %XMM13,%XMM14,%XMM0 |
(15) 0x40807b VFNMADD213SD (%RCX),%XMM0,%XMM15 |
(15) 0x408080 VMOVSD %XMM15,(%RCX) |
(15) 0x408084 INCL 0x1dc(%RSP) |
(15) 0x40808b MOV 0x50(%RSP),%RAX |
(15) 0x408090 MOV 0x48(%RSP),%R9 |
(15) 0x408095 MOV 0xa8(%RSP),%R10 |
(15) 0x40809d MOV 0xa0(%RSP),%RSI |
(15) 0x4080a5 MOV 0x98(%RSP),%RDI |
(15) 0x4080ad MOV 0x88(%RSP),%RCX |
(15) 0x4080b5 MOV 0x78(%RSP),%R11 |
(15) 0x4080ba MOV 0x68(%RSP),%R8 |
(15) 0x4080bf MOV 0x60(%RSP),%RBX |
(15) 0x4080c4 MOV 0x58(%RSP),%R13 |
(15) 0x4080c9 ADD %RAX,0x300(%RSP) |
(15) 0x4080d1 ADD %R9,0x2d8(%RSP) |
(15) 0x4080d9 MOV 0x1dc(%RSP),%EDX |
(15) 0x4080e0 ADD %R10,0x2c0(%RSP) |
(15) 0x4080e8 ADD %RSI,0x308(%RSP) |
(15) 0x4080f0 ADD %RDI,0x318(%RSP) |
(15) 0x4080f8 ADD %RCX,0xe8(%RSP) |
(15) 0x408100 ADD %R11,0x2b8(%RSP) |
(15) 0x408108 ADD %R8,0x310(%RSP) |
(15) 0x408110 ADD %RBX,0xe0(%RSP) |
(15) 0x408118 ADD %R13,0xd8(%RSP) |
(15) 0x408120 MOV 0x100(%RSP),%RDI |
(15) 0x408128 MOV 0xf0(%RSP),%RAX |
(15) 0x408130 MOV 0xb0(%RSP),%RSI |
(15) 0x408138 MOV 0x108(%RSP),%RCX |
(15) 0x408140 MOV 0xf8(%RSP),%R9 |
(15) 0x408148 MOV 0x90(%RSP),%R8 |
(15) 0x408150 MOV 0x80(%RSP),%R10 |
(15) 0x408158 MOV 0x70(%RSP),%R11 |
(15) 0x40815d MOV 0x138(%RSP),%RBX |
(15) 0x408165 MOV 0x1d0(%RSP),%R13 |
(15) 0x40816d ADD %RAX,0x258(%RSP) |
(15) 0x408175 ADD %RDI,0x210(%RSP) |
(15) 0x40817d ADD %RSI,0x218(%RSP) |
(15) 0x408185 ADD %RCX,0x220(%RSP) |
(15) 0x40818d ADD %R9,0x228(%RSP) |
(15) 0x408195 ADD %R8,0x230(%RSP) |
(15) 0x40819d ADD %R10,0x238(%RSP) |
(15) 0x4081a5 ADD %R11,0x240(%RSP) |
(15) 0x4081ad ADD %RBX,0x248(%RSP) |
(15) 0x4081b5 ADD %R13,0x250(%RSP) |
(15) 0x4081bd ADD %RAX,0x170(%RSP) |
(15) 0x4081c5 MOV 0x138(%RSP),%RAX |
(15) 0x4081cd ADD %RDI,0x178(%RSP) |
(15) 0x4081d5 MOV 0x1d0(%RSP),%RDI |
(15) 0x4081dd ADD %RSI,0x188(%RSP) |
(15) 0x4081e5 ADD %RCX,0x168(%RSP) |
(15) 0x4081ed ADD %R9,0x180(%RSP) |
(15) 0x4081f5 ADD %R8,0x160(%RSP) |
(15) 0x4081fd ADD %R10,0x158(%RSP) |
(15) 0x408205 ADD %R11,0x150(%RSP) |
(15) 0x40820d ADD %RAX,0x148(%RSP) |
(15) 0x408215 ADD %RDI,0x140(%RSP) |
(15) 0x40821d CMP %EDX,0xbc(%RSP) |
(15) 0x408224 JG 407738 |
0x40822a VZEROUPPER |
0x40822d LEA -0x28(%RBP),%RSP |
0x408231 POP %RBX |
0x408232 POP %R12 |
0x408234 POP %R13 |
0x408236 POP %R14 |
0x408238 POP %R15 |
0x40823a POP %RBP |
0x40823b RET |
0x40823c NOPL (%RAX) |
(15) 0x408240 MOV 0x1d8(%RSP),%R9D |
(15) 0x408248 XOR %EAX,%EAX |
(15) 0x40824a JMP 407b02 |
0x40824f INC %EAX |
0x408251 XOR %EDX,%EDX |
0x408253 JMP 4071c9 |
0x408258 NOPL (%RAX,%RAX,1) |
Coverage (%) | Name | Source Location | Module |
---|---|---|---|
○98.12 | gomp_thread_start | team.c:130 | libgomp.so.1.0.0 |
○1.87 | GOMP_parallel | libgomp.h:985 | libgomp.so.1.0.0 |
Path / |
Source file and lines | accelerate_kernel.f90:57-76 |
Module | exec |
nb instructions | 270 |
nb uops | 276 |
loop length | 1503 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 4 |
used ymm registers | 2 |
used zmm registers | 0 |
nb stack references | 85 |
micro-operation queue | 46.00 cycles |
front end | 46.00 cycles |
| P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 10.80 | 14.00 | 24.00 | 24.00 | 47.00 | 10.80 | 10.80 | 47.00 | 47.00 | 47.00 | 10.60 | 24.00 |
cycles | 10.80 | 20.73 | 24.00 | 24.00 | 47.00 | 10.80 | 10.80 | 47.00 | 47.00 | 47.00 | 10.60 | 24.00 |
Cycles executing div or sqrt instructions | 6.00 |
FE+BE cycles | 47.11 |
Stall cycles | 1.28-1.28 |
RS full (events) | 6.14-4.63 |
Front-end | 46.00 |
Dispatch | 47.00 |
DIV/SQRT | 6.00 |
Overall L1 | 47.00 |
all | 1% |
load | NA (no load vectorizable/vectorized instructions) |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 20% |
all | 0% |
load | 0% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
all | 1% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 0% |
other | 12% |
all | 11% |
load | NA (no load vectorizable/vectorized instructions) |
store | 11% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 10% |
all | 12% |
load | 12% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
all | 11% |
load | 12% |
store | 11% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 6% |
other | 11% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RDI,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x20,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SUB $0x320,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x10(%RDI),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%R12D | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CALL 402080 <@plt_start@+0x60> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %EAX,%R13D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 402180 <@plt_start@+0x160> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x18(%RBX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %EAX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV (%RDX),%EAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD $0x2,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SUB %R12D,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CLTD | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IDIV %R13D | 4 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 6 |
CMP %EDX,%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JL 40824f <__accelerate_kernel_module_MOD_accelerate_kernel._omp_fn.0+0x10cf> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
IMUL %EAX,%ECX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %ECX,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %EDX,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMP %EAX,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 40822d <__accelerate_kernel_module_MOD_accelerate_kernel._omp_fn.0+0x10ad> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
ADD %R12D,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x98(%RBX),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%R12,%RDX,1),%R13D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV 0xa0(%RBX),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x78(%RBX),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RBX),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %EAX,0xbc(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x8(%RBX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xb8(%RBX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,0x1d0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVSXD (%R12),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xa8(%RBX),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RSI,0xc8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%RAX),%R14D | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x88(%RBX),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R15,0xc0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x70(%RBX),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x30(%RBX),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDI,0x108(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x50(%RBX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x2(%R14),%R15D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV 0xc0(%RBX),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14D,0x2e0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x20(%RBX),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xb0(%RBX),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,0x100(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x90(%RBX),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x80(%RBX),%XMM4 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R10,0xf8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,0xf0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R13D,0x1dc(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVDDUP %XMM4,%XMM7 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VBROADCASTSD %XMM4,%YMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R15D,0xb8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x38(%RBX),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R12,0x2d0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,0x280(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R14,0x2c8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x58(%RBX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x60(%RBX),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x40(%RBX),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R9,0x38(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD %RDX,%R9 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RAX,0x270(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x68(%RBX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R9,0x118(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,0x260(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (,%RSI,8),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,0x50(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVSXD %R13D,%RAX | 1 | 0 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0.33 | 0 | 1 | 0.33 |
MOV 0xc0(%RSP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
IMUL %RAX,%RSI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R12,0x278(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x28(%RBX),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD %RDX,%R13 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %EDX,0x1d8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R13,0x110(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,0x258(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD %R13,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
LEA (,%RCX,8),%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
IMUL %RAX,%RCX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %RSI,0x170(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%R15,%RSI,8),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,0x300(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R13,0x48(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xd0(%RBX),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD %RCX,%R9 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RCX,0x250(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x2d0(%RSP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R9,0x178(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%RCX,%R9,8),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%R13,%RDX,1),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R13,0x2a8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R9,0x2d8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xc8(%RBX),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (,%RDI,8),%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
IMUL %RAX,%RDI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R12,0x268(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x48(%RBX),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (,%R9,8),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R9,0xb0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
IMUL %RAX,%R9 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %RSI,0xa8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x280(%RSP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R9,0x2b0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD %RCX,%R9 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R9,0x188(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%RSI,%R9,8),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (,%R10,8),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R9,0x2c0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xd8(%RBX),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
IMUL %RAX,%R10 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R8,0x40(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%R8,%RDX,1),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x2c8(%RSP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R13,0xa0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (,%R9,8),%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R8,0x120(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,0x2a0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD %R8,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0xe0(%RBX),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R9,0x90(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
IMUL %RAX,%R9 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R11,0x30(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD %RDX,%R11 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R13,0x88(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xf8(%RBX),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDI,0x168(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%RCX,%RDI,8),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%R8,%RDX,1),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,0x98(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x278(%RSP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R11,0x128(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD %R10,%R11 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RDI,0x308(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%RCX,%R9,1),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x100(%RBX),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R11,0x180(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%R14,%R11,8),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R8,0x298(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (,%R13,8),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R13,0x80(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
IMUL %RAX,%R13 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R11,0x318(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R9,%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA (%RSI,%RDI,8),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDI,0x160(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%RCX,%RDX,1),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R9,0xe8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x270(%RSP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%RDI,%R13,1),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R8,0x78(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xe8(%RBX),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,0x288(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R13,0x290(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (,%R8,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%R9,%RSI,8),%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,0x158(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R13,0x2b8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,0x70(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
IMUL %RAX,%R8 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %RCX,0x68(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xf0(%RBX),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x268(%RSP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%R9,%RDX,1),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
ADD %R8,%R9 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
LEA (%RDI,%R8,1),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%R13,%RSI,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,0x150(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x108(%RBX),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x260(%RSP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,0x310(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (,%RSI,8),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,0x138(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,0x60(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
IMUL %RAX,%RSI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV 0x110(%RBX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%RDI,%RDX,1),%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%RBX,%RSI,1),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%RSI,%RDI,1),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%R13,%RCX,8),%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RCX,0x148(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x1d0(%RSP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RBX,0xe0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xc8(%RSP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
IMUL %RCX,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA (,%RCX,8),%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%RBX,%RDX,1),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R13,0x58(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x258(%RSP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,0x130(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xc0(%RSP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD %RAX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
LEA (%R12,%RDX,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDX,0x140(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x250(%RSP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD %RBX,%R13 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RCX,0xd8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x38(%RSP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R13,0x258(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x2a8(%RSP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%RDX,%RCX,1),%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x2b0(%RSP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x2a0(%RSP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RBX,0x210(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x40(%RSP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD %RDX,%R13 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R13,0x218(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%RCX,%RBX,1),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x30(%RSP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x298(%RSP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,0x220(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%R10,%R13,1),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%R11,%RCX,1),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R10,0x228(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R11,0x230(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x1d8(%RSP),%EDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x2e0(%RSP),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x290(%RSP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R9,0x240(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xc8(%RSP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x288(%RSP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R8,0x248(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB %EDI,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
VMOVSD 0x7d6ac(%RIP),%XMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x2(%RSI),%R13D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
ADD %RAX,%R9 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RBX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %ESI,0x24(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R13D,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R13D,%R10D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA 0x1(%RSI),%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
AND $0x3,%R13D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
AND $-0x4,%R10D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SHR $0x2,%EAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %RDX,0x238(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVDDUP %XMM5,%XMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
MOV %R10D,0x20(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SAL $0x5,%RAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
ADD %EDI,%R10D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
VBROADCASTSD %XMM5,%YMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R9,0x250(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,0x208(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R10D,0x1c(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %ECX,0x2c(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R13D,0x28(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
LEA -0x28(%RBP),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
INC %EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4071c9 <__accelerate_kernel_module_MOD_accelerate_kernel._omp_fn.0+0x49> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Source file and lines | accelerate_kernel.f90:57-76 |
Module | exec |
nb instructions | 270 |
nb uops | 276 |
loop length | 1503 |
used x86 registers | 16 |
used mmx registers | 0 |
used xmm registers | 4 |
used ymm registers | 2 |
used zmm registers | 0 |
nb stack references | 85 |
micro-operation queue | 46.00 cycles |
front end | 46.00 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 10.80 | 14.00 | 24.00 | 24.00 | 47.00 | 10.80 | 10.80 | 47.00 | 47.00 | 47.00 | 10.60 | 24.00 |
cycles | 10.80 | 20.73 | 24.00 | 24.00 | 47.00 | 10.80 | 10.80 | 47.00 | 47.00 | 47.00 | 10.60 | 24.00 |
Cycles executing div or sqrt instructions | 6.00 |
FE+BE cycles | 47.11 |
Stall cycles | 1.28-1.28 |
RS full (events) | 6.14-4.63 |
Front-end | 46.00 |
Dispatch | 47.00 |
DIV/SQRT | 6.00 |
Overall L1 | 47.00 |
all | 1% |
load | NA (no load vectorizable/vectorized instructions) |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 20% |
all | 0% |
load | 0% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 0% |
all | 1% |
load | 0% |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 0% |
other | 12% |
all | 11% |
load | NA (no load vectorizable/vectorized instructions) |
store | 11% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
other | 10% |
all | 12% |
load | 12% |
store | NA (no store vectorizable/vectorized instructions) |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 12% |
all | 11% |
load | 12% |
store | 11% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | 6% |
other | 11% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RDI,%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
AND $-0x20,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SUB $0x320,%RSP | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x10(%RDI),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RAX),%R12D | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CALL 402080 <@plt_start@+0x60> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV %EAX,%R13D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
CALL 402180 <@plt_start@+0x160> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV 0x18(%RBX),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %EAX,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV (%RDX),%EAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD $0x2,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
SUB %R12D,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CLTD | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 1 | 0.50 |
IDIV %R13D | 4 | 0 | 3 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 11-16 | 6 |
CMP %EDX,%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JL 40824f <__accelerate_kernel_module_MOD_accelerate_kernel._omp_fn.0+0x10cf> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
IMUL %EAX,%ECX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
ADD %ECX,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %EDX,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CMP %EAX,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
JGE 40822d <__accelerate_kernel_module_MOD_accelerate_kernel._omp_fn.0+0x10ad> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
ADD %R12D,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0x98(%RBX),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%R12,%RDX,1),%R13D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV 0xa0(%RBX),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x78(%RBX),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV (%RBX),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %EAX,0xbc(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x8(%RBX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xb8(%RBX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14,0x1d0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVSXD (%R12),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xa8(%RBX),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RSI,0xc8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV (%RAX),%R14D | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x88(%RBX),%R10 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R15,0xc0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x70(%RBX),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x30(%RBX),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDI,0x108(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x50(%RBX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x2(%R14),%R15D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV 0xc0(%RBX),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R14D,0x2e0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x20(%RBX),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0xb0(%RBX),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,0x100(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x90(%RBX),%R11 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
VMOVSD 0x80(%RBX),%XMM4 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R10,0xf8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,0xf0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R13D,0x1dc(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVDDUP %XMM4,%XMM7 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
VBROADCASTSD %XMM4,%YMM3 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R15D,0xb8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x38(%RBX),%R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R12,0x2d0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,0x280(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R14,0x2c8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x58(%RBX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x60(%RBX),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x40(%RBX),%R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R9,0x38(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD %RDX,%R9 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RAX,0x270(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x68(%RBX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R9,0x118(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,0x260(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (,%RSI,8),%RAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RAX,0x50(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOVSXD %R13D,%RAX | 1 | 0 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0.33 | 0 | 1 | 0.33 |
MOV 0xc0(%RSP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
IMUL %RAX,%RSI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R12,0x278(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x28(%RBX),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD %RDX,%R13 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %EDX,0x1d8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R13,0x110(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RSI,0x258(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD %R13,%RSI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
LEA (,%RCX,8),%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
IMUL %RAX,%RCX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %RSI,0x170(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%R15,%RSI,8),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,0x300(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R13,0x48(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xd0(%RBX),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD %RCX,%R9 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RCX,0x250(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x2d0(%RSP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R9,0x178(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%RCX,%R9,8),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%R13,%RDX,1),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R13,0x2a8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R9,0x2d8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xc8(%RBX),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (,%RDI,8),%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
IMUL %RAX,%RDI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R12,0x268(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x48(%RBX),%R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (,%R9,8),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R9,0xb0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
IMUL %RAX,%R9 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %RSI,0xa8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x280(%RSP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R9,0x2b0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD %RCX,%R9 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R9,0x188(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%RSI,%R9,8),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (,%R10,8),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R9,0x2c0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xd8(%RBX),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
IMUL %RAX,%R10 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R8,0x40(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%R8,%RDX,1),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x2c8(%RSP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R13,0xa0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (,%R9,8),%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R8,0x120(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,0x2a0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD %R8,%RDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV 0xe0(%RBX),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R9,0x90(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
IMUL %RAX,%R9 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R11,0x30(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD %RDX,%R11 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R13,0x88(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xf8(%RBX),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDI,0x168(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%RCX,%RDI,8),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%R8,%RDX,1),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,0x98(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x278(%RSP),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R11,0x128(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
ADD %R10,%R11 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RDI,0x308(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%RCX,%R9,1),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x100(%RBX),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R11,0x180(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%R14,%R11,8),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R8,0x298(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (,%R13,8),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R13,0x80(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
IMUL %RAX,%R13 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R11,0x318(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R9,%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA (%RSI,%RDI,8),%R9 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDI,0x160(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%RCX,%RDX,1),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R9,0xe8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x270(%RSP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%RDI,%R13,1),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R8,0x78(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xe8(%RBX),%R8 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,0x288(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R13,0x290(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (,%R8,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%R9,%RSI,8),%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,0x158(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R13,0x2b8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R8,0x70(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
IMUL %RAX,%R8 | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %RCX,0x68(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xf0(%RBX),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x268(%RSP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%R9,%RDX,1),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
ADD %R8,%R9 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
LEA (%RDI,%R8,1),%RSI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%R13,%RSI,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,0x150(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x108(%RBX),%RSI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x260(%RSP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RCX,0x310(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (,%RSI,8),%RDI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RSI,0x138(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RDI,0x60(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
IMUL %RAX,%RSI | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV 0x110(%RBX),%RDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%RDI,%RDX,1),%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%RBX,%RSI,1),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%RSI,%RDI,1),%R8 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%R13,%RCX,8),%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RCX,0x148(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x1d0(%RSP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RBX,0xe0(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xc8(%RSP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
IMUL %RCX,%RAX | 1 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
LEA (,%RCX,8),%R13 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%RBX,%RDX,1),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R13,0x58(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x258(%RSP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,0x130(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xc0(%RSP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD %RAX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
LEA (%R12,%RDX,8),%RCX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %RDX,0x140(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x250(%RSP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD %RBX,%R13 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %RCX,0xd8(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x38(%RSP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R13,0x258(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x2a8(%RSP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA (%RDX,%RCX,1),%RBX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x2b0(%RSP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x2a0(%RSP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RBX,0x210(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x40(%RSP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD %RDX,%R13 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %R13,0x218(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%RCX,%RBX,1),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV 0x30(%RSP),%R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x298(%RSP),%RCX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDX,0x220(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
LEA (%R10,%R13,1),%R10 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
LEA (%R11,%RCX,1),%R11 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV %R10,0x228(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R11,0x230(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x1d8(%RSP),%EDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x2e0(%RSP),%ESI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x290(%RSP),%RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R9,0x240(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xc8(%RSP),%R9 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x288(%RSP),%RDX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %R8,0x248(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SUB %EDI,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
VMOVSD 0x7d6ac(%RIP),%XMM5 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x2(%RSI),%R13D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
ADD %RAX,%R9 | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %RBX,%RDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %ESI,0x24(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R13D,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %R13D,%R10D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
LEA 0x1(%RSI),%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
AND $0x3,%R13D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
AND $-0x4,%R10D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
SHR $0x2,%EAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV %RDX,0x238(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
VMOVDDUP %XMM5,%XMM6 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 1 |
MOV %R10D,0x20(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
SAL $0x5,%RAX | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
ADD %EDI,%R10D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
VBROADCASTSD %XMM5,%YMM2 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 1 |
MOV %R9,0x250(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %RAX,0x208(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R10D,0x1c(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %ECX,0x2c(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R13D,0x28(%RSP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VZEROUPPER | 2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 |
LEA -0x28(%RBP),%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
INC %EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
XOR %EDX,%EDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
JMP 4071c9 <__accelerate_kernel_module_MOD_accelerate_kernel._omp_fn.0+0x49> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2.08 |
NOPL (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼__accelerate_kernel_module_MOD_accelerate_kernel._omp_fn.0– | 4.56 | 1.53 |
▼Loop 15 - accelerate_kernel.f90:67-76 - exec– | 0.01 | 0 |
○Loop 16 - accelerate_kernel.f90:67-76 - exec | 4.55 | 1.53 |