Function: updateLinkCells | Module: exec | Source: linkCells.c:209-385 [...] | Coverage: 0.31% |
---|
Function: updateLinkCells | Module: exec | Source: linkCells.c:209-385 [...] | Coverage: 0.31% |
---|
/home/eoseret/qaas_runs_CPU_9468/171-110-4860/intel/CoMD/build/CoMD/CoMD/src-openmp/linkCells.c: 209 - 385 |
-------------------------------------------------------------------------------- |
209: if (iz == gridSize[2]) |
210: { |
211: iBox = boxes->nLocalBoxes + 2*gridSize[2]*gridSize[1] + 2*gridSize[2]*(gridSize[0]+2) + |
212: (gridSize[0]+2)*(gridSize[1]+2) + (gridSize[0]+2)*(iy+1) + (ix+1); |
213: } |
214: // Halo in Z- |
215: else if (iz == -1) |
216: { |
217: iBox = boxes->nLocalBoxes + 2*gridSize[2]*gridSize[1] + 2*gridSize[2]*(gridSize[0]+2) + |
218: (gridSize[0]+2)*(iy+1) + (ix+1); |
219: } |
220: // Halo in Y+ |
221: else if (iy == gridSize[1]) |
[...] |
227: else if (iy == -1) |
228: { |
229: iBox = boxes->nLocalBoxes + 2*gridSize[2]*gridSize[1] + iz*(gridSize[0]+2) + (ix+1); |
230: } |
231: // Halo in X+ |
232: else if (ix == gridSize[0]) |
233: { |
234: iBox = boxes->nLocalBoxes + gridSize[1]*gridSize[2] + iz*gridSize[1] + iy; |
235: } |
236: // Halo in X- |
237: else if (ix == -1) |
238: { |
239: iBox = boxes->nLocalBoxes + iz*gridSize[1] + iy; |
240: } |
241: // local link cell. |
242: else |
243: { |
244: iBox = ix + gridSize[0]*iy + gridSize[0]*gridSize[1]*iz; |
245: } |
246: assert(iBox >= 0); |
247: assert(iBox < boxes->nTotalBoxes); |
[...] |
258: int nj = boxes->nAtoms[jBox]; |
259: copyAtom(boxes, atoms, iId, iBox, nj, jBox); |
260: boxes->nAtoms[jBox]++; |
261: |
262: assert(boxes->nAtoms[jBox] < MAXATOMS); |
263: |
264: boxes->nAtoms[iBox]--; |
265: int ni = boxes->nAtoms[iBox]; |
266: if (ni) copyAtom(boxes, atoms, ni, iBox, iId, iBox); |
267: |
268: if (jBox > boxes->nLocalBoxes) |
269: --atoms->nLocal; |
[...] |
288: { |
289: emptyHaloCells(boxes); |
290: |
291: for (int iBox=0; iBox<boxes->nLocalBoxes; ++iBox) |
292: { |
293: int iOff = iBox*MAXATOMS; |
294: int ii=0; |
295: while (ii < boxes->nAtoms[iBox]) |
296: { |
297: int jBox = getBoxFromCoord(boxes, atoms->r[iOff+ii]); |
298: if (jBox != iBox) |
299: moveAtom(boxes, atoms, ii, iBox, jBox); |
300: else |
301: ++ii; |
302: } |
303: } |
304: } |
[...] |
327: const int iOff = MAXATOMS*iBox+iAtom; |
328: const int jOff = MAXATOMS*jBox+jAtom; |
329: atoms->gid[jOff] = atoms->gid[iOff]; |
330: atoms->iSpecies[jOff] = atoms->iSpecies[iOff]; |
331: memcpy(atoms->r[jOff], atoms->r[iOff], sizeof(real3)); |
332: memcpy(atoms->p[jOff], atoms->p[iOff], sizeof(real3)); |
333: memcpy(atoms->f[jOff], atoms->f[iOff], sizeof(real3)); |
334: memcpy(atoms->U+jOff, atoms->U+iOff, sizeof(real_t)); |
[...] |
352: int ix = (int)(floor((rr[0] - localMin[0])*boxes->invBoxSize[0])); |
353: int iy = (int)(floor((rr[1] - localMin[1])*boxes->invBoxSize[1])); |
[...] |
359: if (rr[0] < localMax[0]) |
360: { |
361: if (ix == gridSize[0]) ix = gridSize[0] - 1; |
362: } |
363: else |
364: ix = gridSize[0]; // assign to halo cell |
365: if (rr[1] < localMax[1]) |
[...] |
371: if (rr[2] < localMax[2]) |
[...] |
384: for (int ii=boxes->nLocalBoxes; ii<boxes->nTotalBoxes; ++ii) |
385: boxes->nAtoms[ii] = 0; |
0x40d800 PUSH %RBP |
0x40d801 MOV %RSP,%RBP |
0x40d804 PUSH %R15 |
0x40d806 PUSH %R14 |
0x40d808 PUSH %R13 |
0x40d80a PUSH %R12 |
0x40d80c PUSH %RBX |
0x40d80d SUB $0x78,%RSP |
0x40d811 MOV %RSI,-0x48(%RBP) |
0x40d815 MOV 0xc(%RDI),%R14D |
0x40d819 MOV %RDI,-0x40(%RBP) |
0x40d81d MOV 0x14(%RDI),%EDI |
0x40d820 CMP %EDI,%R14D |
0x40d823 MOV %EDI,-0x38(%RBP) |
0x40d826 JGE 40d852 |
0x40d828 MOV %EDI,%ECX |
0x40d82a MOVSXD %R14D,%RDI |
0x40d82d SAL $0x2,%RDI |
0x40d831 MOV -0x40(%RBP),%RAX |
0x40d835 ADD 0x78(%RAX),%RDI |
0x40d839 MOV %R14D,%EAX |
0x40d83c NOT %EAX |
0x40d83e ADD %ECX,%EAX |
0x40d840 LEA 0x4(,%RAX,4),%RDX |
0x40d848 XOR %ESI,%ESI |
0x40d84a CALL 418370 <__intel_avx_rep_memset> |
0x40d84f MOV -0x38(%RBP),%EDI |
0x40d852 TEST %R14D,%R14D |
0x40d855 JLE 40dd40 |
0x40d85b MOV -0x40(%RBP),%RAX |
0x40d85f MOV 0x78(%RAX),%RAX |
0x40d863 LEA 0x1(%R14),%ECX |
0x40d867 MOV %ECX,-0x2c(%RBP) |
0x40d86a XOR %R9D,%R9D |
0x40d86d VPCMPEQD %XMM0,%XMM0,%XMM0 |
0x40d871 MOV %RAX,-0x60(%RBP) |
0x40d875 MOV %R14,-0xa0(%RBP) |
0x40d87c JMP 40d88c |
0x40d87e XCHG %AX,%AX |
(84) 0x40d880 INC %R9 |
(84) 0x40d883 CMP %R14,%R9 |
(84) 0x40d886 JE 40dd40 |
(84) 0x40d88c CMPL $0,(%RAX,%R9,4) |
(84) 0x40d891 JLE 40d880 |
(84) 0x40d893 MOVSXD %R9D,%RCX |
(84) 0x40d896 SAL $0x6,%RCX |
(84) 0x40d89a MOV %RCX,-0x88(%RBP) |
(84) 0x40d8a1 MOV -0x48(%RBP),%RCX |
(84) 0x40d8a5 MOV 0x18(%RCX),%R11 |
(84) 0x40d8a9 MOV -0x40(%RBP),%RAX |
(84) 0x40d8ad VMOVSD 0x30(%RAX),%XMM1 |
(84) 0x40d8b2 MOV (%RAX),%R13D |
(84) 0x40d8b5 LEA -0x1(%R13),%ECX |
(84) 0x40d8b9 MOV %ECX,-0x64(%RBP) |
(84) 0x40d8bc VMOVUPD 0x38(%RAX),%XMM2 |
(84) 0x40d8c1 VMOVUPD 0x20(%RAX),%XMM3 |
(84) 0x40d8c6 VMOVUPD 0x68(%RAX),%XMM4 |
(84) 0x40d8cb MOV 0x4(%RAX),%RBX |
(84) 0x40d8cf MOV -0x60(%RBP),%RAX |
(84) 0x40d8d3 VMOVQ %RBX,%XMM5 |
(84) 0x40d8d8 MOV %RBX,%RCX |
(84) 0x40d8db SHR $0x20,%RCX |
(84) 0x40d8df VPADDD %XMM0,%XMM5,%XMM6 |
(84) 0x40d8e3 MOV %RCX,-0x98(%RBP) |
(84) 0x40d8ea LEA (%RCX,%RCX,1),%EDX |
(84) 0x40d8ed MOV %RDX,%RCX |
(84) 0x40d8f0 MOV %RDX,-0x78(%RBP) |
(84) 0x40d8f4 IMUL %EBX,%ECX |
(84) 0x40d8f7 MOV %ECX,-0x34(%RBP) |
(84) 0x40d8fa LEA 0x2(%R13),%ECX |
(84) 0x40d8fe MOV %ECX,-0x30(%RBP) |
(84) 0x40d901 VPINSRD $0,%R14D,%XMM5,%XMM7 |
(84) 0x40d907 XOR %R15D,%R15D |
(84) 0x40d90a MOV %R13,-0x70(%RBP) |
(84) 0x40d90e MOV %RBX,-0x58(%RBP) |
(84) 0x40d912 MOV %R9,-0x50(%RBP) |
(84) 0x40d916 JMP 40d951 |
0x40d918 NOPW %CS:(%RAX,%RAX,1) |
0x40d927 NOPW %CS:(%RAX,%RAX,1) |
0x40d936 NOPW %CS:(%RAX,%RAX,1) |
(85) 0x40d940 INC %R15D |
(85) 0x40d943 MOV -0x58(%RBP),%RBX |
(85) 0x40d947 CMP (%RAX,%R9,4),%R15D |
(85) 0x40d94b JGE 40d880 |
(85) 0x40d951 MOV -0x88(%RBP),%RCX |
(85) 0x40d958 ADD %R15D,%ECX |
(85) 0x40d95b MOVSXD %ECX,%RCX |
(85) 0x40d95e MOV %RCX,-0x90(%RBP) |
(85) 0x40d965 LEA (%RCX,%RCX,2),%R12 |
(85) 0x40d969 VMOVSD (%R11,%R12,8),%XMM8 |
(85) 0x40d96f VUCOMISD %XMM8,%XMM1 |
(85) 0x40d974 MOV %R13D,%ECX |
(85) 0x40d977 JBE 40d99d |
(85) 0x40d979 MOV -0x40(%RBP),%RAX |
(85) 0x40d97d VSUBSD 0x18(%RAX),%XMM8,%XMM8 |
(85) 0x40d982 VMULSD 0x60(%RAX),%XMM8,%XMM8 |
(85) 0x40d987 MOV -0x60(%RBP),%RAX |
(85) 0x40d98b VROUNDSD $0x9,%XMM8,%XMM8,%XMM8 |
(85) 0x40d991 VCVTTSD2SI %XMM8,%ECX |
(85) 0x40d996 CMP %ECX,%R13D |
(85) 0x40d999 CMOVE -0x64(%RBP),%ECX |
(85) 0x40d99d VMOVUPD 0x8(%R11,%R12,8),%XMM9 |
(85) 0x40d9a4 VSUBPD %XMM3,%XMM9,%XMM8 |
(85) 0x40d9a8 VMULPD %XMM4,%XMM8,%XMM8 |
(85) 0x40d9ac VROUNDPD $0x9,%XMM8,%XMM8 |
(85) 0x40d9b2 VCVTTPD2DQ %XMM8,%XMM8 |
(85) 0x40d9b7 VPCMPEQD %XMM8,%XMM5,%K1 |
(85) 0x40d9bd VCMPPD $0x2,%XMM9,%XMM2,%K0 |
(85) 0x40d9c4 KSHIFTRB $0x1,%K0,%K2 |
(85) 0x40d9ca KMOVD %K2,%R10D |
(85) 0x40d9ce KMOVD %K0,%EDX |
(85) 0x40d9d2 VMOVDQA32 %XMM6,%XMM8{%K1} |
(85) 0x40d9d8 VMOVD %XMM8,%ESI |
(85) 0x40d9dc TEST $0x1,%DL |
(85) 0x40d9df MOV %ESI,%R8D |
(85) 0x40d9e2 CMOVNE %EBX,%R8D |
(85) 0x40d9e6 TEST $0x1,%R10B |
(85) 0x40d9ea JE 40da40 |
(85) 0x40d9ec ADD %EBX,%R8D |
(85) 0x40d9ef MOV -0x78(%RBP),%RDX |
(85) 0x40d9f3 LEA 0x3(%RDX,%R8,1),%EDX |
(85) 0x40d9f8 IMUL -0x30(%RBP),%EDX |
(85) 0x40d9fc ADD -0x2c(%RBP),%ECX |
(85) 0x40d9ff ADD -0x34(%RBP),%ECX |
(85) 0x40da02 ADD %EDX,%ECX |
(85) 0x40da04 JMP 40db11 |
0x40da09 NOPW %CS:(%RAX,%RAX,1) |
0x40da18 NOPW %CS:(%RAX,%RAX,1) |
0x40da27 NOPW %CS:(%RAX,%RAX,1) |
0x40da36 NOPW %CS:(%RAX,%RAX,1) |
(85) 0x40da40 MOV %R15,%R10 |
(85) 0x40da43 VPEXTRD $0x1,%XMM8,%R15D |
(85) 0x40da49 CMP $-0x1,%R15D |
(85) 0x40da4d JE 40da80 |
(85) 0x40da4f TEST $0x1,%DL |
(85) 0x40da52 JE 40dac0 |
(85) 0x40da54 ADD -0x98(%RBP),%R15D |
(85) 0x40da5b JMP 40db00 |
0x40da60 NOPW %CS:(%RAX,%RAX,1) |
0x40da6f NOPW %CS:(%RAX,%RAX,1) |
0x40da7e XCHG %AX,%AX |
(85) 0x40da80 MOV -0x78(%RBP),%RDX |
(85) 0x40da84 LEA 0x1(%R8,%RDX,1),%EDX |
(85) 0x40da89 IMUL -0x30(%RBP),%EDX |
(85) 0x40da8d ADD -0x2c(%RBP),%ECX |
(85) 0x40da90 ADD -0x34(%RBP),%ECX |
(85) 0x40da93 ADD %EDX,%ECX |
(85) 0x40da95 JMP 40db0e |
0x40da97 NOPW %CS:(%RAX,%RAX,1) |
0x40daa6 NOPW %CS:(%RAX,%RAX,1) |
0x40dab5 NOPW %CS:(%RAX,%RAX,1) |
(85) 0x40dac0 CMP $-0x1,%ESI |
(85) 0x40dac3 JE 40db00 |
(85) 0x40dac5 CMP %ECX,%R13D |
(85) 0x40dac8 JNE 40dcc0 |
(85) 0x40dace VPADDD %XMM7,%XMM8,%XMM8 |
(85) 0x40dad2 VPEXTRD $0x1,%XMM8,%EDX |
(85) 0x40dad8 IMUL %EBX,%EDX |
(85) 0x40dadb VMOVD %XMM8,%ECX |
(85) 0x40dadf ADD %EDX,%ECX |
(85) 0x40dae1 JMP 40db0e |
0x40dae3 NOPW %CS:(%RAX,%RAX,1) |
0x40daf2 NOPW %CS:(%RAX,%RAX,1) |
(85) 0x40db00 IMUL -0x30(%RBP),%R15D |
(85) 0x40db05 ADD -0x2c(%RBP),%ECX |
(85) 0x40db08 ADD -0x34(%RBP),%ECX |
(85) 0x40db0b ADD %R15D,%ECX |
(85) 0x40db0e MOV %R10,%R15 |
(85) 0x40db11 TEST %ECX,%ECX |
(85) 0x40db13 JS 40dd80 |
(85) 0x40db19 CMP %EDI,%ECX |
(85) 0x40db1b JGE 40ddc0 |
(85) 0x40db21 MOV %ECX,%EBX |
(85) 0x40db23 CMP %RBX,%R9 |
(85) 0x40db26 JE 40d940 |
(85) 0x40db2c MOV %R15,-0x80(%RBP) |
(85) 0x40db30 MOVSXD (%RAX,%RBX,4),%RSI |
(85) 0x40db34 MOVSXD %ECX,%RDX |
(85) 0x40db37 SAL $0x6,%RDX |
(85) 0x40db3b ADD %RSI,%RDX |
(85) 0x40db3e MOV -0x48(%RBP),%RAX |
(85) 0x40db42 MOV 0x8(%RAX),%R14 |
(85) 0x40db46 MOV -0x90(%RBP),%R13 |
(85) 0x40db4d MOV (%R14,%R13,4),%ESI |
(85) 0x40db51 MOV %ESI,(%R14,%RDX,4) |
(85) 0x40db55 MOV %R11,%R8 |
(85) 0x40db58 MOV 0x10(%RAX),%R11 |
(85) 0x40db5c MOV (%R11,%R13,4),%ESI |
(85) 0x40db60 MOV %ESI,(%R11,%RDX,4) |
(85) 0x40db64 LEA (%R8,%R12,8),%R12 |
(85) 0x40db68 LEA (,%RDX,8),%RSI |
(85) 0x40db70 LEA (%RSI,%RSI,2),%R10 |
(85) 0x40db74 MOV 0x10(%R12),%RSI |
(85) 0x40db79 MOV %RSI,0x10(%R8,%R10,1) |
(85) 0x40db7e VMOVUPS (%R12),%XMM8 |
(85) 0x40db84 MOV %R8,%RDI |
(85) 0x40db87 VMOVUPS %XMM8,(%R8,%R10,1) |
(85) 0x40db8d MOV 0x20(%RAX),%RSI |
(85) 0x40db91 LEA (,%R13,8),%R8 |
(85) 0x40db99 LEA (%R8,%R8,2),%R15 |
(85) 0x40db9d MOV 0x10(%RSI,%R15,1),%R8 |
(85) 0x40dba2 MOV %R8,0x10(%RSI,%R10,1) |
(85) 0x40dba7 VMOVUPS (%RSI,%R15,1),%XMM8 |
(85) 0x40dbad VMOVUPS %XMM8,(%RSI,%R10,1) |
(85) 0x40dbb3 MOV 0x28(%RAX),%R8 |
(85) 0x40dbb7 MOV 0x10(%R8,%R15,1),%R9 |
(85) 0x40dbbc MOV %R9,0x10(%R8,%R10,1) |
(85) 0x40dbc1 VMOVDQU (%R8,%R15,1),%XMM8 |
(85) 0x40dbc7 VMOVDQU %XMM8,(%R8,%R10,1) |
(85) 0x40dbcd MOV 0x30(%RAX),%R10 |
(85) 0x40dbd1 MOV -0x60(%RBP),%RAX |
(85) 0x40dbd5 MOV (%R10,%R13,8),%R9 |
(85) 0x40dbd9 MOV %R9,(%R10,%RDX,8) |
(85) 0x40dbdd MOV (%RAX,%RBX,4),%EDX |
(85) 0x40dbe0 LEA 0x1(%RDX),%R9D |
(85) 0x40dbe4 MOV %R9D,(%RAX,%RBX,4) |
(85) 0x40dbe8 CMP $0x3f,%EDX |
(85) 0x40dbeb JGE 40de00 |
(85) 0x40dbf1 MOV -0x50(%RBP),%RDX |
(85) 0x40dbf5 MOVSXD (%RAX,%RDX,4),%RBX |
(85) 0x40dbf9 DEC %RBX |
(85) 0x40dbfc MOV %EBX,(%RAX,%RDX,4) |
(85) 0x40dbff TEST %EBX,%EBX |
(85) 0x40dc01 JE 40dc7c |
(85) 0x40dc03 LEA (%RSI,%R15,1),%RDX |
(85) 0x40dc07 ADD -0x88(%RBP),%RBX |
(85) 0x40dc0e MOV (%R14,%RBX,4),%R9D |
(85) 0x40dc12 MOV -0x90(%RBP),%R13 |
(85) 0x40dc19 MOV %R9D,(%R14,%R13,4) |
(85) 0x40dc1d MOV (%R11,%RBX,4),%R9D |
(85) 0x40dc21 MOV %R9D,(%R11,%R13,4) |
(85) 0x40dc25 ADD %R8,%R15 |
(85) 0x40dc28 LEA (,%RBX,8),%R9 |
(85) 0x40dc30 LEA (%R9,%R9,2),%R9 |
(85) 0x40dc34 MOV %RDI,%R14 |
(85) 0x40dc37 MOV 0x10(%RDI,%R9,1),%R11 |
(85) 0x40dc3c MOV %R11,0x10(%R12) |
(85) 0x40dc41 VMOVUPS (%RDI,%R9,1),%XMM8 |
(85) 0x40dc47 VMOVUPS %XMM8,(%R12) |
(85) 0x40dc4d MOV 0x10(%RSI,%R9,1),%R11 |
(85) 0x40dc52 MOV %R11,0x10(%RDX) |
(85) 0x40dc56 VMOVUPS (%RSI,%R9,1),%XMM8 |
(85) 0x40dc5c VMOVUPS %XMM8,(%RDX) |
(85) 0x40dc60 MOV 0x10(%R8,%R9,1),%RDX |
(85) 0x40dc65 MOV %RDX,0x10(%R15) |
(85) 0x40dc69 VMOVDQU (%R8,%R9,1),%XMM8 |
(85) 0x40dc6f VMOVDQU %XMM8,(%R15) |
(85) 0x40dc74 MOV (%R10,%RBX,8),%RDX |
(85) 0x40dc78 MOV %RDX,(%R10,%R13,8) |
(85) 0x40dc7c MOV -0xa0(%RBP),%R14 |
(85) 0x40dc83 CMP %ECX,%R14D |
(85) 0x40dc86 JGE 40dc8e |
(85) 0x40dc88 MOV -0x48(%RBP),%RCX |
(85) 0x40dc8c DECL (%RCX) |
(85) 0x40dc8e MOV -0x38(%RBP),%ECX |
(85) 0x40dc91 MOV -0x50(%RBP),%R9 |
(85) 0x40dc95 MOV %RDI,%R11 |
(85) 0x40dc98 MOV %ECX,%EDI |
(85) 0x40dc9a MOV -0x70(%RBP),%R13 |
(85) 0x40dc9e MOV -0x58(%RBP),%RBX |
(85) 0x40dca2 MOV -0x80(%RBP),%R15 |
(85) 0x40dca6 CMP (%RAX,%R9,4),%R15D |
(85) 0x40dcaa JL 40d951 |
(84) 0x40dcb0 JMP 40d880 |
0x40dcb5 NOPW %CS:(%RAX,%RAX,1) |
(85) 0x40dcc0 IMUL %EBX,%R15D |
(85) 0x40dcc4 CMP $-0x1,%ECX |
(85) 0x40dcc7 JE 40dd00 |
(85) 0x40dcc9 ADD %ESI,%R15D |
(85) 0x40dccc IMUL %R13D,%R15D |
(85) 0x40dcd0 JMP 40db0b |
0x40dcd5 NOPW %CS:(%RAX,%RAX,1) |
0x40dce4 NOPW %CS:(%RAX,%RAX,1) |
0x40dcf3 NOPW %CS:(%RAX,%RAX,1) |
(85) 0x40dd00 ADD %R14D,%ESI |
(85) 0x40dd03 ADD %R15D,%ESI |
(85) 0x40dd06 MOV %ESI,%ECX |
(85) 0x40dd08 JMP 40db0e |
0x40dd0d NOPW %CS:(%RAX,%RAX,1) |
0x40dd1c NOPW %CS:(%RAX,%RAX,1) |
0x40dd2b NOPW %CS:(%RAX,%RAX,1) |
0x40dd3a NOPW (%RAX,%RAX,1) |
0x40dd40 ADD $0x78,%RSP |
0x40dd44 POP %RBX |
0x40dd45 POP %R12 |
0x40dd47 POP %R13 |
0x40dd49 POP %R14 |
0x40dd4b POP %R15 |
0x40dd4d POP %RBP |
0x40dd4e RET |
0x40dd4f NOPW %CS:(%RAX,%RAX,1) |
0x40dd5e NOPW %CS:(%RAX,%RAX,1) |
0x40dd6d NOPW %CS:(%RAX,%RAX,1) |
0x40dd7c NOPL (%RAX) |
0x40dd80 MOV $0x41b1dd,%EDI |
0x40dd85 MOV $0x41b102,%ESI |
0x40dd8a MOV $0x41b1e7,%ECX |
0x40dd8f MOV $0xf6,%EDX |
0x40dd94 CALL 4030c0 <__assert_fail@plt> |
0x40dd99 NOPW %CS:(%RAX,%RAX,1) |
0x40dda8 NOPW %CS:(%RAX,%RAX,1) |
0x40ddb7 NOPW (%RAX,%RAX,1) |
0x40ddc0 MOV $0x41b216,%EDI |
0x40ddc5 MOV $0x41b102,%ESI |
0x40ddca MOV $0x41b1e7,%ECX |
0x40ddcf MOV $0xf7,%EDX |
0x40ddd4 CALL 4030c0 <__assert_fail@plt> |
0x40ddd9 NOPW %CS:(%RAX,%RAX,1) |
0x40dde8 NOPW %CS:(%RAX,%RAX,1) |
0x40ddf7 NOPW (%RAX,%RAX,1) |
0x40de00 MOV $0x41b230,%EDI |
0x40de05 MOV $0x41b102,%ESI |
0x40de0a MOV $0x41b24f,%ECX |
0x40de0f MOV $0x106,%EDX |
0x40de14 CALL 4030c0 <__assert_fail@plt> |
0x40de19 NOPW %CS:(%RAX,%RAX,1) |
0x40de23 NOPW %CS:(%RAX,%RAX,1) |
0x40de2d NOPW %CS:(%RAX,%RAX,1) |
0x40de37 NOPW (%RAX,%RAX,1) |
Path / |
Source file and lines | linkCells.c:209-385 |
Module | exec |
nb instructions | 99 |
nb uops | 103 |
loop length | 686 |
used x86 registers | 13 |
used mmx registers | 0 |
used xmm registers | 1 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 6 |
micro-operation queue | 17.17 cycles |
front end | 17.17 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 4.80 | 4.80 | 4.67 | 4.67 | 8.00 | 4.87 | 4.80 | 8.00 | 8.00 | 8.00 | 4.73 | 4.67 |
cycles | 4.80 | 4.80 | 4.67 | 4.67 | 8.00 | 4.87 | 4.80 | 8.00 | 8.00 | 8.00 | 4.73 | 4.67 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 16.62 |
Stall cycles | 0.00 |
Front-end | 17.17 |
Dispatch | 8.00 |
Overall L1 | 17.17 |
all | 4% |
load | NA (no load vectorizable/vectorized instructions) |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 6% |
all | 8% |
load | NA (no load vectorizable/vectorized instructions) |
store | 10% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 7% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x78,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RSI,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xc(%RDI),%R14D | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDI,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x14(%RDI),%EDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %EDI,%R14D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %EDI,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JGE 40d852 <updateLinkCells+0x52> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %EDI,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOVSXD %R14D,%RDI | 1 | 0 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0.33 | 0 | 1 | 0.33 |
SAL $0x2,%RDI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV -0x40(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD 0x78(%RAX),%RDI | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
MOV %R14D,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %ECX,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
LEA 0x4(,%RAX,4),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 418370 <__intel_avx_rep_memset> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x38(%RBP),%EDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R14D,%R14D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 40dd40 <updateLinkCells+0x540> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x40(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x78(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x1(%R14),%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV %ECX,-0x2c(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
XOR %R9D,%R9D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VPCMPEQD %XMM0,%XMM0,%XMM0 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
MOV %RAX,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R14,-0xa0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 40d88c <updateLinkCells+0x8c> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
ADD $0x78,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0x41b1dd,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x41b102,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x41b1e7,%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0xf6,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 4030c0 <__assert_fail@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0x41b216,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x41b102,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x41b1e7,%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0xf7,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 4030c0 <__assert_fail@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0x41b230,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x41b102,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x41b24f,%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x106,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 4030c0 <__assert_fail@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Source file and lines | linkCells.c:209-385 |
Module | exec |
nb instructions | 99 |
nb uops | 103 |
loop length | 686 |
used x86 registers | 13 |
used mmx registers | 0 |
used xmm registers | 1 |
used ymm registers | 0 |
used zmm registers | 0 |
nb stack references | 6 |
micro-operation queue | 17.17 cycles |
front end | 17.17 cycles |
P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|
uops | 4.80 | 4.80 | 4.67 | 4.67 | 8.00 | 4.87 | 4.80 | 8.00 | 8.00 | 8.00 | 4.73 | 4.67 |
cycles | 4.80 | 4.80 | 4.67 | 4.67 | 8.00 | 4.87 | 4.80 | 8.00 | 8.00 | 8.00 | 4.73 | 4.67 |
Cycles executing div or sqrt instructions | NA |
FE+BE cycles | 16.62 |
Stall cycles | 0.00 |
Front-end | 17.17 |
Dispatch | 8.00 |
Overall L1 | 17.17 |
all | 4% |
load | NA (no load vectorizable/vectorized instructions) |
store | 0% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 6% |
all | 8% |
load | NA (no load vectorizable/vectorized instructions) |
store | 10% |
mul | NA (no mul vectorizable/vectorized instructions) |
add-sub | NA (no add-sub vectorizable/vectorized instructions) |
fma | NA (no fma vectorizable/vectorized instructions) |
div/sqrt | NA (no div/sqrt vectorizable/vectorized instructions) |
other | 7% |
Instruction | Nb FU | P0 | P1 | P2 | P3 | P4 | P5 | P6 | P7 | P8 | P9 | P10 | P11 | Latency | Recip. throughput |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
PUSH %RBP | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
MOV %RSP,%RBP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
PUSH %R15 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R14 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R13 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %R12 | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
PUSH %RBX | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 5-12 | 0.50 |
SUB $0x78,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOV %RSI,-0x48(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0xc(%RDI),%R14D | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV %RDI,-0x40(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV 0x14(%RDI),%EDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
CMP %EDI,%R14D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV %EDI,-0x38(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JGE 40d852 <updateLinkCells+0x52> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV %EDI,%ECX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
MOVSXD %R14D,%RDI | 1 | 0 | 0.33 | 0 | 0 | 0 | 0.33 | 0 | 0 | 0 | 0 | 0.33 | 0 | 1 | 0.33 |
SAL $0x2,%RDI | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0-2 | 0.50 |
MOV -0x40(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
ADD 0x78(%RAX),%RDI | 1 | 0.20 | 0.20 | 0.33 | 0.33 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.33 | 1 | 0.33 |
MOV %R14D,%EAX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
NOT %EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
ADD %ECX,%EAX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
LEA 0x4(,%RAX,4),%RDX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XOR %ESI,%ESI | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
CALL 418370 <__intel_avx_rep_memset> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
MOV -0x38(%RBP),%EDI | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
TEST %R14D,%R14D | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 2 | 0.20 |
JLE 40dd40 <updateLinkCells+0x540> | 1 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0.50 |
MOV -0x40(%RBP),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
MOV 0x78(%RAX),%RAX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1 | 0.33 |
LEA 0x1(%R14),%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1-2 | 0.20 |
MOV %ECX,-0x2c(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
XOR %R9D,%R9D | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
VPCMPEQD %XMM0,%XMM0,%XMM0 | 1 | 0.50 | 0.50 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 3 | 0.50 |
MOV %RAX,-0x60(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
MOV %R14,-0xa0(%RBP) | 1 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 1 | 0.50 |
JMP 40d88c <updateLinkCells+0x8c> | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 5.84 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
XCHG %AX,%AX | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
ADD $0x78,%RSP | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0.17 |
POP %RBX | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R12 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R13 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R14 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %R15 | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
POP %RBP | 1 | 0 | 0 | 0.33 | 0.33 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.33 | 1-6 | 0.33 |
RET | 1 | 0.50 | 0 | 0.33 | 0.33 | 0 | 0 | 0.50 | 0 | 0 | 0 | 0 | 0.33 | 0 | 2.13 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPL (%RAX) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0x41b1dd,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x41b102,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x41b1e7,%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0xf6,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 4030c0 <__assert_fail@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0x41b216,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x41b102,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x41b1e7,%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0xf7,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 4030c0 <__assert_fail@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
MOV $0x41b230,%EDI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x41b102,%ESI | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x41b24f,%ECX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
MOV $0x106,%EDX | 1 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0.20 | 0 | 0 | 0 | 0.20 | 0 | 1 | 0.20 |
CALL 4030c0 <__assert_fail@plt> | 2 | 0 | 0 | 0 | 0 | 0.50 | 0 | 0 | 0.50 | 0.50 | 0.50 | 0 | 0 | 0 | 1 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW %CS:(%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
NOPW (%RAX,%RAX,1) | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.17 |
Name | Coverage (%) | Time (s) |
---|---|---|
▼updateLinkCells– | 0.31 | 0.05 |
▼Loop 84 - linkCells.c:209-371 - exec– | 0 | 0.02 |
○Loop 85 - linkCells.c:209-371 - exec | 0.3 | 2.21 |